cybershiptrooper

iarcuschin committed on Oct 15, 2024

Commit

92ed75d

verified ·

1 Parent(s): 0f12a50

Add new models (#16)

Browse files

- Add new models (16c725ef7db17b751e6fd485e830244efe7fd9da)

Co-authored-by: Ivan Arcuschin <[email protected]>

Files changed (43) hide show

106/edges.pkl +3 -0
106/ll_model.pth +3 -0
106/ll_model_cfg.pkl +3 -0
106/meta.json +1 -0
121/edges.pkl +3 -0
121/ll_model.pth +3 -0
121/ll_model_cfg.pkl +3 -0
121/meta.json +1 -0
130/edges.pkl +3 -0
130/ll_model.pth +3 -0
130/ll_model_cfg.pkl +3 -0
130/meta.json +1 -0
15/edges.pkl +3 -0
15/ll_model.pth +3 -0
15/ll_model_cfg.pkl +3 -0
15/meta.json +1 -0
41/edges.pkl +3 -0
41/ll_model.pth +3 -0
41/ll_model_cfg.pkl +3 -0
41/meta.json +1 -0
43/edges.pkl +3 -0
43/ll_model.pth +3 -0
43/ll_model_cfg.pkl +3 -0
43/meta.json +1 -0
49/edges.pkl +3 -0
49/ll_model.pth +3 -0
49/ll_model_cfg.pkl +3 -0
49/meta.json +1 -0
66/edges.pkl +3 -0
66/ll_model.pth +3 -0
66/ll_model_cfg.pkl +3 -0
66/meta.json +1 -0
68/edges.pkl +3 -0
68/ll_model.pth +3 -0
68/ll_model_cfg.pkl +3 -0
68/meta.json +1 -0
73/edges.pkl +3 -0
73/ll_model.pth +3 -0
73/ll_model_cfg.pkl +3 -0
73/meta.json +1 -0
benchmark_cases_metadata.csv +10 -0
benchmark_cases_metadata.parquet +2 -2
benchmark_metadata.json +1455 -156

106/edges.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fda9b02cdb2f5d7252c229a12290c6d81381606b1bfad02979549f304bf2a5d0
+size 134

106/ll_model.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:580798eae1391aca366f15c0442c3ef1c02b1b323d610d1d9ddee0faee5e664f
+size 14698

106/ll_model_cfg.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:24bca874c32c8c431cdb732e3222b4090604cde6f05ce1359710b630220650e3
+size 1093

106/meta.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 0.7, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-92-siit-weigth-0.7", "wandb_name": "case-106-seed-92-s-0.7-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 92, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}

121/edges.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
+size 113

121/ll_model.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8054e00aea3c35c5ee77c693f9feeba493c499fe3218e70780137938138a4675
+size 15118

121/ll_model_cfg.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9f027ad4de6828c6f5bb7a3f3c8aabd9658526e33b2284eba366977823b89c0a
+size 1093

121/meta.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-121-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}

130/edges.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:af2a7430f7477a79df1fce6300cf37e1c46d73c31a7f91e06221ef4a6ebf9bed
+size 223

130/ll_model.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4be63b6e0776e45f04d0905702a3a520b2b6449691ae6e34b8504693ac6805be
+size 21304

130/ll_model_cfg.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:192503b894021c736145328500ab1f316e60ed7a121cf04b089bcd05d04e50b4
+size 1093

130/meta.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-130-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}

15/edges.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ecc8ce1a212f987b85ec909238ebc7d01d36c58389391fc96d69ca007fa2d384
+size 244

15/ll_model.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:22ff8d1015f06b8912051e6787ba4e058047facdaadd1d9322e7e89c070c131f
+size 20728

15/ll_model_cfg.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f4162b8d5712db86a2025499b1561c655fd97402716ff352305c296c7a04ff65
+size 1093

15/meta.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-15-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}

41/edges.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
+size 113

41/ll_model.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7d59c31ceb0d0c9afb12dc1f63ade3c4f9edba0dfd80d5779ae27188da2c21d8
+size 14862

41/ll_model_cfg.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f1dee34cba288862b06c2ff669839e06b6c17aa46cdb685f4a2c5a8c3be8a39b
+size 1093

41/meta.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-41-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}

43/edges.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
+size 113

43/ll_model.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:26cc6d6ffa5ae93ce73055d831d4a7119bca2166c2ed9731992c48b4b3debb49
+size 15054

43/ll_model_cfg.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:89a74c42552b846f4562163c6fe74a474edfa36e1972eb97bb3ce0d8aaf9444c
+size 1093

43/meta.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-43-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}

49/edges.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
+size 113

49/ll_model.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:aab9be464531a3cf85f25e3ccb3153c15b6de9876d56799d8705d0784979a1ea
+size 14634

49/ll_model_cfg.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2e47363d4486f828a419ba208bee3a725d431ab80e418a8318f55cf6cd6bf310
+size 1093

49/meta.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 0.7, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-92-siit-weigth-0.7", "wandb_name": "case-49-seed-92-s-0.7-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 92, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}

66/edges.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
+size 113

66/ll_model.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fa63d9e5b124ffb9ce9061e04b03b1ff551c8085fc51ddea31f488b152f5f7c3
+size 14762

66/ll_model_cfg.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b04d734fcc61084204ead0d8cc11c5782598f6f6e4bf3e14b94eab7b0bc9d676
+size 1093

66/meta.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 0.7, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-92-siit-weigth-0.7", "wandb_name": "case-66-seed-92-s-0.7-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 92, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}

68/edges.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
+size 113

68/ll_model.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a1b739ebc05faa4d388c20ef60ab59e44695c4a82323ed7c9c3801ae8e502db9
+size 14670

68/ll_model_cfg.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:be188cb9baf70c65af2c4ecf92c6de170c15a41599109f95c6b632f15bb3eec3
+size 1093

68/meta.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-68-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}

73/edges.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
+size 113

73/ll_model.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:809fe1d4c9f818bac9a85b358d0722f6ed8527d56f988fe66d62f0eceac0f097
+size 14698

73/ll_model_cfg.pkl ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:db76917a80935813594508b1d79b7a0836a20daf67e263161432430b095fd111
+size 1093

73/meta.json ADDED Viewed

	@@ -0,0 +1 @@

+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 0.7, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-92-siit-weigth-0.7", "wandb_name": "case-73-seed-92-s-0.7-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 92, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}

benchmark_cases_metadata.csv CHANGED Viewed

@@ -27,6 +27,7 @@ ioi,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi,Indirect O
 30,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/30,Tags numeric tokens in a sequence based on whether they fall within a given range.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 90,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/90,Replaces a specific token with another one.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/edges.pkl,2,4,10,1,custom,4,16,gelu,12,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1460593486680443,True,False,standard,False,9,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 39,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/39,Returns the fraction of 'x' in the input up to the i-th position for all i.,60,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/edges.pkl,2,120,60,30,custom,4,480,gelu,28,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.08432740427115679,True,False,standard,False,1,False,345600,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 75,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/75,Double each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 101,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/101,Check if each element is a square of an integer.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi_next_token,"Indirect Object Identification (IOI) task, trained using next token prediction.",16,16,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/edges.pkl,6,64,1024,16,gpt2,4,3072,gelu_new,50257,1e-05,False,True,False,False,False,False,GPT2LMHeadModel,False,gpt2,gpt2,LNPre,1,causal,False,,0.02886751345948129,True,False,standard,False,50257,False,2457600,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.001,False,1.0,1.0,0.4,,,,True,True,1.0,,,True,,256.0,True,True,"val/accuracy,val/IIA",,,True,0.65,False,0.0,True,max,,True,
@@ -34,14 +35,17 @@ ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi
 14,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/14,Returns the count of 'a' in the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/edges.pkl,2,8,10,2,custom,4,32,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.15689290811054724,True,False,standard,False,10,False,1536,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 95,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/95,Counts the distinct prime factors of each number in the input list.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12060453783110546,True,False,standard,False,3,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 84,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/84,Apply the arctangent function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 93,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/93,Swaps the nth with the n+1th element if n%2==1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/edges.pkl,3,20,10,5,custom,4,80,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10886621079036347,True,False,standard,False,11,False,14400,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 37,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/37,Reverses each word in the sequence except for specified exclusions.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/edges.pkl,2,12,10,3,custom,4,48,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,8,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
 34,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/34,Calculate the ratio of vowels to consonants in each word.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/edges.pkl,2,16,10,4,custom,4,64,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16329931618554522,True,False,standard,False,5,False,6144,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
 26,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/26,Creates a cascading effect by repeating each token in sequence incrementally.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/edges.pkl,2,21,10,5,custom,4,84,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12344267996967354,True,False,standard,False,27,False,10416,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
 19,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/19,Removes consecutive duplicate tokens from a sequence.,15,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/edges.pkl,2,32,15,8,custom,4,128,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.15689290811054724,True,False,standard,False,3,False,24576,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.001,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,,True,,,True,True,,,,True,,True,,True,,,True,
 53,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/53,Increment elements at odd indices by 1,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13151918984428584,True,False,standard,False,12,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 40,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/40,Sum the last and previous to last digits of a number,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/edges.pkl,2,4,10,1,custom,4,16,gelu,31,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.09847319278346618,True,False,standard,False,12,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 51,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/51,Checks if each element is a Fibonacci number,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/edges.pkl,2,4,10,1,custom,4,16,gelu,102,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.07525766947068778,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 122,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/122,Check if each number is divisible by 3.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 85,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/85,Square each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 2,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/2,Reverse the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/edges.pkl,4,56,10,14,custom,4,224,gelu,28,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.07593263966019993,True,False,standard,False,26,False,150528,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
@@ -51,6 +55,7 @@ ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi
 20,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/20,Detect spam messages based on appearance of spam keywords.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/edges.pkl,2,13,10,3,custom,4,52,gelu,14,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16,True,False,standard,False,2,False,3952,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
 25,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/25,Normalizes token frequencies in a sequence to a range between 0 and 1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/edges.pkl,2,62,10,15,custom,4,248,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.08295613557843402,True,False,standard,False,56,False,91264,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 11,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/11,Counts the number of words in a sequence based on their length.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/edges.pkl,2,12,10,3,custom,4,48,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1460593486680443,True,False,standard,False,5,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,500.0,,gelu,True,True,1.0,,,True,,,True,True,,,,True,,True,,True,,,True,
 54,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/54,Applies the hyperbolic tangent to each element.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 124,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/124,Check if all elements in a list are equal.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.11547005383792516,True,False,standard,False,2,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 102,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/102,"Reflects each element within a range (default is [2, 7]).",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/edges.pkl,2,4,10,1,custom,4,16,gelu,42,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1059625885652035,True,False,standard,False,6,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
@@ -60,15 +65,20 @@ ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi
 86,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/86,"Check if each element is a power of 2. Return 1 if true, otherwise 0.",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16329931618554522,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 105,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/105,Replaces each number with the next prime after that number.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.11202240672224079,True,False,standard,False,10,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 58,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/58,Mirrors the first half of the sequence to the second half.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/edges.pkl,3,32,10,8,custom,4,128,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10415112878465911,True,False,standard,False,11,False,36864,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 70,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/70,Apply the cosine function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 62,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/62,Replaces each element with its factorial.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1414213562373095,True,False,standard,False,10,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 111,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/111,Returns the last element of the sequence and pads the rest with zeros.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.09847319278346618,True,False,standard,False,11,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 35,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/35,Alternates capitalization of each character in words.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/edges.pkl,2,9,10,2,custom,4,36,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,8,False,1872,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
 3,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/3,Returns the fraction of 'x' in the input up to the i-th position for all i.,5,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/edges.pkl,2,12,5,3,custom,4,48,gelu,6,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.22188007849009167,True,False,standard,False,1,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,10.0,2000.0,,gelu,True,True,0.1,,strict,False,,,True,True,,,,True,,True,,True,,,True,
 36,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/36,"Classifies each token as 'positive', 'negative', or 'neutral' based on emojis.",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl,2,6,10,1,custom,4,24,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.19402850002906638,True,False,standard,False,3,False,768,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
 64,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/64,Cubes each element in the sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 8,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/8,Identity,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 103,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/103,Swap consecutive numbers in a list,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10787197799411874,True,False,standard,False,11,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 56,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/56,Sets every third element to zero.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13333333333333333,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 97,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/97,Scale a sequence by its maximum element.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/edges.pkl,3,200,10,50,custom,4,800,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.05405899027195888,True,False,standard,False,64,False,1440000,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 46,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/46,Decrements each element in the sequence by 1,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,

 30,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/30,Tags numeric tokens in a sequence based on whether they fall within a given range.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 90,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/90,Replaces a specific token with another one.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/edges.pkl,2,4,10,1,custom,4,16,gelu,12,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1460593486680443,True,False,standard,False,9,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 39,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/39,Returns the fraction of 'x' in the input up to the i-th position for all i.,60,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/edges.pkl,2,120,60,30,custom,4,480,gelu,28,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.08432740427115679,True,False,standard,False,1,False,345600,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
+130,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/130,"Clips each element to be within a range (make the default range [2, 7]).",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/edges.pkl,3,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.10079052613579392,True,False,standard,False,6,False,576,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 75,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/75,Double each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 101,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/101,Check if each element is a square of an integer.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi_next_token,"Indirect Object Identification (IOI) task, trained using next token prediction.",16,16,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/edges.pkl,6,64,1024,16,gpt2,4,3072,gelu_new,50257,1e-05,False,True,False,False,False,False,GPT2LMHeadModel,False,gpt2,gpt2,LNPre,1,causal,False,,0.02886751345948129,True,False,standard,False,50257,False,2457600,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.001,False,1.0,1.0,0.4,,,,True,True,1.0,,,True,,256.0,True,True,"val/accuracy,val/IIA",,,True,0.65,False,0.0,True,max,,True,
 14,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/14,Returns the count of 'a' in the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/edges.pkl,2,8,10,2,custom,4,32,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.15689290811054724,True,False,standard,False,10,False,1536,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 95,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/95,Counts the distinct prime factors of each number in the input list.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12060453783110546,True,False,standard,False,3,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 84,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/84,Apply the arctangent function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
+66,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/66,Round each element in the input sequence to the nearest integer.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/edges.pkl,2,4,10,1,custom,4,16,gelu,22,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13151918984428584,True,False,standard,False,6,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,92.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 93,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/93,Swaps the nth with the n+1th element if n%2==1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/edges.pkl,3,20,10,5,custom,4,80,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10886621079036347,True,False,standard,False,11,False,14400,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 37,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/37,Reverses each word in the sequence except for specified exclusions.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/edges.pkl,2,12,10,3,custom,4,48,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,8,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
 34,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/34,Calculate the ratio of vowels to consonants in each word.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/edges.pkl,2,16,10,4,custom,4,64,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16329931618554522,True,False,standard,False,5,False,6144,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
 26,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/26,Creates a cascading effect by repeating each token in sequence incrementally.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/edges.pkl,2,21,10,5,custom,4,84,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12344267996967354,True,False,standard,False,27,False,10416,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
+15,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/15,Returns each token multiplied by two and subtracted by its index.,5,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/edges.pkl,3,4,5,1,custom,4,16,gelu,7,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.06553855364152325,True,False,standard,False,12,False,576,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 19,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/19,Removes consecutive duplicate tokens from a sequence.,15,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/edges.pkl,2,32,15,8,custom,4,128,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.15689290811054724,True,False,standard,False,3,False,24576,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.001,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,,True,,,True,True,,,,True,,True,,True,,,True,
 53,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/53,Increment elements at odd indices by 1,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13151918984428584,True,False,standard,False,12,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 40,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/40,Sum the last and previous to last digits of a number,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/edges.pkl,2,4,10,1,custom,4,16,gelu,31,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.09847319278346618,True,False,standard,False,12,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 51,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/51,Checks if each element is a Fibonacci number,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/edges.pkl,2,4,10,1,custom,4,16,gelu,102,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.07525766947068778,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
+43,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/43,Returns the corresponding Fibonacci number for each element in the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/edges.pkl,2,4,10,1,custom,4,16,gelu,22,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1131370849898476,True,False,standard,False,19,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 122,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/122,Check if each number is divisible by 3.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 85,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/85,Square each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 2,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/2,Reverse the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/edges.pkl,4,56,10,14,custom,4,224,gelu,28,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.07593263966019993,True,False,standard,False,26,False,150528,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 20,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/20,Detect spam messages based on appearance of spam keywords.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/edges.pkl,2,13,10,3,custom,4,52,gelu,14,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16,True,False,standard,False,2,False,3952,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
 25,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/25,Normalizes token frequencies in a sequence to a range between 0 and 1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/edges.pkl,2,62,10,15,custom,4,248,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.08295613557843402,True,False,standard,False,56,False,91264,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 11,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/11,Counts the number of words in a sequence based on their length.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/edges.pkl,2,12,10,3,custom,4,48,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1460593486680443,True,False,standard,False,5,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,500.0,,gelu,True,True,1.0,,,True,,,True,True,,,,True,,True,,True,,,True,
+41,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/41,Make each element of the input sequence absolute,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/edges.pkl,2,4,10,1,custom,4,16,gelu,22,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12344267996967354,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 54,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/54,Applies the hyperbolic tangent to each element.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 124,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/124,Check if all elements in a list are equal.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.11547005383792516,True,False,standard,False,2,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 102,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/102,"Reflects each element within a range (default is [2, 7]).",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/edges.pkl,2,4,10,1,custom,4,16,gelu,42,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1059625885652035,True,False,standard,False,6,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 86,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/86,"Check if each element is a power of 2. Return 1 if true, otherwise 0.",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16329931618554522,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 105,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/105,Replaces each number with the next prime after that number.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.11202240672224079,True,False,standard,False,10,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 58,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/58,Mirrors the first half of the sequence to the second half.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/edges.pkl,3,32,10,8,custom,4,128,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10415112878465911,True,False,standard,False,11,False,36864,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
+68,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/68,Increment each element until it becomes a multiple of 3,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,5,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 70,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/70,Apply the cosine function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 62,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/62,Replaces each element with its factorial.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1414213562373095,True,False,standard,False,10,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 111,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/111,Returns the last element of the sequence and pads the rest with zeros.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.09847319278346618,True,False,standard,False,11,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
+121,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/121,Compute arcsine of all elements in the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/edges.pkl,2,4,10,1,custom,4,16,gelu,22,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.11202240672224079,True,False,standard,False,20,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 35,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/35,Alternates capitalization of each character in words.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/edges.pkl,2,9,10,2,custom,4,36,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,8,False,1872,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
 3,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/3,Returns the fraction of 'x' in the input up to the i-th position for all i.,5,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/edges.pkl,2,12,5,3,custom,4,48,gelu,6,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.22188007849009167,True,False,standard,False,1,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,10.0,2000.0,,gelu,True,True,0.1,,strict,False,,,True,True,,,,True,,True,,True,,,True,
 36,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/36,"Classifies each token as 'positive', 'negative', or 'neutral' based on emojis.",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl,2,6,10,1,custom,4,24,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.19402850002906638,True,False,standard,False,3,False,768,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
+106,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/106,Sets all elements to zero except for the element at index 1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13719886811400708,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,92.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 64,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/64,Cubes each element in the sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 8,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/8,Identity,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
+73,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/73,Apply the sine function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,92.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 103,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/103,Swap consecutive numbers in a list,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10787197799411874,True,False,standard,False,11,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 56,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/56,Sets every third element to zero.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13333333333333333,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 97,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/97,Scale a sequence by its maximum element.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/edges.pkl,3,200,10,50,custom,4,800,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.05405899027195888,True,False,standard,False,64,False,1440000,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
+49,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/49,Decrements each element in the sequence until it becomes a multiple of 3.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.15689290811054724,True,False,standard,False,4,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,92.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 46,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/46,Decrements each element in the sequence by 1,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,

benchmark_cases_metadata.parquet CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:729585ec39204363367ad83efc6bf10185f4e191fe490714be2ab026d1c9864c
-size 75187

 version https://git-lfs.github.com/spec/v1
+oid sha256:049d63f22c918edb98d89c9eb69f091016c4780b033e5559523abd7e50188238
+size 76100

benchmark_metadata.json CHANGED Viewed

@@ -3352,6 +3352,150 @@
       "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model.pth",
       "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/edges.pkl"
     },
     {
       "case_id": "75",
       "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/75",
@@ -4233,6 +4377,140 @@
       "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model.pth",
       "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/edges.pkl"
     },
     {
       "case_id": "93",
       "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/93",
@@ -4663,40 +4941,159 @@
       "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/edges.pkl"
     },
     {
-      "case_id": "19",
-      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/19",
-      "task_description": "Removes consecutive duplicate tokens from a sequence.",
       "vocab": [
-        "a",
-        "b",
-        "c"
       ],
-      "max_seq_len": 15,
       "min_seq_len": 4,
       "files": [
         {
           "file_name": "edges.pkl",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/edges.pkl"
         },
         {
           "file_name": "ll_model.pth",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model.pth"
         },
         {
           "file_name": "ll_model_cfg.pkl",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model_cfg.pkl"
         },
         {
           "file_name": "meta.json",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/meta.json"
         }
       ],
       "transformer_cfg": {
-        "n_layers": 2,
-        "d_model": 32,
-        "n_ctx": 15,
-        "d_head": 8,
-        "model_name": "custom",
         "n_heads": 4,
         "d_mlp": 128,
         "act_fn": "gelu",
@@ -5241,6 +5638,140 @@
       "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model.pth",
       "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/edges.pkl"
     },
     {
       "case_id": "122",
       "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/122",
@@ -6371,10 +6902,20 @@
       "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/edges.pkl"
     },
     {
-      "case_id": "54",
-      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/54",
-      "task_description": "Applies the hyperbolic tangent to each element.",
       "vocab": [
         0,
         1,
         2,
@@ -6384,19 +6925,143 @@
         6,
         7,
         8,
-        9,
-        10
       ],
       "max_seq_len": 10,
       "min_seq_len": 4,
       "files": [
         {
           "file_name": "edges.pkl",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/edges.pkl"
         },
         {
           "file_name": "ll_model.pth",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model.pth"
         },
         {
           "file_name": "ll_model_cfg.pkl",
@@ -7572,9 +8237,9 @@
       "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/edges.pkl"
     },
     {
-      "case_id": "70",
-      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/70",
-      "task_description": "Apply the cosine function to each element of the input sequence.",
       "vocab": [
         0,
         1,
@@ -7593,19 +8258,19 @@
       "files": [
         {
           "file_name": "edges.pkl",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl"
         },
         {
           "file_name": "ll_model.pth",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth"
         },
         {
           "file_name": "ll_model_cfg.pkl",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl"
         },
         {
           "file_name": "meta.json",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json"
         }
       ],
       "transformer_cfg": {
@@ -7639,12 +8304,12 @@
         "attention_dir": "causal",
         "attn_only": false,
         "seed": 0,
-        "initializer_range": 0.1392621247645583,
         "init_weights": true,
         "scale_attn_by_inverse_layer_idx": false,
         "positional_embedding_type": "standard",
         "final_rms": false,
-        "d_vocab_out": 11,
         "parallel_attn_mlp": false,
         "rotary_dim": null,
         "n_params": 384,
@@ -7662,7 +8327,7 @@
         "num_experts": null,
         "experts_per_token": null
       },
-      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl",
       "training_args": {
         "output_dir": "/circuits-benchmark/results",
         "atol": 0.05,
@@ -7670,7 +8335,7 @@
         "use_single_loss": true,
         "iit_weight": 1.0,
         "behavior_weight": 0.4,
-        "strict_weight": 0.7,
         "epochs": 1000,
         "early_stop_accuracy_threshold": 99.9,
         "act_fn": "gelu",
@@ -7692,14 +8357,14 @@
         "siit_sampling": "sample_all",
         "val_iia_sampling": "all"
       },
-      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json",
-      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth",
-      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl"
     },
     {
-      "case_id": "62",
-      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/62",
-      "task_description": "Replaces each element with its factorial.",
       "vocab": [
         0,
         1,
@@ -7718,19 +8383,19 @@
       "files": [
         {
           "file_name": "edges.pkl",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl"
         },
         {
           "file_name": "ll_model.pth",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth"
         },
         {
           "file_name": "ll_model_cfg.pkl",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl"
         },
         {
           "file_name": "meta.json",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json"
         }
       ],
       "transformer_cfg": {
@@ -7764,12 +8429,12 @@
         "attention_dir": "causal",
         "attn_only": false,
         "seed": 0,
-        "initializer_range": 0.1414213562373095,
         "init_weights": true,
         "scale_attn_by_inverse_layer_idx": false,
         "positional_embedding_type": "standard",
         "final_rms": false,
-        "d_vocab_out": 10,
         "parallel_attn_mlp": false,
         "rotary_dim": null,
         "n_params": 384,
@@ -7787,7 +8452,7 @@
         "num_experts": null,
         "experts_per_token": null
       },
-      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl",
       "training_args": {
         "output_dir": "/circuits-benchmark/results",
         "atol": 0.05,
@@ -7817,14 +8482,14 @@
         "siit_sampling": "sample_all",
         "val_iia_sampling": "all"
       },
-      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json",
-      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth",
-      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl"
     },
     {
-      "case_id": "111",
-      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/111",
-      "task_description": "Returns the last element of the sequence and pads the rest with zeros.",
       "vocab": [
         0,
         1,
@@ -7843,29 +8508,29 @@
       "files": [
         {
           "file_name": "edges.pkl",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl"
         },
         {
           "file_name": "ll_model.pth",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth"
         },
         {
           "file_name": "ll_model_cfg.pkl",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl"
         },
         {
           "file_name": "meta.json",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json"
         }
       ],
       "transformer_cfg": {
-        "n_layers": 3,
-        "d_model": 24,
         "n_ctx": 10,
-        "d_head": 6,
         "model_name": "custom",
         "n_heads": 4,
-        "d_mlp": 96,
         "act_fn": "gelu",
         "d_vocab": 13,
         "eps": 1e-05,
@@ -7886,18 +8551,18 @@
         "init_mode": "gpt2",
         "normalization_type": null,
         "n_devices": 1,
-        "attention_dir": "bidirectional",
         "attn_only": false,
         "seed": 0,
-        "initializer_range": 0.09847319278346618,
         "init_weights": true,
         "scale_attn_by_inverse_layer_idx": false,
         "positional_embedding_type": "standard",
         "final_rms": false,
-        "d_vocab_out": 11,
         "parallel_attn_mlp": false,
         "rotary_dim": null,
-        "n_params": 20736,
         "use_hook_tokens": false,
         "gated_mlp": false,
         "default_prepend_bos": true,
@@ -7912,7 +8577,7 @@
         "num_experts": null,
         "experts_per_token": null
       },
-      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl",
       "training_args": {
         "output_dir": "/circuits-benchmark/results",
         "atol": 0.05,
@@ -7920,7 +8585,7 @@
         "use_single_loss": true,
         "iit_weight": 1.0,
         "behavior_weight": 0.4,
-        "strict_weight": 0.4,
         "epochs": 1000,
         "early_stop_accuracy_threshold": 99.9,
         "act_fn": "gelu",
@@ -7942,54 +8607,57 @@
         "siit_sampling": "sample_all",
         "val_iia_sampling": "all"
       },
-      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json",
-      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth",
-      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl"
     },
     {
-      "case_id": "35",
-      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/35",
-      "task_description": "Alternates capitalization of each character in words.",
       "vocab": [
-        "J",
-        "LB",
-        "TPSI",
-        "V",
-        "b",
-        "no",
-        "oCLrZaW",
-        "poiVg"
       ],
       "max_seq_len": 10,
       "min_seq_len": 4,
       "files": [
         {
           "file_name": "edges.pkl",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/edges.pkl"
         },
         {
           "file_name": "ll_model.pth",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model.pth"
         },
         {
           "file_name": "ll_model_cfg.pkl",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl"
         },
         {
           "file_name": "meta.json",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/meta.json"
         }
       ],
       "transformer_cfg": {
-        "n_layers": 2,
-        "d_model": 9,
         "n_ctx": 10,
-        "d_head": 2,
         "model_name": "custom",
         "n_heads": 4,
-        "d_mlp": 36,
         "act_fn": "gelu",
-        "d_vocab": 10,
         "eps": 1e-05,
         "use_attn_result": true,
         "use_attn_scale": true,
@@ -8008,18 +8676,18 @@
         "init_mode": "gpt2",
         "normalization_type": null,
         "n_devices": 1,
-        "attention_dir": "causal",
         "attn_only": false,
         "seed": 0,
-        "initializer_range": 0.1539600717839002,
         "init_weights": true,
         "scale_attn_by_inverse_layer_idx": false,
         "positional_embedding_type": "standard",
         "final_rms": false,
-        "d_vocab_out": 8,
         "parallel_attn_mlp": false,
         "rotary_dim": null,
-        "n_params": 1872,
         "use_hook_tokens": false,
         "gated_mlp": false,
         "default_prepend_bos": true,
@@ -8029,9 +8697,265 @@
         "post_embedding_ln": false,
         "rotary_base": 10000,
         "trust_remote_code": false,
-        "rotary_adjacent_pairs": false
-      },
-      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl",
       "training_args": {
         "atol": 0.05,
         "lr": 0.01,
@@ -8136,58 +9060,289 @@
         "lr": 0.01,
         "use_single_loss": false,
         "iit_weight": 1.0,
-        "behavior_weight": 1.0,
-        "strict_weight": 10.0,
-        "epochs": 2000,
         "act_fn": "gelu",
         "clip_grad_norm": 0.1,
-        "lr_scheduler": "",
         "model_pair": "strict",
-        "same_size": false
       },
-      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/meta.json",
-      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model.pth",
-      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/edges.pkl"
     },
     {
-      "case_id": "36",
-      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/36",
-      "task_description": "Classifies each token as 'positive', 'negative', or 'neutral' based on emojis.",
       "vocab": [
-        "\ud83d\udcd8",
-        "\ud83d\ude0a",
-        "\ud83d\ude22"
       ],
       "max_seq_len": 10,
       "min_seq_len": 4,
       "files": [
         {
           "file_name": "edges.pkl",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl"
         },
         {
           "file_name": "ll_model.pth",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth"
         },
         {
           "file_name": "ll_model_cfg.pkl",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl"
         },
         {
           "file_name": "meta.json",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json"
         }
       ],
       "transformer_cfg": {
         "n_layers": 2,
-        "d_model": 6,
         "n_ctx": 10,
         "d_head": 1,
         "model_name": "custom",
         "n_heads": 4,
-        "d_mlp": 24,
         "act_fn": "gelu",
-        "d_vocab": 5,
         "eps": 1e-05,
         "use_attn_result": true,
         "use_attn_scale": true,
@@ -8209,15 +9364,15 @@
         "attention_dir": "causal",
         "attn_only": false,
         "seed": 0,
-        "initializer_range": 0.19402850002906638,
         "init_weights": true,
         "scale_attn_by_inverse_layer_idx": false,
         "positional_embedding_type": "standard",
         "final_rms": false,
-        "d_vocab_out": 3,
         "parallel_attn_mlp": false,
         "rotary_dim": null,
-        "n_params": 768,
         "use_hook_tokens": false,
         "gated_mlp": false,
         "default_prepend_bos": true,
@@ -8227,30 +9382,49 @@
         "post_embedding_ln": false,
         "rotary_base": 10000,
         "trust_remote_code": false,
-        "rotary_adjacent_pairs": false
       },
-      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl",
       "training_args": {
         "atol": 0.05,
-        "lr": 0.01,
-        "use_single_loss": false,
         "iit_weight": 1.0,
-        "behavior_weight": 1.0,
-        "strict_weight": 1.0,
-        "epochs": 2000,
         "act_fn": "gelu",
         "clip_grad_norm": 0.1,
-        "lr_scheduler": "",
-        "model_pair": "strict"
       },
-      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json",
-      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth",
-      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl"
     },
     {
-      "case_id": "64",
-      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/64",
-      "task_description": "Cubes each element in the sequence.",
       "vocab": [
         0,
         1,
@@ -8269,19 +9443,19 @@
       "files": [
         {
           "file_name": "edges.pkl",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl"
         },
         {
           "file_name": "ll_model.pth",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth"
         },
         {
           "file_name": "ll_model_cfg.pkl",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl"
         },
         {
           "file_name": "meta.json",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json"
         }
       ],
       "transformer_cfg": {
@@ -8338,7 +9512,7 @@
         "num_experts": null,
         "experts_per_token": null
       },
-      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl",
       "training_args": {
         "output_dir": "/circuits-benchmark/results",
         "atol": 0.05,
@@ -8368,14 +9542,14 @@
         "siit_sampling": "sample_all",
         "val_iia_sampling": "all"
       },
-      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json",
-      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth",
-      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl"
     },
     {
-      "case_id": "8",
-      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/8",
-      "task_description": "Identity",
       "vocab": [
         0,
         1,
@@ -8394,19 +9568,19 @@
       "files": [
         {
           "file_name": "edges.pkl",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl"
         },
         {
           "file_name": "ll_model.pth",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth"
         },
         {
           "file_name": "ll_model_cfg.pkl",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl"
         },
         {
           "file_name": "meta.json",
-          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json"
         }
       ],
       "transformer_cfg": {
@@ -8463,7 +9637,7 @@
         "num_experts": null,
         "experts_per_token": null
       },
-      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl",
       "training_args": {
         "output_dir": "/circuits-benchmark/results",
         "atol": 0.05,
@@ -8481,7 +9655,7 @@
         "lr_scheduler": "linear",
         "model_pair": "strict",
         "same_size": false,
-        "seed": 67,
         "batch_size": 256,
         "include_mlp": false,
         "detach_while_caching": true,
@@ -8493,9 +9667,9 @@
         "siit_sampling": "sample_all",
         "val_iia_sampling": "all"
       },
-      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json",
-      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth",
-      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl"
     },
     {
       "case_id": "103",
@@ -8872,6 +10046,131 @@
       "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model.pth",
       "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/edges.pkl"
     },
     {
       "case_id": "46",
       "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/46",

       "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model.pth",
       "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/edges.pkl"
     },
+    {
+      "case_id": "130",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/130",
+      "task_description": "Clips each element to be within a range (make the default range [2, 7]).",
+      "vocab": [
+        -15,
+        -14,
+        -13,
+        -12,
+        -11,
+        -10,
+        -9,
+        -8,
+        -7,
+        -6,
+        -5,
+        -4,
+        -3,
+        -2,
+        -1,
+        0,
+        1,
+        2,
+        3,
+        4,
+        5,
+        6,
+        7,
+        8,
+        9,
+        10,
+        11,
+        12,
+        13,
+        14
+      ],
+      "max_seq_len": 10,
+      "min_seq_len": 4,
+      "files": [
+        {
+          "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/edges.pkl"
+        },
+        {
+          "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model.pth"
+        },
+        {
+          "file_name": "ll_model_cfg.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model_cfg.pkl"
+        },
+        {
+          "file_name": "meta.json",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/meta.json"
+        }
+      ],
+      "transformer_cfg": {
+        "n_layers": 3,
+        "d_model": 4,
+        "n_ctx": 10,
+        "d_head": 1,
+        "model_name": "custom",
+        "n_heads": 4,
+        "d_mlp": 16,
+        "act_fn": "gelu",
+        "d_vocab": 32,
+        "eps": 1e-05,
+        "use_attn_result": true,
+        "use_attn_scale": true,
+        "use_split_qkv_input": true,
+        "use_hook_mlp_in": true,
+        "use_attn_in": false,
+        "use_local_attn": false,
+        "original_architecture": null,
+        "from_checkpoint": false,
+        "checkpoint_index": null,
+        "checkpoint_label_type": null,
+        "checkpoint_value": null,
+        "tokenizer_name": null,
+        "window_size": null,
+        "attn_types": null,
+        "init_mode": "gpt2",
+        "normalization_type": null,
+        "n_devices": 1,
+        "attention_dir": "causal",
+        "attn_only": false,
+        "seed": 0,
+        "initializer_range": 0.10079052613579392,
+        "init_weights": true,
+        "scale_attn_by_inverse_layer_idx": false,
+        "positional_embedding_type": "standard",
+        "final_rms": false,
+        "d_vocab_out": 6,
+        "parallel_attn_mlp": false,
+        "rotary_dim": null,
+        "n_params": 576,
+        "use_hook_tokens": false,
+        "gated_mlp": false,
+        "default_prepend_bos": true,
+        "dtype": "torch.float32",
+        "tokenizer_prepends_bos": null,
+        "n_key_value_heads": null,
+        "post_embedding_ln": false,
+        "rotary_base": 10000,
+        "trust_remote_code": false,
+        "rotary_adjacent_pairs": false,
+        "load_in_4bit": false,
+        "num_experts": null,
+        "experts_per_token": null
+      },
+      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model_cfg.pkl",
+      "training_args": {
+        "output_dir": "/circuits-benchmark/results",
+        "atol": 0.05,
+        "lr": 0.001,
+        "use_single_loss": true,
+        "iit_weight": 1.0,
+        "behavior_weight": 0.4,
+        "strict_weight": 1.0,
+        "epochs": 1000,
+        "early_stop_accuracy_threshold": 99.9,
+        "act_fn": "gelu",
+        "use_wandb": true,
+        "save_model_to_wandb": true,
+        "clip_grad_norm": 0.1,
+        "lr_scheduler": "linear",
+        "model_pair": "strict",
+        "same_size": false,
+        "seed": 67,
+        "batch_size": 256,
+        "include_mlp": false,
+        "detach_while_caching": true,
+        "scheduler_val_metric": [
+          "val/accuracy",
+          "val/IIA",
+          "val/strict_accuracy"
+        ],
+        "siit_sampling": "sample_all",
+        "val_iia_sampling": "all"
+      },
+      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/meta.json",
+      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model.pth",
+      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/edges.pkl"
+    },
     {
       "case_id": "75",
       "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/75",
       "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model.pth",
       "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/edges.pkl"
     },
+    {
+      "case_id": "66",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/66",
+      "task_description": "Round each element in the input sequence to the nearest integer.",
+      "vocab": [
+        0.0,
+        0.25,
+        0.5,
+        0.75,
+        1.0,
+        1.25,
+        1.5,
+        1.75,
+        2.0,
+        2.25,
+        2.5,
+        2.75,
+        3.0,
+        3.25,
+        3.5,
+        3.75,
+        4.0,
+        4.25,
+        4.5,
+        4.75
+      ],
+      "max_seq_len": 10,
+      "min_seq_len": 4,
+      "files": [
+        {
+          "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/edges.pkl"
+        },
+        {
+          "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model.pth"
+        },
+        {
+          "file_name": "ll_model_cfg.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model_cfg.pkl"
+        },
+        {
+          "file_name": "meta.json",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/meta.json"
+        }
+      ],
+      "transformer_cfg": {
+        "n_layers": 2,
+        "d_model": 4,
+        "n_ctx": 10,
+        "d_head": 1,
+        "model_name": "custom",
+        "n_heads": 4,
+        "d_mlp": 16,
+        "act_fn": "gelu",
+        "d_vocab": 22,
+        "eps": 1e-05,
+        "use_attn_result": true,
+        "use_attn_scale": true,
+        "use_split_qkv_input": true,
+        "use_hook_mlp_in": true,
+        "use_attn_in": false,
+        "use_local_attn": false,
+        "original_architecture": null,
+        "from_checkpoint": false,
+        "checkpoint_index": null,
+        "checkpoint_label_type": null,
+        "checkpoint_value": null,
+        "tokenizer_name": null,
+        "window_size": null,
+        "attn_types": null,
+        "init_mode": "gpt2",
+        "normalization_type": null,
+        "n_devices": 1,
+        "attention_dir": "causal",
+        "attn_only": false,
+        "seed": 0,
+        "initializer_range": 0.13151918984428584,
+        "init_weights": true,
+        "scale_attn_by_inverse_layer_idx": false,
+        "positional_embedding_type": "standard",
+        "final_rms": false,
+        "d_vocab_out": 6,
+        "parallel_attn_mlp": false,
+        "rotary_dim": null,
+        "n_params": 384,
+        "use_hook_tokens": false,
+        "gated_mlp": false,
+        "default_prepend_bos": true,
+        "dtype": "torch.float32",
+        "tokenizer_prepends_bos": null,
+        "n_key_value_heads": null,
+        "post_embedding_ln": false,
+        "rotary_base": 10000,
+        "trust_remote_code": false,
+        "rotary_adjacent_pairs": false,
+        "load_in_4bit": false,
+        "num_experts": null,
+        "experts_per_token": null
+      },
+      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model_cfg.pkl",
+      "training_args": {
+        "output_dir": "/circuits-benchmark/results",
+        "atol": 0.05,
+        "lr": 0.001,
+        "use_single_loss": true,
+        "iit_weight": 1.0,
+        "behavior_weight": 0.4,
+        "strict_weight": 0.7,
+        "epochs": 1000,
+        "early_stop_accuracy_threshold": 99.9,
+        "act_fn": "gelu",
+        "use_wandb": true,
+        "save_model_to_wandb": true,
+        "clip_grad_norm": 0.1,
+        "lr_scheduler": "linear",
+        "model_pair": "strict",
+        "same_size": false,
+        "seed": 92,
+        "batch_size": 256,
+        "include_mlp": false,
+        "detach_while_caching": true,
+        "scheduler_val_metric": [
+          "val/accuracy",
+          "val/IIA",
+          "val/strict_accuracy"
+        ],
+        "siit_sampling": "sample_all",
+        "val_iia_sampling": "all"
+      },
+      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/meta.json",
+      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model.pth",
+      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/edges.pkl"
+    },
     {
       "case_id": "93",
       "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/93",
       "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/edges.pkl"
     },
     {
+      "case_id": "15",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/15",
+      "task_description": "Returns each token multiplied by two and subtracted by its index.",
       "vocab": [
+        0,
+        1,
+        2,
+        3,
+        4
       ],
+      "max_seq_len": 5,
       "min_seq_len": 4,
       "files": [
         {
           "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/edges.pkl"
         },
         {
           "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model.pth"
         },
         {
           "file_name": "ll_model_cfg.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model_cfg.pkl"
         },
         {
           "file_name": "meta.json",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/meta.json"
         }
       ],
       "transformer_cfg": {
+        "n_layers": 3,
+        "d_model": 4,
+        "n_ctx": 5,
+        "d_head": 1,
+        "model_name": "custom",
+        "n_heads": 4,
+        "d_mlp": 16,
+        "act_fn": "gelu",
+        "d_vocab": 7,
+        "eps": 1e-05,
+        "use_attn_result": true,
+        "use_attn_scale": true,
+        "use_split_qkv_input": true,
+        "use_hook_mlp_in": true,
+        "use_attn_in": false,
+        "use_local_attn": false,
+        "original_architecture": null,
+        "from_checkpoint": false,
+        "checkpoint_index": null,
+        "checkpoint_label_type": null,
+        "checkpoint_value": null,
+        "tokenizer_name": null,
+        "window_size": null,
+        "attn_types": null,
+        "init_mode": "gpt2",
+        "normalization_type": null,
+        "n_devices": 1,
+        "attention_dir": "causal",
+        "attn_only": false,
+        "seed": 0,
+        "initializer_range": 0.06553855364152325,
+        "init_weights": true,
+        "scale_attn_by_inverse_layer_idx": false,
+        "positional_embedding_type": "standard",
+        "final_rms": false,
+        "d_vocab_out": 12,
+        "parallel_attn_mlp": false,
+        "rotary_dim": null,
+        "n_params": 576,
+        "use_hook_tokens": false,
+        "gated_mlp": false,
+        "default_prepend_bos": true,
+        "dtype": "torch.float32",
+        "tokenizer_prepends_bos": null,
+        "n_key_value_heads": null,
+        "post_embedding_ln": false,
+        "rotary_base": 10000,
+        "trust_remote_code": false,
+        "rotary_adjacent_pairs": false,
+        "load_in_4bit": false,
+        "num_experts": null,
+        "experts_per_token": null
+      },
+      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model_cfg.pkl",
+      "training_args": {
+        "output_dir": "/circuits-benchmark/results",
+        "atol": 0.05,
+        "lr": 0.001,
+        "use_single_loss": true,
+        "iit_weight": 1.0,
+        "behavior_weight": 0.4,
+        "strict_weight": 1.0,
+        "epochs": 1000,
+        "early_stop_accuracy_threshold": 99.9,
+        "act_fn": "gelu",
+        "use_wandb": true,
+        "save_model_to_wandb": true,
+        "clip_grad_norm": 0.1,
+        "lr_scheduler": "linear",
+        "model_pair": "strict",
+        "same_size": false,
+        "seed": 67,
+        "batch_size": 256,
+        "include_mlp": false,
+        "detach_while_caching": true,
+        "scheduler_val_metric": [
+          "val/accuracy",
+          "val/IIA",
+          "val/strict_accuracy"
+        ],
+        "siit_sampling": "sample_all",
+        "val_iia_sampling": "all"
+      },
+      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/meta.json",
+      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model.pth",
+      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/edges.pkl"
+    },
+    {
+      "case_id": "19",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/19",
+      "task_description": "Removes consecutive duplicate tokens from a sequence.",
+      "vocab": [
+        "a",
+        "b",
+        "c"
+      ],
+      "max_seq_len": 15,
+      "min_seq_len": 4,
+      "files": [
+        {
+          "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/edges.pkl"
+        },
+        {
+          "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model.pth"
+        },
+        {
+          "file_name": "ll_model_cfg.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model_cfg.pkl"
+        },
+        {
+          "file_name": "meta.json",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/meta.json"
+        }
+      ],
+      "transformer_cfg": {
+        "n_layers": 2,
+        "d_model": 32,
+        "n_ctx": 15,
+        "d_head": 8,
+        "model_name": "custom",
         "n_heads": 4,
         "d_mlp": 128,
         "act_fn": "gelu",
       "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model.pth",
       "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/edges.pkl"
     },
+    {
+      "case_id": "43",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/43",
+      "task_description": "Returns the corresponding Fibonacci number for each element in the input sequence.",
+      "vocab": [
+        0,
+        1,
+        2,
+        3,
+        4,
+        5,
+        6,
+        7,
+        8,
+        9,
+        10,
+        11,
+        12,
+        13,
+        14,
+        15,
+        16,
+        17,
+        18,
+        19
+      ],
+      "max_seq_len": 10,
+      "min_seq_len": 4,
+      "files": [
+        {
+          "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/edges.pkl"
+        },
+        {
+          "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model.pth"
+        },
+        {
+          "file_name": "ll_model_cfg.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model_cfg.pkl"
+        },
+        {
+          "file_name": "meta.json",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/meta.json"
+        }
+      ],
+      "transformer_cfg": {
+        "n_layers": 2,
+        "d_model": 4,
+        "n_ctx": 10,
+        "d_head": 1,
+        "model_name": "custom",
+        "n_heads": 4,
+        "d_mlp": 16,
+        "act_fn": "gelu",
+        "d_vocab": 22,
+        "eps": 1e-05,
+        "use_attn_result": true,
+        "use_attn_scale": true,
+        "use_split_qkv_input": true,
+        "use_hook_mlp_in": true,
+        "use_attn_in": false,
+        "use_local_attn": false,
+        "original_architecture": null,
+        "from_checkpoint": false,
+        "checkpoint_index": null,
+        "checkpoint_label_type": null,
+        "checkpoint_value": null,
+        "tokenizer_name": null,
+        "window_size": null,
+        "attn_types": null,
+        "init_mode": "gpt2",
+        "normalization_type": null,
+        "n_devices": 1,
+        "attention_dir": "causal",
+        "attn_only": false,
+        "seed": 0,
+        "initializer_range": 0.1131370849898476,
+        "init_weights": true,
+        "scale_attn_by_inverse_layer_idx": false,
+        "positional_embedding_type": "standard",
+        "final_rms": false,
+        "d_vocab_out": 19,
+        "parallel_attn_mlp": false,
+        "rotary_dim": null,
+        "n_params": 384,
+        "use_hook_tokens": false,
+        "gated_mlp": false,
+        "default_prepend_bos": true,
+        "dtype": "torch.float32",
+        "tokenizer_prepends_bos": null,
+        "n_key_value_heads": null,
+        "post_embedding_ln": false,
+        "rotary_base": 10000,
+        "trust_remote_code": false,
+        "rotary_adjacent_pairs": false,
+        "load_in_4bit": false,
+        "num_experts": null,
+        "experts_per_token": null
+      },
+      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model_cfg.pkl",
+      "training_args": {
+        "output_dir": "/circuits-benchmark/results",
+        "atol": 0.05,
+        "lr": 0.001,
+        "use_single_loss": true,
+        "iit_weight": 1.0,
+        "behavior_weight": 0.4,
+        "strict_weight": 1.0,
+        "epochs": 1000,
+        "early_stop_accuracy_threshold": 99.9,
+        "act_fn": "gelu",
+        "use_wandb": true,
+        "save_model_to_wandb": true,
+        "clip_grad_norm": 0.1,
+        "lr_scheduler": "linear",
+        "model_pair": "strict",
+        "same_size": false,
+        "seed": 67,
+        "batch_size": 256,
+        "include_mlp": false,
+        "detach_while_caching": true,
+        "scheduler_val_metric": [
+          "val/accuracy",
+          "val/IIA",
+          "val/strict_accuracy"
+        ],
+        "siit_sampling": "sample_all",
+        "val_iia_sampling": "all"
+      },
+      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/meta.json",
+      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model.pth",
+      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/edges.pkl"
+    },
     {
       "case_id": "122",
       "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/122",
       "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/edges.pkl"
     },
     {
+      "case_id": "41",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/41",
+      "task_description": "Make each element of the input sequence absolute",
       "vocab": [
+        -10,
+        -9,
+        -8,
+        -7,
+        -6,
+        -5,
+        -4,
+        -3,
+        -2,
+        -1,
         0,
         1,
         2,
         6,
         7,
         8,
+        9
       ],
       "max_seq_len": 10,
       "min_seq_len": 4,
       "files": [
         {
           "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/edges.pkl"
         },
         {
           "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model.pth"
+        },
+        {
+          "file_name": "ll_model_cfg.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model_cfg.pkl"
+        },
+        {
+          "file_name": "meta.json",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/meta.json"
+        }
+      ],
+      "transformer_cfg": {
+        "n_layers": 2,
+        "d_model": 4,
+        "n_ctx": 10,
+        "d_head": 1,
+        "model_name": "custom",
+        "n_heads": 4,
+        "d_mlp": 16,
+        "act_fn": "gelu",
+        "d_vocab": 22,
+        "eps": 1e-05,
+        "use_attn_result": true,
+        "use_attn_scale": true,
+        "use_split_qkv_input": true,
+        "use_hook_mlp_in": true,
+        "use_attn_in": false,
+        "use_local_attn": false,
+        "original_architecture": null,
+        "from_checkpoint": false,
+        "checkpoint_index": null,
+        "checkpoint_label_type": null,
+        "checkpoint_value": null,
+        "tokenizer_name": null,
+        "window_size": null,
+        "attn_types": null,
+        "init_mode": "gpt2",
+        "normalization_type": null,
+        "n_devices": 1,
+        "attention_dir": "causal",
+        "attn_only": false,
+        "seed": 0,
+        "initializer_range": 0.12344267996967354,
+        "init_weights": true,
+        "scale_attn_by_inverse_layer_idx": false,
+        "positional_embedding_type": "standard",
+        "final_rms": false,
+        "d_vocab_out": 11,
+        "parallel_attn_mlp": false,
+        "rotary_dim": null,
+        "n_params": 384,
+        "use_hook_tokens": false,
+        "gated_mlp": false,
+        "default_prepend_bos": true,
+        "dtype": "torch.float32",
+        "tokenizer_prepends_bos": null,
+        "n_key_value_heads": null,
+        "post_embedding_ln": false,
+        "rotary_base": 10000,
+        "trust_remote_code": false,
+        "rotary_adjacent_pairs": false,
+        "load_in_4bit": false,
+        "num_experts": null,
+        "experts_per_token": null
+      },
+      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model_cfg.pkl",
+      "training_args": {
+        "output_dir": "/circuits-benchmark/results",
+        "atol": 0.05,
+        "lr": 0.001,
+        "use_single_loss": true,
+        "iit_weight": 1.0,
+        "behavior_weight": 0.4,
+        "strict_weight": 1.0,
+        "epochs": 1000,
+        "early_stop_accuracy_threshold": 99.9,
+        "act_fn": "gelu",
+        "use_wandb": true,
+        "save_model_to_wandb": true,
+        "clip_grad_norm": 0.1,
+        "lr_scheduler": "linear",
+        "model_pair": "strict",
+        "same_size": false,
+        "seed": 67,
+        "batch_size": 256,
+        "include_mlp": false,
+        "detach_while_caching": true,
+        "scheduler_val_metric": [
+          "val/accuracy",
+          "val/IIA",
+          "val/strict_accuracy"
+        ],
+        "siit_sampling": "sample_all",
+        "val_iia_sampling": "all"
+      },
+      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/meta.json",
+      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model.pth",
+      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/edges.pkl"
+    },
+    {
+      "case_id": "54",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/54",
+      "task_description": "Applies the hyperbolic tangent to each element.",
+      "vocab": [
+        0,
+        1,
+        2,
+        3,
+        4,
+        5,
+        6,
+        7,
+        8,
+        9,
+        10
+      ],
+      "max_seq_len": 10,
+      "min_seq_len": 4,
+      "files": [
+        {
+          "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/edges.pkl"
+        },
+        {
+          "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model.pth"
         },
         {
           "file_name": "ll_model_cfg.pkl",
       "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/edges.pkl"
     },
     {
+      "case_id": "68",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/68",
+      "task_description": "Increment each element until it becomes a multiple of 3",
       "vocab": [
         0,
         1,
       "files": [
         {
           "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/edges.pkl"
         },
         {
           "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model.pth"
         },
         {
           "file_name": "ll_model_cfg.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model_cfg.pkl"
         },
         {
           "file_name": "meta.json",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/meta.json"
         }
       ],
       "transformer_cfg": {
         "attention_dir": "causal",
         "attn_only": false,
         "seed": 0,
+        "initializer_range": 0.1539600717839002,
         "init_weights": true,
         "scale_attn_by_inverse_layer_idx": false,
         "positional_embedding_type": "standard",
         "final_rms": false,
+        "d_vocab_out": 5,
         "parallel_attn_mlp": false,
         "rotary_dim": null,
         "n_params": 384,
         "num_experts": null,
         "experts_per_token": null
       },
+      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model_cfg.pkl",
       "training_args": {
         "output_dir": "/circuits-benchmark/results",
         "atol": 0.05,
         "use_single_loss": true,
         "iit_weight": 1.0,
         "behavior_weight": 0.4,
+        "strict_weight": 1.0,
         "epochs": 1000,
         "early_stop_accuracy_threshold": 99.9,
         "act_fn": "gelu",
         "siit_sampling": "sample_all",
         "val_iia_sampling": "all"
       },
+      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/meta.json",
+      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model.pth",
+      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/edges.pkl"
     },
     {
+      "case_id": "70",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/70",
+      "task_description": "Apply the cosine function to each element of the input sequence.",
       "vocab": [
         0,
         1,
       "files": [
         {
           "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl"
         },
         {
           "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth"
         },
         {
           "file_name": "ll_model_cfg.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl"
         },
         {
           "file_name": "meta.json",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json"
         }
       ],
       "transformer_cfg": {
         "attention_dir": "causal",
         "attn_only": false,
         "seed": 0,
+        "initializer_range": 0.1392621247645583,
         "init_weights": true,
         "scale_attn_by_inverse_layer_idx": false,
         "positional_embedding_type": "standard",
         "final_rms": false,
+        "d_vocab_out": 11,
         "parallel_attn_mlp": false,
         "rotary_dim": null,
         "n_params": 384,
         "num_experts": null,
         "experts_per_token": null
       },
+      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl",
       "training_args": {
         "output_dir": "/circuits-benchmark/results",
         "atol": 0.05,
         "siit_sampling": "sample_all",
         "val_iia_sampling": "all"
       },
+      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json",
+      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth",
+      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl"
     },
     {
+      "case_id": "62",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/62",
+      "task_description": "Replaces each element with its factorial.",
       "vocab": [
         0,
         1,
       "files": [
         {
           "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl"
         },
         {
           "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth"
         },
         {
           "file_name": "ll_model_cfg.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl"
         },
         {
           "file_name": "meta.json",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json"
         }
       ],
       "transformer_cfg": {
+        "n_layers": 2,
+        "d_model": 4,
         "n_ctx": 10,
+        "d_head": 1,
         "model_name": "custom",
         "n_heads": 4,
+        "d_mlp": 16,
         "act_fn": "gelu",
         "d_vocab": 13,
         "eps": 1e-05,
         "init_mode": "gpt2",
         "normalization_type": null,
         "n_devices": 1,
+        "attention_dir": "causal",
         "attn_only": false,
         "seed": 0,
+        "initializer_range": 0.1414213562373095,
         "init_weights": true,
         "scale_attn_by_inverse_layer_idx": false,
         "positional_embedding_type": "standard",
         "final_rms": false,
+        "d_vocab_out": 10,
         "parallel_attn_mlp": false,
         "rotary_dim": null,
+        "n_params": 384,
         "use_hook_tokens": false,
         "gated_mlp": false,
         "default_prepend_bos": true,
         "num_experts": null,
         "experts_per_token": null
       },
+      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl",
       "training_args": {
         "output_dir": "/circuits-benchmark/results",
         "atol": 0.05,
         "use_single_loss": true,
         "iit_weight": 1.0,
         "behavior_weight": 0.4,
+        "strict_weight": 0.7,
         "epochs": 1000,
         "early_stop_accuracy_threshold": 99.9,
         "act_fn": "gelu",
         "siit_sampling": "sample_all",
         "val_iia_sampling": "all"
       },
+      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json",
+      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth",
+      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl"
     },
     {
+      "case_id": "111",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/111",
+      "task_description": "Returns the last element of the sequence and pads the rest with zeros.",
       "vocab": [
+        0,
+        1,
+        2,
+        3,
+        4,
+        5,
+        6,
+        7,
+        8,
+        9,
+        10
       ],
       "max_seq_len": 10,
       "min_seq_len": 4,
       "files": [
         {
           "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl"
         },
         {
           "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth"
         },
         {
           "file_name": "ll_model_cfg.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl"
         },
         {
           "file_name": "meta.json",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json"
         }
       ],
       "transformer_cfg": {
+        "n_layers": 3,
+        "d_model": 24,
         "n_ctx": 10,
+        "d_head": 6,
         "model_name": "custom",
         "n_heads": 4,
+        "d_mlp": 96,
         "act_fn": "gelu",
+        "d_vocab": 13,
         "eps": 1e-05,
         "use_attn_result": true,
         "use_attn_scale": true,
         "init_mode": "gpt2",
         "normalization_type": null,
         "n_devices": 1,
+        "attention_dir": "bidirectional",
         "attn_only": false,
         "seed": 0,
+        "initializer_range": 0.09847319278346618,
         "init_weights": true,
         "scale_attn_by_inverse_layer_idx": false,
         "positional_embedding_type": "standard",
         "final_rms": false,
+        "d_vocab_out": 11,
         "parallel_attn_mlp": false,
         "rotary_dim": null,
+        "n_params": 20736,
         "use_hook_tokens": false,
         "gated_mlp": false,
         "default_prepend_bos": true,
         "post_embedding_ln": false,
         "rotary_base": 10000,
         "trust_remote_code": false,
+        "rotary_adjacent_pairs": false,
+        "load_in_4bit": false,
+        "num_experts": null,
+        "experts_per_token": null
+      },
+      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl",
+      "training_args": {
+        "output_dir": "/circuits-benchmark/results",
+        "atol": 0.05,
+        "lr": 0.001,
+        "use_single_loss": true,
+        "iit_weight": 1.0,
+        "behavior_weight": 0.4,
+        "strict_weight": 0.4,
+        "epochs": 1000,
+        "early_stop_accuracy_threshold": 99.9,
+        "act_fn": "gelu",
+        "use_wandb": true,
+        "save_model_to_wandb": true,
+        "clip_grad_norm": 0.1,
+        "lr_scheduler": "linear",
+        "model_pair": "strict",
+        "same_size": false,
+        "seed": 67,
+        "batch_size": 256,
+        "include_mlp": false,
+        "detach_while_caching": true,
+        "scheduler_val_metric": [
+          "val/accuracy",
+          "val/IIA",
+          "val/strict_accuracy"
+        ],
+        "siit_sampling": "sample_all",
+        "val_iia_sampling": "all"
+      },
+      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json",
+      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth",
+      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl"
+    },
+    {
+      "case_id": "121",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/121",
+      "task_description": "Compute arcsine of all elements in the input sequence.",
+      "vocab": [
+        -1.0,
+        -0.9,
+        -0.8,
+        -0.7,
+        -0.6,
+        -0.5,
+        -0.4,
+        -0.30000000000000004,
+        -0.19999999999999996,
+        -0.09999999999999998,
+        0.0,
+        0.10000000000000009,
+        0.19999999999999996,
+        0.30000000000000004,
+        0.3999999999999999,
+        0.5,
+        0.6000000000000001,
+        0.7,
+        0.8,
+        0.8999999999999999
+      ],
+      "max_seq_len": 10,
+      "min_seq_len": 4,
+      "files": [
+        {
+          "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/edges.pkl"
+        },
+        {
+          "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model.pth"
+        },
+        {
+          "file_name": "ll_model_cfg.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model_cfg.pkl"
+        },
+        {
+          "file_name": "meta.json",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/meta.json"
+        }
+      ],
+      "transformer_cfg": {
+        "n_layers": 2,
+        "d_model": 4,
+        "n_ctx": 10,
+        "d_head": 1,
+        "model_name": "custom",
+        "n_heads": 4,
+        "d_mlp": 16,
+        "act_fn": "gelu",
+        "d_vocab": 22,
+        "eps": 1e-05,
+        "use_attn_result": true,
+        "use_attn_scale": true,
+        "use_split_qkv_input": true,
+        "use_hook_mlp_in": true,
+        "use_attn_in": false,
+        "use_local_attn": false,
+        "original_architecture": null,
+        "from_checkpoint": false,
+        "checkpoint_index": null,
+        "checkpoint_label_type": null,
+        "checkpoint_value": null,
+        "tokenizer_name": null,
+        "window_size": null,
+        "attn_types": null,
+        "init_mode": "gpt2",
+        "normalization_type": null,
+        "n_devices": 1,
+        "attention_dir": "causal",
+        "attn_only": false,
+        "seed": 0,
+        "initializer_range": 0.11202240672224079,
+        "init_weights": true,
+        "scale_attn_by_inverse_layer_idx": false,
+        "positional_embedding_type": "standard",
+        "final_rms": false,
+        "d_vocab_out": 20,
+        "parallel_attn_mlp": false,
+        "rotary_dim": null,
+        "n_params": 384,
+        "use_hook_tokens": false,
+        "gated_mlp": false,
+        "default_prepend_bos": true,
+        "dtype": "torch.float32",
+        "tokenizer_prepends_bos": null,
+        "n_key_value_heads": null,
+        "post_embedding_ln": false,
+        "rotary_base": 10000,
+        "trust_remote_code": false,
+        "rotary_adjacent_pairs": false,
+        "load_in_4bit": false,
+        "num_experts": null,
+        "experts_per_token": null
+      },
+      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model_cfg.pkl",
+      "training_args": {
+        "output_dir": "/circuits-benchmark/results",
+        "atol": 0.05,
+        "lr": 0.001,
+        "use_single_loss": true,
+        "iit_weight": 1.0,
+        "behavior_weight": 0.4,
+        "strict_weight": 1.0,
+        "epochs": 1000,
+        "early_stop_accuracy_threshold": 99.9,
+        "act_fn": "gelu",
+        "use_wandb": true,
+        "save_model_to_wandb": true,
+        "clip_grad_norm": 0.1,
+        "lr_scheduler": "linear",
+        "model_pair": "strict",
+        "same_size": false,
+        "seed": 67,
+        "batch_size": 256,
+        "include_mlp": false,
+        "detach_while_caching": true,
+        "scheduler_val_metric": [
+          "val/accuracy",
+          "val/IIA",
+          "val/strict_accuracy"
+        ],
+        "siit_sampling": "sample_all",
+        "val_iia_sampling": "all"
+      },
+      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/meta.json",
+      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model.pth",
+      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/edges.pkl"
+    },
+    {
+      "case_id": "35",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/35",
+      "task_description": "Alternates capitalization of each character in words.",
+      "vocab": [
+        "J",
+        "LB",
+        "TPSI",
+        "V",
+        "b",
+        "no",
+        "oCLrZaW",
+        "poiVg"
+      ],
+      "max_seq_len": 10,
+      "min_seq_len": 4,
+      "files": [
+        {
+          "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/edges.pkl"
+        },
+        {
+          "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model.pth"
+        },
+        {
+          "file_name": "ll_model_cfg.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl"
+        },
+        {
+          "file_name": "meta.json",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/meta.json"
+        }
+      ],
+      "transformer_cfg": {
+        "n_layers": 2,
+        "d_model": 9,
+        "n_ctx": 10,
+        "d_head": 2,
+        "model_name": "custom",
+        "n_heads": 4,
+        "d_mlp": 36,
+        "act_fn": "gelu",
+        "d_vocab": 10,
+        "eps": 1e-05,
+        "use_attn_result": true,
+        "use_attn_scale": true,
+        "use_split_qkv_input": true,
+        "use_hook_mlp_in": true,
+        "use_attn_in": false,
+        "use_local_attn": false,
+        "original_architecture": null,
+        "from_checkpoint": false,
+        "checkpoint_index": null,
+        "checkpoint_label_type": null,
+        "checkpoint_value": null,
+        "tokenizer_name": null,
+        "window_size": null,
+        "attn_types": null,
+        "init_mode": "gpt2",
+        "normalization_type": null,
+        "n_devices": 1,
+        "attention_dir": "causal",
+        "attn_only": false,
+        "seed": 0,
+        "initializer_range": 0.1539600717839002,
+        "init_weights": true,
+        "scale_attn_by_inverse_layer_idx": false,
+        "positional_embedding_type": "standard",
+        "final_rms": false,
+        "d_vocab_out": 8,
+        "parallel_attn_mlp": false,
+        "rotary_dim": null,
+        "n_params": 1872,
+        "use_hook_tokens": false,
+        "gated_mlp": false,
+        "default_prepend_bos": true,
+        "dtype": "torch.float32",
+        "tokenizer_prepends_bos": null,
+        "n_key_value_heads": null,
+        "post_embedding_ln": false,
+        "rotary_base": 10000,
+        "trust_remote_code": false,
+        "rotary_adjacent_pairs": false
+      },
+      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl",
       "training_args": {
         "atol": 0.05,
         "lr": 0.01,
         "lr": 0.01,
         "use_single_loss": false,
         "iit_weight": 1.0,
+        "behavior_weight": 1.0,
+        "strict_weight": 10.0,
+        "epochs": 2000,
+        "act_fn": "gelu",
+        "clip_grad_norm": 0.1,
+        "lr_scheduler": "",
+        "model_pair": "strict",
+        "same_size": false
+      },
+      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/meta.json",
+      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model.pth",
+      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/edges.pkl"
+    },
+    {
+      "case_id": "36",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/36",
+      "task_description": "Classifies each token as 'positive', 'negative', or 'neutral' based on emojis.",
+      "vocab": [
+        "\ud83d\udcd8",
+        "\ud83d\ude0a",
+        "\ud83d\ude22"
+      ],
+      "max_seq_len": 10,
+      "min_seq_len": 4,
+      "files": [
+        {
+          "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl"
+        },
+        {
+          "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth"
+        },
+        {
+          "file_name": "ll_model_cfg.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl"
+        },
+        {
+          "file_name": "meta.json",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json"
+        }
+      ],
+      "transformer_cfg": {
+        "n_layers": 2,
+        "d_model": 6,
+        "n_ctx": 10,
+        "d_head": 1,
+        "model_name": "custom",
+        "n_heads": 4,
+        "d_mlp": 24,
+        "act_fn": "gelu",
+        "d_vocab": 5,
+        "eps": 1e-05,
+        "use_attn_result": true,
+        "use_attn_scale": true,
+        "use_split_qkv_input": true,
+        "use_hook_mlp_in": true,
+        "use_attn_in": false,
+        "use_local_attn": false,
+        "original_architecture": null,
+        "from_checkpoint": false,
+        "checkpoint_index": null,
+        "checkpoint_label_type": null,
+        "checkpoint_value": null,
+        "tokenizer_name": null,
+        "window_size": null,
+        "attn_types": null,
+        "init_mode": "gpt2",
+        "normalization_type": null,
+        "n_devices": 1,
+        "attention_dir": "causal",
+        "attn_only": false,
+        "seed": 0,
+        "initializer_range": 0.19402850002906638,
+        "init_weights": true,
+        "scale_attn_by_inverse_layer_idx": false,
+        "positional_embedding_type": "standard",
+        "final_rms": false,
+        "d_vocab_out": 3,
+        "parallel_attn_mlp": false,
+        "rotary_dim": null,
+        "n_params": 768,
+        "use_hook_tokens": false,
+        "gated_mlp": false,
+        "default_prepend_bos": true,
+        "dtype": "torch.float32",
+        "tokenizer_prepends_bos": null,
+        "n_key_value_heads": null,
+        "post_embedding_ln": false,
+        "rotary_base": 10000,
+        "trust_remote_code": false,
+        "rotary_adjacent_pairs": false
+      },
+      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl",
+      "training_args": {
+        "atol": 0.05,
+        "lr": 0.01,
+        "use_single_loss": false,
+        "iit_weight": 1.0,
+        "behavior_weight": 1.0,
+        "strict_weight": 1.0,
+        "epochs": 2000,
+        "act_fn": "gelu",
+        "clip_grad_norm": 0.1,
+        "lr_scheduler": "",
+        "model_pair": "strict"
+      },
+      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json",
+      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth",
+      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl"
+    },
+    {
+      "case_id": "106",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/106",
+      "task_description": "Sets all elements to zero except for the element at index 1.",
+      "vocab": [
+        0,
+        1,
+        2,
+        3,
+        4,
+        5,
+        6,
+        7,
+        8,
+        9,
+        10
+      ],
+      "max_seq_len": 10,
+      "min_seq_len": 4,
+      "files": [
+        {
+          "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/edges.pkl"
+        },
+        {
+          "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model.pth"
+        },
+        {
+          "file_name": "ll_model_cfg.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model_cfg.pkl"
+        },
+        {
+          "file_name": "meta.json",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/meta.json"
+        }
+      ],
+      "transformer_cfg": {
+        "n_layers": 2,
+        "d_model": 4,
+        "n_ctx": 10,
+        "d_head": 1,
+        "model_name": "custom",
+        "n_heads": 4,
+        "d_mlp": 16,
+        "act_fn": "gelu",
+        "d_vocab": 13,
+        "eps": 1e-05,
+        "use_attn_result": true,
+        "use_attn_scale": true,
+        "use_split_qkv_input": true,
+        "use_hook_mlp_in": true,
+        "use_attn_in": false,
+        "use_local_attn": false,
+        "original_architecture": null,
+        "from_checkpoint": false,
+        "checkpoint_index": null,
+        "checkpoint_label_type": null,
+        "checkpoint_value": null,
+        "tokenizer_name": null,
+        "window_size": null,
+        "attn_types": null,
+        "init_mode": "gpt2",
+        "normalization_type": null,
+        "n_devices": 1,
+        "attention_dir": "causal",
+        "attn_only": false,
+        "seed": 0,
+        "initializer_range": 0.13719886811400708,
+        "init_weights": true,
+        "scale_attn_by_inverse_layer_idx": false,
+        "positional_embedding_type": "standard",
+        "final_rms": false,
+        "d_vocab_out": 11,
+        "parallel_attn_mlp": false,
+        "rotary_dim": null,
+        "n_params": 384,
+        "use_hook_tokens": false,
+        "gated_mlp": false,
+        "default_prepend_bos": true,
+        "dtype": "torch.float32",
+        "tokenizer_prepends_bos": null,
+        "n_key_value_heads": null,
+        "post_embedding_ln": false,
+        "rotary_base": 10000,
+        "trust_remote_code": false,
+        "rotary_adjacent_pairs": false,
+        "load_in_4bit": false,
+        "num_experts": null,
+        "experts_per_token": null
+      },
+      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model_cfg.pkl",
+      "training_args": {
+        "output_dir": "/circuits-benchmark/results",
+        "atol": 0.05,
+        "lr": 0.001,
+        "use_single_loss": true,
+        "iit_weight": 1.0,
+        "behavior_weight": 0.4,
+        "strict_weight": 0.7,
+        "epochs": 1000,
+        "early_stop_accuracy_threshold": 99.9,
         "act_fn": "gelu",
+        "use_wandb": true,
+        "save_model_to_wandb": true,
         "clip_grad_norm": 0.1,
+        "lr_scheduler": "linear",
         "model_pair": "strict",
+        "same_size": false,
+        "seed": 92,
+        "batch_size": 256,
+        "include_mlp": false,
+        "detach_while_caching": true,
+        "scheduler_val_metric": [
+          "val/accuracy",
+          "val/IIA",
+          "val/strict_accuracy"
+        ],
+        "siit_sampling": "sample_all",
+        "val_iia_sampling": "all"
       },
+      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/meta.json",
+      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model.pth",
+      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/edges.pkl"
     },
     {
+      "case_id": "64",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/64",
+      "task_description": "Cubes each element in the sequence.",
       "vocab": [
+        0,
+        1,
+        2,
+        3,
+        4,
+        5,
+        6,
+        7,
+        8,
+        9,
+        10
       ],
       "max_seq_len": 10,
       "min_seq_len": 4,
       "files": [
         {
           "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl"
         },
         {
           "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth"
         },
         {
           "file_name": "ll_model_cfg.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl"
         },
         {
           "file_name": "meta.json",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json"
         }
       ],
       "transformer_cfg": {
         "n_layers": 2,
+        "d_model": 4,
         "n_ctx": 10,
         "d_head": 1,
         "model_name": "custom",
         "n_heads": 4,
+        "d_mlp": 16,
         "act_fn": "gelu",
+        "d_vocab": 13,
         "eps": 1e-05,
         "use_attn_result": true,
         "use_attn_scale": true,
         "attention_dir": "causal",
         "attn_only": false,
         "seed": 0,
+        "initializer_range": 0.1392621247645583,
         "init_weights": true,
         "scale_attn_by_inverse_layer_idx": false,
         "positional_embedding_type": "standard",
         "final_rms": false,
+        "d_vocab_out": 11,
         "parallel_attn_mlp": false,
         "rotary_dim": null,
+        "n_params": 384,
         "use_hook_tokens": false,
         "gated_mlp": false,
         "default_prepend_bos": true,
         "post_embedding_ln": false,
         "rotary_base": 10000,
         "trust_remote_code": false,
+        "rotary_adjacent_pairs": false,
+        "load_in_4bit": false,
+        "num_experts": null,
+        "experts_per_token": null
       },
+      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl",
       "training_args": {
+        "output_dir": "/circuits-benchmark/results",
         "atol": 0.05,
+        "lr": 0.001,
+        "use_single_loss": true,
         "iit_weight": 1.0,
+        "behavior_weight": 0.4,
+        "strict_weight": 0.7,
+        "epochs": 1000,
+        "early_stop_accuracy_threshold": 99.9,
         "act_fn": "gelu",
+        "use_wandb": true,
+        "save_model_to_wandb": true,
         "clip_grad_norm": 0.1,
+        "lr_scheduler": "linear",
+        "model_pair": "strict",
+        "same_size": false,
+        "seed": 67,
+        "batch_size": 256,
+        "include_mlp": false,
+        "detach_while_caching": true,
+        "scheduler_val_metric": [
+          "val/accuracy",
+          "val/IIA",
+          "val/strict_accuracy"
+        ],
+        "siit_sampling": "sample_all",
+        "val_iia_sampling": "all"
       },
+      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json",
+      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth",
+      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl"
     },
     {
+      "case_id": "8",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/8",
+      "task_description": "Identity",
       "vocab": [
         0,
         1,
       "files": [
         {
           "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl"
         },
         {
           "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth"
         },
         {
           "file_name": "ll_model_cfg.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl"
         },
         {
           "file_name": "meta.json",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json"
         }
       ],
       "transformer_cfg": {
         "num_experts": null,
         "experts_per_token": null
       },
+      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl",
       "training_args": {
         "output_dir": "/circuits-benchmark/results",
         "atol": 0.05,
         "siit_sampling": "sample_all",
         "val_iia_sampling": "all"
       },
+      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json",
+      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth",
+      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl"
     },
     {
+      "case_id": "73",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/73",
+      "task_description": "Apply the sine function to each element of the input sequence.",
       "vocab": [
         0,
         1,
       "files": [
         {
           "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/edges.pkl"
         },
         {
           "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model.pth"
         },
         {
           "file_name": "ll_model_cfg.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model_cfg.pkl"
         },
         {
           "file_name": "meta.json",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/meta.json"
         }
       ],
       "transformer_cfg": {
         "num_experts": null,
         "experts_per_token": null
       },
+      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model_cfg.pkl",
       "training_args": {
         "output_dir": "/circuits-benchmark/results",
         "atol": 0.05,
         "lr_scheduler": "linear",
         "model_pair": "strict",
         "same_size": false,
+        "seed": 92,
         "batch_size": 256,
         "include_mlp": false,
         "detach_while_caching": true,
         "siit_sampling": "sample_all",
         "val_iia_sampling": "all"
       },
+      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/meta.json",
+      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model.pth",
+      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/edges.pkl"
     },
     {
       "case_id": "103",
       "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model.pth",
       "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/edges.pkl"
     },
+    {
+      "case_id": "49",
+      "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/49",
+      "task_description": "Decrements each element in the sequence until it becomes a multiple of 3.",
+      "vocab": [
+        0,
+        1,
+        2,
+        3,
+        4,
+        5,
+        6,
+        7,
+        8,
+        9,
+        10
+      ],
+      "max_seq_len": 10,
+      "min_seq_len": 4,
+      "files": [
+        {
+          "file_name": "edges.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/edges.pkl"
+        },
+        {
+          "file_name": "ll_model.pth",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model.pth"
+        },
+        {
+          "file_name": "ll_model_cfg.pkl",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model_cfg.pkl"
+        },
+        {
+          "file_name": "meta.json",
+          "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/meta.json"
+        }
+      ],
+      "transformer_cfg": {
+        "n_layers": 2,
+        "d_model": 4,
+        "n_ctx": 10,
+        "d_head": 1,
+        "model_name": "custom",
+        "n_heads": 4,
+        "d_mlp": 16,
+        "act_fn": "gelu",
+        "d_vocab": 13,
+        "eps": 1e-05,
+        "use_attn_result": true,
+        "use_attn_scale": true,
+        "use_split_qkv_input": true,
+        "use_hook_mlp_in": true,
+        "use_attn_in": false,
+        "use_local_attn": false,
+        "original_architecture": null,
+        "from_checkpoint": false,
+        "checkpoint_index": null,
+        "checkpoint_label_type": null,
+        "checkpoint_value": null,
+        "tokenizer_name": null,
+        "window_size": null,
+        "attn_types": null,
+        "init_mode": "gpt2",
+        "normalization_type": null,
+        "n_devices": 1,
+        "attention_dir": "causal",
+        "attn_only": false,
+        "seed": 0,
+        "initializer_range": 0.15689290811054724,
+        "init_weights": true,
+        "scale_attn_by_inverse_layer_idx": false,
+        "positional_embedding_type": "standard",
+        "final_rms": false,
+        "d_vocab_out": 4,
+        "parallel_attn_mlp": false,
+        "rotary_dim": null,
+        "n_params": 384,
+        "use_hook_tokens": false,
+        "gated_mlp": false,
+        "default_prepend_bos": true,
+        "dtype": "torch.float32",
+        "tokenizer_prepends_bos": null,
+        "n_key_value_heads": null,
+        "post_embedding_ln": false,
+        "rotary_base": 10000,
+        "trust_remote_code": false,
+        "rotary_adjacent_pairs": false,
+        "load_in_4bit": false,
+        "num_experts": null,
+        "experts_per_token": null
+      },
+      "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model_cfg.pkl",
+      "training_args": {
+        "output_dir": "/circuits-benchmark/results",
+        "atol": 0.05,
+        "lr": 0.001,
+        "use_single_loss": true,
+        "iit_weight": 1.0,
+        "behavior_weight": 0.4,
+        "strict_weight": 0.7,
+        "epochs": 1000,
+        "early_stop_accuracy_threshold": 99.9,
+        "act_fn": "gelu",
+        "use_wandb": true,
+        "save_model_to_wandb": true,
+        "clip_grad_norm": 0.1,
+        "lr_scheduler": "linear",
+        "model_pair": "strict",
+        "same_size": false,
+        "seed": 92,
+        "batch_size": 256,
+        "include_mlp": false,
+        "detach_while_caching": true,
+        "scheduler_val_metric": [
+          "val/accuracy",
+          "val/IIA",
+          "val/strict_accuracy"
+        ],
+        "siit_sampling": "sample_all",
+        "val_iia_sampling": "all"
+      },
+      "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/meta.json",
+      "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model.pth",
+      "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/edges.pkl"
+    },
     {
       "case_id": "46",
       "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/46",