Add new models (#16)
Browse files- Add new models (16c725ef7db17b751e6fd485e830244efe7fd9da)
Co-authored-by: Ivan Arcuschin <[email protected]>
- 106/edges.pkl +3 -0
- 106/ll_model.pth +3 -0
- 106/ll_model_cfg.pkl +3 -0
- 106/meta.json +1 -0
- 121/edges.pkl +3 -0
- 121/ll_model.pth +3 -0
- 121/ll_model_cfg.pkl +3 -0
- 121/meta.json +1 -0
- 130/edges.pkl +3 -0
- 130/ll_model.pth +3 -0
- 130/ll_model_cfg.pkl +3 -0
- 130/meta.json +1 -0
- 15/edges.pkl +3 -0
- 15/ll_model.pth +3 -0
- 15/ll_model_cfg.pkl +3 -0
- 15/meta.json +1 -0
- 41/edges.pkl +3 -0
- 41/ll_model.pth +3 -0
- 41/ll_model_cfg.pkl +3 -0
- 41/meta.json +1 -0
- 43/edges.pkl +3 -0
- 43/ll_model.pth +3 -0
- 43/ll_model_cfg.pkl +3 -0
- 43/meta.json +1 -0
- 49/edges.pkl +3 -0
- 49/ll_model.pth +3 -0
- 49/ll_model_cfg.pkl +3 -0
- 49/meta.json +1 -0
- 66/edges.pkl +3 -0
- 66/ll_model.pth +3 -0
- 66/ll_model_cfg.pkl +3 -0
- 66/meta.json +1 -0
- 68/edges.pkl +3 -0
- 68/ll_model.pth +3 -0
- 68/ll_model_cfg.pkl +3 -0
- 68/meta.json +1 -0
- 73/edges.pkl +3 -0
- 73/ll_model.pth +3 -0
- 73/ll_model_cfg.pkl +3 -0
- 73/meta.json +1 -0
- benchmark_cases_metadata.csv +10 -0
- benchmark_cases_metadata.parquet +2 -2
- benchmark_metadata.json +1455 -156
106/edges.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fda9b02cdb2f5d7252c229a12290c6d81381606b1bfad02979549f304bf2a5d0
|
| 3 |
+
size 134
|
106/ll_model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:580798eae1391aca366f15c0442c3ef1c02b1b323d610d1d9ddee0faee5e664f
|
| 3 |
+
size 14698
|
106/ll_model_cfg.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:24bca874c32c8c431cdb732e3222b4090604cde6f05ce1359710b630220650e3
|
| 3 |
+
size 1093
|
106/meta.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 0.7, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-92-siit-weigth-0.7", "wandb_name": "case-106-seed-92-s-0.7-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 92, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
121/edges.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
|
| 3 |
+
size 113
|
121/ll_model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:8054e00aea3c35c5ee77c693f9feeba493c499fe3218e70780137938138a4675
|
| 3 |
+
size 15118
|
121/ll_model_cfg.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f027ad4de6828c6f5bb7a3f3c8aabd9658526e33b2284eba366977823b89c0a
|
| 3 |
+
size 1093
|
121/meta.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-121-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
130/edges.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:af2a7430f7477a79df1fce6300cf37e1c46d73c31a7f91e06221ef4a6ebf9bed
|
| 3 |
+
size 223
|
130/ll_model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4be63b6e0776e45f04d0905702a3a520b2b6449691ae6e34b8504693ac6805be
|
| 3 |
+
size 21304
|
130/ll_model_cfg.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:192503b894021c736145328500ab1f316e60ed7a121cf04b089bcd05d04e50b4
|
| 3 |
+
size 1093
|
130/meta.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-130-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
15/edges.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ecc8ce1a212f987b85ec909238ebc7d01d36c58389391fc96d69ca007fa2d384
|
| 3 |
+
size 244
|
15/ll_model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:22ff8d1015f06b8912051e6787ba4e058047facdaadd1d9322e7e89c070c131f
|
| 3 |
+
size 20728
|
15/ll_model_cfg.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f4162b8d5712db86a2025499b1561c655fd97402716ff352305c296c7a04ff65
|
| 3 |
+
size 1093
|
15/meta.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-15-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
41/edges.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
|
| 3 |
+
size 113
|
41/ll_model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7d59c31ceb0d0c9afb12dc1f63ade3c4f9edba0dfd80d5779ae27188da2c21d8
|
| 3 |
+
size 14862
|
41/ll_model_cfg.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f1dee34cba288862b06c2ff669839e06b6c17aa46cdb685f4a2c5a8c3be8a39b
|
| 3 |
+
size 1093
|
41/meta.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-41-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
43/edges.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
|
| 3 |
+
size 113
|
43/ll_model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:26cc6d6ffa5ae93ce73055d831d4a7119bca2166c2ed9731992c48b4b3debb49
|
| 3 |
+
size 15054
|
43/ll_model_cfg.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:89a74c42552b846f4562163c6fe74a474edfa36e1972eb97bb3ce0d8aaf9444c
|
| 3 |
+
size 1093
|
43/meta.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-43-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
49/edges.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
|
| 3 |
+
size 113
|
49/ll_model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:aab9be464531a3cf85f25e3ccb3153c15b6de9876d56799d8705d0784979a1ea
|
| 3 |
+
size 14634
|
49/ll_model_cfg.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2e47363d4486f828a419ba208bee3a725d431ab80e418a8318f55cf6cd6bf310
|
| 3 |
+
size 1093
|
49/meta.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 0.7, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-92-siit-weigth-0.7", "wandb_name": "case-49-seed-92-s-0.7-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 92, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
66/edges.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
|
| 3 |
+
size 113
|
66/ll_model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fa63d9e5b124ffb9ce9061e04b03b1ff551c8085fc51ddea31f488b152f5f7c3
|
| 3 |
+
size 14762
|
66/ll_model_cfg.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b04d734fcc61084204ead0d8cc11c5782598f6f6e4bf3e14b94eab7b0bc9d676
|
| 3 |
+
size 1093
|
66/meta.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 0.7, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-92-siit-weigth-0.7", "wandb_name": "case-66-seed-92-s-0.7-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 92, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
68/edges.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
|
| 3 |
+
size 113
|
68/ll_model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a1b739ebc05faa4d388c20ef60ab59e44695c4a82323ed7c9c3801ae8e502db9
|
| 3 |
+
size 14670
|
68/ll_model_cfg.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:be188cb9baf70c65af2c4ecf92c6de170c15a41599109f95c6b632f15bb3eec3
|
| 3 |
+
size 1093
|
68/meta.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-68-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
73/edges.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
|
| 3 |
+
size 113
|
73/ll_model.pth
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:809fe1d4c9f818bac9a85b358d0722f6ed8527d56f988fe66d62f0eceac0f097
|
| 3 |
+
size 14698
|
73/ll_model_cfg.pkl
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:db76917a80935813594508b1d79b7a0836a20daf67e263161432430b095fd111
|
| 3 |
+
size 1093
|
73/meta.json
ADDED
|
@@ -0,0 +1 @@
|
|
|
|
|
|
|
| 1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 0.7, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-92-siit-weigth-0.7", "wandb_name": "case-73-seed-92-s-0.7-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 92, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
benchmark_cases_metadata.csv
CHANGED
|
@@ -27,6 +27,7 @@ ioi,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi,Indirect O
|
|
| 27 |
30,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/30,Tags numeric tokens in a sequence based on whether they fall within a given range.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 28 |
90,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/90,Replaces a specific token with another one.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/edges.pkl,2,4,10,1,custom,4,16,gelu,12,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1460593486680443,True,False,standard,False,9,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 29 |
39,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/39,Returns the fraction of 'x' in the input up to the i-th position for all i.,60,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/edges.pkl,2,120,60,30,custom,4,480,gelu,28,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.08432740427115679,True,False,standard,False,1,False,345600,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
|
| 30 |
75,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/75,Double each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 31 |
101,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/101,Check if each element is a square of an integer.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 32 |
ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi_next_token,"Indirect Object Identification (IOI) task, trained using next token prediction.",16,16,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/edges.pkl,6,64,1024,16,gpt2,4,3072,gelu_new,50257,1e-05,False,True,False,False,False,False,GPT2LMHeadModel,False,gpt2,gpt2,LNPre,1,causal,False,,0.02886751345948129,True,False,standard,False,50257,False,2457600,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.001,False,1.0,1.0,0.4,,,,True,True,1.0,,,True,,256.0,True,True,"val/accuracy,val/IIA",,,True,0.65,False,0.0,True,max,,True,
|
|
@@ -34,14 +35,17 @@ ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi
|
|
| 34 |
14,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/14,Returns the count of 'a' in the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/edges.pkl,2,8,10,2,custom,4,32,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.15689290811054724,True,False,standard,False,10,False,1536,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 35 |
95,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/95,Counts the distinct prime factors of each number in the input list.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12060453783110546,True,False,standard,False,3,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 36 |
84,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/84,Apply the arctangent function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
|
| 37 |
93,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/93,Swaps the nth with the n+1th element if n%2==1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/edges.pkl,3,20,10,5,custom,4,80,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10886621079036347,True,False,standard,False,11,False,14400,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 38 |
37,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/37,Reverses each word in the sequence except for specified exclusions.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/edges.pkl,2,12,10,3,custom,4,48,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,8,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
| 39 |
34,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/34,Calculate the ratio of vowels to consonants in each word.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/edges.pkl,2,16,10,4,custom,4,64,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16329931618554522,True,False,standard,False,5,False,6144,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
| 40 |
26,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/26,Creates a cascading effect by repeating each token in sequence incrementally.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/edges.pkl,2,21,10,5,custom,4,84,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12344267996967354,True,False,standard,False,27,False,10416,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
|
|
|
| 41 |
19,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/19,Removes consecutive duplicate tokens from a sequence.,15,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/edges.pkl,2,32,15,8,custom,4,128,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.15689290811054724,True,False,standard,False,3,False,24576,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.001,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,,True,,,True,True,,,,True,,True,,True,,,True,
|
| 42 |
53,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/53,Increment elements at odd indices by 1,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13151918984428584,True,False,standard,False,12,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 43 |
40,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/40,Sum the last and previous to last digits of a number,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/edges.pkl,2,4,10,1,custom,4,16,gelu,31,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.09847319278346618,True,False,standard,False,12,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 44 |
51,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/51,Checks if each element is a Fibonacci number,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/edges.pkl,2,4,10,1,custom,4,16,gelu,102,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.07525766947068778,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
|
| 45 |
122,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/122,Check if each number is divisible by 3.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 46 |
85,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/85,Square each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 47 |
2,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/2,Reverse the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/edges.pkl,4,56,10,14,custom,4,224,gelu,28,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.07593263966019993,True,False,standard,False,26,False,150528,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
@@ -51,6 +55,7 @@ ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi
|
|
| 51 |
20,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/20,Detect spam messages based on appearance of spam keywords.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/edges.pkl,2,13,10,3,custom,4,52,gelu,14,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16,True,False,standard,False,2,False,3952,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
| 52 |
25,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/25,Normalizes token frequencies in a sequence to a range between 0 and 1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/edges.pkl,2,62,10,15,custom,4,248,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.08295613557843402,True,False,standard,False,56,False,91264,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 53 |
11,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/11,Counts the number of words in a sequence based on their length.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/edges.pkl,2,12,10,3,custom,4,48,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1460593486680443,True,False,standard,False,5,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,500.0,,gelu,True,True,1.0,,,True,,,True,True,,,,True,,True,,True,,,True,
|
|
|
|
| 54 |
54,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/54,Applies the hyperbolic tangent to each element.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 55 |
124,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/124,Check if all elements in a list are equal.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.11547005383792516,True,False,standard,False,2,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 56 |
102,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/102,"Reflects each element within a range (default is [2, 7]).",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/edges.pkl,2,4,10,1,custom,4,16,gelu,42,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1059625885652035,True,False,standard,False,6,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
@@ -60,15 +65,20 @@ ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi
|
|
| 60 |
86,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/86,"Check if each element is a power of 2. Return 1 if true, otherwise 0.",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16329931618554522,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 61 |
105,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/105,Replaces each number with the next prime after that number.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.11202240672224079,True,False,standard,False,10,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 62 |
58,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/58,Mirrors the first half of the sequence to the second half.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/edges.pkl,3,32,10,8,custom,4,128,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10415112878465911,True,False,standard,False,11,False,36864,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
|
| 63 |
70,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/70,Apply the cosine function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 64 |
62,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/62,Replaces each element with its factorial.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1414213562373095,True,False,standard,False,10,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 65 |
111,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/111,Returns the last element of the sequence and pads the rest with zeros.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.09847319278346618,True,False,standard,False,11,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
|
| 66 |
35,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/35,Alternates capitalization of each character in words.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/edges.pkl,2,9,10,2,custom,4,36,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,8,False,1872,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
| 67 |
3,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/3,Returns the fraction of 'x' in the input up to the i-th position for all i.,5,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/edges.pkl,2,12,5,3,custom,4,48,gelu,6,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.22188007849009167,True,False,standard,False,1,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,10.0,2000.0,,gelu,True,True,0.1,,strict,False,,,True,True,,,,True,,True,,True,,,True,
|
| 68 |
36,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/36,"Classifies each token as 'positive', 'negative', or 'neutral' based on emojis.",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl,2,6,10,1,custom,4,24,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.19402850002906638,True,False,standard,False,3,False,768,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
|
|
|
| 69 |
64,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/64,Cubes each element in the sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 70 |
8,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/8,Identity,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
|
| 71 |
103,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/103,Swap consecutive numbers in a list,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10787197799411874,True,False,standard,False,11,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 72 |
56,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/56,Sets every third element to zero.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13333333333333333,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 73 |
97,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/97,Scale a sequence by its maximum element.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/edges.pkl,3,200,10,50,custom,4,800,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.05405899027195888,True,False,standard,False,64,False,1440000,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
|
| 74 |
46,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/46,Decrements each element in the sequence by 1,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
|
| 27 |
30,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/30,Tags numeric tokens in a sequence based on whether they fall within a given range.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 28 |
90,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/90,Replaces a specific token with another one.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/edges.pkl,2,4,10,1,custom,4,16,gelu,12,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1460593486680443,True,False,standard,False,9,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 29 |
39,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/39,Returns the fraction of 'x' in the input up to the i-th position for all i.,60,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/edges.pkl,2,120,60,30,custom,4,480,gelu,28,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.08432740427115679,True,False,standard,False,1,False,345600,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 30 |
+
130,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/130,"Clips each element to be within a range (make the default range [2, 7]).",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/edges.pkl,3,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.10079052613579392,True,False,standard,False,6,False,576,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 31 |
75,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/75,Double each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 32 |
101,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/101,Check if each element is a square of an integer.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 33 |
ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi_next_token,"Indirect Object Identification (IOI) task, trained using next token prediction.",16,16,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/edges.pkl,6,64,1024,16,gpt2,4,3072,gelu_new,50257,1e-05,False,True,False,False,False,False,GPT2LMHeadModel,False,gpt2,gpt2,LNPre,1,causal,False,,0.02886751345948129,True,False,standard,False,50257,False,2457600,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.001,False,1.0,1.0,0.4,,,,True,True,1.0,,,True,,256.0,True,True,"val/accuracy,val/IIA",,,True,0.65,False,0.0,True,max,,True,
|
|
|
|
| 35 |
14,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/14,Returns the count of 'a' in the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/edges.pkl,2,8,10,2,custom,4,32,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.15689290811054724,True,False,standard,False,10,False,1536,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 36 |
95,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/95,Counts the distinct prime factors of each number in the input list.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12060453783110546,True,False,standard,False,3,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 37 |
84,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/84,Apply the arctangent function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 38 |
+
66,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/66,Round each element in the input sequence to the nearest integer.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/edges.pkl,2,4,10,1,custom,4,16,gelu,22,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13151918984428584,True,False,standard,False,6,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,92.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 39 |
93,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/93,Swaps the nth with the n+1th element if n%2==1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/edges.pkl,3,20,10,5,custom,4,80,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10886621079036347,True,False,standard,False,11,False,14400,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 40 |
37,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/37,Reverses each word in the sequence except for specified exclusions.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/edges.pkl,2,12,10,3,custom,4,48,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,8,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
| 41 |
34,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/34,Calculate the ratio of vowels to consonants in each word.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/edges.pkl,2,16,10,4,custom,4,64,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16329931618554522,True,False,standard,False,5,False,6144,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
| 42 |
26,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/26,Creates a cascading effect by repeating each token in sequence incrementally.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/edges.pkl,2,21,10,5,custom,4,84,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12344267996967354,True,False,standard,False,27,False,10416,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
| 43 |
+
15,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/15,Returns each token multiplied by two and subtracted by its index.,5,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/edges.pkl,3,4,5,1,custom,4,16,gelu,7,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.06553855364152325,True,False,standard,False,12,False,576,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 44 |
19,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/19,Removes consecutive duplicate tokens from a sequence.,15,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/edges.pkl,2,32,15,8,custom,4,128,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.15689290811054724,True,False,standard,False,3,False,24576,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.001,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,,True,,,True,True,,,,True,,True,,True,,,True,
|
| 45 |
53,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/53,Increment elements at odd indices by 1,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13151918984428584,True,False,standard,False,12,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 46 |
40,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/40,Sum the last and previous to last digits of a number,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/edges.pkl,2,4,10,1,custom,4,16,gelu,31,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.09847319278346618,True,False,standard,False,12,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 47 |
51,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/51,Checks if each element is a Fibonacci number,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/edges.pkl,2,4,10,1,custom,4,16,gelu,102,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.07525766947068778,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 48 |
+
43,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/43,Returns the corresponding Fibonacci number for each element in the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/edges.pkl,2,4,10,1,custom,4,16,gelu,22,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1131370849898476,True,False,standard,False,19,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 49 |
122,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/122,Check if each number is divisible by 3.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 50 |
85,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/85,Square each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 51 |
2,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/2,Reverse the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/edges.pkl,4,56,10,14,custom,4,224,gelu,28,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.07593263966019993,True,False,standard,False,26,False,150528,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
|
| 55 |
20,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/20,Detect spam messages based on appearance of spam keywords.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/edges.pkl,2,13,10,3,custom,4,52,gelu,14,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16,True,False,standard,False,2,False,3952,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
| 56 |
25,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/25,Normalizes token frequencies in a sequence to a range between 0 and 1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/edges.pkl,2,62,10,15,custom,4,248,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.08295613557843402,True,False,standard,False,56,False,91264,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 57 |
11,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/11,Counts the number of words in a sequence based on their length.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/edges.pkl,2,12,10,3,custom,4,48,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1460593486680443,True,False,standard,False,5,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,500.0,,gelu,True,True,1.0,,,True,,,True,True,,,,True,,True,,True,,,True,
|
| 58 |
+
41,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/41,Make each element of the input sequence absolute,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/edges.pkl,2,4,10,1,custom,4,16,gelu,22,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12344267996967354,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 59 |
54,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/54,Applies the hyperbolic tangent to each element.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 60 |
124,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/124,Check if all elements in a list are equal.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.11547005383792516,True,False,standard,False,2,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 61 |
102,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/102,"Reflects each element within a range (default is [2, 7]).",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/edges.pkl,2,4,10,1,custom,4,16,gelu,42,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1059625885652035,True,False,standard,False,6,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
|
| 65 |
86,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/86,"Check if each element is a power of 2. Return 1 if true, otherwise 0.",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16329931618554522,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 66 |
105,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/105,Replaces each number with the next prime after that number.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.11202240672224079,True,False,standard,False,10,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 67 |
58,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/58,Mirrors the first half of the sequence to the second half.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/edges.pkl,3,32,10,8,custom,4,128,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10415112878465911,True,False,standard,False,11,False,36864,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 68 |
+
68,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/68,Increment each element until it becomes a multiple of 3,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,5,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 69 |
70,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/70,Apply the cosine function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 70 |
62,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/62,Replaces each element with its factorial.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1414213562373095,True,False,standard,False,10,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 71 |
111,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/111,Returns the last element of the sequence and pads the rest with zeros.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.09847319278346618,True,False,standard,False,11,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 72 |
+
121,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/121,Compute arcsine of all elements in the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/edges.pkl,2,4,10,1,custom,4,16,gelu,22,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.11202240672224079,True,False,standard,False,20,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 73 |
35,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/35,Alternates capitalization of each character in words.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/edges.pkl,2,9,10,2,custom,4,36,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,8,False,1872,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
| 74 |
3,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/3,Returns the fraction of 'x' in the input up to the i-th position for all i.,5,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/edges.pkl,2,12,5,3,custom,4,48,gelu,6,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.22188007849009167,True,False,standard,False,1,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,10.0,2000.0,,gelu,True,True,0.1,,strict,False,,,True,True,,,,True,,True,,True,,,True,
|
| 75 |
36,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/36,"Classifies each token as 'positive', 'negative', or 'neutral' based on emojis.",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl,2,6,10,1,custom,4,24,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.19402850002906638,True,False,standard,False,3,False,768,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
| 76 |
+
106,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/106,Sets all elements to zero except for the element at index 1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13719886811400708,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,92.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 77 |
64,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/64,Cubes each element in the sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 78 |
8,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/8,Identity,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 79 |
+
73,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/73,Apply the sine function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,92.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 80 |
103,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/103,Swap consecutive numbers in a list,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10787197799411874,True,False,standard,False,11,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 81 |
56,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/56,Sets every third element to zero.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13333333333333333,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 82 |
97,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/97,Scale a sequence by its maximum element.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/edges.pkl,3,200,10,50,custom,4,800,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.05405899027195888,True,False,standard,False,64,False,1440000,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 83 |
+
49,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/49,Decrements each element in the sequence until it becomes a multiple of 3.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.15689290811054724,True,False,standard,False,4,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,92.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
| 84 |
46,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/46,Decrements each element in the sequence by 1,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
benchmark_cases_metadata.parquet
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:049d63f22c918edb98d89c9eb69f091016c4780b033e5559523abd7e50188238
|
| 3 |
+
size 76100
|
benchmark_metadata.json
CHANGED
|
@@ -3352,6 +3352,150 @@
|
|
| 3352 |
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model.pth",
|
| 3353 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/edges.pkl"
|
| 3354 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 3355 |
{
|
| 3356 |
"case_id": "75",
|
| 3357 |
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/75",
|
|
@@ -4233,6 +4377,140 @@
|
|
| 4233 |
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model.pth",
|
| 4234 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/edges.pkl"
|
| 4235 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4236 |
{
|
| 4237 |
"case_id": "93",
|
| 4238 |
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/93",
|
|
@@ -4663,40 +4941,159 @@
|
|
| 4663 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/edges.pkl"
|
| 4664 |
},
|
| 4665 |
{
|
| 4666 |
-
"case_id": "
|
| 4667 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/
|
| 4668 |
-
"task_description": "
|
| 4669 |
"vocab": [
|
| 4670 |
-
|
| 4671 |
-
|
| 4672 |
-
|
|
|
|
|
|
|
| 4673 |
],
|
| 4674 |
-
"max_seq_len":
|
| 4675 |
"min_seq_len": 4,
|
| 4676 |
"files": [
|
| 4677 |
{
|
| 4678 |
"file_name": "edges.pkl",
|
| 4679 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 4680 |
},
|
| 4681 |
{
|
| 4682 |
"file_name": "ll_model.pth",
|
| 4683 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 4684 |
},
|
| 4685 |
{
|
| 4686 |
"file_name": "ll_model_cfg.pkl",
|
| 4687 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 4688 |
},
|
| 4689 |
{
|
| 4690 |
"file_name": "meta.json",
|
| 4691 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 4692 |
}
|
| 4693 |
],
|
| 4694 |
"transformer_cfg": {
|
| 4695 |
-
"n_layers":
|
| 4696 |
-
"d_model":
|
| 4697 |
-
"n_ctx":
|
| 4698 |
-
"d_head":
|
| 4699 |
-
"model_name": "custom",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 4700 |
"n_heads": 4,
|
| 4701 |
"d_mlp": 128,
|
| 4702 |
"act_fn": "gelu",
|
|
@@ -5241,6 +5638,140 @@
|
|
| 5241 |
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model.pth",
|
| 5242 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/edges.pkl"
|
| 5243 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 5244 |
{
|
| 5245 |
"case_id": "122",
|
| 5246 |
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/122",
|
|
@@ -6371,10 +6902,20 @@
|
|
| 6371 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/edges.pkl"
|
| 6372 |
},
|
| 6373 |
{
|
| 6374 |
-
"case_id": "
|
| 6375 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/
|
| 6376 |
-
"task_description": "
|
| 6377 |
"vocab": [
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 6378 |
0,
|
| 6379 |
1,
|
| 6380 |
2,
|
|
@@ -6384,19 +6925,143 @@
|
|
| 6384 |
6,
|
| 6385 |
7,
|
| 6386 |
8,
|
| 6387 |
-
9
|
| 6388 |
-
10
|
| 6389 |
],
|
| 6390 |
"max_seq_len": 10,
|
| 6391 |
"min_seq_len": 4,
|
| 6392 |
"files": [
|
| 6393 |
{
|
| 6394 |
"file_name": "edges.pkl",
|
| 6395 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 6396 |
},
|
| 6397 |
{
|
| 6398 |
"file_name": "ll_model.pth",
|
| 6399 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 6400 |
},
|
| 6401 |
{
|
| 6402 |
"file_name": "ll_model_cfg.pkl",
|
|
@@ -7572,9 +8237,9 @@
|
|
| 7572 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/edges.pkl"
|
| 7573 |
},
|
| 7574 |
{
|
| 7575 |
-
"case_id": "
|
| 7576 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/
|
| 7577 |
-
"task_description": "
|
| 7578 |
"vocab": [
|
| 7579 |
0,
|
| 7580 |
1,
|
|
@@ -7593,19 +8258,19 @@
|
|
| 7593 |
"files": [
|
| 7594 |
{
|
| 7595 |
"file_name": "edges.pkl",
|
| 7596 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7597 |
},
|
| 7598 |
{
|
| 7599 |
"file_name": "ll_model.pth",
|
| 7600 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7601 |
},
|
| 7602 |
{
|
| 7603 |
"file_name": "ll_model_cfg.pkl",
|
| 7604 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7605 |
},
|
| 7606 |
{
|
| 7607 |
"file_name": "meta.json",
|
| 7608 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7609 |
}
|
| 7610 |
],
|
| 7611 |
"transformer_cfg": {
|
|
@@ -7639,12 +8304,12 @@
|
|
| 7639 |
"attention_dir": "causal",
|
| 7640 |
"attn_only": false,
|
| 7641 |
"seed": 0,
|
| 7642 |
-
"initializer_range": 0.
|
| 7643 |
"init_weights": true,
|
| 7644 |
"scale_attn_by_inverse_layer_idx": false,
|
| 7645 |
"positional_embedding_type": "standard",
|
| 7646 |
"final_rms": false,
|
| 7647 |
-
"d_vocab_out":
|
| 7648 |
"parallel_attn_mlp": false,
|
| 7649 |
"rotary_dim": null,
|
| 7650 |
"n_params": 384,
|
|
@@ -7662,7 +8327,7 @@
|
|
| 7662 |
"num_experts": null,
|
| 7663 |
"experts_per_token": null
|
| 7664 |
},
|
| 7665 |
-
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7666 |
"training_args": {
|
| 7667 |
"output_dir": "/circuits-benchmark/results",
|
| 7668 |
"atol": 0.05,
|
|
@@ -7670,7 +8335,7 @@
|
|
| 7670 |
"use_single_loss": true,
|
| 7671 |
"iit_weight": 1.0,
|
| 7672 |
"behavior_weight": 0.4,
|
| 7673 |
-
"strict_weight": 0
|
| 7674 |
"epochs": 1000,
|
| 7675 |
"early_stop_accuracy_threshold": 99.9,
|
| 7676 |
"act_fn": "gelu",
|
|
@@ -7692,14 +8357,14 @@
|
|
| 7692 |
"siit_sampling": "sample_all",
|
| 7693 |
"val_iia_sampling": "all"
|
| 7694 |
},
|
| 7695 |
-
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7696 |
-
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7697 |
-
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7698 |
},
|
| 7699 |
{
|
| 7700 |
-
"case_id": "
|
| 7701 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/
|
| 7702 |
-
"task_description": "
|
| 7703 |
"vocab": [
|
| 7704 |
0,
|
| 7705 |
1,
|
|
@@ -7718,19 +8383,19 @@
|
|
| 7718 |
"files": [
|
| 7719 |
{
|
| 7720 |
"file_name": "edges.pkl",
|
| 7721 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7722 |
},
|
| 7723 |
{
|
| 7724 |
"file_name": "ll_model.pth",
|
| 7725 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7726 |
},
|
| 7727 |
{
|
| 7728 |
"file_name": "ll_model_cfg.pkl",
|
| 7729 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7730 |
},
|
| 7731 |
{
|
| 7732 |
"file_name": "meta.json",
|
| 7733 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7734 |
}
|
| 7735 |
],
|
| 7736 |
"transformer_cfg": {
|
|
@@ -7764,12 +8429,12 @@
|
|
| 7764 |
"attention_dir": "causal",
|
| 7765 |
"attn_only": false,
|
| 7766 |
"seed": 0,
|
| 7767 |
-
"initializer_range": 0.
|
| 7768 |
"init_weights": true,
|
| 7769 |
"scale_attn_by_inverse_layer_idx": false,
|
| 7770 |
"positional_embedding_type": "standard",
|
| 7771 |
"final_rms": false,
|
| 7772 |
-
"d_vocab_out":
|
| 7773 |
"parallel_attn_mlp": false,
|
| 7774 |
"rotary_dim": null,
|
| 7775 |
"n_params": 384,
|
|
@@ -7787,7 +8452,7 @@
|
|
| 7787 |
"num_experts": null,
|
| 7788 |
"experts_per_token": null
|
| 7789 |
},
|
| 7790 |
-
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7791 |
"training_args": {
|
| 7792 |
"output_dir": "/circuits-benchmark/results",
|
| 7793 |
"atol": 0.05,
|
|
@@ -7817,14 +8482,14 @@
|
|
| 7817 |
"siit_sampling": "sample_all",
|
| 7818 |
"val_iia_sampling": "all"
|
| 7819 |
},
|
| 7820 |
-
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7821 |
-
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7822 |
-
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7823 |
},
|
| 7824 |
{
|
| 7825 |
-
"case_id": "
|
| 7826 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/
|
| 7827 |
-
"task_description": "
|
| 7828 |
"vocab": [
|
| 7829 |
0,
|
| 7830 |
1,
|
|
@@ -7843,29 +8508,29 @@
|
|
| 7843 |
"files": [
|
| 7844 |
{
|
| 7845 |
"file_name": "edges.pkl",
|
| 7846 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7847 |
},
|
| 7848 |
{
|
| 7849 |
"file_name": "ll_model.pth",
|
| 7850 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7851 |
},
|
| 7852 |
{
|
| 7853 |
"file_name": "ll_model_cfg.pkl",
|
| 7854 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7855 |
},
|
| 7856 |
{
|
| 7857 |
"file_name": "meta.json",
|
| 7858 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7859 |
}
|
| 7860 |
],
|
| 7861 |
"transformer_cfg": {
|
| 7862 |
-
"n_layers":
|
| 7863 |
-
"d_model":
|
| 7864 |
"n_ctx": 10,
|
| 7865 |
-
"d_head":
|
| 7866 |
"model_name": "custom",
|
| 7867 |
"n_heads": 4,
|
| 7868 |
-
"d_mlp":
|
| 7869 |
"act_fn": "gelu",
|
| 7870 |
"d_vocab": 13,
|
| 7871 |
"eps": 1e-05,
|
|
@@ -7886,18 +8551,18 @@
|
|
| 7886 |
"init_mode": "gpt2",
|
| 7887 |
"normalization_type": null,
|
| 7888 |
"n_devices": 1,
|
| 7889 |
-
"attention_dir": "
|
| 7890 |
"attn_only": false,
|
| 7891 |
"seed": 0,
|
| 7892 |
-
"initializer_range": 0.
|
| 7893 |
"init_weights": true,
|
| 7894 |
"scale_attn_by_inverse_layer_idx": false,
|
| 7895 |
"positional_embedding_type": "standard",
|
| 7896 |
"final_rms": false,
|
| 7897 |
-
"d_vocab_out":
|
| 7898 |
"parallel_attn_mlp": false,
|
| 7899 |
"rotary_dim": null,
|
| 7900 |
-
"n_params":
|
| 7901 |
"use_hook_tokens": false,
|
| 7902 |
"gated_mlp": false,
|
| 7903 |
"default_prepend_bos": true,
|
|
@@ -7912,7 +8577,7 @@
|
|
| 7912 |
"num_experts": null,
|
| 7913 |
"experts_per_token": null
|
| 7914 |
},
|
| 7915 |
-
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7916 |
"training_args": {
|
| 7917 |
"output_dir": "/circuits-benchmark/results",
|
| 7918 |
"atol": 0.05,
|
|
@@ -7920,7 +8585,7 @@
|
|
| 7920 |
"use_single_loss": true,
|
| 7921 |
"iit_weight": 1.0,
|
| 7922 |
"behavior_weight": 0.4,
|
| 7923 |
-
"strict_weight": 0.
|
| 7924 |
"epochs": 1000,
|
| 7925 |
"early_stop_accuracy_threshold": 99.9,
|
| 7926 |
"act_fn": "gelu",
|
|
@@ -7942,54 +8607,57 @@
|
|
| 7942 |
"siit_sampling": "sample_all",
|
| 7943 |
"val_iia_sampling": "all"
|
| 7944 |
},
|
| 7945 |
-
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7946 |
-
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7947 |
-
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7948 |
},
|
| 7949 |
{
|
| 7950 |
-
"case_id": "
|
| 7951 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/
|
| 7952 |
-
"task_description": "
|
| 7953 |
"vocab": [
|
| 7954 |
-
|
| 7955 |
-
|
| 7956 |
-
|
| 7957 |
-
|
| 7958 |
-
|
| 7959 |
-
|
| 7960 |
-
|
| 7961 |
-
|
|
|
|
|
|
|
|
|
|
| 7962 |
],
|
| 7963 |
"max_seq_len": 10,
|
| 7964 |
"min_seq_len": 4,
|
| 7965 |
"files": [
|
| 7966 |
{
|
| 7967 |
"file_name": "edges.pkl",
|
| 7968 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7969 |
},
|
| 7970 |
{
|
| 7971 |
"file_name": "ll_model.pth",
|
| 7972 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7973 |
},
|
| 7974 |
{
|
| 7975 |
"file_name": "ll_model_cfg.pkl",
|
| 7976 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7977 |
},
|
| 7978 |
{
|
| 7979 |
"file_name": "meta.json",
|
| 7980 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 7981 |
}
|
| 7982 |
],
|
| 7983 |
"transformer_cfg": {
|
| 7984 |
-
"n_layers":
|
| 7985 |
-
"d_model":
|
| 7986 |
"n_ctx": 10,
|
| 7987 |
-
"d_head":
|
| 7988 |
"model_name": "custom",
|
| 7989 |
"n_heads": 4,
|
| 7990 |
-
"d_mlp":
|
| 7991 |
"act_fn": "gelu",
|
| 7992 |
-
"d_vocab":
|
| 7993 |
"eps": 1e-05,
|
| 7994 |
"use_attn_result": true,
|
| 7995 |
"use_attn_scale": true,
|
|
@@ -8008,18 +8676,18 @@
|
|
| 8008 |
"init_mode": "gpt2",
|
| 8009 |
"normalization_type": null,
|
| 8010 |
"n_devices": 1,
|
| 8011 |
-
"attention_dir": "
|
| 8012 |
"attn_only": false,
|
| 8013 |
"seed": 0,
|
| 8014 |
-
"initializer_range": 0.
|
| 8015 |
"init_weights": true,
|
| 8016 |
"scale_attn_by_inverse_layer_idx": false,
|
| 8017 |
"positional_embedding_type": "standard",
|
| 8018 |
"final_rms": false,
|
| 8019 |
-
"d_vocab_out":
|
| 8020 |
"parallel_attn_mlp": false,
|
| 8021 |
"rotary_dim": null,
|
| 8022 |
-
"n_params":
|
| 8023 |
"use_hook_tokens": false,
|
| 8024 |
"gated_mlp": false,
|
| 8025 |
"default_prepend_bos": true,
|
|
@@ -8029,9 +8697,265 @@
|
|
| 8029 |
"post_embedding_ln": false,
|
| 8030 |
"rotary_base": 10000,
|
| 8031 |
"trust_remote_code": false,
|
| 8032 |
-
"rotary_adjacent_pairs": false
|
| 8033 |
-
|
| 8034 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 8035 |
"training_args": {
|
| 8036 |
"atol": 0.05,
|
| 8037 |
"lr": 0.01,
|
|
@@ -8136,58 +9060,289 @@
|
|
| 8136 |
"lr": 0.01,
|
| 8137 |
"use_single_loss": false,
|
| 8138 |
"iit_weight": 1.0,
|
| 8139 |
-
"behavior_weight": 1.0,
|
| 8140 |
-
"strict_weight": 10.0,
|
| 8141 |
-
"epochs": 2000,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 8142 |
"act_fn": "gelu",
|
|
|
|
|
|
|
| 8143 |
"clip_grad_norm": 0.1,
|
| 8144 |
-
"lr_scheduler": "",
|
| 8145 |
"model_pair": "strict",
|
| 8146 |
-
"same_size": false
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 8147 |
},
|
| 8148 |
-
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8149 |
-
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8150 |
-
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8151 |
},
|
| 8152 |
{
|
| 8153 |
-
"case_id": "
|
| 8154 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/
|
| 8155 |
-
"task_description": "
|
| 8156 |
"vocab": [
|
| 8157 |
-
|
| 8158 |
-
|
| 8159 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 8160 |
],
|
| 8161 |
"max_seq_len": 10,
|
| 8162 |
"min_seq_len": 4,
|
| 8163 |
"files": [
|
| 8164 |
{
|
| 8165 |
"file_name": "edges.pkl",
|
| 8166 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8167 |
},
|
| 8168 |
{
|
| 8169 |
"file_name": "ll_model.pth",
|
| 8170 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8171 |
},
|
| 8172 |
{
|
| 8173 |
"file_name": "ll_model_cfg.pkl",
|
| 8174 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8175 |
},
|
| 8176 |
{
|
| 8177 |
"file_name": "meta.json",
|
| 8178 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8179 |
}
|
| 8180 |
],
|
| 8181 |
"transformer_cfg": {
|
| 8182 |
"n_layers": 2,
|
| 8183 |
-
"d_model":
|
| 8184 |
"n_ctx": 10,
|
| 8185 |
"d_head": 1,
|
| 8186 |
"model_name": "custom",
|
| 8187 |
"n_heads": 4,
|
| 8188 |
-
"d_mlp":
|
| 8189 |
"act_fn": "gelu",
|
| 8190 |
-
"d_vocab":
|
| 8191 |
"eps": 1e-05,
|
| 8192 |
"use_attn_result": true,
|
| 8193 |
"use_attn_scale": true,
|
|
@@ -8209,15 +9364,15 @@
|
|
| 8209 |
"attention_dir": "causal",
|
| 8210 |
"attn_only": false,
|
| 8211 |
"seed": 0,
|
| 8212 |
-
"initializer_range": 0.
|
| 8213 |
"init_weights": true,
|
| 8214 |
"scale_attn_by_inverse_layer_idx": false,
|
| 8215 |
"positional_embedding_type": "standard",
|
| 8216 |
"final_rms": false,
|
| 8217 |
-
"d_vocab_out":
|
| 8218 |
"parallel_attn_mlp": false,
|
| 8219 |
"rotary_dim": null,
|
| 8220 |
-
"n_params":
|
| 8221 |
"use_hook_tokens": false,
|
| 8222 |
"gated_mlp": false,
|
| 8223 |
"default_prepend_bos": true,
|
|
@@ -8227,30 +9382,49 @@
|
|
| 8227 |
"post_embedding_ln": false,
|
| 8228 |
"rotary_base": 10000,
|
| 8229 |
"trust_remote_code": false,
|
| 8230 |
-
"rotary_adjacent_pairs": false
|
|
|
|
|
|
|
|
|
|
| 8231 |
},
|
| 8232 |
-
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8233 |
"training_args": {
|
|
|
|
| 8234 |
"atol": 0.05,
|
| 8235 |
-
"lr": 0.
|
| 8236 |
-
"use_single_loss":
|
| 8237 |
"iit_weight": 1.0,
|
| 8238 |
-
"behavior_weight":
|
| 8239 |
-
"strict_weight":
|
| 8240 |
-
"epochs":
|
|
|
|
| 8241 |
"act_fn": "gelu",
|
|
|
|
|
|
|
| 8242 |
"clip_grad_norm": 0.1,
|
| 8243 |
-
"lr_scheduler": "",
|
| 8244 |
-
"model_pair": "strict"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 8245 |
},
|
| 8246 |
-
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8247 |
-
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8248 |
-
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8249 |
},
|
| 8250 |
{
|
| 8251 |
-
"case_id": "
|
| 8252 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/
|
| 8253 |
-
"task_description": "
|
| 8254 |
"vocab": [
|
| 8255 |
0,
|
| 8256 |
1,
|
|
@@ -8269,19 +9443,19 @@
|
|
| 8269 |
"files": [
|
| 8270 |
{
|
| 8271 |
"file_name": "edges.pkl",
|
| 8272 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8273 |
},
|
| 8274 |
{
|
| 8275 |
"file_name": "ll_model.pth",
|
| 8276 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8277 |
},
|
| 8278 |
{
|
| 8279 |
"file_name": "ll_model_cfg.pkl",
|
| 8280 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8281 |
},
|
| 8282 |
{
|
| 8283 |
"file_name": "meta.json",
|
| 8284 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8285 |
}
|
| 8286 |
],
|
| 8287 |
"transformer_cfg": {
|
|
@@ -8338,7 +9512,7 @@
|
|
| 8338 |
"num_experts": null,
|
| 8339 |
"experts_per_token": null
|
| 8340 |
},
|
| 8341 |
-
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8342 |
"training_args": {
|
| 8343 |
"output_dir": "/circuits-benchmark/results",
|
| 8344 |
"atol": 0.05,
|
|
@@ -8368,14 +9542,14 @@
|
|
| 8368 |
"siit_sampling": "sample_all",
|
| 8369 |
"val_iia_sampling": "all"
|
| 8370 |
},
|
| 8371 |
-
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8372 |
-
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8373 |
-
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8374 |
},
|
| 8375 |
{
|
| 8376 |
-
"case_id": "
|
| 8377 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/
|
| 8378 |
-
"task_description": "
|
| 8379 |
"vocab": [
|
| 8380 |
0,
|
| 8381 |
1,
|
|
@@ -8394,19 +9568,19 @@
|
|
| 8394 |
"files": [
|
| 8395 |
{
|
| 8396 |
"file_name": "edges.pkl",
|
| 8397 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8398 |
},
|
| 8399 |
{
|
| 8400 |
"file_name": "ll_model.pth",
|
| 8401 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8402 |
},
|
| 8403 |
{
|
| 8404 |
"file_name": "ll_model_cfg.pkl",
|
| 8405 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8406 |
},
|
| 8407 |
{
|
| 8408 |
"file_name": "meta.json",
|
| 8409 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8410 |
}
|
| 8411 |
],
|
| 8412 |
"transformer_cfg": {
|
|
@@ -8463,7 +9637,7 @@
|
|
| 8463 |
"num_experts": null,
|
| 8464 |
"experts_per_token": null
|
| 8465 |
},
|
| 8466 |
-
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8467 |
"training_args": {
|
| 8468 |
"output_dir": "/circuits-benchmark/results",
|
| 8469 |
"atol": 0.05,
|
|
@@ -8481,7 +9655,7 @@
|
|
| 8481 |
"lr_scheduler": "linear",
|
| 8482 |
"model_pair": "strict",
|
| 8483 |
"same_size": false,
|
| 8484 |
-
"seed":
|
| 8485 |
"batch_size": 256,
|
| 8486 |
"include_mlp": false,
|
| 8487 |
"detach_while_caching": true,
|
|
@@ -8493,9 +9667,9 @@
|
|
| 8493 |
"siit_sampling": "sample_all",
|
| 8494 |
"val_iia_sampling": "all"
|
| 8495 |
},
|
| 8496 |
-
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8497 |
-
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8498 |
-
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
| 8499 |
},
|
| 8500 |
{
|
| 8501 |
"case_id": "103",
|
|
@@ -8872,6 +10046,131 @@
|
|
| 8872 |
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model.pth",
|
| 8873 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/edges.pkl"
|
| 8874 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 8875 |
{
|
| 8876 |
"case_id": "46",
|
| 8877 |
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/46",
|
|
|
|
| 3352 |
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model.pth",
|
| 3353 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/edges.pkl"
|
| 3354 |
},
|
| 3355 |
+
{
|
| 3356 |
+
"case_id": "130",
|
| 3357 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/130",
|
| 3358 |
+
"task_description": "Clips each element to be within a range (make the default range [2, 7]).",
|
| 3359 |
+
"vocab": [
|
| 3360 |
+
-15,
|
| 3361 |
+
-14,
|
| 3362 |
+
-13,
|
| 3363 |
+
-12,
|
| 3364 |
+
-11,
|
| 3365 |
+
-10,
|
| 3366 |
+
-9,
|
| 3367 |
+
-8,
|
| 3368 |
+
-7,
|
| 3369 |
+
-6,
|
| 3370 |
+
-5,
|
| 3371 |
+
-4,
|
| 3372 |
+
-3,
|
| 3373 |
+
-2,
|
| 3374 |
+
-1,
|
| 3375 |
+
0,
|
| 3376 |
+
1,
|
| 3377 |
+
2,
|
| 3378 |
+
3,
|
| 3379 |
+
4,
|
| 3380 |
+
5,
|
| 3381 |
+
6,
|
| 3382 |
+
7,
|
| 3383 |
+
8,
|
| 3384 |
+
9,
|
| 3385 |
+
10,
|
| 3386 |
+
11,
|
| 3387 |
+
12,
|
| 3388 |
+
13,
|
| 3389 |
+
14
|
| 3390 |
+
],
|
| 3391 |
+
"max_seq_len": 10,
|
| 3392 |
+
"min_seq_len": 4,
|
| 3393 |
+
"files": [
|
| 3394 |
+
{
|
| 3395 |
+
"file_name": "edges.pkl",
|
| 3396 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/edges.pkl"
|
| 3397 |
+
},
|
| 3398 |
+
{
|
| 3399 |
+
"file_name": "ll_model.pth",
|
| 3400 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model.pth"
|
| 3401 |
+
},
|
| 3402 |
+
{
|
| 3403 |
+
"file_name": "ll_model_cfg.pkl",
|
| 3404 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model_cfg.pkl"
|
| 3405 |
+
},
|
| 3406 |
+
{
|
| 3407 |
+
"file_name": "meta.json",
|
| 3408 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/meta.json"
|
| 3409 |
+
}
|
| 3410 |
+
],
|
| 3411 |
+
"transformer_cfg": {
|
| 3412 |
+
"n_layers": 3,
|
| 3413 |
+
"d_model": 4,
|
| 3414 |
+
"n_ctx": 10,
|
| 3415 |
+
"d_head": 1,
|
| 3416 |
+
"model_name": "custom",
|
| 3417 |
+
"n_heads": 4,
|
| 3418 |
+
"d_mlp": 16,
|
| 3419 |
+
"act_fn": "gelu",
|
| 3420 |
+
"d_vocab": 32,
|
| 3421 |
+
"eps": 1e-05,
|
| 3422 |
+
"use_attn_result": true,
|
| 3423 |
+
"use_attn_scale": true,
|
| 3424 |
+
"use_split_qkv_input": true,
|
| 3425 |
+
"use_hook_mlp_in": true,
|
| 3426 |
+
"use_attn_in": false,
|
| 3427 |
+
"use_local_attn": false,
|
| 3428 |
+
"original_architecture": null,
|
| 3429 |
+
"from_checkpoint": false,
|
| 3430 |
+
"checkpoint_index": null,
|
| 3431 |
+
"checkpoint_label_type": null,
|
| 3432 |
+
"checkpoint_value": null,
|
| 3433 |
+
"tokenizer_name": null,
|
| 3434 |
+
"window_size": null,
|
| 3435 |
+
"attn_types": null,
|
| 3436 |
+
"init_mode": "gpt2",
|
| 3437 |
+
"normalization_type": null,
|
| 3438 |
+
"n_devices": 1,
|
| 3439 |
+
"attention_dir": "causal",
|
| 3440 |
+
"attn_only": false,
|
| 3441 |
+
"seed": 0,
|
| 3442 |
+
"initializer_range": 0.10079052613579392,
|
| 3443 |
+
"init_weights": true,
|
| 3444 |
+
"scale_attn_by_inverse_layer_idx": false,
|
| 3445 |
+
"positional_embedding_type": "standard",
|
| 3446 |
+
"final_rms": false,
|
| 3447 |
+
"d_vocab_out": 6,
|
| 3448 |
+
"parallel_attn_mlp": false,
|
| 3449 |
+
"rotary_dim": null,
|
| 3450 |
+
"n_params": 576,
|
| 3451 |
+
"use_hook_tokens": false,
|
| 3452 |
+
"gated_mlp": false,
|
| 3453 |
+
"default_prepend_bos": true,
|
| 3454 |
+
"dtype": "torch.float32",
|
| 3455 |
+
"tokenizer_prepends_bos": null,
|
| 3456 |
+
"n_key_value_heads": null,
|
| 3457 |
+
"post_embedding_ln": false,
|
| 3458 |
+
"rotary_base": 10000,
|
| 3459 |
+
"trust_remote_code": false,
|
| 3460 |
+
"rotary_adjacent_pairs": false,
|
| 3461 |
+
"load_in_4bit": false,
|
| 3462 |
+
"num_experts": null,
|
| 3463 |
+
"experts_per_token": null
|
| 3464 |
+
},
|
| 3465 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model_cfg.pkl",
|
| 3466 |
+
"training_args": {
|
| 3467 |
+
"output_dir": "/circuits-benchmark/results",
|
| 3468 |
+
"atol": 0.05,
|
| 3469 |
+
"lr": 0.001,
|
| 3470 |
+
"use_single_loss": true,
|
| 3471 |
+
"iit_weight": 1.0,
|
| 3472 |
+
"behavior_weight": 0.4,
|
| 3473 |
+
"strict_weight": 1.0,
|
| 3474 |
+
"epochs": 1000,
|
| 3475 |
+
"early_stop_accuracy_threshold": 99.9,
|
| 3476 |
+
"act_fn": "gelu",
|
| 3477 |
+
"use_wandb": true,
|
| 3478 |
+
"save_model_to_wandb": true,
|
| 3479 |
+
"clip_grad_norm": 0.1,
|
| 3480 |
+
"lr_scheduler": "linear",
|
| 3481 |
+
"model_pair": "strict",
|
| 3482 |
+
"same_size": false,
|
| 3483 |
+
"seed": 67,
|
| 3484 |
+
"batch_size": 256,
|
| 3485 |
+
"include_mlp": false,
|
| 3486 |
+
"detach_while_caching": true,
|
| 3487 |
+
"scheduler_val_metric": [
|
| 3488 |
+
"val/accuracy",
|
| 3489 |
+
"val/IIA",
|
| 3490 |
+
"val/strict_accuracy"
|
| 3491 |
+
],
|
| 3492 |
+
"siit_sampling": "sample_all",
|
| 3493 |
+
"val_iia_sampling": "all"
|
| 3494 |
+
},
|
| 3495 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/meta.json",
|
| 3496 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model.pth",
|
| 3497 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/edges.pkl"
|
| 3498 |
+
},
|
| 3499 |
{
|
| 3500 |
"case_id": "75",
|
| 3501 |
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/75",
|
|
|
|
| 4377 |
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model.pth",
|
| 4378 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/edges.pkl"
|
| 4379 |
},
|
| 4380 |
+
{
|
| 4381 |
+
"case_id": "66",
|
| 4382 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/66",
|
| 4383 |
+
"task_description": "Round each element in the input sequence to the nearest integer.",
|
| 4384 |
+
"vocab": [
|
| 4385 |
+
0.0,
|
| 4386 |
+
0.25,
|
| 4387 |
+
0.5,
|
| 4388 |
+
0.75,
|
| 4389 |
+
1.0,
|
| 4390 |
+
1.25,
|
| 4391 |
+
1.5,
|
| 4392 |
+
1.75,
|
| 4393 |
+
2.0,
|
| 4394 |
+
2.25,
|
| 4395 |
+
2.5,
|
| 4396 |
+
2.75,
|
| 4397 |
+
3.0,
|
| 4398 |
+
3.25,
|
| 4399 |
+
3.5,
|
| 4400 |
+
3.75,
|
| 4401 |
+
4.0,
|
| 4402 |
+
4.25,
|
| 4403 |
+
4.5,
|
| 4404 |
+
4.75
|
| 4405 |
+
],
|
| 4406 |
+
"max_seq_len": 10,
|
| 4407 |
+
"min_seq_len": 4,
|
| 4408 |
+
"files": [
|
| 4409 |
+
{
|
| 4410 |
+
"file_name": "edges.pkl",
|
| 4411 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/edges.pkl"
|
| 4412 |
+
},
|
| 4413 |
+
{
|
| 4414 |
+
"file_name": "ll_model.pth",
|
| 4415 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model.pth"
|
| 4416 |
+
},
|
| 4417 |
+
{
|
| 4418 |
+
"file_name": "ll_model_cfg.pkl",
|
| 4419 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model_cfg.pkl"
|
| 4420 |
+
},
|
| 4421 |
+
{
|
| 4422 |
+
"file_name": "meta.json",
|
| 4423 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/meta.json"
|
| 4424 |
+
}
|
| 4425 |
+
],
|
| 4426 |
+
"transformer_cfg": {
|
| 4427 |
+
"n_layers": 2,
|
| 4428 |
+
"d_model": 4,
|
| 4429 |
+
"n_ctx": 10,
|
| 4430 |
+
"d_head": 1,
|
| 4431 |
+
"model_name": "custom",
|
| 4432 |
+
"n_heads": 4,
|
| 4433 |
+
"d_mlp": 16,
|
| 4434 |
+
"act_fn": "gelu",
|
| 4435 |
+
"d_vocab": 22,
|
| 4436 |
+
"eps": 1e-05,
|
| 4437 |
+
"use_attn_result": true,
|
| 4438 |
+
"use_attn_scale": true,
|
| 4439 |
+
"use_split_qkv_input": true,
|
| 4440 |
+
"use_hook_mlp_in": true,
|
| 4441 |
+
"use_attn_in": false,
|
| 4442 |
+
"use_local_attn": false,
|
| 4443 |
+
"original_architecture": null,
|
| 4444 |
+
"from_checkpoint": false,
|
| 4445 |
+
"checkpoint_index": null,
|
| 4446 |
+
"checkpoint_label_type": null,
|
| 4447 |
+
"checkpoint_value": null,
|
| 4448 |
+
"tokenizer_name": null,
|
| 4449 |
+
"window_size": null,
|
| 4450 |
+
"attn_types": null,
|
| 4451 |
+
"init_mode": "gpt2",
|
| 4452 |
+
"normalization_type": null,
|
| 4453 |
+
"n_devices": 1,
|
| 4454 |
+
"attention_dir": "causal",
|
| 4455 |
+
"attn_only": false,
|
| 4456 |
+
"seed": 0,
|
| 4457 |
+
"initializer_range": 0.13151918984428584,
|
| 4458 |
+
"init_weights": true,
|
| 4459 |
+
"scale_attn_by_inverse_layer_idx": false,
|
| 4460 |
+
"positional_embedding_type": "standard",
|
| 4461 |
+
"final_rms": false,
|
| 4462 |
+
"d_vocab_out": 6,
|
| 4463 |
+
"parallel_attn_mlp": false,
|
| 4464 |
+
"rotary_dim": null,
|
| 4465 |
+
"n_params": 384,
|
| 4466 |
+
"use_hook_tokens": false,
|
| 4467 |
+
"gated_mlp": false,
|
| 4468 |
+
"default_prepend_bos": true,
|
| 4469 |
+
"dtype": "torch.float32",
|
| 4470 |
+
"tokenizer_prepends_bos": null,
|
| 4471 |
+
"n_key_value_heads": null,
|
| 4472 |
+
"post_embedding_ln": false,
|
| 4473 |
+
"rotary_base": 10000,
|
| 4474 |
+
"trust_remote_code": false,
|
| 4475 |
+
"rotary_adjacent_pairs": false,
|
| 4476 |
+
"load_in_4bit": false,
|
| 4477 |
+
"num_experts": null,
|
| 4478 |
+
"experts_per_token": null
|
| 4479 |
+
},
|
| 4480 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model_cfg.pkl",
|
| 4481 |
+
"training_args": {
|
| 4482 |
+
"output_dir": "/circuits-benchmark/results",
|
| 4483 |
+
"atol": 0.05,
|
| 4484 |
+
"lr": 0.001,
|
| 4485 |
+
"use_single_loss": true,
|
| 4486 |
+
"iit_weight": 1.0,
|
| 4487 |
+
"behavior_weight": 0.4,
|
| 4488 |
+
"strict_weight": 0.7,
|
| 4489 |
+
"epochs": 1000,
|
| 4490 |
+
"early_stop_accuracy_threshold": 99.9,
|
| 4491 |
+
"act_fn": "gelu",
|
| 4492 |
+
"use_wandb": true,
|
| 4493 |
+
"save_model_to_wandb": true,
|
| 4494 |
+
"clip_grad_norm": 0.1,
|
| 4495 |
+
"lr_scheduler": "linear",
|
| 4496 |
+
"model_pair": "strict",
|
| 4497 |
+
"same_size": false,
|
| 4498 |
+
"seed": 92,
|
| 4499 |
+
"batch_size": 256,
|
| 4500 |
+
"include_mlp": false,
|
| 4501 |
+
"detach_while_caching": true,
|
| 4502 |
+
"scheduler_val_metric": [
|
| 4503 |
+
"val/accuracy",
|
| 4504 |
+
"val/IIA",
|
| 4505 |
+
"val/strict_accuracy"
|
| 4506 |
+
],
|
| 4507 |
+
"siit_sampling": "sample_all",
|
| 4508 |
+
"val_iia_sampling": "all"
|
| 4509 |
+
},
|
| 4510 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/meta.json",
|
| 4511 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model.pth",
|
| 4512 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/edges.pkl"
|
| 4513 |
+
},
|
| 4514 |
{
|
| 4515 |
"case_id": "93",
|
| 4516 |
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/93",
|
|
|
|
| 4941 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/edges.pkl"
|
| 4942 |
},
|
| 4943 |
{
|
| 4944 |
+
"case_id": "15",
|
| 4945 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/15",
|
| 4946 |
+
"task_description": "Returns each token multiplied by two and subtracted by its index.",
|
| 4947 |
"vocab": [
|
| 4948 |
+
0,
|
| 4949 |
+
1,
|
| 4950 |
+
2,
|
| 4951 |
+
3,
|
| 4952 |
+
4
|
| 4953 |
],
|
| 4954 |
+
"max_seq_len": 5,
|
| 4955 |
"min_seq_len": 4,
|
| 4956 |
"files": [
|
| 4957 |
{
|
| 4958 |
"file_name": "edges.pkl",
|
| 4959 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/edges.pkl"
|
| 4960 |
},
|
| 4961 |
{
|
| 4962 |
"file_name": "ll_model.pth",
|
| 4963 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model.pth"
|
| 4964 |
},
|
| 4965 |
{
|
| 4966 |
"file_name": "ll_model_cfg.pkl",
|
| 4967 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model_cfg.pkl"
|
| 4968 |
},
|
| 4969 |
{
|
| 4970 |
"file_name": "meta.json",
|
| 4971 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/meta.json"
|
| 4972 |
}
|
| 4973 |
],
|
| 4974 |
"transformer_cfg": {
|
| 4975 |
+
"n_layers": 3,
|
| 4976 |
+
"d_model": 4,
|
| 4977 |
+
"n_ctx": 5,
|
| 4978 |
+
"d_head": 1,
|
| 4979 |
+
"model_name": "custom",
|
| 4980 |
+
"n_heads": 4,
|
| 4981 |
+
"d_mlp": 16,
|
| 4982 |
+
"act_fn": "gelu",
|
| 4983 |
+
"d_vocab": 7,
|
| 4984 |
+
"eps": 1e-05,
|
| 4985 |
+
"use_attn_result": true,
|
| 4986 |
+
"use_attn_scale": true,
|
| 4987 |
+
"use_split_qkv_input": true,
|
| 4988 |
+
"use_hook_mlp_in": true,
|
| 4989 |
+
"use_attn_in": false,
|
| 4990 |
+
"use_local_attn": false,
|
| 4991 |
+
"original_architecture": null,
|
| 4992 |
+
"from_checkpoint": false,
|
| 4993 |
+
"checkpoint_index": null,
|
| 4994 |
+
"checkpoint_label_type": null,
|
| 4995 |
+
"checkpoint_value": null,
|
| 4996 |
+
"tokenizer_name": null,
|
| 4997 |
+
"window_size": null,
|
| 4998 |
+
"attn_types": null,
|
| 4999 |
+
"init_mode": "gpt2",
|
| 5000 |
+
"normalization_type": null,
|
| 5001 |
+
"n_devices": 1,
|
| 5002 |
+
"attention_dir": "causal",
|
| 5003 |
+
"attn_only": false,
|
| 5004 |
+
"seed": 0,
|
| 5005 |
+
"initializer_range": 0.06553855364152325,
|
| 5006 |
+
"init_weights": true,
|
| 5007 |
+
"scale_attn_by_inverse_layer_idx": false,
|
| 5008 |
+
"positional_embedding_type": "standard",
|
| 5009 |
+
"final_rms": false,
|
| 5010 |
+
"d_vocab_out": 12,
|
| 5011 |
+
"parallel_attn_mlp": false,
|
| 5012 |
+
"rotary_dim": null,
|
| 5013 |
+
"n_params": 576,
|
| 5014 |
+
"use_hook_tokens": false,
|
| 5015 |
+
"gated_mlp": false,
|
| 5016 |
+
"default_prepend_bos": true,
|
| 5017 |
+
"dtype": "torch.float32",
|
| 5018 |
+
"tokenizer_prepends_bos": null,
|
| 5019 |
+
"n_key_value_heads": null,
|
| 5020 |
+
"post_embedding_ln": false,
|
| 5021 |
+
"rotary_base": 10000,
|
| 5022 |
+
"trust_remote_code": false,
|
| 5023 |
+
"rotary_adjacent_pairs": false,
|
| 5024 |
+
"load_in_4bit": false,
|
| 5025 |
+
"num_experts": null,
|
| 5026 |
+
"experts_per_token": null
|
| 5027 |
+
},
|
| 5028 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model_cfg.pkl",
|
| 5029 |
+
"training_args": {
|
| 5030 |
+
"output_dir": "/circuits-benchmark/results",
|
| 5031 |
+
"atol": 0.05,
|
| 5032 |
+
"lr": 0.001,
|
| 5033 |
+
"use_single_loss": true,
|
| 5034 |
+
"iit_weight": 1.0,
|
| 5035 |
+
"behavior_weight": 0.4,
|
| 5036 |
+
"strict_weight": 1.0,
|
| 5037 |
+
"epochs": 1000,
|
| 5038 |
+
"early_stop_accuracy_threshold": 99.9,
|
| 5039 |
+
"act_fn": "gelu",
|
| 5040 |
+
"use_wandb": true,
|
| 5041 |
+
"save_model_to_wandb": true,
|
| 5042 |
+
"clip_grad_norm": 0.1,
|
| 5043 |
+
"lr_scheduler": "linear",
|
| 5044 |
+
"model_pair": "strict",
|
| 5045 |
+
"same_size": false,
|
| 5046 |
+
"seed": 67,
|
| 5047 |
+
"batch_size": 256,
|
| 5048 |
+
"include_mlp": false,
|
| 5049 |
+
"detach_while_caching": true,
|
| 5050 |
+
"scheduler_val_metric": [
|
| 5051 |
+
"val/accuracy",
|
| 5052 |
+
"val/IIA",
|
| 5053 |
+
"val/strict_accuracy"
|
| 5054 |
+
],
|
| 5055 |
+
"siit_sampling": "sample_all",
|
| 5056 |
+
"val_iia_sampling": "all"
|
| 5057 |
+
},
|
| 5058 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/meta.json",
|
| 5059 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model.pth",
|
| 5060 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/edges.pkl"
|
| 5061 |
+
},
|
| 5062 |
+
{
|
| 5063 |
+
"case_id": "19",
|
| 5064 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/19",
|
| 5065 |
+
"task_description": "Removes consecutive duplicate tokens from a sequence.",
|
| 5066 |
+
"vocab": [
|
| 5067 |
+
"a",
|
| 5068 |
+
"b",
|
| 5069 |
+
"c"
|
| 5070 |
+
],
|
| 5071 |
+
"max_seq_len": 15,
|
| 5072 |
+
"min_seq_len": 4,
|
| 5073 |
+
"files": [
|
| 5074 |
+
{
|
| 5075 |
+
"file_name": "edges.pkl",
|
| 5076 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/edges.pkl"
|
| 5077 |
+
},
|
| 5078 |
+
{
|
| 5079 |
+
"file_name": "ll_model.pth",
|
| 5080 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model.pth"
|
| 5081 |
+
},
|
| 5082 |
+
{
|
| 5083 |
+
"file_name": "ll_model_cfg.pkl",
|
| 5084 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model_cfg.pkl"
|
| 5085 |
+
},
|
| 5086 |
+
{
|
| 5087 |
+
"file_name": "meta.json",
|
| 5088 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/meta.json"
|
| 5089 |
+
}
|
| 5090 |
+
],
|
| 5091 |
+
"transformer_cfg": {
|
| 5092 |
+
"n_layers": 2,
|
| 5093 |
+
"d_model": 32,
|
| 5094 |
+
"n_ctx": 15,
|
| 5095 |
+
"d_head": 8,
|
| 5096 |
+
"model_name": "custom",
|
| 5097 |
"n_heads": 4,
|
| 5098 |
"d_mlp": 128,
|
| 5099 |
"act_fn": "gelu",
|
|
|
|
| 5638 |
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model.pth",
|
| 5639 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/edges.pkl"
|
| 5640 |
},
|
| 5641 |
+
{
|
| 5642 |
+
"case_id": "43",
|
| 5643 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/43",
|
| 5644 |
+
"task_description": "Returns the corresponding Fibonacci number for each element in the input sequence.",
|
| 5645 |
+
"vocab": [
|
| 5646 |
+
0,
|
| 5647 |
+
1,
|
| 5648 |
+
2,
|
| 5649 |
+
3,
|
| 5650 |
+
4,
|
| 5651 |
+
5,
|
| 5652 |
+
6,
|
| 5653 |
+
7,
|
| 5654 |
+
8,
|
| 5655 |
+
9,
|
| 5656 |
+
10,
|
| 5657 |
+
11,
|
| 5658 |
+
12,
|
| 5659 |
+
13,
|
| 5660 |
+
14,
|
| 5661 |
+
15,
|
| 5662 |
+
16,
|
| 5663 |
+
17,
|
| 5664 |
+
18,
|
| 5665 |
+
19
|
| 5666 |
+
],
|
| 5667 |
+
"max_seq_len": 10,
|
| 5668 |
+
"min_seq_len": 4,
|
| 5669 |
+
"files": [
|
| 5670 |
+
{
|
| 5671 |
+
"file_name": "edges.pkl",
|
| 5672 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/edges.pkl"
|
| 5673 |
+
},
|
| 5674 |
+
{
|
| 5675 |
+
"file_name": "ll_model.pth",
|
| 5676 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model.pth"
|
| 5677 |
+
},
|
| 5678 |
+
{
|
| 5679 |
+
"file_name": "ll_model_cfg.pkl",
|
| 5680 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model_cfg.pkl"
|
| 5681 |
+
},
|
| 5682 |
+
{
|
| 5683 |
+
"file_name": "meta.json",
|
| 5684 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/meta.json"
|
| 5685 |
+
}
|
| 5686 |
+
],
|
| 5687 |
+
"transformer_cfg": {
|
| 5688 |
+
"n_layers": 2,
|
| 5689 |
+
"d_model": 4,
|
| 5690 |
+
"n_ctx": 10,
|
| 5691 |
+
"d_head": 1,
|
| 5692 |
+
"model_name": "custom",
|
| 5693 |
+
"n_heads": 4,
|
| 5694 |
+
"d_mlp": 16,
|
| 5695 |
+
"act_fn": "gelu",
|
| 5696 |
+
"d_vocab": 22,
|
| 5697 |
+
"eps": 1e-05,
|
| 5698 |
+
"use_attn_result": true,
|
| 5699 |
+
"use_attn_scale": true,
|
| 5700 |
+
"use_split_qkv_input": true,
|
| 5701 |
+
"use_hook_mlp_in": true,
|
| 5702 |
+
"use_attn_in": false,
|
| 5703 |
+
"use_local_attn": false,
|
| 5704 |
+
"original_architecture": null,
|
| 5705 |
+
"from_checkpoint": false,
|
| 5706 |
+
"checkpoint_index": null,
|
| 5707 |
+
"checkpoint_label_type": null,
|
| 5708 |
+
"checkpoint_value": null,
|
| 5709 |
+
"tokenizer_name": null,
|
| 5710 |
+
"window_size": null,
|
| 5711 |
+
"attn_types": null,
|
| 5712 |
+
"init_mode": "gpt2",
|
| 5713 |
+
"normalization_type": null,
|
| 5714 |
+
"n_devices": 1,
|
| 5715 |
+
"attention_dir": "causal",
|
| 5716 |
+
"attn_only": false,
|
| 5717 |
+
"seed": 0,
|
| 5718 |
+
"initializer_range": 0.1131370849898476,
|
| 5719 |
+
"init_weights": true,
|
| 5720 |
+
"scale_attn_by_inverse_layer_idx": false,
|
| 5721 |
+
"positional_embedding_type": "standard",
|
| 5722 |
+
"final_rms": false,
|
| 5723 |
+
"d_vocab_out": 19,
|
| 5724 |
+
"parallel_attn_mlp": false,
|
| 5725 |
+
"rotary_dim": null,
|
| 5726 |
+
"n_params": 384,
|
| 5727 |
+
"use_hook_tokens": false,
|
| 5728 |
+
"gated_mlp": false,
|
| 5729 |
+
"default_prepend_bos": true,
|
| 5730 |
+
"dtype": "torch.float32",
|
| 5731 |
+
"tokenizer_prepends_bos": null,
|
| 5732 |
+
"n_key_value_heads": null,
|
| 5733 |
+
"post_embedding_ln": false,
|
| 5734 |
+
"rotary_base": 10000,
|
| 5735 |
+
"trust_remote_code": false,
|
| 5736 |
+
"rotary_adjacent_pairs": false,
|
| 5737 |
+
"load_in_4bit": false,
|
| 5738 |
+
"num_experts": null,
|
| 5739 |
+
"experts_per_token": null
|
| 5740 |
+
},
|
| 5741 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model_cfg.pkl",
|
| 5742 |
+
"training_args": {
|
| 5743 |
+
"output_dir": "/circuits-benchmark/results",
|
| 5744 |
+
"atol": 0.05,
|
| 5745 |
+
"lr": 0.001,
|
| 5746 |
+
"use_single_loss": true,
|
| 5747 |
+
"iit_weight": 1.0,
|
| 5748 |
+
"behavior_weight": 0.4,
|
| 5749 |
+
"strict_weight": 1.0,
|
| 5750 |
+
"epochs": 1000,
|
| 5751 |
+
"early_stop_accuracy_threshold": 99.9,
|
| 5752 |
+
"act_fn": "gelu",
|
| 5753 |
+
"use_wandb": true,
|
| 5754 |
+
"save_model_to_wandb": true,
|
| 5755 |
+
"clip_grad_norm": 0.1,
|
| 5756 |
+
"lr_scheduler": "linear",
|
| 5757 |
+
"model_pair": "strict",
|
| 5758 |
+
"same_size": false,
|
| 5759 |
+
"seed": 67,
|
| 5760 |
+
"batch_size": 256,
|
| 5761 |
+
"include_mlp": false,
|
| 5762 |
+
"detach_while_caching": true,
|
| 5763 |
+
"scheduler_val_metric": [
|
| 5764 |
+
"val/accuracy",
|
| 5765 |
+
"val/IIA",
|
| 5766 |
+
"val/strict_accuracy"
|
| 5767 |
+
],
|
| 5768 |
+
"siit_sampling": "sample_all",
|
| 5769 |
+
"val_iia_sampling": "all"
|
| 5770 |
+
},
|
| 5771 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/meta.json",
|
| 5772 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model.pth",
|
| 5773 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/edges.pkl"
|
| 5774 |
+
},
|
| 5775 |
{
|
| 5776 |
"case_id": "122",
|
| 5777 |
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/122",
|
|
|
|
| 6902 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/edges.pkl"
|
| 6903 |
},
|
| 6904 |
{
|
| 6905 |
+
"case_id": "41",
|
| 6906 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/41",
|
| 6907 |
+
"task_description": "Make each element of the input sequence absolute",
|
| 6908 |
"vocab": [
|
| 6909 |
+
-10,
|
| 6910 |
+
-9,
|
| 6911 |
+
-8,
|
| 6912 |
+
-7,
|
| 6913 |
+
-6,
|
| 6914 |
+
-5,
|
| 6915 |
+
-4,
|
| 6916 |
+
-3,
|
| 6917 |
+
-2,
|
| 6918 |
+
-1,
|
| 6919 |
0,
|
| 6920 |
1,
|
| 6921 |
2,
|
|
|
|
| 6925 |
6,
|
| 6926 |
7,
|
| 6927 |
8,
|
| 6928 |
+
9
|
|
|
|
| 6929 |
],
|
| 6930 |
"max_seq_len": 10,
|
| 6931 |
"min_seq_len": 4,
|
| 6932 |
"files": [
|
| 6933 |
{
|
| 6934 |
"file_name": "edges.pkl",
|
| 6935 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/edges.pkl"
|
| 6936 |
},
|
| 6937 |
{
|
| 6938 |
"file_name": "ll_model.pth",
|
| 6939 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model.pth"
|
| 6940 |
+
},
|
| 6941 |
+
{
|
| 6942 |
+
"file_name": "ll_model_cfg.pkl",
|
| 6943 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model_cfg.pkl"
|
| 6944 |
+
},
|
| 6945 |
+
{
|
| 6946 |
+
"file_name": "meta.json",
|
| 6947 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/meta.json"
|
| 6948 |
+
}
|
| 6949 |
+
],
|
| 6950 |
+
"transformer_cfg": {
|
| 6951 |
+
"n_layers": 2,
|
| 6952 |
+
"d_model": 4,
|
| 6953 |
+
"n_ctx": 10,
|
| 6954 |
+
"d_head": 1,
|
| 6955 |
+
"model_name": "custom",
|
| 6956 |
+
"n_heads": 4,
|
| 6957 |
+
"d_mlp": 16,
|
| 6958 |
+
"act_fn": "gelu",
|
| 6959 |
+
"d_vocab": 22,
|
| 6960 |
+
"eps": 1e-05,
|
| 6961 |
+
"use_attn_result": true,
|
| 6962 |
+
"use_attn_scale": true,
|
| 6963 |
+
"use_split_qkv_input": true,
|
| 6964 |
+
"use_hook_mlp_in": true,
|
| 6965 |
+
"use_attn_in": false,
|
| 6966 |
+
"use_local_attn": false,
|
| 6967 |
+
"original_architecture": null,
|
| 6968 |
+
"from_checkpoint": false,
|
| 6969 |
+
"checkpoint_index": null,
|
| 6970 |
+
"checkpoint_label_type": null,
|
| 6971 |
+
"checkpoint_value": null,
|
| 6972 |
+
"tokenizer_name": null,
|
| 6973 |
+
"window_size": null,
|
| 6974 |
+
"attn_types": null,
|
| 6975 |
+
"init_mode": "gpt2",
|
| 6976 |
+
"normalization_type": null,
|
| 6977 |
+
"n_devices": 1,
|
| 6978 |
+
"attention_dir": "causal",
|
| 6979 |
+
"attn_only": false,
|
| 6980 |
+
"seed": 0,
|
| 6981 |
+
"initializer_range": 0.12344267996967354,
|
| 6982 |
+
"init_weights": true,
|
| 6983 |
+
"scale_attn_by_inverse_layer_idx": false,
|
| 6984 |
+
"positional_embedding_type": "standard",
|
| 6985 |
+
"final_rms": false,
|
| 6986 |
+
"d_vocab_out": 11,
|
| 6987 |
+
"parallel_attn_mlp": false,
|
| 6988 |
+
"rotary_dim": null,
|
| 6989 |
+
"n_params": 384,
|
| 6990 |
+
"use_hook_tokens": false,
|
| 6991 |
+
"gated_mlp": false,
|
| 6992 |
+
"default_prepend_bos": true,
|
| 6993 |
+
"dtype": "torch.float32",
|
| 6994 |
+
"tokenizer_prepends_bos": null,
|
| 6995 |
+
"n_key_value_heads": null,
|
| 6996 |
+
"post_embedding_ln": false,
|
| 6997 |
+
"rotary_base": 10000,
|
| 6998 |
+
"trust_remote_code": false,
|
| 6999 |
+
"rotary_adjacent_pairs": false,
|
| 7000 |
+
"load_in_4bit": false,
|
| 7001 |
+
"num_experts": null,
|
| 7002 |
+
"experts_per_token": null
|
| 7003 |
+
},
|
| 7004 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model_cfg.pkl",
|
| 7005 |
+
"training_args": {
|
| 7006 |
+
"output_dir": "/circuits-benchmark/results",
|
| 7007 |
+
"atol": 0.05,
|
| 7008 |
+
"lr": 0.001,
|
| 7009 |
+
"use_single_loss": true,
|
| 7010 |
+
"iit_weight": 1.0,
|
| 7011 |
+
"behavior_weight": 0.4,
|
| 7012 |
+
"strict_weight": 1.0,
|
| 7013 |
+
"epochs": 1000,
|
| 7014 |
+
"early_stop_accuracy_threshold": 99.9,
|
| 7015 |
+
"act_fn": "gelu",
|
| 7016 |
+
"use_wandb": true,
|
| 7017 |
+
"save_model_to_wandb": true,
|
| 7018 |
+
"clip_grad_norm": 0.1,
|
| 7019 |
+
"lr_scheduler": "linear",
|
| 7020 |
+
"model_pair": "strict",
|
| 7021 |
+
"same_size": false,
|
| 7022 |
+
"seed": 67,
|
| 7023 |
+
"batch_size": 256,
|
| 7024 |
+
"include_mlp": false,
|
| 7025 |
+
"detach_while_caching": true,
|
| 7026 |
+
"scheduler_val_metric": [
|
| 7027 |
+
"val/accuracy",
|
| 7028 |
+
"val/IIA",
|
| 7029 |
+
"val/strict_accuracy"
|
| 7030 |
+
],
|
| 7031 |
+
"siit_sampling": "sample_all",
|
| 7032 |
+
"val_iia_sampling": "all"
|
| 7033 |
+
},
|
| 7034 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/meta.json",
|
| 7035 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model.pth",
|
| 7036 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/edges.pkl"
|
| 7037 |
+
},
|
| 7038 |
+
{
|
| 7039 |
+
"case_id": "54",
|
| 7040 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/54",
|
| 7041 |
+
"task_description": "Applies the hyperbolic tangent to each element.",
|
| 7042 |
+
"vocab": [
|
| 7043 |
+
0,
|
| 7044 |
+
1,
|
| 7045 |
+
2,
|
| 7046 |
+
3,
|
| 7047 |
+
4,
|
| 7048 |
+
5,
|
| 7049 |
+
6,
|
| 7050 |
+
7,
|
| 7051 |
+
8,
|
| 7052 |
+
9,
|
| 7053 |
+
10
|
| 7054 |
+
],
|
| 7055 |
+
"max_seq_len": 10,
|
| 7056 |
+
"min_seq_len": 4,
|
| 7057 |
+
"files": [
|
| 7058 |
+
{
|
| 7059 |
+
"file_name": "edges.pkl",
|
| 7060 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/edges.pkl"
|
| 7061 |
+
},
|
| 7062 |
+
{
|
| 7063 |
+
"file_name": "ll_model.pth",
|
| 7064 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model.pth"
|
| 7065 |
},
|
| 7066 |
{
|
| 7067 |
"file_name": "ll_model_cfg.pkl",
|
|
|
|
| 8237 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/edges.pkl"
|
| 8238 |
},
|
| 8239 |
{
|
| 8240 |
+
"case_id": "68",
|
| 8241 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/68",
|
| 8242 |
+
"task_description": "Increment each element until it becomes a multiple of 3",
|
| 8243 |
"vocab": [
|
| 8244 |
0,
|
| 8245 |
1,
|
|
|
|
| 8258 |
"files": [
|
| 8259 |
{
|
| 8260 |
"file_name": "edges.pkl",
|
| 8261 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/edges.pkl"
|
| 8262 |
},
|
| 8263 |
{
|
| 8264 |
"file_name": "ll_model.pth",
|
| 8265 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model.pth"
|
| 8266 |
},
|
| 8267 |
{
|
| 8268 |
"file_name": "ll_model_cfg.pkl",
|
| 8269 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model_cfg.pkl"
|
| 8270 |
},
|
| 8271 |
{
|
| 8272 |
"file_name": "meta.json",
|
| 8273 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/meta.json"
|
| 8274 |
}
|
| 8275 |
],
|
| 8276 |
"transformer_cfg": {
|
|
|
|
| 8304 |
"attention_dir": "causal",
|
| 8305 |
"attn_only": false,
|
| 8306 |
"seed": 0,
|
| 8307 |
+
"initializer_range": 0.1539600717839002,
|
| 8308 |
"init_weights": true,
|
| 8309 |
"scale_attn_by_inverse_layer_idx": false,
|
| 8310 |
"positional_embedding_type": "standard",
|
| 8311 |
"final_rms": false,
|
| 8312 |
+
"d_vocab_out": 5,
|
| 8313 |
"parallel_attn_mlp": false,
|
| 8314 |
"rotary_dim": null,
|
| 8315 |
"n_params": 384,
|
|
|
|
| 8327 |
"num_experts": null,
|
| 8328 |
"experts_per_token": null
|
| 8329 |
},
|
| 8330 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model_cfg.pkl",
|
| 8331 |
"training_args": {
|
| 8332 |
"output_dir": "/circuits-benchmark/results",
|
| 8333 |
"atol": 0.05,
|
|
|
|
| 8335 |
"use_single_loss": true,
|
| 8336 |
"iit_weight": 1.0,
|
| 8337 |
"behavior_weight": 0.4,
|
| 8338 |
+
"strict_weight": 1.0,
|
| 8339 |
"epochs": 1000,
|
| 8340 |
"early_stop_accuracy_threshold": 99.9,
|
| 8341 |
"act_fn": "gelu",
|
|
|
|
| 8357 |
"siit_sampling": "sample_all",
|
| 8358 |
"val_iia_sampling": "all"
|
| 8359 |
},
|
| 8360 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/meta.json",
|
| 8361 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model.pth",
|
| 8362 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/edges.pkl"
|
| 8363 |
},
|
| 8364 |
{
|
| 8365 |
+
"case_id": "70",
|
| 8366 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/70",
|
| 8367 |
+
"task_description": "Apply the cosine function to each element of the input sequence.",
|
| 8368 |
"vocab": [
|
| 8369 |
0,
|
| 8370 |
1,
|
|
|
|
| 8383 |
"files": [
|
| 8384 |
{
|
| 8385 |
"file_name": "edges.pkl",
|
| 8386 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl"
|
| 8387 |
},
|
| 8388 |
{
|
| 8389 |
"file_name": "ll_model.pth",
|
| 8390 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth"
|
| 8391 |
},
|
| 8392 |
{
|
| 8393 |
"file_name": "ll_model_cfg.pkl",
|
| 8394 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl"
|
| 8395 |
},
|
| 8396 |
{
|
| 8397 |
"file_name": "meta.json",
|
| 8398 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json"
|
| 8399 |
}
|
| 8400 |
],
|
| 8401 |
"transformer_cfg": {
|
|
|
|
| 8429 |
"attention_dir": "causal",
|
| 8430 |
"attn_only": false,
|
| 8431 |
"seed": 0,
|
| 8432 |
+
"initializer_range": 0.1392621247645583,
|
| 8433 |
"init_weights": true,
|
| 8434 |
"scale_attn_by_inverse_layer_idx": false,
|
| 8435 |
"positional_embedding_type": "standard",
|
| 8436 |
"final_rms": false,
|
| 8437 |
+
"d_vocab_out": 11,
|
| 8438 |
"parallel_attn_mlp": false,
|
| 8439 |
"rotary_dim": null,
|
| 8440 |
"n_params": 384,
|
|
|
|
| 8452 |
"num_experts": null,
|
| 8453 |
"experts_per_token": null
|
| 8454 |
},
|
| 8455 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl",
|
| 8456 |
"training_args": {
|
| 8457 |
"output_dir": "/circuits-benchmark/results",
|
| 8458 |
"atol": 0.05,
|
|
|
|
| 8482 |
"siit_sampling": "sample_all",
|
| 8483 |
"val_iia_sampling": "all"
|
| 8484 |
},
|
| 8485 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json",
|
| 8486 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth",
|
| 8487 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl"
|
| 8488 |
},
|
| 8489 |
{
|
| 8490 |
+
"case_id": "62",
|
| 8491 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/62",
|
| 8492 |
+
"task_description": "Replaces each element with its factorial.",
|
| 8493 |
"vocab": [
|
| 8494 |
0,
|
| 8495 |
1,
|
|
|
|
| 8508 |
"files": [
|
| 8509 |
{
|
| 8510 |
"file_name": "edges.pkl",
|
| 8511 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl"
|
| 8512 |
},
|
| 8513 |
{
|
| 8514 |
"file_name": "ll_model.pth",
|
| 8515 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth"
|
| 8516 |
},
|
| 8517 |
{
|
| 8518 |
"file_name": "ll_model_cfg.pkl",
|
| 8519 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl"
|
| 8520 |
},
|
| 8521 |
{
|
| 8522 |
"file_name": "meta.json",
|
| 8523 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json"
|
| 8524 |
}
|
| 8525 |
],
|
| 8526 |
"transformer_cfg": {
|
| 8527 |
+
"n_layers": 2,
|
| 8528 |
+
"d_model": 4,
|
| 8529 |
"n_ctx": 10,
|
| 8530 |
+
"d_head": 1,
|
| 8531 |
"model_name": "custom",
|
| 8532 |
"n_heads": 4,
|
| 8533 |
+
"d_mlp": 16,
|
| 8534 |
"act_fn": "gelu",
|
| 8535 |
"d_vocab": 13,
|
| 8536 |
"eps": 1e-05,
|
|
|
|
| 8551 |
"init_mode": "gpt2",
|
| 8552 |
"normalization_type": null,
|
| 8553 |
"n_devices": 1,
|
| 8554 |
+
"attention_dir": "causal",
|
| 8555 |
"attn_only": false,
|
| 8556 |
"seed": 0,
|
| 8557 |
+
"initializer_range": 0.1414213562373095,
|
| 8558 |
"init_weights": true,
|
| 8559 |
"scale_attn_by_inverse_layer_idx": false,
|
| 8560 |
"positional_embedding_type": "standard",
|
| 8561 |
"final_rms": false,
|
| 8562 |
+
"d_vocab_out": 10,
|
| 8563 |
"parallel_attn_mlp": false,
|
| 8564 |
"rotary_dim": null,
|
| 8565 |
+
"n_params": 384,
|
| 8566 |
"use_hook_tokens": false,
|
| 8567 |
"gated_mlp": false,
|
| 8568 |
"default_prepend_bos": true,
|
|
|
|
| 8577 |
"num_experts": null,
|
| 8578 |
"experts_per_token": null
|
| 8579 |
},
|
| 8580 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl",
|
| 8581 |
"training_args": {
|
| 8582 |
"output_dir": "/circuits-benchmark/results",
|
| 8583 |
"atol": 0.05,
|
|
|
|
| 8585 |
"use_single_loss": true,
|
| 8586 |
"iit_weight": 1.0,
|
| 8587 |
"behavior_weight": 0.4,
|
| 8588 |
+
"strict_weight": 0.7,
|
| 8589 |
"epochs": 1000,
|
| 8590 |
"early_stop_accuracy_threshold": 99.9,
|
| 8591 |
"act_fn": "gelu",
|
|
|
|
| 8607 |
"siit_sampling": "sample_all",
|
| 8608 |
"val_iia_sampling": "all"
|
| 8609 |
},
|
| 8610 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json",
|
| 8611 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth",
|
| 8612 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl"
|
| 8613 |
},
|
| 8614 |
{
|
| 8615 |
+
"case_id": "111",
|
| 8616 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/111",
|
| 8617 |
+
"task_description": "Returns the last element of the sequence and pads the rest with zeros.",
|
| 8618 |
"vocab": [
|
| 8619 |
+
0,
|
| 8620 |
+
1,
|
| 8621 |
+
2,
|
| 8622 |
+
3,
|
| 8623 |
+
4,
|
| 8624 |
+
5,
|
| 8625 |
+
6,
|
| 8626 |
+
7,
|
| 8627 |
+
8,
|
| 8628 |
+
9,
|
| 8629 |
+
10
|
| 8630 |
],
|
| 8631 |
"max_seq_len": 10,
|
| 8632 |
"min_seq_len": 4,
|
| 8633 |
"files": [
|
| 8634 |
{
|
| 8635 |
"file_name": "edges.pkl",
|
| 8636 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl"
|
| 8637 |
},
|
| 8638 |
{
|
| 8639 |
"file_name": "ll_model.pth",
|
| 8640 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth"
|
| 8641 |
},
|
| 8642 |
{
|
| 8643 |
"file_name": "ll_model_cfg.pkl",
|
| 8644 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl"
|
| 8645 |
},
|
| 8646 |
{
|
| 8647 |
"file_name": "meta.json",
|
| 8648 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json"
|
| 8649 |
}
|
| 8650 |
],
|
| 8651 |
"transformer_cfg": {
|
| 8652 |
+
"n_layers": 3,
|
| 8653 |
+
"d_model": 24,
|
| 8654 |
"n_ctx": 10,
|
| 8655 |
+
"d_head": 6,
|
| 8656 |
"model_name": "custom",
|
| 8657 |
"n_heads": 4,
|
| 8658 |
+
"d_mlp": 96,
|
| 8659 |
"act_fn": "gelu",
|
| 8660 |
+
"d_vocab": 13,
|
| 8661 |
"eps": 1e-05,
|
| 8662 |
"use_attn_result": true,
|
| 8663 |
"use_attn_scale": true,
|
|
|
|
| 8676 |
"init_mode": "gpt2",
|
| 8677 |
"normalization_type": null,
|
| 8678 |
"n_devices": 1,
|
| 8679 |
+
"attention_dir": "bidirectional",
|
| 8680 |
"attn_only": false,
|
| 8681 |
"seed": 0,
|
| 8682 |
+
"initializer_range": 0.09847319278346618,
|
| 8683 |
"init_weights": true,
|
| 8684 |
"scale_attn_by_inverse_layer_idx": false,
|
| 8685 |
"positional_embedding_type": "standard",
|
| 8686 |
"final_rms": false,
|
| 8687 |
+
"d_vocab_out": 11,
|
| 8688 |
"parallel_attn_mlp": false,
|
| 8689 |
"rotary_dim": null,
|
| 8690 |
+
"n_params": 20736,
|
| 8691 |
"use_hook_tokens": false,
|
| 8692 |
"gated_mlp": false,
|
| 8693 |
"default_prepend_bos": true,
|
|
|
|
| 8697 |
"post_embedding_ln": false,
|
| 8698 |
"rotary_base": 10000,
|
| 8699 |
"trust_remote_code": false,
|
| 8700 |
+
"rotary_adjacent_pairs": false,
|
| 8701 |
+
"load_in_4bit": false,
|
| 8702 |
+
"num_experts": null,
|
| 8703 |
+
"experts_per_token": null
|
| 8704 |
+
},
|
| 8705 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl",
|
| 8706 |
+
"training_args": {
|
| 8707 |
+
"output_dir": "/circuits-benchmark/results",
|
| 8708 |
+
"atol": 0.05,
|
| 8709 |
+
"lr": 0.001,
|
| 8710 |
+
"use_single_loss": true,
|
| 8711 |
+
"iit_weight": 1.0,
|
| 8712 |
+
"behavior_weight": 0.4,
|
| 8713 |
+
"strict_weight": 0.4,
|
| 8714 |
+
"epochs": 1000,
|
| 8715 |
+
"early_stop_accuracy_threshold": 99.9,
|
| 8716 |
+
"act_fn": "gelu",
|
| 8717 |
+
"use_wandb": true,
|
| 8718 |
+
"save_model_to_wandb": true,
|
| 8719 |
+
"clip_grad_norm": 0.1,
|
| 8720 |
+
"lr_scheduler": "linear",
|
| 8721 |
+
"model_pair": "strict",
|
| 8722 |
+
"same_size": false,
|
| 8723 |
+
"seed": 67,
|
| 8724 |
+
"batch_size": 256,
|
| 8725 |
+
"include_mlp": false,
|
| 8726 |
+
"detach_while_caching": true,
|
| 8727 |
+
"scheduler_val_metric": [
|
| 8728 |
+
"val/accuracy",
|
| 8729 |
+
"val/IIA",
|
| 8730 |
+
"val/strict_accuracy"
|
| 8731 |
+
],
|
| 8732 |
+
"siit_sampling": "sample_all",
|
| 8733 |
+
"val_iia_sampling": "all"
|
| 8734 |
+
},
|
| 8735 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json",
|
| 8736 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth",
|
| 8737 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl"
|
| 8738 |
+
},
|
| 8739 |
+
{
|
| 8740 |
+
"case_id": "121",
|
| 8741 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/121",
|
| 8742 |
+
"task_description": "Compute arcsine of all elements in the input sequence.",
|
| 8743 |
+
"vocab": [
|
| 8744 |
+
-1.0,
|
| 8745 |
+
-0.9,
|
| 8746 |
+
-0.8,
|
| 8747 |
+
-0.7,
|
| 8748 |
+
-0.6,
|
| 8749 |
+
-0.5,
|
| 8750 |
+
-0.4,
|
| 8751 |
+
-0.30000000000000004,
|
| 8752 |
+
-0.19999999999999996,
|
| 8753 |
+
-0.09999999999999998,
|
| 8754 |
+
0.0,
|
| 8755 |
+
0.10000000000000009,
|
| 8756 |
+
0.19999999999999996,
|
| 8757 |
+
0.30000000000000004,
|
| 8758 |
+
0.3999999999999999,
|
| 8759 |
+
0.5,
|
| 8760 |
+
0.6000000000000001,
|
| 8761 |
+
0.7,
|
| 8762 |
+
0.8,
|
| 8763 |
+
0.8999999999999999
|
| 8764 |
+
],
|
| 8765 |
+
"max_seq_len": 10,
|
| 8766 |
+
"min_seq_len": 4,
|
| 8767 |
+
"files": [
|
| 8768 |
+
{
|
| 8769 |
+
"file_name": "edges.pkl",
|
| 8770 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/edges.pkl"
|
| 8771 |
+
},
|
| 8772 |
+
{
|
| 8773 |
+
"file_name": "ll_model.pth",
|
| 8774 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model.pth"
|
| 8775 |
+
},
|
| 8776 |
+
{
|
| 8777 |
+
"file_name": "ll_model_cfg.pkl",
|
| 8778 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model_cfg.pkl"
|
| 8779 |
+
},
|
| 8780 |
+
{
|
| 8781 |
+
"file_name": "meta.json",
|
| 8782 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/meta.json"
|
| 8783 |
+
}
|
| 8784 |
+
],
|
| 8785 |
+
"transformer_cfg": {
|
| 8786 |
+
"n_layers": 2,
|
| 8787 |
+
"d_model": 4,
|
| 8788 |
+
"n_ctx": 10,
|
| 8789 |
+
"d_head": 1,
|
| 8790 |
+
"model_name": "custom",
|
| 8791 |
+
"n_heads": 4,
|
| 8792 |
+
"d_mlp": 16,
|
| 8793 |
+
"act_fn": "gelu",
|
| 8794 |
+
"d_vocab": 22,
|
| 8795 |
+
"eps": 1e-05,
|
| 8796 |
+
"use_attn_result": true,
|
| 8797 |
+
"use_attn_scale": true,
|
| 8798 |
+
"use_split_qkv_input": true,
|
| 8799 |
+
"use_hook_mlp_in": true,
|
| 8800 |
+
"use_attn_in": false,
|
| 8801 |
+
"use_local_attn": false,
|
| 8802 |
+
"original_architecture": null,
|
| 8803 |
+
"from_checkpoint": false,
|
| 8804 |
+
"checkpoint_index": null,
|
| 8805 |
+
"checkpoint_label_type": null,
|
| 8806 |
+
"checkpoint_value": null,
|
| 8807 |
+
"tokenizer_name": null,
|
| 8808 |
+
"window_size": null,
|
| 8809 |
+
"attn_types": null,
|
| 8810 |
+
"init_mode": "gpt2",
|
| 8811 |
+
"normalization_type": null,
|
| 8812 |
+
"n_devices": 1,
|
| 8813 |
+
"attention_dir": "causal",
|
| 8814 |
+
"attn_only": false,
|
| 8815 |
+
"seed": 0,
|
| 8816 |
+
"initializer_range": 0.11202240672224079,
|
| 8817 |
+
"init_weights": true,
|
| 8818 |
+
"scale_attn_by_inverse_layer_idx": false,
|
| 8819 |
+
"positional_embedding_type": "standard",
|
| 8820 |
+
"final_rms": false,
|
| 8821 |
+
"d_vocab_out": 20,
|
| 8822 |
+
"parallel_attn_mlp": false,
|
| 8823 |
+
"rotary_dim": null,
|
| 8824 |
+
"n_params": 384,
|
| 8825 |
+
"use_hook_tokens": false,
|
| 8826 |
+
"gated_mlp": false,
|
| 8827 |
+
"default_prepend_bos": true,
|
| 8828 |
+
"dtype": "torch.float32",
|
| 8829 |
+
"tokenizer_prepends_bos": null,
|
| 8830 |
+
"n_key_value_heads": null,
|
| 8831 |
+
"post_embedding_ln": false,
|
| 8832 |
+
"rotary_base": 10000,
|
| 8833 |
+
"trust_remote_code": false,
|
| 8834 |
+
"rotary_adjacent_pairs": false,
|
| 8835 |
+
"load_in_4bit": false,
|
| 8836 |
+
"num_experts": null,
|
| 8837 |
+
"experts_per_token": null
|
| 8838 |
+
},
|
| 8839 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model_cfg.pkl",
|
| 8840 |
+
"training_args": {
|
| 8841 |
+
"output_dir": "/circuits-benchmark/results",
|
| 8842 |
+
"atol": 0.05,
|
| 8843 |
+
"lr": 0.001,
|
| 8844 |
+
"use_single_loss": true,
|
| 8845 |
+
"iit_weight": 1.0,
|
| 8846 |
+
"behavior_weight": 0.4,
|
| 8847 |
+
"strict_weight": 1.0,
|
| 8848 |
+
"epochs": 1000,
|
| 8849 |
+
"early_stop_accuracy_threshold": 99.9,
|
| 8850 |
+
"act_fn": "gelu",
|
| 8851 |
+
"use_wandb": true,
|
| 8852 |
+
"save_model_to_wandb": true,
|
| 8853 |
+
"clip_grad_norm": 0.1,
|
| 8854 |
+
"lr_scheduler": "linear",
|
| 8855 |
+
"model_pair": "strict",
|
| 8856 |
+
"same_size": false,
|
| 8857 |
+
"seed": 67,
|
| 8858 |
+
"batch_size": 256,
|
| 8859 |
+
"include_mlp": false,
|
| 8860 |
+
"detach_while_caching": true,
|
| 8861 |
+
"scheduler_val_metric": [
|
| 8862 |
+
"val/accuracy",
|
| 8863 |
+
"val/IIA",
|
| 8864 |
+
"val/strict_accuracy"
|
| 8865 |
+
],
|
| 8866 |
+
"siit_sampling": "sample_all",
|
| 8867 |
+
"val_iia_sampling": "all"
|
| 8868 |
+
},
|
| 8869 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/meta.json",
|
| 8870 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model.pth",
|
| 8871 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/edges.pkl"
|
| 8872 |
+
},
|
| 8873 |
+
{
|
| 8874 |
+
"case_id": "35",
|
| 8875 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/35",
|
| 8876 |
+
"task_description": "Alternates capitalization of each character in words.",
|
| 8877 |
+
"vocab": [
|
| 8878 |
+
"J",
|
| 8879 |
+
"LB",
|
| 8880 |
+
"TPSI",
|
| 8881 |
+
"V",
|
| 8882 |
+
"b",
|
| 8883 |
+
"no",
|
| 8884 |
+
"oCLrZaW",
|
| 8885 |
+
"poiVg"
|
| 8886 |
+
],
|
| 8887 |
+
"max_seq_len": 10,
|
| 8888 |
+
"min_seq_len": 4,
|
| 8889 |
+
"files": [
|
| 8890 |
+
{
|
| 8891 |
+
"file_name": "edges.pkl",
|
| 8892 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/edges.pkl"
|
| 8893 |
+
},
|
| 8894 |
+
{
|
| 8895 |
+
"file_name": "ll_model.pth",
|
| 8896 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model.pth"
|
| 8897 |
+
},
|
| 8898 |
+
{
|
| 8899 |
+
"file_name": "ll_model_cfg.pkl",
|
| 8900 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl"
|
| 8901 |
+
},
|
| 8902 |
+
{
|
| 8903 |
+
"file_name": "meta.json",
|
| 8904 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/meta.json"
|
| 8905 |
+
}
|
| 8906 |
+
],
|
| 8907 |
+
"transformer_cfg": {
|
| 8908 |
+
"n_layers": 2,
|
| 8909 |
+
"d_model": 9,
|
| 8910 |
+
"n_ctx": 10,
|
| 8911 |
+
"d_head": 2,
|
| 8912 |
+
"model_name": "custom",
|
| 8913 |
+
"n_heads": 4,
|
| 8914 |
+
"d_mlp": 36,
|
| 8915 |
+
"act_fn": "gelu",
|
| 8916 |
+
"d_vocab": 10,
|
| 8917 |
+
"eps": 1e-05,
|
| 8918 |
+
"use_attn_result": true,
|
| 8919 |
+
"use_attn_scale": true,
|
| 8920 |
+
"use_split_qkv_input": true,
|
| 8921 |
+
"use_hook_mlp_in": true,
|
| 8922 |
+
"use_attn_in": false,
|
| 8923 |
+
"use_local_attn": false,
|
| 8924 |
+
"original_architecture": null,
|
| 8925 |
+
"from_checkpoint": false,
|
| 8926 |
+
"checkpoint_index": null,
|
| 8927 |
+
"checkpoint_label_type": null,
|
| 8928 |
+
"checkpoint_value": null,
|
| 8929 |
+
"tokenizer_name": null,
|
| 8930 |
+
"window_size": null,
|
| 8931 |
+
"attn_types": null,
|
| 8932 |
+
"init_mode": "gpt2",
|
| 8933 |
+
"normalization_type": null,
|
| 8934 |
+
"n_devices": 1,
|
| 8935 |
+
"attention_dir": "causal",
|
| 8936 |
+
"attn_only": false,
|
| 8937 |
+
"seed": 0,
|
| 8938 |
+
"initializer_range": 0.1539600717839002,
|
| 8939 |
+
"init_weights": true,
|
| 8940 |
+
"scale_attn_by_inverse_layer_idx": false,
|
| 8941 |
+
"positional_embedding_type": "standard",
|
| 8942 |
+
"final_rms": false,
|
| 8943 |
+
"d_vocab_out": 8,
|
| 8944 |
+
"parallel_attn_mlp": false,
|
| 8945 |
+
"rotary_dim": null,
|
| 8946 |
+
"n_params": 1872,
|
| 8947 |
+
"use_hook_tokens": false,
|
| 8948 |
+
"gated_mlp": false,
|
| 8949 |
+
"default_prepend_bos": true,
|
| 8950 |
+
"dtype": "torch.float32",
|
| 8951 |
+
"tokenizer_prepends_bos": null,
|
| 8952 |
+
"n_key_value_heads": null,
|
| 8953 |
+
"post_embedding_ln": false,
|
| 8954 |
+
"rotary_base": 10000,
|
| 8955 |
+
"trust_remote_code": false,
|
| 8956 |
+
"rotary_adjacent_pairs": false
|
| 8957 |
+
},
|
| 8958 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl",
|
| 8959 |
"training_args": {
|
| 8960 |
"atol": 0.05,
|
| 8961 |
"lr": 0.01,
|
|
|
|
| 9060 |
"lr": 0.01,
|
| 9061 |
"use_single_loss": false,
|
| 9062 |
"iit_weight": 1.0,
|
| 9063 |
+
"behavior_weight": 1.0,
|
| 9064 |
+
"strict_weight": 10.0,
|
| 9065 |
+
"epochs": 2000,
|
| 9066 |
+
"act_fn": "gelu",
|
| 9067 |
+
"clip_grad_norm": 0.1,
|
| 9068 |
+
"lr_scheduler": "",
|
| 9069 |
+
"model_pair": "strict",
|
| 9070 |
+
"same_size": false
|
| 9071 |
+
},
|
| 9072 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/meta.json",
|
| 9073 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model.pth",
|
| 9074 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/edges.pkl"
|
| 9075 |
+
},
|
| 9076 |
+
{
|
| 9077 |
+
"case_id": "36",
|
| 9078 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/36",
|
| 9079 |
+
"task_description": "Classifies each token as 'positive', 'negative', or 'neutral' based on emojis.",
|
| 9080 |
+
"vocab": [
|
| 9081 |
+
"\ud83d\udcd8",
|
| 9082 |
+
"\ud83d\ude0a",
|
| 9083 |
+
"\ud83d\ude22"
|
| 9084 |
+
],
|
| 9085 |
+
"max_seq_len": 10,
|
| 9086 |
+
"min_seq_len": 4,
|
| 9087 |
+
"files": [
|
| 9088 |
+
{
|
| 9089 |
+
"file_name": "edges.pkl",
|
| 9090 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl"
|
| 9091 |
+
},
|
| 9092 |
+
{
|
| 9093 |
+
"file_name": "ll_model.pth",
|
| 9094 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth"
|
| 9095 |
+
},
|
| 9096 |
+
{
|
| 9097 |
+
"file_name": "ll_model_cfg.pkl",
|
| 9098 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl"
|
| 9099 |
+
},
|
| 9100 |
+
{
|
| 9101 |
+
"file_name": "meta.json",
|
| 9102 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json"
|
| 9103 |
+
}
|
| 9104 |
+
],
|
| 9105 |
+
"transformer_cfg": {
|
| 9106 |
+
"n_layers": 2,
|
| 9107 |
+
"d_model": 6,
|
| 9108 |
+
"n_ctx": 10,
|
| 9109 |
+
"d_head": 1,
|
| 9110 |
+
"model_name": "custom",
|
| 9111 |
+
"n_heads": 4,
|
| 9112 |
+
"d_mlp": 24,
|
| 9113 |
+
"act_fn": "gelu",
|
| 9114 |
+
"d_vocab": 5,
|
| 9115 |
+
"eps": 1e-05,
|
| 9116 |
+
"use_attn_result": true,
|
| 9117 |
+
"use_attn_scale": true,
|
| 9118 |
+
"use_split_qkv_input": true,
|
| 9119 |
+
"use_hook_mlp_in": true,
|
| 9120 |
+
"use_attn_in": false,
|
| 9121 |
+
"use_local_attn": false,
|
| 9122 |
+
"original_architecture": null,
|
| 9123 |
+
"from_checkpoint": false,
|
| 9124 |
+
"checkpoint_index": null,
|
| 9125 |
+
"checkpoint_label_type": null,
|
| 9126 |
+
"checkpoint_value": null,
|
| 9127 |
+
"tokenizer_name": null,
|
| 9128 |
+
"window_size": null,
|
| 9129 |
+
"attn_types": null,
|
| 9130 |
+
"init_mode": "gpt2",
|
| 9131 |
+
"normalization_type": null,
|
| 9132 |
+
"n_devices": 1,
|
| 9133 |
+
"attention_dir": "causal",
|
| 9134 |
+
"attn_only": false,
|
| 9135 |
+
"seed": 0,
|
| 9136 |
+
"initializer_range": 0.19402850002906638,
|
| 9137 |
+
"init_weights": true,
|
| 9138 |
+
"scale_attn_by_inverse_layer_idx": false,
|
| 9139 |
+
"positional_embedding_type": "standard",
|
| 9140 |
+
"final_rms": false,
|
| 9141 |
+
"d_vocab_out": 3,
|
| 9142 |
+
"parallel_attn_mlp": false,
|
| 9143 |
+
"rotary_dim": null,
|
| 9144 |
+
"n_params": 768,
|
| 9145 |
+
"use_hook_tokens": false,
|
| 9146 |
+
"gated_mlp": false,
|
| 9147 |
+
"default_prepend_bos": true,
|
| 9148 |
+
"dtype": "torch.float32",
|
| 9149 |
+
"tokenizer_prepends_bos": null,
|
| 9150 |
+
"n_key_value_heads": null,
|
| 9151 |
+
"post_embedding_ln": false,
|
| 9152 |
+
"rotary_base": 10000,
|
| 9153 |
+
"trust_remote_code": false,
|
| 9154 |
+
"rotary_adjacent_pairs": false
|
| 9155 |
+
},
|
| 9156 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl",
|
| 9157 |
+
"training_args": {
|
| 9158 |
+
"atol": 0.05,
|
| 9159 |
+
"lr": 0.01,
|
| 9160 |
+
"use_single_loss": false,
|
| 9161 |
+
"iit_weight": 1.0,
|
| 9162 |
+
"behavior_weight": 1.0,
|
| 9163 |
+
"strict_weight": 1.0,
|
| 9164 |
+
"epochs": 2000,
|
| 9165 |
+
"act_fn": "gelu",
|
| 9166 |
+
"clip_grad_norm": 0.1,
|
| 9167 |
+
"lr_scheduler": "",
|
| 9168 |
+
"model_pair": "strict"
|
| 9169 |
+
},
|
| 9170 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json",
|
| 9171 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth",
|
| 9172 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl"
|
| 9173 |
+
},
|
| 9174 |
+
{
|
| 9175 |
+
"case_id": "106",
|
| 9176 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/106",
|
| 9177 |
+
"task_description": "Sets all elements to zero except for the element at index 1.",
|
| 9178 |
+
"vocab": [
|
| 9179 |
+
0,
|
| 9180 |
+
1,
|
| 9181 |
+
2,
|
| 9182 |
+
3,
|
| 9183 |
+
4,
|
| 9184 |
+
5,
|
| 9185 |
+
6,
|
| 9186 |
+
7,
|
| 9187 |
+
8,
|
| 9188 |
+
9,
|
| 9189 |
+
10
|
| 9190 |
+
],
|
| 9191 |
+
"max_seq_len": 10,
|
| 9192 |
+
"min_seq_len": 4,
|
| 9193 |
+
"files": [
|
| 9194 |
+
{
|
| 9195 |
+
"file_name": "edges.pkl",
|
| 9196 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/edges.pkl"
|
| 9197 |
+
},
|
| 9198 |
+
{
|
| 9199 |
+
"file_name": "ll_model.pth",
|
| 9200 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model.pth"
|
| 9201 |
+
},
|
| 9202 |
+
{
|
| 9203 |
+
"file_name": "ll_model_cfg.pkl",
|
| 9204 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model_cfg.pkl"
|
| 9205 |
+
},
|
| 9206 |
+
{
|
| 9207 |
+
"file_name": "meta.json",
|
| 9208 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/meta.json"
|
| 9209 |
+
}
|
| 9210 |
+
],
|
| 9211 |
+
"transformer_cfg": {
|
| 9212 |
+
"n_layers": 2,
|
| 9213 |
+
"d_model": 4,
|
| 9214 |
+
"n_ctx": 10,
|
| 9215 |
+
"d_head": 1,
|
| 9216 |
+
"model_name": "custom",
|
| 9217 |
+
"n_heads": 4,
|
| 9218 |
+
"d_mlp": 16,
|
| 9219 |
+
"act_fn": "gelu",
|
| 9220 |
+
"d_vocab": 13,
|
| 9221 |
+
"eps": 1e-05,
|
| 9222 |
+
"use_attn_result": true,
|
| 9223 |
+
"use_attn_scale": true,
|
| 9224 |
+
"use_split_qkv_input": true,
|
| 9225 |
+
"use_hook_mlp_in": true,
|
| 9226 |
+
"use_attn_in": false,
|
| 9227 |
+
"use_local_attn": false,
|
| 9228 |
+
"original_architecture": null,
|
| 9229 |
+
"from_checkpoint": false,
|
| 9230 |
+
"checkpoint_index": null,
|
| 9231 |
+
"checkpoint_label_type": null,
|
| 9232 |
+
"checkpoint_value": null,
|
| 9233 |
+
"tokenizer_name": null,
|
| 9234 |
+
"window_size": null,
|
| 9235 |
+
"attn_types": null,
|
| 9236 |
+
"init_mode": "gpt2",
|
| 9237 |
+
"normalization_type": null,
|
| 9238 |
+
"n_devices": 1,
|
| 9239 |
+
"attention_dir": "causal",
|
| 9240 |
+
"attn_only": false,
|
| 9241 |
+
"seed": 0,
|
| 9242 |
+
"initializer_range": 0.13719886811400708,
|
| 9243 |
+
"init_weights": true,
|
| 9244 |
+
"scale_attn_by_inverse_layer_idx": false,
|
| 9245 |
+
"positional_embedding_type": "standard",
|
| 9246 |
+
"final_rms": false,
|
| 9247 |
+
"d_vocab_out": 11,
|
| 9248 |
+
"parallel_attn_mlp": false,
|
| 9249 |
+
"rotary_dim": null,
|
| 9250 |
+
"n_params": 384,
|
| 9251 |
+
"use_hook_tokens": false,
|
| 9252 |
+
"gated_mlp": false,
|
| 9253 |
+
"default_prepend_bos": true,
|
| 9254 |
+
"dtype": "torch.float32",
|
| 9255 |
+
"tokenizer_prepends_bos": null,
|
| 9256 |
+
"n_key_value_heads": null,
|
| 9257 |
+
"post_embedding_ln": false,
|
| 9258 |
+
"rotary_base": 10000,
|
| 9259 |
+
"trust_remote_code": false,
|
| 9260 |
+
"rotary_adjacent_pairs": false,
|
| 9261 |
+
"load_in_4bit": false,
|
| 9262 |
+
"num_experts": null,
|
| 9263 |
+
"experts_per_token": null
|
| 9264 |
+
},
|
| 9265 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model_cfg.pkl",
|
| 9266 |
+
"training_args": {
|
| 9267 |
+
"output_dir": "/circuits-benchmark/results",
|
| 9268 |
+
"atol": 0.05,
|
| 9269 |
+
"lr": 0.001,
|
| 9270 |
+
"use_single_loss": true,
|
| 9271 |
+
"iit_weight": 1.0,
|
| 9272 |
+
"behavior_weight": 0.4,
|
| 9273 |
+
"strict_weight": 0.7,
|
| 9274 |
+
"epochs": 1000,
|
| 9275 |
+
"early_stop_accuracy_threshold": 99.9,
|
| 9276 |
"act_fn": "gelu",
|
| 9277 |
+
"use_wandb": true,
|
| 9278 |
+
"save_model_to_wandb": true,
|
| 9279 |
"clip_grad_norm": 0.1,
|
| 9280 |
+
"lr_scheduler": "linear",
|
| 9281 |
"model_pair": "strict",
|
| 9282 |
+
"same_size": false,
|
| 9283 |
+
"seed": 92,
|
| 9284 |
+
"batch_size": 256,
|
| 9285 |
+
"include_mlp": false,
|
| 9286 |
+
"detach_while_caching": true,
|
| 9287 |
+
"scheduler_val_metric": [
|
| 9288 |
+
"val/accuracy",
|
| 9289 |
+
"val/IIA",
|
| 9290 |
+
"val/strict_accuracy"
|
| 9291 |
+
],
|
| 9292 |
+
"siit_sampling": "sample_all",
|
| 9293 |
+
"val_iia_sampling": "all"
|
| 9294 |
},
|
| 9295 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/meta.json",
|
| 9296 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model.pth",
|
| 9297 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/edges.pkl"
|
| 9298 |
},
|
| 9299 |
{
|
| 9300 |
+
"case_id": "64",
|
| 9301 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/64",
|
| 9302 |
+
"task_description": "Cubes each element in the sequence.",
|
| 9303 |
"vocab": [
|
| 9304 |
+
0,
|
| 9305 |
+
1,
|
| 9306 |
+
2,
|
| 9307 |
+
3,
|
| 9308 |
+
4,
|
| 9309 |
+
5,
|
| 9310 |
+
6,
|
| 9311 |
+
7,
|
| 9312 |
+
8,
|
| 9313 |
+
9,
|
| 9314 |
+
10
|
| 9315 |
],
|
| 9316 |
"max_seq_len": 10,
|
| 9317 |
"min_seq_len": 4,
|
| 9318 |
"files": [
|
| 9319 |
{
|
| 9320 |
"file_name": "edges.pkl",
|
| 9321 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl"
|
| 9322 |
},
|
| 9323 |
{
|
| 9324 |
"file_name": "ll_model.pth",
|
| 9325 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth"
|
| 9326 |
},
|
| 9327 |
{
|
| 9328 |
"file_name": "ll_model_cfg.pkl",
|
| 9329 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl"
|
| 9330 |
},
|
| 9331 |
{
|
| 9332 |
"file_name": "meta.json",
|
| 9333 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json"
|
| 9334 |
}
|
| 9335 |
],
|
| 9336 |
"transformer_cfg": {
|
| 9337 |
"n_layers": 2,
|
| 9338 |
+
"d_model": 4,
|
| 9339 |
"n_ctx": 10,
|
| 9340 |
"d_head": 1,
|
| 9341 |
"model_name": "custom",
|
| 9342 |
"n_heads": 4,
|
| 9343 |
+
"d_mlp": 16,
|
| 9344 |
"act_fn": "gelu",
|
| 9345 |
+
"d_vocab": 13,
|
| 9346 |
"eps": 1e-05,
|
| 9347 |
"use_attn_result": true,
|
| 9348 |
"use_attn_scale": true,
|
|
|
|
| 9364 |
"attention_dir": "causal",
|
| 9365 |
"attn_only": false,
|
| 9366 |
"seed": 0,
|
| 9367 |
+
"initializer_range": 0.1392621247645583,
|
| 9368 |
"init_weights": true,
|
| 9369 |
"scale_attn_by_inverse_layer_idx": false,
|
| 9370 |
"positional_embedding_type": "standard",
|
| 9371 |
"final_rms": false,
|
| 9372 |
+
"d_vocab_out": 11,
|
| 9373 |
"parallel_attn_mlp": false,
|
| 9374 |
"rotary_dim": null,
|
| 9375 |
+
"n_params": 384,
|
| 9376 |
"use_hook_tokens": false,
|
| 9377 |
"gated_mlp": false,
|
| 9378 |
"default_prepend_bos": true,
|
|
|
|
| 9382 |
"post_embedding_ln": false,
|
| 9383 |
"rotary_base": 10000,
|
| 9384 |
"trust_remote_code": false,
|
| 9385 |
+
"rotary_adjacent_pairs": false,
|
| 9386 |
+
"load_in_4bit": false,
|
| 9387 |
+
"num_experts": null,
|
| 9388 |
+
"experts_per_token": null
|
| 9389 |
},
|
| 9390 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl",
|
| 9391 |
"training_args": {
|
| 9392 |
+
"output_dir": "/circuits-benchmark/results",
|
| 9393 |
"atol": 0.05,
|
| 9394 |
+
"lr": 0.001,
|
| 9395 |
+
"use_single_loss": true,
|
| 9396 |
"iit_weight": 1.0,
|
| 9397 |
+
"behavior_weight": 0.4,
|
| 9398 |
+
"strict_weight": 0.7,
|
| 9399 |
+
"epochs": 1000,
|
| 9400 |
+
"early_stop_accuracy_threshold": 99.9,
|
| 9401 |
"act_fn": "gelu",
|
| 9402 |
+
"use_wandb": true,
|
| 9403 |
+
"save_model_to_wandb": true,
|
| 9404 |
"clip_grad_norm": 0.1,
|
| 9405 |
+
"lr_scheduler": "linear",
|
| 9406 |
+
"model_pair": "strict",
|
| 9407 |
+
"same_size": false,
|
| 9408 |
+
"seed": 67,
|
| 9409 |
+
"batch_size": 256,
|
| 9410 |
+
"include_mlp": false,
|
| 9411 |
+
"detach_while_caching": true,
|
| 9412 |
+
"scheduler_val_metric": [
|
| 9413 |
+
"val/accuracy",
|
| 9414 |
+
"val/IIA",
|
| 9415 |
+
"val/strict_accuracy"
|
| 9416 |
+
],
|
| 9417 |
+
"siit_sampling": "sample_all",
|
| 9418 |
+
"val_iia_sampling": "all"
|
| 9419 |
},
|
| 9420 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json",
|
| 9421 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth",
|
| 9422 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl"
|
| 9423 |
},
|
| 9424 |
{
|
| 9425 |
+
"case_id": "8",
|
| 9426 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/8",
|
| 9427 |
+
"task_description": "Identity",
|
| 9428 |
"vocab": [
|
| 9429 |
0,
|
| 9430 |
1,
|
|
|
|
| 9443 |
"files": [
|
| 9444 |
{
|
| 9445 |
"file_name": "edges.pkl",
|
| 9446 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl"
|
| 9447 |
},
|
| 9448 |
{
|
| 9449 |
"file_name": "ll_model.pth",
|
| 9450 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth"
|
| 9451 |
},
|
| 9452 |
{
|
| 9453 |
"file_name": "ll_model_cfg.pkl",
|
| 9454 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl"
|
| 9455 |
},
|
| 9456 |
{
|
| 9457 |
"file_name": "meta.json",
|
| 9458 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json"
|
| 9459 |
}
|
| 9460 |
],
|
| 9461 |
"transformer_cfg": {
|
|
|
|
| 9512 |
"num_experts": null,
|
| 9513 |
"experts_per_token": null
|
| 9514 |
},
|
| 9515 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl",
|
| 9516 |
"training_args": {
|
| 9517 |
"output_dir": "/circuits-benchmark/results",
|
| 9518 |
"atol": 0.05,
|
|
|
|
| 9542 |
"siit_sampling": "sample_all",
|
| 9543 |
"val_iia_sampling": "all"
|
| 9544 |
},
|
| 9545 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json",
|
| 9546 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth",
|
| 9547 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl"
|
| 9548 |
},
|
| 9549 |
{
|
| 9550 |
+
"case_id": "73",
|
| 9551 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/73",
|
| 9552 |
+
"task_description": "Apply the sine function to each element of the input sequence.",
|
| 9553 |
"vocab": [
|
| 9554 |
0,
|
| 9555 |
1,
|
|
|
|
| 9568 |
"files": [
|
| 9569 |
{
|
| 9570 |
"file_name": "edges.pkl",
|
| 9571 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/edges.pkl"
|
| 9572 |
},
|
| 9573 |
{
|
| 9574 |
"file_name": "ll_model.pth",
|
| 9575 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model.pth"
|
| 9576 |
},
|
| 9577 |
{
|
| 9578 |
"file_name": "ll_model_cfg.pkl",
|
| 9579 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model_cfg.pkl"
|
| 9580 |
},
|
| 9581 |
{
|
| 9582 |
"file_name": "meta.json",
|
| 9583 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/meta.json"
|
| 9584 |
}
|
| 9585 |
],
|
| 9586 |
"transformer_cfg": {
|
|
|
|
| 9637 |
"num_experts": null,
|
| 9638 |
"experts_per_token": null
|
| 9639 |
},
|
| 9640 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model_cfg.pkl",
|
| 9641 |
"training_args": {
|
| 9642 |
"output_dir": "/circuits-benchmark/results",
|
| 9643 |
"atol": 0.05,
|
|
|
|
| 9655 |
"lr_scheduler": "linear",
|
| 9656 |
"model_pair": "strict",
|
| 9657 |
"same_size": false,
|
| 9658 |
+
"seed": 92,
|
| 9659 |
"batch_size": 256,
|
| 9660 |
"include_mlp": false,
|
| 9661 |
"detach_while_caching": true,
|
|
|
|
| 9667 |
"siit_sampling": "sample_all",
|
| 9668 |
"val_iia_sampling": "all"
|
| 9669 |
},
|
| 9670 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/meta.json",
|
| 9671 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model.pth",
|
| 9672 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/edges.pkl"
|
| 9673 |
},
|
| 9674 |
{
|
| 9675 |
"case_id": "103",
|
|
|
|
| 10046 |
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model.pth",
|
| 10047 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/edges.pkl"
|
| 10048 |
},
|
| 10049 |
+
{
|
| 10050 |
+
"case_id": "49",
|
| 10051 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/49",
|
| 10052 |
+
"task_description": "Decrements each element in the sequence until it becomes a multiple of 3.",
|
| 10053 |
+
"vocab": [
|
| 10054 |
+
0,
|
| 10055 |
+
1,
|
| 10056 |
+
2,
|
| 10057 |
+
3,
|
| 10058 |
+
4,
|
| 10059 |
+
5,
|
| 10060 |
+
6,
|
| 10061 |
+
7,
|
| 10062 |
+
8,
|
| 10063 |
+
9,
|
| 10064 |
+
10
|
| 10065 |
+
],
|
| 10066 |
+
"max_seq_len": 10,
|
| 10067 |
+
"min_seq_len": 4,
|
| 10068 |
+
"files": [
|
| 10069 |
+
{
|
| 10070 |
+
"file_name": "edges.pkl",
|
| 10071 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/edges.pkl"
|
| 10072 |
+
},
|
| 10073 |
+
{
|
| 10074 |
+
"file_name": "ll_model.pth",
|
| 10075 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model.pth"
|
| 10076 |
+
},
|
| 10077 |
+
{
|
| 10078 |
+
"file_name": "ll_model_cfg.pkl",
|
| 10079 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model_cfg.pkl"
|
| 10080 |
+
},
|
| 10081 |
+
{
|
| 10082 |
+
"file_name": "meta.json",
|
| 10083 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/meta.json"
|
| 10084 |
+
}
|
| 10085 |
+
],
|
| 10086 |
+
"transformer_cfg": {
|
| 10087 |
+
"n_layers": 2,
|
| 10088 |
+
"d_model": 4,
|
| 10089 |
+
"n_ctx": 10,
|
| 10090 |
+
"d_head": 1,
|
| 10091 |
+
"model_name": "custom",
|
| 10092 |
+
"n_heads": 4,
|
| 10093 |
+
"d_mlp": 16,
|
| 10094 |
+
"act_fn": "gelu",
|
| 10095 |
+
"d_vocab": 13,
|
| 10096 |
+
"eps": 1e-05,
|
| 10097 |
+
"use_attn_result": true,
|
| 10098 |
+
"use_attn_scale": true,
|
| 10099 |
+
"use_split_qkv_input": true,
|
| 10100 |
+
"use_hook_mlp_in": true,
|
| 10101 |
+
"use_attn_in": false,
|
| 10102 |
+
"use_local_attn": false,
|
| 10103 |
+
"original_architecture": null,
|
| 10104 |
+
"from_checkpoint": false,
|
| 10105 |
+
"checkpoint_index": null,
|
| 10106 |
+
"checkpoint_label_type": null,
|
| 10107 |
+
"checkpoint_value": null,
|
| 10108 |
+
"tokenizer_name": null,
|
| 10109 |
+
"window_size": null,
|
| 10110 |
+
"attn_types": null,
|
| 10111 |
+
"init_mode": "gpt2",
|
| 10112 |
+
"normalization_type": null,
|
| 10113 |
+
"n_devices": 1,
|
| 10114 |
+
"attention_dir": "causal",
|
| 10115 |
+
"attn_only": false,
|
| 10116 |
+
"seed": 0,
|
| 10117 |
+
"initializer_range": 0.15689290811054724,
|
| 10118 |
+
"init_weights": true,
|
| 10119 |
+
"scale_attn_by_inverse_layer_idx": false,
|
| 10120 |
+
"positional_embedding_type": "standard",
|
| 10121 |
+
"final_rms": false,
|
| 10122 |
+
"d_vocab_out": 4,
|
| 10123 |
+
"parallel_attn_mlp": false,
|
| 10124 |
+
"rotary_dim": null,
|
| 10125 |
+
"n_params": 384,
|
| 10126 |
+
"use_hook_tokens": false,
|
| 10127 |
+
"gated_mlp": false,
|
| 10128 |
+
"default_prepend_bos": true,
|
| 10129 |
+
"dtype": "torch.float32",
|
| 10130 |
+
"tokenizer_prepends_bos": null,
|
| 10131 |
+
"n_key_value_heads": null,
|
| 10132 |
+
"post_embedding_ln": false,
|
| 10133 |
+
"rotary_base": 10000,
|
| 10134 |
+
"trust_remote_code": false,
|
| 10135 |
+
"rotary_adjacent_pairs": false,
|
| 10136 |
+
"load_in_4bit": false,
|
| 10137 |
+
"num_experts": null,
|
| 10138 |
+
"experts_per_token": null
|
| 10139 |
+
},
|
| 10140 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model_cfg.pkl",
|
| 10141 |
+
"training_args": {
|
| 10142 |
+
"output_dir": "/circuits-benchmark/results",
|
| 10143 |
+
"atol": 0.05,
|
| 10144 |
+
"lr": 0.001,
|
| 10145 |
+
"use_single_loss": true,
|
| 10146 |
+
"iit_weight": 1.0,
|
| 10147 |
+
"behavior_weight": 0.4,
|
| 10148 |
+
"strict_weight": 0.7,
|
| 10149 |
+
"epochs": 1000,
|
| 10150 |
+
"early_stop_accuracy_threshold": 99.9,
|
| 10151 |
+
"act_fn": "gelu",
|
| 10152 |
+
"use_wandb": true,
|
| 10153 |
+
"save_model_to_wandb": true,
|
| 10154 |
+
"clip_grad_norm": 0.1,
|
| 10155 |
+
"lr_scheduler": "linear",
|
| 10156 |
+
"model_pair": "strict",
|
| 10157 |
+
"same_size": false,
|
| 10158 |
+
"seed": 92,
|
| 10159 |
+
"batch_size": 256,
|
| 10160 |
+
"include_mlp": false,
|
| 10161 |
+
"detach_while_caching": true,
|
| 10162 |
+
"scheduler_val_metric": [
|
| 10163 |
+
"val/accuracy",
|
| 10164 |
+
"val/IIA",
|
| 10165 |
+
"val/strict_accuracy"
|
| 10166 |
+
],
|
| 10167 |
+
"siit_sampling": "sample_all",
|
| 10168 |
+
"val_iia_sampling": "all"
|
| 10169 |
+
},
|
| 10170 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/meta.json",
|
| 10171 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model.pth",
|
| 10172 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/edges.pkl"
|
| 10173 |
+
},
|
| 10174 |
{
|
| 10175 |
"case_id": "46",
|
| 10176 |
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/46",
|