Add new models
#16
by
iarcuschin
- opened
- 106/edges.pkl +3 -0
- 106/ll_model.pth +3 -0
- 106/ll_model_cfg.pkl +3 -0
- 106/meta.json +1 -0
- 121/edges.pkl +3 -0
- 121/ll_model.pth +3 -0
- 121/ll_model_cfg.pkl +3 -0
- 121/meta.json +1 -0
- 130/edges.pkl +3 -0
- 130/ll_model.pth +3 -0
- 130/ll_model_cfg.pkl +3 -0
- 130/meta.json +1 -0
- 15/edges.pkl +3 -0
- 15/ll_model.pth +3 -0
- 15/ll_model_cfg.pkl +3 -0
- 15/meta.json +1 -0
- 41/edges.pkl +3 -0
- 41/ll_model.pth +3 -0
- 41/ll_model_cfg.pkl +3 -0
- 41/meta.json +1 -0
- 43/edges.pkl +3 -0
- 43/ll_model.pth +3 -0
- 43/ll_model_cfg.pkl +3 -0
- 43/meta.json +1 -0
- 49/edges.pkl +3 -0
- 49/ll_model.pth +3 -0
- 49/ll_model_cfg.pkl +3 -0
- 49/meta.json +1 -0
- 66/edges.pkl +3 -0
- 66/ll_model.pth +3 -0
- 66/ll_model_cfg.pkl +3 -0
- 66/meta.json +1 -0
- 68/edges.pkl +3 -0
- 68/ll_model.pth +3 -0
- 68/ll_model_cfg.pkl +3 -0
- 68/meta.json +1 -0
- 73/edges.pkl +3 -0
- 73/ll_model.pth +3 -0
- 73/ll_model_cfg.pkl +3 -0
- 73/meta.json +1 -0
- benchmark_cases_metadata.csv +10 -0
- benchmark_cases_metadata.parquet +2 -2
- benchmark_metadata.json +1455 -156
106/edges.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fda9b02cdb2f5d7252c229a12290c6d81381606b1bfad02979549f304bf2a5d0
|
3 |
+
size 134
|
106/ll_model.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:580798eae1391aca366f15c0442c3ef1c02b1b323d610d1d9ddee0faee5e664f
|
3 |
+
size 14698
|
106/ll_model_cfg.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:24bca874c32c8c431cdb732e3222b4090604cde6f05ce1359710b630220650e3
|
3 |
+
size 1093
|
106/meta.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 0.7, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-92-siit-weigth-0.7", "wandb_name": "case-106-seed-92-s-0.7-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 92, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
121/edges.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
|
3 |
+
size 113
|
121/ll_model.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8054e00aea3c35c5ee77c693f9feeba493c499fe3218e70780137938138a4675
|
3 |
+
size 15118
|
121/ll_model_cfg.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9f027ad4de6828c6f5bb7a3f3c8aabd9658526e33b2284eba366977823b89c0a
|
3 |
+
size 1093
|
121/meta.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-121-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
130/edges.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af2a7430f7477a79df1fce6300cf37e1c46d73c31a7f91e06221ef4a6ebf9bed
|
3 |
+
size 223
|
130/ll_model.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4be63b6e0776e45f04d0905702a3a520b2b6449691ae6e34b8504693ac6805be
|
3 |
+
size 21304
|
130/ll_model_cfg.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:192503b894021c736145328500ab1f316e60ed7a121cf04b089bcd05d04e50b4
|
3 |
+
size 1093
|
130/meta.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-130-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
15/edges.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ecc8ce1a212f987b85ec909238ebc7d01d36c58389391fc96d69ca007fa2d384
|
3 |
+
size 244
|
15/ll_model.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:22ff8d1015f06b8912051e6787ba4e058047facdaadd1d9322e7e89c070c131f
|
3 |
+
size 20728
|
15/ll_model_cfg.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f4162b8d5712db86a2025499b1561c655fd97402716ff352305c296c7a04ff65
|
3 |
+
size 1093
|
15/meta.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-15-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
41/edges.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
|
3 |
+
size 113
|
41/ll_model.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7d59c31ceb0d0c9afb12dc1f63ade3c4f9edba0dfd80d5779ae27188da2c21d8
|
3 |
+
size 14862
|
41/ll_model_cfg.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f1dee34cba288862b06c2ff669839e06b6c17aa46cdb685f4a2c5a8c3be8a39b
|
3 |
+
size 1093
|
41/meta.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-41-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
43/edges.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
|
3 |
+
size 113
|
43/ll_model.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:26cc6d6ffa5ae93ce73055d831d4a7119bca2166c2ed9731992c48b4b3debb49
|
3 |
+
size 15054
|
43/ll_model_cfg.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89a74c42552b846f4562163c6fe74a474edfa36e1972eb97bb3ce0d8aaf9444c
|
3 |
+
size 1093
|
43/meta.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-43-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
49/edges.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
|
3 |
+
size 113
|
49/ll_model.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:aab9be464531a3cf85f25e3ccb3153c15b6de9876d56799d8705d0784979a1ea
|
3 |
+
size 14634
|
49/ll_model_cfg.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2e47363d4486f828a419ba208bee3a725d431ab80e418a8318f55cf6cd6bf310
|
3 |
+
size 1093
|
49/meta.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 0.7, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-92-siit-weigth-0.7", "wandb_name": "case-49-seed-92-s-0.7-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 92, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
66/edges.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
|
3 |
+
size 113
|
66/ll_model.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fa63d9e5b124ffb9ce9061e04b03b1ff551c8085fc51ddea31f488b152f5f7c3
|
3 |
+
size 14762
|
66/ll_model_cfg.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b04d734fcc61084204ead0d8cc11c5782598f6f6e4bf3e14b94eab7b0bc9d676
|
3 |
+
size 1093
|
66/meta.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 0.7, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-92-siit-weigth-0.7", "wandb_name": "case-66-seed-92-s-0.7-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 92, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
68/edges.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
|
3 |
+
size 113
|
68/ll_model.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a1b739ebc05faa4d388c20ef60ab59e44695c4a82323ed7c9c3801ae8e502db9
|
3 |
+
size 14670
|
68/ll_model_cfg.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:be188cb9baf70c65af2c4ecf92c6de170c15a41599109f95c6b632f15bb3eec3
|
3 |
+
size 1093
|
68/meta.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-68-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
73/edges.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
|
3 |
+
size 113
|
73/ll_model.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:809fe1d4c9f818bac9a85b358d0722f6ed8527d56f988fe66d62f0eceac0f097
|
3 |
+
size 14698
|
73/ll_model_cfg.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:db76917a80935813594508b1d79b7a0836a20daf67e263161432430b095fd111
|
3 |
+
size 1093
|
73/meta.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 0.7, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-92-siit-weigth-0.7", "wandb_name": "case-73-seed-92-s-0.7-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 92, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
|
benchmark_cases_metadata.csv
CHANGED
@@ -27,6 +27,7 @@ ioi,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi,Indirect O
|
|
27 |
30,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/30,Tags numeric tokens in a sequence based on whether they fall within a given range.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
28 |
90,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/90,Replaces a specific token with another one.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/edges.pkl,2,4,10,1,custom,4,16,gelu,12,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1460593486680443,True,False,standard,False,9,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
29 |
39,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/39,Returns the fraction of 'x' in the input up to the i-th position for all i.,60,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/edges.pkl,2,120,60,30,custom,4,480,gelu,28,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.08432740427115679,True,False,standard,False,1,False,345600,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
30 |
75,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/75,Double each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
31 |
101,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/101,Check if each element is a square of an integer.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
32 |
ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi_next_token,"Indirect Object Identification (IOI) task, trained using next token prediction.",16,16,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/edges.pkl,6,64,1024,16,gpt2,4,3072,gelu_new,50257,1e-05,False,True,False,False,False,False,GPT2LMHeadModel,False,gpt2,gpt2,LNPre,1,causal,False,,0.02886751345948129,True,False,standard,False,50257,False,2457600,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.001,False,1.0,1.0,0.4,,,,True,True,1.0,,,True,,256.0,True,True,"val/accuracy,val/IIA",,,True,0.65,False,0.0,True,max,,True,
|
@@ -34,14 +35,17 @@ ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi
|
|
34 |
14,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/14,Returns the count of 'a' in the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/edges.pkl,2,8,10,2,custom,4,32,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.15689290811054724,True,False,standard,False,10,False,1536,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
35 |
95,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/95,Counts the distinct prime factors of each number in the input list.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12060453783110546,True,False,standard,False,3,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
36 |
84,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/84,Apply the arctangent function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
37 |
93,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/93,Swaps the nth with the n+1th element if n%2==1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/edges.pkl,3,20,10,5,custom,4,80,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10886621079036347,True,False,standard,False,11,False,14400,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
38 |
37,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/37,Reverses each word in the sequence except for specified exclusions.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/edges.pkl,2,12,10,3,custom,4,48,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,8,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
39 |
34,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/34,Calculate the ratio of vowels to consonants in each word.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/edges.pkl,2,16,10,4,custom,4,64,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16329931618554522,True,False,standard,False,5,False,6144,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
40 |
26,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/26,Creates a cascading effect by repeating each token in sequence incrementally.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/edges.pkl,2,21,10,5,custom,4,84,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12344267996967354,True,False,standard,False,27,False,10416,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
|
|
41 |
19,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/19,Removes consecutive duplicate tokens from a sequence.,15,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/edges.pkl,2,32,15,8,custom,4,128,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.15689290811054724,True,False,standard,False,3,False,24576,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.001,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,,True,,,True,True,,,,True,,True,,True,,,True,
|
42 |
53,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/53,Increment elements at odd indices by 1,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13151918984428584,True,False,standard,False,12,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
43 |
40,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/40,Sum the last and previous to last digits of a number,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/edges.pkl,2,4,10,1,custom,4,16,gelu,31,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.09847319278346618,True,False,standard,False,12,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
44 |
51,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/51,Checks if each element is a Fibonacci number,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/edges.pkl,2,4,10,1,custom,4,16,gelu,102,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.07525766947068778,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
45 |
122,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/122,Check if each number is divisible by 3.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
46 |
85,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/85,Square each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
47 |
2,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/2,Reverse the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/edges.pkl,4,56,10,14,custom,4,224,gelu,28,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.07593263966019993,True,False,standard,False,26,False,150528,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
@@ -51,6 +55,7 @@ ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi
|
|
51 |
20,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/20,Detect spam messages based on appearance of spam keywords.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/edges.pkl,2,13,10,3,custom,4,52,gelu,14,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16,True,False,standard,False,2,False,3952,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
52 |
25,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/25,Normalizes token frequencies in a sequence to a range between 0 and 1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/edges.pkl,2,62,10,15,custom,4,248,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.08295613557843402,True,False,standard,False,56,False,91264,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
53 |
11,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/11,Counts the number of words in a sequence based on their length.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/edges.pkl,2,12,10,3,custom,4,48,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1460593486680443,True,False,standard,False,5,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,500.0,,gelu,True,True,1.0,,,True,,,True,True,,,,True,,True,,True,,,True,
|
|
|
54 |
54,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/54,Applies the hyperbolic tangent to each element.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
55 |
124,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/124,Check if all elements in a list are equal.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.11547005383792516,True,False,standard,False,2,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
56 |
102,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/102,"Reflects each element within a range (default is [2, 7]).",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/edges.pkl,2,4,10,1,custom,4,16,gelu,42,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1059625885652035,True,False,standard,False,6,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
@@ -60,15 +65,20 @@ ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi
|
|
60 |
86,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/86,"Check if each element is a power of 2. Return 1 if true, otherwise 0.",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16329931618554522,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
61 |
105,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/105,Replaces each number with the next prime after that number.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.11202240672224079,True,False,standard,False,10,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
62 |
58,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/58,Mirrors the first half of the sequence to the second half.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/edges.pkl,3,32,10,8,custom,4,128,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10415112878465911,True,False,standard,False,11,False,36864,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
63 |
70,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/70,Apply the cosine function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
64 |
62,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/62,Replaces each element with its factorial.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1414213562373095,True,False,standard,False,10,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
65 |
111,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/111,Returns the last element of the sequence and pads the rest with zeros.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.09847319278346618,True,False,standard,False,11,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
66 |
35,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/35,Alternates capitalization of each character in words.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/edges.pkl,2,9,10,2,custom,4,36,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,8,False,1872,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
67 |
3,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/3,Returns the fraction of 'x' in the input up to the i-th position for all i.,5,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/edges.pkl,2,12,5,3,custom,4,48,gelu,6,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.22188007849009167,True,False,standard,False,1,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,10.0,2000.0,,gelu,True,True,0.1,,strict,False,,,True,True,,,,True,,True,,True,,,True,
|
68 |
36,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/36,"Classifies each token as 'positive', 'negative', or 'neutral' based on emojis.",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl,2,6,10,1,custom,4,24,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.19402850002906638,True,False,standard,False,3,False,768,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
|
|
69 |
64,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/64,Cubes each element in the sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
70 |
8,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/8,Identity,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
71 |
103,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/103,Swap consecutive numbers in a list,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10787197799411874,True,False,standard,False,11,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
72 |
56,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/56,Sets every third element to zero.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13333333333333333,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
73 |
97,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/97,Scale a sequence by its maximum element.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/edges.pkl,3,200,10,50,custom,4,800,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.05405899027195888,True,False,standard,False,64,False,1440000,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
74 |
46,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/46,Decrements each element in the sequence by 1,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
27 |
30,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/30,Tags numeric tokens in a sequence based on whether they fall within a given range.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
28 |
90,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/90,Replaces a specific token with another one.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/edges.pkl,2,4,10,1,custom,4,16,gelu,12,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1460593486680443,True,False,standard,False,9,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
29 |
39,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/39,Returns the fraction of 'x' in the input up to the i-th position for all i.,60,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/edges.pkl,2,120,60,30,custom,4,480,gelu,28,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.08432740427115679,True,False,standard,False,1,False,345600,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
30 |
+
130,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/130,"Clips each element to be within a range (make the default range [2, 7]).",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/edges.pkl,3,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.10079052613579392,True,False,standard,False,6,False,576,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
31 |
75,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/75,Double each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
32 |
101,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/101,Check if each element is a square of an integer.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
33 |
ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi_next_token,"Indirect Object Identification (IOI) task, trained using next token prediction.",16,16,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/edges.pkl,6,64,1024,16,gpt2,4,3072,gelu_new,50257,1e-05,False,True,False,False,False,False,GPT2LMHeadModel,False,gpt2,gpt2,LNPre,1,causal,False,,0.02886751345948129,True,False,standard,False,50257,False,2457600,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.001,False,1.0,1.0,0.4,,,,True,True,1.0,,,True,,256.0,True,True,"val/accuracy,val/IIA",,,True,0.65,False,0.0,True,max,,True,
|
|
|
35 |
14,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/14,Returns the count of 'a' in the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/edges.pkl,2,8,10,2,custom,4,32,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.15689290811054724,True,False,standard,False,10,False,1536,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
36 |
95,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/95,Counts the distinct prime factors of each number in the input list.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12060453783110546,True,False,standard,False,3,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
37 |
84,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/84,Apply the arctangent function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
38 |
+
66,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/66,Round each element in the input sequence to the nearest integer.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/edges.pkl,2,4,10,1,custom,4,16,gelu,22,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13151918984428584,True,False,standard,False,6,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,92.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
39 |
93,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/93,Swaps the nth with the n+1th element if n%2==1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/edges.pkl,3,20,10,5,custom,4,80,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10886621079036347,True,False,standard,False,11,False,14400,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
40 |
37,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/37,Reverses each word in the sequence except for specified exclusions.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/edges.pkl,2,12,10,3,custom,4,48,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,8,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
41 |
34,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/34,Calculate the ratio of vowels to consonants in each word.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/edges.pkl,2,16,10,4,custom,4,64,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16329931618554522,True,False,standard,False,5,False,6144,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
42 |
26,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/26,Creates a cascading effect by repeating each token in sequence incrementally.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/edges.pkl,2,21,10,5,custom,4,84,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12344267996967354,True,False,standard,False,27,False,10416,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
43 |
+
15,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/15,Returns each token multiplied by two and subtracted by its index.,5,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/edges.pkl,3,4,5,1,custom,4,16,gelu,7,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.06553855364152325,True,False,standard,False,12,False,576,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
44 |
19,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/19,Removes consecutive duplicate tokens from a sequence.,15,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/edges.pkl,2,32,15,8,custom,4,128,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.15689290811054724,True,False,standard,False,3,False,24576,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.001,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,,True,,,True,True,,,,True,,True,,True,,,True,
|
45 |
53,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/53,Increment elements at odd indices by 1,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13151918984428584,True,False,standard,False,12,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
46 |
40,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/40,Sum the last and previous to last digits of a number,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/edges.pkl,2,4,10,1,custom,4,16,gelu,31,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.09847319278346618,True,False,standard,False,12,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
47 |
51,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/51,Checks if each element is a Fibonacci number,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/edges.pkl,2,4,10,1,custom,4,16,gelu,102,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.07525766947068778,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
48 |
+
43,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/43,Returns the corresponding Fibonacci number for each element in the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/edges.pkl,2,4,10,1,custom,4,16,gelu,22,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1131370849898476,True,False,standard,False,19,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
49 |
122,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/122,Check if each number is divisible by 3.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
50 |
85,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/85,Square each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
51 |
2,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/2,Reverse the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/edges.pkl,4,56,10,14,custom,4,224,gelu,28,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.07593263966019993,True,False,standard,False,26,False,150528,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
55 |
20,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/20,Detect spam messages based on appearance of spam keywords.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/edges.pkl,2,13,10,3,custom,4,52,gelu,14,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16,True,False,standard,False,2,False,3952,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
56 |
25,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/25,Normalizes token frequencies in a sequence to a range between 0 and 1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/edges.pkl,2,62,10,15,custom,4,248,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.08295613557843402,True,False,standard,False,56,False,91264,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
57 |
11,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/11,Counts the number of words in a sequence based on their length.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/edges.pkl,2,12,10,3,custom,4,48,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1460593486680443,True,False,standard,False,5,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,500.0,,gelu,True,True,1.0,,,True,,,True,True,,,,True,,True,,True,,,True,
|
58 |
+
41,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/41,Make each element of the input sequence absolute,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/edges.pkl,2,4,10,1,custom,4,16,gelu,22,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12344267996967354,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
59 |
54,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/54,Applies the hyperbolic tangent to each element.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
60 |
124,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/124,Check if all elements in a list are equal.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.11547005383792516,True,False,standard,False,2,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
61 |
102,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/102,"Reflects each element within a range (default is [2, 7]).",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/edges.pkl,2,4,10,1,custom,4,16,gelu,42,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1059625885652035,True,False,standard,False,6,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
|
|
65 |
86,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/86,"Check if each element is a power of 2. Return 1 if true, otherwise 0.",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16329931618554522,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
66 |
105,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/105,Replaces each number with the next prime after that number.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.11202240672224079,True,False,standard,False,10,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
67 |
58,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/58,Mirrors the first half of the sequence to the second half.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/edges.pkl,3,32,10,8,custom,4,128,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10415112878465911,True,False,standard,False,11,False,36864,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
68 |
+
68,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/68,Increment each element until it becomes a multiple of 3,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,5,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
69 |
70,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/70,Apply the cosine function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
70 |
62,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/62,Replaces each element with its factorial.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1414213562373095,True,False,standard,False,10,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
71 |
111,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/111,Returns the last element of the sequence and pads the rest with zeros.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.09847319278346618,True,False,standard,False,11,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
72 |
+
121,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/121,Compute arcsine of all elements in the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/edges.pkl,2,4,10,1,custom,4,16,gelu,22,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.11202240672224079,True,False,standard,False,20,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
73 |
35,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/35,Alternates capitalization of each character in words.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/edges.pkl,2,9,10,2,custom,4,36,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,8,False,1872,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
74 |
3,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/3,Returns the fraction of 'x' in the input up to the i-th position for all i.,5,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/edges.pkl,2,12,5,3,custom,4,48,gelu,6,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.22188007849009167,True,False,standard,False,1,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,10.0,2000.0,,gelu,True,True,0.1,,strict,False,,,True,True,,,,True,,True,,True,,,True,
|
75 |
36,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/36,"Classifies each token as 'positive', 'negative', or 'neutral' based on emojis.",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl,2,6,10,1,custom,4,24,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.19402850002906638,True,False,standard,False,3,False,768,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
|
76 |
+
106,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/106,Sets all elements to zero except for the element at index 1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13719886811400708,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,92.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
77 |
64,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/64,Cubes each element in the sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
78 |
8,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/8,Identity,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
79 |
+
73,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/73,Apply the sine function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,92.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
80 |
103,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/103,Swap consecutive numbers in a list,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10787197799411874,True,False,standard,False,11,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
81 |
56,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/56,Sets every third element to zero.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13333333333333333,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
82 |
97,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/97,Scale a sequence by its maximum element.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/edges.pkl,3,200,10,50,custom,4,800,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.05405899027195888,True,False,standard,False,64,False,1440000,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
83 |
+
49,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/49,Decrements each element in the sequence until it becomes a multiple of 3.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.15689290811054724,True,False,standard,False,4,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,92.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
84 |
46,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/46,Decrements each element in the sequence by 1,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
|
benchmark_cases_metadata.parquet
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:049d63f22c918edb98d89c9eb69f091016c4780b033e5559523abd7e50188238
|
3 |
+
size 76100
|
benchmark_metadata.json
CHANGED
@@ -3352,6 +3352,150 @@
|
|
3352 |
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model.pth",
|
3353 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/edges.pkl"
|
3354 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
3355 |
{
|
3356 |
"case_id": "75",
|
3357 |
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/75",
|
@@ -4233,6 +4377,140 @@
|
|
4233 |
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model.pth",
|
4234 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/edges.pkl"
|
4235 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
4236 |
{
|
4237 |
"case_id": "93",
|
4238 |
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/93",
|
@@ -4663,40 +4941,159 @@
|
|
4663 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/edges.pkl"
|
4664 |
},
|
4665 |
{
|
4666 |
-
"case_id": "
|
4667 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/
|
4668 |
-
"task_description": "
|
4669 |
"vocab": [
|
4670 |
-
|
4671 |
-
|
4672 |
-
|
|
|
|
|
4673 |
],
|
4674 |
-
"max_seq_len":
|
4675 |
"min_seq_len": 4,
|
4676 |
"files": [
|
4677 |
{
|
4678 |
"file_name": "edges.pkl",
|
4679 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
4680 |
},
|
4681 |
{
|
4682 |
"file_name": "ll_model.pth",
|
4683 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
4684 |
},
|
4685 |
{
|
4686 |
"file_name": "ll_model_cfg.pkl",
|
4687 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
4688 |
},
|
4689 |
{
|
4690 |
"file_name": "meta.json",
|
4691 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
4692 |
}
|
4693 |
],
|
4694 |
"transformer_cfg": {
|
4695 |
-
"n_layers":
|
4696 |
-
"d_model":
|
4697 |
-
"n_ctx":
|
4698 |
-
"d_head":
|
4699 |
-
"model_name": "custom",
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
4700 |
"n_heads": 4,
|
4701 |
"d_mlp": 128,
|
4702 |
"act_fn": "gelu",
|
@@ -5241,6 +5638,140 @@
|
|
5241 |
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model.pth",
|
5242 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/edges.pkl"
|
5243 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
5244 |
{
|
5245 |
"case_id": "122",
|
5246 |
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/122",
|
@@ -6371,10 +6902,20 @@
|
|
6371 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/edges.pkl"
|
6372 |
},
|
6373 |
{
|
6374 |
-
"case_id": "
|
6375 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/
|
6376 |
-
"task_description": "
|
6377 |
"vocab": [
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6378 |
0,
|
6379 |
1,
|
6380 |
2,
|
@@ -6384,19 +6925,143 @@
|
|
6384 |
6,
|
6385 |
7,
|
6386 |
8,
|
6387 |
-
9
|
6388 |
-
10
|
6389 |
],
|
6390 |
"max_seq_len": 10,
|
6391 |
"min_seq_len": 4,
|
6392 |
"files": [
|
6393 |
{
|
6394 |
"file_name": "edges.pkl",
|
6395 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
6396 |
},
|
6397 |
{
|
6398 |
"file_name": "ll_model.pth",
|
6399 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
6400 |
},
|
6401 |
{
|
6402 |
"file_name": "ll_model_cfg.pkl",
|
@@ -7572,9 +8237,9 @@
|
|
7572 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/edges.pkl"
|
7573 |
},
|
7574 |
{
|
7575 |
-
"case_id": "
|
7576 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/
|
7577 |
-
"task_description": "
|
7578 |
"vocab": [
|
7579 |
0,
|
7580 |
1,
|
@@ -7593,19 +8258,19 @@
|
|
7593 |
"files": [
|
7594 |
{
|
7595 |
"file_name": "edges.pkl",
|
7596 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7597 |
},
|
7598 |
{
|
7599 |
"file_name": "ll_model.pth",
|
7600 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7601 |
},
|
7602 |
{
|
7603 |
"file_name": "ll_model_cfg.pkl",
|
7604 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7605 |
},
|
7606 |
{
|
7607 |
"file_name": "meta.json",
|
7608 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7609 |
}
|
7610 |
],
|
7611 |
"transformer_cfg": {
|
@@ -7639,12 +8304,12 @@
|
|
7639 |
"attention_dir": "causal",
|
7640 |
"attn_only": false,
|
7641 |
"seed": 0,
|
7642 |
-
"initializer_range": 0.
|
7643 |
"init_weights": true,
|
7644 |
"scale_attn_by_inverse_layer_idx": false,
|
7645 |
"positional_embedding_type": "standard",
|
7646 |
"final_rms": false,
|
7647 |
-
"d_vocab_out":
|
7648 |
"parallel_attn_mlp": false,
|
7649 |
"rotary_dim": null,
|
7650 |
"n_params": 384,
|
@@ -7662,7 +8327,7 @@
|
|
7662 |
"num_experts": null,
|
7663 |
"experts_per_token": null
|
7664 |
},
|
7665 |
-
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7666 |
"training_args": {
|
7667 |
"output_dir": "/circuits-benchmark/results",
|
7668 |
"atol": 0.05,
|
@@ -7670,7 +8335,7 @@
|
|
7670 |
"use_single_loss": true,
|
7671 |
"iit_weight": 1.0,
|
7672 |
"behavior_weight": 0.4,
|
7673 |
-
"strict_weight": 0
|
7674 |
"epochs": 1000,
|
7675 |
"early_stop_accuracy_threshold": 99.9,
|
7676 |
"act_fn": "gelu",
|
@@ -7692,14 +8357,14 @@
|
|
7692 |
"siit_sampling": "sample_all",
|
7693 |
"val_iia_sampling": "all"
|
7694 |
},
|
7695 |
-
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7696 |
-
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7697 |
-
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7698 |
},
|
7699 |
{
|
7700 |
-
"case_id": "
|
7701 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/
|
7702 |
-
"task_description": "
|
7703 |
"vocab": [
|
7704 |
0,
|
7705 |
1,
|
@@ -7718,19 +8383,19 @@
|
|
7718 |
"files": [
|
7719 |
{
|
7720 |
"file_name": "edges.pkl",
|
7721 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7722 |
},
|
7723 |
{
|
7724 |
"file_name": "ll_model.pth",
|
7725 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7726 |
},
|
7727 |
{
|
7728 |
"file_name": "ll_model_cfg.pkl",
|
7729 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7730 |
},
|
7731 |
{
|
7732 |
"file_name": "meta.json",
|
7733 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7734 |
}
|
7735 |
],
|
7736 |
"transformer_cfg": {
|
@@ -7764,12 +8429,12 @@
|
|
7764 |
"attention_dir": "causal",
|
7765 |
"attn_only": false,
|
7766 |
"seed": 0,
|
7767 |
-
"initializer_range": 0.
|
7768 |
"init_weights": true,
|
7769 |
"scale_attn_by_inverse_layer_idx": false,
|
7770 |
"positional_embedding_type": "standard",
|
7771 |
"final_rms": false,
|
7772 |
-
"d_vocab_out":
|
7773 |
"parallel_attn_mlp": false,
|
7774 |
"rotary_dim": null,
|
7775 |
"n_params": 384,
|
@@ -7787,7 +8452,7 @@
|
|
7787 |
"num_experts": null,
|
7788 |
"experts_per_token": null
|
7789 |
},
|
7790 |
-
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7791 |
"training_args": {
|
7792 |
"output_dir": "/circuits-benchmark/results",
|
7793 |
"atol": 0.05,
|
@@ -7817,14 +8482,14 @@
|
|
7817 |
"siit_sampling": "sample_all",
|
7818 |
"val_iia_sampling": "all"
|
7819 |
},
|
7820 |
-
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7821 |
-
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7822 |
-
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7823 |
},
|
7824 |
{
|
7825 |
-
"case_id": "
|
7826 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/
|
7827 |
-
"task_description": "
|
7828 |
"vocab": [
|
7829 |
0,
|
7830 |
1,
|
@@ -7843,29 +8508,29 @@
|
|
7843 |
"files": [
|
7844 |
{
|
7845 |
"file_name": "edges.pkl",
|
7846 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7847 |
},
|
7848 |
{
|
7849 |
"file_name": "ll_model.pth",
|
7850 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7851 |
},
|
7852 |
{
|
7853 |
"file_name": "ll_model_cfg.pkl",
|
7854 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7855 |
},
|
7856 |
{
|
7857 |
"file_name": "meta.json",
|
7858 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7859 |
}
|
7860 |
],
|
7861 |
"transformer_cfg": {
|
7862 |
-
"n_layers":
|
7863 |
-
"d_model":
|
7864 |
"n_ctx": 10,
|
7865 |
-
"d_head":
|
7866 |
"model_name": "custom",
|
7867 |
"n_heads": 4,
|
7868 |
-
"d_mlp":
|
7869 |
"act_fn": "gelu",
|
7870 |
"d_vocab": 13,
|
7871 |
"eps": 1e-05,
|
@@ -7886,18 +8551,18 @@
|
|
7886 |
"init_mode": "gpt2",
|
7887 |
"normalization_type": null,
|
7888 |
"n_devices": 1,
|
7889 |
-
"attention_dir": "
|
7890 |
"attn_only": false,
|
7891 |
"seed": 0,
|
7892 |
-
"initializer_range": 0.
|
7893 |
"init_weights": true,
|
7894 |
"scale_attn_by_inverse_layer_idx": false,
|
7895 |
"positional_embedding_type": "standard",
|
7896 |
"final_rms": false,
|
7897 |
-
"d_vocab_out":
|
7898 |
"parallel_attn_mlp": false,
|
7899 |
"rotary_dim": null,
|
7900 |
-
"n_params":
|
7901 |
"use_hook_tokens": false,
|
7902 |
"gated_mlp": false,
|
7903 |
"default_prepend_bos": true,
|
@@ -7912,7 +8577,7 @@
|
|
7912 |
"num_experts": null,
|
7913 |
"experts_per_token": null
|
7914 |
},
|
7915 |
-
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7916 |
"training_args": {
|
7917 |
"output_dir": "/circuits-benchmark/results",
|
7918 |
"atol": 0.05,
|
@@ -7920,7 +8585,7 @@
|
|
7920 |
"use_single_loss": true,
|
7921 |
"iit_weight": 1.0,
|
7922 |
"behavior_weight": 0.4,
|
7923 |
-
"strict_weight": 0.
|
7924 |
"epochs": 1000,
|
7925 |
"early_stop_accuracy_threshold": 99.9,
|
7926 |
"act_fn": "gelu",
|
@@ -7942,54 +8607,57 @@
|
|
7942 |
"siit_sampling": "sample_all",
|
7943 |
"val_iia_sampling": "all"
|
7944 |
},
|
7945 |
-
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7946 |
-
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7947 |
-
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7948 |
},
|
7949 |
{
|
7950 |
-
"case_id": "
|
7951 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/
|
7952 |
-
"task_description": "
|
7953 |
"vocab": [
|
7954 |
-
|
7955 |
-
|
7956 |
-
|
7957 |
-
|
7958 |
-
|
7959 |
-
|
7960 |
-
|
7961 |
-
|
|
|
|
|
|
|
7962 |
],
|
7963 |
"max_seq_len": 10,
|
7964 |
"min_seq_len": 4,
|
7965 |
"files": [
|
7966 |
{
|
7967 |
"file_name": "edges.pkl",
|
7968 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7969 |
},
|
7970 |
{
|
7971 |
"file_name": "ll_model.pth",
|
7972 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7973 |
},
|
7974 |
{
|
7975 |
"file_name": "ll_model_cfg.pkl",
|
7976 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7977 |
},
|
7978 |
{
|
7979 |
"file_name": "meta.json",
|
7980 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
7981 |
}
|
7982 |
],
|
7983 |
"transformer_cfg": {
|
7984 |
-
"n_layers":
|
7985 |
-
"d_model":
|
7986 |
"n_ctx": 10,
|
7987 |
-
"d_head":
|
7988 |
"model_name": "custom",
|
7989 |
"n_heads": 4,
|
7990 |
-
"d_mlp":
|
7991 |
"act_fn": "gelu",
|
7992 |
-
"d_vocab":
|
7993 |
"eps": 1e-05,
|
7994 |
"use_attn_result": true,
|
7995 |
"use_attn_scale": true,
|
@@ -8008,18 +8676,18 @@
|
|
8008 |
"init_mode": "gpt2",
|
8009 |
"normalization_type": null,
|
8010 |
"n_devices": 1,
|
8011 |
-
"attention_dir": "
|
8012 |
"attn_only": false,
|
8013 |
"seed": 0,
|
8014 |
-
"initializer_range": 0.
|
8015 |
"init_weights": true,
|
8016 |
"scale_attn_by_inverse_layer_idx": false,
|
8017 |
"positional_embedding_type": "standard",
|
8018 |
"final_rms": false,
|
8019 |
-
"d_vocab_out":
|
8020 |
"parallel_attn_mlp": false,
|
8021 |
"rotary_dim": null,
|
8022 |
-
"n_params":
|
8023 |
"use_hook_tokens": false,
|
8024 |
"gated_mlp": false,
|
8025 |
"default_prepend_bos": true,
|
@@ -8029,9 +8697,265 @@
|
|
8029 |
"post_embedding_ln": false,
|
8030 |
"rotary_base": 10000,
|
8031 |
"trust_remote_code": false,
|
8032 |
-
"rotary_adjacent_pairs": false
|
8033 |
-
|
8034 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
8035 |
"training_args": {
|
8036 |
"atol": 0.05,
|
8037 |
"lr": 0.01,
|
@@ -8136,58 +9060,289 @@
|
|
8136 |
"lr": 0.01,
|
8137 |
"use_single_loss": false,
|
8138 |
"iit_weight": 1.0,
|
8139 |
-
"behavior_weight": 1.0,
|
8140 |
-
"strict_weight": 10.0,
|
8141 |
-
"epochs": 2000,
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
8142 |
"act_fn": "gelu",
|
|
|
|
|
8143 |
"clip_grad_norm": 0.1,
|
8144 |
-
"lr_scheduler": "",
|
8145 |
"model_pair": "strict",
|
8146 |
-
"same_size": false
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
8147 |
},
|
8148 |
-
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8149 |
-
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8150 |
-
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8151 |
},
|
8152 |
{
|
8153 |
-
"case_id": "
|
8154 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/
|
8155 |
-
"task_description": "
|
8156 |
"vocab": [
|
8157 |
-
|
8158 |
-
|
8159 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
8160 |
],
|
8161 |
"max_seq_len": 10,
|
8162 |
"min_seq_len": 4,
|
8163 |
"files": [
|
8164 |
{
|
8165 |
"file_name": "edges.pkl",
|
8166 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8167 |
},
|
8168 |
{
|
8169 |
"file_name": "ll_model.pth",
|
8170 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8171 |
},
|
8172 |
{
|
8173 |
"file_name": "ll_model_cfg.pkl",
|
8174 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8175 |
},
|
8176 |
{
|
8177 |
"file_name": "meta.json",
|
8178 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8179 |
}
|
8180 |
],
|
8181 |
"transformer_cfg": {
|
8182 |
"n_layers": 2,
|
8183 |
-
"d_model":
|
8184 |
"n_ctx": 10,
|
8185 |
"d_head": 1,
|
8186 |
"model_name": "custom",
|
8187 |
"n_heads": 4,
|
8188 |
-
"d_mlp":
|
8189 |
"act_fn": "gelu",
|
8190 |
-
"d_vocab":
|
8191 |
"eps": 1e-05,
|
8192 |
"use_attn_result": true,
|
8193 |
"use_attn_scale": true,
|
@@ -8209,15 +9364,15 @@
|
|
8209 |
"attention_dir": "causal",
|
8210 |
"attn_only": false,
|
8211 |
"seed": 0,
|
8212 |
-
"initializer_range": 0.
|
8213 |
"init_weights": true,
|
8214 |
"scale_attn_by_inverse_layer_idx": false,
|
8215 |
"positional_embedding_type": "standard",
|
8216 |
"final_rms": false,
|
8217 |
-
"d_vocab_out":
|
8218 |
"parallel_attn_mlp": false,
|
8219 |
"rotary_dim": null,
|
8220 |
-
"n_params":
|
8221 |
"use_hook_tokens": false,
|
8222 |
"gated_mlp": false,
|
8223 |
"default_prepend_bos": true,
|
@@ -8227,30 +9382,49 @@
|
|
8227 |
"post_embedding_ln": false,
|
8228 |
"rotary_base": 10000,
|
8229 |
"trust_remote_code": false,
|
8230 |
-
"rotary_adjacent_pairs": false
|
|
|
|
|
|
|
8231 |
},
|
8232 |
-
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8233 |
"training_args": {
|
|
|
8234 |
"atol": 0.05,
|
8235 |
-
"lr": 0.
|
8236 |
-
"use_single_loss":
|
8237 |
"iit_weight": 1.0,
|
8238 |
-
"behavior_weight":
|
8239 |
-
"strict_weight":
|
8240 |
-
"epochs":
|
|
|
8241 |
"act_fn": "gelu",
|
|
|
|
|
8242 |
"clip_grad_norm": 0.1,
|
8243 |
-
"lr_scheduler": "",
|
8244 |
-
"model_pair": "strict"
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
8245 |
},
|
8246 |
-
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8247 |
-
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8248 |
-
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8249 |
},
|
8250 |
{
|
8251 |
-
"case_id": "
|
8252 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/
|
8253 |
-
"task_description": "
|
8254 |
"vocab": [
|
8255 |
0,
|
8256 |
1,
|
@@ -8269,19 +9443,19 @@
|
|
8269 |
"files": [
|
8270 |
{
|
8271 |
"file_name": "edges.pkl",
|
8272 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8273 |
},
|
8274 |
{
|
8275 |
"file_name": "ll_model.pth",
|
8276 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8277 |
},
|
8278 |
{
|
8279 |
"file_name": "ll_model_cfg.pkl",
|
8280 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8281 |
},
|
8282 |
{
|
8283 |
"file_name": "meta.json",
|
8284 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8285 |
}
|
8286 |
],
|
8287 |
"transformer_cfg": {
|
@@ -8338,7 +9512,7 @@
|
|
8338 |
"num_experts": null,
|
8339 |
"experts_per_token": null
|
8340 |
},
|
8341 |
-
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8342 |
"training_args": {
|
8343 |
"output_dir": "/circuits-benchmark/results",
|
8344 |
"atol": 0.05,
|
@@ -8368,14 +9542,14 @@
|
|
8368 |
"siit_sampling": "sample_all",
|
8369 |
"val_iia_sampling": "all"
|
8370 |
},
|
8371 |
-
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8372 |
-
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8373 |
-
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8374 |
},
|
8375 |
{
|
8376 |
-
"case_id": "
|
8377 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/
|
8378 |
-
"task_description": "
|
8379 |
"vocab": [
|
8380 |
0,
|
8381 |
1,
|
@@ -8394,19 +9568,19 @@
|
|
8394 |
"files": [
|
8395 |
{
|
8396 |
"file_name": "edges.pkl",
|
8397 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8398 |
},
|
8399 |
{
|
8400 |
"file_name": "ll_model.pth",
|
8401 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8402 |
},
|
8403 |
{
|
8404 |
"file_name": "ll_model_cfg.pkl",
|
8405 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8406 |
},
|
8407 |
{
|
8408 |
"file_name": "meta.json",
|
8409 |
-
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8410 |
}
|
8411 |
],
|
8412 |
"transformer_cfg": {
|
@@ -8463,7 +9637,7 @@
|
|
8463 |
"num_experts": null,
|
8464 |
"experts_per_token": null
|
8465 |
},
|
8466 |
-
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8467 |
"training_args": {
|
8468 |
"output_dir": "/circuits-benchmark/results",
|
8469 |
"atol": 0.05,
|
@@ -8481,7 +9655,7 @@
|
|
8481 |
"lr_scheduler": "linear",
|
8482 |
"model_pair": "strict",
|
8483 |
"same_size": false,
|
8484 |
-
"seed":
|
8485 |
"batch_size": 256,
|
8486 |
"include_mlp": false,
|
8487 |
"detach_while_caching": true,
|
@@ -8493,9 +9667,9 @@
|
|
8493 |
"siit_sampling": "sample_all",
|
8494 |
"val_iia_sampling": "all"
|
8495 |
},
|
8496 |
-
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8497 |
-
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8498 |
-
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/
|
8499 |
},
|
8500 |
{
|
8501 |
"case_id": "103",
|
@@ -8872,6 +10046,131 @@
|
|
8872 |
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model.pth",
|
8873 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/edges.pkl"
|
8874 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
8875 |
{
|
8876 |
"case_id": "46",
|
8877 |
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/46",
|
|
|
3352 |
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model.pth",
|
3353 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/edges.pkl"
|
3354 |
},
|
3355 |
+
{
|
3356 |
+
"case_id": "130",
|
3357 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/130",
|
3358 |
+
"task_description": "Clips each element to be within a range (make the default range [2, 7]).",
|
3359 |
+
"vocab": [
|
3360 |
+
-15,
|
3361 |
+
-14,
|
3362 |
+
-13,
|
3363 |
+
-12,
|
3364 |
+
-11,
|
3365 |
+
-10,
|
3366 |
+
-9,
|
3367 |
+
-8,
|
3368 |
+
-7,
|
3369 |
+
-6,
|
3370 |
+
-5,
|
3371 |
+
-4,
|
3372 |
+
-3,
|
3373 |
+
-2,
|
3374 |
+
-1,
|
3375 |
+
0,
|
3376 |
+
1,
|
3377 |
+
2,
|
3378 |
+
3,
|
3379 |
+
4,
|
3380 |
+
5,
|
3381 |
+
6,
|
3382 |
+
7,
|
3383 |
+
8,
|
3384 |
+
9,
|
3385 |
+
10,
|
3386 |
+
11,
|
3387 |
+
12,
|
3388 |
+
13,
|
3389 |
+
14
|
3390 |
+
],
|
3391 |
+
"max_seq_len": 10,
|
3392 |
+
"min_seq_len": 4,
|
3393 |
+
"files": [
|
3394 |
+
{
|
3395 |
+
"file_name": "edges.pkl",
|
3396 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/edges.pkl"
|
3397 |
+
},
|
3398 |
+
{
|
3399 |
+
"file_name": "ll_model.pth",
|
3400 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model.pth"
|
3401 |
+
},
|
3402 |
+
{
|
3403 |
+
"file_name": "ll_model_cfg.pkl",
|
3404 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model_cfg.pkl"
|
3405 |
+
},
|
3406 |
+
{
|
3407 |
+
"file_name": "meta.json",
|
3408 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/meta.json"
|
3409 |
+
}
|
3410 |
+
],
|
3411 |
+
"transformer_cfg": {
|
3412 |
+
"n_layers": 3,
|
3413 |
+
"d_model": 4,
|
3414 |
+
"n_ctx": 10,
|
3415 |
+
"d_head": 1,
|
3416 |
+
"model_name": "custom",
|
3417 |
+
"n_heads": 4,
|
3418 |
+
"d_mlp": 16,
|
3419 |
+
"act_fn": "gelu",
|
3420 |
+
"d_vocab": 32,
|
3421 |
+
"eps": 1e-05,
|
3422 |
+
"use_attn_result": true,
|
3423 |
+
"use_attn_scale": true,
|
3424 |
+
"use_split_qkv_input": true,
|
3425 |
+
"use_hook_mlp_in": true,
|
3426 |
+
"use_attn_in": false,
|
3427 |
+
"use_local_attn": false,
|
3428 |
+
"original_architecture": null,
|
3429 |
+
"from_checkpoint": false,
|
3430 |
+
"checkpoint_index": null,
|
3431 |
+
"checkpoint_label_type": null,
|
3432 |
+
"checkpoint_value": null,
|
3433 |
+
"tokenizer_name": null,
|
3434 |
+
"window_size": null,
|
3435 |
+
"attn_types": null,
|
3436 |
+
"init_mode": "gpt2",
|
3437 |
+
"normalization_type": null,
|
3438 |
+
"n_devices": 1,
|
3439 |
+
"attention_dir": "causal",
|
3440 |
+
"attn_only": false,
|
3441 |
+
"seed": 0,
|
3442 |
+
"initializer_range": 0.10079052613579392,
|
3443 |
+
"init_weights": true,
|
3444 |
+
"scale_attn_by_inverse_layer_idx": false,
|
3445 |
+
"positional_embedding_type": "standard",
|
3446 |
+
"final_rms": false,
|
3447 |
+
"d_vocab_out": 6,
|
3448 |
+
"parallel_attn_mlp": false,
|
3449 |
+
"rotary_dim": null,
|
3450 |
+
"n_params": 576,
|
3451 |
+
"use_hook_tokens": false,
|
3452 |
+
"gated_mlp": false,
|
3453 |
+
"default_prepend_bos": true,
|
3454 |
+
"dtype": "torch.float32",
|
3455 |
+
"tokenizer_prepends_bos": null,
|
3456 |
+
"n_key_value_heads": null,
|
3457 |
+
"post_embedding_ln": false,
|
3458 |
+
"rotary_base": 10000,
|
3459 |
+
"trust_remote_code": false,
|
3460 |
+
"rotary_adjacent_pairs": false,
|
3461 |
+
"load_in_4bit": false,
|
3462 |
+
"num_experts": null,
|
3463 |
+
"experts_per_token": null
|
3464 |
+
},
|
3465 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model_cfg.pkl",
|
3466 |
+
"training_args": {
|
3467 |
+
"output_dir": "/circuits-benchmark/results",
|
3468 |
+
"atol": 0.05,
|
3469 |
+
"lr": 0.001,
|
3470 |
+
"use_single_loss": true,
|
3471 |
+
"iit_weight": 1.0,
|
3472 |
+
"behavior_weight": 0.4,
|
3473 |
+
"strict_weight": 1.0,
|
3474 |
+
"epochs": 1000,
|
3475 |
+
"early_stop_accuracy_threshold": 99.9,
|
3476 |
+
"act_fn": "gelu",
|
3477 |
+
"use_wandb": true,
|
3478 |
+
"save_model_to_wandb": true,
|
3479 |
+
"clip_grad_norm": 0.1,
|
3480 |
+
"lr_scheduler": "linear",
|
3481 |
+
"model_pair": "strict",
|
3482 |
+
"same_size": false,
|
3483 |
+
"seed": 67,
|
3484 |
+
"batch_size": 256,
|
3485 |
+
"include_mlp": false,
|
3486 |
+
"detach_while_caching": true,
|
3487 |
+
"scheduler_val_metric": [
|
3488 |
+
"val/accuracy",
|
3489 |
+
"val/IIA",
|
3490 |
+
"val/strict_accuracy"
|
3491 |
+
],
|
3492 |
+
"siit_sampling": "sample_all",
|
3493 |
+
"val_iia_sampling": "all"
|
3494 |
+
},
|
3495 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/meta.json",
|
3496 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model.pth",
|
3497 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/edges.pkl"
|
3498 |
+
},
|
3499 |
{
|
3500 |
"case_id": "75",
|
3501 |
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/75",
|
|
|
4377 |
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model.pth",
|
4378 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/edges.pkl"
|
4379 |
},
|
4380 |
+
{
|
4381 |
+
"case_id": "66",
|
4382 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/66",
|
4383 |
+
"task_description": "Round each element in the input sequence to the nearest integer.",
|
4384 |
+
"vocab": [
|
4385 |
+
0.0,
|
4386 |
+
0.25,
|
4387 |
+
0.5,
|
4388 |
+
0.75,
|
4389 |
+
1.0,
|
4390 |
+
1.25,
|
4391 |
+
1.5,
|
4392 |
+
1.75,
|
4393 |
+
2.0,
|
4394 |
+
2.25,
|
4395 |
+
2.5,
|
4396 |
+
2.75,
|
4397 |
+
3.0,
|
4398 |
+
3.25,
|
4399 |
+
3.5,
|
4400 |
+
3.75,
|
4401 |
+
4.0,
|
4402 |
+
4.25,
|
4403 |
+
4.5,
|
4404 |
+
4.75
|
4405 |
+
],
|
4406 |
+
"max_seq_len": 10,
|
4407 |
+
"min_seq_len": 4,
|
4408 |
+
"files": [
|
4409 |
+
{
|
4410 |
+
"file_name": "edges.pkl",
|
4411 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/edges.pkl"
|
4412 |
+
},
|
4413 |
+
{
|
4414 |
+
"file_name": "ll_model.pth",
|
4415 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model.pth"
|
4416 |
+
},
|
4417 |
+
{
|
4418 |
+
"file_name": "ll_model_cfg.pkl",
|
4419 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model_cfg.pkl"
|
4420 |
+
},
|
4421 |
+
{
|
4422 |
+
"file_name": "meta.json",
|
4423 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/meta.json"
|
4424 |
+
}
|
4425 |
+
],
|
4426 |
+
"transformer_cfg": {
|
4427 |
+
"n_layers": 2,
|
4428 |
+
"d_model": 4,
|
4429 |
+
"n_ctx": 10,
|
4430 |
+
"d_head": 1,
|
4431 |
+
"model_name": "custom",
|
4432 |
+
"n_heads": 4,
|
4433 |
+
"d_mlp": 16,
|
4434 |
+
"act_fn": "gelu",
|
4435 |
+
"d_vocab": 22,
|
4436 |
+
"eps": 1e-05,
|
4437 |
+
"use_attn_result": true,
|
4438 |
+
"use_attn_scale": true,
|
4439 |
+
"use_split_qkv_input": true,
|
4440 |
+
"use_hook_mlp_in": true,
|
4441 |
+
"use_attn_in": false,
|
4442 |
+
"use_local_attn": false,
|
4443 |
+
"original_architecture": null,
|
4444 |
+
"from_checkpoint": false,
|
4445 |
+
"checkpoint_index": null,
|
4446 |
+
"checkpoint_label_type": null,
|
4447 |
+
"checkpoint_value": null,
|
4448 |
+
"tokenizer_name": null,
|
4449 |
+
"window_size": null,
|
4450 |
+
"attn_types": null,
|
4451 |
+
"init_mode": "gpt2",
|
4452 |
+
"normalization_type": null,
|
4453 |
+
"n_devices": 1,
|
4454 |
+
"attention_dir": "causal",
|
4455 |
+
"attn_only": false,
|
4456 |
+
"seed": 0,
|
4457 |
+
"initializer_range": 0.13151918984428584,
|
4458 |
+
"init_weights": true,
|
4459 |
+
"scale_attn_by_inverse_layer_idx": false,
|
4460 |
+
"positional_embedding_type": "standard",
|
4461 |
+
"final_rms": false,
|
4462 |
+
"d_vocab_out": 6,
|
4463 |
+
"parallel_attn_mlp": false,
|
4464 |
+
"rotary_dim": null,
|
4465 |
+
"n_params": 384,
|
4466 |
+
"use_hook_tokens": false,
|
4467 |
+
"gated_mlp": false,
|
4468 |
+
"default_prepend_bos": true,
|
4469 |
+
"dtype": "torch.float32",
|
4470 |
+
"tokenizer_prepends_bos": null,
|
4471 |
+
"n_key_value_heads": null,
|
4472 |
+
"post_embedding_ln": false,
|
4473 |
+
"rotary_base": 10000,
|
4474 |
+
"trust_remote_code": false,
|
4475 |
+
"rotary_adjacent_pairs": false,
|
4476 |
+
"load_in_4bit": false,
|
4477 |
+
"num_experts": null,
|
4478 |
+
"experts_per_token": null
|
4479 |
+
},
|
4480 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model_cfg.pkl",
|
4481 |
+
"training_args": {
|
4482 |
+
"output_dir": "/circuits-benchmark/results",
|
4483 |
+
"atol": 0.05,
|
4484 |
+
"lr": 0.001,
|
4485 |
+
"use_single_loss": true,
|
4486 |
+
"iit_weight": 1.0,
|
4487 |
+
"behavior_weight": 0.4,
|
4488 |
+
"strict_weight": 0.7,
|
4489 |
+
"epochs": 1000,
|
4490 |
+
"early_stop_accuracy_threshold": 99.9,
|
4491 |
+
"act_fn": "gelu",
|
4492 |
+
"use_wandb": true,
|
4493 |
+
"save_model_to_wandb": true,
|
4494 |
+
"clip_grad_norm": 0.1,
|
4495 |
+
"lr_scheduler": "linear",
|
4496 |
+
"model_pair": "strict",
|
4497 |
+
"same_size": false,
|
4498 |
+
"seed": 92,
|
4499 |
+
"batch_size": 256,
|
4500 |
+
"include_mlp": false,
|
4501 |
+
"detach_while_caching": true,
|
4502 |
+
"scheduler_val_metric": [
|
4503 |
+
"val/accuracy",
|
4504 |
+
"val/IIA",
|
4505 |
+
"val/strict_accuracy"
|
4506 |
+
],
|
4507 |
+
"siit_sampling": "sample_all",
|
4508 |
+
"val_iia_sampling": "all"
|
4509 |
+
},
|
4510 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/meta.json",
|
4511 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model.pth",
|
4512 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/edges.pkl"
|
4513 |
+
},
|
4514 |
{
|
4515 |
"case_id": "93",
|
4516 |
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/93",
|
|
|
4941 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/edges.pkl"
|
4942 |
},
|
4943 |
{
|
4944 |
+
"case_id": "15",
|
4945 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/15",
|
4946 |
+
"task_description": "Returns each token multiplied by two and subtracted by its index.",
|
4947 |
"vocab": [
|
4948 |
+
0,
|
4949 |
+
1,
|
4950 |
+
2,
|
4951 |
+
3,
|
4952 |
+
4
|
4953 |
],
|
4954 |
+
"max_seq_len": 5,
|
4955 |
"min_seq_len": 4,
|
4956 |
"files": [
|
4957 |
{
|
4958 |
"file_name": "edges.pkl",
|
4959 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/edges.pkl"
|
4960 |
},
|
4961 |
{
|
4962 |
"file_name": "ll_model.pth",
|
4963 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model.pth"
|
4964 |
},
|
4965 |
{
|
4966 |
"file_name": "ll_model_cfg.pkl",
|
4967 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model_cfg.pkl"
|
4968 |
},
|
4969 |
{
|
4970 |
"file_name": "meta.json",
|
4971 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/meta.json"
|
4972 |
}
|
4973 |
],
|
4974 |
"transformer_cfg": {
|
4975 |
+
"n_layers": 3,
|
4976 |
+
"d_model": 4,
|
4977 |
+
"n_ctx": 5,
|
4978 |
+
"d_head": 1,
|
4979 |
+
"model_name": "custom",
|
4980 |
+
"n_heads": 4,
|
4981 |
+
"d_mlp": 16,
|
4982 |
+
"act_fn": "gelu",
|
4983 |
+
"d_vocab": 7,
|
4984 |
+
"eps": 1e-05,
|
4985 |
+
"use_attn_result": true,
|
4986 |
+
"use_attn_scale": true,
|
4987 |
+
"use_split_qkv_input": true,
|
4988 |
+
"use_hook_mlp_in": true,
|
4989 |
+
"use_attn_in": false,
|
4990 |
+
"use_local_attn": false,
|
4991 |
+
"original_architecture": null,
|
4992 |
+
"from_checkpoint": false,
|
4993 |
+
"checkpoint_index": null,
|
4994 |
+
"checkpoint_label_type": null,
|
4995 |
+
"checkpoint_value": null,
|
4996 |
+
"tokenizer_name": null,
|
4997 |
+
"window_size": null,
|
4998 |
+
"attn_types": null,
|
4999 |
+
"init_mode": "gpt2",
|
5000 |
+
"normalization_type": null,
|
5001 |
+
"n_devices": 1,
|
5002 |
+
"attention_dir": "causal",
|
5003 |
+
"attn_only": false,
|
5004 |
+
"seed": 0,
|
5005 |
+
"initializer_range": 0.06553855364152325,
|
5006 |
+
"init_weights": true,
|
5007 |
+
"scale_attn_by_inverse_layer_idx": false,
|
5008 |
+
"positional_embedding_type": "standard",
|
5009 |
+
"final_rms": false,
|
5010 |
+
"d_vocab_out": 12,
|
5011 |
+
"parallel_attn_mlp": false,
|
5012 |
+
"rotary_dim": null,
|
5013 |
+
"n_params": 576,
|
5014 |
+
"use_hook_tokens": false,
|
5015 |
+
"gated_mlp": false,
|
5016 |
+
"default_prepend_bos": true,
|
5017 |
+
"dtype": "torch.float32",
|
5018 |
+
"tokenizer_prepends_bos": null,
|
5019 |
+
"n_key_value_heads": null,
|
5020 |
+
"post_embedding_ln": false,
|
5021 |
+
"rotary_base": 10000,
|
5022 |
+
"trust_remote_code": false,
|
5023 |
+
"rotary_adjacent_pairs": false,
|
5024 |
+
"load_in_4bit": false,
|
5025 |
+
"num_experts": null,
|
5026 |
+
"experts_per_token": null
|
5027 |
+
},
|
5028 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model_cfg.pkl",
|
5029 |
+
"training_args": {
|
5030 |
+
"output_dir": "/circuits-benchmark/results",
|
5031 |
+
"atol": 0.05,
|
5032 |
+
"lr": 0.001,
|
5033 |
+
"use_single_loss": true,
|
5034 |
+
"iit_weight": 1.0,
|
5035 |
+
"behavior_weight": 0.4,
|
5036 |
+
"strict_weight": 1.0,
|
5037 |
+
"epochs": 1000,
|
5038 |
+
"early_stop_accuracy_threshold": 99.9,
|
5039 |
+
"act_fn": "gelu",
|
5040 |
+
"use_wandb": true,
|
5041 |
+
"save_model_to_wandb": true,
|
5042 |
+
"clip_grad_norm": 0.1,
|
5043 |
+
"lr_scheduler": "linear",
|
5044 |
+
"model_pair": "strict",
|
5045 |
+
"same_size": false,
|
5046 |
+
"seed": 67,
|
5047 |
+
"batch_size": 256,
|
5048 |
+
"include_mlp": false,
|
5049 |
+
"detach_while_caching": true,
|
5050 |
+
"scheduler_val_metric": [
|
5051 |
+
"val/accuracy",
|
5052 |
+
"val/IIA",
|
5053 |
+
"val/strict_accuracy"
|
5054 |
+
],
|
5055 |
+
"siit_sampling": "sample_all",
|
5056 |
+
"val_iia_sampling": "all"
|
5057 |
+
},
|
5058 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/meta.json",
|
5059 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model.pth",
|
5060 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/edges.pkl"
|
5061 |
+
},
|
5062 |
+
{
|
5063 |
+
"case_id": "19",
|
5064 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/19",
|
5065 |
+
"task_description": "Removes consecutive duplicate tokens from a sequence.",
|
5066 |
+
"vocab": [
|
5067 |
+
"a",
|
5068 |
+
"b",
|
5069 |
+
"c"
|
5070 |
+
],
|
5071 |
+
"max_seq_len": 15,
|
5072 |
+
"min_seq_len": 4,
|
5073 |
+
"files": [
|
5074 |
+
{
|
5075 |
+
"file_name": "edges.pkl",
|
5076 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/edges.pkl"
|
5077 |
+
},
|
5078 |
+
{
|
5079 |
+
"file_name": "ll_model.pth",
|
5080 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model.pth"
|
5081 |
+
},
|
5082 |
+
{
|
5083 |
+
"file_name": "ll_model_cfg.pkl",
|
5084 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model_cfg.pkl"
|
5085 |
+
},
|
5086 |
+
{
|
5087 |
+
"file_name": "meta.json",
|
5088 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/meta.json"
|
5089 |
+
}
|
5090 |
+
],
|
5091 |
+
"transformer_cfg": {
|
5092 |
+
"n_layers": 2,
|
5093 |
+
"d_model": 32,
|
5094 |
+
"n_ctx": 15,
|
5095 |
+
"d_head": 8,
|
5096 |
+
"model_name": "custom",
|
5097 |
"n_heads": 4,
|
5098 |
"d_mlp": 128,
|
5099 |
"act_fn": "gelu",
|
|
|
5638 |
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model.pth",
|
5639 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/edges.pkl"
|
5640 |
},
|
5641 |
+
{
|
5642 |
+
"case_id": "43",
|
5643 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/43",
|
5644 |
+
"task_description": "Returns the corresponding Fibonacci number for each element in the input sequence.",
|
5645 |
+
"vocab": [
|
5646 |
+
0,
|
5647 |
+
1,
|
5648 |
+
2,
|
5649 |
+
3,
|
5650 |
+
4,
|
5651 |
+
5,
|
5652 |
+
6,
|
5653 |
+
7,
|
5654 |
+
8,
|
5655 |
+
9,
|
5656 |
+
10,
|
5657 |
+
11,
|
5658 |
+
12,
|
5659 |
+
13,
|
5660 |
+
14,
|
5661 |
+
15,
|
5662 |
+
16,
|
5663 |
+
17,
|
5664 |
+
18,
|
5665 |
+
19
|
5666 |
+
],
|
5667 |
+
"max_seq_len": 10,
|
5668 |
+
"min_seq_len": 4,
|
5669 |
+
"files": [
|
5670 |
+
{
|
5671 |
+
"file_name": "edges.pkl",
|
5672 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/edges.pkl"
|
5673 |
+
},
|
5674 |
+
{
|
5675 |
+
"file_name": "ll_model.pth",
|
5676 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model.pth"
|
5677 |
+
},
|
5678 |
+
{
|
5679 |
+
"file_name": "ll_model_cfg.pkl",
|
5680 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model_cfg.pkl"
|
5681 |
+
},
|
5682 |
+
{
|
5683 |
+
"file_name": "meta.json",
|
5684 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/meta.json"
|
5685 |
+
}
|
5686 |
+
],
|
5687 |
+
"transformer_cfg": {
|
5688 |
+
"n_layers": 2,
|
5689 |
+
"d_model": 4,
|
5690 |
+
"n_ctx": 10,
|
5691 |
+
"d_head": 1,
|
5692 |
+
"model_name": "custom",
|
5693 |
+
"n_heads": 4,
|
5694 |
+
"d_mlp": 16,
|
5695 |
+
"act_fn": "gelu",
|
5696 |
+
"d_vocab": 22,
|
5697 |
+
"eps": 1e-05,
|
5698 |
+
"use_attn_result": true,
|
5699 |
+
"use_attn_scale": true,
|
5700 |
+
"use_split_qkv_input": true,
|
5701 |
+
"use_hook_mlp_in": true,
|
5702 |
+
"use_attn_in": false,
|
5703 |
+
"use_local_attn": false,
|
5704 |
+
"original_architecture": null,
|
5705 |
+
"from_checkpoint": false,
|
5706 |
+
"checkpoint_index": null,
|
5707 |
+
"checkpoint_label_type": null,
|
5708 |
+
"checkpoint_value": null,
|
5709 |
+
"tokenizer_name": null,
|
5710 |
+
"window_size": null,
|
5711 |
+
"attn_types": null,
|
5712 |
+
"init_mode": "gpt2",
|
5713 |
+
"normalization_type": null,
|
5714 |
+
"n_devices": 1,
|
5715 |
+
"attention_dir": "causal",
|
5716 |
+
"attn_only": false,
|
5717 |
+
"seed": 0,
|
5718 |
+
"initializer_range": 0.1131370849898476,
|
5719 |
+
"init_weights": true,
|
5720 |
+
"scale_attn_by_inverse_layer_idx": false,
|
5721 |
+
"positional_embedding_type": "standard",
|
5722 |
+
"final_rms": false,
|
5723 |
+
"d_vocab_out": 19,
|
5724 |
+
"parallel_attn_mlp": false,
|
5725 |
+
"rotary_dim": null,
|
5726 |
+
"n_params": 384,
|
5727 |
+
"use_hook_tokens": false,
|
5728 |
+
"gated_mlp": false,
|
5729 |
+
"default_prepend_bos": true,
|
5730 |
+
"dtype": "torch.float32",
|
5731 |
+
"tokenizer_prepends_bos": null,
|
5732 |
+
"n_key_value_heads": null,
|
5733 |
+
"post_embedding_ln": false,
|
5734 |
+
"rotary_base": 10000,
|
5735 |
+
"trust_remote_code": false,
|
5736 |
+
"rotary_adjacent_pairs": false,
|
5737 |
+
"load_in_4bit": false,
|
5738 |
+
"num_experts": null,
|
5739 |
+
"experts_per_token": null
|
5740 |
+
},
|
5741 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model_cfg.pkl",
|
5742 |
+
"training_args": {
|
5743 |
+
"output_dir": "/circuits-benchmark/results",
|
5744 |
+
"atol": 0.05,
|
5745 |
+
"lr": 0.001,
|
5746 |
+
"use_single_loss": true,
|
5747 |
+
"iit_weight": 1.0,
|
5748 |
+
"behavior_weight": 0.4,
|
5749 |
+
"strict_weight": 1.0,
|
5750 |
+
"epochs": 1000,
|
5751 |
+
"early_stop_accuracy_threshold": 99.9,
|
5752 |
+
"act_fn": "gelu",
|
5753 |
+
"use_wandb": true,
|
5754 |
+
"save_model_to_wandb": true,
|
5755 |
+
"clip_grad_norm": 0.1,
|
5756 |
+
"lr_scheduler": "linear",
|
5757 |
+
"model_pair": "strict",
|
5758 |
+
"same_size": false,
|
5759 |
+
"seed": 67,
|
5760 |
+
"batch_size": 256,
|
5761 |
+
"include_mlp": false,
|
5762 |
+
"detach_while_caching": true,
|
5763 |
+
"scheduler_val_metric": [
|
5764 |
+
"val/accuracy",
|
5765 |
+
"val/IIA",
|
5766 |
+
"val/strict_accuracy"
|
5767 |
+
],
|
5768 |
+
"siit_sampling": "sample_all",
|
5769 |
+
"val_iia_sampling": "all"
|
5770 |
+
},
|
5771 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/meta.json",
|
5772 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model.pth",
|
5773 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/edges.pkl"
|
5774 |
+
},
|
5775 |
{
|
5776 |
"case_id": "122",
|
5777 |
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/122",
|
|
|
6902 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/edges.pkl"
|
6903 |
},
|
6904 |
{
|
6905 |
+
"case_id": "41",
|
6906 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/41",
|
6907 |
+
"task_description": "Make each element of the input sequence absolute",
|
6908 |
"vocab": [
|
6909 |
+
-10,
|
6910 |
+
-9,
|
6911 |
+
-8,
|
6912 |
+
-7,
|
6913 |
+
-6,
|
6914 |
+
-5,
|
6915 |
+
-4,
|
6916 |
+
-3,
|
6917 |
+
-2,
|
6918 |
+
-1,
|
6919 |
0,
|
6920 |
1,
|
6921 |
2,
|
|
|
6925 |
6,
|
6926 |
7,
|
6927 |
8,
|
6928 |
+
9
|
|
|
6929 |
],
|
6930 |
"max_seq_len": 10,
|
6931 |
"min_seq_len": 4,
|
6932 |
"files": [
|
6933 |
{
|
6934 |
"file_name": "edges.pkl",
|
6935 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/edges.pkl"
|
6936 |
},
|
6937 |
{
|
6938 |
"file_name": "ll_model.pth",
|
6939 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model.pth"
|
6940 |
+
},
|
6941 |
+
{
|
6942 |
+
"file_name": "ll_model_cfg.pkl",
|
6943 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model_cfg.pkl"
|
6944 |
+
},
|
6945 |
+
{
|
6946 |
+
"file_name": "meta.json",
|
6947 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/meta.json"
|
6948 |
+
}
|
6949 |
+
],
|
6950 |
+
"transformer_cfg": {
|
6951 |
+
"n_layers": 2,
|
6952 |
+
"d_model": 4,
|
6953 |
+
"n_ctx": 10,
|
6954 |
+
"d_head": 1,
|
6955 |
+
"model_name": "custom",
|
6956 |
+
"n_heads": 4,
|
6957 |
+
"d_mlp": 16,
|
6958 |
+
"act_fn": "gelu",
|
6959 |
+
"d_vocab": 22,
|
6960 |
+
"eps": 1e-05,
|
6961 |
+
"use_attn_result": true,
|
6962 |
+
"use_attn_scale": true,
|
6963 |
+
"use_split_qkv_input": true,
|
6964 |
+
"use_hook_mlp_in": true,
|
6965 |
+
"use_attn_in": false,
|
6966 |
+
"use_local_attn": false,
|
6967 |
+
"original_architecture": null,
|
6968 |
+
"from_checkpoint": false,
|
6969 |
+
"checkpoint_index": null,
|
6970 |
+
"checkpoint_label_type": null,
|
6971 |
+
"checkpoint_value": null,
|
6972 |
+
"tokenizer_name": null,
|
6973 |
+
"window_size": null,
|
6974 |
+
"attn_types": null,
|
6975 |
+
"init_mode": "gpt2",
|
6976 |
+
"normalization_type": null,
|
6977 |
+
"n_devices": 1,
|
6978 |
+
"attention_dir": "causal",
|
6979 |
+
"attn_only": false,
|
6980 |
+
"seed": 0,
|
6981 |
+
"initializer_range": 0.12344267996967354,
|
6982 |
+
"init_weights": true,
|
6983 |
+
"scale_attn_by_inverse_layer_idx": false,
|
6984 |
+
"positional_embedding_type": "standard",
|
6985 |
+
"final_rms": false,
|
6986 |
+
"d_vocab_out": 11,
|
6987 |
+
"parallel_attn_mlp": false,
|
6988 |
+
"rotary_dim": null,
|
6989 |
+
"n_params": 384,
|
6990 |
+
"use_hook_tokens": false,
|
6991 |
+
"gated_mlp": false,
|
6992 |
+
"default_prepend_bos": true,
|
6993 |
+
"dtype": "torch.float32",
|
6994 |
+
"tokenizer_prepends_bos": null,
|
6995 |
+
"n_key_value_heads": null,
|
6996 |
+
"post_embedding_ln": false,
|
6997 |
+
"rotary_base": 10000,
|
6998 |
+
"trust_remote_code": false,
|
6999 |
+
"rotary_adjacent_pairs": false,
|
7000 |
+
"load_in_4bit": false,
|
7001 |
+
"num_experts": null,
|
7002 |
+
"experts_per_token": null
|
7003 |
+
},
|
7004 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model_cfg.pkl",
|
7005 |
+
"training_args": {
|
7006 |
+
"output_dir": "/circuits-benchmark/results",
|
7007 |
+
"atol": 0.05,
|
7008 |
+
"lr": 0.001,
|
7009 |
+
"use_single_loss": true,
|
7010 |
+
"iit_weight": 1.0,
|
7011 |
+
"behavior_weight": 0.4,
|
7012 |
+
"strict_weight": 1.0,
|
7013 |
+
"epochs": 1000,
|
7014 |
+
"early_stop_accuracy_threshold": 99.9,
|
7015 |
+
"act_fn": "gelu",
|
7016 |
+
"use_wandb": true,
|
7017 |
+
"save_model_to_wandb": true,
|
7018 |
+
"clip_grad_norm": 0.1,
|
7019 |
+
"lr_scheduler": "linear",
|
7020 |
+
"model_pair": "strict",
|
7021 |
+
"same_size": false,
|
7022 |
+
"seed": 67,
|
7023 |
+
"batch_size": 256,
|
7024 |
+
"include_mlp": false,
|
7025 |
+
"detach_while_caching": true,
|
7026 |
+
"scheduler_val_metric": [
|
7027 |
+
"val/accuracy",
|
7028 |
+
"val/IIA",
|
7029 |
+
"val/strict_accuracy"
|
7030 |
+
],
|
7031 |
+
"siit_sampling": "sample_all",
|
7032 |
+
"val_iia_sampling": "all"
|
7033 |
+
},
|
7034 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/meta.json",
|
7035 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model.pth",
|
7036 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/edges.pkl"
|
7037 |
+
},
|
7038 |
+
{
|
7039 |
+
"case_id": "54",
|
7040 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/54",
|
7041 |
+
"task_description": "Applies the hyperbolic tangent to each element.",
|
7042 |
+
"vocab": [
|
7043 |
+
0,
|
7044 |
+
1,
|
7045 |
+
2,
|
7046 |
+
3,
|
7047 |
+
4,
|
7048 |
+
5,
|
7049 |
+
6,
|
7050 |
+
7,
|
7051 |
+
8,
|
7052 |
+
9,
|
7053 |
+
10
|
7054 |
+
],
|
7055 |
+
"max_seq_len": 10,
|
7056 |
+
"min_seq_len": 4,
|
7057 |
+
"files": [
|
7058 |
+
{
|
7059 |
+
"file_name": "edges.pkl",
|
7060 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/edges.pkl"
|
7061 |
+
},
|
7062 |
+
{
|
7063 |
+
"file_name": "ll_model.pth",
|
7064 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model.pth"
|
7065 |
},
|
7066 |
{
|
7067 |
"file_name": "ll_model_cfg.pkl",
|
|
|
8237 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/edges.pkl"
|
8238 |
},
|
8239 |
{
|
8240 |
+
"case_id": "68",
|
8241 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/68",
|
8242 |
+
"task_description": "Increment each element until it becomes a multiple of 3",
|
8243 |
"vocab": [
|
8244 |
0,
|
8245 |
1,
|
|
|
8258 |
"files": [
|
8259 |
{
|
8260 |
"file_name": "edges.pkl",
|
8261 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/edges.pkl"
|
8262 |
},
|
8263 |
{
|
8264 |
"file_name": "ll_model.pth",
|
8265 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model.pth"
|
8266 |
},
|
8267 |
{
|
8268 |
"file_name": "ll_model_cfg.pkl",
|
8269 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model_cfg.pkl"
|
8270 |
},
|
8271 |
{
|
8272 |
"file_name": "meta.json",
|
8273 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/meta.json"
|
8274 |
}
|
8275 |
],
|
8276 |
"transformer_cfg": {
|
|
|
8304 |
"attention_dir": "causal",
|
8305 |
"attn_only": false,
|
8306 |
"seed": 0,
|
8307 |
+
"initializer_range": 0.1539600717839002,
|
8308 |
"init_weights": true,
|
8309 |
"scale_attn_by_inverse_layer_idx": false,
|
8310 |
"positional_embedding_type": "standard",
|
8311 |
"final_rms": false,
|
8312 |
+
"d_vocab_out": 5,
|
8313 |
"parallel_attn_mlp": false,
|
8314 |
"rotary_dim": null,
|
8315 |
"n_params": 384,
|
|
|
8327 |
"num_experts": null,
|
8328 |
"experts_per_token": null
|
8329 |
},
|
8330 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model_cfg.pkl",
|
8331 |
"training_args": {
|
8332 |
"output_dir": "/circuits-benchmark/results",
|
8333 |
"atol": 0.05,
|
|
|
8335 |
"use_single_loss": true,
|
8336 |
"iit_weight": 1.0,
|
8337 |
"behavior_weight": 0.4,
|
8338 |
+
"strict_weight": 1.0,
|
8339 |
"epochs": 1000,
|
8340 |
"early_stop_accuracy_threshold": 99.9,
|
8341 |
"act_fn": "gelu",
|
|
|
8357 |
"siit_sampling": "sample_all",
|
8358 |
"val_iia_sampling": "all"
|
8359 |
},
|
8360 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/meta.json",
|
8361 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model.pth",
|
8362 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/edges.pkl"
|
8363 |
},
|
8364 |
{
|
8365 |
+
"case_id": "70",
|
8366 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/70",
|
8367 |
+
"task_description": "Apply the cosine function to each element of the input sequence.",
|
8368 |
"vocab": [
|
8369 |
0,
|
8370 |
1,
|
|
|
8383 |
"files": [
|
8384 |
{
|
8385 |
"file_name": "edges.pkl",
|
8386 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl"
|
8387 |
},
|
8388 |
{
|
8389 |
"file_name": "ll_model.pth",
|
8390 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth"
|
8391 |
},
|
8392 |
{
|
8393 |
"file_name": "ll_model_cfg.pkl",
|
8394 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl"
|
8395 |
},
|
8396 |
{
|
8397 |
"file_name": "meta.json",
|
8398 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json"
|
8399 |
}
|
8400 |
],
|
8401 |
"transformer_cfg": {
|
|
|
8429 |
"attention_dir": "causal",
|
8430 |
"attn_only": false,
|
8431 |
"seed": 0,
|
8432 |
+
"initializer_range": 0.1392621247645583,
|
8433 |
"init_weights": true,
|
8434 |
"scale_attn_by_inverse_layer_idx": false,
|
8435 |
"positional_embedding_type": "standard",
|
8436 |
"final_rms": false,
|
8437 |
+
"d_vocab_out": 11,
|
8438 |
"parallel_attn_mlp": false,
|
8439 |
"rotary_dim": null,
|
8440 |
"n_params": 384,
|
|
|
8452 |
"num_experts": null,
|
8453 |
"experts_per_token": null
|
8454 |
},
|
8455 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl",
|
8456 |
"training_args": {
|
8457 |
"output_dir": "/circuits-benchmark/results",
|
8458 |
"atol": 0.05,
|
|
|
8482 |
"siit_sampling": "sample_all",
|
8483 |
"val_iia_sampling": "all"
|
8484 |
},
|
8485 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json",
|
8486 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth",
|
8487 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl"
|
8488 |
},
|
8489 |
{
|
8490 |
+
"case_id": "62",
|
8491 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/62",
|
8492 |
+
"task_description": "Replaces each element with its factorial.",
|
8493 |
"vocab": [
|
8494 |
0,
|
8495 |
1,
|
|
|
8508 |
"files": [
|
8509 |
{
|
8510 |
"file_name": "edges.pkl",
|
8511 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl"
|
8512 |
},
|
8513 |
{
|
8514 |
"file_name": "ll_model.pth",
|
8515 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth"
|
8516 |
},
|
8517 |
{
|
8518 |
"file_name": "ll_model_cfg.pkl",
|
8519 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl"
|
8520 |
},
|
8521 |
{
|
8522 |
"file_name": "meta.json",
|
8523 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json"
|
8524 |
}
|
8525 |
],
|
8526 |
"transformer_cfg": {
|
8527 |
+
"n_layers": 2,
|
8528 |
+
"d_model": 4,
|
8529 |
"n_ctx": 10,
|
8530 |
+
"d_head": 1,
|
8531 |
"model_name": "custom",
|
8532 |
"n_heads": 4,
|
8533 |
+
"d_mlp": 16,
|
8534 |
"act_fn": "gelu",
|
8535 |
"d_vocab": 13,
|
8536 |
"eps": 1e-05,
|
|
|
8551 |
"init_mode": "gpt2",
|
8552 |
"normalization_type": null,
|
8553 |
"n_devices": 1,
|
8554 |
+
"attention_dir": "causal",
|
8555 |
"attn_only": false,
|
8556 |
"seed": 0,
|
8557 |
+
"initializer_range": 0.1414213562373095,
|
8558 |
"init_weights": true,
|
8559 |
"scale_attn_by_inverse_layer_idx": false,
|
8560 |
"positional_embedding_type": "standard",
|
8561 |
"final_rms": false,
|
8562 |
+
"d_vocab_out": 10,
|
8563 |
"parallel_attn_mlp": false,
|
8564 |
"rotary_dim": null,
|
8565 |
+
"n_params": 384,
|
8566 |
"use_hook_tokens": false,
|
8567 |
"gated_mlp": false,
|
8568 |
"default_prepend_bos": true,
|
|
|
8577 |
"num_experts": null,
|
8578 |
"experts_per_token": null
|
8579 |
},
|
8580 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl",
|
8581 |
"training_args": {
|
8582 |
"output_dir": "/circuits-benchmark/results",
|
8583 |
"atol": 0.05,
|
|
|
8585 |
"use_single_loss": true,
|
8586 |
"iit_weight": 1.0,
|
8587 |
"behavior_weight": 0.4,
|
8588 |
+
"strict_weight": 0.7,
|
8589 |
"epochs": 1000,
|
8590 |
"early_stop_accuracy_threshold": 99.9,
|
8591 |
"act_fn": "gelu",
|
|
|
8607 |
"siit_sampling": "sample_all",
|
8608 |
"val_iia_sampling": "all"
|
8609 |
},
|
8610 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json",
|
8611 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth",
|
8612 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl"
|
8613 |
},
|
8614 |
{
|
8615 |
+
"case_id": "111",
|
8616 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/111",
|
8617 |
+
"task_description": "Returns the last element of the sequence and pads the rest with zeros.",
|
8618 |
"vocab": [
|
8619 |
+
0,
|
8620 |
+
1,
|
8621 |
+
2,
|
8622 |
+
3,
|
8623 |
+
4,
|
8624 |
+
5,
|
8625 |
+
6,
|
8626 |
+
7,
|
8627 |
+
8,
|
8628 |
+
9,
|
8629 |
+
10
|
8630 |
],
|
8631 |
"max_seq_len": 10,
|
8632 |
"min_seq_len": 4,
|
8633 |
"files": [
|
8634 |
{
|
8635 |
"file_name": "edges.pkl",
|
8636 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl"
|
8637 |
},
|
8638 |
{
|
8639 |
"file_name": "ll_model.pth",
|
8640 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth"
|
8641 |
},
|
8642 |
{
|
8643 |
"file_name": "ll_model_cfg.pkl",
|
8644 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl"
|
8645 |
},
|
8646 |
{
|
8647 |
"file_name": "meta.json",
|
8648 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json"
|
8649 |
}
|
8650 |
],
|
8651 |
"transformer_cfg": {
|
8652 |
+
"n_layers": 3,
|
8653 |
+
"d_model": 24,
|
8654 |
"n_ctx": 10,
|
8655 |
+
"d_head": 6,
|
8656 |
"model_name": "custom",
|
8657 |
"n_heads": 4,
|
8658 |
+
"d_mlp": 96,
|
8659 |
"act_fn": "gelu",
|
8660 |
+
"d_vocab": 13,
|
8661 |
"eps": 1e-05,
|
8662 |
"use_attn_result": true,
|
8663 |
"use_attn_scale": true,
|
|
|
8676 |
"init_mode": "gpt2",
|
8677 |
"normalization_type": null,
|
8678 |
"n_devices": 1,
|
8679 |
+
"attention_dir": "bidirectional",
|
8680 |
"attn_only": false,
|
8681 |
"seed": 0,
|
8682 |
+
"initializer_range": 0.09847319278346618,
|
8683 |
"init_weights": true,
|
8684 |
"scale_attn_by_inverse_layer_idx": false,
|
8685 |
"positional_embedding_type": "standard",
|
8686 |
"final_rms": false,
|
8687 |
+
"d_vocab_out": 11,
|
8688 |
"parallel_attn_mlp": false,
|
8689 |
"rotary_dim": null,
|
8690 |
+
"n_params": 20736,
|
8691 |
"use_hook_tokens": false,
|
8692 |
"gated_mlp": false,
|
8693 |
"default_prepend_bos": true,
|
|
|
8697 |
"post_embedding_ln": false,
|
8698 |
"rotary_base": 10000,
|
8699 |
"trust_remote_code": false,
|
8700 |
+
"rotary_adjacent_pairs": false,
|
8701 |
+
"load_in_4bit": false,
|
8702 |
+
"num_experts": null,
|
8703 |
+
"experts_per_token": null
|
8704 |
+
},
|
8705 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl",
|
8706 |
+
"training_args": {
|
8707 |
+
"output_dir": "/circuits-benchmark/results",
|
8708 |
+
"atol": 0.05,
|
8709 |
+
"lr": 0.001,
|
8710 |
+
"use_single_loss": true,
|
8711 |
+
"iit_weight": 1.0,
|
8712 |
+
"behavior_weight": 0.4,
|
8713 |
+
"strict_weight": 0.4,
|
8714 |
+
"epochs": 1000,
|
8715 |
+
"early_stop_accuracy_threshold": 99.9,
|
8716 |
+
"act_fn": "gelu",
|
8717 |
+
"use_wandb": true,
|
8718 |
+
"save_model_to_wandb": true,
|
8719 |
+
"clip_grad_norm": 0.1,
|
8720 |
+
"lr_scheduler": "linear",
|
8721 |
+
"model_pair": "strict",
|
8722 |
+
"same_size": false,
|
8723 |
+
"seed": 67,
|
8724 |
+
"batch_size": 256,
|
8725 |
+
"include_mlp": false,
|
8726 |
+
"detach_while_caching": true,
|
8727 |
+
"scheduler_val_metric": [
|
8728 |
+
"val/accuracy",
|
8729 |
+
"val/IIA",
|
8730 |
+
"val/strict_accuracy"
|
8731 |
+
],
|
8732 |
+
"siit_sampling": "sample_all",
|
8733 |
+
"val_iia_sampling": "all"
|
8734 |
+
},
|
8735 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json",
|
8736 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth",
|
8737 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl"
|
8738 |
+
},
|
8739 |
+
{
|
8740 |
+
"case_id": "121",
|
8741 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/121",
|
8742 |
+
"task_description": "Compute arcsine of all elements in the input sequence.",
|
8743 |
+
"vocab": [
|
8744 |
+
-1.0,
|
8745 |
+
-0.9,
|
8746 |
+
-0.8,
|
8747 |
+
-0.7,
|
8748 |
+
-0.6,
|
8749 |
+
-0.5,
|
8750 |
+
-0.4,
|
8751 |
+
-0.30000000000000004,
|
8752 |
+
-0.19999999999999996,
|
8753 |
+
-0.09999999999999998,
|
8754 |
+
0.0,
|
8755 |
+
0.10000000000000009,
|
8756 |
+
0.19999999999999996,
|
8757 |
+
0.30000000000000004,
|
8758 |
+
0.3999999999999999,
|
8759 |
+
0.5,
|
8760 |
+
0.6000000000000001,
|
8761 |
+
0.7,
|
8762 |
+
0.8,
|
8763 |
+
0.8999999999999999
|
8764 |
+
],
|
8765 |
+
"max_seq_len": 10,
|
8766 |
+
"min_seq_len": 4,
|
8767 |
+
"files": [
|
8768 |
+
{
|
8769 |
+
"file_name": "edges.pkl",
|
8770 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/edges.pkl"
|
8771 |
+
},
|
8772 |
+
{
|
8773 |
+
"file_name": "ll_model.pth",
|
8774 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model.pth"
|
8775 |
+
},
|
8776 |
+
{
|
8777 |
+
"file_name": "ll_model_cfg.pkl",
|
8778 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model_cfg.pkl"
|
8779 |
+
},
|
8780 |
+
{
|
8781 |
+
"file_name": "meta.json",
|
8782 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/meta.json"
|
8783 |
+
}
|
8784 |
+
],
|
8785 |
+
"transformer_cfg": {
|
8786 |
+
"n_layers": 2,
|
8787 |
+
"d_model": 4,
|
8788 |
+
"n_ctx": 10,
|
8789 |
+
"d_head": 1,
|
8790 |
+
"model_name": "custom",
|
8791 |
+
"n_heads": 4,
|
8792 |
+
"d_mlp": 16,
|
8793 |
+
"act_fn": "gelu",
|
8794 |
+
"d_vocab": 22,
|
8795 |
+
"eps": 1e-05,
|
8796 |
+
"use_attn_result": true,
|
8797 |
+
"use_attn_scale": true,
|
8798 |
+
"use_split_qkv_input": true,
|
8799 |
+
"use_hook_mlp_in": true,
|
8800 |
+
"use_attn_in": false,
|
8801 |
+
"use_local_attn": false,
|
8802 |
+
"original_architecture": null,
|
8803 |
+
"from_checkpoint": false,
|
8804 |
+
"checkpoint_index": null,
|
8805 |
+
"checkpoint_label_type": null,
|
8806 |
+
"checkpoint_value": null,
|
8807 |
+
"tokenizer_name": null,
|
8808 |
+
"window_size": null,
|
8809 |
+
"attn_types": null,
|
8810 |
+
"init_mode": "gpt2",
|
8811 |
+
"normalization_type": null,
|
8812 |
+
"n_devices": 1,
|
8813 |
+
"attention_dir": "causal",
|
8814 |
+
"attn_only": false,
|
8815 |
+
"seed": 0,
|
8816 |
+
"initializer_range": 0.11202240672224079,
|
8817 |
+
"init_weights": true,
|
8818 |
+
"scale_attn_by_inverse_layer_idx": false,
|
8819 |
+
"positional_embedding_type": "standard",
|
8820 |
+
"final_rms": false,
|
8821 |
+
"d_vocab_out": 20,
|
8822 |
+
"parallel_attn_mlp": false,
|
8823 |
+
"rotary_dim": null,
|
8824 |
+
"n_params": 384,
|
8825 |
+
"use_hook_tokens": false,
|
8826 |
+
"gated_mlp": false,
|
8827 |
+
"default_prepend_bos": true,
|
8828 |
+
"dtype": "torch.float32",
|
8829 |
+
"tokenizer_prepends_bos": null,
|
8830 |
+
"n_key_value_heads": null,
|
8831 |
+
"post_embedding_ln": false,
|
8832 |
+
"rotary_base": 10000,
|
8833 |
+
"trust_remote_code": false,
|
8834 |
+
"rotary_adjacent_pairs": false,
|
8835 |
+
"load_in_4bit": false,
|
8836 |
+
"num_experts": null,
|
8837 |
+
"experts_per_token": null
|
8838 |
+
},
|
8839 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model_cfg.pkl",
|
8840 |
+
"training_args": {
|
8841 |
+
"output_dir": "/circuits-benchmark/results",
|
8842 |
+
"atol": 0.05,
|
8843 |
+
"lr": 0.001,
|
8844 |
+
"use_single_loss": true,
|
8845 |
+
"iit_weight": 1.0,
|
8846 |
+
"behavior_weight": 0.4,
|
8847 |
+
"strict_weight": 1.0,
|
8848 |
+
"epochs": 1000,
|
8849 |
+
"early_stop_accuracy_threshold": 99.9,
|
8850 |
+
"act_fn": "gelu",
|
8851 |
+
"use_wandb": true,
|
8852 |
+
"save_model_to_wandb": true,
|
8853 |
+
"clip_grad_norm": 0.1,
|
8854 |
+
"lr_scheduler": "linear",
|
8855 |
+
"model_pair": "strict",
|
8856 |
+
"same_size": false,
|
8857 |
+
"seed": 67,
|
8858 |
+
"batch_size": 256,
|
8859 |
+
"include_mlp": false,
|
8860 |
+
"detach_while_caching": true,
|
8861 |
+
"scheduler_val_metric": [
|
8862 |
+
"val/accuracy",
|
8863 |
+
"val/IIA",
|
8864 |
+
"val/strict_accuracy"
|
8865 |
+
],
|
8866 |
+
"siit_sampling": "sample_all",
|
8867 |
+
"val_iia_sampling": "all"
|
8868 |
+
},
|
8869 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/meta.json",
|
8870 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model.pth",
|
8871 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/edges.pkl"
|
8872 |
+
},
|
8873 |
+
{
|
8874 |
+
"case_id": "35",
|
8875 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/35",
|
8876 |
+
"task_description": "Alternates capitalization of each character in words.",
|
8877 |
+
"vocab": [
|
8878 |
+
"J",
|
8879 |
+
"LB",
|
8880 |
+
"TPSI",
|
8881 |
+
"V",
|
8882 |
+
"b",
|
8883 |
+
"no",
|
8884 |
+
"oCLrZaW",
|
8885 |
+
"poiVg"
|
8886 |
+
],
|
8887 |
+
"max_seq_len": 10,
|
8888 |
+
"min_seq_len": 4,
|
8889 |
+
"files": [
|
8890 |
+
{
|
8891 |
+
"file_name": "edges.pkl",
|
8892 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/edges.pkl"
|
8893 |
+
},
|
8894 |
+
{
|
8895 |
+
"file_name": "ll_model.pth",
|
8896 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model.pth"
|
8897 |
+
},
|
8898 |
+
{
|
8899 |
+
"file_name": "ll_model_cfg.pkl",
|
8900 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl"
|
8901 |
+
},
|
8902 |
+
{
|
8903 |
+
"file_name": "meta.json",
|
8904 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/meta.json"
|
8905 |
+
}
|
8906 |
+
],
|
8907 |
+
"transformer_cfg": {
|
8908 |
+
"n_layers": 2,
|
8909 |
+
"d_model": 9,
|
8910 |
+
"n_ctx": 10,
|
8911 |
+
"d_head": 2,
|
8912 |
+
"model_name": "custom",
|
8913 |
+
"n_heads": 4,
|
8914 |
+
"d_mlp": 36,
|
8915 |
+
"act_fn": "gelu",
|
8916 |
+
"d_vocab": 10,
|
8917 |
+
"eps": 1e-05,
|
8918 |
+
"use_attn_result": true,
|
8919 |
+
"use_attn_scale": true,
|
8920 |
+
"use_split_qkv_input": true,
|
8921 |
+
"use_hook_mlp_in": true,
|
8922 |
+
"use_attn_in": false,
|
8923 |
+
"use_local_attn": false,
|
8924 |
+
"original_architecture": null,
|
8925 |
+
"from_checkpoint": false,
|
8926 |
+
"checkpoint_index": null,
|
8927 |
+
"checkpoint_label_type": null,
|
8928 |
+
"checkpoint_value": null,
|
8929 |
+
"tokenizer_name": null,
|
8930 |
+
"window_size": null,
|
8931 |
+
"attn_types": null,
|
8932 |
+
"init_mode": "gpt2",
|
8933 |
+
"normalization_type": null,
|
8934 |
+
"n_devices": 1,
|
8935 |
+
"attention_dir": "causal",
|
8936 |
+
"attn_only": false,
|
8937 |
+
"seed": 0,
|
8938 |
+
"initializer_range": 0.1539600717839002,
|
8939 |
+
"init_weights": true,
|
8940 |
+
"scale_attn_by_inverse_layer_idx": false,
|
8941 |
+
"positional_embedding_type": "standard",
|
8942 |
+
"final_rms": false,
|
8943 |
+
"d_vocab_out": 8,
|
8944 |
+
"parallel_attn_mlp": false,
|
8945 |
+
"rotary_dim": null,
|
8946 |
+
"n_params": 1872,
|
8947 |
+
"use_hook_tokens": false,
|
8948 |
+
"gated_mlp": false,
|
8949 |
+
"default_prepend_bos": true,
|
8950 |
+
"dtype": "torch.float32",
|
8951 |
+
"tokenizer_prepends_bos": null,
|
8952 |
+
"n_key_value_heads": null,
|
8953 |
+
"post_embedding_ln": false,
|
8954 |
+
"rotary_base": 10000,
|
8955 |
+
"trust_remote_code": false,
|
8956 |
+
"rotary_adjacent_pairs": false
|
8957 |
+
},
|
8958 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl",
|
8959 |
"training_args": {
|
8960 |
"atol": 0.05,
|
8961 |
"lr": 0.01,
|
|
|
9060 |
"lr": 0.01,
|
9061 |
"use_single_loss": false,
|
9062 |
"iit_weight": 1.0,
|
9063 |
+
"behavior_weight": 1.0,
|
9064 |
+
"strict_weight": 10.0,
|
9065 |
+
"epochs": 2000,
|
9066 |
+
"act_fn": "gelu",
|
9067 |
+
"clip_grad_norm": 0.1,
|
9068 |
+
"lr_scheduler": "",
|
9069 |
+
"model_pair": "strict",
|
9070 |
+
"same_size": false
|
9071 |
+
},
|
9072 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/meta.json",
|
9073 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model.pth",
|
9074 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/edges.pkl"
|
9075 |
+
},
|
9076 |
+
{
|
9077 |
+
"case_id": "36",
|
9078 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/36",
|
9079 |
+
"task_description": "Classifies each token as 'positive', 'negative', or 'neutral' based on emojis.",
|
9080 |
+
"vocab": [
|
9081 |
+
"\ud83d\udcd8",
|
9082 |
+
"\ud83d\ude0a",
|
9083 |
+
"\ud83d\ude22"
|
9084 |
+
],
|
9085 |
+
"max_seq_len": 10,
|
9086 |
+
"min_seq_len": 4,
|
9087 |
+
"files": [
|
9088 |
+
{
|
9089 |
+
"file_name": "edges.pkl",
|
9090 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl"
|
9091 |
+
},
|
9092 |
+
{
|
9093 |
+
"file_name": "ll_model.pth",
|
9094 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth"
|
9095 |
+
},
|
9096 |
+
{
|
9097 |
+
"file_name": "ll_model_cfg.pkl",
|
9098 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl"
|
9099 |
+
},
|
9100 |
+
{
|
9101 |
+
"file_name": "meta.json",
|
9102 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json"
|
9103 |
+
}
|
9104 |
+
],
|
9105 |
+
"transformer_cfg": {
|
9106 |
+
"n_layers": 2,
|
9107 |
+
"d_model": 6,
|
9108 |
+
"n_ctx": 10,
|
9109 |
+
"d_head": 1,
|
9110 |
+
"model_name": "custom",
|
9111 |
+
"n_heads": 4,
|
9112 |
+
"d_mlp": 24,
|
9113 |
+
"act_fn": "gelu",
|
9114 |
+
"d_vocab": 5,
|
9115 |
+
"eps": 1e-05,
|
9116 |
+
"use_attn_result": true,
|
9117 |
+
"use_attn_scale": true,
|
9118 |
+
"use_split_qkv_input": true,
|
9119 |
+
"use_hook_mlp_in": true,
|
9120 |
+
"use_attn_in": false,
|
9121 |
+
"use_local_attn": false,
|
9122 |
+
"original_architecture": null,
|
9123 |
+
"from_checkpoint": false,
|
9124 |
+
"checkpoint_index": null,
|
9125 |
+
"checkpoint_label_type": null,
|
9126 |
+
"checkpoint_value": null,
|
9127 |
+
"tokenizer_name": null,
|
9128 |
+
"window_size": null,
|
9129 |
+
"attn_types": null,
|
9130 |
+
"init_mode": "gpt2",
|
9131 |
+
"normalization_type": null,
|
9132 |
+
"n_devices": 1,
|
9133 |
+
"attention_dir": "causal",
|
9134 |
+
"attn_only": false,
|
9135 |
+
"seed": 0,
|
9136 |
+
"initializer_range": 0.19402850002906638,
|
9137 |
+
"init_weights": true,
|
9138 |
+
"scale_attn_by_inverse_layer_idx": false,
|
9139 |
+
"positional_embedding_type": "standard",
|
9140 |
+
"final_rms": false,
|
9141 |
+
"d_vocab_out": 3,
|
9142 |
+
"parallel_attn_mlp": false,
|
9143 |
+
"rotary_dim": null,
|
9144 |
+
"n_params": 768,
|
9145 |
+
"use_hook_tokens": false,
|
9146 |
+
"gated_mlp": false,
|
9147 |
+
"default_prepend_bos": true,
|
9148 |
+
"dtype": "torch.float32",
|
9149 |
+
"tokenizer_prepends_bos": null,
|
9150 |
+
"n_key_value_heads": null,
|
9151 |
+
"post_embedding_ln": false,
|
9152 |
+
"rotary_base": 10000,
|
9153 |
+
"trust_remote_code": false,
|
9154 |
+
"rotary_adjacent_pairs": false
|
9155 |
+
},
|
9156 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl",
|
9157 |
+
"training_args": {
|
9158 |
+
"atol": 0.05,
|
9159 |
+
"lr": 0.01,
|
9160 |
+
"use_single_loss": false,
|
9161 |
+
"iit_weight": 1.0,
|
9162 |
+
"behavior_weight": 1.0,
|
9163 |
+
"strict_weight": 1.0,
|
9164 |
+
"epochs": 2000,
|
9165 |
+
"act_fn": "gelu",
|
9166 |
+
"clip_grad_norm": 0.1,
|
9167 |
+
"lr_scheduler": "",
|
9168 |
+
"model_pair": "strict"
|
9169 |
+
},
|
9170 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json",
|
9171 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth",
|
9172 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl"
|
9173 |
+
},
|
9174 |
+
{
|
9175 |
+
"case_id": "106",
|
9176 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/106",
|
9177 |
+
"task_description": "Sets all elements to zero except for the element at index 1.",
|
9178 |
+
"vocab": [
|
9179 |
+
0,
|
9180 |
+
1,
|
9181 |
+
2,
|
9182 |
+
3,
|
9183 |
+
4,
|
9184 |
+
5,
|
9185 |
+
6,
|
9186 |
+
7,
|
9187 |
+
8,
|
9188 |
+
9,
|
9189 |
+
10
|
9190 |
+
],
|
9191 |
+
"max_seq_len": 10,
|
9192 |
+
"min_seq_len": 4,
|
9193 |
+
"files": [
|
9194 |
+
{
|
9195 |
+
"file_name": "edges.pkl",
|
9196 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/edges.pkl"
|
9197 |
+
},
|
9198 |
+
{
|
9199 |
+
"file_name": "ll_model.pth",
|
9200 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model.pth"
|
9201 |
+
},
|
9202 |
+
{
|
9203 |
+
"file_name": "ll_model_cfg.pkl",
|
9204 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model_cfg.pkl"
|
9205 |
+
},
|
9206 |
+
{
|
9207 |
+
"file_name": "meta.json",
|
9208 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/meta.json"
|
9209 |
+
}
|
9210 |
+
],
|
9211 |
+
"transformer_cfg": {
|
9212 |
+
"n_layers": 2,
|
9213 |
+
"d_model": 4,
|
9214 |
+
"n_ctx": 10,
|
9215 |
+
"d_head": 1,
|
9216 |
+
"model_name": "custom",
|
9217 |
+
"n_heads": 4,
|
9218 |
+
"d_mlp": 16,
|
9219 |
+
"act_fn": "gelu",
|
9220 |
+
"d_vocab": 13,
|
9221 |
+
"eps": 1e-05,
|
9222 |
+
"use_attn_result": true,
|
9223 |
+
"use_attn_scale": true,
|
9224 |
+
"use_split_qkv_input": true,
|
9225 |
+
"use_hook_mlp_in": true,
|
9226 |
+
"use_attn_in": false,
|
9227 |
+
"use_local_attn": false,
|
9228 |
+
"original_architecture": null,
|
9229 |
+
"from_checkpoint": false,
|
9230 |
+
"checkpoint_index": null,
|
9231 |
+
"checkpoint_label_type": null,
|
9232 |
+
"checkpoint_value": null,
|
9233 |
+
"tokenizer_name": null,
|
9234 |
+
"window_size": null,
|
9235 |
+
"attn_types": null,
|
9236 |
+
"init_mode": "gpt2",
|
9237 |
+
"normalization_type": null,
|
9238 |
+
"n_devices": 1,
|
9239 |
+
"attention_dir": "causal",
|
9240 |
+
"attn_only": false,
|
9241 |
+
"seed": 0,
|
9242 |
+
"initializer_range": 0.13719886811400708,
|
9243 |
+
"init_weights": true,
|
9244 |
+
"scale_attn_by_inverse_layer_idx": false,
|
9245 |
+
"positional_embedding_type": "standard",
|
9246 |
+
"final_rms": false,
|
9247 |
+
"d_vocab_out": 11,
|
9248 |
+
"parallel_attn_mlp": false,
|
9249 |
+
"rotary_dim": null,
|
9250 |
+
"n_params": 384,
|
9251 |
+
"use_hook_tokens": false,
|
9252 |
+
"gated_mlp": false,
|
9253 |
+
"default_prepend_bos": true,
|
9254 |
+
"dtype": "torch.float32",
|
9255 |
+
"tokenizer_prepends_bos": null,
|
9256 |
+
"n_key_value_heads": null,
|
9257 |
+
"post_embedding_ln": false,
|
9258 |
+
"rotary_base": 10000,
|
9259 |
+
"trust_remote_code": false,
|
9260 |
+
"rotary_adjacent_pairs": false,
|
9261 |
+
"load_in_4bit": false,
|
9262 |
+
"num_experts": null,
|
9263 |
+
"experts_per_token": null
|
9264 |
+
},
|
9265 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model_cfg.pkl",
|
9266 |
+
"training_args": {
|
9267 |
+
"output_dir": "/circuits-benchmark/results",
|
9268 |
+
"atol": 0.05,
|
9269 |
+
"lr": 0.001,
|
9270 |
+
"use_single_loss": true,
|
9271 |
+
"iit_weight": 1.0,
|
9272 |
+
"behavior_weight": 0.4,
|
9273 |
+
"strict_weight": 0.7,
|
9274 |
+
"epochs": 1000,
|
9275 |
+
"early_stop_accuracy_threshold": 99.9,
|
9276 |
"act_fn": "gelu",
|
9277 |
+
"use_wandb": true,
|
9278 |
+
"save_model_to_wandb": true,
|
9279 |
"clip_grad_norm": 0.1,
|
9280 |
+
"lr_scheduler": "linear",
|
9281 |
"model_pair": "strict",
|
9282 |
+
"same_size": false,
|
9283 |
+
"seed": 92,
|
9284 |
+
"batch_size": 256,
|
9285 |
+
"include_mlp": false,
|
9286 |
+
"detach_while_caching": true,
|
9287 |
+
"scheduler_val_metric": [
|
9288 |
+
"val/accuracy",
|
9289 |
+
"val/IIA",
|
9290 |
+
"val/strict_accuracy"
|
9291 |
+
],
|
9292 |
+
"siit_sampling": "sample_all",
|
9293 |
+
"val_iia_sampling": "all"
|
9294 |
},
|
9295 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/meta.json",
|
9296 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model.pth",
|
9297 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/edges.pkl"
|
9298 |
},
|
9299 |
{
|
9300 |
+
"case_id": "64",
|
9301 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/64",
|
9302 |
+
"task_description": "Cubes each element in the sequence.",
|
9303 |
"vocab": [
|
9304 |
+
0,
|
9305 |
+
1,
|
9306 |
+
2,
|
9307 |
+
3,
|
9308 |
+
4,
|
9309 |
+
5,
|
9310 |
+
6,
|
9311 |
+
7,
|
9312 |
+
8,
|
9313 |
+
9,
|
9314 |
+
10
|
9315 |
],
|
9316 |
"max_seq_len": 10,
|
9317 |
"min_seq_len": 4,
|
9318 |
"files": [
|
9319 |
{
|
9320 |
"file_name": "edges.pkl",
|
9321 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl"
|
9322 |
},
|
9323 |
{
|
9324 |
"file_name": "ll_model.pth",
|
9325 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth"
|
9326 |
},
|
9327 |
{
|
9328 |
"file_name": "ll_model_cfg.pkl",
|
9329 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl"
|
9330 |
},
|
9331 |
{
|
9332 |
"file_name": "meta.json",
|
9333 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json"
|
9334 |
}
|
9335 |
],
|
9336 |
"transformer_cfg": {
|
9337 |
"n_layers": 2,
|
9338 |
+
"d_model": 4,
|
9339 |
"n_ctx": 10,
|
9340 |
"d_head": 1,
|
9341 |
"model_name": "custom",
|
9342 |
"n_heads": 4,
|
9343 |
+
"d_mlp": 16,
|
9344 |
"act_fn": "gelu",
|
9345 |
+
"d_vocab": 13,
|
9346 |
"eps": 1e-05,
|
9347 |
"use_attn_result": true,
|
9348 |
"use_attn_scale": true,
|
|
|
9364 |
"attention_dir": "causal",
|
9365 |
"attn_only": false,
|
9366 |
"seed": 0,
|
9367 |
+
"initializer_range": 0.1392621247645583,
|
9368 |
"init_weights": true,
|
9369 |
"scale_attn_by_inverse_layer_idx": false,
|
9370 |
"positional_embedding_type": "standard",
|
9371 |
"final_rms": false,
|
9372 |
+
"d_vocab_out": 11,
|
9373 |
"parallel_attn_mlp": false,
|
9374 |
"rotary_dim": null,
|
9375 |
+
"n_params": 384,
|
9376 |
"use_hook_tokens": false,
|
9377 |
"gated_mlp": false,
|
9378 |
"default_prepend_bos": true,
|
|
|
9382 |
"post_embedding_ln": false,
|
9383 |
"rotary_base": 10000,
|
9384 |
"trust_remote_code": false,
|
9385 |
+
"rotary_adjacent_pairs": false,
|
9386 |
+
"load_in_4bit": false,
|
9387 |
+
"num_experts": null,
|
9388 |
+
"experts_per_token": null
|
9389 |
},
|
9390 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl",
|
9391 |
"training_args": {
|
9392 |
+
"output_dir": "/circuits-benchmark/results",
|
9393 |
"atol": 0.05,
|
9394 |
+
"lr": 0.001,
|
9395 |
+
"use_single_loss": true,
|
9396 |
"iit_weight": 1.0,
|
9397 |
+
"behavior_weight": 0.4,
|
9398 |
+
"strict_weight": 0.7,
|
9399 |
+
"epochs": 1000,
|
9400 |
+
"early_stop_accuracy_threshold": 99.9,
|
9401 |
"act_fn": "gelu",
|
9402 |
+
"use_wandb": true,
|
9403 |
+
"save_model_to_wandb": true,
|
9404 |
"clip_grad_norm": 0.1,
|
9405 |
+
"lr_scheduler": "linear",
|
9406 |
+
"model_pair": "strict",
|
9407 |
+
"same_size": false,
|
9408 |
+
"seed": 67,
|
9409 |
+
"batch_size": 256,
|
9410 |
+
"include_mlp": false,
|
9411 |
+
"detach_while_caching": true,
|
9412 |
+
"scheduler_val_metric": [
|
9413 |
+
"val/accuracy",
|
9414 |
+
"val/IIA",
|
9415 |
+
"val/strict_accuracy"
|
9416 |
+
],
|
9417 |
+
"siit_sampling": "sample_all",
|
9418 |
+
"val_iia_sampling": "all"
|
9419 |
},
|
9420 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json",
|
9421 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth",
|
9422 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl"
|
9423 |
},
|
9424 |
{
|
9425 |
+
"case_id": "8",
|
9426 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/8",
|
9427 |
+
"task_description": "Identity",
|
9428 |
"vocab": [
|
9429 |
0,
|
9430 |
1,
|
|
|
9443 |
"files": [
|
9444 |
{
|
9445 |
"file_name": "edges.pkl",
|
9446 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl"
|
9447 |
},
|
9448 |
{
|
9449 |
"file_name": "ll_model.pth",
|
9450 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth"
|
9451 |
},
|
9452 |
{
|
9453 |
"file_name": "ll_model_cfg.pkl",
|
9454 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl"
|
9455 |
},
|
9456 |
{
|
9457 |
"file_name": "meta.json",
|
9458 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json"
|
9459 |
}
|
9460 |
],
|
9461 |
"transformer_cfg": {
|
|
|
9512 |
"num_experts": null,
|
9513 |
"experts_per_token": null
|
9514 |
},
|
9515 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl",
|
9516 |
"training_args": {
|
9517 |
"output_dir": "/circuits-benchmark/results",
|
9518 |
"atol": 0.05,
|
|
|
9542 |
"siit_sampling": "sample_all",
|
9543 |
"val_iia_sampling": "all"
|
9544 |
},
|
9545 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json",
|
9546 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth",
|
9547 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl"
|
9548 |
},
|
9549 |
{
|
9550 |
+
"case_id": "73",
|
9551 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/73",
|
9552 |
+
"task_description": "Apply the sine function to each element of the input sequence.",
|
9553 |
"vocab": [
|
9554 |
0,
|
9555 |
1,
|
|
|
9568 |
"files": [
|
9569 |
{
|
9570 |
"file_name": "edges.pkl",
|
9571 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/edges.pkl"
|
9572 |
},
|
9573 |
{
|
9574 |
"file_name": "ll_model.pth",
|
9575 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model.pth"
|
9576 |
},
|
9577 |
{
|
9578 |
"file_name": "ll_model_cfg.pkl",
|
9579 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model_cfg.pkl"
|
9580 |
},
|
9581 |
{
|
9582 |
"file_name": "meta.json",
|
9583 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/meta.json"
|
9584 |
}
|
9585 |
],
|
9586 |
"transformer_cfg": {
|
|
|
9637 |
"num_experts": null,
|
9638 |
"experts_per_token": null
|
9639 |
},
|
9640 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model_cfg.pkl",
|
9641 |
"training_args": {
|
9642 |
"output_dir": "/circuits-benchmark/results",
|
9643 |
"atol": 0.05,
|
|
|
9655 |
"lr_scheduler": "linear",
|
9656 |
"model_pair": "strict",
|
9657 |
"same_size": false,
|
9658 |
+
"seed": 92,
|
9659 |
"batch_size": 256,
|
9660 |
"include_mlp": false,
|
9661 |
"detach_while_caching": true,
|
|
|
9667 |
"siit_sampling": "sample_all",
|
9668 |
"val_iia_sampling": "all"
|
9669 |
},
|
9670 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/meta.json",
|
9671 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model.pth",
|
9672 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/edges.pkl"
|
9673 |
},
|
9674 |
{
|
9675 |
"case_id": "103",
|
|
|
10046 |
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model.pth",
|
10047 |
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/edges.pkl"
|
10048 |
},
|
10049 |
+
{
|
10050 |
+
"case_id": "49",
|
10051 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/49",
|
10052 |
+
"task_description": "Decrements each element in the sequence until it becomes a multiple of 3.",
|
10053 |
+
"vocab": [
|
10054 |
+
0,
|
10055 |
+
1,
|
10056 |
+
2,
|
10057 |
+
3,
|
10058 |
+
4,
|
10059 |
+
5,
|
10060 |
+
6,
|
10061 |
+
7,
|
10062 |
+
8,
|
10063 |
+
9,
|
10064 |
+
10
|
10065 |
+
],
|
10066 |
+
"max_seq_len": 10,
|
10067 |
+
"min_seq_len": 4,
|
10068 |
+
"files": [
|
10069 |
+
{
|
10070 |
+
"file_name": "edges.pkl",
|
10071 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/edges.pkl"
|
10072 |
+
},
|
10073 |
+
{
|
10074 |
+
"file_name": "ll_model.pth",
|
10075 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model.pth"
|
10076 |
+
},
|
10077 |
+
{
|
10078 |
+
"file_name": "ll_model_cfg.pkl",
|
10079 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model_cfg.pkl"
|
10080 |
+
},
|
10081 |
+
{
|
10082 |
+
"file_name": "meta.json",
|
10083 |
+
"url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/meta.json"
|
10084 |
+
}
|
10085 |
+
],
|
10086 |
+
"transformer_cfg": {
|
10087 |
+
"n_layers": 2,
|
10088 |
+
"d_model": 4,
|
10089 |
+
"n_ctx": 10,
|
10090 |
+
"d_head": 1,
|
10091 |
+
"model_name": "custom",
|
10092 |
+
"n_heads": 4,
|
10093 |
+
"d_mlp": 16,
|
10094 |
+
"act_fn": "gelu",
|
10095 |
+
"d_vocab": 13,
|
10096 |
+
"eps": 1e-05,
|
10097 |
+
"use_attn_result": true,
|
10098 |
+
"use_attn_scale": true,
|
10099 |
+
"use_split_qkv_input": true,
|
10100 |
+
"use_hook_mlp_in": true,
|
10101 |
+
"use_attn_in": false,
|
10102 |
+
"use_local_attn": false,
|
10103 |
+
"original_architecture": null,
|
10104 |
+
"from_checkpoint": false,
|
10105 |
+
"checkpoint_index": null,
|
10106 |
+
"checkpoint_label_type": null,
|
10107 |
+
"checkpoint_value": null,
|
10108 |
+
"tokenizer_name": null,
|
10109 |
+
"window_size": null,
|
10110 |
+
"attn_types": null,
|
10111 |
+
"init_mode": "gpt2",
|
10112 |
+
"normalization_type": null,
|
10113 |
+
"n_devices": 1,
|
10114 |
+
"attention_dir": "causal",
|
10115 |
+
"attn_only": false,
|
10116 |
+
"seed": 0,
|
10117 |
+
"initializer_range": 0.15689290811054724,
|
10118 |
+
"init_weights": true,
|
10119 |
+
"scale_attn_by_inverse_layer_idx": false,
|
10120 |
+
"positional_embedding_type": "standard",
|
10121 |
+
"final_rms": false,
|
10122 |
+
"d_vocab_out": 4,
|
10123 |
+
"parallel_attn_mlp": false,
|
10124 |
+
"rotary_dim": null,
|
10125 |
+
"n_params": 384,
|
10126 |
+
"use_hook_tokens": false,
|
10127 |
+
"gated_mlp": false,
|
10128 |
+
"default_prepend_bos": true,
|
10129 |
+
"dtype": "torch.float32",
|
10130 |
+
"tokenizer_prepends_bos": null,
|
10131 |
+
"n_key_value_heads": null,
|
10132 |
+
"post_embedding_ln": false,
|
10133 |
+
"rotary_base": 10000,
|
10134 |
+
"trust_remote_code": false,
|
10135 |
+
"rotary_adjacent_pairs": false,
|
10136 |
+
"load_in_4bit": false,
|
10137 |
+
"num_experts": null,
|
10138 |
+
"experts_per_token": null
|
10139 |
+
},
|
10140 |
+
"transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model_cfg.pkl",
|
10141 |
+
"training_args": {
|
10142 |
+
"output_dir": "/circuits-benchmark/results",
|
10143 |
+
"atol": 0.05,
|
10144 |
+
"lr": 0.001,
|
10145 |
+
"use_single_loss": true,
|
10146 |
+
"iit_weight": 1.0,
|
10147 |
+
"behavior_weight": 0.4,
|
10148 |
+
"strict_weight": 0.7,
|
10149 |
+
"epochs": 1000,
|
10150 |
+
"early_stop_accuracy_threshold": 99.9,
|
10151 |
+
"act_fn": "gelu",
|
10152 |
+
"use_wandb": true,
|
10153 |
+
"save_model_to_wandb": true,
|
10154 |
+
"clip_grad_norm": 0.1,
|
10155 |
+
"lr_scheduler": "linear",
|
10156 |
+
"model_pair": "strict",
|
10157 |
+
"same_size": false,
|
10158 |
+
"seed": 92,
|
10159 |
+
"batch_size": 256,
|
10160 |
+
"include_mlp": false,
|
10161 |
+
"detach_while_caching": true,
|
10162 |
+
"scheduler_val_metric": [
|
10163 |
+
"val/accuracy",
|
10164 |
+
"val/IIA",
|
10165 |
+
"val/strict_accuracy"
|
10166 |
+
],
|
10167 |
+
"siit_sampling": "sample_all",
|
10168 |
+
"val_iia_sampling": "all"
|
10169 |
+
},
|
10170 |
+
"training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/meta.json",
|
10171 |
+
"weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model.pth",
|
10172 |
+
"circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/edges.pkl"
|
10173 |
+
},
|
10174 |
{
|
10175 |
"case_id": "46",
|
10176 |
"url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/46",
|