iarcuschin commited on
Commit
16c725e
1 Parent(s): 0f12a50

Add new models

Browse files
106/edges.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fda9b02cdb2f5d7252c229a12290c6d81381606b1bfad02979549f304bf2a5d0
3
+ size 134
106/ll_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:580798eae1391aca366f15c0442c3ef1c02b1b323d610d1d9ddee0faee5e664f
3
+ size 14698
106/ll_model_cfg.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:24bca874c32c8c431cdb732e3222b4090604cde6f05ce1359710b630220650e3
3
+ size 1093
106/meta.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 0.7, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-92-siit-weigth-0.7", "wandb_name": "case-106-seed-92-s-0.7-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 92, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
121/edges.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
3
+ size 113
121/ll_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8054e00aea3c35c5ee77c693f9feeba493c499fe3218e70780137938138a4675
3
+ size 15118
121/ll_model_cfg.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9f027ad4de6828c6f5bb7a3f3c8aabd9658526e33b2284eba366977823b89c0a
3
+ size 1093
121/meta.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-121-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
130/edges.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af2a7430f7477a79df1fce6300cf37e1c46d73c31a7f91e06221ef4a6ebf9bed
3
+ size 223
130/ll_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4be63b6e0776e45f04d0905702a3a520b2b6449691ae6e34b8504693ac6805be
3
+ size 21304
130/ll_model_cfg.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:192503b894021c736145328500ab1f316e60ed7a121cf04b089bcd05d04e50b4
3
+ size 1093
130/meta.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-130-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
15/edges.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ecc8ce1a212f987b85ec909238ebc7d01d36c58389391fc96d69ca007fa2d384
3
+ size 244
15/ll_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:22ff8d1015f06b8912051e6787ba4e058047facdaadd1d9322e7e89c070c131f
3
+ size 20728
15/ll_model_cfg.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f4162b8d5712db86a2025499b1561c655fd97402716ff352305c296c7a04ff65
3
+ size 1093
15/meta.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-15-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
41/edges.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
3
+ size 113
41/ll_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7d59c31ceb0d0c9afb12dc1f63ade3c4f9edba0dfd80d5779ae27188da2c21d8
3
+ size 14862
41/ll_model_cfg.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f1dee34cba288862b06c2ff669839e06b6c17aa46cdb685f4a2c5a8c3be8a39b
3
+ size 1093
41/meta.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-41-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
43/edges.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
3
+ size 113
43/ll_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:26cc6d6ffa5ae93ce73055d831d4a7119bca2166c2ed9731992c48b4b3debb49
3
+ size 15054
43/ll_model_cfg.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89a74c42552b846f4562163c6fe74a474edfa36e1972eb97bb3ce0d8aaf9444c
3
+ size 1093
43/meta.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-43-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
49/edges.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
3
+ size 113
49/ll_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:aab9be464531a3cf85f25e3ccb3153c15b6de9876d56799d8705d0784979a1ea
3
+ size 14634
49/ll_model_cfg.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e47363d4486f828a419ba208bee3a725d431ab80e418a8318f55cf6cd6bf310
3
+ size 1093
49/meta.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 0.7, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-92-siit-weigth-0.7", "wandb_name": "case-49-seed-92-s-0.7-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 92, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
66/edges.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
3
+ size 113
66/ll_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fa63d9e5b124ffb9ce9061e04b03b1ff551c8085fc51ddea31f488b152f5f7c3
3
+ size 14762
66/ll_model_cfg.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b04d734fcc61084204ead0d8cc11c5782598f6f6e4bf3e14b94eab7b0bc9d676
3
+ size 1093
66/meta.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 0.7, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-92-siit-weigth-0.7", "wandb_name": "case-66-seed-92-s-0.7-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 92, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
68/edges.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
3
+ size 113
68/ll_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1b739ebc05faa4d388c20ef60ab59e44695c4a82323ed7c9c3801ae8e502db9
3
+ size 14670
68/ll_model_cfg.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:be188cb9baf70c65af2c4ecf92c6de170c15a41599109f95c6b632f15bb3eec3
3
+ size 1093
68/meta.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 1.0, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-67-siit-weigth-1", "wandb_name": "case-68-seed-67-s-1-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 67, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
73/edges.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9a2cb02e0518a50c2b53be59ea3c3788ec80c0d3c6c1e70070bd7115abdfae77
3
+ size 113
73/ll_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:809fe1d4c9f818bac9a85b358d0722f6ed8527d56f988fe66d62f0eceac0f097
3
+ size 14698
73/ll_model_cfg.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:db76917a80935813594508b1d79b7a0836a20daf67e263161432430b095fd111
3
+ size 1093
73/meta.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"output_dir": "/circuits-benchmark/results", "atol": 0.05, "lr": 0.001, "use_single_loss": true, "iit_weight": 1.0, "behavior_weight": 0.4, "strict_weight": 0.7, "epochs": 1000, "early_stop_accuracy_threshold": 99.9, "act_fn": "gelu", "use_wandb": true, "wandb_project": "iit-train-seed-92-siit-weigth-0.7", "wandb_name": "case-73-seed-92-s-0.7-b-0.4-iit-1", "save_model_to_wandb": true, "device": "cuda", "clip_grad_norm": 0.1, "lr_scheduler": "linear", "model_pair": "strict", "same_size": false, "seed": 92, "batch_size": 256, "include_mlp": false, "detach_while_caching": true, "scheduler_val_metric": ["val/accuracy", "val/IIA", "val/strict_accuracy"], "siit_sampling": "sample_all", "val_iia_sampling": "all"}
benchmark_cases_metadata.csv CHANGED
@@ -27,6 +27,7 @@ ioi,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi,Indirect O
27
  30,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/30,Tags numeric tokens in a sequence based on whether they fall within a given range.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
28
  90,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/90,Replaces a specific token with another one.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/edges.pkl,2,4,10,1,custom,4,16,gelu,12,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1460593486680443,True,False,standard,False,9,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
29
  39,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/39,Returns the fraction of 'x' in the input up to the i-th position for all i.,60,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/edges.pkl,2,120,60,30,custom,4,480,gelu,28,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.08432740427115679,True,False,standard,False,1,False,345600,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 
30
  75,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/75,Double each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
31
  101,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/101,Check if each element is a square of an integer.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
32
  ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi_next_token,"Indirect Object Identification (IOI) task, trained using next token prediction.",16,16,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/edges.pkl,6,64,1024,16,gpt2,4,3072,gelu_new,50257,1e-05,False,True,False,False,False,False,GPT2LMHeadModel,False,gpt2,gpt2,LNPre,1,causal,False,,0.02886751345948129,True,False,standard,False,50257,False,2457600,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.001,False,1.0,1.0,0.4,,,,True,True,1.0,,,True,,256.0,True,True,"val/accuracy,val/IIA",,,True,0.65,False,0.0,True,max,,True,
@@ -34,14 +35,17 @@ ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi
34
  14,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/14,Returns the count of 'a' in the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/edges.pkl,2,8,10,2,custom,4,32,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.15689290811054724,True,False,standard,False,10,False,1536,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
35
  95,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/95,Counts the distinct prime factors of each number in the input list.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12060453783110546,True,False,standard,False,3,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
36
  84,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/84,Apply the arctangent function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 
37
  93,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/93,Swaps the nth with the n+1th element if n%2==1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/edges.pkl,3,20,10,5,custom,4,80,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10886621079036347,True,False,standard,False,11,False,14400,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
38
  37,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/37,Reverses each word in the sequence except for specified exclusions.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/edges.pkl,2,12,10,3,custom,4,48,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,8,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
39
  34,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/34,Calculate the ratio of vowels to consonants in each word.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/edges.pkl,2,16,10,4,custom,4,64,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16329931618554522,True,False,standard,False,5,False,6144,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
40
  26,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/26,Creates a cascading effect by repeating each token in sequence incrementally.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/edges.pkl,2,21,10,5,custom,4,84,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12344267996967354,True,False,standard,False,27,False,10416,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
 
41
  19,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/19,Removes consecutive duplicate tokens from a sequence.,15,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/edges.pkl,2,32,15,8,custom,4,128,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.15689290811054724,True,False,standard,False,3,False,24576,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.001,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,,True,,,True,True,,,,True,,True,,True,,,True,
42
  53,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/53,Increment elements at odd indices by 1,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13151918984428584,True,False,standard,False,12,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
43
  40,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/40,Sum the last and previous to last digits of a number,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/edges.pkl,2,4,10,1,custom,4,16,gelu,31,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.09847319278346618,True,False,standard,False,12,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
44
  51,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/51,Checks if each element is a Fibonacci number,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/edges.pkl,2,4,10,1,custom,4,16,gelu,102,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.07525766947068778,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 
45
  122,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/122,Check if each number is divisible by 3.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
46
  85,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/85,Square each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
47
  2,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/2,Reverse the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/edges.pkl,4,56,10,14,custom,4,224,gelu,28,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.07593263966019993,True,False,standard,False,26,False,150528,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
@@ -51,6 +55,7 @@ ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi
51
  20,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/20,Detect spam messages based on appearance of spam keywords.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/edges.pkl,2,13,10,3,custom,4,52,gelu,14,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16,True,False,standard,False,2,False,3952,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
52
  25,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/25,Normalizes token frequencies in a sequence to a range between 0 and 1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/edges.pkl,2,62,10,15,custom,4,248,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.08295613557843402,True,False,standard,False,56,False,91264,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
53
  11,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/11,Counts the number of words in a sequence based on their length.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/edges.pkl,2,12,10,3,custom,4,48,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1460593486680443,True,False,standard,False,5,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,500.0,,gelu,True,True,1.0,,,True,,,True,True,,,,True,,True,,True,,,True,
 
54
  54,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/54,Applies the hyperbolic tangent to each element.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
55
  124,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/124,Check if all elements in a list are equal.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.11547005383792516,True,False,standard,False,2,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
56
  102,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/102,"Reflects each element within a range (default is [2, 7]).",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/edges.pkl,2,4,10,1,custom,4,16,gelu,42,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1059625885652035,True,False,standard,False,6,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
@@ -60,15 +65,20 @@ ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi
60
  86,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/86,"Check if each element is a power of 2. Return 1 if true, otherwise 0.",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16329931618554522,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
61
  105,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/105,Replaces each number with the next prime after that number.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.11202240672224079,True,False,standard,False,10,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
62
  58,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/58,Mirrors the first half of the sequence to the second half.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/edges.pkl,3,32,10,8,custom,4,128,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10415112878465911,True,False,standard,False,11,False,36864,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 
63
  70,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/70,Apply the cosine function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
64
  62,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/62,Replaces each element with its factorial.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1414213562373095,True,False,standard,False,10,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
65
  111,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/111,Returns the last element of the sequence and pads the rest with zeros.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.09847319278346618,True,False,standard,False,11,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 
66
  35,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/35,Alternates capitalization of each character in words.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/edges.pkl,2,9,10,2,custom,4,36,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,8,False,1872,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
67
  3,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/3,Returns the fraction of 'x' in the input up to the i-th position for all i.,5,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/edges.pkl,2,12,5,3,custom,4,48,gelu,6,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.22188007849009167,True,False,standard,False,1,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,10.0,2000.0,,gelu,True,True,0.1,,strict,False,,,True,True,,,,True,,True,,True,,,True,
68
  36,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/36,"Classifies each token as 'positive', 'negative', or 'neutral' based on emojis.",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl,2,6,10,1,custom,4,24,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.19402850002906638,True,False,standard,False,3,False,768,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
 
69
  64,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/64,Cubes each element in the sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
70
  8,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/8,Identity,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 
71
  103,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/103,Swap consecutive numbers in a list,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10787197799411874,True,False,standard,False,11,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
72
  56,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/56,Sets every third element to zero.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13333333333333333,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
73
  97,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/97,Scale a sequence by its maximum element.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/edges.pkl,3,200,10,50,custom,4,800,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.05405899027195888,True,False,standard,False,64,False,1440000,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 
74
  46,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/46,Decrements each element in the sequence by 1,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 
27
  30,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/30,Tags numeric tokens in a sequence based on whether they fall within a given range.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/30/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
28
  90,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/90,Replaces a specific token with another one.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/90/edges.pkl,2,4,10,1,custom,4,16,gelu,12,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1460593486680443,True,False,standard,False,9,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
29
  39,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/39,Returns the fraction of 'x' in the input up to the i-th position for all i.,60,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/edges.pkl,2,120,60,30,custom,4,480,gelu,28,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.08432740427115679,True,False,standard,False,1,False,345600,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
30
+ 130,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/130,"Clips each element to be within a range (make the default range [2, 7]).",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/edges.pkl,3,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.10079052613579392,True,False,standard,False,6,False,576,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
31
  75,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/75,Double each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/75/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
32
  101,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/101,Check if each element is a square of an integer.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/101/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
33
  ioi_next_token,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/ioi_next_token,"Indirect Object Identification (IOI) task, trained using next token prediction.",16,16,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/ioi_next_token/edges.pkl,6,64,1024,16,gpt2,4,3072,gelu_new,50257,1e-05,False,True,False,False,False,False,GPT2LMHeadModel,False,gpt2,gpt2,LNPre,1,causal,False,,0.02886751345948129,True,False,standard,False,50257,False,2457600,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.001,False,1.0,1.0,0.4,,,,True,True,1.0,,,True,,256.0,True,True,"val/accuracy,val/IIA",,,True,0.65,False,0.0,True,max,,True,
 
35
  14,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/14,Returns the count of 'a' in the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/14/edges.pkl,2,8,10,2,custom,4,32,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.15689290811054724,True,False,standard,False,10,False,1536,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
36
  95,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/95,Counts the distinct prime factors of each number in the input list.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/95/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12060453783110546,True,False,standard,False,3,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
37
  84,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/84,Apply the arctangent function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
38
+ 66,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/66,Round each element in the input sequence to the nearest integer.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/edges.pkl,2,4,10,1,custom,4,16,gelu,22,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13151918984428584,True,False,standard,False,6,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,92.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
39
  93,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/93,Swaps the nth with the n+1th element if n%2==1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/93/edges.pkl,3,20,10,5,custom,4,80,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10886621079036347,True,False,standard,False,11,False,14400,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
40
  37,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/37,Reverses each word in the sequence except for specified exclusions.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/37/edges.pkl,2,12,10,3,custom,4,48,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,8,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
41
  34,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/34,Calculate the ratio of vowels to consonants in each word.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/34/edges.pkl,2,16,10,4,custom,4,64,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16329931618554522,True,False,standard,False,5,False,6144,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
42
  26,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/26,Creates a cascading effect by repeating each token in sequence incrementally.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/edges.pkl,2,21,10,5,custom,4,84,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12344267996967354,True,False,standard,False,27,False,10416,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
43
+ 15,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/15,Returns each token multiplied by two and subtracted by its index.,5,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/edges.pkl,3,4,5,1,custom,4,16,gelu,7,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.06553855364152325,True,False,standard,False,12,False,576,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
44
  19,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/19,Removes consecutive duplicate tokens from a sequence.,15,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/edges.pkl,2,32,15,8,custom,4,128,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.15689290811054724,True,False,standard,False,3,False,24576,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.001,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,,True,,,True,True,,,,True,,True,,True,,,True,
45
  53,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/53,Increment elements at odd indices by 1,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/53/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13151918984428584,True,False,standard,False,12,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
46
  40,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/40,Sum the last and previous to last digits of a number,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/40/edges.pkl,2,4,10,1,custom,4,16,gelu,31,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.09847319278346618,True,False,standard,False,12,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
47
  51,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/51,Checks if each element is a Fibonacci number,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/edges.pkl,2,4,10,1,custom,4,16,gelu,102,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.07525766947068778,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
48
+ 43,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/43,Returns the corresponding Fibonacci number for each element in the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/edges.pkl,2,4,10,1,custom,4,16,gelu,22,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1131370849898476,True,False,standard,False,19,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
49
  122,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/122,Check if each number is divisible by 3.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/122/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12199885626608374,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
50
  85,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/85,Square each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/85/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
51
  2,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/2,Reverse the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/2/edges.pkl,4,56,10,14,custom,4,224,gelu,28,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.07593263966019993,True,False,standard,False,26,False,150528,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 
55
  20,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/20,Detect spam messages based on appearance of spam keywords.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/20/edges.pkl,2,13,10,3,custom,4,52,gelu,14,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16,True,False,standard,False,2,False,3952,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
56
  25,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/25,Normalizes token frequencies in a sequence to a range between 0 and 1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/25/edges.pkl,2,62,10,15,custom,4,248,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.08295613557843402,True,False,standard,False,56,False,91264,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
57
  11,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/11,Counts the number of words in a sequence based on their length.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/edges.pkl,2,12,10,3,custom,4,48,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1460593486680443,True,False,standard,False,5,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,0.4,500.0,,gelu,True,True,1.0,,,True,,,True,True,,,,True,,True,,True,,,True,
58
+ 41,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/41,Make each element of the input sequence absolute,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/edges.pkl,2,4,10,1,custom,4,16,gelu,22,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.12344267996967354,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
59
  54,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/54,Applies the hyperbolic tangent to each element.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
60
  124,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/124,Check if all elements in a list are equal.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/124/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.11547005383792516,True,False,standard,False,2,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
61
  102,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/102,"Reflects each element within a range (default is [2, 7]).",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/102/edges.pkl,2,4,10,1,custom,4,16,gelu,42,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1059625885652035,True,False,standard,False,6,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
 
65
  86,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/86,"Check if each element is a power of 2. Return 1 if true, otherwise 0.",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/86/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.16329931618554522,True,False,standard,False,2,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
66
  105,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/105,Replaces each number with the next prime after that number.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/105/edges.pkl,2,4,10,1,custom,4,16,gelu,32,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.11202240672224079,True,False,standard,False,10,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
67
  58,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/58,Mirrors the first half of the sequence to the second half.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/edges.pkl,3,32,10,8,custom,4,128,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10415112878465911,True,False,standard,False,11,False,36864,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
68
+ 68,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/68,Increment each element until it becomes a multiple of 3,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,5,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
69
  70,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/70,Apply the cosine function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
70
  62,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/62,Replaces each element with its factorial.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1414213562373095,True,False,standard,False,10,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
71
  111,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/111,Returns the last element of the sequence and pads the rest with zeros.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.09847319278346618,True,False,standard,False,11,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
72
+ 121,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/121,Compute arcsine of all elements in the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/edges.pkl,2,4,10,1,custom,4,16,gelu,22,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.11202240672224079,True,False,standard,False,20,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,1.0,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
73
  35,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/35,Alternates capitalization of each character in words.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/edges.pkl,2,9,10,2,custom,4,36,gelu,10,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1539600717839002,True,False,standard,False,8,False,1872,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
74
  3,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/3,Returns the fraction of 'x' in the input up to the i-th position for all i.,5,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/edges.pkl,2,12,5,3,custom,4,48,gelu,6,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.22188007849009167,True,False,standard,False,1,False,3456,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,10.0,2000.0,,gelu,True,True,0.1,,strict,False,,,True,True,,,,True,,True,,True,,,True,
75
  36,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/36,"Classifies each token as 'positive', 'negative', or 'neutral' based on emojis.",10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl,2,6,10,1,custom,4,24,gelu,5,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.19402850002906638,True,False,standard,False,3,False,768,False,False,True,torch.float32,False,False,10000,False,False,True,,0.05,0.01,False,1.0,1.0,1.0,2000.0,,gelu,True,True,0.1,,strict,True,,,True,True,,,,True,,True,,True,,,True,
76
+ 106,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/106,Sets all elements to zero except for the element at index 1.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13719886811400708,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,92.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
77
  64,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/64,Cubes each element in the sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
78
  8,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/8,Identity,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
79
+ 73,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/73,Apply the sine function to each element of the input sequence.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,92.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
80
  103,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/103,Swap consecutive numbers in a list,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/103/edges.pkl,3,24,10,6,custom,4,96,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.10787197799411874,True,False,standard,False,11,False,20736,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
81
  56,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/56,Sets every third element to zero.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/56/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.13333333333333333,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
82
  97,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/97,Scale a sequence by its maximum element.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/edges.pkl,3,200,10,50,custom,4,800,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,bidirectional,False,0.0,0.05405899027195888,True,False,standard,False,64,False,1440000,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.4,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,82.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
83
+ 49,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/49,Decrements each element in the sequence until it becomes a multiple of 3.,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.15689290811054724,True,False,standard,False,4,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,92.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
84
  46,https://huggingface.co/cybershiptrooper/InterpBench/tree/main/46,Decrements each element in the sequence by 1,10,4,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/ll_model_cfg.pkl,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/meta.json,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/ll_model.pth,https://huggingface.co/cybershiptrooper/InterpBench/blob/main/46/edges.pkl,2,4,10,1,custom,4,16,gelu,13,1e-05,True,True,True,True,False,False,,False,,gpt2,,1,causal,False,0.0,0.1392621247645583,True,False,standard,False,11,False,384,False,False,True,torch.float32,False,False,10000,False,False,False,/circuits-benchmark/results,0.05,0.001,True,1.0,0.4,0.7,1000.0,99.9,gelu,True,True,0.1,linear,strict,False,67.0,256.0,False,True,"val/accuracy,val/IIA,val/strict_accuracy",sample_all,all,True,,True,,True,,,True,
benchmark_cases_metadata.parquet CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:729585ec39204363367ad83efc6bf10185f4e191fe490714be2ab026d1c9864c
3
- size 75187
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:049d63f22c918edb98d89c9eb69f091016c4780b033e5559523abd7e50188238
3
+ size 76100
benchmark_metadata.json CHANGED
@@ -3352,6 +3352,150 @@
3352
  "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model.pth",
3353
  "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/edges.pkl"
3354
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
3355
  {
3356
  "case_id": "75",
3357
  "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/75",
@@ -4233,6 +4377,140 @@
4233
  "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model.pth",
4234
  "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/edges.pkl"
4235
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4236
  {
4237
  "case_id": "93",
4238
  "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/93",
@@ -4663,40 +4941,159 @@
4663
  "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/edges.pkl"
4664
  },
4665
  {
4666
- "case_id": "19",
4667
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/19",
4668
- "task_description": "Removes consecutive duplicate tokens from a sequence.",
4669
  "vocab": [
4670
- "a",
4671
- "b",
4672
- "c"
 
 
4673
  ],
4674
- "max_seq_len": 15,
4675
  "min_seq_len": 4,
4676
  "files": [
4677
  {
4678
  "file_name": "edges.pkl",
4679
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/edges.pkl"
4680
  },
4681
  {
4682
  "file_name": "ll_model.pth",
4683
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model.pth"
4684
  },
4685
  {
4686
  "file_name": "ll_model_cfg.pkl",
4687
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model_cfg.pkl"
4688
  },
4689
  {
4690
  "file_name": "meta.json",
4691
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/meta.json"
4692
  }
4693
  ],
4694
  "transformer_cfg": {
4695
- "n_layers": 2,
4696
- "d_model": 32,
4697
- "n_ctx": 15,
4698
- "d_head": 8,
4699
- "model_name": "custom",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4700
  "n_heads": 4,
4701
  "d_mlp": 128,
4702
  "act_fn": "gelu",
@@ -5241,6 +5638,140 @@
5241
  "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model.pth",
5242
  "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/edges.pkl"
5243
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5244
  {
5245
  "case_id": "122",
5246
  "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/122",
@@ -6371,10 +6902,20 @@
6371
  "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/edges.pkl"
6372
  },
6373
  {
6374
- "case_id": "54",
6375
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/54",
6376
- "task_description": "Applies the hyperbolic tangent to each element.",
6377
  "vocab": [
 
 
 
 
 
 
 
 
 
 
6378
  0,
6379
  1,
6380
  2,
@@ -6384,19 +6925,143 @@
6384
  6,
6385
  7,
6386
  8,
6387
- 9,
6388
- 10
6389
  ],
6390
  "max_seq_len": 10,
6391
  "min_seq_len": 4,
6392
  "files": [
6393
  {
6394
  "file_name": "edges.pkl",
6395
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/edges.pkl"
6396
  },
6397
  {
6398
  "file_name": "ll_model.pth",
6399
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model.pth"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6400
  },
6401
  {
6402
  "file_name": "ll_model_cfg.pkl",
@@ -7572,9 +8237,9 @@
7572
  "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/edges.pkl"
7573
  },
7574
  {
7575
- "case_id": "70",
7576
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/70",
7577
- "task_description": "Apply the cosine function to each element of the input sequence.",
7578
  "vocab": [
7579
  0,
7580
  1,
@@ -7593,19 +8258,19 @@
7593
  "files": [
7594
  {
7595
  "file_name": "edges.pkl",
7596
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl"
7597
  },
7598
  {
7599
  "file_name": "ll_model.pth",
7600
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth"
7601
  },
7602
  {
7603
  "file_name": "ll_model_cfg.pkl",
7604
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl"
7605
  },
7606
  {
7607
  "file_name": "meta.json",
7608
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json"
7609
  }
7610
  ],
7611
  "transformer_cfg": {
@@ -7639,12 +8304,12 @@
7639
  "attention_dir": "causal",
7640
  "attn_only": false,
7641
  "seed": 0,
7642
- "initializer_range": 0.1392621247645583,
7643
  "init_weights": true,
7644
  "scale_attn_by_inverse_layer_idx": false,
7645
  "positional_embedding_type": "standard",
7646
  "final_rms": false,
7647
- "d_vocab_out": 11,
7648
  "parallel_attn_mlp": false,
7649
  "rotary_dim": null,
7650
  "n_params": 384,
@@ -7662,7 +8327,7 @@
7662
  "num_experts": null,
7663
  "experts_per_token": null
7664
  },
7665
- "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl",
7666
  "training_args": {
7667
  "output_dir": "/circuits-benchmark/results",
7668
  "atol": 0.05,
@@ -7670,7 +8335,7 @@
7670
  "use_single_loss": true,
7671
  "iit_weight": 1.0,
7672
  "behavior_weight": 0.4,
7673
- "strict_weight": 0.7,
7674
  "epochs": 1000,
7675
  "early_stop_accuracy_threshold": 99.9,
7676
  "act_fn": "gelu",
@@ -7692,14 +8357,14 @@
7692
  "siit_sampling": "sample_all",
7693
  "val_iia_sampling": "all"
7694
  },
7695
- "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json",
7696
- "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth",
7697
- "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl"
7698
  },
7699
  {
7700
- "case_id": "62",
7701
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/62",
7702
- "task_description": "Replaces each element with its factorial.",
7703
  "vocab": [
7704
  0,
7705
  1,
@@ -7718,19 +8383,19 @@
7718
  "files": [
7719
  {
7720
  "file_name": "edges.pkl",
7721
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl"
7722
  },
7723
  {
7724
  "file_name": "ll_model.pth",
7725
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth"
7726
  },
7727
  {
7728
  "file_name": "ll_model_cfg.pkl",
7729
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl"
7730
  },
7731
  {
7732
  "file_name": "meta.json",
7733
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json"
7734
  }
7735
  ],
7736
  "transformer_cfg": {
@@ -7764,12 +8429,12 @@
7764
  "attention_dir": "causal",
7765
  "attn_only": false,
7766
  "seed": 0,
7767
- "initializer_range": 0.1414213562373095,
7768
  "init_weights": true,
7769
  "scale_attn_by_inverse_layer_idx": false,
7770
  "positional_embedding_type": "standard",
7771
  "final_rms": false,
7772
- "d_vocab_out": 10,
7773
  "parallel_attn_mlp": false,
7774
  "rotary_dim": null,
7775
  "n_params": 384,
@@ -7787,7 +8452,7 @@
7787
  "num_experts": null,
7788
  "experts_per_token": null
7789
  },
7790
- "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl",
7791
  "training_args": {
7792
  "output_dir": "/circuits-benchmark/results",
7793
  "atol": 0.05,
@@ -7817,14 +8482,14 @@
7817
  "siit_sampling": "sample_all",
7818
  "val_iia_sampling": "all"
7819
  },
7820
- "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json",
7821
- "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth",
7822
- "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl"
7823
  },
7824
  {
7825
- "case_id": "111",
7826
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/111",
7827
- "task_description": "Returns the last element of the sequence and pads the rest with zeros.",
7828
  "vocab": [
7829
  0,
7830
  1,
@@ -7843,29 +8508,29 @@
7843
  "files": [
7844
  {
7845
  "file_name": "edges.pkl",
7846
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl"
7847
  },
7848
  {
7849
  "file_name": "ll_model.pth",
7850
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth"
7851
  },
7852
  {
7853
  "file_name": "ll_model_cfg.pkl",
7854
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl"
7855
  },
7856
  {
7857
  "file_name": "meta.json",
7858
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json"
7859
  }
7860
  ],
7861
  "transformer_cfg": {
7862
- "n_layers": 3,
7863
- "d_model": 24,
7864
  "n_ctx": 10,
7865
- "d_head": 6,
7866
  "model_name": "custom",
7867
  "n_heads": 4,
7868
- "d_mlp": 96,
7869
  "act_fn": "gelu",
7870
  "d_vocab": 13,
7871
  "eps": 1e-05,
@@ -7886,18 +8551,18 @@
7886
  "init_mode": "gpt2",
7887
  "normalization_type": null,
7888
  "n_devices": 1,
7889
- "attention_dir": "bidirectional",
7890
  "attn_only": false,
7891
  "seed": 0,
7892
- "initializer_range": 0.09847319278346618,
7893
  "init_weights": true,
7894
  "scale_attn_by_inverse_layer_idx": false,
7895
  "positional_embedding_type": "standard",
7896
  "final_rms": false,
7897
- "d_vocab_out": 11,
7898
  "parallel_attn_mlp": false,
7899
  "rotary_dim": null,
7900
- "n_params": 20736,
7901
  "use_hook_tokens": false,
7902
  "gated_mlp": false,
7903
  "default_prepend_bos": true,
@@ -7912,7 +8577,7 @@
7912
  "num_experts": null,
7913
  "experts_per_token": null
7914
  },
7915
- "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl",
7916
  "training_args": {
7917
  "output_dir": "/circuits-benchmark/results",
7918
  "atol": 0.05,
@@ -7920,7 +8585,7 @@
7920
  "use_single_loss": true,
7921
  "iit_weight": 1.0,
7922
  "behavior_weight": 0.4,
7923
- "strict_weight": 0.4,
7924
  "epochs": 1000,
7925
  "early_stop_accuracy_threshold": 99.9,
7926
  "act_fn": "gelu",
@@ -7942,54 +8607,57 @@
7942
  "siit_sampling": "sample_all",
7943
  "val_iia_sampling": "all"
7944
  },
7945
- "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json",
7946
- "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth",
7947
- "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl"
7948
  },
7949
  {
7950
- "case_id": "35",
7951
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/35",
7952
- "task_description": "Alternates capitalization of each character in words.",
7953
  "vocab": [
7954
- "J",
7955
- "LB",
7956
- "TPSI",
7957
- "V",
7958
- "b",
7959
- "no",
7960
- "oCLrZaW",
7961
- "poiVg"
 
 
 
7962
  ],
7963
  "max_seq_len": 10,
7964
  "min_seq_len": 4,
7965
  "files": [
7966
  {
7967
  "file_name": "edges.pkl",
7968
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/edges.pkl"
7969
  },
7970
  {
7971
  "file_name": "ll_model.pth",
7972
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model.pth"
7973
  },
7974
  {
7975
  "file_name": "ll_model_cfg.pkl",
7976
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl"
7977
  },
7978
  {
7979
  "file_name": "meta.json",
7980
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/meta.json"
7981
  }
7982
  ],
7983
  "transformer_cfg": {
7984
- "n_layers": 2,
7985
- "d_model": 9,
7986
  "n_ctx": 10,
7987
- "d_head": 2,
7988
  "model_name": "custom",
7989
  "n_heads": 4,
7990
- "d_mlp": 36,
7991
  "act_fn": "gelu",
7992
- "d_vocab": 10,
7993
  "eps": 1e-05,
7994
  "use_attn_result": true,
7995
  "use_attn_scale": true,
@@ -8008,18 +8676,18 @@
8008
  "init_mode": "gpt2",
8009
  "normalization_type": null,
8010
  "n_devices": 1,
8011
- "attention_dir": "causal",
8012
  "attn_only": false,
8013
  "seed": 0,
8014
- "initializer_range": 0.1539600717839002,
8015
  "init_weights": true,
8016
  "scale_attn_by_inverse_layer_idx": false,
8017
  "positional_embedding_type": "standard",
8018
  "final_rms": false,
8019
- "d_vocab_out": 8,
8020
  "parallel_attn_mlp": false,
8021
  "rotary_dim": null,
8022
- "n_params": 1872,
8023
  "use_hook_tokens": false,
8024
  "gated_mlp": false,
8025
  "default_prepend_bos": true,
@@ -8029,9 +8697,265 @@
8029
  "post_embedding_ln": false,
8030
  "rotary_base": 10000,
8031
  "trust_remote_code": false,
8032
- "rotary_adjacent_pairs": false
8033
- },
8034
- "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl",
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8035
  "training_args": {
8036
  "atol": 0.05,
8037
  "lr": 0.01,
@@ -8136,58 +9060,289 @@
8136
  "lr": 0.01,
8137
  "use_single_loss": false,
8138
  "iit_weight": 1.0,
8139
- "behavior_weight": 1.0,
8140
- "strict_weight": 10.0,
8141
- "epochs": 2000,
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8142
  "act_fn": "gelu",
 
 
8143
  "clip_grad_norm": 0.1,
8144
- "lr_scheduler": "",
8145
  "model_pair": "strict",
8146
- "same_size": false
 
 
 
 
 
 
 
 
 
 
 
8147
  },
8148
- "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/meta.json",
8149
- "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model.pth",
8150
- "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/edges.pkl"
8151
  },
8152
  {
8153
- "case_id": "36",
8154
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/36",
8155
- "task_description": "Classifies each token as 'positive', 'negative', or 'neutral' based on emojis.",
8156
  "vocab": [
8157
- "\ud83d\udcd8",
8158
- "\ud83d\ude0a",
8159
- "\ud83d\ude22"
 
 
 
 
 
 
 
 
8160
  ],
8161
  "max_seq_len": 10,
8162
  "min_seq_len": 4,
8163
  "files": [
8164
  {
8165
  "file_name": "edges.pkl",
8166
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl"
8167
  },
8168
  {
8169
  "file_name": "ll_model.pth",
8170
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth"
8171
  },
8172
  {
8173
  "file_name": "ll_model_cfg.pkl",
8174
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl"
8175
  },
8176
  {
8177
  "file_name": "meta.json",
8178
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json"
8179
  }
8180
  ],
8181
  "transformer_cfg": {
8182
  "n_layers": 2,
8183
- "d_model": 6,
8184
  "n_ctx": 10,
8185
  "d_head": 1,
8186
  "model_name": "custom",
8187
  "n_heads": 4,
8188
- "d_mlp": 24,
8189
  "act_fn": "gelu",
8190
- "d_vocab": 5,
8191
  "eps": 1e-05,
8192
  "use_attn_result": true,
8193
  "use_attn_scale": true,
@@ -8209,15 +9364,15 @@
8209
  "attention_dir": "causal",
8210
  "attn_only": false,
8211
  "seed": 0,
8212
- "initializer_range": 0.19402850002906638,
8213
  "init_weights": true,
8214
  "scale_attn_by_inverse_layer_idx": false,
8215
  "positional_embedding_type": "standard",
8216
  "final_rms": false,
8217
- "d_vocab_out": 3,
8218
  "parallel_attn_mlp": false,
8219
  "rotary_dim": null,
8220
- "n_params": 768,
8221
  "use_hook_tokens": false,
8222
  "gated_mlp": false,
8223
  "default_prepend_bos": true,
@@ -8227,30 +9382,49 @@
8227
  "post_embedding_ln": false,
8228
  "rotary_base": 10000,
8229
  "trust_remote_code": false,
8230
- "rotary_adjacent_pairs": false
 
 
 
8231
  },
8232
- "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl",
8233
  "training_args": {
 
8234
  "atol": 0.05,
8235
- "lr": 0.01,
8236
- "use_single_loss": false,
8237
  "iit_weight": 1.0,
8238
- "behavior_weight": 1.0,
8239
- "strict_weight": 1.0,
8240
- "epochs": 2000,
 
8241
  "act_fn": "gelu",
 
 
8242
  "clip_grad_norm": 0.1,
8243
- "lr_scheduler": "",
8244
- "model_pair": "strict"
 
 
 
 
 
 
 
 
 
 
 
 
8245
  },
8246
- "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json",
8247
- "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth",
8248
- "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl"
8249
  },
8250
  {
8251
- "case_id": "64",
8252
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/64",
8253
- "task_description": "Cubes each element in the sequence.",
8254
  "vocab": [
8255
  0,
8256
  1,
@@ -8269,19 +9443,19 @@
8269
  "files": [
8270
  {
8271
  "file_name": "edges.pkl",
8272
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl"
8273
  },
8274
  {
8275
  "file_name": "ll_model.pth",
8276
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth"
8277
  },
8278
  {
8279
  "file_name": "ll_model_cfg.pkl",
8280
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl"
8281
  },
8282
  {
8283
  "file_name": "meta.json",
8284
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json"
8285
  }
8286
  ],
8287
  "transformer_cfg": {
@@ -8338,7 +9512,7 @@
8338
  "num_experts": null,
8339
  "experts_per_token": null
8340
  },
8341
- "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl",
8342
  "training_args": {
8343
  "output_dir": "/circuits-benchmark/results",
8344
  "atol": 0.05,
@@ -8368,14 +9542,14 @@
8368
  "siit_sampling": "sample_all",
8369
  "val_iia_sampling": "all"
8370
  },
8371
- "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json",
8372
- "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth",
8373
- "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl"
8374
  },
8375
  {
8376
- "case_id": "8",
8377
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/8",
8378
- "task_description": "Identity",
8379
  "vocab": [
8380
  0,
8381
  1,
@@ -8394,19 +9568,19 @@
8394
  "files": [
8395
  {
8396
  "file_name": "edges.pkl",
8397
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl"
8398
  },
8399
  {
8400
  "file_name": "ll_model.pth",
8401
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth"
8402
  },
8403
  {
8404
  "file_name": "ll_model_cfg.pkl",
8405
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl"
8406
  },
8407
  {
8408
  "file_name": "meta.json",
8409
- "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json"
8410
  }
8411
  ],
8412
  "transformer_cfg": {
@@ -8463,7 +9637,7 @@
8463
  "num_experts": null,
8464
  "experts_per_token": null
8465
  },
8466
- "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl",
8467
  "training_args": {
8468
  "output_dir": "/circuits-benchmark/results",
8469
  "atol": 0.05,
@@ -8481,7 +9655,7 @@
8481
  "lr_scheduler": "linear",
8482
  "model_pair": "strict",
8483
  "same_size": false,
8484
- "seed": 67,
8485
  "batch_size": 256,
8486
  "include_mlp": false,
8487
  "detach_while_caching": true,
@@ -8493,9 +9667,9 @@
8493
  "siit_sampling": "sample_all",
8494
  "val_iia_sampling": "all"
8495
  },
8496
- "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json",
8497
- "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth",
8498
- "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl"
8499
  },
8500
  {
8501
  "case_id": "103",
@@ -8872,6 +10046,131 @@
8872
  "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model.pth",
8873
  "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/edges.pkl"
8874
  },
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
8875
  {
8876
  "case_id": "46",
8877
  "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/46",
 
3352
  "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/ll_model.pth",
3353
  "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/39/edges.pkl"
3354
  },
3355
+ {
3356
+ "case_id": "130",
3357
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/130",
3358
+ "task_description": "Clips each element to be within a range (make the default range [2, 7]).",
3359
+ "vocab": [
3360
+ -15,
3361
+ -14,
3362
+ -13,
3363
+ -12,
3364
+ -11,
3365
+ -10,
3366
+ -9,
3367
+ -8,
3368
+ -7,
3369
+ -6,
3370
+ -5,
3371
+ -4,
3372
+ -3,
3373
+ -2,
3374
+ -1,
3375
+ 0,
3376
+ 1,
3377
+ 2,
3378
+ 3,
3379
+ 4,
3380
+ 5,
3381
+ 6,
3382
+ 7,
3383
+ 8,
3384
+ 9,
3385
+ 10,
3386
+ 11,
3387
+ 12,
3388
+ 13,
3389
+ 14
3390
+ ],
3391
+ "max_seq_len": 10,
3392
+ "min_seq_len": 4,
3393
+ "files": [
3394
+ {
3395
+ "file_name": "edges.pkl",
3396
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/edges.pkl"
3397
+ },
3398
+ {
3399
+ "file_name": "ll_model.pth",
3400
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model.pth"
3401
+ },
3402
+ {
3403
+ "file_name": "ll_model_cfg.pkl",
3404
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model_cfg.pkl"
3405
+ },
3406
+ {
3407
+ "file_name": "meta.json",
3408
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/meta.json"
3409
+ }
3410
+ ],
3411
+ "transformer_cfg": {
3412
+ "n_layers": 3,
3413
+ "d_model": 4,
3414
+ "n_ctx": 10,
3415
+ "d_head": 1,
3416
+ "model_name": "custom",
3417
+ "n_heads": 4,
3418
+ "d_mlp": 16,
3419
+ "act_fn": "gelu",
3420
+ "d_vocab": 32,
3421
+ "eps": 1e-05,
3422
+ "use_attn_result": true,
3423
+ "use_attn_scale": true,
3424
+ "use_split_qkv_input": true,
3425
+ "use_hook_mlp_in": true,
3426
+ "use_attn_in": false,
3427
+ "use_local_attn": false,
3428
+ "original_architecture": null,
3429
+ "from_checkpoint": false,
3430
+ "checkpoint_index": null,
3431
+ "checkpoint_label_type": null,
3432
+ "checkpoint_value": null,
3433
+ "tokenizer_name": null,
3434
+ "window_size": null,
3435
+ "attn_types": null,
3436
+ "init_mode": "gpt2",
3437
+ "normalization_type": null,
3438
+ "n_devices": 1,
3439
+ "attention_dir": "causal",
3440
+ "attn_only": false,
3441
+ "seed": 0,
3442
+ "initializer_range": 0.10079052613579392,
3443
+ "init_weights": true,
3444
+ "scale_attn_by_inverse_layer_idx": false,
3445
+ "positional_embedding_type": "standard",
3446
+ "final_rms": false,
3447
+ "d_vocab_out": 6,
3448
+ "parallel_attn_mlp": false,
3449
+ "rotary_dim": null,
3450
+ "n_params": 576,
3451
+ "use_hook_tokens": false,
3452
+ "gated_mlp": false,
3453
+ "default_prepend_bos": true,
3454
+ "dtype": "torch.float32",
3455
+ "tokenizer_prepends_bos": null,
3456
+ "n_key_value_heads": null,
3457
+ "post_embedding_ln": false,
3458
+ "rotary_base": 10000,
3459
+ "trust_remote_code": false,
3460
+ "rotary_adjacent_pairs": false,
3461
+ "load_in_4bit": false,
3462
+ "num_experts": null,
3463
+ "experts_per_token": null
3464
+ },
3465
+ "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model_cfg.pkl",
3466
+ "training_args": {
3467
+ "output_dir": "/circuits-benchmark/results",
3468
+ "atol": 0.05,
3469
+ "lr": 0.001,
3470
+ "use_single_loss": true,
3471
+ "iit_weight": 1.0,
3472
+ "behavior_weight": 0.4,
3473
+ "strict_weight": 1.0,
3474
+ "epochs": 1000,
3475
+ "early_stop_accuracy_threshold": 99.9,
3476
+ "act_fn": "gelu",
3477
+ "use_wandb": true,
3478
+ "save_model_to_wandb": true,
3479
+ "clip_grad_norm": 0.1,
3480
+ "lr_scheduler": "linear",
3481
+ "model_pair": "strict",
3482
+ "same_size": false,
3483
+ "seed": 67,
3484
+ "batch_size": 256,
3485
+ "include_mlp": false,
3486
+ "detach_while_caching": true,
3487
+ "scheduler_val_metric": [
3488
+ "val/accuracy",
3489
+ "val/IIA",
3490
+ "val/strict_accuracy"
3491
+ ],
3492
+ "siit_sampling": "sample_all",
3493
+ "val_iia_sampling": "all"
3494
+ },
3495
+ "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/meta.json",
3496
+ "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/ll_model.pth",
3497
+ "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/130/edges.pkl"
3498
+ },
3499
  {
3500
  "case_id": "75",
3501
  "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/75",
 
4377
  "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/ll_model.pth",
4378
  "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/84/edges.pkl"
4379
  },
4380
+ {
4381
+ "case_id": "66",
4382
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/66",
4383
+ "task_description": "Round each element in the input sequence to the nearest integer.",
4384
+ "vocab": [
4385
+ 0.0,
4386
+ 0.25,
4387
+ 0.5,
4388
+ 0.75,
4389
+ 1.0,
4390
+ 1.25,
4391
+ 1.5,
4392
+ 1.75,
4393
+ 2.0,
4394
+ 2.25,
4395
+ 2.5,
4396
+ 2.75,
4397
+ 3.0,
4398
+ 3.25,
4399
+ 3.5,
4400
+ 3.75,
4401
+ 4.0,
4402
+ 4.25,
4403
+ 4.5,
4404
+ 4.75
4405
+ ],
4406
+ "max_seq_len": 10,
4407
+ "min_seq_len": 4,
4408
+ "files": [
4409
+ {
4410
+ "file_name": "edges.pkl",
4411
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/edges.pkl"
4412
+ },
4413
+ {
4414
+ "file_name": "ll_model.pth",
4415
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model.pth"
4416
+ },
4417
+ {
4418
+ "file_name": "ll_model_cfg.pkl",
4419
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model_cfg.pkl"
4420
+ },
4421
+ {
4422
+ "file_name": "meta.json",
4423
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/meta.json"
4424
+ }
4425
+ ],
4426
+ "transformer_cfg": {
4427
+ "n_layers": 2,
4428
+ "d_model": 4,
4429
+ "n_ctx": 10,
4430
+ "d_head": 1,
4431
+ "model_name": "custom",
4432
+ "n_heads": 4,
4433
+ "d_mlp": 16,
4434
+ "act_fn": "gelu",
4435
+ "d_vocab": 22,
4436
+ "eps": 1e-05,
4437
+ "use_attn_result": true,
4438
+ "use_attn_scale": true,
4439
+ "use_split_qkv_input": true,
4440
+ "use_hook_mlp_in": true,
4441
+ "use_attn_in": false,
4442
+ "use_local_attn": false,
4443
+ "original_architecture": null,
4444
+ "from_checkpoint": false,
4445
+ "checkpoint_index": null,
4446
+ "checkpoint_label_type": null,
4447
+ "checkpoint_value": null,
4448
+ "tokenizer_name": null,
4449
+ "window_size": null,
4450
+ "attn_types": null,
4451
+ "init_mode": "gpt2",
4452
+ "normalization_type": null,
4453
+ "n_devices": 1,
4454
+ "attention_dir": "causal",
4455
+ "attn_only": false,
4456
+ "seed": 0,
4457
+ "initializer_range": 0.13151918984428584,
4458
+ "init_weights": true,
4459
+ "scale_attn_by_inverse_layer_idx": false,
4460
+ "positional_embedding_type": "standard",
4461
+ "final_rms": false,
4462
+ "d_vocab_out": 6,
4463
+ "parallel_attn_mlp": false,
4464
+ "rotary_dim": null,
4465
+ "n_params": 384,
4466
+ "use_hook_tokens": false,
4467
+ "gated_mlp": false,
4468
+ "default_prepend_bos": true,
4469
+ "dtype": "torch.float32",
4470
+ "tokenizer_prepends_bos": null,
4471
+ "n_key_value_heads": null,
4472
+ "post_embedding_ln": false,
4473
+ "rotary_base": 10000,
4474
+ "trust_remote_code": false,
4475
+ "rotary_adjacent_pairs": false,
4476
+ "load_in_4bit": false,
4477
+ "num_experts": null,
4478
+ "experts_per_token": null
4479
+ },
4480
+ "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model_cfg.pkl",
4481
+ "training_args": {
4482
+ "output_dir": "/circuits-benchmark/results",
4483
+ "atol": 0.05,
4484
+ "lr": 0.001,
4485
+ "use_single_loss": true,
4486
+ "iit_weight": 1.0,
4487
+ "behavior_weight": 0.4,
4488
+ "strict_weight": 0.7,
4489
+ "epochs": 1000,
4490
+ "early_stop_accuracy_threshold": 99.9,
4491
+ "act_fn": "gelu",
4492
+ "use_wandb": true,
4493
+ "save_model_to_wandb": true,
4494
+ "clip_grad_norm": 0.1,
4495
+ "lr_scheduler": "linear",
4496
+ "model_pair": "strict",
4497
+ "same_size": false,
4498
+ "seed": 92,
4499
+ "batch_size": 256,
4500
+ "include_mlp": false,
4501
+ "detach_while_caching": true,
4502
+ "scheduler_val_metric": [
4503
+ "val/accuracy",
4504
+ "val/IIA",
4505
+ "val/strict_accuracy"
4506
+ ],
4507
+ "siit_sampling": "sample_all",
4508
+ "val_iia_sampling": "all"
4509
+ },
4510
+ "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/meta.json",
4511
+ "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/ll_model.pth",
4512
+ "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/66/edges.pkl"
4513
+ },
4514
  {
4515
  "case_id": "93",
4516
  "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/93",
 
4941
  "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/26/edges.pkl"
4942
  },
4943
  {
4944
+ "case_id": "15",
4945
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/15",
4946
+ "task_description": "Returns each token multiplied by two and subtracted by its index.",
4947
  "vocab": [
4948
+ 0,
4949
+ 1,
4950
+ 2,
4951
+ 3,
4952
+ 4
4953
  ],
4954
+ "max_seq_len": 5,
4955
  "min_seq_len": 4,
4956
  "files": [
4957
  {
4958
  "file_name": "edges.pkl",
4959
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/edges.pkl"
4960
  },
4961
  {
4962
  "file_name": "ll_model.pth",
4963
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model.pth"
4964
  },
4965
  {
4966
  "file_name": "ll_model_cfg.pkl",
4967
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model_cfg.pkl"
4968
  },
4969
  {
4970
  "file_name": "meta.json",
4971
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/meta.json"
4972
  }
4973
  ],
4974
  "transformer_cfg": {
4975
+ "n_layers": 3,
4976
+ "d_model": 4,
4977
+ "n_ctx": 5,
4978
+ "d_head": 1,
4979
+ "model_name": "custom",
4980
+ "n_heads": 4,
4981
+ "d_mlp": 16,
4982
+ "act_fn": "gelu",
4983
+ "d_vocab": 7,
4984
+ "eps": 1e-05,
4985
+ "use_attn_result": true,
4986
+ "use_attn_scale": true,
4987
+ "use_split_qkv_input": true,
4988
+ "use_hook_mlp_in": true,
4989
+ "use_attn_in": false,
4990
+ "use_local_attn": false,
4991
+ "original_architecture": null,
4992
+ "from_checkpoint": false,
4993
+ "checkpoint_index": null,
4994
+ "checkpoint_label_type": null,
4995
+ "checkpoint_value": null,
4996
+ "tokenizer_name": null,
4997
+ "window_size": null,
4998
+ "attn_types": null,
4999
+ "init_mode": "gpt2",
5000
+ "normalization_type": null,
5001
+ "n_devices": 1,
5002
+ "attention_dir": "causal",
5003
+ "attn_only": false,
5004
+ "seed": 0,
5005
+ "initializer_range": 0.06553855364152325,
5006
+ "init_weights": true,
5007
+ "scale_attn_by_inverse_layer_idx": false,
5008
+ "positional_embedding_type": "standard",
5009
+ "final_rms": false,
5010
+ "d_vocab_out": 12,
5011
+ "parallel_attn_mlp": false,
5012
+ "rotary_dim": null,
5013
+ "n_params": 576,
5014
+ "use_hook_tokens": false,
5015
+ "gated_mlp": false,
5016
+ "default_prepend_bos": true,
5017
+ "dtype": "torch.float32",
5018
+ "tokenizer_prepends_bos": null,
5019
+ "n_key_value_heads": null,
5020
+ "post_embedding_ln": false,
5021
+ "rotary_base": 10000,
5022
+ "trust_remote_code": false,
5023
+ "rotary_adjacent_pairs": false,
5024
+ "load_in_4bit": false,
5025
+ "num_experts": null,
5026
+ "experts_per_token": null
5027
+ },
5028
+ "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model_cfg.pkl",
5029
+ "training_args": {
5030
+ "output_dir": "/circuits-benchmark/results",
5031
+ "atol": 0.05,
5032
+ "lr": 0.001,
5033
+ "use_single_loss": true,
5034
+ "iit_weight": 1.0,
5035
+ "behavior_weight": 0.4,
5036
+ "strict_weight": 1.0,
5037
+ "epochs": 1000,
5038
+ "early_stop_accuracy_threshold": 99.9,
5039
+ "act_fn": "gelu",
5040
+ "use_wandb": true,
5041
+ "save_model_to_wandb": true,
5042
+ "clip_grad_norm": 0.1,
5043
+ "lr_scheduler": "linear",
5044
+ "model_pair": "strict",
5045
+ "same_size": false,
5046
+ "seed": 67,
5047
+ "batch_size": 256,
5048
+ "include_mlp": false,
5049
+ "detach_while_caching": true,
5050
+ "scheduler_val_metric": [
5051
+ "val/accuracy",
5052
+ "val/IIA",
5053
+ "val/strict_accuracy"
5054
+ ],
5055
+ "siit_sampling": "sample_all",
5056
+ "val_iia_sampling": "all"
5057
+ },
5058
+ "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/meta.json",
5059
+ "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/ll_model.pth",
5060
+ "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/15/edges.pkl"
5061
+ },
5062
+ {
5063
+ "case_id": "19",
5064
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/19",
5065
+ "task_description": "Removes consecutive duplicate tokens from a sequence.",
5066
+ "vocab": [
5067
+ "a",
5068
+ "b",
5069
+ "c"
5070
+ ],
5071
+ "max_seq_len": 15,
5072
+ "min_seq_len": 4,
5073
+ "files": [
5074
+ {
5075
+ "file_name": "edges.pkl",
5076
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/edges.pkl"
5077
+ },
5078
+ {
5079
+ "file_name": "ll_model.pth",
5080
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model.pth"
5081
+ },
5082
+ {
5083
+ "file_name": "ll_model_cfg.pkl",
5084
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/ll_model_cfg.pkl"
5085
+ },
5086
+ {
5087
+ "file_name": "meta.json",
5088
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/19/meta.json"
5089
+ }
5090
+ ],
5091
+ "transformer_cfg": {
5092
+ "n_layers": 2,
5093
+ "d_model": 32,
5094
+ "n_ctx": 15,
5095
+ "d_head": 8,
5096
+ "model_name": "custom",
5097
  "n_heads": 4,
5098
  "d_mlp": 128,
5099
  "act_fn": "gelu",
 
5638
  "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/ll_model.pth",
5639
  "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/51/edges.pkl"
5640
  },
5641
+ {
5642
+ "case_id": "43",
5643
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/43",
5644
+ "task_description": "Returns the corresponding Fibonacci number for each element in the input sequence.",
5645
+ "vocab": [
5646
+ 0,
5647
+ 1,
5648
+ 2,
5649
+ 3,
5650
+ 4,
5651
+ 5,
5652
+ 6,
5653
+ 7,
5654
+ 8,
5655
+ 9,
5656
+ 10,
5657
+ 11,
5658
+ 12,
5659
+ 13,
5660
+ 14,
5661
+ 15,
5662
+ 16,
5663
+ 17,
5664
+ 18,
5665
+ 19
5666
+ ],
5667
+ "max_seq_len": 10,
5668
+ "min_seq_len": 4,
5669
+ "files": [
5670
+ {
5671
+ "file_name": "edges.pkl",
5672
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/edges.pkl"
5673
+ },
5674
+ {
5675
+ "file_name": "ll_model.pth",
5676
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model.pth"
5677
+ },
5678
+ {
5679
+ "file_name": "ll_model_cfg.pkl",
5680
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model_cfg.pkl"
5681
+ },
5682
+ {
5683
+ "file_name": "meta.json",
5684
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/meta.json"
5685
+ }
5686
+ ],
5687
+ "transformer_cfg": {
5688
+ "n_layers": 2,
5689
+ "d_model": 4,
5690
+ "n_ctx": 10,
5691
+ "d_head": 1,
5692
+ "model_name": "custom",
5693
+ "n_heads": 4,
5694
+ "d_mlp": 16,
5695
+ "act_fn": "gelu",
5696
+ "d_vocab": 22,
5697
+ "eps": 1e-05,
5698
+ "use_attn_result": true,
5699
+ "use_attn_scale": true,
5700
+ "use_split_qkv_input": true,
5701
+ "use_hook_mlp_in": true,
5702
+ "use_attn_in": false,
5703
+ "use_local_attn": false,
5704
+ "original_architecture": null,
5705
+ "from_checkpoint": false,
5706
+ "checkpoint_index": null,
5707
+ "checkpoint_label_type": null,
5708
+ "checkpoint_value": null,
5709
+ "tokenizer_name": null,
5710
+ "window_size": null,
5711
+ "attn_types": null,
5712
+ "init_mode": "gpt2",
5713
+ "normalization_type": null,
5714
+ "n_devices": 1,
5715
+ "attention_dir": "causal",
5716
+ "attn_only": false,
5717
+ "seed": 0,
5718
+ "initializer_range": 0.1131370849898476,
5719
+ "init_weights": true,
5720
+ "scale_attn_by_inverse_layer_idx": false,
5721
+ "positional_embedding_type": "standard",
5722
+ "final_rms": false,
5723
+ "d_vocab_out": 19,
5724
+ "parallel_attn_mlp": false,
5725
+ "rotary_dim": null,
5726
+ "n_params": 384,
5727
+ "use_hook_tokens": false,
5728
+ "gated_mlp": false,
5729
+ "default_prepend_bos": true,
5730
+ "dtype": "torch.float32",
5731
+ "tokenizer_prepends_bos": null,
5732
+ "n_key_value_heads": null,
5733
+ "post_embedding_ln": false,
5734
+ "rotary_base": 10000,
5735
+ "trust_remote_code": false,
5736
+ "rotary_adjacent_pairs": false,
5737
+ "load_in_4bit": false,
5738
+ "num_experts": null,
5739
+ "experts_per_token": null
5740
+ },
5741
+ "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model_cfg.pkl",
5742
+ "training_args": {
5743
+ "output_dir": "/circuits-benchmark/results",
5744
+ "atol": 0.05,
5745
+ "lr": 0.001,
5746
+ "use_single_loss": true,
5747
+ "iit_weight": 1.0,
5748
+ "behavior_weight": 0.4,
5749
+ "strict_weight": 1.0,
5750
+ "epochs": 1000,
5751
+ "early_stop_accuracy_threshold": 99.9,
5752
+ "act_fn": "gelu",
5753
+ "use_wandb": true,
5754
+ "save_model_to_wandb": true,
5755
+ "clip_grad_norm": 0.1,
5756
+ "lr_scheduler": "linear",
5757
+ "model_pair": "strict",
5758
+ "same_size": false,
5759
+ "seed": 67,
5760
+ "batch_size": 256,
5761
+ "include_mlp": false,
5762
+ "detach_while_caching": true,
5763
+ "scheduler_val_metric": [
5764
+ "val/accuracy",
5765
+ "val/IIA",
5766
+ "val/strict_accuracy"
5767
+ ],
5768
+ "siit_sampling": "sample_all",
5769
+ "val_iia_sampling": "all"
5770
+ },
5771
+ "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/meta.json",
5772
+ "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/ll_model.pth",
5773
+ "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/43/edges.pkl"
5774
+ },
5775
  {
5776
  "case_id": "122",
5777
  "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/122",
 
6902
  "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/11/edges.pkl"
6903
  },
6904
  {
6905
+ "case_id": "41",
6906
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/41",
6907
+ "task_description": "Make each element of the input sequence absolute",
6908
  "vocab": [
6909
+ -10,
6910
+ -9,
6911
+ -8,
6912
+ -7,
6913
+ -6,
6914
+ -5,
6915
+ -4,
6916
+ -3,
6917
+ -2,
6918
+ -1,
6919
  0,
6920
  1,
6921
  2,
 
6925
  6,
6926
  7,
6927
  8,
6928
+ 9
 
6929
  ],
6930
  "max_seq_len": 10,
6931
  "min_seq_len": 4,
6932
  "files": [
6933
  {
6934
  "file_name": "edges.pkl",
6935
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/edges.pkl"
6936
  },
6937
  {
6938
  "file_name": "ll_model.pth",
6939
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model.pth"
6940
+ },
6941
+ {
6942
+ "file_name": "ll_model_cfg.pkl",
6943
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model_cfg.pkl"
6944
+ },
6945
+ {
6946
+ "file_name": "meta.json",
6947
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/meta.json"
6948
+ }
6949
+ ],
6950
+ "transformer_cfg": {
6951
+ "n_layers": 2,
6952
+ "d_model": 4,
6953
+ "n_ctx": 10,
6954
+ "d_head": 1,
6955
+ "model_name": "custom",
6956
+ "n_heads": 4,
6957
+ "d_mlp": 16,
6958
+ "act_fn": "gelu",
6959
+ "d_vocab": 22,
6960
+ "eps": 1e-05,
6961
+ "use_attn_result": true,
6962
+ "use_attn_scale": true,
6963
+ "use_split_qkv_input": true,
6964
+ "use_hook_mlp_in": true,
6965
+ "use_attn_in": false,
6966
+ "use_local_attn": false,
6967
+ "original_architecture": null,
6968
+ "from_checkpoint": false,
6969
+ "checkpoint_index": null,
6970
+ "checkpoint_label_type": null,
6971
+ "checkpoint_value": null,
6972
+ "tokenizer_name": null,
6973
+ "window_size": null,
6974
+ "attn_types": null,
6975
+ "init_mode": "gpt2",
6976
+ "normalization_type": null,
6977
+ "n_devices": 1,
6978
+ "attention_dir": "causal",
6979
+ "attn_only": false,
6980
+ "seed": 0,
6981
+ "initializer_range": 0.12344267996967354,
6982
+ "init_weights": true,
6983
+ "scale_attn_by_inverse_layer_idx": false,
6984
+ "positional_embedding_type": "standard",
6985
+ "final_rms": false,
6986
+ "d_vocab_out": 11,
6987
+ "parallel_attn_mlp": false,
6988
+ "rotary_dim": null,
6989
+ "n_params": 384,
6990
+ "use_hook_tokens": false,
6991
+ "gated_mlp": false,
6992
+ "default_prepend_bos": true,
6993
+ "dtype": "torch.float32",
6994
+ "tokenizer_prepends_bos": null,
6995
+ "n_key_value_heads": null,
6996
+ "post_embedding_ln": false,
6997
+ "rotary_base": 10000,
6998
+ "trust_remote_code": false,
6999
+ "rotary_adjacent_pairs": false,
7000
+ "load_in_4bit": false,
7001
+ "num_experts": null,
7002
+ "experts_per_token": null
7003
+ },
7004
+ "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model_cfg.pkl",
7005
+ "training_args": {
7006
+ "output_dir": "/circuits-benchmark/results",
7007
+ "atol": 0.05,
7008
+ "lr": 0.001,
7009
+ "use_single_loss": true,
7010
+ "iit_weight": 1.0,
7011
+ "behavior_weight": 0.4,
7012
+ "strict_weight": 1.0,
7013
+ "epochs": 1000,
7014
+ "early_stop_accuracy_threshold": 99.9,
7015
+ "act_fn": "gelu",
7016
+ "use_wandb": true,
7017
+ "save_model_to_wandb": true,
7018
+ "clip_grad_norm": 0.1,
7019
+ "lr_scheduler": "linear",
7020
+ "model_pair": "strict",
7021
+ "same_size": false,
7022
+ "seed": 67,
7023
+ "batch_size": 256,
7024
+ "include_mlp": false,
7025
+ "detach_while_caching": true,
7026
+ "scheduler_val_metric": [
7027
+ "val/accuracy",
7028
+ "val/IIA",
7029
+ "val/strict_accuracy"
7030
+ ],
7031
+ "siit_sampling": "sample_all",
7032
+ "val_iia_sampling": "all"
7033
+ },
7034
+ "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/meta.json",
7035
+ "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/ll_model.pth",
7036
+ "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/41/edges.pkl"
7037
+ },
7038
+ {
7039
+ "case_id": "54",
7040
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/54",
7041
+ "task_description": "Applies the hyperbolic tangent to each element.",
7042
+ "vocab": [
7043
+ 0,
7044
+ 1,
7045
+ 2,
7046
+ 3,
7047
+ 4,
7048
+ 5,
7049
+ 6,
7050
+ 7,
7051
+ 8,
7052
+ 9,
7053
+ 10
7054
+ ],
7055
+ "max_seq_len": 10,
7056
+ "min_seq_len": 4,
7057
+ "files": [
7058
+ {
7059
+ "file_name": "edges.pkl",
7060
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/edges.pkl"
7061
+ },
7062
+ {
7063
+ "file_name": "ll_model.pth",
7064
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/54/ll_model.pth"
7065
  },
7066
  {
7067
  "file_name": "ll_model_cfg.pkl",
 
8237
  "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/58/edges.pkl"
8238
  },
8239
  {
8240
+ "case_id": "68",
8241
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/68",
8242
+ "task_description": "Increment each element until it becomes a multiple of 3",
8243
  "vocab": [
8244
  0,
8245
  1,
 
8258
  "files": [
8259
  {
8260
  "file_name": "edges.pkl",
8261
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/edges.pkl"
8262
  },
8263
  {
8264
  "file_name": "ll_model.pth",
8265
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model.pth"
8266
  },
8267
  {
8268
  "file_name": "ll_model_cfg.pkl",
8269
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model_cfg.pkl"
8270
  },
8271
  {
8272
  "file_name": "meta.json",
8273
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/meta.json"
8274
  }
8275
  ],
8276
  "transformer_cfg": {
 
8304
  "attention_dir": "causal",
8305
  "attn_only": false,
8306
  "seed": 0,
8307
+ "initializer_range": 0.1539600717839002,
8308
  "init_weights": true,
8309
  "scale_attn_by_inverse_layer_idx": false,
8310
  "positional_embedding_type": "standard",
8311
  "final_rms": false,
8312
+ "d_vocab_out": 5,
8313
  "parallel_attn_mlp": false,
8314
  "rotary_dim": null,
8315
  "n_params": 384,
 
8327
  "num_experts": null,
8328
  "experts_per_token": null
8329
  },
8330
+ "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model_cfg.pkl",
8331
  "training_args": {
8332
  "output_dir": "/circuits-benchmark/results",
8333
  "atol": 0.05,
 
8335
  "use_single_loss": true,
8336
  "iit_weight": 1.0,
8337
  "behavior_weight": 0.4,
8338
+ "strict_weight": 1.0,
8339
  "epochs": 1000,
8340
  "early_stop_accuracy_threshold": 99.9,
8341
  "act_fn": "gelu",
 
8357
  "siit_sampling": "sample_all",
8358
  "val_iia_sampling": "all"
8359
  },
8360
+ "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/meta.json",
8361
+ "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/ll_model.pth",
8362
+ "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/68/edges.pkl"
8363
  },
8364
  {
8365
+ "case_id": "70",
8366
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/70",
8367
+ "task_description": "Apply the cosine function to each element of the input sequence.",
8368
  "vocab": [
8369
  0,
8370
  1,
 
8383
  "files": [
8384
  {
8385
  "file_name": "edges.pkl",
8386
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl"
8387
  },
8388
  {
8389
  "file_name": "ll_model.pth",
8390
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth"
8391
  },
8392
  {
8393
  "file_name": "ll_model_cfg.pkl",
8394
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl"
8395
  },
8396
  {
8397
  "file_name": "meta.json",
8398
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json"
8399
  }
8400
  ],
8401
  "transformer_cfg": {
 
8429
  "attention_dir": "causal",
8430
  "attn_only": false,
8431
  "seed": 0,
8432
+ "initializer_range": 0.1392621247645583,
8433
  "init_weights": true,
8434
  "scale_attn_by_inverse_layer_idx": false,
8435
  "positional_embedding_type": "standard",
8436
  "final_rms": false,
8437
+ "d_vocab_out": 11,
8438
  "parallel_attn_mlp": false,
8439
  "rotary_dim": null,
8440
  "n_params": 384,
 
8452
  "num_experts": null,
8453
  "experts_per_token": null
8454
  },
8455
+ "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model_cfg.pkl",
8456
  "training_args": {
8457
  "output_dir": "/circuits-benchmark/results",
8458
  "atol": 0.05,
 
8482
  "siit_sampling": "sample_all",
8483
  "val_iia_sampling": "all"
8484
  },
8485
+ "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/meta.json",
8486
+ "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/ll_model.pth",
8487
+ "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/70/edges.pkl"
8488
  },
8489
  {
8490
+ "case_id": "62",
8491
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/62",
8492
+ "task_description": "Replaces each element with its factorial.",
8493
  "vocab": [
8494
  0,
8495
  1,
 
8508
  "files": [
8509
  {
8510
  "file_name": "edges.pkl",
8511
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl"
8512
  },
8513
  {
8514
  "file_name": "ll_model.pth",
8515
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth"
8516
  },
8517
  {
8518
  "file_name": "ll_model_cfg.pkl",
8519
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl"
8520
  },
8521
  {
8522
  "file_name": "meta.json",
8523
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json"
8524
  }
8525
  ],
8526
  "transformer_cfg": {
8527
+ "n_layers": 2,
8528
+ "d_model": 4,
8529
  "n_ctx": 10,
8530
+ "d_head": 1,
8531
  "model_name": "custom",
8532
  "n_heads": 4,
8533
+ "d_mlp": 16,
8534
  "act_fn": "gelu",
8535
  "d_vocab": 13,
8536
  "eps": 1e-05,
 
8551
  "init_mode": "gpt2",
8552
  "normalization_type": null,
8553
  "n_devices": 1,
8554
+ "attention_dir": "causal",
8555
  "attn_only": false,
8556
  "seed": 0,
8557
+ "initializer_range": 0.1414213562373095,
8558
  "init_weights": true,
8559
  "scale_attn_by_inverse_layer_idx": false,
8560
  "positional_embedding_type": "standard",
8561
  "final_rms": false,
8562
+ "d_vocab_out": 10,
8563
  "parallel_attn_mlp": false,
8564
  "rotary_dim": null,
8565
+ "n_params": 384,
8566
  "use_hook_tokens": false,
8567
  "gated_mlp": false,
8568
  "default_prepend_bos": true,
 
8577
  "num_experts": null,
8578
  "experts_per_token": null
8579
  },
8580
+ "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model_cfg.pkl",
8581
  "training_args": {
8582
  "output_dir": "/circuits-benchmark/results",
8583
  "atol": 0.05,
 
8585
  "use_single_loss": true,
8586
  "iit_weight": 1.0,
8587
  "behavior_weight": 0.4,
8588
+ "strict_weight": 0.7,
8589
  "epochs": 1000,
8590
  "early_stop_accuracy_threshold": 99.9,
8591
  "act_fn": "gelu",
 
8607
  "siit_sampling": "sample_all",
8608
  "val_iia_sampling": "all"
8609
  },
8610
+ "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/meta.json",
8611
+ "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/ll_model.pth",
8612
+ "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/62/edges.pkl"
8613
  },
8614
  {
8615
+ "case_id": "111",
8616
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/111",
8617
+ "task_description": "Returns the last element of the sequence and pads the rest with zeros.",
8618
  "vocab": [
8619
+ 0,
8620
+ 1,
8621
+ 2,
8622
+ 3,
8623
+ 4,
8624
+ 5,
8625
+ 6,
8626
+ 7,
8627
+ 8,
8628
+ 9,
8629
+ 10
8630
  ],
8631
  "max_seq_len": 10,
8632
  "min_seq_len": 4,
8633
  "files": [
8634
  {
8635
  "file_name": "edges.pkl",
8636
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl"
8637
  },
8638
  {
8639
  "file_name": "ll_model.pth",
8640
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth"
8641
  },
8642
  {
8643
  "file_name": "ll_model_cfg.pkl",
8644
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl"
8645
  },
8646
  {
8647
  "file_name": "meta.json",
8648
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json"
8649
  }
8650
  ],
8651
  "transformer_cfg": {
8652
+ "n_layers": 3,
8653
+ "d_model": 24,
8654
  "n_ctx": 10,
8655
+ "d_head": 6,
8656
  "model_name": "custom",
8657
  "n_heads": 4,
8658
+ "d_mlp": 96,
8659
  "act_fn": "gelu",
8660
+ "d_vocab": 13,
8661
  "eps": 1e-05,
8662
  "use_attn_result": true,
8663
  "use_attn_scale": true,
 
8676
  "init_mode": "gpt2",
8677
  "normalization_type": null,
8678
  "n_devices": 1,
8679
+ "attention_dir": "bidirectional",
8680
  "attn_only": false,
8681
  "seed": 0,
8682
+ "initializer_range": 0.09847319278346618,
8683
  "init_weights": true,
8684
  "scale_attn_by_inverse_layer_idx": false,
8685
  "positional_embedding_type": "standard",
8686
  "final_rms": false,
8687
+ "d_vocab_out": 11,
8688
  "parallel_attn_mlp": false,
8689
  "rotary_dim": null,
8690
+ "n_params": 20736,
8691
  "use_hook_tokens": false,
8692
  "gated_mlp": false,
8693
  "default_prepend_bos": true,
 
8697
  "post_embedding_ln": false,
8698
  "rotary_base": 10000,
8699
  "trust_remote_code": false,
8700
+ "rotary_adjacent_pairs": false,
8701
+ "load_in_4bit": false,
8702
+ "num_experts": null,
8703
+ "experts_per_token": null
8704
+ },
8705
+ "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model_cfg.pkl",
8706
+ "training_args": {
8707
+ "output_dir": "/circuits-benchmark/results",
8708
+ "atol": 0.05,
8709
+ "lr": 0.001,
8710
+ "use_single_loss": true,
8711
+ "iit_weight": 1.0,
8712
+ "behavior_weight": 0.4,
8713
+ "strict_weight": 0.4,
8714
+ "epochs": 1000,
8715
+ "early_stop_accuracy_threshold": 99.9,
8716
+ "act_fn": "gelu",
8717
+ "use_wandb": true,
8718
+ "save_model_to_wandb": true,
8719
+ "clip_grad_norm": 0.1,
8720
+ "lr_scheduler": "linear",
8721
+ "model_pair": "strict",
8722
+ "same_size": false,
8723
+ "seed": 67,
8724
+ "batch_size": 256,
8725
+ "include_mlp": false,
8726
+ "detach_while_caching": true,
8727
+ "scheduler_val_metric": [
8728
+ "val/accuracy",
8729
+ "val/IIA",
8730
+ "val/strict_accuracy"
8731
+ ],
8732
+ "siit_sampling": "sample_all",
8733
+ "val_iia_sampling": "all"
8734
+ },
8735
+ "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/meta.json",
8736
+ "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/ll_model.pth",
8737
+ "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/111/edges.pkl"
8738
+ },
8739
+ {
8740
+ "case_id": "121",
8741
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/121",
8742
+ "task_description": "Compute arcsine of all elements in the input sequence.",
8743
+ "vocab": [
8744
+ -1.0,
8745
+ -0.9,
8746
+ -0.8,
8747
+ -0.7,
8748
+ -0.6,
8749
+ -0.5,
8750
+ -0.4,
8751
+ -0.30000000000000004,
8752
+ -0.19999999999999996,
8753
+ -0.09999999999999998,
8754
+ 0.0,
8755
+ 0.10000000000000009,
8756
+ 0.19999999999999996,
8757
+ 0.30000000000000004,
8758
+ 0.3999999999999999,
8759
+ 0.5,
8760
+ 0.6000000000000001,
8761
+ 0.7,
8762
+ 0.8,
8763
+ 0.8999999999999999
8764
+ ],
8765
+ "max_seq_len": 10,
8766
+ "min_seq_len": 4,
8767
+ "files": [
8768
+ {
8769
+ "file_name": "edges.pkl",
8770
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/edges.pkl"
8771
+ },
8772
+ {
8773
+ "file_name": "ll_model.pth",
8774
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model.pth"
8775
+ },
8776
+ {
8777
+ "file_name": "ll_model_cfg.pkl",
8778
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model_cfg.pkl"
8779
+ },
8780
+ {
8781
+ "file_name": "meta.json",
8782
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/meta.json"
8783
+ }
8784
+ ],
8785
+ "transformer_cfg": {
8786
+ "n_layers": 2,
8787
+ "d_model": 4,
8788
+ "n_ctx": 10,
8789
+ "d_head": 1,
8790
+ "model_name": "custom",
8791
+ "n_heads": 4,
8792
+ "d_mlp": 16,
8793
+ "act_fn": "gelu",
8794
+ "d_vocab": 22,
8795
+ "eps": 1e-05,
8796
+ "use_attn_result": true,
8797
+ "use_attn_scale": true,
8798
+ "use_split_qkv_input": true,
8799
+ "use_hook_mlp_in": true,
8800
+ "use_attn_in": false,
8801
+ "use_local_attn": false,
8802
+ "original_architecture": null,
8803
+ "from_checkpoint": false,
8804
+ "checkpoint_index": null,
8805
+ "checkpoint_label_type": null,
8806
+ "checkpoint_value": null,
8807
+ "tokenizer_name": null,
8808
+ "window_size": null,
8809
+ "attn_types": null,
8810
+ "init_mode": "gpt2",
8811
+ "normalization_type": null,
8812
+ "n_devices": 1,
8813
+ "attention_dir": "causal",
8814
+ "attn_only": false,
8815
+ "seed": 0,
8816
+ "initializer_range": 0.11202240672224079,
8817
+ "init_weights": true,
8818
+ "scale_attn_by_inverse_layer_idx": false,
8819
+ "positional_embedding_type": "standard",
8820
+ "final_rms": false,
8821
+ "d_vocab_out": 20,
8822
+ "parallel_attn_mlp": false,
8823
+ "rotary_dim": null,
8824
+ "n_params": 384,
8825
+ "use_hook_tokens": false,
8826
+ "gated_mlp": false,
8827
+ "default_prepend_bos": true,
8828
+ "dtype": "torch.float32",
8829
+ "tokenizer_prepends_bos": null,
8830
+ "n_key_value_heads": null,
8831
+ "post_embedding_ln": false,
8832
+ "rotary_base": 10000,
8833
+ "trust_remote_code": false,
8834
+ "rotary_adjacent_pairs": false,
8835
+ "load_in_4bit": false,
8836
+ "num_experts": null,
8837
+ "experts_per_token": null
8838
+ },
8839
+ "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model_cfg.pkl",
8840
+ "training_args": {
8841
+ "output_dir": "/circuits-benchmark/results",
8842
+ "atol": 0.05,
8843
+ "lr": 0.001,
8844
+ "use_single_loss": true,
8845
+ "iit_weight": 1.0,
8846
+ "behavior_weight": 0.4,
8847
+ "strict_weight": 1.0,
8848
+ "epochs": 1000,
8849
+ "early_stop_accuracy_threshold": 99.9,
8850
+ "act_fn": "gelu",
8851
+ "use_wandb": true,
8852
+ "save_model_to_wandb": true,
8853
+ "clip_grad_norm": 0.1,
8854
+ "lr_scheduler": "linear",
8855
+ "model_pair": "strict",
8856
+ "same_size": false,
8857
+ "seed": 67,
8858
+ "batch_size": 256,
8859
+ "include_mlp": false,
8860
+ "detach_while_caching": true,
8861
+ "scheduler_val_metric": [
8862
+ "val/accuracy",
8863
+ "val/IIA",
8864
+ "val/strict_accuracy"
8865
+ ],
8866
+ "siit_sampling": "sample_all",
8867
+ "val_iia_sampling": "all"
8868
+ },
8869
+ "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/meta.json",
8870
+ "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/ll_model.pth",
8871
+ "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/121/edges.pkl"
8872
+ },
8873
+ {
8874
+ "case_id": "35",
8875
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/35",
8876
+ "task_description": "Alternates capitalization of each character in words.",
8877
+ "vocab": [
8878
+ "J",
8879
+ "LB",
8880
+ "TPSI",
8881
+ "V",
8882
+ "b",
8883
+ "no",
8884
+ "oCLrZaW",
8885
+ "poiVg"
8886
+ ],
8887
+ "max_seq_len": 10,
8888
+ "min_seq_len": 4,
8889
+ "files": [
8890
+ {
8891
+ "file_name": "edges.pkl",
8892
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/edges.pkl"
8893
+ },
8894
+ {
8895
+ "file_name": "ll_model.pth",
8896
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model.pth"
8897
+ },
8898
+ {
8899
+ "file_name": "ll_model_cfg.pkl",
8900
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl"
8901
+ },
8902
+ {
8903
+ "file_name": "meta.json",
8904
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/meta.json"
8905
+ }
8906
+ ],
8907
+ "transformer_cfg": {
8908
+ "n_layers": 2,
8909
+ "d_model": 9,
8910
+ "n_ctx": 10,
8911
+ "d_head": 2,
8912
+ "model_name": "custom",
8913
+ "n_heads": 4,
8914
+ "d_mlp": 36,
8915
+ "act_fn": "gelu",
8916
+ "d_vocab": 10,
8917
+ "eps": 1e-05,
8918
+ "use_attn_result": true,
8919
+ "use_attn_scale": true,
8920
+ "use_split_qkv_input": true,
8921
+ "use_hook_mlp_in": true,
8922
+ "use_attn_in": false,
8923
+ "use_local_attn": false,
8924
+ "original_architecture": null,
8925
+ "from_checkpoint": false,
8926
+ "checkpoint_index": null,
8927
+ "checkpoint_label_type": null,
8928
+ "checkpoint_value": null,
8929
+ "tokenizer_name": null,
8930
+ "window_size": null,
8931
+ "attn_types": null,
8932
+ "init_mode": "gpt2",
8933
+ "normalization_type": null,
8934
+ "n_devices": 1,
8935
+ "attention_dir": "causal",
8936
+ "attn_only": false,
8937
+ "seed": 0,
8938
+ "initializer_range": 0.1539600717839002,
8939
+ "init_weights": true,
8940
+ "scale_attn_by_inverse_layer_idx": false,
8941
+ "positional_embedding_type": "standard",
8942
+ "final_rms": false,
8943
+ "d_vocab_out": 8,
8944
+ "parallel_attn_mlp": false,
8945
+ "rotary_dim": null,
8946
+ "n_params": 1872,
8947
+ "use_hook_tokens": false,
8948
+ "gated_mlp": false,
8949
+ "default_prepend_bos": true,
8950
+ "dtype": "torch.float32",
8951
+ "tokenizer_prepends_bos": null,
8952
+ "n_key_value_heads": null,
8953
+ "post_embedding_ln": false,
8954
+ "rotary_base": 10000,
8955
+ "trust_remote_code": false,
8956
+ "rotary_adjacent_pairs": false
8957
+ },
8958
+ "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/35/ll_model_cfg.pkl",
8959
  "training_args": {
8960
  "atol": 0.05,
8961
  "lr": 0.01,
 
9060
  "lr": 0.01,
9061
  "use_single_loss": false,
9062
  "iit_weight": 1.0,
9063
+ "behavior_weight": 1.0,
9064
+ "strict_weight": 10.0,
9065
+ "epochs": 2000,
9066
+ "act_fn": "gelu",
9067
+ "clip_grad_norm": 0.1,
9068
+ "lr_scheduler": "",
9069
+ "model_pair": "strict",
9070
+ "same_size": false
9071
+ },
9072
+ "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/meta.json",
9073
+ "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/ll_model.pth",
9074
+ "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/3/edges.pkl"
9075
+ },
9076
+ {
9077
+ "case_id": "36",
9078
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/36",
9079
+ "task_description": "Classifies each token as 'positive', 'negative', or 'neutral' based on emojis.",
9080
+ "vocab": [
9081
+ "\ud83d\udcd8",
9082
+ "\ud83d\ude0a",
9083
+ "\ud83d\ude22"
9084
+ ],
9085
+ "max_seq_len": 10,
9086
+ "min_seq_len": 4,
9087
+ "files": [
9088
+ {
9089
+ "file_name": "edges.pkl",
9090
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl"
9091
+ },
9092
+ {
9093
+ "file_name": "ll_model.pth",
9094
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth"
9095
+ },
9096
+ {
9097
+ "file_name": "ll_model_cfg.pkl",
9098
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl"
9099
+ },
9100
+ {
9101
+ "file_name": "meta.json",
9102
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json"
9103
+ }
9104
+ ],
9105
+ "transformer_cfg": {
9106
+ "n_layers": 2,
9107
+ "d_model": 6,
9108
+ "n_ctx": 10,
9109
+ "d_head": 1,
9110
+ "model_name": "custom",
9111
+ "n_heads": 4,
9112
+ "d_mlp": 24,
9113
+ "act_fn": "gelu",
9114
+ "d_vocab": 5,
9115
+ "eps": 1e-05,
9116
+ "use_attn_result": true,
9117
+ "use_attn_scale": true,
9118
+ "use_split_qkv_input": true,
9119
+ "use_hook_mlp_in": true,
9120
+ "use_attn_in": false,
9121
+ "use_local_attn": false,
9122
+ "original_architecture": null,
9123
+ "from_checkpoint": false,
9124
+ "checkpoint_index": null,
9125
+ "checkpoint_label_type": null,
9126
+ "checkpoint_value": null,
9127
+ "tokenizer_name": null,
9128
+ "window_size": null,
9129
+ "attn_types": null,
9130
+ "init_mode": "gpt2",
9131
+ "normalization_type": null,
9132
+ "n_devices": 1,
9133
+ "attention_dir": "causal",
9134
+ "attn_only": false,
9135
+ "seed": 0,
9136
+ "initializer_range": 0.19402850002906638,
9137
+ "init_weights": true,
9138
+ "scale_attn_by_inverse_layer_idx": false,
9139
+ "positional_embedding_type": "standard",
9140
+ "final_rms": false,
9141
+ "d_vocab_out": 3,
9142
+ "parallel_attn_mlp": false,
9143
+ "rotary_dim": null,
9144
+ "n_params": 768,
9145
+ "use_hook_tokens": false,
9146
+ "gated_mlp": false,
9147
+ "default_prepend_bos": true,
9148
+ "dtype": "torch.float32",
9149
+ "tokenizer_prepends_bos": null,
9150
+ "n_key_value_heads": null,
9151
+ "post_embedding_ln": false,
9152
+ "rotary_base": 10000,
9153
+ "trust_remote_code": false,
9154
+ "rotary_adjacent_pairs": false
9155
+ },
9156
+ "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model_cfg.pkl",
9157
+ "training_args": {
9158
+ "atol": 0.05,
9159
+ "lr": 0.01,
9160
+ "use_single_loss": false,
9161
+ "iit_weight": 1.0,
9162
+ "behavior_weight": 1.0,
9163
+ "strict_weight": 1.0,
9164
+ "epochs": 2000,
9165
+ "act_fn": "gelu",
9166
+ "clip_grad_norm": 0.1,
9167
+ "lr_scheduler": "",
9168
+ "model_pair": "strict"
9169
+ },
9170
+ "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/meta.json",
9171
+ "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/ll_model.pth",
9172
+ "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/36/edges.pkl"
9173
+ },
9174
+ {
9175
+ "case_id": "106",
9176
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/106",
9177
+ "task_description": "Sets all elements to zero except for the element at index 1.",
9178
+ "vocab": [
9179
+ 0,
9180
+ 1,
9181
+ 2,
9182
+ 3,
9183
+ 4,
9184
+ 5,
9185
+ 6,
9186
+ 7,
9187
+ 8,
9188
+ 9,
9189
+ 10
9190
+ ],
9191
+ "max_seq_len": 10,
9192
+ "min_seq_len": 4,
9193
+ "files": [
9194
+ {
9195
+ "file_name": "edges.pkl",
9196
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/edges.pkl"
9197
+ },
9198
+ {
9199
+ "file_name": "ll_model.pth",
9200
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model.pth"
9201
+ },
9202
+ {
9203
+ "file_name": "ll_model_cfg.pkl",
9204
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model_cfg.pkl"
9205
+ },
9206
+ {
9207
+ "file_name": "meta.json",
9208
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/meta.json"
9209
+ }
9210
+ ],
9211
+ "transformer_cfg": {
9212
+ "n_layers": 2,
9213
+ "d_model": 4,
9214
+ "n_ctx": 10,
9215
+ "d_head": 1,
9216
+ "model_name": "custom",
9217
+ "n_heads": 4,
9218
+ "d_mlp": 16,
9219
+ "act_fn": "gelu",
9220
+ "d_vocab": 13,
9221
+ "eps": 1e-05,
9222
+ "use_attn_result": true,
9223
+ "use_attn_scale": true,
9224
+ "use_split_qkv_input": true,
9225
+ "use_hook_mlp_in": true,
9226
+ "use_attn_in": false,
9227
+ "use_local_attn": false,
9228
+ "original_architecture": null,
9229
+ "from_checkpoint": false,
9230
+ "checkpoint_index": null,
9231
+ "checkpoint_label_type": null,
9232
+ "checkpoint_value": null,
9233
+ "tokenizer_name": null,
9234
+ "window_size": null,
9235
+ "attn_types": null,
9236
+ "init_mode": "gpt2",
9237
+ "normalization_type": null,
9238
+ "n_devices": 1,
9239
+ "attention_dir": "causal",
9240
+ "attn_only": false,
9241
+ "seed": 0,
9242
+ "initializer_range": 0.13719886811400708,
9243
+ "init_weights": true,
9244
+ "scale_attn_by_inverse_layer_idx": false,
9245
+ "positional_embedding_type": "standard",
9246
+ "final_rms": false,
9247
+ "d_vocab_out": 11,
9248
+ "parallel_attn_mlp": false,
9249
+ "rotary_dim": null,
9250
+ "n_params": 384,
9251
+ "use_hook_tokens": false,
9252
+ "gated_mlp": false,
9253
+ "default_prepend_bos": true,
9254
+ "dtype": "torch.float32",
9255
+ "tokenizer_prepends_bos": null,
9256
+ "n_key_value_heads": null,
9257
+ "post_embedding_ln": false,
9258
+ "rotary_base": 10000,
9259
+ "trust_remote_code": false,
9260
+ "rotary_adjacent_pairs": false,
9261
+ "load_in_4bit": false,
9262
+ "num_experts": null,
9263
+ "experts_per_token": null
9264
+ },
9265
+ "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model_cfg.pkl",
9266
+ "training_args": {
9267
+ "output_dir": "/circuits-benchmark/results",
9268
+ "atol": 0.05,
9269
+ "lr": 0.001,
9270
+ "use_single_loss": true,
9271
+ "iit_weight": 1.0,
9272
+ "behavior_weight": 0.4,
9273
+ "strict_weight": 0.7,
9274
+ "epochs": 1000,
9275
+ "early_stop_accuracy_threshold": 99.9,
9276
  "act_fn": "gelu",
9277
+ "use_wandb": true,
9278
+ "save_model_to_wandb": true,
9279
  "clip_grad_norm": 0.1,
9280
+ "lr_scheduler": "linear",
9281
  "model_pair": "strict",
9282
+ "same_size": false,
9283
+ "seed": 92,
9284
+ "batch_size": 256,
9285
+ "include_mlp": false,
9286
+ "detach_while_caching": true,
9287
+ "scheduler_val_metric": [
9288
+ "val/accuracy",
9289
+ "val/IIA",
9290
+ "val/strict_accuracy"
9291
+ ],
9292
+ "siit_sampling": "sample_all",
9293
+ "val_iia_sampling": "all"
9294
  },
9295
+ "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/meta.json",
9296
+ "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/ll_model.pth",
9297
+ "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/106/edges.pkl"
9298
  },
9299
  {
9300
+ "case_id": "64",
9301
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/64",
9302
+ "task_description": "Cubes each element in the sequence.",
9303
  "vocab": [
9304
+ 0,
9305
+ 1,
9306
+ 2,
9307
+ 3,
9308
+ 4,
9309
+ 5,
9310
+ 6,
9311
+ 7,
9312
+ 8,
9313
+ 9,
9314
+ 10
9315
  ],
9316
  "max_seq_len": 10,
9317
  "min_seq_len": 4,
9318
  "files": [
9319
  {
9320
  "file_name": "edges.pkl",
9321
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl"
9322
  },
9323
  {
9324
  "file_name": "ll_model.pth",
9325
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth"
9326
  },
9327
  {
9328
  "file_name": "ll_model_cfg.pkl",
9329
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl"
9330
  },
9331
  {
9332
  "file_name": "meta.json",
9333
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json"
9334
  }
9335
  ],
9336
  "transformer_cfg": {
9337
  "n_layers": 2,
9338
+ "d_model": 4,
9339
  "n_ctx": 10,
9340
  "d_head": 1,
9341
  "model_name": "custom",
9342
  "n_heads": 4,
9343
+ "d_mlp": 16,
9344
  "act_fn": "gelu",
9345
+ "d_vocab": 13,
9346
  "eps": 1e-05,
9347
  "use_attn_result": true,
9348
  "use_attn_scale": true,
 
9364
  "attention_dir": "causal",
9365
  "attn_only": false,
9366
  "seed": 0,
9367
+ "initializer_range": 0.1392621247645583,
9368
  "init_weights": true,
9369
  "scale_attn_by_inverse_layer_idx": false,
9370
  "positional_embedding_type": "standard",
9371
  "final_rms": false,
9372
+ "d_vocab_out": 11,
9373
  "parallel_attn_mlp": false,
9374
  "rotary_dim": null,
9375
+ "n_params": 384,
9376
  "use_hook_tokens": false,
9377
  "gated_mlp": false,
9378
  "default_prepend_bos": true,
 
9382
  "post_embedding_ln": false,
9383
  "rotary_base": 10000,
9384
  "trust_remote_code": false,
9385
+ "rotary_adjacent_pairs": false,
9386
+ "load_in_4bit": false,
9387
+ "num_experts": null,
9388
+ "experts_per_token": null
9389
  },
9390
+ "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model_cfg.pkl",
9391
  "training_args": {
9392
+ "output_dir": "/circuits-benchmark/results",
9393
  "atol": 0.05,
9394
+ "lr": 0.001,
9395
+ "use_single_loss": true,
9396
  "iit_weight": 1.0,
9397
+ "behavior_weight": 0.4,
9398
+ "strict_weight": 0.7,
9399
+ "epochs": 1000,
9400
+ "early_stop_accuracy_threshold": 99.9,
9401
  "act_fn": "gelu",
9402
+ "use_wandb": true,
9403
+ "save_model_to_wandb": true,
9404
  "clip_grad_norm": 0.1,
9405
+ "lr_scheduler": "linear",
9406
+ "model_pair": "strict",
9407
+ "same_size": false,
9408
+ "seed": 67,
9409
+ "batch_size": 256,
9410
+ "include_mlp": false,
9411
+ "detach_while_caching": true,
9412
+ "scheduler_val_metric": [
9413
+ "val/accuracy",
9414
+ "val/IIA",
9415
+ "val/strict_accuracy"
9416
+ ],
9417
+ "siit_sampling": "sample_all",
9418
+ "val_iia_sampling": "all"
9419
  },
9420
+ "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/meta.json",
9421
+ "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/ll_model.pth",
9422
+ "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/64/edges.pkl"
9423
  },
9424
  {
9425
+ "case_id": "8",
9426
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/8",
9427
+ "task_description": "Identity",
9428
  "vocab": [
9429
  0,
9430
  1,
 
9443
  "files": [
9444
  {
9445
  "file_name": "edges.pkl",
9446
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl"
9447
  },
9448
  {
9449
  "file_name": "ll_model.pth",
9450
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth"
9451
  },
9452
  {
9453
  "file_name": "ll_model_cfg.pkl",
9454
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl"
9455
  },
9456
  {
9457
  "file_name": "meta.json",
9458
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json"
9459
  }
9460
  ],
9461
  "transformer_cfg": {
 
9512
  "num_experts": null,
9513
  "experts_per_token": null
9514
  },
9515
+ "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model_cfg.pkl",
9516
  "training_args": {
9517
  "output_dir": "/circuits-benchmark/results",
9518
  "atol": 0.05,
 
9542
  "siit_sampling": "sample_all",
9543
  "val_iia_sampling": "all"
9544
  },
9545
+ "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/meta.json",
9546
+ "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/ll_model.pth",
9547
+ "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/8/edges.pkl"
9548
  },
9549
  {
9550
+ "case_id": "73",
9551
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/73",
9552
+ "task_description": "Apply the sine function to each element of the input sequence.",
9553
  "vocab": [
9554
  0,
9555
  1,
 
9568
  "files": [
9569
  {
9570
  "file_name": "edges.pkl",
9571
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/edges.pkl"
9572
  },
9573
  {
9574
  "file_name": "ll_model.pth",
9575
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model.pth"
9576
  },
9577
  {
9578
  "file_name": "ll_model_cfg.pkl",
9579
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model_cfg.pkl"
9580
  },
9581
  {
9582
  "file_name": "meta.json",
9583
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/meta.json"
9584
  }
9585
  ],
9586
  "transformer_cfg": {
 
9637
  "num_experts": null,
9638
  "experts_per_token": null
9639
  },
9640
+ "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model_cfg.pkl",
9641
  "training_args": {
9642
  "output_dir": "/circuits-benchmark/results",
9643
  "atol": 0.05,
 
9655
  "lr_scheduler": "linear",
9656
  "model_pair": "strict",
9657
  "same_size": false,
9658
+ "seed": 92,
9659
  "batch_size": 256,
9660
  "include_mlp": false,
9661
  "detach_while_caching": true,
 
9667
  "siit_sampling": "sample_all",
9668
  "val_iia_sampling": "all"
9669
  },
9670
+ "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/meta.json",
9671
+ "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/ll_model.pth",
9672
+ "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/73/edges.pkl"
9673
  },
9674
  {
9675
  "case_id": "103",
 
10046
  "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/ll_model.pth",
10047
  "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/97/edges.pkl"
10048
  },
10049
+ {
10050
+ "case_id": "49",
10051
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/49",
10052
+ "task_description": "Decrements each element in the sequence until it becomes a multiple of 3.",
10053
+ "vocab": [
10054
+ 0,
10055
+ 1,
10056
+ 2,
10057
+ 3,
10058
+ 4,
10059
+ 5,
10060
+ 6,
10061
+ 7,
10062
+ 8,
10063
+ 9,
10064
+ 10
10065
+ ],
10066
+ "max_seq_len": 10,
10067
+ "min_seq_len": 4,
10068
+ "files": [
10069
+ {
10070
+ "file_name": "edges.pkl",
10071
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/edges.pkl"
10072
+ },
10073
+ {
10074
+ "file_name": "ll_model.pth",
10075
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model.pth"
10076
+ },
10077
+ {
10078
+ "file_name": "ll_model_cfg.pkl",
10079
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model_cfg.pkl"
10080
+ },
10081
+ {
10082
+ "file_name": "meta.json",
10083
+ "url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/meta.json"
10084
+ }
10085
+ ],
10086
+ "transformer_cfg": {
10087
+ "n_layers": 2,
10088
+ "d_model": 4,
10089
+ "n_ctx": 10,
10090
+ "d_head": 1,
10091
+ "model_name": "custom",
10092
+ "n_heads": 4,
10093
+ "d_mlp": 16,
10094
+ "act_fn": "gelu",
10095
+ "d_vocab": 13,
10096
+ "eps": 1e-05,
10097
+ "use_attn_result": true,
10098
+ "use_attn_scale": true,
10099
+ "use_split_qkv_input": true,
10100
+ "use_hook_mlp_in": true,
10101
+ "use_attn_in": false,
10102
+ "use_local_attn": false,
10103
+ "original_architecture": null,
10104
+ "from_checkpoint": false,
10105
+ "checkpoint_index": null,
10106
+ "checkpoint_label_type": null,
10107
+ "checkpoint_value": null,
10108
+ "tokenizer_name": null,
10109
+ "window_size": null,
10110
+ "attn_types": null,
10111
+ "init_mode": "gpt2",
10112
+ "normalization_type": null,
10113
+ "n_devices": 1,
10114
+ "attention_dir": "causal",
10115
+ "attn_only": false,
10116
+ "seed": 0,
10117
+ "initializer_range": 0.15689290811054724,
10118
+ "init_weights": true,
10119
+ "scale_attn_by_inverse_layer_idx": false,
10120
+ "positional_embedding_type": "standard",
10121
+ "final_rms": false,
10122
+ "d_vocab_out": 4,
10123
+ "parallel_attn_mlp": false,
10124
+ "rotary_dim": null,
10125
+ "n_params": 384,
10126
+ "use_hook_tokens": false,
10127
+ "gated_mlp": false,
10128
+ "default_prepend_bos": true,
10129
+ "dtype": "torch.float32",
10130
+ "tokenizer_prepends_bos": null,
10131
+ "n_key_value_heads": null,
10132
+ "post_embedding_ln": false,
10133
+ "rotary_base": 10000,
10134
+ "trust_remote_code": false,
10135
+ "rotary_adjacent_pairs": false,
10136
+ "load_in_4bit": false,
10137
+ "num_experts": null,
10138
+ "experts_per_token": null
10139
+ },
10140
+ "transformer_cfg_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model_cfg.pkl",
10141
+ "training_args": {
10142
+ "output_dir": "/circuits-benchmark/results",
10143
+ "atol": 0.05,
10144
+ "lr": 0.001,
10145
+ "use_single_loss": true,
10146
+ "iit_weight": 1.0,
10147
+ "behavior_weight": 0.4,
10148
+ "strict_weight": 0.7,
10149
+ "epochs": 1000,
10150
+ "early_stop_accuracy_threshold": 99.9,
10151
+ "act_fn": "gelu",
10152
+ "use_wandb": true,
10153
+ "save_model_to_wandb": true,
10154
+ "clip_grad_norm": 0.1,
10155
+ "lr_scheduler": "linear",
10156
+ "model_pair": "strict",
10157
+ "same_size": false,
10158
+ "seed": 92,
10159
+ "batch_size": 256,
10160
+ "include_mlp": false,
10161
+ "detach_while_caching": true,
10162
+ "scheduler_val_metric": [
10163
+ "val/accuracy",
10164
+ "val/IIA",
10165
+ "val/strict_accuracy"
10166
+ ],
10167
+ "siit_sampling": "sample_all",
10168
+ "val_iia_sampling": "all"
10169
+ },
10170
+ "training_args_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/meta.json",
10171
+ "weights_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/ll_model.pth",
10172
+ "circuit_file_url": "https://huggingface.co/cybershiptrooper/InterpBench/blob/main/49/edges.pkl"
10173
+ },
10174
  {
10175
  "case_id": "46",
10176
  "url": "https://huggingface.co/cybershiptrooper/InterpBench/tree/main/46",