cybershiptrooper committed on
Commit
0355bdd
•
1 Parent(s): 04070cc

add ioi edges and rename model names

Browse files
ioi/corr_100_100_40.json DELETED
@@ -1 +0,0 @@
1
- {"hook_duplicate": ["blocks.0.attn.hook_z"], "hook_s_inhibition": ["blocks.2.attn.hook_z"], "hook_name_mover": ["blocks.4.attn.hook_z"], "all_nodes_hook": ["blocks.0.mlp.hook_post"]}
 
 
ioi_next_token/ll_model_100_100_40.pth → ioi/edges.pkl RENAMED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8136b3d842ffbcaef9771ebb6fde4274e95dba2a44230eab474c8212703e6300
3
- size 42432926
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f459d1ebb44a810a1d00443d1df08c1133921b21700c4c5eb1fdf682d4a55ae4
3
+ size 3966
ioi/{ll_model_100_100_40.pth → ll_model.pth} RENAMED
File without changes
ioi/ll_model_cfg.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01f4644abfd87f8720aa23bb65824a39e16d04161103c967aa3bc872ba0291db
3
+ size 1165
ioi_next_token/results_100_100_40/training_args.json → ioi/meta.json RENAMED
File without changes
ioi_next_token/corr_100_100_40.json DELETED
@@ -1 +0,0 @@
1
- {"hook_duplicate": ["blocks.0.attn.hook_z"], "hook_s_inhibition": ["blocks.2.attn.hook_z"], "hook_name_mover": ["blocks.4.attn.hook_z"]}
 
 
ioi_next_token/edges.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f459d1ebb44a810a1d00443d1df08c1133921b21700c4c5eb1fdf682d4a55ae4
3
+ size 3966
ioi_next_token/ll_model.pth ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3d5e3070a1678e273b2f0409200b7dfc50a203dafe2a41859737f67b923ae491
3
+ size 42434142
ioi_next_token/ll_model_cfg.pkl ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:01f4644abfd87f8720aa23bb65824a39e16d04161103c967aa3bc872ba0291db
3
+ size 1165
ioi_next_token/meta.json ADDED
@@ -0,0 +1 @@
 
 
1
+ {"next_token": true, "non_ioi_thresh": 0.65, "use_per_token_check": false, "batch_size": 256, "lr": 0.001, "num_workers": 0, "early_stop": true, "lr_scheduler": null, "scheduler_val_metric": ["val/accuracy", "val/IIA"], "scheduler_mode": "max", "clip_grad_norm": 1.0, "atol": 0.05, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 0.4}