cybershiptrooper
committed on
Commit
•
0355bdd
1
Parent(s):
04070cc
add ioi edges and rename model names
Browse files
- ioi/corr_100_100_40.json +0 -1
- ioi_next_token/ll_model_100_100_40.pth → ioi/edges.pkl +2 -2
- ioi/{ll_model_100_100_40.pth → ll_model.pth} +0 -0
- ioi/ll_model_cfg.pkl +3 -0
- ioi_next_token/results_100_100_40/training_args.json → ioi/meta.json +0 -0
- ioi_next_token/corr_100_100_40.json +0 -1
- ioi_next_token/edges.pkl +3 -0
- ioi_next_token/ll_model.pth +3 -0
- ioi_next_token/ll_model_cfg.pkl +3 -0
- ioi_next_token/meta.json +1 -0
ioi/corr_100_100_40.json
DELETED
@@ -1 +0,0 @@
|
|
1 |
-
{"hook_duplicate": ["blocks.0.attn.hook_z"], "hook_s_inhibition": ["blocks.2.attn.hook_z"], "hook_name_mover": ["blocks.4.attn.hook_z"], "all_nodes_hook": ["blocks.0.mlp.hook_post"]}
|
|
|
|
ioi_next_token/ll_model_100_100_40.pth → ioi/edges.pkl
RENAMED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f459d1ebb44a810a1d00443d1df08c1133921b21700c4c5eb1fdf682d4a55ae4
|
3 |
+
size 3966
|
ioi/{ll_model_100_100_40.pth → ll_model.pth}
RENAMED
File without changes
|
ioi/ll_model_cfg.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01f4644abfd87f8720aa23bb65824a39e16d04161103c967aa3bc872ba0291db
|
3 |
+
size 1165
|
ioi_next_token/results_100_100_40/training_args.json → ioi/meta.json
RENAMED
File without changes
|
ioi_next_token/corr_100_100_40.json
DELETED
@@ -1 +0,0 @@
|
|
1 |
-
{"hook_duplicate": ["blocks.0.attn.hook_z"], "hook_s_inhibition": ["blocks.2.attn.hook_z"], "hook_name_mover": ["blocks.4.attn.hook_z"]}
|
|
|
|
ioi_next_token/edges.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f459d1ebb44a810a1d00443d1df08c1133921b21700c4c5eb1fdf682d4a55ae4
|
3 |
+
size 3966
|
ioi_next_token/ll_model.pth
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3d5e3070a1678e273b2f0409200b7dfc50a203dafe2a41859737f67b923ae491
|
3 |
+
size 42434142
|
ioi_next_token/ll_model_cfg.pkl
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:01f4644abfd87f8720aa23bb65824a39e16d04161103c967aa3bc872ba0291db
|
3 |
+
size 1165
|
ioi_next_token/meta.json
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
{"next_token": true, "non_ioi_thresh": 0.65, "use_per_token_check": false, "batch_size": 256, "lr": 0.001, "num_workers": 0, "early_stop": true, "lr_scheduler": null, "scheduler_val_metric": ["val/accuracy", "val/IIA"], "scheduler_mode": "max", "clip_grad_norm": 1.0, "atol": 0.05, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 0.4}
|