cybershiptrooper committed on
Commit
7fb3212
1 Parent(s): 0d6085e

update ioi

Browse files
Files changed (4) hide show
  1. ioi/edges.pkl +2 -2
  2. ioi/ll_model.pth +1 -1
  3. ioi/ll_model_cfg.pkl +2 -2
  4. ioi/meta.json +1 -1
ioi/edges.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b8b933ca819217e35439abc32f29d935587575f73a9fb0739e332dde8b48bb83
3
- size 8720
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9781e9e02a127e968bf212f01d74de6cf9b74eeb2bcf8b28a3d5c499c44b7a66
3
+ size 322
ioi/ll_model.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3d5e3070a1678e273b2f0409200b7dfc50a203dafe2a41859737f67b923ae491
3
  size 42434142
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:91f3ac5139f566d1196e258bbabf93acdcc3a5e9ab6a7c7ab20b921cfef5dd91
3
  size 42434142
ioi/ll_model_cfg.pkl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:01f4644abfd87f8720aa23bb65824a39e16d04161103c967aa3bc872ba0291db
3
- size 1165
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66d06ba6c6545e4d08360fa539ad29463f043fc86b6d6d51846a3e326c209894
3
+ size 1090
ioi/meta.json CHANGED
@@ -1 +1 @@
1
- {"next_token": true, "non_ioi_thresh": 0.65, "use_per_token_check": false, "batch_size": 256, "lr": 0.001, "num_workers": 0, "early_stop": true, "lr_scheduler": null, "scheduler_val_metric": ["val/accuracy", "val/IIA"], "scheduler_mode": "max", "clip_grad_norm": 1.0, "atol": 0.05, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "strict_weight": 0.4}
 
1
+ {"next_token": false, "non_ioi_thresh": 0.65, "use_per_token_check": false, "batch_size": 512, "num_workers": 0, "early_stop": true, "lr_scheduler": null, "scheduler_val_metric": ["val/accuracy", "val/IIA"], "scheduler_mode": "max", "scheduler_kwargs": {}, "clip_grad_norm": 1.0, "seed": 0, "lr": 0.001, "detach_while_caching": true, "optimizer_kwargs": {"betas": [0.9, 0.9]}, "atol": 0.05, "use_single_loss": false, "iit_weight": 1.0, "behavior_weight": 1.0, "val_IIA_sampling": "random", "use_all_tokens_for_behavior": false, "strict_weight": 0.4, "siit_sampling": "individual"}