ncbateman committed on
Commit
99304b5
1 Parent(s): 8d127fc

Training in progress, step 815, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bf452801c6be48cc1537a18941687b7b4700636962076dcf84dab95f9c490c5f
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b351ea48a340e8d0aefe39d72e8c7c096d1970d8822472c4b4f9a248e83c5aa9
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e173d01920f0c4adb5acdafd91f3ef92c299c24fcad8b3c449520428b5d5f98
3
  size 49846644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f2e4b9fb46f9ee260fad8a5f6d28cc1e2028cf112c6ecd0f9b828a991c4b30b
3
  size 49846644
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:48357d05ceaf70ef750e9850734136084281b884901dd132b3d7307fc67b7534
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e9fafc5ba32d8ff5b04e05a3ca43c3317ebaffa1127c0eaaaca972e5a128721f
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ae1b957ea3b5be016b1408fb97083cf05faa199719b2f6f2412013b84e7b582
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2204a2f67a3dbafc8915907bcdcd66b239f7be2c081f646d7a24f64134e63ee4
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.0482044645745714,
5
  "eval_steps": 386,
6
- "global_step": 810,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -5701,6 +5701,41 @@
5701
  "learning_rate": 9.049926140583487e-05,
5702
  "loss": 0.7436,
5703
  "step": 810
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5704
  }
5705
  ],
5706
  "logging_steps": 1,
@@ -5720,7 +5755,7 @@
5720
  "attributes": {}
5721
  }
5722
  },
5723
- "total_flos": 9.054592379985592e+17,
5724
  "train_batch_size": 4,
5725
  "trial_name": null,
5726
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.054674862504044,
5
  "eval_steps": 386,
6
+ "global_step": 815,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
5701
  "learning_rate": 9.049926140583487e-05,
5702
  "loss": 0.7436,
5703
  "step": 810
5704
+ },
5705
+ {
5706
+ "epoch": 1.0494985441604658,
5707
+ "grad_norm": 0.8351684808731079,
5708
+ "learning_rate": 9.047506932194074e-05,
5709
+ "loss": 0.8892,
5710
+ "step": 811
5711
+ },
5712
+ {
5713
+ "epoch": 1.0507926237463603,
5714
+ "grad_norm": 0.8384698033332825,
5715
+ "learning_rate": 9.045084971874738e-05,
5716
+ "loss": 0.818,
5717
+ "step": 812
5718
+ },
5719
+ {
5720
+ "epoch": 1.052086703332255,
5721
+ "grad_norm": 0.9196306467056274,
5722
+ "learning_rate": 9.042660261272185e-05,
5723
+ "loss": 0.734,
5724
+ "step": 813
5725
+ },
5726
+ {
5727
+ "epoch": 1.0533807829181494,
5728
+ "grad_norm": 0.9839885234832764,
5729
+ "learning_rate": 9.040232802034998e-05,
5730
+ "loss": 0.7974,
5731
+ "step": 814
5732
+ },
5733
+ {
5734
+ "epoch": 1.054674862504044,
5735
+ "grad_norm": 0.9852064251899719,
5736
+ "learning_rate": 9.03780259581362e-05,
5737
+ "loss": 0.8203,
5738
+ "step": 815
5739
  }
5740
  ],
5741
  "logging_steps": 1,
 
5755
  "attributes": {}
5756
  }
5757
  },
5758
+ "total_flos": 9.110489238570271e+17,
5759
  "train_batch_size": 4,
5760
  "trial_name": null,
5761
  "trial_params": null