ncbateman commited on
Commit
07bd058
·
verified ·
1 Parent(s): c868933

Training in progress, step 850, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:92942064b68f22a635d4178bdbcdffb8eb8e323b4bc90a33365128f3cc01616b
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fd2eff90e09ff5cb32ab1ebd775cb0f037fd91c63a7deff49c1bf83cf6d32e7
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8ae4855dfd0bb55befec84f2621a632e36dc7b481da908c36b47f26a478c29ab
3
  size 49846644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac70266b2eba094d3128dd6f864a3ede94de052e2e0aa23dba2f8f69ad1aa502
3
  size 49846644
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b44d761c2dc0b6e72b2c0f65252ea5160d07505b6189282d6a4254828b3a8986
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5259289c5a137780973c8367739829eb39d5d72183980f5655a6da8d42ad769
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7ca47c546dafdf46a438555e2c974efc5fd475da85887cb0544686113929f218
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d74516f9adab70d9cfa3d092d8888b349f96cc406e15b22a9893c08784b3ae9b
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.09349725008088,
5
  "eval_steps": 386,
6
- "global_step": 845,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -5946,6 +5946,41 @@
5946
  "learning_rate": 8.963627323902104e-05,
5947
  "loss": 0.6661,
5948
  "step": 845
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5949
  }
5950
  ],
5951
  "logging_steps": 1,
@@ -5965,7 +6000,7 @@
5965
  "attributes": {}
5966
  }
5967
  },
5968
- "total_flos": 9.445870390078341e+17,
5969
  "train_batch_size": 4,
5970
  "trial_name": null,
5971
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.0999676480103526,
5
  "eval_steps": 386,
6
+ "global_step": 850,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
5946
  "learning_rate": 8.963627323902104e-05,
5947
  "loss": 0.6661,
5948
  "step": 845
5949
+ },
5950
+ {
5951
+ "epoch": 1.0947913296667746,
5952
+ "grad_norm": 0.9900491833686829,
5953
+ "learning_rate": 8.961112789936703e-05,
5954
+ "loss": 0.874,
5955
+ "step": 846
5956
+ },
5957
+ {
5958
+ "epoch": 1.096085409252669,
5959
+ "grad_norm": 1.002979040145874,
5960
+ "learning_rate": 8.958595562781397e-05,
5961
+ "loss": 0.6907,
5962
+ "step": 847
5963
+ },
5964
+ {
5965
+ "epoch": 1.0973794888385635,
5966
+ "grad_norm": 0.9625217914581299,
5967
+ "learning_rate": 8.956075644147664e-05,
5968
+ "loss": 0.913,
5969
+ "step": 848
5970
+ },
5971
+ {
5972
+ "epoch": 1.0986735684244582,
5973
+ "grad_norm": 1.0066606998443604,
5974
+ "learning_rate": 8.953553035748817e-05,
5975
+ "loss": 0.7295,
5976
+ "step": 849
5977
+ },
5978
+ {
5979
+ "epoch": 1.0999676480103526,
5980
+ "grad_norm": 1.1030412912368774,
5981
+ "learning_rate": 8.951027739299996e-05,
5982
+ "loss": 0.792,
5983
+ "step": 850
5984
  }
5985
  ],
5986
  "logging_steps": 1,
 
6000
  "attributes": {}
6001
  }
6002
  },
6003
+ "total_flos": 9.50176724866302e+17,
6004
  "train_batch_size": 4,
6005
  "trial_name": null,
6006
  "trial_params": null