ncbateman committed on
Commit
cdc12a1
·
verified ·
1 Parent(s): 3454fab

Training in progress, step 820, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:33bf95807022ad8256390457a8922e5eb79283db0cb74644d292a992d88bb148
3
  size 45118424
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:970c1e5f20a9c6313ae0d772b0f16498af7abe36336fc26af3744ed91839b9b6
3
  size 45118424
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e961e61ae628fdef1c80ab9e62b59805293d403bafa5fdbd9c16e141e8f3833d
3
  size 23159546
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:80aee59a609b1f37dbe1d027f3ef1467c75b3d54433eeeaed8474b61eeae1e2d
3
  size 23159546
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c316a89e564105b6a4d3697edf95b71fd92b58e6f0210008c23c402d785036ca
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:79c56ec642f4caf6c132646e9783305c87d1a4731e3978fcc2bd0ea8585ac231
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:406944ca466952137e0b114cdd90cd03d0c938cd95631d05a6add36515fca9c8
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c717f38e6747d9b86924e9284e7ce198f0fb7dc628bd7877fbe61fddd3883692
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 4.201030927835052,
5
  "eval_steps": 97,
6
- "global_step": 815,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -5784,6 +5784,41 @@
5784
  "learning_rate": 6.8417125980128675e-06,
5785
  "loss": 0.6238,
5786
  "step": 815
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5787
  }
5788
  ],
5789
  "logging_steps": 1,
@@ -5803,7 +5838,7 @@
5803
  "attributes": {}
5804
  }
5805
  },
5806
- "total_flos": 3.151872409070469e+17,
5807
  "train_batch_size": 4,
5808
  "trial_name": null,
5809
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 4.22680412371134,
5
  "eval_steps": 97,
6
+ "global_step": 820,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
5784
  "learning_rate": 6.8417125980128675e-06,
5785
  "loss": 0.6238,
5786
  "step": 815
5787
+ },
5788
+ {
5789
+ "epoch": 4.206185567010309,
5790
+ "grad_norm": 0.7783701419830322,
5791
+ "learning_rate": 6.755754876962711e-06,
5792
+ "loss": 0.5216,
5793
+ "step": 816
5794
+ },
5795
+ {
5796
+ "epoch": 4.211340206185567,
5797
+ "grad_norm": 0.6552199125289917,
5798
+ "learning_rate": 6.670301412974511e-06,
5799
+ "loss": 0.4832,
5800
+ "step": 817
5801
+ },
5802
+ {
5803
+ "epoch": 4.216494845360825,
5804
+ "grad_norm": 0.8719028830528259,
5805
+ "learning_rate": 6.585353202493322e-06,
5806
+ "loss": 0.575,
5807
+ "step": 818
5808
+ },
5809
+ {
5810
+ "epoch": 4.221649484536083,
5811
+ "grad_norm": 0.7946240305900574,
5812
+ "learning_rate": 6.500911236072532e-06,
5813
+ "loss": 0.648,
5814
+ "step": 819
5815
+ },
5816
+ {
5817
+ "epoch": 4.22680412371134,
5818
+ "grad_norm": 0.7797208428382874,
5819
+ "learning_rate": 6.416976498362432e-06,
5820
+ "loss": 0.4849,
5821
+ "step": 820
5822
  }
5823
  ],
5824
  "logging_steps": 1,
 
5838
  "attributes": {}
5839
  }
5840
  },
5841
+ "total_flos": 3.171226860461752e+17,
5842
  "train_batch_size": 4,
5843
  "trial_name": null,
5844
  "trial_params": null