ncbateman commited on
Commit
e544321
·
verified ·
1 Parent(s): 7146e1c

Training in progress, step 825, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:b3c71fa0cb7e157841e2952c317cdfa017d9a0e7e32737874f4d20b71e23615d
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:87c61933c7acb261c5801449d983e244cb4ae8e4a22df14ff59f4f35405beffe
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5d95a62ba3aba13f7257482e49d433101f269255a12dfe0be4d7ed42a74d3250
3
  size 49846644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:455f6d8dbeea414678dbb91fa9f32b887be77fc737e8ea0e996b1a93a88b7851
3
  size 49846644
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9527a9656bdadb0a16bb79de1cfddac3292bebf2eb8fa1acb5151a1acad7acff
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:89cfdc62760b08909a8de6668672f514712e7b15d9dc0aff582b1601f05bbba2
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:fdc9d39e07b36aad394340652fa0d56c4ee44db94279b0fd69ca40c5c2e0621f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:e53509185c72a1d7e392d56b37c619974763a56a864cc85234562e53961497e3
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.0611452604335168,
5
  "eval_steps": 386,
6
- "global_step": 820,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -5771,6 +5771,41 @@
5771
  "learning_rate": 9.025610417840237e-05,
5772
  "loss": 0.781,
5773
  "step": 820
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5774
  }
5775
  ],
5776
  "logging_steps": 1,
@@ -5790,7 +5825,7 @@
5790
  "attributes": {}
5791
  }
5792
  },
5793
- "total_flos": 9.166386097154949e+17,
5794
  "train_batch_size": 4,
5795
  "trial_name": null,
5796
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.0676156583629894,
5
  "eval_steps": 386,
6
+ "global_step": 825,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
5771
  "learning_rate": 9.025610417840237e-05,
5772
  "loss": 0.781,
5773
  "step": 820
5774
+ },
5775
+ {
5776
+ "epoch": 1.0624393400194112,
5777
+ "grad_norm": 0.8441341519355774,
5778
+ "learning_rate": 9.023163764477636e-05,
5779
+ "loss": 0.7636,
5780
+ "step": 821
5781
+ },
5782
+ {
5783
+ "epoch": 1.0637334196053057,
5784
+ "grad_norm": 0.858167290687561,
5785
+ "learning_rate": 9.02071437573621e-05,
5786
+ "loss": 0.6853,
5787
+ "step": 822
5788
+ },
5789
+ {
5790
+ "epoch": 1.0650274991912003,
5791
+ "grad_norm": 0.9035941958427429,
5792
+ "learning_rate": 9.01826225328132e-05,
5793
+ "loss": 0.7757,
5794
+ "step": 823
5795
+ },
5796
+ {
5797
+ "epoch": 1.0663215787770948,
5798
+ "grad_norm": 0.8677383065223694,
5799
+ "learning_rate": 9.015807398780177e-05,
5800
+ "loss": 0.917,
5801
+ "step": 824
5802
+ },
5803
+ {
5804
+ "epoch": 1.0676156583629894,
5805
+ "grad_norm": 0.8263882994651794,
5806
+ "learning_rate": 9.013349813901859e-05,
5807
+ "loss": 0.6574,
5808
+ "step": 825
5809
  }
5810
  ],
5811
  "logging_steps": 1,
 
5825
  "attributes": {}
5826
  }
5827
  },
5828
+ "total_flos": 9.222282955739628e+17,
5829
  "train_batch_size": 4,
5830
  "trial_name": null,
5831
  "trial_params": null