ncbateman commited on
Commit
8498786
·
verified ·
1 Parent(s): 22d703b

Training in progress, step 710, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:276cc98327297733df76553f5e3b6d4860107114f0c0d09e76850d88f2e3e792
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a820a8f4eb542479915dcb468727c29cefc3d7359dd207ee3312c7df3c587cae
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:67e1bd4b745e410efa1702b658de1ecd4ec95ec3e117bd275ec883dc33e4fe8f
3
  size 49846644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dc0f6934bb01d904150982cb8e47c2f710c6f81fcd6bdc0736a215fffd1bf2df
3
  size 49846644
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c2d3d37bb63f7049bbb3b5a0e021e4d5be2c3c48a17668f2b1c66f33aefe4ecd
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b64b4ae62e4075beb8480b1639d23fdd45af44a932132fe66540a077fcc1c087
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6f8030d97101266fb0ab5c1ea76d734a66ed4913265b7bd97b3ca554de2e26fd
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:733800b83bb7a95c51151abac1a9de03ea9b82fb261b8821470be38e62d0baca
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.9123261080556454,
5
  "eval_steps": 386,
6
- "global_step": 705,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -4958,6 +4958,41 @@
4958
  "learning_rate": 9.288311833837917e-05,
4959
  "loss": 0.8883,
4960
  "step": 705
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4961
  }
4962
  ],
4963
  "logging_steps": 1,
@@ -4977,7 +5012,7 @@
4977
  "attributes": {}
4978
  }
4979
  },
4980
- "total_flos": 7.881457060439654e+17,
4981
  "train_batch_size": 4,
4982
  "trial_name": null,
4983
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.9187965059851181,
5
  "eval_steps": 386,
6
+ "global_step": 710,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
4958
  "learning_rate": 9.288311833837917e-05,
4959
  "loss": 0.8883,
4960
  "step": 705
4961
+ },
4962
+ {
4963
+ "epoch": 0.91362018764154,
4964
+ "grad_norm": 0.6708902716636658,
4965
+ "learning_rate": 9.286190365013217e-05,
4966
+ "loss": 0.8315,
4967
+ "step": 706
4968
+ },
4969
+ {
4970
+ "epoch": 0.9149142672274345,
4971
+ "grad_norm": 0.802245557308197,
4972
+ "learning_rate": 9.284065981975958e-05,
4973
+ "loss": 0.9128,
4974
+ "step": 707
4975
+ },
4976
+ {
4977
+ "epoch": 0.916208346813329,
4978
+ "grad_norm": 0.8574107885360718,
4979
+ "learning_rate": 9.281938686170526e-05,
4980
+ "loss": 0.9122,
4981
+ "step": 708
4982
+ },
4983
+ {
4984
+ "epoch": 0.9175024263992235,
4985
+ "grad_norm": 1.060194730758667,
4986
+ "learning_rate": 9.279808479043286e-05,
4987
+ "loss": 1.1447,
4988
+ "step": 709
4989
+ },
4990
+ {
4991
+ "epoch": 0.9187965059851181,
4992
+ "grad_norm": 0.8753707408905029,
4993
+ "learning_rate": 9.277675362042581e-05,
4994
+ "loss": 0.8524,
4995
+ "step": 710
4996
  }
4997
  ],
4998
  "logging_steps": 1,
 
5012
  "attributes": {}
5013
  }
5014
  },
5015
+ "total_flos": 7.937353919024333e+17,
5016
  "train_batch_size": 4,
5017
  "trial_name": null,
5018
  "trial_params": null