ncbateman commited on
Commit
4e11ef2
·
verified ·
1 Parent(s): 9226d21

Training in progress, step 175, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4942b6183f603313ddbbead0c35bcd0516a7d27c74d2166204d4f4ba26f31290
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7c4368dad332de79ce5e1776ab789ac709273e1d5cfde0537da85b4f8710a393
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e8e1d461799f7506f1a0debcac6a984a4a3c2a3599cdd0d68dc31e8b53af334e
3
  size 49846260
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c8facfa6be8cc3dc3ebce039ce013fd72af97d5a0f36cf2d27f0da5791f1e5fd
3
  size 49846260
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:db5d1d56ddf5f29362595a5f01521cef39fc7e9347ff871a7770a4e89003ccaa
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1b64f69b613fca6d8f40873768b1557e9b59b999a2059a3ece3e3ec028766d3f
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:255044db1acc114cb0f2f88c44fef16238de1948a1b84ffe68ecd9e99fb61dda
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:61a3e47e838c8bbbc792ba3c58434b0fe8b77cb810386b07d18a0158d41dc378
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.21999352960207053,
5
  "eval_steps": 386,
6
- "global_step": 170,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1205,6 +1205,41 @@
1205
  "learning_rate": 9.975543295858035e-05,
1206
  "loss": 0.8836,
1207
  "step": 170
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1208
  }
1209
  ],
1210
  "logging_steps": 1,
@@ -1224,7 +1259,7 @@
1224
  "attributes": {}
1225
  }
1226
  },
1227
- "total_flos": 1.9004931918790656e+17,
1228
  "train_batch_size": 4,
1229
  "trial_name": null,
1230
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.22646392753154318,
5
  "eval_steps": 386,
6
+ "global_step": 175,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1205
  "learning_rate": 9.975543295858035e-05,
1206
  "loss": 0.8836,
1207
  "step": 170
1208
+ },
1209
+ {
1210
+ "epoch": 0.22128760918796506,
1211
+ "grad_norm": 0.8391397595405579,
1212
+ "learning_rate": 9.97513432533431e-05,
1213
+ "loss": 0.9003,
1214
+ "step": 171
1215
+ },
1216
+ {
1217
+ "epoch": 0.2225816887738596,
1218
+ "grad_norm": 0.9666821360588074,
1219
+ "learning_rate": 9.974721972179931e-05,
1220
+ "loss": 0.9528,
1221
+ "step": 172
1222
+ },
1223
+ {
1224
+ "epoch": 0.22387576835975412,
1225
+ "grad_norm": 0.9321691393852234,
1226
+ "learning_rate": 9.974306236675259e-05,
1227
+ "loss": 0.9575,
1228
+ "step": 173
1229
+ },
1230
+ {
1231
+ "epoch": 0.22516984794564865,
1232
+ "grad_norm": 0.8022271990776062,
1233
+ "learning_rate": 9.973887119102957e-05,
1234
+ "loss": 0.8731,
1235
+ "step": 174
1236
+ },
1237
+ {
1238
+ "epoch": 0.22646392753154318,
1239
+ "grad_norm": 1.1056872606277466,
1240
+ "learning_rate": 9.973464619747983e-05,
1241
+ "loss": 0.9925,
1242
+ "step": 175
1243
  }
1244
  ],
1245
  "logging_steps": 1,
 
1259
  "attributes": {}
1260
  }
1261
  },
1262
+ "total_flos": 1.956390050463744e+17,
1263
  "train_batch_size": 4,
1264
  "trial_name": null,
1265
  "trial_params": null