ncbateman commited on
Commit
0ca5a0c
·
verified ·
1 Parent(s): 5f3f031

Training in progress, step 610, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7b390cff10ccb0462e2ce56478461d8e6338b504fc23e78bc158e0819d8dc9de
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:32edca6079f3b9484783f232ac0ccb1d340292cb18066f64fd7821f34d446723
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:286cc2bd89d71803d1810c6df9f8f1ffd3acec5c70032db2dcefd9830c184d3f
3
  size 49846644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fd94789a924990bbe5fdd71e1ae4a4ed24b474b41e969e7e388565234d65aee6
3
  size 49846644
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a876f1e76952adad9028628bf8945815972da7c35421764155ece90dc00dd324
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:609743375850d853d6f9c3893828fefdf1e7c4e4f00a29e837453857db0e6e70
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0544bca5420fca1dbd853da9c587baf2b7fb350e9011928f11101b6ff88e6e56
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7f797c771cc3ef7f2bb02c5a7bc50a7c409a56da80db274d374a4aaeeeecf121
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.7829181494661922,
5
  "eval_steps": 386,
6
- "global_step": 605,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -4258,6 +4258,41 @@
4258
  "learning_rate": 9.485502786409107e-05,
4259
  "loss": 1.0692,
4260
  "step": 605
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4261
  }
4262
  ],
4263
  "logging_steps": 1,
@@ -4277,7 +4312,7 @@
4277
  "attributes": {}
4278
  }
4279
  },
4280
- "total_flos": 6.763519888746086e+17,
4281
  "train_batch_size": 4,
4282
  "trial_name": null,
4283
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.7893885473956649,
5
  "eval_steps": 386,
6
+ "global_step": 610,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
4258
  "learning_rate": 9.485502786409107e-05,
4259
  "loss": 1.0692,
4260
  "step": 605
4261
+ },
4262
+ {
4263
+ "epoch": 0.7842122290520867,
4264
+ "grad_norm": 0.733768105506897,
4265
+ "learning_rate": 9.483679688718135e-05,
4266
+ "loss": 0.8835,
4267
+ "step": 606
4268
+ },
4269
+ {
4270
+ "epoch": 0.7855063086379812,
4271
+ "grad_norm": 0.7453616261482239,
4272
+ "learning_rate": 9.481853542540154e-05,
4273
+ "loss": 0.7778,
4274
+ "step": 607
4275
+ },
4276
+ {
4277
+ "epoch": 0.7868003882238758,
4278
+ "grad_norm": 0.8596757650375366,
4279
+ "learning_rate": 9.480024349116771e-05,
4280
+ "loss": 0.9711,
4281
+ "step": 608
4282
+ },
4283
+ {
4284
+ "epoch": 0.7880944678097703,
4285
+ "grad_norm": 0.6516830325126648,
4286
+ "learning_rate": 9.478192109691674e-05,
4287
+ "loss": 0.8342,
4288
+ "step": 609
4289
+ },
4290
+ {
4291
+ "epoch": 0.7893885473956649,
4292
+ "grad_norm": 0.8740130662918091,
4293
+ "learning_rate": 9.476356825510612e-05,
4294
+ "loss": 0.9179,
4295
+ "step": 610
4296
  }
4297
  ],
4298
  "logging_steps": 1,
 
4312
  "attributes": {}
4313
  }
4314
  },
4315
+ "total_flos": 6.819416747330765e+17,
4316
  "train_batch_size": 4,
4317
  "trial_name": null,
4318
  "trial_params": null