ncbateman committed on
Commit
0274c8a
1 Parent(s): 24dbaa7

Training in progress, step 605, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2a11def1b8890ff338c8c007d664175329cb9dcda5b586da88c0224efb7c1162
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7b390cff10ccb0462e2ce56478461d8e6338b504fc23e78bc158e0819d8dc9de
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:bdbd37404bc8a5fa123ffac8185bfbd34fb1ed364fd02edc69624ad20d060c6c
3
  size 49846644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:286cc2bd89d71803d1810c6df9f8f1ffd3acec5c70032db2dcefd9830c184d3f
3
  size 49846644
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:95ccc841f095274b3bf1305720cff27c6b752d6dc6d8c301879306023e700650
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a876f1e76952adad9028628bf8945815972da7c35421764155ece90dc00dd324
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5211010f14f9c1fb779ee2261873fc677d85f915b6ea93780c3196c674072288
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0544bca5420fca1dbd853da9c587baf2b7fb350e9011928f11101b6ff88e6e56
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.7764477515367195,
5
  "eval_steps": 386,
6
- "global_step": 600,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -4223,6 +4223,41 @@
4223
  "learning_rate": 9.494572504247593e-05,
4224
  "loss": 0.9044,
4225
  "step": 600
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4226
  }
4227
  ],
4228
  "logging_steps": 1,
@@ -4242,7 +4277,7 @@
4242
  "attributes": {}
4243
  }
4244
  },
4245
- "total_flos": 6.707623030161408e+17,
4246
  "train_batch_size": 4,
4247
  "trial_name": null,
4248
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.7829181494661922,
5
  "eval_steps": 386,
6
+ "global_step": 605,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
4223
  "learning_rate": 9.494572504247593e-05,
4224
  "loss": 0.9044,
4225
  "step": 600
4226
+ },
4227
+ {
4228
+ "epoch": 0.7777418311226141,
4229
+ "grad_norm": 0.8177486062049866,
4230
+ "learning_rate": 9.492764667543252e-05,
4231
+ "loss": 0.8132,
4232
+ "step": 601
4233
+ },
4234
+ {
4235
+ "epoch": 0.7790359107085085,
4236
+ "grad_norm": 1.0061938762664795,
4237
+ "learning_rate": 9.490953776174955e-05,
4238
+ "loss": 0.9204,
4239
+ "step": 602
4240
+ },
4241
+ {
4242
+ "epoch": 0.7803299902944031,
4243
+ "grad_norm": 0.8224837779998779,
4244
+ "learning_rate": 9.489139831373944e-05,
4245
+ "loss": 0.7909,
4246
+ "step": 603
4247
+ },
4248
+ {
4249
+ "epoch": 0.7816240698802976,
4250
+ "grad_norm": 0.7812953591346741,
4251
+ "learning_rate": 9.48732283437353e-05,
4252
+ "loss": 0.9583,
4253
+ "step": 604
4254
+ },
4255
+ {
4256
+ "epoch": 0.7829181494661922,
4257
+ "grad_norm": 0.8498075604438782,
4258
+ "learning_rate": 9.485502786409107e-05,
4259
+ "loss": 1.0692,
4260
+ "step": 605
4261
  }
4262
  ],
4263
  "logging_steps": 1,
 
4277
  "attributes": {}
4278
  }
4279
  },
4280
+ "total_flos": 6.763519888746086e+17,
4281
  "train_batch_size": 4,
4282
  "trial_name": null,
4283
  "trial_params": null