ncbateman commited on
Commit
3be0a29
1 Parent(s): 3d54ca6

Training in progress, step 795, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:af1d514de1a6c8c240084c2abe4fb229e803cbb3f979d7290c1732d9e8a5122b
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:010c2a2b840c3fde77f5f0db5ad5bd6f0a52b58296feec5b8fd9dc9e42d54370
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3b7db8cc663173d80853c1b54864d85bd623d219d83845ca314b5cda205766bf
3
  size 49846644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:feeb714d469e3a6e68b9df8c7aa45ef9b97a6c08822ae8c12a628b95f1875fed
3
  size 49846644
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:063fd63bc73224a76249067a1eeeb31dc678e9656124df16bfa7ce512e017f7f
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4c3bbf6e51e06c9204f77b5c5a1350738f864223365e0f7477b14a5405e97ae
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:94c0126f420d4eb985c03c001ae7f8b7fc9b010855fef21b025980a5ae889902
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7396be3b2d86ed6e3fcd71c7b4f2cd360bbd7492a3b7c96b0d16d251f623454
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 1.0223228728566807,
5
  "eval_steps": 386,
6
- "global_step": 790,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -5561,6 +5561,41 @@
5561
  "learning_rate": 9.097729883761976e-05,
5562
  "loss": 0.6884,
5563
  "step": 790
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
5564
  }
5565
  ],
5566
  "logging_steps": 1,
@@ -5580,7 +5615,7 @@
5580
  "attributes": {}
5581
  }
5582
  },
5583
- "total_flos": 8.831004945646879e+17,
5584
  "train_batch_size": 4,
5585
  "trial_name": null,
5586
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 1.0287932707861533,
5
  "eval_steps": 386,
6
+ "global_step": 795,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
5561
  "learning_rate": 9.097729883761976e-05,
5562
  "loss": 0.6884,
5563
  "step": 790
5564
+ },
5565
+ {
5566
+ "epoch": 1.0236169524425751,
5567
+ "grad_norm": 0.7473916411399841,
5568
+ "learning_rate": 9.095366056890302e-05,
5569
+ "loss": 0.7346,
5570
+ "step": 791
5571
+ },
5572
+ {
5573
+ "epoch": 1.0249110320284698,
5574
+ "grad_norm": 0.7097285985946655,
5575
+ "learning_rate": 9.09299944554893e-05,
5576
+ "loss": 0.825,
5577
+ "step": 792
5578
+ },
5579
+ {
5580
+ "epoch": 1.0262051116143642,
5581
+ "grad_norm": 0.7450020909309387,
5582
+ "learning_rate": 9.09063005134694e-05,
5583
+ "loss": 0.8589,
5584
+ "step": 793
5585
+ },
5586
+ {
5587
+ "epoch": 1.027499191200259,
5588
+ "grad_norm": 0.828708291053772,
5589
+ "learning_rate": 9.088257875895297e-05,
5590
+ "loss": 0.8284,
5591
+ "step": 794
5592
+ },
5593
+ {
5594
+ "epoch": 1.0287932707861533,
5595
+ "grad_norm": 0.7440184354782104,
5596
+ "learning_rate": 9.085882920806861e-05,
5597
+ "loss": 0.8285,
5598
+ "step": 795
5599
  }
5600
  ],
5601
  "logging_steps": 1,
 
5615
  "attributes": {}
5616
  }
5617
  },
5618
+ "total_flos": 8.886901804231557e+17,
5619
  "train_batch_size": 4,
5620
  "trial_name": null,
5621
  "trial_params": null