ncbateman commited on
Commit
c41efc1
1 Parent(s): ca301c5

Training in progress, step 655, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:a3668fa34724afb7451663beb5c2888ddcb2b7ecddb13ed07d944025c27d8d3b
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3c5083d6fe7fc6ad40025db9a82bb1249d80b2a676e2a697dce57e7e8f6ff900
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:03eb30e093c78829d55e5b35712320efbf2416ee2737745a276186c084bbdecb
3
  size 49846644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8d2e8d1efd498662ea22edb0b65f53bc5fc876649c55d813f1c68179c92087b6
3
  size 49846644
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9f89037ac2abeb6171c1ce95a77a94c808e277b9f70abf8b11f093a79735219d
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:eaffbd51d7716e49736bc2fc49a38c283c724ab2443bef57f7bac6587bb0f07f
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:f40d91018758ada40c1cb9514ff9b9e8ed129fd32f51a6eaa9ac898e033c2d44
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ed8ec70c66524f977f482912ad14e6e50f55a63de0200f38bf63dd1a0f5fc3f3
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.8411517308314461,
5
  "eval_steps": 386,
6
- "global_step": 650,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -4573,6 +4573,41 @@
4573
  "learning_rate": 9.400463314275943e-05,
4574
  "loss": 0.9865,
4575
  "step": 650
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4576
  }
4577
  ],
4578
  "logging_steps": 1,
@@ -4592,7 +4627,7 @@
4592
  "attributes": {}
4593
  }
4594
  },
4595
- "total_flos": 7.266591616008192e+17,
4596
  "train_batch_size": 4,
4597
  "trial_name": null,
4598
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.8476221287609188,
5
  "eval_steps": 386,
6
+ "global_step": 655,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
4573
  "learning_rate": 9.400463314275943e-05,
4574
  "loss": 0.9865,
4575
  "step": 650
4576
+ },
4577
+ {
4578
+ "epoch": 0.8424458104173407,
4579
+ "grad_norm": 0.7086622714996338,
4580
+ "learning_rate": 9.398504293135507e-05,
4581
+ "loss": 0.8451,
4582
+ "step": 651
4583
+ },
4584
+ {
4585
+ "epoch": 0.8437398900032352,
4586
+ "grad_norm": 0.8999130725860596,
4587
+ "learning_rate": 9.396542281419445e-05,
4588
+ "loss": 0.919,
4589
+ "step": 652
4590
+ },
4591
+ {
4592
+ "epoch": 0.8450339695891297,
4593
+ "grad_norm": 0.8439355492591858,
4594
+ "learning_rate": 9.39457728046174e-05,
4595
+ "loss": 0.808,
4596
+ "step": 653
4597
+ },
4598
+ {
4599
+ "epoch": 0.8463280491750242,
4600
+ "grad_norm": 0.863634467124939,
4601
+ "learning_rate": 9.392609291598413e-05,
4602
+ "loss": 1.0594,
4603
+ "step": 654
4604
+ },
4605
+ {
4606
+ "epoch": 0.8476221287609188,
4607
+ "grad_norm": 0.8126616477966309,
4608
+ "learning_rate": 9.390638316167512e-05,
4609
+ "loss": 1.0526,
4610
+ "step": 655
4611
  }
4612
  ],
4613
  "logging_steps": 1,
 
4627
  "attributes": {}
4628
  }
4629
  },
4630
+ "total_flos": 7.32248847459287e+17,
4631
  "train_batch_size": 4,
4632
  "trial_name": null,
4633
  "trial_params": null