ncbateman commited on
Commit
f4f13ca
·
verified ·
1 Parent(s): 8339968

Training in progress, step 580, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8dc3759cb3eadde8f65f5a3d7697045cdf5905ba99f1c6eaf2ca3a7844ad2aca
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ddd8d5d17a70fc79518195b5b2e2d18e0edf35451d2de3c1d4af60412a1a30e8
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8685b80d11ca02ce5247ab56c8fdc4d82bb07cfe0c06ad76dd35d09f90963d57
3
  size 49846644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1105fd8323adc5ab31859ebf0c1f559487e30aa157c674ed5d23d9852296ed98
3
  size 49846644
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:530917c5e79645a47e31080d2f68465b75947e6f663e644f4e8388bf2a65638b
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48e8d93d81cb229c0956f2142d68e1f8aa0357ca11d56ce040bb137cf176e02f
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:95e7e7df729679e04b7adacc504f1466aebac28d86d657be5afa757859f96a7b
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:49970088ac3a5ad000c30d8106322041a0265ebced6d734c6afdb98d800f2095
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.7440957618893562,
5
  "eval_steps": 386,
6
- "global_step": 575,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -4048,6 +4048,41 @@
4048
  "learning_rate": 9.538772097304521e-05,
4049
  "loss": 0.8442,
4050
  "step": 575
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
4051
  }
4052
  ],
4053
  "logging_steps": 1,
@@ -4067,7 +4102,7 @@
4067
  "attributes": {}
4068
  }
4069
  },
4070
- "total_flos": 6.428138737238016e+17,
4071
  "train_batch_size": 4,
4072
  "trial_name": null,
4073
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.7505661598188289,
5
  "eval_steps": 386,
6
+ "global_step": 580,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
4048
  "learning_rate": 9.538772097304521e-05,
4049
  "loss": 0.8442,
4050
  "step": 575
4051
+ },
4052
+ {
4053
+ "epoch": 0.7453898414752508,
4054
+ "grad_norm": 0.7087002992630005,
4055
+ "learning_rate": 9.537041021262072e-05,
4056
+ "loss": 0.8004,
4057
+ "step": 576
4058
+ },
4059
+ {
4060
+ "epoch": 0.7466839210611452,
4061
+ "grad_norm": 0.8022588491439819,
4062
+ "learning_rate": 9.535306860451849e-05,
4063
+ "loss": 0.9188,
4064
+ "step": 577
4065
+ },
4066
+ {
4067
+ "epoch": 0.7479780006470398,
4068
+ "grad_norm": 0.8022916316986084,
4069
+ "learning_rate": 9.533569616052921e-05,
4070
+ "loss": 0.9815,
4071
+ "step": 578
4072
+ },
4073
+ {
4074
+ "epoch": 0.7492720802329343,
4075
+ "grad_norm": 0.6670771837234497,
4076
+ "learning_rate": 9.531829289246452e-05,
4077
+ "loss": 0.812,
4078
+ "step": 579
4079
+ },
4080
+ {
4081
+ "epoch": 0.7505661598188289,
4082
+ "grad_norm": 0.7644294500350952,
4083
+ "learning_rate": 9.530085881215705e-05,
4084
+ "loss": 0.8092,
4085
+ "step": 580
4086
  }
4087
  ],
4088
  "logging_steps": 1,
 
4102
  "attributes": {}
4103
  }
4104
  },
4105
+ "total_flos": 6.484035595822694e+17,
4106
  "train_batch_size": 4,
4107
  "trial_name": null,
4108
  "trial_params": null