ncbateman commited on
Commit
6c8da9c
·
verified ·
1 Parent(s): 7e6a17a

Training in progress, step 325, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6953ae7f6115d570fb8b6044270a4fe2e65715f11390da71b6c6571b692b38fc
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7ea56450fdd0f062e2582b0d9342bc249b9178a0f643c7c9864b7972919084f4
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2125e4e945b6170832b2f6b047046dd51779e474a701b162d37c31462bade964
3
  size 49846644
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a4fa14455bc2fa646a0d1356cf7b7978478e663d2abc89b631beb057c254467b
3
  size 49846644
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6d60ac4f3dfeb480aa47e46e780d6d5afc472bfe9f3793df96d8ba938b9c9522
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7af9f543e1b227e80431d9b71735f56ac10caba331db4119655a613e1f923579
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:259f2542494ed0450cbd0aba881cda09f149af3f98edcffaf21912036f30e17f
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5ebcc6744bfae863fe4396052394cc81a120b788a3be0b48befca2ef92651996
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.4141054674862504,
5
  "eval_steps": 386,
6
- "global_step": 320,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -2255,6 +2255,41 @@
2255
  "learning_rate": 9.876597839525814e-05,
2256
  "loss": 1.1169,
2257
  "step": 320
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
2258
  }
2259
  ],
2260
  "logging_steps": 1,
@@ -2274,7 +2309,7 @@
2274
  "attributes": {}
2275
  }
2276
  },
2277
- "total_flos": 3.5773989494194176e+17,
2278
  "train_batch_size": 4,
2279
  "trial_name": null,
2280
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.42057586541572306,
5
  "eval_steps": 386,
6
+ "global_step": 325,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
2255
  "learning_rate": 9.876597839525814e-05,
2256
  "loss": 1.1169,
2257
  "step": 320
2258
+ },
2259
+ {
2260
+ "epoch": 0.41539954707214494,
2261
+ "grad_norm": 0.7923420667648315,
2262
+ "learning_rate": 9.875685870448672e-05,
2263
+ "loss": 0.9942,
2264
+ "step": 321
2265
+ },
2266
+ {
2267
+ "epoch": 0.4166936266580395,
2268
+ "grad_norm": 0.7265552282333374,
2269
+ "learning_rate": 9.874770586356616e-05,
2270
+ "loss": 1.0377,
2271
+ "step": 322
2272
+ },
2273
+ {
2274
+ "epoch": 0.417987706243934,
2275
+ "grad_norm": 0.7586270570755005,
2276
+ "learning_rate": 9.873851987871954e-05,
2277
+ "loss": 0.9172,
2278
+ "step": 323
2279
+ },
2280
+ {
2281
+ "epoch": 0.41928178582982856,
2282
+ "grad_norm": 0.782192587852478,
2283
+ "learning_rate": 9.872930075619249e-05,
2284
+ "loss": 0.9219,
2285
+ "step": 324
2286
+ },
2287
+ {
2288
+ "epoch": 0.42057586541572306,
2289
+ "grad_norm": 0.8508116602897644,
2290
+ "learning_rate": 9.872004850225313e-05,
2291
+ "loss": 0.939,
2292
+ "step": 325
2293
  }
2294
  ],
2295
  "logging_steps": 1,
 
2309
  "attributes": {}
2310
  }
2311
  },
2312
+ "total_flos": 3.633295808004096e+17,
2313
  "train_batch_size": 4,
2314
  "trial_name": null,
2315
  "trial_params": null