ncbateman committed on
Commit
35323cd
·
verified ·
1 Parent(s): fa3925c

Training in progress, step 185, checkpoint

Browse files
last-checkpoint/adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:54852292744f440802866f2a783ac23ba6ef16d422e18372b624c56a9993fd60
3
  size 97307544
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:53f840c456e95ff795bb55a979f354b5ff45be3d04c09c6b95856e15c3fa87aa
3
  size 97307544
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:2e585efd52a8e20e6ad89ed740f3d2f593db339c6c6144c06fc288ce92cceb4d
3
  size 49846260
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:828ab7a81b68551a70d539cfd2cac13e0329b266849a1e49be1a7378953f427b
3
  size 49846260
last-checkpoint/rng_state.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:0be8ec8c2101cfccd393ed730b21787429a8999e0b138398d5c14f37c51656e9
3
  size 14244
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8fb359c3a6e91a0edc2b5df10f0aa833ed71c37ab5b62579c99595688bae7c64
3
  size 14244
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:7d26ba877a96beecd6515b5aee3300dc989b5588ecbd143a4bad8685b1c07c60
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:653ee3fc89860e50462e7548d430e695c40eaf8677cc1507132629ab8dddb6e3
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 0.23293432546101586,
5
  "eval_steps": 386,
6
- "global_step": 180,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1275,6 +1275,41 @@
1275
  "learning_rate": 9.971301406367644e-05,
1276
  "loss": 0.8619,
1277
  "step": 180
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1278
  }
1279
  ],
1280
  "logging_steps": 1,
@@ -1294,7 +1329,7 @@
1294
  "attributes": {}
1295
  }
1296
  },
1297
- "total_flos": 2.0122869090484224e+17,
1298
  "train_batch_size": 4,
1299
  "trial_name": null,
1300
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 0.23940472339048852,
5
  "eval_steps": 386,
6
+ "global_step": 185,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1275
  "learning_rate": 9.971301406367644e-05,
1276
  "loss": 0.8619,
1277
  "step": 180
1278
+ },
1279
+ {
1280
+ "epoch": 0.2342284050469104,
1281
+ "grad_norm": 0.6980477571487427,
1282
+ "learning_rate": 9.970858622429579e-05,
1283
+ "loss": 0.8271,
1284
+ "step": 181
1285
+ },
1286
+ {
1287
+ "epoch": 0.23552248463280492,
1288
+ "grad_norm": 0.954387903213501,
1289
+ "learning_rate": 9.970412458767943e-05,
1290
+ "loss": 0.8465,
1291
+ "step": 182
1292
+ },
1293
+ {
1294
+ "epoch": 0.23681656421869945,
1295
+ "grad_norm": 0.8425692915916443,
1296
+ "learning_rate": 9.969962915686083e-05,
1297
+ "loss": 0.8893,
1298
+ "step": 183
1299
+ },
1300
+ {
1301
+ "epoch": 0.23811064380459399,
1302
+ "grad_norm": 0.8565071225166321,
1303
+ "learning_rate": 9.969509993489647e-05,
1304
+ "loss": 0.939,
1305
+ "step": 184
1306
+ },
1307
+ {
1308
+ "epoch": 0.23940472339048852,
1309
+ "grad_norm": 0.8831691145896912,
1310
+ "learning_rate": 9.969053692486583e-05,
1311
+ "loss": 0.8907,
1312
+ "step": 185
1313
  }
1314
  ],
1315
  "logging_steps": 1,
 
1329
  "attributes": {}
1330
  }
1331
  },
1332
+ "total_flos": 2.0681837676331008e+17,
1333
  "train_batch_size": 4,
1334
  "trial_name": null,
1335
  "trial_params": null