Training in progress, step 45, checkpoint

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:94227d74def4392cb0858dec5cc79f10f016d6d4cd0918860f43d17e963e6838
 size 125248064

 version https://git-lfs.github.com/spec/v1
+oid sha256:fd339c762d519f025a02f91f9038f9a73f4a39a83087a2c3e458e39ffb1a1c0c
 size 125248064

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:316ade94b6d96eda4bd7e177d6826e75c49fc70e0c9fa9e20ae11e4acc88a7d7
 size 63350356

 version https://git-lfs.github.com/spec/v1
+oid sha256:259dfd28d649cfa0e945d3bf469db65d20e00c520f47c964d923cf55444dc01b
 size 63350356

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8f4a56d3eaf05ae5f699ef13189e24ddd5fcf425cc9cf8207ad6e0944d73bf35
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:bd7553ed48fb9af9185475a0992950d3f88e91369c31402fc9b619ffc0bfb053
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:610e491c82604b1b591117150d7c6581358cc6593f7a436345f16444653cc75d
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:ce5711d70d3076072f14e7b99af7bcdd0964855992649ccba3c74a3698371762
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.016,
   "eval_steps": 1000,
-  "global_step": 40,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -247,13 +247,43 @@
       "learning_rate": 0.00014965986394557826,
       "loss": 1.4394,
       "step": 40
     }
   ],
   "logging_steps": 1,
   "max_steps": 150,
   "num_train_epochs": 1,
   "save_steps": 5,
-  "total_flos": 4574768524247040.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.018,
   "eval_steps": 1000,
+  "global_step": 45,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.00014965986394557826,
       "loss": 1.4394,
       "step": 40
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 0.00014829931972789117,
+      "loss": 1.4033,
+      "step": 41
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 0.0001469387755102041,
+      "loss": 1.5887,
+      "step": 42
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 0.000145578231292517,
+      "loss": 1.8761,
+      "step": 43
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 0.00014421768707482995,
+      "loss": 1.67,
+      "step": 44
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 0.00014285714285714287,
+      "loss": 1.8064,
+      "step": 45
     }
   ],
   "logging_steps": 1,
   "max_steps": 150,
   "num_train_epochs": 1,
   "save_steps": 5,
+  "total_flos": 5322104911872000.0,
   "trial_name": null,
   "trial_params": null
 }