Training in progress, step 60, checkpoint

Browse files

Files changed (5) hide show

last-checkpoint/adapter_model.safetensors +1 -1
last-checkpoint/optimizer.pt +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +63 -3

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:22660376d335aa7c59ae2006d76a706940c8aef4af7c011c7e7d2abeea1a39af
 size 125248064

 version https://git-lfs.github.com/spec/v1
+oid sha256:4e7e060c76e33b4ea8f472bc3ffe35c3c89700f29dc8ddf1785b36bfc5783f0d
 size 125248064

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:99711f18552ca634897d88e6cf50fb107c5ac591d8d935086635c8d58ba450dc
 size 63350356

 version https://git-lfs.github.com/spec/v1
+oid sha256:3d9a325ae4a57eb8dda64125b9bda977c4f29163f541340e3166315d367c30e7
 size 63350356

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:47f6661d5d07de5b2df0d6c9e638f52a46b71c0872bae5b8e7ca87f35bf01fa4
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:78da1da061288012ca67a39eca3ceec230fb3877f3be89de615db089beb7984c
 size 14244

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:fa5dbfbb9e4d48e480300700a77d16d14549c19a56fbfb81fe15f5b2fffbce24
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:b0f02c8a54d03bd9dfb0939ad3018ed1dc368b994677a1af7e7d58a0b3322f4b
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.02,
   "eval_steps": 1000,
-  "global_step": 50,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -307,13 +307,73 @@
       "learning_rate": 0.00013605442176870748,
       "loss": 1.3797,
       "step": 50
     }
   ],
   "logging_steps": 1,
   "max_steps": 150,
   "num_train_epochs": 1,
   "save_steps": 5,
-  "total_flos": 5737824304988160.0,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.024,
   "eval_steps": 1000,
+  "global_step": 60,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 0.00013605442176870748,
       "loss": 1.3797,
       "step": 50
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 0.0001346938775510204,
+      "loss": 1.7408,
+      "step": 51
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 0.00013333333333333334,
+      "loss": 1.6008,
+      "step": 52
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 0.00013197278911564626,
+      "loss": 1.5121,
+      "step": 53
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 0.00013061224489795917,
+      "loss": 1.3599,
+      "step": 54
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 0.00012925170068027212,
+      "loss": 1.4465,
+      "step": 55
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 0.00012789115646258506,
+      "loss": 1.6332,
+      "step": 56
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 0.00012653061224489798,
+      "loss": 1.6305,
+      "step": 57
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 0.0001251700680272109,
+      "loss": 1.5599,
+      "step": 58
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 0.0001238095238095238,
+      "loss": 1.8265,
+      "step": 59
+    },
+    {
+      "epoch": 0.02,
+      "learning_rate": 0.00012244897959183676,
+      "loss": 1.7149,
+      "step": 60
     }
   ],
   "logging_steps": 1,
   "max_steps": 150,
   "num_train_epochs": 1,
   "save_steps": 5,
+  "total_flos": 6638833090068480.0,
   "trial_name": null,
   "trial_params": null
 }