Training in progress, step 10, checkpoint

Files changed (5) hide show

last-checkpoint/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:911fc2c2022185fd1fe2e8655a9d0239b5e0657efa559c0414477b1605337408
 size 891644712

 version https://git-lfs.github.com/spec/v1
+oid sha256:ab8d748fd8f20e14a3cda2d877038ce59887130178c068dcafb79817213c24e1
 size 891644712

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:488f963d7990918726aa5581ebf3fd2337a4246d36e64222860a7927f9e82109
 size 1783444794

 version https://git-lfs.github.com/spec/v1
+oid sha256:00bca8fedb1bc6c25e6e507abe70894fe1954894c658291feb63df23505cbe3e
 size 1783444794

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6361784e84b3b22b2e079b3971edd2b6754ea45276d3b8359a98028c3ee0fa66
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:70357fb90a1dcb5ff229b8259118cfc08b286f367541b00f95c942e294080e49
 size 14244

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -7,8 +7,44 @@
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
-  "log_history": [],
-  "logging_steps": 50,
   "max_steps": 3606,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 2,

   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.0011092623405435386,
+      "grad_norm": 80.64155578613281,
+      "learning_rate": 3.6697247706422022e-06,
+      "loss": 13.4594,
+      "step": 2
+    },
+    {
+      "epoch": 0.0022185246810870773,
+      "grad_norm": 66.91927337646484,
+      "learning_rate": 7.3394495412844045e-06,
+      "loss": 13.8607,
+      "step": 4
+    },
+    {
+      "epoch": 0.0033277870216306157,
+      "grad_norm": 63.7406005859375,
+      "learning_rate": 1.1009174311926607e-05,
+      "loss": 13.0338,
+      "step": 6
+    },
+    {
+      "epoch": 0.004437049362174155,
+      "grad_norm": 61.71236801147461,
+      "learning_rate": 1.4678899082568809e-05,
+      "loss": 12.9429,
+      "step": 8
+    },
+    {
+      "epoch": 0.005546311702717693,
+      "grad_norm": 63.84341812133789,
+      "learning_rate": 1.834862385321101e-05,
+      "loss": 12.5906,
+      "step": 10
+    }
+  ],
+  "logging_steps": 2,
   "max_steps": 3606,
   "num_input_tokens_seen": 0,
   "num_train_epochs": 2,

last-checkpoint/training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4979aacbf97f1a01d64b1b1ad49db487ea684ad8d09e1547b42889a05eada653
 size 5304

 version https://git-lfs.github.com/spec/v1
+oid sha256:626d772bac197cb38cc6281159e89ab89ec3be67c70cfa94c2b35d721cf3214f
 size 5304