Training in progress, step 10, checkpoint

Files changed (12) hide show

last-checkpoint/adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1ba4843bab3f6c0de98cf2828f8059fac627894d15376bf6eb4b6b539d909db8
 size 73911112

 version https://git-lfs.github.com/spec/v1
+oid sha256:2fff02c7b4a826fb07ea195bb1a7bb4ffc9d721a69210b761baa58148f930fa7
 size 73911112

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e4d523ab2ba4df3c774b98bf6109a8713c9f0199b76bff1f7449efce144029eb
 size 37965300

 version https://git-lfs.github.com/spec/v1
+oid sha256:319548d2ea9e5b5f008e022dad56cd0f028de3735befddd24f255983fefd537e
 size 37965300

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1881ec4d999362af1e52c36de1e218d3800542004d7f7c7edd42a089b7296ccc
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:6dbb2e8ac6910520ef7694e04efc0c3d22d47c0a6764ae2a666b6a667647ed1d
 size 15984

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:00d02bbc0fa1d27820c289ea283e0155cafcbd62fa1759df4850d0a715649da0
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:5a64ea9853e527aeaa3e3e8ab63280f7a104d71f06cbc00b6586cb1151066797
 size 15984

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c73827ec09ff37ba195a38bf7f08f0537cea0c0a55db5d2fc0d29f759ccdcccb
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:bb597193ff9d2e676d231c4c21c97756a564739529ec012a7405fe102e2d6bf0
 size 15984

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4822c4ae863c6a81149f37fecf8fc589c5a0e68b5f03747420a5cc6ab7af0d14
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:8844277a61aa266c1286de806f9fbc3a0e4ffe07a5d322e90f868a6bef7c6200
 size 15984

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:1e9b440498b750929a8558219fefc2e4ad160122931aa3d6799fc4f65cdd7304
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:516bda9bd375b4dbffe21ea5098d3ba187c60e9ac82d932b20a8bdf7f85f5e7f
 size 15984

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4f0c18fbbe129f61ea282f7dbcc97540666d69c89e3f1cc4842d356efb45d0d6
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:6da94ae89efb6930839681ba2aa052a5e83a69a0af729ccfc303f5699e7189e8
 size 15984

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a99554429161338da1a7001f3a511ce540238038412b9c31276e6f7379ad186a
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:8788fd8bf5c71109ab3d1b1b8fb5df84005194baadaf8d32a3898477ae2e1c3e
 size 15984

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:e39d4edd2882a248daa72fe9c907359ed8ef2a193dbcaec84663291acb998ec0
 size 15984

 version https://git-lfs.github.com/spec/v1
+oid sha256:4b5cb477ad7cfcb7f3e9b4e0628a58437296983ffbd992ed46c97df77959dad1
 size 15984

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:9c8e6b04902f17ae368c3e6cfd97a31ad4de2f025d673daea8c033ce0e260946
 size 1064

 version https://git-lfs.github.com/spec/v1
+oid sha256:bb578e75c11a81e85dda67a691f96ba4793a02960f1409fd3e1511aac873491a
 size 1064

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,9 +1,9 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.0131916452913155,
   "eval_steps": 3,
-  "global_step": 9,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -102,6 +102,13 @@
       "eval_samples_per_second": 76.673,
       "eval_steps_per_second": 9.601,
       "step": 9
     }
   ],
   "logging_steps": 1,
@@ -116,12 +123,12 @@
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
-        "should_training_stop": false
       },
       "attributes": {}
     }
   },
-  "total_flos": 9405135625125888.0,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 0.014657383657017223,
   "eval_steps": 3,
+  "global_step": 10,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 76.673,
       "eval_steps_per_second": 9.601,
       "step": 9
+    },
+    {
+      "epoch": 0.014657383657017223,
+      "grad_norm": 0.09443683177232742,
+      "learning_rate": 0.0002,
+      "loss": 0.7131,
+      "step": 10
     }
   ],
   "logging_steps": 1,
         "should_evaluate": false,
         "should_log": false,
         "should_save": true,
+        "should_training_stop": true
       },
       "attributes": {}
     }
   },
+  "total_flos": 1.045015069458432e+16,
   "train_batch_size": 1,
   "trial_name": null,
   "trial_params": null