Training in progress, epoch 1

Files changed (5) hide show

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6352a74e314452393f2a2fcf071c68c935c571007dfbcc47e746cf616a7246a1
 size 267832560

 version https://git-lfs.github.com/spec/v1
+oid sha256:41992a55aa9943c8302d141033b567a11ee530849b4fe2c77b7578e46eaf5a62
 size 267832560

tmp-checkpoint-175/model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6352a74e314452393f2a2fcf071c68c935c571007dfbcc47e746cf616a7246a1
 size 267832560

 version https://git-lfs.github.com/spec/v1
+oid sha256:41992a55aa9943c8302d141033b567a11ee530849b4fe2c77b7578e46eaf5a62
 size 267832560

tmp-checkpoint-175/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:467810065677088ea64b1a84b5d3872a1458ff620639aee59220366634b1d3ea
 size 535727290

 version https://git-lfs.github.com/spec/v1
+oid sha256:f098f42091324014d70498dda49fcd2e57bbc8352875cb37f6b33abafebebd92
 size 535727290

tmp-checkpoint-175/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c58ef9a709639d15ce823cbab1c94a327f84302849ffa232663b1d79c1fa4e24
 size 14244

 version https://git-lfs.github.com/spec/v1
+oid sha256:2799fb355a6059a45cee9f0cd6d7dec02193106ed08b481f241a6fee90738b0d
 size 14244

tmp-checkpoint-175/trainer_state.json CHANGED Viewed

@@ -11,29 +11,29 @@
     {
       "epoch": 0.29,
       "learning_rate": 1.0000000000000002e-06,
-      "loss": 0.5522,
       "step": 50
     },
     {
       "epoch": 0.57,
       "learning_rate": 2.0000000000000003e-06,
-      "loss": 0.553,
       "step": 100
     },
     {
       "epoch": 0.86,
       "learning_rate": 3e-06,
-      "loss": 0.5327,
       "step": 150
     },
     {
       "epoch": 1.0,
       "eval_accuracy": 0.7685714285714286,
       "eval_f1": 0.8691437802907915,
-      "eval_loss": 0.5155649185180664,
-      "eval_runtime": 10.9449,
-      "eval_samples_per_second": 63.957,
-      "eval_steps_per_second": 4.02,
       "step": 175
     }
   ],

     {
       "epoch": 0.29,
       "learning_rate": 1.0000000000000002e-06,
+      "loss": 0.5582,
       "step": 50
     },
     {
       "epoch": 0.57,
       "learning_rate": 2.0000000000000003e-06,
+      "loss": 0.5351,
       "step": 100
     },
     {
       "epoch": 0.86,
       "learning_rate": 3e-06,
+      "loss": 0.541,
       "step": 150
     },
     {
       "epoch": 1.0,
       "eval_accuracy": 0.7685714285714286,
       "eval_f1": 0.8691437802907915,
+      "eval_loss": 0.5197482705116272,
+      "eval_runtime": 11.1124,
+      "eval_samples_per_second": 62.992,
+      "eval_steps_per_second": 3.96,
       "step": 175
     }
   ],