Training in progress, step 17500

Browse files

Files changed (7) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +153 -3
pytorch_model.bin +1 -1
runs/Dec05_03-30-37_fbdce2302f52/events.out.tfevents.1670211053.fbdce2302f52.24.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bf2370268fbd4ed9711f23148e5e1266d41ae04c0e88d432b6280d6684096467
 size 1115513717

 version https://git-lfs.github.com/spec/v1
+oid sha256:70920a080f4832237ce7c6ba0b7f90a36204857a2597dfa2c6caf8d3a72f7e7f
 size 1115513717

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:376812cf708ab7061c8c4ac1b0483e37e40aac837abe95f3b8ae1e5922038a43
 size 557969145

 version https://git-lfs.github.com/spec/v1
+oid sha256:3916aa768b3547ed097d45447da1e5f44df02e98af7f4c9081b40d19b99444c0
 size 557969145

last-checkpoint/rng_state.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:142093c2e302563f6acf00427729bb94740050933baea33071c54bdbba785272
 size 15523

 version https://git-lfs.github.com/spec/v1
+oid sha256:96d08c867edbcec7c00e24e146bf3d6892636f95bde24b387b90e00d4e61e819
 size 15523

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6c6a0c5b7f631fe6cce73745fa375c6f37e5118cbc55c65d587e9651ec9176ce
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:eab84ebacf80b8995a27a6b564c2dd8315f1d3f62ec0076da07f78d4762c61eb
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 0.8847991505928154,
-  "global_step": 15000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -914,11 +914,161 @@
       "learning_rate": 8.225732450678378e-07,
       "loss": 0.6941,
       "step": 15000
     }
   ],
   "max_steps": 30516,
   "num_train_epochs": 2,
-  "total_flos": 9.14703293177856e+16,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 1.032265675691618,
+  "global_step": 17500,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "learning_rate": 8.225732450678378e-07,
       "loss": 0.6941,
       "step": 15000
+    },
+    {
+      "epoch": 0.89,
+      "learning_rate": 4.948548207380218e-07,
+      "loss": 0.7049,
+      "step": 15100
+    },
+    {
+      "epoch": 0.9,
+      "learning_rate": 1.6713639640820606e-07,
+      "loss": 0.6312,
+      "step": 15200
+    },
+    {
+      "epoch": 0.9,
+      "learning_rate": 0.0,
+      "loss": 0.6369,
+      "step": 15300
+    },
+    {
+      "epoch": 0.91,
+      "learning_rate": 0.0,
+      "loss": 0.6321,
+      "step": 15400
+    },
+    {
+      "epoch": 0.91,
+      "learning_rate": 0.0,
+      "loss": 0.7197,
+      "step": 15500
+    },
+    {
+      "epoch": 0.92,
+      "learning_rate": 0.0,
+      "loss": 0.6451,
+      "step": 15600
+    },
+    {
+      "epoch": 0.93,
+      "learning_rate": 0.0,
+      "loss": 0.6704,
+      "step": 15700
+    },
+    {
+      "epoch": 0.93,
+      "learning_rate": 0.0,
+      "loss": 0.6144,
+      "step": 15800
+    },
+    {
+      "epoch": 0.94,
+      "learning_rate": 0.0,
+      "loss": 0.6497,
+      "step": 15900
+    },
+    {
+      "epoch": 0.94,
+      "learning_rate": 0.0,
+      "loss": 0.7311,
+      "step": 16000
+    },
+    {
+      "epoch": 0.95,
+      "learning_rate": 0.0,
+      "loss": 0.6799,
+      "step": 16100
+    },
+    {
+      "epoch": 0.96,
+      "learning_rate": 0.0,
+      "loss": 0.6354,
+      "step": 16200
+    },
+    {
+      "epoch": 0.96,
+      "learning_rate": 0.0,
+      "loss": 0.6063,
+      "step": 16300
+    },
+    {
+      "epoch": 0.97,
+      "learning_rate": 0.0,
+      "loss": 0.6489,
+      "step": 16400
+    },
+    {
+      "epoch": 0.97,
+      "learning_rate": 0.0,
+      "loss": 0.6334,
+      "step": 16500
+    },
+    {
+      "epoch": 0.98,
+      "learning_rate": 0.0,
+      "loss": 0.689,
+      "step": 16600
+    },
+    {
+      "epoch": 0.99,
+      "learning_rate": 0.0,
+      "loss": 0.6852,
+      "step": 16700
+    },
+    {
+      "epoch": 0.99,
+      "learning_rate": 0.0,
+      "loss": 0.6481,
+      "step": 16800
+    },
+    {
+      "epoch": 1.0,
+      "learning_rate": 0.0,
+      "loss": 0.7362,
+      "step": 16900
+    },
+    {
+      "epoch": 1.0,
+      "learning_rate": 0.0,
+      "loss": 0.7102,
+      "step": 17000
+    },
+    {
+      "epoch": 1.01,
+      "learning_rate": 0.0,
+      "loss": 0.6313,
+      "step": 17100
+    },
+    {
+      "epoch": 1.01,
+      "learning_rate": 0.0,
+      "loss": 0.7327,
+      "step": 17200
+    },
+    {
+      "epoch": 1.02,
+      "learning_rate": 0.0,
+      "loss": 0.624,
+      "step": 17300
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 0.0,
+      "loss": 0.6883,
+      "step": 17400
+    },
+    {
+      "epoch": 1.03,
+      "learning_rate": 0.0,
+      "loss": 0.5119,
+      "step": 17500
     }
   ],
   "max_steps": 30516,
   "num_train_epochs": 2,
+  "total_flos": 1.0676522063241216e+17,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:376812cf708ab7061c8c4ac1b0483e37e40aac837abe95f3b8ae1e5922038a43
 size 557969145

 version https://git-lfs.github.com/spec/v1
+oid sha256:3916aa768b3547ed097d45447da1e5f44df02e98af7f4c9081b40d19b99444c0
 size 557969145

runs/Dec05_03-30-37_fbdce2302f52/events.out.tfevents.1670211053.fbdce2302f52.24.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:19a488bda0439719c1c15ecf951d4d1665a47792d76487d0be4947720935c87c
-size 33224

 version https://git-lfs.github.com/spec/v1
+oid sha256:46d026c8117c697ed1221f4329f4a0e25d72fbf3cd5830657ac90bb96ef8f6fe
+size 37185