Training in progress, step 600

Browse files

Files changed (10) hide show

{checkpoint-300 → checkpoint-600}/config.json +0 -0
{checkpoint-300 → checkpoint-600}/optimizer.pt +1 -1
{checkpoint-300 → checkpoint-600}/preprocessor_config.json +0 -0
{checkpoint-300 → checkpoint-600}/pytorch_model.bin +1 -1
{checkpoint-300 → checkpoint-600}/rng_state.pth +1 -1
{checkpoint-300 → checkpoint-600}/scaler.pt +1 -1
{checkpoint-300 → checkpoint-600}/scheduler.pt +1 -1
{checkpoint-300 → checkpoint-600}/trainer_state.json +120 -3
{checkpoint-300 → checkpoint-600}/training_args.bin +0 -0
pytorch_model.bin +1 -1

{checkpoint-300 → checkpoint-600}/config.json RENAMED Viewed

File without changes

{checkpoint-300 → checkpoint-600}/optimizer.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4851e5921f7325e240731959feb278f899280909b8e2cb6567d27fae4017c474
 size 2490337809

 version https://git-lfs.github.com/spec/v1
+oid sha256:94e544ed6fc2d04d9e3d9655de3eea506999b2814daab419e0d050c27a4a370f
 size 2490337809

{checkpoint-300 → checkpoint-600}/preprocessor_config.json RENAMED Viewed

File without changes

{checkpoint-300 → checkpoint-600}/pytorch_model.bin RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:434bb79de859e935ca1aaf8411c1439a4e24ef8e2396b088b07525e56e0847d8
 size 1262063089

 version https://git-lfs.github.com/spec/v1
+oid sha256:3baffe7a116d58666fc0726fb4fa6188834614eac15e96843270fc53529b943e
 size 1262063089

{checkpoint-300 → checkpoint-600}/rng_state.pth RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:04e54ce0be1689f12766dccd1bd35050e0f0346ef0556646dc973c608610db2f
 size 14567

 version https://git-lfs.github.com/spec/v1
+oid sha256:f58a88b760d3a9745a43789af262417186d48a5e0a471e8a2a080c8b3681cf9a
 size 14567

{checkpoint-300 → checkpoint-600}/scaler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:0967b9f865f16344c55f5ccc3cf7d6e8e97ca61dda304e931ca6bad130f48dd1
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:4e8415b86bbce347c0df306b84a695add049c2a3b2d0b6f4dda3bf036d341150
 size 559

{checkpoint-300 → checkpoint-600}/scheduler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:32701a4051ea5d746149966b47cdca0f213673b7e546ae3ee3646c1f9bbb83d6
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:a6b4eb516015852d76c10d5b0c139cec1e488aa3b53e560bc99f9c2300e33423
 size 623

{checkpoint-300 → checkpoint-600}/trainer_state.json RENAMED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 3.2950819672131146,
-  "global_step": 300,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -123,11 +123,128 @@
       "eval_steps_per_second": 0.782,
       "eval_wer": 1.0,
       "step": 300
     }
   ],
   "max_steps": 4550,
   "num_train_epochs": 50,
-  "total_flos": 4.675293533891495e+18,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 6.590163934426229,
+  "global_step": 600,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_steps_per_second": 0.782,
       "eval_wer": 1.0,
       "step": 300
+    },
+    {
+      "epoch": 3.51,
+      "learning_rate": 4e-05,
+      "loss": 3.0511,
+      "step": 320
+    },
+    {
+      "epoch": 3.73,
+      "learning_rate": 4.25e-05,
+      "loss": 3.0358,
+      "step": 340
+    },
+    {
+      "epoch": 3.95,
+      "learning_rate": 4.4999999999999996e-05,
+      "loss": 3.0416,
+      "step": 360
+    },
+    {
+      "epoch": 4.17,
+      "learning_rate": 4.75e-05,
+      "loss": 3.1053,
+      "step": 380
+    },
+    {
+      "epoch": 4.39,
+      "learning_rate": 5e-05,
+      "loss": 3.0314,
+      "step": 400
+    },
+    {
+      "epoch": 4.39,
+      "eval_loss": 3.0990231037139893,
+      "eval_runtime": 198.3688,
+      "eval_samples_per_second": 24.414,
+      "eval_steps_per_second": 0.766,
+      "eval_wer": 1.0,
+      "step": 400
+    },
+    {
+      "epoch": 4.61,
+      "learning_rate": 5.25e-05,
+      "loss": 3.0309,
+      "step": 420
+    },
+    {
+      "epoch": 4.83,
+      "learning_rate": 5.5e-05,
+      "loss": 3.0259,
+      "step": 440
+    },
+    {
+      "epoch": 5.05,
+      "learning_rate": 5.75e-05,
+      "loss": 3.0998,
+      "step": 460
+    },
+    {
+      "epoch": 5.27,
+      "learning_rate": 6e-05,
+      "loss": 3.0152,
+      "step": 480
+    },
+    {
+      "epoch": 5.49,
+      "learning_rate": 6.25e-05,
+      "loss": 3.0129,
+      "step": 500
+    },
+    {
+      "epoch": 5.49,
+      "eval_loss": 3.039973497390747,
+      "eval_runtime": 190.8567,
+      "eval_samples_per_second": 25.375,
+      "eval_steps_per_second": 0.796,
+      "eval_wer": 1.0,
+      "step": 500
+    },
+    {
+      "epoch": 5.71,
+      "learning_rate": 6.500000000000001e-05,
+      "loss": 3.0088,
+      "step": 520
+    },
+    {
+      "epoch": 5.93,
+      "learning_rate": 6.75e-05,
+      "loss": 3.0051,
+      "step": 540
+    },
+    {
+      "epoch": 6.15,
+      "learning_rate": 7.000000000000001e-05,
+      "loss": 3.073,
+      "step": 560
+    },
+    {
+      "epoch": 6.37,
+      "learning_rate": 7.25e-05,
+      "loss": 3.0031,
+      "step": 580
+    },
+    {
+      "epoch": 6.59,
+      "learning_rate": 7.5e-05,
+      "loss": 2.9964,
+      "step": 600
+    },
+    {
+      "epoch": 6.59,
+      "eval_loss": 2.998962640762329,
+      "eval_runtime": 193.5213,
+      "eval_samples_per_second": 25.026,
+      "eval_steps_per_second": 0.785,
+      "eval_wer": 1.0,
+      "step": 600
     }
   ],
   "max_steps": 4550,
   "num_train_epochs": 50,
+  "total_flos": 9.32024224555606e+18,
   "trial_name": null,
   "trial_params": null
 }

{checkpoint-300 → checkpoint-600}/training_args.bin RENAMED Viewed

File without changes

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ee400442c70fe28b4032830f08f4c31605f74d5b5778895b5f30b7cad432bdcd
 size 1262063089

 version https://git-lfs.github.com/spec/v1
+oid sha256:3baffe7a116d58666fc0726fb4fa6188834614eac15e96843270fc53529b943e
 size 1262063089