Training in progress, step 700

Browse files

Files changed (10) hide show

{checkpoint-400 → checkpoint-700}/config.json +0 -0
{checkpoint-400 → checkpoint-700}/optimizer.pt +1 -1
{checkpoint-400 → checkpoint-700}/preprocessor_config.json +0 -0
{checkpoint-400 → checkpoint-700}/pytorch_model.bin +1 -1
{checkpoint-400 → checkpoint-700}/rng_state.pth +2 -2
{checkpoint-400 → checkpoint-700}/scaler.pt +1 -1
{checkpoint-400 → checkpoint-700}/scheduler.pt +1 -1
{checkpoint-400 → checkpoint-700}/trainer_state.json +120 -3
{checkpoint-400 → checkpoint-700}/training_args.bin +0 -0
pytorch_model.bin +1 -1

{checkpoint-400 → checkpoint-700}/config.json RENAMED Viewed

File without changes

{checkpoint-400 → checkpoint-700}/optimizer.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b573eee933c6c36bd4ddb6906221d3843d7e3e13dab0b96a39404d3a30f74898
 size 2490337809

 version https://git-lfs.github.com/spec/v1
+oid sha256:2734597abb10a2a590cf139e66decfdf1bc18e26d32aa5f4749a68f74109f763
 size 2490337809

{checkpoint-400 → checkpoint-700}/preprocessor_config.json RENAMED Viewed

File without changes

{checkpoint-400 → checkpoint-700}/pytorch_model.bin RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:28c7e3ec36d37a20298023cfa6ac730ae02e82d170ef8859ec5740936e2bc809
 size 1262063089

 version https://git-lfs.github.com/spec/v1
+oid sha256:866e0246bd78706b1bfb6c07818d34662e459927e54718460f8a950f5fc33ae8
 size 1262063089

{checkpoint-400 → checkpoint-700}/rng_state.pth RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:855318e4e46176f35f66cfa7dbcef4ac9632248b73c3328855184518a3b76d7f
-size 14503

 version https://git-lfs.github.com/spec/v1
+oid sha256:21798b4aee64ae056ff3e0e6a64832942beff047fe94bbbddb9d06dcf74d9125
+size 14567

{checkpoint-400 → checkpoint-700}/scaler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:476e510c8ea7edbd2b51d1e76a4e037820a5639381c0d8b5d32dafa492795a1e
 size 559

 version https://git-lfs.github.com/spec/v1
+oid sha256:7fb213daf5cce18a5f92167ca14da9df084d907f2b9796efc4666630f312b58c
 size 559

{checkpoint-400 → checkpoint-700}/scheduler.pt RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8d06447f3e192636cdb71ae042312281cde114831b8524799c0556275e17d331
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:fcdecc30328ffcc8e9b8e7d7b6cfb5d7c85a8e3d5e777d680eff74cf60f2dc24
 size 623

{checkpoint-400 → checkpoint-700}/trainer_state.json RENAMED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 4.39344262295082,
-  "global_step": 400,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -162,11 +162,128 @@
       "eval_steps_per_second": 0.766,
       "eval_wer": 1.0,
       "step": 400
     }
   ],
   "max_steps": 4550,
   "num_train_epochs": 50,
-  "total_flos": 6.222452805866187e+18,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 7.688524590163935,
+  "global_step": 700,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_steps_per_second": 0.766,
       "eval_wer": 1.0,
       "step": 400
+    },
+    {
+      "epoch": 4.61,
+      "learning_rate": 5.25e-05,
+      "loss": 3.0309,
+      "step": 420
+    },
+    {
+      "epoch": 4.83,
+      "learning_rate": 5.5e-05,
+      "loss": 3.0259,
+      "step": 440
+    },
+    {
+      "epoch": 5.05,
+      "learning_rate": 5.75e-05,
+      "loss": 3.0998,
+      "step": 460
+    },
+    {
+      "epoch": 5.27,
+      "learning_rate": 6e-05,
+      "loss": 3.0152,
+      "step": 480
+    },
+    {
+      "epoch": 5.49,
+      "learning_rate": 6.25e-05,
+      "loss": 3.0129,
+      "step": 500
+    },
+    {
+      "epoch": 5.49,
+      "eval_loss": 3.039973497390747,
+      "eval_runtime": 190.8567,
+      "eval_samples_per_second": 25.375,
+      "eval_steps_per_second": 0.796,
+      "eval_wer": 1.0,
+      "step": 500
+    },
+    {
+      "epoch": 5.71,
+      "learning_rate": 6.500000000000001e-05,
+      "loss": 3.0088,
+      "step": 520
+    },
+    {
+      "epoch": 5.93,
+      "learning_rate": 6.75e-05,
+      "loss": 3.0051,
+      "step": 540
+    },
+    {
+      "epoch": 6.15,
+      "learning_rate": 7.000000000000001e-05,
+      "loss": 3.073,
+      "step": 560
+    },
+    {
+      "epoch": 6.37,
+      "learning_rate": 7.25e-05,
+      "loss": 3.0031,
+      "step": 580
+    },
+    {
+      "epoch": 6.59,
+      "learning_rate": 7.5e-05,
+      "loss": 2.9964,
+      "step": 600
+    },
+    {
+      "epoch": 6.59,
+      "eval_loss": 2.998962640762329,
+      "eval_runtime": 193.5213,
+      "eval_samples_per_second": 25.026,
+      "eval_steps_per_second": 0.785,
+      "eval_wer": 1.0,
+      "step": 600
+    },
+    {
+      "epoch": 6.81,
+      "learning_rate": 7.75e-05,
+      "loss": 2.9921,
+      "step": 620
+    },
+    {
+      "epoch": 7.03,
+      "learning_rate": 8e-05,
+      "loss": 3.0665,
+      "step": 640
+    },
+    {
+      "epoch": 7.25,
+      "learning_rate": 8.25e-05,
+      "loss": 2.9826,
+      "step": 660
+    },
+    {
+      "epoch": 7.47,
+      "learning_rate": 8.5e-05,
+      "loss": 2.9689,
+      "step": 680
+    },
+    {
+      "epoch": 7.69,
+      "learning_rate": 8.75e-05,
+      "loss": 2.9602,
+      "step": 700
+    },
+    {
+      "epoch": 7.69,
+      "eval_loss": 2.9620397090911865,
+      "eval_runtime": 193.5851,
+      "eval_samples_per_second": 25.017,
+      "eval_steps_per_second": 0.785,
+      "eval_wer": 1.0,
+      "step": 700
     }
   ],
   "max_steps": 4550,
   "num_train_epochs": 50,
+  "total_flos": 1.0835835827730653e+19,
   "trial_name": null,
   "trial_params": null
 }

{checkpoint-400 → checkpoint-700}/training_args.bin RENAMED Viewed

File without changes

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3baffe7a116d58666fc0726fb4fa6188834614eac15e96843270fc53529b943e
 size 1262063089

 version https://git-lfs.github.com/spec/v1
+oid sha256:866e0246bd78706b1bfb6c07818d34662e459927e54718460f8a950f5fc33ae8
 size 1262063089