Training in progress, step 750000

Browse files

Files changed (14) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +311 -3
pytorch_model.bin +1 -1
runs/Nov21_18-14-51_t1v-n-088af867-w-0/events.out.tfevents.1669054551.t1v-n-088af867-w-0.42571.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ae43a48589175aaf9939e78cb22924c6e7b9714449e1a77b6aea2674d6f0f535
 size 996067161

 version https://git-lfs.github.com/spec/v1
+oid sha256:8493ce7e8128e56d5ea33b2d8b536b32a965120edc32ffe82c0e67c7c74c6f88
 size 996067161

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b889229f6c63b75785b3963b98f50b36fa64eab02160a85abd3d76c7eca1972b
 size 498046827

 version https://git-lfs.github.com/spec/v1
+oid sha256:35fe33536ac807064e6fad0cd5e9ad83ec7ecc19996d055dfe966db63a34099a
 size 498046827

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4e8d8fd096b22974f0a808c190b1c67b3a173ac6818b5723a1c553da12bd61ad
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:7f7fac779826c8fbbb92a94b7bc999d0104abce6e322c0cc06283bb7e4ff5f3c
 size 13611

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4e8d8fd096b22974f0a808c190b1c67b3a173ac6818b5723a1c553da12bd61ad
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:7f7fac779826c8fbbb92a94b7bc999d0104abce6e322c0cc06283bb7e4ff5f3c
 size 13611

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4e8d8fd096b22974f0a808c190b1c67b3a173ac6818b5723a1c553da12bd61ad
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:7f7fac779826c8fbbb92a94b7bc999d0104abce6e322c0cc06283bb7e4ff5f3c
 size 13611

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:237857aa9cd57869e02f5c3fbb02afb8a7fe52dc11b11ceb54d6be8920f4af97
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:a9c8e535cc74c890d838da59fc834f280e4e0712e82e224b95bda2f92deaf190
 size 13611

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:237857aa9cd57869e02f5c3fbb02afb8a7fe52dc11b11ceb54d6be8920f4af97
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:a9c8e535cc74c890d838da59fc834f280e4e0712e82e224b95bda2f92deaf190
 size 13611

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:237857aa9cd57869e02f5c3fbb02afb8a7fe52dc11b11ceb54d6be8920f4af97
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:a9c8e535cc74c890d838da59fc834f280e4e0712e82e224b95bda2f92deaf190
 size 13611

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:237857aa9cd57869e02f5c3fbb02afb8a7fe52dc11b11ceb54d6be8920f4af97
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:a9c8e535cc74c890d838da59fc834f280e4e0712e82e224b95bda2f92deaf190
 size 13611

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4e8d8fd096b22974f0a808c190b1c67b3a173ac6818b5723a1c553da12bd61ad
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:7f7fac779826c8fbbb92a94b7bc999d0104abce6e322c0cc06283bb7e4ff5f3c
 size 13611

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d2d6ab5c2c0046e2c66cf435ff00463ff3da7208ddb35b5b6f19c87d94f3623b
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:411052d7656a2fbf4baa154bd61bcb86c1d4e17113e6919b82f37e9aff99019f
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.165921,
-  "global_step": 700000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -4318,11 +4318,319 @@
       "eval_samples_per_second": 559.497,
       "eval_steps_per_second": 2.238,
       "step": 700000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
-  "total_flos": 1.17942562848768e+19,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.215921,
+  "global_step": 750000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 559.497,
       "eval_steps_per_second": 2.238,
       "step": 700000
+    },
+    {
+      "epoch": 2.17,
+      "learning_rate": 2.251431892919171e-05,
+      "loss": 0.8155,
+      "step": 701000
+    },
+    {
+      "epoch": 2.17,
+      "learning_rate": 2.237634634350934e-05,
+      "loss": 0.8093,
+      "step": 702000
+    },
+    {
+      "epoch": 2.17,
+      "learning_rate": 2.2238675845677663e-05,
+      "loss": 0.8162,
+      "step": 703000
+    },
+    {
+      "epoch": 2.17,
+      "learning_rate": 2.2101308941239203e-05,
+      "loss": 0.8201,
+      "step": 704000
+    },
+    {
+      "epoch": 2.17,
+      "learning_rate": 2.196424713241637e-05,
+      "loss": 0.8262,
+      "step": 705000
+    },
+    {
+      "epoch": 2.17,
+      "learning_rate": 2.182749191809518e-05,
+      "loss": 0.8267,
+      "step": 706000
+    },
+    {
+      "epoch": 2.17,
+      "learning_rate": 2.1691044793808734e-05,
+      "loss": 0.8208,
+      "step": 707000
+    },
+    {
+      "epoch": 2.17,
+      "learning_rate": 2.1554907251720945e-05,
+      "loss": 0.8085,
+      "step": 708000
+    },
+    {
+      "epoch": 2.17,
+      "learning_rate": 2.1419080780610123e-05,
+      "loss": 0.8328,
+      "step": 709000
+    },
+    {
+      "epoch": 2.18,
+      "learning_rate": 2.128356686585282e-05,
+      "loss": 0.8145,
+      "step": 710000
+    },
+    {
+      "epoch": 2.18,
+      "learning_rate": 2.1148366989407496e-05,
+      "loss": 0.8211,
+      "step": 711000
+    },
+    {
+      "epoch": 2.18,
+      "learning_rate": 2.1013482629798333e-05,
+      "loss": 0.8198,
+      "step": 712000
+    },
+    {
+      "epoch": 2.18,
+      "learning_rate": 2.0878915262099098e-05,
+      "loss": 0.8227,
+      "step": 713000
+    },
+    {
+      "epoch": 2.18,
+      "learning_rate": 2.0744666357916925e-05,
+      "loss": 0.827,
+      "step": 714000
+    },
+    {
+      "epoch": 2.18,
+      "learning_rate": 2.061073738537635e-05,
+      "loss": 0.8217,
+      "step": 715000
+    },
+    {
+      "epoch": 2.18,
+      "learning_rate": 2.0477129809103147e-05,
+      "loss": 0.8122,
+      "step": 716000
+    },
+    {
+      "epoch": 2.18,
+      "learning_rate": 2.0343845090208368e-05,
+      "loss": 0.8172,
+      "step": 717000
+    },
+    {
+      "epoch": 2.18,
+      "learning_rate": 2.0210884686272368e-05,
+      "loss": 0.8255,
+      "step": 718000
+    },
+    {
+      "epoch": 2.18,
+      "learning_rate": 2.0078250051328784e-05,
+      "loss": 0.8193,
+      "step": 719000
+    },
+    {
+      "epoch": 2.19,
+      "learning_rate": 1.9945942635848748e-05,
+      "loss": 0.8105,
+      "step": 720000
+    },
+    {
+      "epoch": 2.19,
+      "learning_rate": 1.981396388672496e-05,
+      "loss": 0.8216,
+      "step": 721000
+    },
+    {
+      "epoch": 2.19,
+      "learning_rate": 1.9682315247255894e-05,
+      "loss": 0.8232,
+      "step": 722000
+    },
+    {
+      "epoch": 2.19,
+      "learning_rate": 1.9550998157129946e-05,
+      "loss": 0.8302,
+      "step": 723000
+    },
+    {
+      "epoch": 2.19,
+      "learning_rate": 1.942001405240979e-05,
+      "loss": 0.82,
+      "step": 724000
+    },
+    {
+      "epoch": 2.19,
+      "learning_rate": 1.928936436551661e-05,
+      "loss": 0.8264,
+      "step": 725000
+    },
+    {
+      "epoch": 2.19,
+      "learning_rate": 1.9159050525214452e-05,
+      "loss": 0.8356,
+      "step": 726000
+    },
+    {
+      "epoch": 2.19,
+      "learning_rate": 1.9029073956594606e-05,
+      "loss": 0.8271,
+      "step": 727000
+    },
+    {
+      "epoch": 2.19,
+      "learning_rate": 1.8899436081059975e-05,
+      "loss": 0.8051,
+      "step": 728000
+    },
+    {
+      "epoch": 2.19,
+      "learning_rate": 1.877013831630961e-05,
+      "loss": 0.8247,
+      "step": 729000
+    },
+    {
+      "epoch": 2.2,
+      "learning_rate": 1.8641182076323148e-05,
+      "loss": 0.8198,
+      "step": 730000
+    },
+    {
+      "epoch": 2.2,
+      "learning_rate": 1.851256877134538e-05,
+      "loss": 0.8189,
+      "step": 731000
+    },
+    {
+      "epoch": 2.2,
+      "learning_rate": 1.838429980787081e-05,
+      "loss": 0.8316,
+      "step": 732000
+    },
+    {
+      "epoch": 2.2,
+      "learning_rate": 1.8256376588628238e-05,
+      "loss": 0.817,
+      "step": 733000
+    },
+    {
+      "epoch": 2.2,
+      "learning_rate": 1.8128800512565513e-05,
+      "loss": 0.8169,
+      "step": 734000
+    },
+    {
+      "epoch": 2.2,
+      "learning_rate": 1.800157297483417e-05,
+      "loss": 0.821,
+      "step": 735000
+    },
+    {
+      "epoch": 2.2,
+      "learning_rate": 1.787469536677419e-05,
+      "loss": 0.8132,
+      "step": 736000
+    },
+    {
+      "epoch": 2.2,
+      "learning_rate": 1.774816907589873e-05,
+      "loss": 0.8282,
+      "step": 737000
+    },
+    {
+      "epoch": 2.2,
+      "learning_rate": 1.7621995485879062e-05,
+      "loss": 0.8211,
+      "step": 738000
+    },
+    {
+      "epoch": 2.2,
+      "learning_rate": 1.749617597652934e-05,
+      "loss": 0.8182,
+      "step": 739000
+    },
+    {
+      "epoch": 2.21,
+      "learning_rate": 1.7370711923791567e-05,
+      "loss": 0.8241,
+      "step": 740000
+    },
+    {
+      "epoch": 2.21,
+      "learning_rate": 1.7245604699720535e-05,
+      "loss": 0.8184,
+      "step": 741000
+    },
+    {
+      "epoch": 2.21,
+      "learning_rate": 1.712085567246878e-05,
+      "loss": 0.813,
+      "step": 742000
+    },
+    {
+      "epoch": 2.21,
+      "learning_rate": 1.699646620627168e-05,
+      "loss": 0.8109,
+      "step": 743000
+    },
+    {
+      "epoch": 2.21,
+      "learning_rate": 1.6872437661432517e-05,
+      "loss": 0.8137,
+      "step": 744000
+    },
+    {
+      "epoch": 2.21,
+      "learning_rate": 1.6748771394307585e-05,
+      "loss": 0.8216,
+      "step": 745000
+    },
+    {
+      "epoch": 2.21,
+      "learning_rate": 1.662546875729138e-05,
+      "loss": 0.81,
+      "step": 746000
+    },
+    {
+      "epoch": 2.21,
+      "learning_rate": 1.6502531098801753e-05,
+      "loss": 0.8109,
+      "step": 747000
+    },
+    {
+      "epoch": 2.21,
+      "learning_rate": 1.637995976326527e-05,
+      "loss": 0.8173,
+      "step": 748000
+    },
+    {
+      "epoch": 2.21,
+      "learning_rate": 1.62577560911024e-05,
+      "loss": 0.8197,
+      "step": 749000
+    },
+    {
+      "epoch": 2.22,
+      "learning_rate": 1.6135921418712956e-05,
+      "loss": 0.814,
+      "step": 750000
+    },
+    {
+      "epoch": 2.22,
+      "eval_loss": 0.773684024810791,
+      "eval_runtime": 18.4635,
+      "eval_samples_per_second": 541.609,
+      "eval_steps_per_second": 2.166,
+      "step": 750000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
+  "total_flos": 1.2636703162368e+19,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b889229f6c63b75785b3963b98f50b36fa64eab02160a85abd3d76c7eca1972b
 size 498046827

 version https://git-lfs.github.com/spec/v1
+oid sha256:35fe33536ac807064e6fad0cd5e9ad83ec7ecc19996d055dfe966db63a34099a
 size 498046827

runs/Nov21_18-14-51_t1v-n-088af867-w-0/events.out.tfevents.1669054551.t1v-n-088af867-w-0.42571.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:760955c77a228959512a67fa9be4a80f48c8f4c3b85cf9260455f57c08dc70ae
-size 69956

 version https://git-lfs.github.com/spec/v1
+oid sha256:c7a6f26498ae9b62958540d2c4c973cc644673f207f87ccd6a7cceb887653518
+size 78232