Training in progress, step 800000

Browse files

Files changed (14) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +311 -3
pytorch_model.bin +1 -1
runs/Nov21_18-14-51_t1v-n-088af867-w-0/events.out.tfevents.1669054551.t1v-n-088af867-w-0.42571.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8493ce7e8128e56d5ea33b2d8b536b32a965120edc32ffe82c0e67c7c74c6f88
 size 996067161

 version https://git-lfs.github.com/spec/v1
+oid sha256:c232c3362505b09ebf2de531d028bab9e2f36f212e8090b7d19bbdab3eaa82ef
 size 996067161

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:35fe33536ac807064e6fad0cd5e9ad83ec7ecc19996d055dfe966db63a34099a
 size 498046827

 version https://git-lfs.github.com/spec/v1
+oid sha256:fec352f986ad82f2093d092c541a5c18023edc09d690d230639e4fcf0f8f68da
 size 498046827

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7f7fac779826c8fbbb92a94b7bc999d0104abce6e322c0cc06283bb7e4ff5f3c
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:bdb0b60d2639b10fa07210371a726fdae273fd173a11215ad75bd704c48168c5
 size 13611

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7f7fac779826c8fbbb92a94b7bc999d0104abce6e322c0cc06283bb7e4ff5f3c
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:bdb0b60d2639b10fa07210371a726fdae273fd173a11215ad75bd704c48168c5
 size 13611

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7f7fac779826c8fbbb92a94b7bc999d0104abce6e322c0cc06283bb7e4ff5f3c
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:bdb0b60d2639b10fa07210371a726fdae273fd173a11215ad75bd704c48168c5
 size 13611

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a9c8e535cc74c890d838da59fc834f280e4e0712e82e224b95bda2f92deaf190
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:6280f24dfdea0e39202209002958a3c2870d74b203c5b54e31e57a68e6d8e47b
 size 13611

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a9c8e535cc74c890d838da59fc834f280e4e0712e82e224b95bda2f92deaf190
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:6280f24dfdea0e39202209002958a3c2870d74b203c5b54e31e57a68e6d8e47b
 size 13611

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a9c8e535cc74c890d838da59fc834f280e4e0712e82e224b95bda2f92deaf190
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:6280f24dfdea0e39202209002958a3c2870d74b203c5b54e31e57a68e6d8e47b
 size 13611

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:a9c8e535cc74c890d838da59fc834f280e4e0712e82e224b95bda2f92deaf190
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:6280f24dfdea0e39202209002958a3c2870d74b203c5b54e31e57a68e6d8e47b
 size 13611

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:7f7fac779826c8fbbb92a94b7bc999d0104abce6e322c0cc06283bb7e4ff5f3c
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:bdb0b60d2639b10fa07210371a726fdae273fd173a11215ad75bd704c48168c5
 size 13611

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:411052d7656a2fbf4baa154bd61bcb86c1d4e17113e6919b82f37e9aff99019f
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:50e51b9224ded3ddffee57f26ec45414409de0232579ddafb7f3e083076fa4c5
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 2.215921,
-  "global_step": 750000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -4626,11 +4626,319 @@
       "eval_samples_per_second": 541.609,
       "eval_steps_per_second": 2.166,
       "step": 750000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
-  "total_flos": 1.2636703162368e+19,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 2.265921,
+  "global_step": 800000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 541.609,
       "eval_steps_per_second": 2.166,
       "step": 750000
+    },
+    {
+      "epoch": 2.22,
+      "learning_rate": 1.6014457078461353e-05,
+      "loss": 0.8177,
+      "step": 751000
+    },
+    {
+      "epoch": 2.22,
+      "learning_rate": 1.5893364398662176e-05,
+      "loss": 0.8223,
+      "step": 752000
+    },
+    {
+      "epoch": 2.22,
+      "learning_rate": 1.5772644703565565e-05,
+      "loss": 0.8236,
+      "step": 753000
+    },
+    {
+      "epoch": 2.22,
+      "learning_rate": 1.5652299313342773e-05,
+      "loss": 0.8056,
+      "step": 754000
+    },
+    {
+      "epoch": 2.22,
+      "learning_rate": 1.553232954407171e-05,
+      "loss": 0.802,
+      "step": 755000
+    },
+    {
+      "epoch": 2.22,
+      "learning_rate": 1.5412736707722537e-05,
+      "loss": 0.806,
+      "step": 756000
+    },
+    {
+      "epoch": 2.22,
+      "learning_rate": 1.5293522112143373e-05,
+      "loss": 0.8013,
+      "step": 757000
+    },
+    {
+      "epoch": 2.22,
+      "learning_rate": 1.517468706104589e-05,
+      "loss": 0.8098,
+      "step": 758000
+    },
+    {
+      "epoch": 2.22,
+      "learning_rate": 1.5056232853991209e-05,
+      "loss": 0.8062,
+      "step": 759000
+    },
+    {
+      "epoch": 2.23,
+      "learning_rate": 1.4938160786375572e-05,
+      "loss": 0.8078,
+      "step": 760000
+    },
+    {
+      "epoch": 2.23,
+      "learning_rate": 1.4820472149416154e-05,
+      "loss": 0.7976,
+      "step": 761000
+    },
+    {
+      "epoch": 2.23,
+      "learning_rate": 1.470316823013707e-05,
+      "loss": 0.8175,
+      "step": 762000
+    },
+    {
+      "epoch": 2.23,
+      "learning_rate": 1.4586250311355132e-05,
+      "loss": 0.8095,
+      "step": 763000
+    },
+    {
+      "epoch": 2.23,
+      "learning_rate": 1.4469719671666043e-05,
+      "loss": 0.8105,
+      "step": 764000
+    },
+    {
+      "epoch": 2.23,
+      "learning_rate": 1.435357758543015e-05,
+      "loss": 0.8103,
+      "step": 765000
+    },
+    {
+      "epoch": 2.23,
+      "learning_rate": 1.4237825322758736e-05,
+      "loss": 0.8153,
+      "step": 766000
+    },
+    {
+      "epoch": 2.23,
+      "learning_rate": 1.412246414949997e-05,
+      "loss": 0.8184,
+      "step": 767000
+    },
+    {
+      "epoch": 2.23,
+      "learning_rate": 1.4007495327225162e-05,
+      "loss": 0.8083,
+      "step": 768000
+    },
+    {
+      "epoch": 2.23,
+      "learning_rate": 1.389292011321498e-05,
+      "loss": 0.7992,
+      "step": 769000
+    },
+    {
+      "epoch": 2.24,
+      "learning_rate": 1.3778739760445552e-05,
+      "loss": 0.8087,
+      "step": 770000
+    },
+    {
+      "epoch": 2.24,
+      "learning_rate": 1.3664955517574968e-05,
+      "loss": 0.8118,
+      "step": 771000
+    },
+    {
+      "epoch": 2.24,
+      "learning_rate": 1.3551568628929434e-05,
+      "loss": 0.8096,
+      "step": 772000
+    },
+    {
+      "epoch": 2.24,
+      "learning_rate": 1.343858033448982e-05,
+      "loss": 0.7987,
+      "step": 773000
+    },
+    {
+      "epoch": 2.24,
+      "learning_rate": 1.3325991869878013e-05,
+      "loss": 0.8141,
+      "step": 774000
+    },
+    {
+      "epoch": 2.24,
+      "learning_rate": 1.3213804466343421e-05,
+      "loss": 0.819,
+      "step": 775000
+    },
+    {
+      "epoch": 2.24,
+      "learning_rate": 1.3102019350749528e-05,
+      "loss": 0.8183,
+      "step": 776000
+    },
+    {
+      "epoch": 2.24,
+      "learning_rate": 1.299063774556042e-05,
+      "loss": 0.8153,
+      "step": 777000
+    },
+    {
+      "epoch": 2.24,
+      "learning_rate": 1.2879660868827508e-05,
+      "loss": 0.8135,
+      "step": 778000
+    },
+    {
+      "epoch": 2.24,
+      "learning_rate": 1.2769089934176126e-05,
+      "loss": 0.835,
+      "step": 779000
+    },
+    {
+      "epoch": 2.25,
+      "learning_rate": 1.2658926150792322e-05,
+      "loss": 0.8122,
+      "step": 780000
+    },
+    {
+      "epoch": 2.25,
+      "learning_rate": 1.2549170723409549e-05,
+      "loss": 0.8031,
+      "step": 781000
+    },
+    {
+      "epoch": 2.25,
+      "learning_rate": 1.243982485229559e-05,
+      "loss": 0.8134,
+      "step": 782000
+    },
+    {
+      "epoch": 2.25,
+      "learning_rate": 1.233088973323937e-05,
+      "loss": 0.8082,
+      "step": 783000
+    },
+    {
+      "epoch": 2.25,
+      "learning_rate": 1.2222366557537911e-05,
+      "loss": 0.8139,
+      "step": 784000
+    },
+    {
+      "epoch": 2.25,
+      "learning_rate": 1.2114256511983274e-05,
+      "loss": 0.8216,
+      "step": 785000
+    },
+    {
+      "epoch": 2.25,
+      "learning_rate": 1.2006560778849578e-05,
+      "loss": 0.8128,
+      "step": 786000
+    },
+    {
+      "epoch": 2.25,
+      "learning_rate": 1.1899280535880119e-05,
+      "loss": 0.8055,
+      "step": 787000
+    },
+    {
+      "epoch": 2.25,
+      "learning_rate": 1.1792416956274444e-05,
+      "loss": 0.8176,
+      "step": 788000
+    },
+    {
+      "epoch": 2.25,
+      "learning_rate": 1.1685971208675539e-05,
+      "loss": 0.8019,
+      "step": 789000
+    },
+    {
+      "epoch": 2.26,
+      "learning_rate": 1.157994445715706e-05,
+      "loss": 0.8173,
+      "step": 790000
+    },
+    {
+      "epoch": 2.26,
+      "learning_rate": 1.1474337861210543e-05,
+      "loss": 0.815,
+      "step": 791000
+    },
+    {
+      "epoch": 2.26,
+      "learning_rate": 1.1369152575732822e-05,
+      "loss": 0.8212,
+      "step": 792000
+    },
+    {
+      "epoch": 2.26,
+      "learning_rate": 1.1264389751013326e-05,
+      "loss": 0.8235,
+      "step": 793000
+    },
+    {
+      "epoch": 2.26,
+      "learning_rate": 1.1160050532721528e-05,
+      "loss": 0.8061,
+      "step": 794000
+    },
+    {
+      "epoch": 2.26,
+      "learning_rate": 1.1056136061894384e-05,
+      "loss": 0.8078,
+      "step": 795000
+    },
+    {
+      "epoch": 2.26,
+      "learning_rate": 1.095264747492391e-05,
+      "loss": 0.8045,
+      "step": 796000
+    },
+    {
+      "epoch": 2.26,
+      "learning_rate": 1.0849585903544706e-05,
+      "loss": 0.809,
+      "step": 797000
+    },
+    {
+      "epoch": 2.26,
+      "learning_rate": 1.0746952474821614e-05,
+      "loss": 0.808,
+      "step": 798000
+    },
+    {
+      "epoch": 2.26,
+      "learning_rate": 1.0644748311137376e-05,
+      "loss": 0.7971,
+      "step": 799000
+    },
+    {
+      "epoch": 2.27,
+      "learning_rate": 1.0542974530180327e-05,
+      "loss": 0.8046,
+      "step": 800000
+    },
+    {
+      "epoch": 2.27,
+      "eval_loss": 0.7692430019378662,
+      "eval_runtime": 22.2242,
+      "eval_samples_per_second": 449.959,
+      "eval_steps_per_second": 1.8,
+      "step": 800000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
+  "total_flos": 1.34791500398592e+19,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:35fe33536ac807064e6fad0cd5e9ad83ec7ecc19996d055dfe966db63a34099a
 size 498046827

 version https://git-lfs.github.com/spec/v1
+oid sha256:fec352f986ad82f2093d092c541a5c18023edc09d690d230639e4fcf0f8f68da
 size 498046827

runs/Nov21_18-14-51_t1v-n-088af867-w-0/events.out.tfevents.1669054551.t1v-n-088af867-w-0.42571.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c7a6f26498ae9b62958540d2c4c973cc644673f207f87ccd6a7cceb887653518
-size 78232

 version https://git-lfs.github.com/spec/v1
+oid sha256:a3ca84624459fb9b93a84187779a2e24244f414f34a0b93883906e7b5e7e187a
+size 86508