joelniklaus committed
Commit b10cefd
1 Parent(s): 8920bb8

Training in progress, step 900000

last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4ea2739e65bf2d4e444e37d59f4590e76d7131d84f66a9eaaf6582afb2682f19
+oid sha256:345bb733106532a0f4478559f3788cc16626f2b03843c21bbf46700517f092e5
 size 885325017
last-checkpoint/pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:38129657bd5caa37f8267c1c70da5cff672239b99e39e17a769a78f1a0a75f82
+oid sha256:8c1921a1c1cbf8718fc703fed5923d8983ae5a3c94f3fb08cc5b295115ded811
 size 442675755
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ee72837e55312c5db90b9236e78275a0fb41dcf5b5d42ac01111f1bc9828197
+oid sha256:78b6318c1c37a88a7a88d1bea333e6b55fd0f1d3338fd7f99e67179de2e57d78
 size 13611
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ee72837e55312c5db90b9236e78275a0fb41dcf5b5d42ac01111f1bc9828197
+oid sha256:78b6318c1c37a88a7a88d1bea333e6b55fd0f1d3338fd7f99e67179de2e57d78
 size 13611
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ee72837e55312c5db90b9236e78275a0fb41dcf5b5d42ac01111f1bc9828197
+oid sha256:78b6318c1c37a88a7a88d1bea333e6b55fd0f1d3338fd7f99e67179de2e57d78
 size 13611
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ee72837e55312c5db90b9236e78275a0fb41dcf5b5d42ac01111f1bc9828197
+oid sha256:78b6318c1c37a88a7a88d1bea333e6b55fd0f1d3338fd7f99e67179de2e57d78
 size 13611
last-checkpoint/rng_state_4.pth CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ee72837e55312c5db90b9236e78275a0fb41dcf5b5d42ac01111f1bc9828197
+oid sha256:78b6318c1c37a88a7a88d1bea333e6b55fd0f1d3338fd7f99e67179de2e57d78
 size 13611
last-checkpoint/rng_state_5.pth CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ee72837e55312c5db90b9236e78275a0fb41dcf5b5d42ac01111f1bc9828197
+oid sha256:78b6318c1c37a88a7a88d1bea333e6b55fd0f1d3338fd7f99e67179de2e57d78
 size 13611
last-checkpoint/rng_state_6.pth CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ee72837e55312c5db90b9236e78275a0fb41dcf5b5d42ac01111f1bc9828197
+oid sha256:78b6318c1c37a88a7a88d1bea333e6b55fd0f1d3338fd7f99e67179de2e57d78
 size 13611
last-checkpoint/rng_state_7.pth CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:6ee72837e55312c5db90b9236e78275a0fb41dcf5b5d42ac01111f1bc9828197
+oid sha256:78b6318c1c37a88a7a88d1bea333e6b55fd0f1d3338fd7f99e67179de2e57d78
 size 13611
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:adedebe0cc7e07de957a9e2967d6e9c3934a9fdca3245f46a29d125e5e36192e
+oid sha256:98fbf159ce1bb90afdab5d6ac994b4ab633fc21d8eb6c04c41c7f3a26253e5b5
 size 623
last-checkpoint/trainer_state.json CHANGED
@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 6.045208,
-  "global_step": 850000,
+  "epoch": 6.095208,
+  "global_step": 900000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -5242,11 +5242,319 @@
       "eval_samples_per_second": 470.799,
       "eval_steps_per_second": 3.766,
       "step": 850000
+    },
+    {
+      "epoch": 6.05,
+      "learning_rate": 5.947856562792925e-06,
+      "loss": 0.6625,
+      "step": 851000
+    },
+    {
+      "epoch": 6.05,
+      "learning_rate": 5.869882433093155e-06,
+      "loss": 0.5409,
+      "step": 852000
+    },
+    {
+      "epoch": 6.05,
+      "learning_rate": 5.79239090328883e-06,
+      "loss": 0.4859,
+      "step": 853000
+    },
+    {
+      "epoch": 6.05,
+      "learning_rate": 5.715382820814885e-06,
+      "loss": 0.5004,
+      "step": 854000
+    },
+    {
+      "epoch": 6.05,
+      "learning_rate": 5.6388590278194096e-06,
+      "loss": 0.5857,
+      "step": 855000
+    },
+    {
+      "epoch": 6.05,
+      "learning_rate": 5.562820361154314e-06,
+      "loss": 0.6262,
+      "step": 856000
+    },
+    {
+      "epoch": 6.05,
+      "learning_rate": 5.48726765236629e-06,
+      "loss": 0.6233,
+      "step": 857000
+    },
+    {
+      "epoch": 6.05,
+      "learning_rate": 5.412201727687644e-06,
+      "loss": 0.5173,
+      "step": 858000
+    },
+    {
+      "epoch": 6.05,
+      "learning_rate": 5.337623408027293e-06,
+      "loss": 0.5189,
+      "step": 859000
+    },
+    {
+      "epoch": 6.06,
+      "learning_rate": 5.263533508961827e-06,
+      "loss": 0.5411,
+      "step": 860000
+    },
+    {
+      "epoch": 6.06,
+      "learning_rate": 5.1899328407264855e-06,
+      "loss": 0.607,
+      "step": 861000
+    },
+    {
+      "epoch": 6.06,
+      "learning_rate": 5.116822208206396e-06,
+      "loss": 0.6584,
+      "step": 862000
+    },
+    {
+      "epoch": 6.06,
+      "learning_rate": 5.044202410927706e-06,
+      "loss": 0.5419,
+      "step": 863000
+    },
+    {
+      "epoch": 6.06,
+      "learning_rate": 4.972074243048897e-06,
+      "loss": 0.4949,
+      "step": 864000
+    },
+    {
+      "epoch": 6.06,
+      "learning_rate": 4.900438493352055e-06,
+      "loss": 0.4951,
+      "step": 865000
+    },
+    {
+      "epoch": 6.06,
+      "learning_rate": 4.829295945234258e-06,
+      "loss": 0.5807,
+      "step": 866000
+    },
+    {
+      "epoch": 6.06,
+      "learning_rate": 4.758647376699032e-06,
+      "loss": 0.6251,
+      "step": 867000
+    },
+    {
+      "epoch": 6.06,
+      "learning_rate": 4.688493560347773e-06,
+      "loss": 0.6232,
+      "step": 868000
+    },
+    {
+      "epoch": 6.06,
+      "learning_rate": 4.618835263371396e-06,
+      "loss": 0.5241,
+      "step": 869000
+    },
+    {
+      "epoch": 6.07,
+      "learning_rate": 4.549673247541875e-06,
+      "loss": 0.523,
+      "step": 870000
+    },
+    {
+      "epoch": 6.07,
+      "learning_rate": 4.48100826920394e-06,
+      "loss": 0.531,
+      "step": 871000
+    },
+    {
+      "epoch": 6.07,
+      "learning_rate": 4.412841079266777e-06,
+      "loss": 0.6089,
+      "step": 872000
+    },
+    {
+      "epoch": 6.07,
+      "learning_rate": 4.3451724231958644e-06,
+      "loss": 0.6519,
+      "step": 873000
+    },
+    {
+      "epoch": 6.07,
+      "learning_rate": 4.27800304100478e-06,
+      "loss": 0.5453,
+      "step": 874000
+    },
+    {
+      "epoch": 6.07,
+      "learning_rate": 4.2113336672471245e-06,
+      "loss": 0.4981,
+      "step": 875000
+    },
+    {
+      "epoch": 6.07,
+      "learning_rate": 4.145165031008508e-06,
+      "loss": 0.4949,
+      "step": 876000
+    },
+    {
+      "epoch": 6.07,
+      "learning_rate": 4.079497855898501e-06,
+      "loss": 0.5795,
+      "step": 877000
+    },
+    {
+      "epoch": 6.07,
+      "learning_rate": 4.01433286004283e-06,
+      "loss": 0.6226,
+      "step": 878000
+    },
+    {
+      "epoch": 6.07,
+      "learning_rate": 3.949670756075447e-06,
+      "loss": 0.6258,
+      "step": 879000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 3.885512251130763e-06,
+      "loss": 0.531,
+      "step": 880000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 3.821858046835913e-06,
+      "loss": 0.5183,
+      "step": 881000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 3.75870883930306e-06,
+      "loss": 0.5233,
+      "step": 882000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 3.696065319121833e-06,
+      "loss": 0.6147,
+      "step": 883000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 3.6339281713517303e-06,
+      "loss": 0.642,
+      "step": 884000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 3.5722980755146517e-06,
+      "loss": 0.5468,
+      "step": 885000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 3.511175705587433e-06,
+      "loss": 0.5043,
+      "step": 886000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 3.4505617299945336e-06,
+      "loss": 0.4901,
+      "step": 887000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 3.390456811600673e-06,
+      "loss": 0.5791,
+      "step": 888000
+    },
+    {
+      "epoch": 6.08,
+      "learning_rate": 3.3308616077036115e-06,
+      "loss": 0.6167,
+      "step": 889000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 3.271776770026963e-06,
+      "loss": 0.6202,
+      "step": 890000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 3.213202944713023e-06,
+      "loss": 0.54,
+      "step": 891000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 3.155140772315773e-06,
+      "loss": 0.5187,
+      "step": 892000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 3.0975908877938277e-06,
+      "loss": 0.5206,
+      "step": 893000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 3.040553920503503e-06,
+      "loss": 0.6147,
+      "step": 894000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 2.9840304941919415e-06,
+      "loss": 0.628,
+      "step": 895000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 2.928021226990263e-06,
+      "loss": 0.5573,
+      "step": 896000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 2.8725267314068495e-06,
+      "loss": 0.5079,
+      "step": 897000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 2.817547614320615e-06,
+      "loss": 0.4863,
+      "step": 898000
+    },
+    {
+      "epoch": 6.09,
+      "learning_rate": 2.7630844769743757e-06,
+      "loss": 0.5821,
+      "step": 899000
+    },
+    {
+      "epoch": 6.1,
+      "learning_rate": 2.7091379149682685e-06,
+      "loss": 0.607,
+      "step": 900000
+    },
+    {
+      "epoch": 6.1,
+      "eval_loss": 0.43322694301605225,
+      "eval_runtime": 11.9376,
+      "eval_samples_per_second": 418.845,
+      "eval_steps_per_second": 3.351,
+      "step": 900000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
-  "total_flos": 1.4318614083048309e+19,
+  "total_flos": 1.5160884013339509e+19,
   "trial_name": null,
   "trial_params": null
 }
pytorch_model.bin CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:38129657bd5caa37f8267c1c70da5cff672239b99e39e17a769a78f1a0a75f82
+oid sha256:8c1921a1c1cbf8718fc703fed5923d8983ae5a3c94f3fb08cc5b295115ded811
 size 442675755
runs/Dec27_23-32-38_t1v-n-2d317d8b-w-0/events.out.tfevents.1672183981.t1v-n-2d317d8b-w-0.162730.0 CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:f2f6129b057980f56380eb832e0c6a7bf337ab3b51742afdf922d2c093de7eee
-size 144420
+oid sha256:416c48e28ac8dda4b04a334dfbc00e4af731cc753ac2fe39df5f5ca94fbc8a9d
+size 152696