Training in progress, step 1000000

Browse files

Files changed (14) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +311 -3
pytorch_model.bin +1 -1
runs/Dec27_23-32-38_t1v-n-2d317d8b-w-0/events.out.tfevents.1672183981.t1v-n-2d317d8b-w-0.162730.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:70e1cdb73c33912fdfbd44c7802198f3da92e5f2948f144c655672394f3783bb
 size 885325017

 version https://git-lfs.github.com/spec/v1
+oid sha256:ddc82d7aa4bac59a6141424c2938c722521bd1a76f953b65be1cfffa8c73c5a5
 size 885325017

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ba23237eabaae268f92a0c5e73a78704a91d8fb58eebea9dce3e91dd8ad4e295
 size 442675755

 version https://git-lfs.github.com/spec/v1
+oid sha256:2f569a8a9d5e623df505612fbda18046bdf5b16ae49848842e493e6b370840ab
 size 442675755

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:94fe5ae4f0bd12aa4a80be8d9d76c7c97add23774d07fd0efb2832b983be474d
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:14e31008b512fdc798b67d85642d5829e5b1af89e3f396e398700d62f537b970
 size 13611

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:94fe5ae4f0bd12aa4a80be8d9d76c7c97add23774d07fd0efb2832b983be474d
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:14e31008b512fdc798b67d85642d5829e5b1af89e3f396e398700d62f537b970
 size 13611

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:94fe5ae4f0bd12aa4a80be8d9d76c7c97add23774d07fd0efb2832b983be474d
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:14e31008b512fdc798b67d85642d5829e5b1af89e3f396e398700d62f537b970
 size 13611

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:94fe5ae4f0bd12aa4a80be8d9d76c7c97add23774d07fd0efb2832b983be474d
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:14e31008b512fdc798b67d85642d5829e5b1af89e3f396e398700d62f537b970
 size 13611

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:94fe5ae4f0bd12aa4a80be8d9d76c7c97add23774d07fd0efb2832b983be474d
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:14e31008b512fdc798b67d85642d5829e5b1af89e3f396e398700d62f537b970
 size 13611

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:94fe5ae4f0bd12aa4a80be8d9d76c7c97add23774d07fd0efb2832b983be474d
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:14e31008b512fdc798b67d85642d5829e5b1af89e3f396e398700d62f537b970
 size 13611

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:94fe5ae4f0bd12aa4a80be8d9d76c7c97add23774d07fd0efb2832b983be474d
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:14e31008b512fdc798b67d85642d5829e5b1af89e3f396e398700d62f537b970
 size 13611

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:94fe5ae4f0bd12aa4a80be8d9d76c7c97add23774d07fd0efb2832b983be474d
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:14e31008b512fdc798b67d85642d5829e5b1af89e3f396e398700d62f537b970
 size 13611

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:bc2c2c8416f63b11e9c82d6dac05baa6ad73177ac658621e099b23ff71f2f801
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:906bc3ed48818cc1785b6a98c1e064532a322520b99cdf458cfd827674d9b7ec
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 7.011076,
-  "global_step": 950000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -5858,11 +5858,319 @@
       "eval_samples_per_second": 459.272,
       "eval_steps_per_second": 3.674,
       "step": 950000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
-  "total_flos": 1.600315815498036e+19,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 7.061076,
+  "global_step": 1000000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 459.272,
       "eval_steps_per_second": 3.674,
       "step": 950000
+    },
+    {
+      "epoch": 7.01,
+      "learning_rate": 6.549893279788277e-07,
+      "loss": 0.5844,
+      "step": 951000
+    },
+    {
+      "epoch": 7.01,
+      "learning_rate": 6.285834552247128e-07,
+      "loss": 0.6514,
+      "step": 952000
+    },
+    {
+      "epoch": 7.01,
+      "learning_rate": 6.027175003719354e-07,
+      "loss": 0.5718,
+      "step": 953000
+    },
+    {
+      "epoch": 7.02,
+      "learning_rate": 5.773917462864264e-07,
+      "loss": 0.48,
+      "step": 954000
+    },
+    {
+      "epoch": 7.02,
+      "learning_rate": 5.526064699265753e-07,
+      "loss": 0.4916,
+      "step": 955000
+    },
+    {
+      "epoch": 7.02,
+      "learning_rate": 5.283619423401998e-07,
+      "loss": 0.5807,
+      "step": 956000
+    },
+    {
+      "epoch": 7.02,
+      "learning_rate": 5.046584286615697e-07,
+      "loss": 0.6197,
+      "step": 957000
+    },
+    {
+      "epoch": 7.02,
+      "learning_rate": 4.814961881085045e-07,
+      "loss": 0.6185,
+      "step": 958000
+    },
+    {
+      "epoch": 7.02,
+      "learning_rate": 4.5887547397955864e-07,
+      "loss": 0.518,
+      "step": 959000
+    },
+    {
+      "epoch": 7.02,
+      "learning_rate": 4.367965336512403e-07,
+      "loss": 0.4971,
+      "step": 960000
+    },
+    {
+      "epoch": 7.02,
+      "learning_rate": 4.1525960857530243e-07,
+      "loss": 0.5754,
+      "step": 961000
+    },
+    {
+      "epoch": 7.02,
+      "learning_rate": 3.9426493427611177e-07,
+      "loss": 0.5841,
+      "step": 962000
+    },
+    {
+      "epoch": 7.02,
+      "learning_rate": 3.738127403480507e-07,
+      "loss": 0.6524,
+      "step": 963000
+    },
+    {
+      "epoch": 7.03,
+      "learning_rate": 3.5390325045304706e-07,
+      "loss": 0.5692,
+      "step": 964000
+    },
+    {
+      "epoch": 7.03,
+      "learning_rate": 3.3453668231809286e-07,
+      "loss": 0.4849,
+      "step": 965000
+    },
+    {
+      "epoch": 7.03,
+      "learning_rate": 3.157132477328628e-07,
+      "loss": 0.4884,
+      "step": 966000
+    },
+    {
+      "epoch": 7.03,
+      "learning_rate": 2.9743315254743833e-07,
+      "loss": 0.5825,
+      "step": 967000
+    },
+    {
+      "epoch": 7.03,
+      "learning_rate": 2.796965966699927e-07,
+      "loss": 0.6197,
+      "step": 968000
+    },
+    {
+      "epoch": 7.03,
+      "learning_rate": 2.625037740646763e-07,
+      "loss": 0.6273,
+      "step": 969000
+    },
+    {
+      "epoch": 7.03,
+      "learning_rate": 2.458548727494292e-07,
+      "loss": 0.5135,
+      "step": 970000
+    },
+    {
+      "epoch": 7.03,
+      "learning_rate": 2.2975007479397738e-07,
+      "loss": 0.5029,
+      "step": 971000
+    },
+    {
+      "epoch": 7.03,
+      "learning_rate": 2.1418955631781202e-07,
+      "loss": 0.5625,
+      "step": 972000
+    },
+    {
+      "epoch": 7.03,
+      "learning_rate": 1.9917348748826335e-07,
+      "loss": 0.5869,
+      "step": 973000
+    },
+    {
+      "epoch": 7.04,
+      "learning_rate": 1.847020325186577e-07,
+      "loss": 0.6541,
+      "step": 974000
+    },
+    {
+      "epoch": 7.04,
+      "learning_rate": 1.7077534966650766e-07,
+      "loss": 0.5637,
+      "step": 975000
+    },
+    {
+      "epoch": 7.04,
+      "learning_rate": 1.5739359123178587e-07,
+      "loss": 0.4865,
+      "step": 976000
+    },
+    {
+      "epoch": 7.04,
+      "learning_rate": 1.4455690355525964e-07,
+      "loss": 0.4846,
+      "step": 977000
+    },
+    {
+      "epoch": 7.04,
+      "learning_rate": 1.3226542701689215e-07,
+      "loss": 0.5801,
+      "step": 978000
+    },
+    {
+      "epoch": 7.04,
+      "learning_rate": 1.2051929603428825e-07,
+      "loss": 0.6182,
+      "step": 979000
+    },
+    {
+      "epoch": 7.04,
+      "learning_rate": 1.0931863906127327e-07,
+      "loss": 0.6277,
+      "step": 980000
+    },
+    {
+      "epoch": 7.04,
+      "learning_rate": 9.866357858642205e-08,
+      "loss": 0.5209,
+      "step": 981000
+    },
+    {
+      "epoch": 7.04,
+      "learning_rate": 8.855423113177664e-08,
+      "loss": 0.5123,
+      "step": 982000
+    },
+    {
+      "epoch": 7.04,
+      "learning_rate": 7.899070725153613e-08,
+      "loss": 0.5457,
+      "step": 983000
+    },
+    {
+      "epoch": 7.05,
+      "learning_rate": 6.997311153086883e-08,
+      "loss": 0.5915,
+      "step": 984000
+    },
+    {
+      "epoch": 7.05,
+      "learning_rate": 6.150154258476315e-08,
+      "loss": 0.6528,
+      "step": 985000
+    },
+    {
+      "epoch": 7.05,
+      "learning_rate": 5.3576093056922906e-08,
+      "loss": 0.5558,
+      "step": 986000
+    },
+    {
+      "epoch": 7.05,
+      "learning_rate": 4.619684961881254e-08,
+      "loss": 0.4924,
+      "step": 987000
+    },
+    {
+      "epoch": 7.05,
+      "learning_rate": 3.936389296864129e-08,
+      "loss": 0.4856,
+      "step": 988000
+    },
+    {
+      "epoch": 7.05,
+      "learning_rate": 3.3077297830541584e-08,
+      "loss": 0.5798,
+      "step": 989000
+    },
+    {
+      "epoch": 7.05,
+      "learning_rate": 2.7337132953697554e-08,
+      "loss": 0.6186,
+      "step": 990000
+    },
+    {
+      "epoch": 7.05,
+      "learning_rate": 2.214346111164556e-08,
+      "loss": 0.6233,
+      "step": 991000
+    },
+    {
+      "epoch": 7.05,
+      "learning_rate": 1.749633910153592e-08,
+      "loss": 0.5258,
+      "step": 992000
+    },
+    {
+      "epoch": 7.05,
+      "learning_rate": 1.3395817743561134e-08,
+      "loss": 0.5187,
+      "step": 993000
+    },
+    {
+      "epoch": 7.06,
+      "learning_rate": 9.841941880361916e-09,
+      "loss": 0.5294,
+      "step": 994000
+    },
+    {
+      "epoch": 7.06,
+      "learning_rate": 6.834750376549792e-09,
+      "loss": 0.5978,
+      "step": 995000
+    },
+    {
+      "epoch": 7.06,
+      "learning_rate": 4.3742761183018784e-09,
+      "loss": 0.6556,
+      "step": 996000
+    },
+    {
+      "epoch": 7.06,
+      "learning_rate": 2.4605460129556445e-09,
+      "loss": 0.5488,
+      "step": 997000
+    },
+    {
+      "epoch": 7.06,
+      "learning_rate": 1.0935809887702154e-09,
+      "loss": 0.4995,
+      "step": 998000
+    },
+    {
+      "epoch": 7.06,
+      "learning_rate": 2.7339599464326627e-10,
+      "loss": 0.486,
+      "step": 999000
+    },
+    {
+      "epoch": 7.06,
+      "learning_rate": 0.0,
+      "loss": 0.5751,
+      "step": 1000000
+    },
+    {
+      "epoch": 7.06,
+      "eval_loss": 0.4293349087238312,
+      "eval_runtime": 11.2697,
+      "eval_samples_per_second": 443.669,
+      "eval_steps_per_second": 3.549,
+      "step": 1000000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
+  "total_flos": 1.684542808527156e+19,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ba23237eabaae268f92a0c5e73a78704a91d8fb58eebea9dce3e91dd8ad4e295
 size 442675755

 version https://git-lfs.github.com/spec/v1
+oid sha256:2f569a8a9d5e623df505612fbda18046bdf5b16ae49848842e493e6b370840ab
 size 442675755

runs/Dec27_23-32-38_t1v-n-2d317d8b-w-0/events.out.tfevents.1672183981.t1v-n-2d317d8b-w-0.162730.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:3bd6bf79762908df4de9c152fef88e518523027acee852f6a469aa4f787d95f6
-size 160972

 version https://git-lfs.github.com/spec/v1
+oid sha256:6f715755d0b69f295a2936a3aaf5da8459e3236aca0c0a87d3a5eb793a8763ea
+size 169248