Training in progress, step 900000

Browse files

Files changed (14) hide show

last-checkpoint/optimizer.pt +1 -1
last-checkpoint/pytorch_model.bin +1 -1
last-checkpoint/rng_state_0.pth +1 -1
last-checkpoint/rng_state_1.pth +1 -1
last-checkpoint/rng_state_2.pth +1 -1
last-checkpoint/rng_state_3.pth +1 -1
last-checkpoint/rng_state_4.pth +1 -1
last-checkpoint/rng_state_5.pth +1 -1
last-checkpoint/rng_state_6.pth +1 -1
last-checkpoint/rng_state_7.pth +1 -1
last-checkpoint/scheduler.pt +1 -1
last-checkpoint/trainer_state.json +311 -3
pytorch_model.bin +1 -1
runs/Nov21_18-14-51_t1v-n-088af867-w-0/events.out.tfevents.1669054551.t1v-n-088af867-w-0.42571.0 +2 -2

last-checkpoint/optimizer.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:caa2f8cc5bf01bf8a65d9abc9a5aa0a6c8d16d885a8db9890456a4f3744ed75d
 size 996067161

 version https://git-lfs.github.com/spec/v1
+oid sha256:ceb962255d325651d0214ab53a3240a3678f6fbca280bc659bf8ea957591d0fe
 size 996067161

last-checkpoint/pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:48d1bb830ab0cf49c6dc97e0fa65b716200e0db90709579694dcdd84be731092
 size 498046827

 version https://git-lfs.github.com/spec/v1
+oid sha256:6f143818755ca223dc9c8f4be31627833f9608ced576a86c60efb1a8a35eee9b
 size 498046827

last-checkpoint/rng_state_0.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:18b90d82a36c74f11c3a8e30a225b762c5734dea8af8c114983537d28d1e74eb
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:724e0436de35575f932af32259f45221d8d4e820a80fc9545c419895a08bab8c
 size 13611

last-checkpoint/rng_state_1.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b9721d3221605a3b0c84cb342b3b22be8c92667833f38a0e0c0b0c482c0f158e
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:9d66e0aa7a19ca2999a68f9b99044a10bdc77d1d2d40a7643a5aedce7e6e9bb3
 size 13611

last-checkpoint/rng_state_2.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:18b90d82a36c74f11c3a8e30a225b762c5734dea8af8c114983537d28d1e74eb
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:724e0436de35575f932af32259f45221d8d4e820a80fc9545c419895a08bab8c
 size 13611

last-checkpoint/rng_state_3.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5546bd3c2735471d80b9f1c6036e5d550929c5eb62e6e812836fa4b30e443f60
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:abe4a94ffd13ccadccdac99f40e8cab31975f7789a7c1dd25a91977835d3c564
 size 13611

last-checkpoint/rng_state_4.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ef92499627b7fe22f16323dff86b84d4e1fbf3ac771244425fe27bed83b8f5b2
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:66f39c6bca81d98dfa2129090d6cb41bbeb1dd411be9dc98d08e7c69d7e2a030
 size 13611

last-checkpoint/rng_state_5.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:5546bd3c2735471d80b9f1c6036e5d550929c5eb62e6e812836fa4b30e443f60
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:abe4a94ffd13ccadccdac99f40e8cab31975f7789a7c1dd25a91977835d3c564
 size 13611

last-checkpoint/rng_state_6.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ef92499627b7fe22f16323dff86b84d4e1fbf3ac771244425fe27bed83b8f5b2
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:66f39c6bca81d98dfa2129090d6cb41bbeb1dd411be9dc98d08e7c69d7e2a030
 size 13611

last-checkpoint/rng_state_7.pth CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:18b90d82a36c74f11c3a8e30a225b762c5734dea8af8c114983537d28d1e74eb
 size 13611

 version https://git-lfs.github.com/spec/v1
+oid sha256:724e0436de35575f932af32259f45221d8d4e820a80fc9545c419895a08bab8c
 size 13611

last-checkpoint/scheduler.pt CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:adedebe0cc7e07de957a9e2967d6e9c3934a9fdca3245f46a29d125e5e36192e
 size 623

 version https://git-lfs.github.com/spec/v1
+oid sha256:98fbf159ce1bb90afdab5d6ac994b4ab633fc21d8eb6c04c41c7f3a26253e5b5
 size 623

last-checkpoint/trainer_state.json CHANGED Viewed

@@ -1,8 +1,8 @@
 {
   "best_metric": null,
   "best_model_checkpoint": null,
-  "epoch": 3.048882,
-  "global_step": 850000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
@@ -5242,11 +5242,319 @@
       "eval_samples_per_second": 541.935,
       "eval_steps_per_second": 2.168,
       "step": 850000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
-  "total_flos": 1.4321605341819175e+19,
   "trial_name": null,
   "trial_params": null
 }

 {
   "best_metric": null,
   "best_model_checkpoint": null,
+  "epoch": 3.098882,
+  "global_step": 900000,
   "is_hyper_param_search": false,
   "is_local_process_zero": true,
   "is_world_process_zero": true,
       "eval_samples_per_second": 541.935,
       "eval_steps_per_second": 2.168,
       "step": 850000
+    },
+    {
+      "epoch": 3.05,
+      "learning_rate": 5.947856562792925e-06,
+      "loss": 0.7914,
+      "step": 851000
+    },
+    {
+      "epoch": 3.05,
+      "learning_rate": 5.869882433093155e-06,
+      "loss": 0.7817,
+      "step": 852000
+    },
+    {
+      "epoch": 3.05,
+      "learning_rate": 5.79239090328883e-06,
+      "loss": 0.8012,
+      "step": 853000
+    },
+    {
+      "epoch": 3.05,
+      "learning_rate": 5.715382820814885e-06,
+      "loss": 0.8188,
+      "step": 854000
+    },
+    {
+      "epoch": 3.05,
+      "learning_rate": 5.6388590278194096e-06,
+      "loss": 0.8034,
+      "step": 855000
+    },
+    {
+      "epoch": 3.05,
+      "learning_rate": 5.562820361154314e-06,
+      "loss": 0.8152,
+      "step": 856000
+    },
+    {
+      "epoch": 3.06,
+      "learning_rate": 5.48726765236629e-06,
+      "loss": 0.8177,
+      "step": 857000
+    },
+    {
+      "epoch": 3.06,
+      "learning_rate": 5.412201727687644e-06,
+      "loss": 0.8338,
+      "step": 858000
+    },
+    {
+      "epoch": 3.06,
+      "learning_rate": 5.337623408027293e-06,
+      "loss": 0.8226,
+      "step": 859000
+    },
+    {
+      "epoch": 3.06,
+      "learning_rate": 5.263533508961827e-06,
+      "loss": 0.8242,
+      "step": 860000
+    },
+    {
+      "epoch": 3.06,
+      "learning_rate": 5.1899328407264855e-06,
+      "loss": 0.8299,
+      "step": 861000
+    },
+    {
+      "epoch": 3.06,
+      "learning_rate": 5.116822208206396e-06,
+      "loss": 0.8383,
+      "step": 862000
+    },
+    {
+      "epoch": 3.06,
+      "learning_rate": 5.044202410927706e-06,
+      "loss": 0.8071,
+      "step": 863000
+    },
+    {
+      "epoch": 3.06,
+      "learning_rate": 4.972074243048897e-06,
+      "loss": 0.8189,
+      "step": 864000
+    },
+    {
+      "epoch": 3.06,
+      "learning_rate": 4.900438493352055e-06,
+      "loss": 0.8109,
+      "step": 865000
+    },
+    {
+      "epoch": 3.06,
+      "learning_rate": 4.829295945234258e-06,
+      "loss": 0.7964,
+      "step": 866000
+    },
+    {
+      "epoch": 3.07,
+      "learning_rate": 4.758647376699032e-06,
+      "loss": 0.8089,
+      "step": 867000
+    },
+    {
+      "epoch": 3.07,
+      "learning_rate": 4.688493560347773e-06,
+      "loss": 0.7951,
+      "step": 868000
+    },
+    {
+      "epoch": 3.07,
+      "learning_rate": 4.618835263371396e-06,
+      "loss": 0.7972,
+      "step": 869000
+    },
+    {
+      "epoch": 3.07,
+      "learning_rate": 4.549673247541875e-06,
+      "loss": 0.7989,
+      "step": 870000
+    },
+    {
+      "epoch": 3.07,
+      "learning_rate": 4.48100826920394e-06,
+      "loss": 0.8125,
+      "step": 871000
+    },
+    {
+      "epoch": 3.07,
+      "learning_rate": 4.412841079266777e-06,
+      "loss": 0.82,
+      "step": 872000
+    },
+    {
+      "epoch": 3.07,
+      "learning_rate": 4.3451724231958644e-06,
+      "loss": 0.8155,
+      "step": 873000
+    },
+    {
+      "epoch": 3.07,
+      "learning_rate": 4.27800304100478e-06,
+      "loss": 0.8153,
+      "step": 874000
+    },
+    {
+      "epoch": 3.07,
+      "learning_rate": 4.2113336672471245e-06,
+      "loss": 0.8211,
+      "step": 875000
+    },
+    {
+      "epoch": 3.07,
+      "learning_rate": 4.145165031008508e-06,
+      "loss": 0.8203,
+      "step": 876000
+    },
+    {
+      "epoch": 3.08,
+      "learning_rate": 4.079497855898501e-06,
+      "loss": 0.8173,
+      "step": 877000
+    },
+    {
+      "epoch": 3.08,
+      "learning_rate": 4.01433286004283e-06,
+      "loss": 0.8147,
+      "step": 878000
+    },
+    {
+      "epoch": 3.08,
+      "learning_rate": 3.949670756075447e-06,
+      "loss": 0.8209,
+      "step": 879000
+    },
+    {
+      "epoch": 3.08,
+      "learning_rate": 3.885512251130763e-06,
+      "loss": 0.8282,
+      "step": 880000
+    },
+    {
+      "epoch": 3.08,
+      "learning_rate": 3.821858046835913e-06,
+      "loss": 0.8172,
+      "step": 881000
+    },
+    {
+      "epoch": 3.08,
+      "learning_rate": 3.75870883930306e-06,
+      "loss": 0.814,
+      "step": 882000
+    },
+    {
+      "epoch": 3.08,
+      "learning_rate": 3.696065319121833e-06,
+      "loss": 0.82,
+      "step": 883000
+    },
+    {
+      "epoch": 3.08,
+      "learning_rate": 3.6339281713517303e-06,
+      "loss": 0.8245,
+      "step": 884000
+    },
+    {
+      "epoch": 3.08,
+      "learning_rate": 3.5722980755146517e-06,
+      "loss": 0.8146,
+      "step": 885000
+    },
+    {
+      "epoch": 3.08,
+      "learning_rate": 3.511175705587433e-06,
+      "loss": 0.8187,
+      "step": 886000
+    },
+    {
+      "epoch": 3.09,
+      "learning_rate": 3.4505617299945336e-06,
+      "loss": 0.8271,
+      "step": 887000
+    },
+    {
+      "epoch": 3.09,
+      "learning_rate": 3.390456811600673e-06,
+      "loss": 0.8342,
+      "step": 888000
+    },
+    {
+      "epoch": 3.09,
+      "learning_rate": 3.3308616077036115e-06,
+      "loss": 0.8219,
+      "step": 889000
+    },
+    {
+      "epoch": 3.09,
+      "learning_rate": 3.271776770026963e-06,
+      "loss": 0.816,
+      "step": 890000
+    },
+    {
+      "epoch": 3.09,
+      "learning_rate": 3.213202944713023e-06,
+      "loss": 0.8273,
+      "step": 891000
+    },
+    {
+      "epoch": 3.09,
+      "learning_rate": 3.155140772315773e-06,
+      "loss": 0.8167,
+      "step": 892000
+    },
+    {
+      "epoch": 3.09,
+      "learning_rate": 3.0975908877938277e-06,
+      "loss": 0.8174,
+      "step": 893000
+    },
+    {
+      "epoch": 3.09,
+      "learning_rate": 3.040553920503503e-06,
+      "loss": 0.8112,
+      "step": 894000
+    },
+    {
+      "epoch": 3.09,
+      "learning_rate": 2.9840304941919415e-06,
+      "loss": 0.7996,
+      "step": 895000
+    },
+    {
+      "epoch": 3.09,
+      "learning_rate": 2.928021226990263e-06,
+      "loss": 0.7863,
+      "step": 896000
+    },
+    {
+      "epoch": 3.1,
+      "learning_rate": 2.8725267314068495e-06,
+      "loss": 0.8069,
+      "step": 897000
+    },
+    {
+      "epoch": 3.1,
+      "learning_rate": 2.817547614320615e-06,
+      "loss": 0.7963,
+      "step": 898000
+    },
+    {
+      "epoch": 3.1,
+      "learning_rate": 2.7630844769743757e-06,
+      "loss": 0.7979,
+      "step": 899000
+    },
+    {
+      "epoch": 3.1,
+      "learning_rate": 2.7091379149682685e-06,
+      "loss": 0.7956,
+      "step": 900000
+    },
+    {
+      "epoch": 3.1,
+      "eval_loss": 0.75617516040802,
+      "eval_runtime": 21.976,
+      "eval_samples_per_second": 455.042,
+      "eval_steps_per_second": 1.82,
+      "step": 900000
     }
   ],
   "max_steps": 1000000,
   "num_train_epochs": 9223372036854775807,
+  "total_flos": 1.5164052219310375e+19,
   "trial_name": null,
   "trial_params": null
 }

pytorch_model.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:48d1bb830ab0cf49c6dc97e0fa65b716200e0db90709579694dcdd84be731092
 size 498046827

 version https://git-lfs.github.com/spec/v1
+oid sha256:6f143818755ca223dc9c8f4be31627833f9608ced576a86c60efb1a8a35eee9b
 size 498046827

runs/Nov21_18-14-51_t1v-n-088af867-w-0/events.out.tfevents.1669054551.t1v-n-088af867-w-0.42571.0 CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c1b3c3dcaec4f582a74823f3a86224f10cd2475a549becf37838082b475e22b7
-size 94784

 version https://git-lfs.github.com/spec/v1
+oid sha256:faa77f32c37cdbd4a872c23d973d2ff518983bbab54618f50edb8ccbf3ec64c0
+size 103060