mattbonnell commited on
Commit
e876662
·
verified ·
1 Parent(s): bf6962a

Training in progress, step 8000, checkpoint

Browse files
last-checkpoint/global_step8000/mp_rank_00_model_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c58e87c0f03991d738e3335bae09acac1c1dd7681fc36f3d913b1d0ab4fd95a2
3
+ size 197282509
last-checkpoint/global_step8000/zero_pp_rank_0_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:21be6599b774db66dedc1b7b5eac08b789506bba6c492917c2021a6862c8578d
3
+ size 180416968
last-checkpoint/global_step8000/zero_pp_rank_1_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bf491a3ec6351e35110667cef3d18242de4dfff3f81721ddb42590e1a51cf795
3
+ size 180416776
last-checkpoint/global_step8000/zero_pp_rank_2_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c9c03b48010e9d4b0adb5eaa84d78f062729e9fb40b05e49ec71c7670a67b111
3
+ size 180416776
last-checkpoint/global_step8000/zero_pp_rank_3_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2e5b1cf33c9473bc545551cc835151766ce57be522c0687f70931e375eb47c66
3
+ size 180416904
last-checkpoint/global_step8000/zero_pp_rank_4_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a38dd41f89589d0faf33c397f98c618a9cce62a597a7964a499f42d586ed6c08
3
+ size 180416712
last-checkpoint/global_step8000/zero_pp_rank_5_mp_rank_00_optim_states.pt ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ac4a14cde9deb49575b5dbeb11aa1e0c75610607c361a8494f726651ba46b8b
3
+ size 180417096
last-checkpoint/latest CHANGED
@@ -1 +1 @@
1
- global_step7500
 
1
+ global_step8000
last-checkpoint/model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5c706dc1178504f6752d44e929c9d8cc9de149880b704897aa6bf74772ef87e1
3
  size 188836816
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e2ccd66b0d3eac61fdd022c65f61fec2848db2ff54d1c43e2a14a9f026c0394
3
  size 188836816
last-checkpoint/rng_state_0.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c816547398c9d0c74280904d885bc91a841220695d82f2bc47c4c7abf13ab004
3
  size 15536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ea500e099e374ab8f40a21f5238cc4b753325af0d8cddf9294790e0f04153e7a
3
  size 15536
last-checkpoint/rng_state_1.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5ba2aff0e2022b2a3436dfb2c1c98f832679546299b17ebacc71b2eb1f71e7c0
3
- size 15472
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11e26d2216e18df43db8309fcc95dba493bd2243b1ee081f23d44d1d51767fbd
3
+ size 15536
last-checkpoint/rng_state_2.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:21e5d58d64a65caff661f48ed778a1cb549164f46e7b194156674f2eb7f3b6a8
3
  size 15536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a5dbf9199d9fbbe4519352983976ccd7fc8c6c8f988fbb95736f5368013dce0c
3
  size 15536
last-checkpoint/rng_state_3.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c1d0ad31b3a46ded17b3d98149040c14eccbf6a59c2b8f783c377ab81e0ada96
3
  size 15536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:83e6add4149c20ee1bbd11a39e647cd83b6d5e92df39787f3e4dd6d4c2c9362a
3
  size 15536
last-checkpoint/rng_state_4.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:8a4b45074227cc785b28692a49aaa5abb18222039da56fa536ad532e5a17f55f
3
  size 15536
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:fdd4141f9ac586703ff022ae4a72874450b5b0b99397d5a0cb6dd7caffc6ebd4
3
  size 15536
last-checkpoint/rng_state_5.pth CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:65ce51281925c22814f6a24cbafab5e4eed2ab27e1b0a722b553ca852278e137
3
- size 15600
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ca1450055d7dfb8743ae0d1ace8a5ace9c1bef6e7e75026e510a4b2960a133be
3
+ size 15472
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:27c642e391a124150c03fa09402ee539bc1d9ff837a5db4c2246095593216182
3
  size 1256
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cad4268cfb586000e1a64ea1e79a3a6d50e4d70a575ea40791dc76489a8bd7bb
3
  size 1256
last-checkpoint/trainer_state.json CHANGED
@@ -1,9 +1,9 @@
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
- "epoch": 202.7027027027027,
5
  "eval_steps": 1500,
6
- "global_step": 7500,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
@@ -1093,6 +1093,76 @@
1093
  "eval_steps_per_second": 0.168,
1094
  "eval_wer": 0.19167904903417535,
1095
  "step": 7500
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1096
  }
1097
  ],
1098
  "logging_steps": 50,
@@ -1112,7 +1182,7 @@
1112
  "attributes": {}
1113
  }
1114
  },
1115
- "total_flos": 2.1053996452835597e+20,
1116
  "train_batch_size": 64,
1117
  "trial_name": null,
1118
  "trial_params": null
 
1
  {
2
  "best_metric": null,
3
  "best_model_checkpoint": null,
4
+ "epoch": 216.21621621621622,
5
  "eval_steps": 1500,
6
+ "global_step": 8000,
7
  "is_hyper_param_search": false,
8
  "is_local_process_zero": true,
9
  "is_world_process_zero": true,
 
1093
  "eval_steps_per_second": 0.168,
1094
  "eval_wer": 0.19167904903417535,
1095
  "step": 7500
1096
+ },
1097
+ {
1098
+ "epoch": 204.05405405405406,
1099
+ "grad_norm": 0.3734581470489502,
1100
+ "learning_rate": 0.0001,
1101
+ "loss": 0.0234,
1102
+ "step": 7550
1103
+ },
1104
+ {
1105
+ "epoch": 205.40540540540542,
1106
+ "grad_norm": 0.4595019519329071,
1107
+ "learning_rate": 0.0001,
1108
+ "loss": 0.0229,
1109
+ "step": 7600
1110
+ },
1111
+ {
1112
+ "epoch": 206.75675675675674,
1113
+ "grad_norm": 0.2700786888599396,
1114
+ "learning_rate": 0.0001,
1115
+ "loss": 0.0227,
1116
+ "step": 7650
1117
+ },
1118
+ {
1119
+ "epoch": 208.1081081081081,
1120
+ "grad_norm": 0.24691906571388245,
1121
+ "learning_rate": 0.0001,
1122
+ "loss": 0.0229,
1123
+ "step": 7700
1124
+ },
1125
+ {
1126
+ "epoch": 209.45945945945945,
1127
+ "grad_norm": 0.3328978717327118,
1128
+ "learning_rate": 0.0001,
1129
+ "loss": 0.0217,
1130
+ "step": 7750
1131
+ },
1132
+ {
1133
+ "epoch": 210.8108108108108,
1134
+ "grad_norm": 0.286808580160141,
1135
+ "learning_rate": 0.0001,
1136
+ "loss": 0.0205,
1137
+ "step": 7800
1138
+ },
1139
+ {
1140
+ "epoch": 212.16216216216216,
1141
+ "grad_norm": 0.27080458402633667,
1142
+ "learning_rate": 0.0001,
1143
+ "loss": 0.0202,
1144
+ "step": 7850
1145
+ },
1146
+ {
1147
+ "epoch": 213.51351351351352,
1148
+ "grad_norm": 0.398179292678833,
1149
+ "learning_rate": 0.0001,
1150
+ "loss": 0.0215,
1151
+ "step": 7900
1152
+ },
1153
+ {
1154
+ "epoch": 214.86486486486487,
1155
+ "grad_norm": 0.3541491627693176,
1156
+ "learning_rate": 0.0001,
1157
+ "loss": 0.0218,
1158
+ "step": 7950
1159
+ },
1160
+ {
1161
+ "epoch": 216.21621621621622,
1162
+ "grad_norm": 0.3138297498226166,
1163
+ "learning_rate": 0.0001,
1164
+ "loss": 0.022,
1165
+ "step": 8000
1166
  }
1167
  ],
1168
  "logging_steps": 50,
 
1182
  "attributes": {}
1183
  }
1184
  },
1185
+ "total_flos": 2.2456068419295904e+20,
1186
  "train_batch_size": 64,
1187
  "trial_name": null,
1188
  "trial_params": null