ihanif committed on
Commit
9c0d886
1 Parent(s): 4b34f91

End of training

Browse files
all_results.json CHANGED
@@ -1,7 +1,12 @@
1
  {
2
- "epoch": 0.97,
3
- "train_loss": 0.4665303599834442,
4
- "train_runtime": 6285.9399,
5
- "train_samples_per_second": 1.018,
6
- "train_steps_per_second": 0.032
 
 
 
 
 
7
  }
 
1
  {
2
+ "epoch": 1.45,
3
+ "eval_loss": 0.46850404143333435,
4
+ "eval_runtime": 2554.9052,
5
+ "eval_samples_per_second": 1.292,
6
+ "eval_steps_per_second": 0.081,
7
+ "eval_wer": 26.980130911344357,
8
+ "train_loss": 0.08693385044733683,
9
+ "train_runtime": 3481.8761,
10
+ "train_samples_per_second": 2.757,
11
+ "train_steps_per_second": 0.086
12
  }
eval_results.json ADDED
@@ -0,0 +1,8 @@
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "epoch": 1.45,
3
+ "eval_loss": 0.46850404143333435,
4
+ "eval_runtime": 2554.9052,
5
+ "eval_samples_per_second": 1.292,
6
+ "eval_steps_per_second": 0.081,
7
+ "eval_wer": 26.980130911344357
8
+ }
runs/Dec11_14-58-14_150-136-41-252/events.out.tfevents.1670777055.150-136-41-252.369844.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c821bdf4fc61a8c11243fa75bd5c3fb6af8cfd4899b9a8d23d8f3f8cfcd9e3b
3
+ size 358
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 0.97,
3
- "train_loss": 0.4665303599834442,
4
- "train_runtime": 6285.9399,
5
- "train_samples_per_second": 1.018,
6
- "train_steps_per_second": 0.032
7
  }
 
1
  {
2
+ "epoch": 1.45,
3
+ "train_loss": 0.08693385044733683,
4
+ "train_runtime": 3481.8761,
5
+ "train_samples_per_second": 2.757,
6
+ "train_steps_per_second": 0.086
7
  }
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
  "best_metric": 26.980130911344357,
3
  "best_model_checkpoint": "./checkpoint-200",
4
- "epoch": 0.966183574879227,
5
- "global_step": 200,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -146,18 +146,87 @@
146
  "step": 200
147
  },
148
  {
149
- "epoch": 0.97,
150
- "step": 200,
151
- "total_flos": 6.531871408128e+18,
152
- "train_loss": 0.4665303599834442,
153
- "train_runtime": 6285.9399,
154
- "train_samples_per_second": 1.018,
155
- "train_steps_per_second": 0.032
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
156
  }
157
  ],
158
- "max_steps": 200,
159
- "num_train_epochs": 1,
160
- "total_flos": 6.531871408128e+18,
161
  "trial_name": null,
162
  "trial_params": null
163
  }
 
1
  {
2
  "best_metric": 26.980130911344357,
3
  "best_model_checkpoint": "./checkpoint-200",
4
+ "epoch": 1.4492753623188406,
5
+ "global_step": 300,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
146
  "step": 200
147
  },
148
  {
149
+ "epoch": 1.01,
150
+ "learning_rate": 3.538461538461539e-06,
151
+ "loss": 0.3721,
152
+ "step": 210
153
+ },
154
+ {
155
+ "epoch": 1.06,
156
+ "learning_rate": 3.153846153846154e-06,
157
+ "loss": 0.2392,
158
+ "step": 220
159
+ },
160
+ {
161
+ "epoch": 1.11,
162
+ "learning_rate": 2.7692307692307697e-06,
163
+ "loss": 0.2854,
164
+ "step": 230
165
+ },
166
+ {
167
+ "epoch": 1.16,
168
+ "learning_rate": 2.384615384615385e-06,
169
+ "loss": 0.2517,
170
+ "step": 240
171
+ },
172
+ {
173
+ "epoch": 1.21,
174
+ "learning_rate": 2.0000000000000003e-06,
175
+ "loss": 0.2506,
176
+ "step": 250
177
+ },
178
+ {
179
+ "epoch": 1.26,
180
+ "learning_rate": 1.6153846153846157e-06,
181
+ "loss": 0.2462,
182
+ "step": 260
183
+ },
184
+ {
185
+ "epoch": 1.3,
186
+ "learning_rate": 1.230769230769231e-06,
187
+ "loss": 0.2179,
188
+ "step": 270
189
+ },
190
+ {
191
+ "epoch": 1.35,
192
+ "learning_rate": 8.461538461538463e-07,
193
+ "loss": 0.2579,
194
+ "step": 280
195
+ },
196
+ {
197
+ "epoch": 1.4,
198
+ "learning_rate": 4.615384615384616e-07,
199
+ "loss": 0.2446,
200
+ "step": 290
201
+ },
202
+ {
203
+ "epoch": 1.45,
204
+ "learning_rate": 7.692307692307694e-08,
205
+ "loss": 0.2426,
206
+ "step": 300
207
+ },
208
+ {
209
+ "epoch": 1.45,
210
+ "eval_loss": 0.4635893404483795,
211
+ "eval_runtime": 2857.1857,
212
+ "eval_samples_per_second": 1.156,
213
+ "eval_steps_per_second": 0.072,
214
+ "eval_wer": 28.502265773267748,
215
+ "step": 300
216
+ },
217
+ {
218
+ "epoch": 1.45,
219
+ "step": 300,
220
+ "total_flos": 9.77943622385664e+18,
221
+ "train_loss": 0.08693385044733683,
222
+ "train_runtime": 3481.8761,
223
+ "train_samples_per_second": 2.757,
224
+ "train_steps_per_second": 0.086
225
  }
226
  ],
227
+ "max_steps": 300,
228
+ "num_train_epochs": 2,
229
+ "total_flos": 9.77943622385664e+18,
230
  "trial_name": null,
231
  "trial_params": null
232
  }