ihanif committed on
Commit
17925c1
1 Parent(s): 674d21a

End of training

Browse files
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 143.0,
3
- "eval_loss": 1.4602868556976318,
4
- "eval_runtime": 1380.6124,
5
- "eval_samples_per_second": 0.371,
6
  "eval_steps_per_second": 0.023,
7
- "eval_wer": 50.56749394673123,
8
- "train_loss": 3.4378880828425483e-07,
9
- "train_runtime": 10.5939,
10
- "train_samples_per_second": 6041.236,
11
- "train_steps_per_second": 94.394
12
  }
 
1
  {
2
+ "epoch": 171.43,
3
+ "eval_loss": 1.4806574583053589,
4
+ "eval_runtime": 1382.3743,
5
+ "eval_samples_per_second": 0.37,
6
  "eval_steps_per_second": 0.023,
7
+ "eval_wer": 50.544794188861985,
8
+ "train_loss": 5.569725840662916e-05,
9
+ "train_runtime": 4535.4947,
10
+ "train_samples_per_second": 16.933,
11
+ "train_steps_per_second": 0.265
12
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 143.0,
3
- "eval_loss": 1.4602868556976318,
4
- "eval_runtime": 1380.6124,
5
- "eval_samples_per_second": 0.371,
6
  "eval_steps_per_second": 0.023,
7
- "eval_wer": 50.56749394673123
8
  }
 
1
  {
2
+ "epoch": 171.43,
3
+ "eval_loss": 1.4806574583053589,
4
+ "eval_runtime": 1382.3743,
5
+ "eval_samples_per_second": 0.37,
6
  "eval_steps_per_second": 0.023,
7
+ "eval_wer": 50.544794188861985
8
  }
runs/Dec10_09-37-22_132-145-129-157/events.out.tfevents.1670671102.132-145-129-157.108751.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3188d522185a9b6ba306435cde03da7574aabecf2970ad61c134bd905ff09937
3
+ size 358
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 143.0,
3
- "train_loss": 3.4378880828425483e-07,
4
- "train_runtime": 10.5939,
5
- "train_samples_per_second": 6041.236,
6
- "train_steps_per_second": 94.394
7
  }
 
1
  {
2
+ "epoch": 171.43,
3
+ "train_loss": 5.569725840662916e-05,
4
+ "train_runtime": 4535.4947,
5
+ "train_samples_per_second": 16.933,
6
+ "train_steps_per_second": 0.265
7
  }
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 50.56749394673123,
3
- "best_model_checkpoint": "./checkpoint-1000",
4
- "epoch": 143.0,
5
- "global_step": 1001,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -338,18 +338,84 @@
338
  "step": 1000
339
  },
340
  {
341
- "epoch": 143.0,
342
- "step": 1001,
343
- "total_flos": 6.290294226518016e+19,
344
- "train_loss": 3.4378880828425483e-07,
345
- "train_runtime": 10.5939,
346
- "train_samples_per_second": 6041.236,
347
- "train_steps_per_second": 94.394
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
348
  }
349
  ],
350
- "max_steps": 1000,
351
- "num_train_epochs": 143,
352
- "total_flos": 6.290294226518016e+19,
353
  "trial_name": null,
354
  "trial_params": null
355
  }
 
1
  {
2
+ "best_metric": 50.544794188861985,
3
+ "best_model_checkpoint": "./checkpoint-1200",
4
+ "epoch": 171.42857142857142,
5
+ "global_step": 1200,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
338
  "step": 1000
339
  },
340
  {
341
+ "epoch": 146.43,
342
+ "learning_rate": 1.4957983193277311e-06,
343
+ "loss": 0.0003,
344
+ "step": 1025
345
+ },
346
+ {
347
+ "epoch": 150.0,
348
+ "learning_rate": 1.2857142857142856e-06,
349
+ "loss": 0.0003,
350
+ "step": 1050
351
+ },
352
+ {
353
+ "epoch": 153.57,
354
+ "learning_rate": 1.0756302521008405e-06,
355
+ "loss": 0.0003,
356
+ "step": 1075
357
+ },
358
+ {
359
+ "epoch": 157.14,
360
+ "learning_rate": 8.65546218487395e-07,
361
+ "loss": 0.0003,
362
+ "step": 1100
363
+ },
364
+ {
365
+ "epoch": 157.14,
366
+ "eval_loss": 1.4750263690948486,
367
+ "eval_runtime": 1385.2093,
368
+ "eval_samples_per_second": 0.37,
369
+ "eval_steps_per_second": 0.023,
370
+ "eval_wer": 50.559927360774815,
371
+ "step": 1100
372
+ },
373
+ {
374
+ "epoch": 160.71,
375
+ "learning_rate": 6.554621848739497e-07,
376
+ "loss": 0.0003,
377
+ "step": 1125
378
+ },
379
+ {
380
+ "epoch": 164.29,
381
+ "learning_rate": 4.4537815126050424e-07,
382
+ "loss": 0.0003,
383
+ "step": 1150
384
+ },
385
+ {
386
+ "epoch": 167.86,
387
+ "learning_rate": 2.3529411764705883e-07,
388
+ "loss": 0.0003,
389
+ "step": 1175
390
+ },
391
+ {
392
+ "epoch": 171.43,
393
+ "learning_rate": 2.521008403361345e-08,
394
+ "loss": 0.0003,
395
+ "step": 1200
396
+ },
397
+ {
398
+ "epoch": 171.43,
399
+ "eval_loss": 1.4806574583053589,
400
+ "eval_runtime": 1382.0563,
401
+ "eval_samples_per_second": 0.37,
402
+ "eval_steps_per_second": 0.023,
403
+ "eval_wer": 50.544794188861985,
404
+ "step": 1200
405
+ },
406
+ {
407
+ "epoch": 171.43,
408
+ "step": 1200,
409
+ "total_flos": 7.541555843137536e+19,
410
+ "train_loss": 5.569725840662916e-05,
411
+ "train_runtime": 4535.4947,
412
+ "train_samples_per_second": 16.933,
413
+ "train_steps_per_second": 0.265
414
  }
415
  ],
416
+ "max_steps": 1200,
417
+ "num_train_epochs": 172,
418
+ "total_flos": 7.541555843137536e+19,
419
  "trial_name": null,
420
  "trial_params": null
421
  }