ihanif commited on
Commit
d053918
1 Parent(s): 45f7a70

End of training

Browse files
all_results.json CHANGED
@@ -1,12 +1,12 @@
1
  {
2
- "epoch": 71.43,
3
- "eval_loss": 2.310106039047241,
4
- "eval_runtime": 206.3711,
5
- "eval_samples_per_second": 2.481,
6
- "eval_steps_per_second": 0.078,
7
- "eval_wer": 485.9866828087167,
8
- "train_loss": 0.4595182914733887,
9
- "train_runtime": 383.5233,
10
- "train_samples_per_second": 83.437,
11
- "train_steps_per_second": 1.304
12
  }
 
1
  {
2
+ "epoch": 100.0,
3
+ "eval_loss": 2.027944564819336,
4
+ "eval_runtime": 230.0349,
5
+ "eval_samples_per_second": 2.226,
6
+ "eval_steps_per_second": 0.07,
7
+ "eval_wer": 497.22306295399517,
8
+ "train_loss": 0.5946499960763114,
9
+ "train_runtime": 764.6061,
10
+ "train_samples_per_second": 58.592,
11
+ "train_steps_per_second": 0.916
12
  }
eval_results.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "epoch": 71.43,
3
- "eval_loss": 2.310106039047241,
4
- "eval_runtime": 206.3711,
5
- "eval_samples_per_second": 2.481,
6
- "eval_steps_per_second": 0.078,
7
- "eval_wer": 485.9866828087167
8
  }
 
1
  {
2
+ "epoch": 100.0,
3
+ "eval_loss": 2.027944564819336,
4
+ "eval_runtime": 230.0349,
5
+ "eval_samples_per_second": 2.226,
6
+ "eval_steps_per_second": 0.07,
7
+ "eval_wer": 497.22306295399517
8
  }
runs/Dec18_15-38-50_129-146-179-188/events.out.tfevents.1671378974.129-146-179-188.133265.2 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d645c14c0b88c954f9b9b9a96365d7eabcd3557f82edaab233f7f427f905a0e5
3
+ size 358
train_results.json CHANGED
@@ -1,7 +1,7 @@
1
  {
2
- "epoch": 71.43,
3
- "train_loss": 0.4595182914733887,
4
- "train_runtime": 383.5233,
5
- "train_samples_per_second": 83.437,
6
- "train_steps_per_second": 1.304
7
  }
 
1
  {
2
+ "epoch": 100.0,
3
+ "train_loss": 0.5946499960763114,
4
+ "train_runtime": 764.6061,
5
+ "train_samples_per_second": 58.592,
6
+ "train_steps_per_second": 0.916
7
  }
trainer_state.json CHANGED
@@ -1,8 +1,8 @@
1
  {
2
- "best_metric": 2.310106039047241,
3
- "best_model_checkpoint": "./checkpoint-500",
4
- "epoch": 71.42857142857143,
5
- "global_step": 500,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
@@ -353,18 +353,156 @@
353
  "step": 500
354
  },
355
  {
356
- "epoch": 71.43,
357
- "step": 500,
358
- "total_flos": 7.5808932950016e+17,
359
- "train_loss": 0.4595182914733887,
360
- "train_runtime": 383.5233,
361
- "train_samples_per_second": 83.437,
362
- "train_steps_per_second": 1.304
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
363
  }
364
  ],
365
- "max_steps": 500,
366
- "num_train_epochs": 72,
367
- "total_flos": 7.5808932950016e+17,
368
  "trial_name": null,
369
  "trial_params": null
370
  }
 
1
  {
2
+ "best_metric": 2.027944564819336,
3
+ "best_model_checkpoint": "./checkpoint-700",
4
+ "epoch": 100.0,
5
+ "global_step": 700,
6
  "is_hyper_param_search": false,
7
  "is_local_process_zero": true,
8
  "is_world_process_zero": true,
 
353
  "step": 500
354
  },
355
  {
356
+ "epoch": 72.86,
357
+ "learning_rate": 2.895e-07,
358
+ "loss": 2.2567,
359
+ "step": 510
360
+ },
361
+ {
362
+ "epoch": 74.29,
363
+ "learning_rate": 2.745e-07,
364
+ "loss": 2.2426,
365
+ "step": 520
366
+ },
367
+ {
368
+ "epoch": 75.71,
369
+ "learning_rate": 2.5949999999999996e-07,
370
+ "loss": 2.2056,
371
+ "step": 530
372
+ },
373
+ {
374
+ "epoch": 77.14,
375
+ "learning_rate": 2.445e-07,
376
+ "loss": 2.2007,
377
+ "step": 540
378
+ },
379
+ {
380
+ "epoch": 78.57,
381
+ "learning_rate": 2.2949999999999998e-07,
382
+ "loss": 2.1627,
383
+ "step": 550
384
+ },
385
+ {
386
+ "epoch": 80.0,
387
+ "learning_rate": 2.1449999999999997e-07,
388
+ "loss": 2.1338,
389
+ "step": 560
390
+ },
391
+ {
392
+ "epoch": 81.43,
393
+ "learning_rate": 1.995e-07,
394
+ "loss": 2.1042,
395
+ "step": 570
396
+ },
397
+ {
398
+ "epoch": 82.86,
399
+ "learning_rate": 1.845e-07,
400
+ "loss": 2.1054,
401
+ "step": 580
402
+ },
403
+ {
404
+ "epoch": 84.29,
405
+ "learning_rate": 1.6949999999999998e-07,
406
+ "loss": 2.0796,
407
+ "step": 590
408
+ },
409
+ {
410
+ "epoch": 85.71,
411
+ "learning_rate": 1.545e-07,
412
+ "loss": 2.0644,
413
+ "step": 600
414
+ },
415
+ {
416
+ "epoch": 85.71,
417
+ "eval_loss": 2.092550039291382,
418
+ "eval_runtime": 188.6334,
419
+ "eval_samples_per_second": 2.714,
420
+ "eval_steps_per_second": 0.085,
421
+ "eval_wer": 491.48002421307507,
422
+ "step": 600
423
+ },
424
+ {
425
+ "epoch": 87.14,
426
+ "learning_rate": 1.395e-07,
427
+ "loss": 2.0308,
428
+ "step": 610
429
+ },
430
+ {
431
+ "epoch": 88.57,
432
+ "learning_rate": 1.2449999999999998e-07,
433
+ "loss": 2.0388,
434
+ "step": 620
435
+ },
436
+ {
437
+ "epoch": 90.0,
438
+ "learning_rate": 1.095e-07,
439
+ "loss": 2.0281,
440
+ "step": 630
441
+ },
442
+ {
443
+ "epoch": 91.43,
444
+ "learning_rate": 9.449999999999999e-08,
445
+ "loss": 2.0146,
446
+ "step": 640
447
+ },
448
+ {
449
+ "epoch": 92.86,
450
+ "learning_rate": 7.95e-08,
451
+ "loss": 2.0052,
452
+ "step": 650
453
+ },
454
+ {
455
+ "epoch": 94.29,
456
+ "learning_rate": 6.45e-08,
457
+ "loss": 1.998,
458
+ "step": 660
459
+ },
460
+ {
461
+ "epoch": 95.71,
462
+ "learning_rate": 4.95e-08,
463
+ "loss": 1.9969,
464
+ "step": 670
465
+ },
466
+ {
467
+ "epoch": 97.14,
468
+ "learning_rate": 3.45e-08,
469
+ "loss": 1.9842,
470
+ "step": 680
471
+ },
472
+ {
473
+ "epoch": 98.57,
474
+ "learning_rate": 1.95e-08,
475
+ "loss": 1.9933,
476
+ "step": 690
477
+ },
478
+ {
479
+ "epoch": 100.0,
480
+ "learning_rate": 4.5e-09,
481
+ "loss": 1.9799,
482
+ "step": 700
483
+ },
484
+ {
485
+ "epoch": 100.0,
486
+ "eval_loss": 2.027944564819336,
487
+ "eval_runtime": 284.3457,
488
+ "eval_samples_per_second": 1.801,
489
+ "eval_steps_per_second": 0.056,
490
+ "eval_wer": 497.22306295399517,
491
+ "step": 700
492
+ },
493
+ {
494
+ "epoch": 100.0,
495
+ "step": 700,
496
+ "total_flos": 1.061073948672e+18,
497
+ "train_loss": 0.5946499960763114,
498
+ "train_runtime": 764.6061,
499
+ "train_samples_per_second": 58.592,
500
+ "train_steps_per_second": 0.916
501
  }
502
  ],
503
+ "max_steps": 700,
504
+ "num_train_epochs": 100,
505
+ "total_flos": 1.061073948672e+18,
506
  "trial_name": null,
507
  "trial_params": null
508
  }