kid-whisper-small-myst / trainer_state.json
aadel4's picture
Upload 9 files
c46adfd
raw
history blame
No virus
4.73 kB
{
"best_metric": 9.06746912032304,
"best_model_checkpoint": "./fine-tuned-whisper/openai/whisper-small/lr_1e-05_warmup_500_epochs_0_batch_32_grad_acc_1_max_steps_10000/dataset_myst/2023-09-09_11-20-19/checkpoint-1500",
"epoch": 4.0,
"eval_steps": 500,
"global_step": 2500,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.16,
"learning_rate": 1.94e-06,
"loss": 1.7092,
"step": 100
},
{
"epoch": 0.32,
"learning_rate": 3.94e-06,
"loss": 0.6661,
"step": 200
},
{
"epoch": 0.48,
"learning_rate": 5.94e-06,
"loss": 0.4875,
"step": 300
},
{
"epoch": 0.64,
"learning_rate": 7.94e-06,
"loss": 0.4176,
"step": 400
},
{
"epoch": 0.8,
"learning_rate": 9.940000000000001e-06,
"loss": 0.3943,
"step": 500
},
{
"epoch": 0.8,
"eval_loss": 0.23756489157676697,
"eval_runtime": 611.1384,
"eval_samples_per_second": 5.171,
"eval_steps_per_second": 0.324,
"eval_wer": 10.145123229361573,
"step": 500
},
{
"epoch": 0.96,
"learning_rate": 9.897894736842107e-06,
"loss": 0.3814,
"step": 600
},
{
"epoch": 1.12,
"learning_rate": 9.79263157894737e-06,
"loss": 0.3181,
"step": 700
},
{
"epoch": 1.28,
"learning_rate": 9.687368421052632e-06,
"loss": 0.3291,
"step": 800
},
{
"epoch": 1.44,
"learning_rate": 9.582105263157897e-06,
"loss": 0.324,
"step": 900
},
{
"epoch": 1.6,
"learning_rate": 9.476842105263158e-06,
"loss": 0.3302,
"step": 1000
},
{
"epoch": 1.6,
"eval_loss": 0.22787314653396606,
"eval_runtime": 601.1188,
"eval_samples_per_second": 5.257,
"eval_steps_per_second": 0.329,
"eval_wer": 9.153630009709175,
"step": 1000
},
{
"epoch": 1.76,
"learning_rate": 9.371578947368421e-06,
"loss": 0.3232,
"step": 1100
},
{
"epoch": 1.92,
"learning_rate": 9.266315789473685e-06,
"loss": 0.3179,
"step": 1200
},
{
"epoch": 2.08,
"learning_rate": 9.161052631578948e-06,
"loss": 0.2809,
"step": 1300
},
{
"epoch": 2.24,
"learning_rate": 9.055789473684211e-06,
"loss": 0.2445,
"step": 1400
},
{
"epoch": 2.4,
"learning_rate": 8.950526315789474e-06,
"loss": 0.2523,
"step": 1500
},
{
"epoch": 2.4,
"eval_loss": 0.23648202419281006,
"eval_runtime": 599.2062,
"eval_samples_per_second": 5.274,
"eval_steps_per_second": 0.33,
"eval_wer": 9.06746912032304,
"step": 1500
},
{
"epoch": 2.56,
"learning_rate": 8.845263157894738e-06,
"loss": 0.2481,
"step": 1600
},
{
"epoch": 2.72,
"learning_rate": 8.740000000000001e-06,
"loss": 0.2596,
"step": 1700
},
{
"epoch": 2.88,
"learning_rate": 8.634736842105264e-06,
"loss": 0.256,
"step": 1800
},
{
"epoch": 3.04,
"learning_rate": 8.529473684210528e-06,
"loss": 0.2419,
"step": 1900
},
{
"epoch": 3.2,
"learning_rate": 8.42421052631579e-06,
"loss": 0.1874,
"step": 2000
},
{
"epoch": 3.2,
"eval_loss": 0.24421058595180511,
"eval_runtime": 604.8436,
"eval_samples_per_second": 5.224,
"eval_steps_per_second": 0.327,
"eval_wer": 9.441690296612077,
"step": 2000
},
{
"epoch": 3.36,
"learning_rate": 8.318947368421052e-06,
"loss": 0.1942,
"step": 2100
},
{
"epoch": 3.52,
"learning_rate": 8.213684210526316e-06,
"loss": 0.2072,
"step": 2200
},
{
"epoch": 3.68,
"learning_rate": 8.10842105263158e-06,
"loss": 0.1809,
"step": 2300
},
{
"epoch": 3.84,
"learning_rate": 8.003157894736842e-06,
"loss": 0.1791,
"step": 2400
},
{
"epoch": 4.0,
"learning_rate": 7.897894736842106e-06,
"loss": 0.2087,
"step": 2500
},
{
"epoch": 4.0,
"eval_loss": 0.2534370422363281,
"eval_runtime": 605.6058,
"eval_samples_per_second": 5.218,
"eval_steps_per_second": 0.327,
"eval_wer": 9.089973830237328,
"step": 2500
}
],
"logging_steps": 100,
"max_steps": 10000,
"num_train_epochs": 16,
"save_steps": 500,
"total_flos": 2.307182558478336e+19,
"trial_name": null,
"trial_params": null
}