wavlm-large-korean-ipa / trainer_state.json
speech31's picture
upload model
daa24c6
raw
history blame contribute delete
No virus
13.1 kB
{
"best_metric": 0.17176076769828796,
"best_model_checkpoint": "wavlm-korean-phoneme-v3/checkpoint-7500",
"epoch": 11.980047885075818,
"global_step": 7500,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.16,
"learning_rate": 2.9999999999999997e-05,
"loss": 5.4024,
"step": 100
},
{
"epoch": 0.32,
"learning_rate": 5.9999999999999995e-05,
"loss": 2.7142,
"step": 200
},
{
"epoch": 0.48,
"learning_rate": 8.999999999999999e-05,
"loss": 2.6325,
"step": 300
},
{
"epoch": 0.64,
"learning_rate": 0.00011999999999999999,
"loss": 2.4302,
"step": 400
},
{
"epoch": 0.8,
"learning_rate": 0.00015,
"loss": 1.5708,
"step": 500
},
{
"epoch": 0.8,
"eval_cer": 0.5738695561575328,
"eval_loss": 1.0533815622329712,
"eval_runtime": 257.0727,
"eval_samples_per_second": 8.663,
"eval_steps_per_second": 1.085,
"step": 500
},
{
"epoch": 0.96,
"learning_rate": 0.00017999999999999998,
"loss": 0.9274,
"step": 600
},
{
"epoch": 1.12,
"learning_rate": 0.00020999999999999998,
"loss": 0.7045,
"step": 700
},
{
"epoch": 1.28,
"learning_rate": 0.00023999999999999998,
"loss": 0.5879,
"step": 800
},
{
"epoch": 1.44,
"learning_rate": 0.00027,
"loss": 0.5315,
"step": 900
},
{
"epoch": 1.6,
"learning_rate": 0.0003,
"loss": 0.4842,
"step": 1000
},
{
"epoch": 1.6,
"eval_cer": 0.2984314260873314,
"eval_loss": 0.4019908010959625,
"eval_runtime": 213.6605,
"eval_samples_per_second": 10.423,
"eval_steps_per_second": 1.306,
"step": 1000
},
{
"epoch": 1.76,
"learning_rate": 0.00029900990099009897,
"loss": 0.4486,
"step": 1100
},
{
"epoch": 1.92,
"learning_rate": 0.000298019801980198,
"loss": 0.4091,
"step": 1200
},
{
"epoch": 2.08,
"learning_rate": 0.000297029702970297,
"loss": 0.3663,
"step": 1300
},
{
"epoch": 2.24,
"learning_rate": 0.000296039603960396,
"loss": 0.3333,
"step": 1400
},
{
"epoch": 2.4,
"learning_rate": 0.000295049504950495,
"loss": 0.3181,
"step": 1500
},
{
"epoch": 2.4,
"eval_cer": 0.20734923223947518,
"eval_loss": 0.2830340266227722,
"eval_runtime": 213.9837,
"eval_samples_per_second": 10.407,
"eval_steps_per_second": 1.304,
"step": 1500
},
{
"epoch": 2.56,
"learning_rate": 0.000294059405940594,
"loss": 0.3238,
"step": 1600
},
{
"epoch": 2.72,
"learning_rate": 0.00029306930693069307,
"loss": 0.3005,
"step": 1700
},
{
"epoch": 2.87,
"learning_rate": 0.00029207920792079207,
"loss": 0.3013,
"step": 1800
},
{
"epoch": 3.04,
"learning_rate": 0.00029108910891089107,
"loss": 0.2795,
"step": 1900
},
{
"epoch": 3.19,
"learning_rate": 0.00029009900990099006,
"loss": 0.2421,
"step": 2000
},
{
"epoch": 3.19,
"eval_cer": 0.17599212479611415,
"eval_loss": 0.2522282004356384,
"eval_runtime": 210.0211,
"eval_samples_per_second": 10.604,
"eval_steps_per_second": 1.328,
"step": 2000
},
{
"epoch": 3.35,
"learning_rate": 0.00028910891089108906,
"loss": 0.2436,
"step": 2100
},
{
"epoch": 3.51,
"learning_rate": 0.00028811881188118806,
"loss": 0.234,
"step": 2200
},
{
"epoch": 3.67,
"learning_rate": 0.0002871287128712871,
"loss": 0.2347,
"step": 2300
},
{
"epoch": 3.83,
"learning_rate": 0.0002861386138613861,
"loss": 0.2356,
"step": 2400
},
{
"epoch": 3.99,
"learning_rate": 0.0002851485148514851,
"loss": 0.2255,
"step": 2500
},
{
"epoch": 3.99,
"eval_cer": 0.1599614862291713,
"eval_loss": 0.22431106865406036,
"eval_runtime": 203.7474,
"eval_samples_per_second": 10.93,
"eval_steps_per_second": 1.369,
"step": 2500
},
{
"epoch": 4.15,
"learning_rate": 0.00028415841584158416,
"loss": 0.1892,
"step": 2600
},
{
"epoch": 4.31,
"learning_rate": 0.00028316831683168316,
"loss": 0.1927,
"step": 2700
},
{
"epoch": 4.47,
"learning_rate": 0.00028217821782178216,
"loss": 0.1832,
"step": 2800
},
{
"epoch": 4.63,
"learning_rate": 0.00028118811881188116,
"loss": 0.1914,
"step": 2900
},
{
"epoch": 4.79,
"learning_rate": 0.00028019801980198015,
"loss": 0.1879,
"step": 3000
},
{
"epoch": 4.79,
"eval_cer": 0.14389492063720172,
"eval_loss": 0.21251684427261353,
"eval_runtime": 199.7095,
"eval_samples_per_second": 11.151,
"eval_steps_per_second": 1.397,
"step": 3000
},
{
"epoch": 4.95,
"learning_rate": 0.0002792079207920792,
"loss": 0.186,
"step": 3100
},
{
"epoch": 5.11,
"learning_rate": 0.0002782178217821782,
"loss": 0.1716,
"step": 3200
},
{
"epoch": 5.27,
"learning_rate": 0.0002772277227722772,
"loss": 0.1588,
"step": 3300
},
{
"epoch": 5.43,
"learning_rate": 0.0002762376237623762,
"loss": 0.1555,
"step": 3400
},
{
"epoch": 5.59,
"learning_rate": 0.0002752475247524752,
"loss": 0.1604,
"step": 3500
},
{
"epoch": 5.59,
"eval_cer": 0.13375631417464845,
"eval_loss": 0.2036324292421341,
"eval_runtime": 200.1074,
"eval_samples_per_second": 11.129,
"eval_steps_per_second": 1.394,
"step": 3500
},
{
"epoch": 5.75,
"learning_rate": 0.0002742574257425742,
"loss": 0.158,
"step": 3600
},
{
"epoch": 5.91,
"learning_rate": 0.00027326732673267325,
"loss": 0.1619,
"step": 3700
},
{
"epoch": 6.07,
"learning_rate": 0.00027227722772277225,
"loss": 0.1497,
"step": 3800
},
{
"epoch": 6.23,
"learning_rate": 0.00027128712871287125,
"loss": 0.1397,
"step": 3900
},
{
"epoch": 6.39,
"learning_rate": 0.0002702970297029703,
"loss": 0.1382,
"step": 4000
},
{
"epoch": 6.39,
"eval_cer": 0.127418786959927,
"eval_loss": 0.189874529838562,
"eval_runtime": 198.5164,
"eval_samples_per_second": 11.218,
"eval_steps_per_second": 1.405,
"step": 4000
},
{
"epoch": 6.55,
"learning_rate": 0.0002693069306930693,
"loss": 0.1371,
"step": 4100
},
{
"epoch": 6.71,
"learning_rate": 0.0002683168316831683,
"loss": 0.1385,
"step": 4200
},
{
"epoch": 6.87,
"learning_rate": 0.0002673267326732673,
"loss": 0.1382,
"step": 4300
},
{
"epoch": 7.03,
"learning_rate": 0.0002663366336633663,
"loss": 0.138,
"step": 4400
},
{
"epoch": 7.19,
"learning_rate": 0.00026534653465346534,
"loss": 0.1228,
"step": 4500
},
{
"epoch": 7.19,
"eval_cer": 0.12003937601942934,
"eval_loss": 0.1979004442691803,
"eval_runtime": 201.8805,
"eval_samples_per_second": 11.031,
"eval_steps_per_second": 1.382,
"step": 4500
},
{
"epoch": 7.35,
"learning_rate": 0.00026435643564356434,
"loss": 0.128,
"step": 4600
},
{
"epoch": 7.51,
"learning_rate": 0.00026336633663366334,
"loss": 0.1248,
"step": 4700
},
{
"epoch": 7.67,
"learning_rate": 0.00026237623762376234,
"loss": 0.1191,
"step": 4800
},
{
"epoch": 7.83,
"learning_rate": 0.00026138613861386134,
"loss": 0.1241,
"step": 4900
},
{
"epoch": 7.99,
"learning_rate": 0.00026039603960396033,
"loss": 0.1275,
"step": 5000
},
{
"epoch": 7.99,
"eval_cer": 0.11670534809694548,
"eval_loss": 0.18830785155296326,
"eval_runtime": 215.0184,
"eval_samples_per_second": 10.357,
"eval_steps_per_second": 1.298,
"step": 5000
},
{
"epoch": 8.15,
"learning_rate": 0.0002594059405940594,
"loss": 0.1133,
"step": 5100
},
{
"epoch": 8.31,
"learning_rate": 0.0002584158415841584,
"loss": 0.1121,
"step": 5200
},
{
"epoch": 8.47,
"learning_rate": 0.0002574257425742574,
"loss": 0.112,
"step": 5300
},
{
"epoch": 8.63,
"learning_rate": 0.00025643564356435644,
"loss": 0.108,
"step": 5400
},
{
"epoch": 8.79,
"learning_rate": 0.00025544554455445543,
"loss": 0.1093,
"step": 5500
},
{
"epoch": 8.79,
"eval_cer": 0.11560598113112645,
"eval_loss": 0.1854041963815689,
"eval_runtime": 221.0978,
"eval_samples_per_second": 10.072,
"eval_steps_per_second": 1.262,
"step": 5500
},
{
"epoch": 8.94,
"learning_rate": 0.00025445544554455443,
"loss": 0.1094,
"step": 5600
},
{
"epoch": 9.11,
"learning_rate": 0.00025346534653465343,
"loss": 0.1139,
"step": 5700
},
{
"epoch": 9.26,
"learning_rate": 0.00025247524752475243,
"loss": 0.1015,
"step": 5800
},
{
"epoch": 9.42,
"learning_rate": 0.0002514851485148515,
"loss": 0.1062,
"step": 5900
},
{
"epoch": 9.58,
"learning_rate": 0.0002504950495049505,
"loss": 0.1089,
"step": 6000
},
{
"epoch": 9.58,
"eval_cer": 0.1084421323407894,
"eval_loss": 0.1830228716135025,
"eval_runtime": 220.3658,
"eval_samples_per_second": 10.106,
"eval_steps_per_second": 1.266,
"step": 6000
},
{
"epoch": 9.74,
"learning_rate": 0.0002495148514851485,
"loss": 0.1076,
"step": 6100
},
{
"epoch": 9.9,
"learning_rate": 0.0002485247524752475,
"loss": 0.1063,
"step": 6200
},
{
"epoch": 10.06,
"learning_rate": 0.0002475346534653465,
"loss": 0.1009,
"step": 6300
},
{
"epoch": 10.22,
"learning_rate": 0.0002465445544554455,
"loss": 0.0987,
"step": 6400
},
{
"epoch": 10.38,
"learning_rate": 0.0002455643564356435,
"loss": 0.0968,
"step": 6500
},
{
"epoch": 10.38,
"eval_cer": 0.10436082229774882,
"eval_loss": 0.17644909024238586,
"eval_runtime": 220.8492,
"eval_samples_per_second": 10.084,
"eval_steps_per_second": 1.263,
"step": 6500
},
{
"epoch": 10.54,
"learning_rate": 0.0002445742574257425,
"loss": 0.0937,
"step": 6600
},
{
"epoch": 10.7,
"learning_rate": 0.00024358415841584157,
"loss": 0.0964,
"step": 6700
},
{
"epoch": 10.86,
"learning_rate": 0.00024259405940594056,
"loss": 0.0956,
"step": 6800
},
{
"epoch": 11.02,
"learning_rate": 0.0002416039603960396,
"loss": 0.0971,
"step": 6900
},
{
"epoch": 11.18,
"learning_rate": 0.0002406138613861386,
"loss": 0.0862,
"step": 7000
},
{
"epoch": 11.18,
"eval_cer": 0.10214771755610005,
"eval_loss": 0.19613920152187347,
"eval_runtime": 296.3031,
"eval_samples_per_second": 7.516,
"eval_steps_per_second": 0.942,
"step": 7000
},
{
"epoch": 11.34,
"learning_rate": 0.00023962376237623759,
"loss": 0.0901,
"step": 7100
},
{
"epoch": 11.5,
"learning_rate": 0.00023863366336633664,
"loss": 0.0957,
"step": 7200
},
{
"epoch": 11.66,
"learning_rate": 0.00023764356435643564,
"loss": 0.0929,
"step": 7300
},
{
"epoch": 11.82,
"learning_rate": 0.00023665346534653463,
"loss": 0.0918,
"step": 7400
},
{
"epoch": 11.98,
"learning_rate": 0.00023566336633663366,
"loss": 0.0933,
"step": 7500
},
{
"epoch": 11.98,
"eval_cer": 0.10178126190082704,
"eval_loss": 0.17176076769828796,
"eval_runtime": 220.1598,
"eval_samples_per_second": 10.115,
"eval_steps_per_second": 1.267,
"step": 7500
}
],
"max_steps": 31300,
"num_train_epochs": 50,
"total_flos": 6.187118202284854e+19,
"trial_name": null,
"trial_params": null
}