wav2vec2-large-xlsr-fleurs / trainer_state.json
sanchit-gandhi's picture
End of training
34b26c6
{
"best_metric": 0.016,
"best_model_checkpoint": "wav2vec2-large-xlsr-fleurs/checkpoint-100",
"epoch": 4.032,
"global_step": 250,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.16,
"learning_rate": 2e-05,
"loss": 4.6232,
"step": 10
},
{
"epoch": 0.32,
"learning_rate": 4e-05,
"loss": 4.6236,
"step": 20
},
{
"epoch": 0.48,
"learning_rate": 6e-05,
"loss": 4.625,
"step": 30
},
{
"epoch": 0.64,
"learning_rate": 8e-05,
"loss": 4.6225,
"step": 40
},
{
"epoch": 0.8,
"learning_rate": 0.0001,
"loss": 4.6254,
"step": 50
},
{
"epoch": 0.8,
"eval_accuracy": 0.015,
"eval_loss": 4.617953300476074,
"eval_runtime": 244.9205,
"eval_samples_per_second": 4.083,
"eval_steps_per_second": 0.51,
"step": 50
},
{
"epoch": 0.96,
"learning_rate": 0.00012,
"loss": 4.624,
"step": 60
},
{
"epoch": 1.13,
"learning_rate": 0.00014000000000000001,
"loss": 4.8421,
"step": 70
},
{
"epoch": 1.29,
"learning_rate": 0.00016,
"loss": 4.6052,
"step": 80
},
{
"epoch": 1.45,
"learning_rate": 0.00017999999999999998,
"loss": 4.6233,
"step": 90
},
{
"epoch": 1.61,
"learning_rate": 0.0002,
"loss": 4.6383,
"step": 100
},
{
"epoch": 1.61,
"eval_accuracy": 0.016,
"eval_loss": 4.607293128967285,
"eval_runtime": 252.2987,
"eval_samples_per_second": 3.964,
"eval_steps_per_second": 0.495,
"step": 100
},
{
"epoch": 1.77,
"learning_rate": 0.000218,
"loss": 4.6117,
"step": 110
},
{
"epoch": 1.93,
"learning_rate": 0.00023799999999999998,
"loss": 4.5956,
"step": 120
},
{
"epoch": 2.1,
"learning_rate": 0.00025800000000000004,
"loss": 4.8238,
"step": 130
},
{
"epoch": 2.26,
"learning_rate": 0.00027600000000000004,
"loss": 4.5525,
"step": 140
},
{
"epoch": 2.42,
"learning_rate": 0.000294,
"loss": 4.6262,
"step": 150
},
{
"epoch": 2.42,
"eval_accuracy": 0.015,
"eval_loss": 4.576992034912109,
"eval_runtime": 249.2197,
"eval_samples_per_second": 4.013,
"eval_steps_per_second": 0.502,
"step": 150
},
{
"epoch": 2.58,
"learning_rate": 0.000314,
"loss": 4.5967,
"step": 160
},
{
"epoch": 2.74,
"learning_rate": 0.00033400000000000004,
"loss": 4.5978,
"step": 170
},
{
"epoch": 2.9,
"learning_rate": 0.000354,
"loss": 4.6076,
"step": 180
},
{
"epoch": 3.06,
"learning_rate": 0.000374,
"loss": 4.8654,
"step": 190
},
{
"epoch": 3.22,
"learning_rate": 0.00039400000000000004,
"loss": 4.5614,
"step": 200
},
{
"epoch": 3.22,
"eval_accuracy": 0.015,
"eval_loss": 4.575872898101807,
"eval_runtime": 249.962,
"eval_samples_per_second": 4.001,
"eval_steps_per_second": 0.5,
"step": 200
},
{
"epoch": 3.38,
"learning_rate": 0.000414,
"loss": 4.5997,
"step": 210
},
{
"epoch": 3.54,
"learning_rate": 0.00043400000000000003,
"loss": 4.5909,
"step": 220
},
{
"epoch": 3.7,
"learning_rate": 0.00045400000000000003,
"loss": 4.6141,
"step": 230
},
{
"epoch": 3.86,
"learning_rate": 0.000474,
"loss": 4.6173,
"step": 240
},
{
"epoch": 4.03,
"learning_rate": 0.000494,
"loss": 4.8119,
"step": 250
},
{
"epoch": 4.03,
"eval_accuracy": 0.014,
"eval_loss": 4.567824363708496,
"eval_runtime": 249.2501,
"eval_samples_per_second": 4.012,
"eval_steps_per_second": 0.502,
"step": 250
},
{
"epoch": 4.03,
"step": 250,
"total_flos": 1.577948839059241e+18,
"train_loss": 4.6450146484375,
"train_runtime": 3071.4642,
"train_samples_per_second": 1.302,
"train_steps_per_second": 0.081
}
],
"max_steps": 250,
"num_train_epochs": 5,
"total_flos": 1.577948839059241e+18,
"trial_name": null,
"trial_params": null
}