|
{ |
|
"best_metric": 0.9612490594431903, |
|
"best_model_checkpoint": "/content/drive/MyDrive/SODUCO/article_das_2022/44-camembert_finetuned_pero/checkpoint-2000", |
|
"epoch": 5.319148936170213, |
|
"global_step": 2000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.27, |
|
"eval_accuracy": 0.9608945527236382, |
|
"eval_f1": 0.9189897100093545, |
|
"eval_loss": 0.24732524156570435, |
|
"eval_precision": 0.912332838038633, |
|
"eval_recall": 0.9257444402563136, |
|
"eval_runtime": 2.7834, |
|
"eval_samples_per_second": 239.997, |
|
"eval_steps_per_second": 15.09, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.53, |
|
"eval_accuracy": 0.9631434282858571, |
|
"eval_f1": 0.9296359177513677, |
|
"eval_loss": 0.17169421911239624, |
|
"eval_precision": 0.9305135951661632, |
|
"eval_recall": 0.9287598944591029, |
|
"eval_runtime": 2.6347, |
|
"eval_samples_per_second": 253.541, |
|
"eval_steps_per_second": 15.941, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"eval_accuracy": 0.9705147426286856, |
|
"eval_f1": 0.9395872420262664, |
|
"eval_loss": 0.13204523921012878, |
|
"eval_precision": 0.9353754202465446, |
|
"eval_recall": 0.9438371654730494, |
|
"eval_runtime": 2.6, |
|
"eval_samples_per_second": 256.926, |
|
"eval_steps_per_second": 16.154, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 1.06, |
|
"eval_accuracy": 0.9681409295352323, |
|
"eval_f1": 0.9378998870907039, |
|
"eval_loss": 0.1420740932226181, |
|
"eval_precision": 0.936490041337843, |
|
"eval_recall": 0.9393139841688655, |
|
"eval_runtime": 2.565, |
|
"eval_samples_per_second": 260.431, |
|
"eval_steps_per_second": 16.374, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 1.33, |
|
"learning_rate": 9e-05, |
|
"loss": 0.2455, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.33, |
|
"eval_accuracy": 0.9758870564717641, |
|
"eval_f1": 0.9526493799323562, |
|
"eval_loss": 0.1057828888297081, |
|
"eval_precision": 0.9497939303109779, |
|
"eval_recall": 0.9555220505088579, |
|
"eval_runtime": 2.6085, |
|
"eval_samples_per_second": 256.084, |
|
"eval_steps_per_second": 16.101, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.6, |
|
"eval_accuracy": 0.9731384307846077, |
|
"eval_f1": 0.9493694711086017, |
|
"eval_loss": 0.10737968236207962, |
|
"eval_precision": 0.9481203007518797, |
|
"eval_recall": 0.9506219374293253, |
|
"eval_runtime": 2.5863, |
|
"eval_samples_per_second": 258.283, |
|
"eval_steps_per_second": 16.239, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 1.86, |
|
"eval_accuracy": 0.972888555722139, |
|
"eval_f1": 0.9527573875399962, |
|
"eval_loss": 0.11101129651069641, |
|
"eval_precision": 0.9515037593984963, |
|
"eval_recall": 0.9540143234074633, |
|
"eval_runtime": 2.5978, |
|
"eval_samples_per_second": 257.138, |
|
"eval_steps_per_second": 16.167, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 2.13, |
|
"eval_accuracy": 0.9753873063468266, |
|
"eval_f1": 0.9515583927900865, |
|
"eval_loss": 0.09300221502780914, |
|
"eval_precision": 0.9479985035540591, |
|
"eval_recall": 0.9551451187335093, |
|
"eval_runtime": 2.6079, |
|
"eval_samples_per_second": 256.141, |
|
"eval_steps_per_second": 16.105, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 2.39, |
|
"eval_accuracy": 0.9762618690654673, |
|
"eval_f1": 0.9552914544425579, |
|
"eval_loss": 0.10092608630657196, |
|
"eval_precision": 0.9561933534743202, |
|
"eval_recall": 0.9543912551828119, |
|
"eval_runtime": 2.604, |
|
"eval_samples_per_second": 256.532, |
|
"eval_steps_per_second": 16.129, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 2.66, |
|
"learning_rate": 8e-05, |
|
"loss": 0.0868, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.66, |
|
"eval_accuracy": 0.9766366816591704, |
|
"eval_f1": 0.9565217391304348, |
|
"eval_loss": 0.09077496081590652, |
|
"eval_precision": 0.9552631578947368, |
|
"eval_recall": 0.9577836411609498, |
|
"eval_runtime": 2.6166, |
|
"eval_samples_per_second": 255.294, |
|
"eval_steps_per_second": 16.051, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 2.93, |
|
"eval_accuracy": 0.9761369315342329, |
|
"eval_f1": 0.9558021440662028, |
|
"eval_loss": 0.09924957156181335, |
|
"eval_precision": 0.9538288288288288, |
|
"eval_recall": 0.9577836411609498, |
|
"eval_runtime": 2.6844, |
|
"eval_samples_per_second": 248.843, |
|
"eval_steps_per_second": 15.646, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 3.19, |
|
"eval_accuracy": 0.9767616191904048, |
|
"eval_f1": 0.9542975362046267, |
|
"eval_loss": 0.08850151300430298, |
|
"eval_precision": 0.9523273273273273, |
|
"eval_recall": 0.9562759140595553, |
|
"eval_runtime": 2.8038, |
|
"eval_samples_per_second": 238.25, |
|
"eval_steps_per_second": 14.98, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 3.46, |
|
"eval_accuracy": 0.9770114942528736, |
|
"eval_f1": 0.9576191373139952, |
|
"eval_loss": 0.09413458406925201, |
|
"eval_precision": 0.9570783132530121, |
|
"eval_recall": 0.9581605729362985, |
|
"eval_runtime": 2.631, |
|
"eval_samples_per_second": 253.897, |
|
"eval_steps_per_second": 15.964, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 3.72, |
|
"eval_accuracy": 0.9758870564717641, |
|
"eval_f1": 0.9575871819038644, |
|
"eval_loss": 0.09968729317188263, |
|
"eval_precision": 0.9577677224736049, |
|
"eval_recall": 0.9574067093856012, |
|
"eval_runtime": 2.6616, |
|
"eval_samples_per_second": 250.976, |
|
"eval_steps_per_second": 15.78, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 3.99, |
|
"learning_rate": 7e-05, |
|
"loss": 0.056, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 3.99, |
|
"eval_accuracy": 0.974887556221889, |
|
"eval_f1": 0.9591106086301111, |
|
"eval_loss": 0.10856281220912933, |
|
"eval_precision": 0.9589299171062547, |
|
"eval_recall": 0.9592913682623445, |
|
"eval_runtime": 2.616, |
|
"eval_samples_per_second": 255.356, |
|
"eval_steps_per_second": 16.055, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 4.26, |
|
"eval_accuracy": 0.9762618690654673, |
|
"eval_f1": 0.9577836411609498, |
|
"eval_loss": 0.10103093087673187, |
|
"eval_precision": 0.9577836411609498, |
|
"eval_recall": 0.9577836411609498, |
|
"eval_runtime": 2.6677, |
|
"eval_samples_per_second": 250.406, |
|
"eval_steps_per_second": 15.744, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 4.52, |
|
"eval_accuracy": 0.9783858070964517, |
|
"eval_f1": 0.9612198795180723, |
|
"eval_loss": 0.09965386986732483, |
|
"eval_precision": 0.9601353892440767, |
|
"eval_recall": 0.9623068224651338, |
|
"eval_runtime": 2.9477, |
|
"eval_samples_per_second": 226.62, |
|
"eval_steps_per_second": 14.249, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 4.79, |
|
"eval_accuracy": 0.975512243878061, |
|
"eval_f1": 0.9551957831325302, |
|
"eval_loss": 0.10638727992773056, |
|
"eval_precision": 0.9541180895073336, |
|
"eval_recall": 0.9562759140595553, |
|
"eval_runtime": 2.6219, |
|
"eval_samples_per_second": 254.779, |
|
"eval_steps_per_second": 16.019, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 5.05, |
|
"eval_accuracy": 0.9757621189405298, |
|
"eval_f1": 0.9559984956750659, |
|
"eval_loss": 0.09631699323654175, |
|
"eval_precision": 0.9538461538461539, |
|
"eval_recall": 0.9581605729362985, |
|
"eval_runtime": 2.6401, |
|
"eval_samples_per_second": 253.021, |
|
"eval_steps_per_second": 15.908, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 5.32, |
|
"learning_rate": 6e-05, |
|
"loss": 0.04, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 5.32, |
|
"eval_accuracy": 0.9777611194402799, |
|
"eval_f1": 0.9612490594431903, |
|
"eval_loss": 0.09422445297241211, |
|
"eval_precision": 0.9594442358242583, |
|
"eval_recall": 0.9630606860158312, |
|
"eval_runtime": 2.6383, |
|
"eval_samples_per_second": 253.191, |
|
"eval_steps_per_second": 15.919, |
|
"step": 2000 |
|
} |
|
], |
|
"max_steps": 5000, |
|
"num_train_epochs": 14, |
|
"total_flos": 790348180152456.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|