|
{ |
|
"best_metric": 0.7772428393363953, |
|
"best_model_checkpoint": "/home2/s5431786/jb-internship/results/Salesforce-codet5-small-CodeXGLUE-CONCODE-w_special_tokens/checkpoint-5500", |
|
"epoch": 1.76, |
|
"global_step": 5500, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.16, |
|
"learning_rate": 3.160588611644274e-05, |
|
"loss": 2.7739, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.16, |
|
"eval_bleu": 0.11002405260920435, |
|
"eval_exact_match": 0.136, |
|
"eval_loss": 0.9681498408317566, |
|
"eval_rouge1": 0.5324111683230927, |
|
"eval_rouge2": 0.3516111966646144, |
|
"eval_rougeL": 0.5130793573577244, |
|
"eval_runtime": 23.6738, |
|
"eval_samples_per_second": 84.482, |
|
"eval_steps_per_second": 2.661, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"learning_rate": 6.35956493921945e-05, |
|
"loss": 0.8968, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.32, |
|
"eval_bleu": 0.11661343796568427, |
|
"eval_exact_match": 0.148, |
|
"eval_loss": 0.8933660984039307, |
|
"eval_rouge1": 0.5490713398258988, |
|
"eval_rouge2": 0.3737481223472951, |
|
"eval_rougeL": 0.5313359382235461, |
|
"eval_runtime": 21.9288, |
|
"eval_samples_per_second": 91.204, |
|
"eval_steps_per_second": 2.873, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"learning_rate": 9.558541266794626e-05, |
|
"loss": 0.8139, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.48, |
|
"eval_bleu": 0.11428222214709638, |
|
"eval_exact_match": 0.148, |
|
"eval_loss": 0.8664323687553406, |
|
"eval_rouge1": 0.5501019947483123, |
|
"eval_rouge2": 0.37606920276228095, |
|
"eval_rougeL": 0.5316473251371836, |
|
"eval_runtime": 21.9364, |
|
"eval_samples_per_second": 91.173, |
|
"eval_steps_per_second": 2.872, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"learning_rate": 9.854818607471284e-05, |
|
"loss": 0.7535, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"eval_bleu": 0.12118583002054595, |
|
"eval_exact_match": 0.152, |
|
"eval_loss": 0.8371005058288574, |
|
"eval_rouge1": 0.5554072128917051, |
|
"eval_rouge2": 0.37994480723664975, |
|
"eval_rougeL": 0.5360569772635451, |
|
"eval_runtime": 21.9828, |
|
"eval_samples_per_second": 90.98, |
|
"eval_steps_per_second": 2.866, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"learning_rate": 9.686394718226834e-05, |
|
"loss": 0.7267, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"eval_bleu": 0.1221326088002123, |
|
"eval_exact_match": 0.1555, |
|
"eval_loss": 0.8262679576873779, |
|
"eval_rouge1": 0.5599864774843732, |
|
"eval_rouge2": 0.3892847835247521, |
|
"eval_rougeL": 0.5434109433715582, |
|
"eval_runtime": 22.0553, |
|
"eval_samples_per_second": 90.681, |
|
"eval_steps_per_second": 2.856, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 0.96, |
|
"learning_rate": 9.517970828982384e-05, |
|
"loss": 0.7044, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 0.96, |
|
"eval_bleu": 0.12264834126055617, |
|
"eval_exact_match": 0.161, |
|
"eval_loss": 0.8118048310279846, |
|
"eval_rouge1": 0.5584777889931278, |
|
"eval_rouge2": 0.38793170420432566, |
|
"eval_rougeL": 0.539366409663261, |
|
"eval_runtime": 21.8691, |
|
"eval_samples_per_second": 91.453, |
|
"eval_steps_per_second": 2.881, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 1.12, |
|
"learning_rate": 9.349546939737934e-05, |
|
"loss": 0.6505, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 1.12, |
|
"eval_bleu": 0.12561336503475642, |
|
"eval_exact_match": 0.1575, |
|
"eval_loss": 0.8004248142242432, |
|
"eval_rouge1": 0.5604501817439145, |
|
"eval_rouge2": 0.39030440934575783, |
|
"eval_rougeL": 0.5425107709271633, |
|
"eval_runtime": 21.9286, |
|
"eval_samples_per_second": 91.205, |
|
"eval_steps_per_second": 2.873, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 1.28, |
|
"learning_rate": 9.181123050493482e-05, |
|
"loss": 0.6301, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 1.28, |
|
"eval_bleu": 0.12658818034969338, |
|
"eval_exact_match": 0.1605, |
|
"eval_loss": 0.7999853491783142, |
|
"eval_rouge1": 0.5627685830925565, |
|
"eval_rouge2": 0.391269622424489, |
|
"eval_rougeL": 0.5451139508088971, |
|
"eval_runtime": 22.0195, |
|
"eval_samples_per_second": 90.828, |
|
"eval_steps_per_second": 2.861, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 1.44, |
|
"learning_rate": 9.012699161249032e-05, |
|
"loss": 0.6199, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 1.44, |
|
"eval_bleu": 0.12894396386527762, |
|
"eval_exact_match": 0.163, |
|
"eval_loss": 0.7873425483703613, |
|
"eval_rouge1": 0.5653377621170572, |
|
"eval_rouge2": 0.39748707891409585, |
|
"eval_rougeL": 0.5469501947752343, |
|
"eval_runtime": 21.8948, |
|
"eval_samples_per_second": 91.346, |
|
"eval_steps_per_second": 2.877, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 1.6, |
|
"learning_rate": 8.844275272004582e-05, |
|
"loss": 0.619, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 1.6, |
|
"eval_bleu": 0.13044433567409516, |
|
"eval_exact_match": 0.159, |
|
"eval_loss": 0.7792118191719055, |
|
"eval_rouge1": 0.5697500148728435, |
|
"eval_rouge2": 0.3972375515095064, |
|
"eval_rougeL": 0.5508657148123793, |
|
"eval_runtime": 22.0783, |
|
"eval_samples_per_second": 90.587, |
|
"eval_steps_per_second": 2.853, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 1.76, |
|
"learning_rate": 8.67585138276013e-05, |
|
"loss": 0.604, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 1.76, |
|
"eval_bleu": 0.12974945121652084, |
|
"eval_exact_match": 0.164, |
|
"eval_loss": 0.7772428393363953, |
|
"eval_rouge1": 0.5689486656450822, |
|
"eval_rouge2": 0.3977032244845097, |
|
"eval_rougeL": 0.5513327295716377, |
|
"eval_runtime": 21.7891, |
|
"eval_samples_per_second": 91.789, |
|
"eval_steps_per_second": 2.891, |
|
"step": 5500 |
|
} |
|
], |
|
"max_steps": 31250, |
|
"num_train_epochs": 10, |
|
"total_flos": 1.9886134621372416e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|