|
{ |
|
"best_metric": 0.664968152866242, |
|
"best_model_checkpoint": "twitter-roberta-base-dec2021-WNUT/checkpoint-500", |
|
"epoch": 10.0, |
|
"global_step": 540, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.46, |
|
"eval_accuracy": 0.9241085616220682, |
|
"eval_f1": 0.055077452667814115, |
|
"eval_loss": 0.28182554244995117, |
|
"eval_precision": 0.09815950920245399, |
|
"eval_recall": 0.03827751196172249, |
|
"eval_runtime": 1.4976, |
|
"eval_samples_per_second": 673.746, |
|
"eval_steps_per_second": 0.668, |
|
"step": 25 |
|
}, |
|
{ |
|
"epoch": 0.93, |
|
"eval_accuracy": 0.9480073730375643, |
|
"eval_f1": 0.5254470426409903, |
|
"eval_loss": 0.21579432487487793, |
|
"eval_precision": 0.6181229773462783, |
|
"eval_recall": 0.4569377990430622, |
|
"eval_runtime": 1.5062, |
|
"eval_samples_per_second": 669.914, |
|
"eval_steps_per_second": 0.664, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 1.39, |
|
"eval_accuracy": 0.955507531939236, |
|
"eval_f1": 0.5940199335548173, |
|
"eval_loss": 0.19296418130397797, |
|
"eval_precision": 0.6681614349775785, |
|
"eval_recall": 0.534688995215311, |
|
"eval_runtime": 1.4928, |
|
"eval_samples_per_second": 675.914, |
|
"eval_steps_per_second": 0.67, |
|
"step": 75 |
|
}, |
|
{ |
|
"epoch": 1.85, |
|
"eval_accuracy": 0.9593847327273883, |
|
"eval_f1": 0.6078557630392788, |
|
"eval_loss": 0.17283694446086884, |
|
"eval_precision": 0.6582984658298466, |
|
"eval_recall": 0.5645933014354066, |
|
"eval_runtime": 1.4931, |
|
"eval_samples_per_second": 675.766, |
|
"eval_steps_per_second": 0.67, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 2.31, |
|
"eval_accuracy": 0.9619271594737177, |
|
"eval_f1": 0.6314398943196828, |
|
"eval_loss": 0.17873725295066833, |
|
"eval_precision": 0.7050147492625368, |
|
"eval_recall": 0.5717703349282297, |
|
"eval_runtime": 1.5276, |
|
"eval_samples_per_second": 660.504, |
|
"eval_steps_per_second": 0.655, |
|
"step": 125 |
|
}, |
|
{ |
|
"epoch": 2.78, |
|
"eval_accuracy": 0.958749126040806, |
|
"eval_f1": 0.5993174061433448, |
|
"eval_loss": 0.20510223507881165, |
|
"eval_precision": 0.6979332273449921, |
|
"eval_recall": 0.5251196172248804, |
|
"eval_runtime": 1.5126, |
|
"eval_samples_per_second": 667.078, |
|
"eval_steps_per_second": 0.661, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 3.24, |
|
"eval_accuracy": 0.9620542808110342, |
|
"eval_f1": 0.6500981033355134, |
|
"eval_loss": 0.17545387148857117, |
|
"eval_precision": 0.7171717171717171, |
|
"eval_recall": 0.5944976076555024, |
|
"eval_runtime": 1.5007, |
|
"eval_samples_per_second": 672.361, |
|
"eval_steps_per_second": 0.666, |
|
"step": 175 |
|
}, |
|
{ |
|
"epoch": 3.7, |
|
"eval_accuracy": 0.9644695862200471, |
|
"eval_f1": 0.6608150470219436, |
|
"eval_loss": 0.17198117077350616, |
|
"eval_precision": 0.69433465085639, |
|
"eval_recall": 0.6303827751196173, |
|
"eval_runtime": 1.5311, |
|
"eval_samples_per_second": 659.017, |
|
"eval_steps_per_second": 0.653, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 4.17, |
|
"eval_accuracy": 0.9645967075573635, |
|
"eval_f1": 0.6730401529636711, |
|
"eval_loss": 0.18734638392925262, |
|
"eval_precision": 0.7203274215552524, |
|
"eval_recall": 0.631578947368421, |
|
"eval_runtime": 1.812, |
|
"eval_samples_per_second": 556.831, |
|
"eval_steps_per_second": 0.552, |
|
"step": 225 |
|
}, |
|
{ |
|
"epoch": 4.63, |
|
"eval_accuracy": 0.9638339795334647, |
|
"eval_f1": 0.6544535691724572, |
|
"eval_loss": 0.17807357013225555, |
|
"eval_precision": 0.6934404283801874, |
|
"eval_recall": 0.6196172248803827, |
|
"eval_runtime": 1.5526, |
|
"eval_samples_per_second": 649.864, |
|
"eval_steps_per_second": 0.644, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 5.09, |
|
"eval_accuracy": 0.9631348121782242, |
|
"eval_f1": 0.6577437858508605, |
|
"eval_loss": 0.19528818130493164, |
|
"eval_precision": 0.703956343792633, |
|
"eval_recall": 0.6172248803827751, |
|
"eval_runtime": 1.5217, |
|
"eval_samples_per_second": 663.053, |
|
"eval_steps_per_second": 0.657, |
|
"step": 275 |
|
}, |
|
{ |
|
"epoch": 5.56, |
|
"eval_accuracy": 0.964215343545414, |
|
"eval_f1": 0.6738991703892788, |
|
"eval_loss": 0.1952667236328125, |
|
"eval_precision": 0.7222982216142271, |
|
"eval_recall": 0.631578947368421, |
|
"eval_runtime": 1.5375, |
|
"eval_samples_per_second": 656.259, |
|
"eval_steps_per_second": 0.65, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 6.02, |
|
"eval_accuracy": 0.9647873895633382, |
|
"eval_f1": 0.6728855721393034, |
|
"eval_loss": 0.18392899632453918, |
|
"eval_precision": 0.7007772020725389, |
|
"eval_recall": 0.6471291866028708, |
|
"eval_runtime": 1.541, |
|
"eval_samples_per_second": 654.776, |
|
"eval_steps_per_second": 0.649, |
|
"step": 325 |
|
}, |
|
{ |
|
"epoch": 6.48, |
|
"eval_accuracy": 0.9650416322379711, |
|
"eval_f1": 0.6771752837326608, |
|
"eval_loss": 0.19951151311397552, |
|
"eval_precision": 0.716, |
|
"eval_recall": 0.6423444976076556, |
|
"eval_runtime": 1.5364, |
|
"eval_samples_per_second": 656.733, |
|
"eval_steps_per_second": 0.651, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 6.94, |
|
"eval_accuracy": 0.9639611008707811, |
|
"eval_f1": 0.6675274370561652, |
|
"eval_loss": 0.20560267567634583, |
|
"eval_precision": 0.7251051893408135, |
|
"eval_recall": 0.618421052631579, |
|
"eval_runtime": 1.5238, |
|
"eval_samples_per_second": 662.157, |
|
"eval_steps_per_second": 0.656, |
|
"step": 375 |
|
}, |
|
{ |
|
"epoch": 7.41, |
|
"eval_accuracy": 0.9639611008707811, |
|
"eval_f1": 0.6615776081424937, |
|
"eval_loss": 0.20440098643302917, |
|
"eval_precision": 0.7065217391304348, |
|
"eval_recall": 0.6220095693779905, |
|
"eval_runtime": 1.529, |
|
"eval_samples_per_second": 659.91, |
|
"eval_steps_per_second": 0.654, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 7.87, |
|
"eval_accuracy": 0.9650416322379711, |
|
"eval_f1": 0.6776440785307156, |
|
"eval_loss": 0.20423652231693268, |
|
"eval_precision": 0.7200538358008075, |
|
"eval_recall": 0.6399521531100478, |
|
"eval_runtime": 1.5395, |
|
"eval_samples_per_second": 655.429, |
|
"eval_steps_per_second": 0.65, |
|
"step": 425 |
|
}, |
|
{ |
|
"epoch": 8.33, |
|
"eval_accuracy": 0.9637704188648064, |
|
"eval_f1": 0.6722472633612363, |
|
"eval_loss": 0.22472669184207916, |
|
"eval_precision": 0.7280334728033473, |
|
"eval_recall": 0.6244019138755981, |
|
"eval_runtime": 1.5443, |
|
"eval_samples_per_second": 653.377, |
|
"eval_steps_per_second": 0.648, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 8.8, |
|
"eval_accuracy": 0.9648509502319964, |
|
"eval_f1": 0.6741713570981863, |
|
"eval_loss": 0.20600706338882446, |
|
"eval_precision": 0.7064220183486238, |
|
"eval_recall": 0.6447368421052632, |
|
"eval_runtime": 1.5361, |
|
"eval_samples_per_second": 656.868, |
|
"eval_steps_per_second": 0.651, |
|
"step": 475 |
|
}, |
|
{ |
|
"epoch": 9.26, |
|
"learning_rate": 3.7037037037037037e-06, |
|
"loss": 0.0675, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 9.26, |
|
"eval_accuracy": 0.9642789042140724, |
|
"eval_f1": 0.664968152866242, |
|
"eval_loss": 0.21516220271587372, |
|
"eval_precision": 0.7111716621253406, |
|
"eval_recall": 0.6244019138755981, |
|
"eval_runtime": 1.7855, |
|
"eval_samples_per_second": 565.098, |
|
"eval_steps_per_second": 0.56, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 9.72, |
|
"eval_accuracy": 0.9649780715693129, |
|
"eval_f1": 0.6770573566084789, |
|
"eval_loss": 0.20861834287643433, |
|
"eval_precision": 0.70703125, |
|
"eval_recall": 0.6495215311004785, |
|
"eval_runtime": 1.5457, |
|
"eval_samples_per_second": 652.767, |
|
"eval_steps_per_second": 0.647, |
|
"step": 525 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"step": 540, |
|
"total_flos": 1009327449452316.0, |
|
"train_loss": 0.06299664935580006, |
|
"train_runtime": 158.2675, |
|
"train_samples_per_second": 214.447, |
|
"train_steps_per_second": 3.412 |
|
} |
|
], |
|
"max_steps": 540, |
|
"num_train_epochs": 10, |
|
"total_flos": 1009327449452316.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|