|
{ |
|
"best_metric": 0.6654040404040403, |
|
"best_model_checkpoint": "twitter-roberta-base-WNUT/checkpoint-500", |
|
"epoch": 10.0, |
|
"global_step": 540, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.46, |
|
"eval_accuracy": 0.9205491641772071, |
|
"eval_f1": 0.0, |
|
"eval_loss": 0.39121243357658386, |
|
"eval_precision": 0.0, |
|
"eval_recall": 0.0, |
|
"eval_runtime": 1.5425, |
|
"eval_samples_per_second": 654.138, |
|
"eval_steps_per_second": 0.648, |
|
"step": 25 |
|
}, |
|
{ |
|
"epoch": 0.93, |
|
"eval_accuracy": 0.9209305281891565, |
|
"eval_f1": 0.004739336492890995, |
|
"eval_loss": 0.2846619784832001, |
|
"eval_precision": 0.25, |
|
"eval_recall": 0.0023923444976076554, |
|
"eval_runtime": 1.5304, |
|
"eval_samples_per_second": 659.288, |
|
"eval_steps_per_second": 0.653, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 1.39, |
|
"eval_accuracy": 0.9426047162016145, |
|
"eval_f1": 0.4239766081871345, |
|
"eval_loss": 0.2449360191822052, |
|
"eval_precision": 0.5451127819548872, |
|
"eval_recall": 0.34688995215311, |
|
"eval_runtime": 1.487, |
|
"eval_samples_per_second": 678.556, |
|
"eval_steps_per_second": 0.673, |
|
"step": 75 |
|
}, |
|
{ |
|
"epoch": 1.85, |
|
"eval_accuracy": 0.9491514650734125, |
|
"eval_f1": 0.5565455791638108, |
|
"eval_loss": 0.19464540481567383, |
|
"eval_precision": 0.651685393258427, |
|
"eval_recall": 0.48564593301435405, |
|
"eval_runtime": 1.5409, |
|
"eval_samples_per_second": 654.812, |
|
"eval_steps_per_second": 0.649, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 2.31, |
|
"eval_accuracy": 0.9581135193542236, |
|
"eval_f1": 0.621870882740448, |
|
"eval_loss": 0.1851097047328949, |
|
"eval_precision": 0.6920821114369502, |
|
"eval_recall": 0.5645933014354066, |
|
"eval_runtime": 1.5283, |
|
"eval_samples_per_second": 660.202, |
|
"eval_steps_per_second": 0.654, |
|
"step": 125 |
|
}, |
|
{ |
|
"epoch": 2.78, |
|
"eval_accuracy": 0.9594482933960465, |
|
"eval_f1": 0.6331399097356544, |
|
"eval_loss": 0.1671772003173828, |
|
"eval_precision": 0.6867132867132867, |
|
"eval_recall": 0.5873205741626795, |
|
"eval_runtime": 1.7364, |
|
"eval_samples_per_second": 581.088, |
|
"eval_steps_per_second": 0.576, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 3.24, |
|
"eval_accuracy": 0.9615457954617682, |
|
"eval_f1": 0.6276527331189711, |
|
"eval_loss": 0.16754180192947388, |
|
"eval_precision": 0.6787204450625869, |
|
"eval_recall": 0.583732057416268, |
|
"eval_runtime": 1.522, |
|
"eval_samples_per_second": 662.938, |
|
"eval_steps_per_second": 0.657, |
|
"step": 175 |
|
}, |
|
{ |
|
"epoch": 3.7, |
|
"eval_accuracy": 0.9637704188648064, |
|
"eval_f1": 0.65389369592089, |
|
"eval_loss": 0.16441918909549713, |
|
"eval_precision": 0.6764705882352942, |
|
"eval_recall": 0.6327751196172249, |
|
"eval_runtime": 1.5477, |
|
"eval_samples_per_second": 651.939, |
|
"eval_steps_per_second": 0.646, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 4.17, |
|
"eval_accuracy": 0.9640246615394394, |
|
"eval_f1": 0.673697270471464, |
|
"eval_loss": 0.1672356277704239, |
|
"eval_precision": 0.6997422680412371, |
|
"eval_recall": 0.6495215311004785, |
|
"eval_runtime": 1.5668, |
|
"eval_samples_per_second": 643.973, |
|
"eval_steps_per_second": 0.638, |
|
"step": 225 |
|
}, |
|
{ |
|
"epoch": 4.63, |
|
"eval_accuracy": 0.9648509502319964, |
|
"eval_f1": 0.6666666666666666, |
|
"eval_loss": 0.16518081724643707, |
|
"eval_precision": 0.6915167095115681, |
|
"eval_recall": 0.6435406698564593, |
|
"eval_runtime": 1.544, |
|
"eval_samples_per_second": 653.501, |
|
"eval_steps_per_second": 0.648, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 5.09, |
|
"eval_accuracy": 0.9629441301722494, |
|
"eval_f1": 0.6520618556701031, |
|
"eval_loss": 0.18820269405841827, |
|
"eval_precision": 0.7067039106145251, |
|
"eval_recall": 0.6052631578947368, |
|
"eval_runtime": 1.5459, |
|
"eval_samples_per_second": 652.688, |
|
"eval_steps_per_second": 0.647, |
|
"step": 275 |
|
}, |
|
{ |
|
"epoch": 5.56, |
|
"eval_accuracy": 0.9644695862200471, |
|
"eval_f1": 0.6717267552182163, |
|
"eval_loss": 0.17831429839134216, |
|
"eval_precision": 0.7127516778523489, |
|
"eval_recall": 0.6351674641148325, |
|
"eval_runtime": 1.5976, |
|
"eval_samples_per_second": 631.564, |
|
"eval_steps_per_second": 0.626, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 6.02, |
|
"eval_accuracy": 0.9638975402021229, |
|
"eval_f1": 0.6564885496183207, |
|
"eval_loss": 0.18128034472465515, |
|
"eval_precision": 0.7010869565217391, |
|
"eval_recall": 0.6172248803827751, |
|
"eval_runtime": 1.5524, |
|
"eval_samples_per_second": 649.966, |
|
"eval_steps_per_second": 0.644, |
|
"step": 325 |
|
}, |
|
{ |
|
"epoch": 6.48, |
|
"eval_accuracy": 0.96472382889468, |
|
"eval_f1": 0.677561282212445, |
|
"eval_loss": 0.18036700785160065, |
|
"eval_precision": 0.713907284768212, |
|
"eval_recall": 0.6447368421052632, |
|
"eval_runtime": 1.6249, |
|
"eval_samples_per_second": 620.943, |
|
"eval_steps_per_second": 0.615, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 6.94, |
|
"eval_accuracy": 0.9640882222080976, |
|
"eval_f1": 0.6709346991037132, |
|
"eval_loss": 0.19022008776664734, |
|
"eval_precision": 0.721763085399449, |
|
"eval_recall": 0.6267942583732058, |
|
"eval_runtime": 1.8093, |
|
"eval_samples_per_second": 557.663, |
|
"eval_steps_per_second": 0.553, |
|
"step": 375 |
|
}, |
|
{ |
|
"epoch": 7.41, |
|
"eval_accuracy": 0.9640882222080976, |
|
"eval_f1": 0.668777707409753, |
|
"eval_loss": 0.1882619857788086, |
|
"eval_precision": 0.7106325706594886, |
|
"eval_recall": 0.631578947368421, |
|
"eval_runtime": 1.62, |
|
"eval_samples_per_second": 622.858, |
|
"eval_steps_per_second": 0.617, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 7.87, |
|
"eval_accuracy": 0.9642789042140724, |
|
"eval_f1": 0.6683480453972257, |
|
"eval_loss": 0.18618735671043396, |
|
"eval_precision": 0.7066666666666667, |
|
"eval_recall": 0.6339712918660287, |
|
"eval_runtime": 1.5944, |
|
"eval_samples_per_second": 632.853, |
|
"eval_steps_per_second": 0.627, |
|
"step": 425 |
|
}, |
|
{ |
|
"epoch": 8.33, |
|
"eval_accuracy": 0.9638975402021229, |
|
"eval_f1": 0.6670870113493064, |
|
"eval_loss": 0.1881590634584427, |
|
"eval_precision": 0.7053333333333334, |
|
"eval_recall": 0.6327751196172249, |
|
"eval_runtime": 1.7003, |
|
"eval_samples_per_second": 593.415, |
|
"eval_steps_per_second": 0.588, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 8.8, |
|
"eval_accuracy": 0.9638339795334647, |
|
"eval_f1": 0.6658243840808591, |
|
"eval_loss": 0.19190868735313416, |
|
"eval_precision": 0.7054886211512718, |
|
"eval_recall": 0.6303827751196173, |
|
"eval_runtime": 1.543, |
|
"eval_samples_per_second": 653.928, |
|
"eval_steps_per_second": 0.648, |
|
"step": 475 |
|
}, |
|
{ |
|
"epoch": 9.26, |
|
"learning_rate": 1.4814814814814815e-06, |
|
"loss": 0.1175, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 9.26, |
|
"eval_accuracy": 0.9639611008707811, |
|
"eval_f1": 0.6654040404040403, |
|
"eval_loss": 0.19381117820739746, |
|
"eval_precision": 0.7045454545454546, |
|
"eval_recall": 0.6303827751196173, |
|
"eval_runtime": 1.541, |
|
"eval_samples_per_second": 654.789, |
|
"eval_steps_per_second": 0.649, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 9.72, |
|
"eval_accuracy": 0.9645967075573635, |
|
"eval_f1": 0.6704190118824266, |
|
"eval_loss": 0.18799594044685364, |
|
"eval_precision": 0.7024901703800787, |
|
"eval_recall": 0.6411483253588517, |
|
"eval_runtime": 1.6071, |
|
"eval_samples_per_second": 627.849, |
|
"eval_steps_per_second": 0.622, |
|
"step": 525 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"step": 540, |
|
"total_flos": 1009327449452316.0, |
|
"train_loss": 0.11085769158822519, |
|
"train_runtime": 157.5154, |
|
"train_samples_per_second": 215.471, |
|
"train_steps_per_second": 3.428 |
|
} |
|
], |
|
"max_steps": 540, |
|
"num_train_epochs": 10, |
|
"total_flos": 1009327449452316.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|