|
{ |
|
"best_metric": 0.9063502550125122, |
|
"best_model_checkpoint": "/content/drive/My Drive/Colab Notebooks/aai520-project/checkpoints/roberta-finetuned/checkpoint-1000", |
|
"epoch": 1.9607843137254903, |
|
"eval_steps": 100, |
|
"global_step": 1000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.2, |
|
"learning_rate": 1.811764705882353e-05, |
|
"loss": 2.9129, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"eval_loss": 1.4699586629867554, |
|
"eval_runtime": 17.6815, |
|
"eval_samples_per_second": 676.131, |
|
"eval_steps_per_second": 10.576, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"learning_rate": 1.6176470588235296e-05, |
|
"loss": 1.4395, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.39, |
|
"eval_loss": 1.240740418434143, |
|
"eval_runtime": 17.6813, |
|
"eval_samples_per_second": 676.14, |
|
"eval_steps_per_second": 10.576, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.59, |
|
"learning_rate": 1.4215686274509805e-05, |
|
"loss": 1.2356, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 0.59, |
|
"eval_loss": 1.0324599742889404, |
|
"eval_runtime": 17.7184, |
|
"eval_samples_per_second": 674.723, |
|
"eval_steps_per_second": 10.554, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 0.78, |
|
"learning_rate": 1.2254901960784315e-05, |
|
"loss": 1.1284, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 0.78, |
|
"eval_loss": 0.9749970436096191, |
|
"eval_runtime": 17.7173, |
|
"eval_samples_per_second": 674.763, |
|
"eval_steps_per_second": 10.555, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 0.98, |
|
"learning_rate": 1.0294117647058823e-05, |
|
"loss": 1.0821, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.98, |
|
"eval_loss": 0.9345471858978271, |
|
"eval_runtime": 17.7101, |
|
"eval_samples_per_second": 675.038, |
|
"eval_steps_per_second": 10.559, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.18, |
|
"learning_rate": 8.333333333333334e-06, |
|
"loss": 0.9978, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 1.18, |
|
"eval_loss": 0.9892988801002502, |
|
"eval_runtime": 17.6864, |
|
"eval_samples_per_second": 675.943, |
|
"eval_steps_per_second": 10.573, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 1.37, |
|
"learning_rate": 6.372549019607843e-06, |
|
"loss": 0.9697, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 1.37, |
|
"eval_loss": 0.9299613237380981, |
|
"eval_runtime": 17.7225, |
|
"eval_samples_per_second": 674.565, |
|
"eval_steps_per_second": 10.552, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 1.57, |
|
"learning_rate": 4.411764705882353e-06, |
|
"loss": 0.9455, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 1.57, |
|
"eval_loss": 0.9351199865341187, |
|
"eval_runtime": 17.7361, |
|
"eval_samples_per_second": 674.051, |
|
"eval_steps_per_second": 10.543, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 1.76, |
|
"learning_rate": 2.450980392156863e-06, |
|
"loss": 0.9322, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 1.76, |
|
"eval_loss": 0.9450510144233704, |
|
"eval_runtime": 17.7032, |
|
"eval_samples_per_second": 675.301, |
|
"eval_steps_per_second": 10.563, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 1.96, |
|
"learning_rate": 4.901960784313725e-07, |
|
"loss": 0.9269, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 1.96, |
|
"eval_loss": 0.9063502550125122, |
|
"eval_runtime": 17.6937, |
|
"eval_samples_per_second": 675.663, |
|
"eval_steps_per_second": 10.569, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 1.96, |
|
"step": 1000, |
|
"total_flos": 6.688961805360538e+16, |
|
"train_loss": 0.0, |
|
"train_runtime": 0.5646, |
|
"train_samples_per_second": 462448.203, |
|
"train_steps_per_second": 903.281 |
|
}, |
|
{ |
|
"epoch": 1.96, |
|
"eval_loss": 0.9063528180122375, |
|
"eval_runtime": 17.3728, |
|
"eval_samples_per_second": 688.145, |
|
"eval_steps_per_second": 5.411, |
|
"step": 1000 |
|
} |
|
], |
|
"logging_steps": 100, |
|
"max_steps": 510, |
|
"num_train_epochs": 2, |
|
"save_steps": 100, |
|
"total_flos": 6.688961805360538e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|