File size: 2,393 Bytes
916475e d682d44 88cdeb8 916475e ab417e2 916475e ab417e2 916475e cf1c091 d682d44 88cdeb8 916475e 88cdeb8 916475e |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 |
{
"best_metric": 0.14495012164115906,
"best_model_checkpoint": "./test-small-bert-with-loss-weight/checkpoint-1500",
"epoch": 1.968503937007874,
"global_step": 2000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.49,
"learning_rate": 4.1797900262467194e-05,
"loss": 0.1546,
"step": 500
},
{
"epoch": 0.49,
"eval_accuracy": 0.8429757067519668,
"eval_f1": 0.27041574613376174,
"eval_loss": 0.14738939702510834,
"eval_precision": 0.8877752868257945,
"eval_recall": 0.1594996090695856,
"eval_runtime": 8.7195,
"eval_samples_per_second": 1128.732,
"eval_steps_per_second": 4.473,
"step": 500
},
{
"epoch": 0.98,
"learning_rate": 3.3595800524934386e-05,
"loss": 0.1506,
"step": 1000
},
{
"epoch": 0.98,
"eval_accuracy": 0.8417091726463214,
"eval_f1": 0.2548480963718129,
"eval_loss": 0.14584653079509735,
"eval_precision": 0.9028258362168397,
"eval_recall": 0.14836401544767455,
"eval_runtime": 8.6401,
"eval_samples_per_second": 1139.107,
"eval_steps_per_second": 4.514,
"step": 1000
},
{
"epoch": 1.48,
"learning_rate": 2.5393700787401574e-05,
"loss": 0.1485,
"step": 1500
},
{
"epoch": 1.48,
"eval_accuracy": 0.8470173770208351,
"eval_f1": 0.30824260667305176,
"eval_loss": 0.14495012164115906,
"eval_precision": 0.8806120169756534,
"eval_recall": 0.18681735257184828,
"eval_runtime": 8.8318,
"eval_samples_per_second": 1114.387,
"eval_steps_per_second": 4.416,
"step": 1500
},
{
"epoch": 1.97,
"learning_rate": 1.7191601049868766e-05,
"loss": 0.1487,
"step": 2000
},
{
"epoch": 1.97,
"eval_accuracy": 0.8434339068038385,
"eval_f1": 0.27119803613827514,
"eval_loss": 0.14501141011714935,
"eval_precision": 0.8996128687758643,
"eval_recall": 0.15966545833629492,
"eval_runtime": 8.7797,
"eval_samples_per_second": 1120.994,
"eval_steps_per_second": 4.442,
"step": 2000
}
],
"max_steps": 3048,
"num_train_epochs": 3,
"total_flos": 621176549989632.0,
"trial_name": null,
"trial_params": null
}
|