|
{ |
|
"best_metric": 0.8968406938741306, |
|
"best_model_checkpoint": "hmBERT-CoNLL-cp2/checkpoint-500", |
|
"epoch": 2.0, |
|
"global_step": 878, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.06, |
|
"eval_accuracy": 0.9005295743935205, |
|
"eval_f1": 0.36743180306054557, |
|
"eval_loss": 0.4116312265396118, |
|
"eval_precision": 0.36320289378493914, |
|
"eval_recall": 0.3717603500504881, |
|
"eval_runtime": 21.4683, |
|
"eval_samples_per_second": 151.386, |
|
"eval_steps_per_second": 4.751, |
|
"step": 25 |
|
}, |
|
{ |
|
"epoch": 0.11, |
|
"eval_accuracy": 0.9458549121918929, |
|
"eval_f1": 0.6632702571567201, |
|
"eval_loss": 0.22468078136444092, |
|
"eval_precision": 0.638387297633873, |
|
"eval_recall": 0.6901716593739482, |
|
"eval_runtime": 20.8937, |
|
"eval_samples_per_second": 155.549, |
|
"eval_steps_per_second": 4.882, |
|
"step": 50 |
|
}, |
|
{ |
|
"epoch": 0.17, |
|
"eval_accuracy": 0.9579845021611308, |
|
"eval_f1": 0.746131050378663, |
|
"eval_loss": 0.16239947080612183, |
|
"eval_precision": 0.7302610377054464, |
|
"eval_recall": 0.7627061595422416, |
|
"eval_runtime": 21.6024, |
|
"eval_samples_per_second": 150.446, |
|
"eval_steps_per_second": 4.722, |
|
"step": 75 |
|
}, |
|
{ |
|
"epoch": 0.23, |
|
"eval_accuracy": 0.9588022273275962, |
|
"eval_f1": 0.7508835374373305, |
|
"eval_loss": 0.15414278209209442, |
|
"eval_precision": 0.7338152610441767, |
|
"eval_recall": 0.7687647256815887, |
|
"eval_runtime": 21.4049, |
|
"eval_samples_per_second": 151.835, |
|
"eval_steps_per_second": 4.765, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 0.28, |
|
"eval_accuracy": 0.9642537284373661, |
|
"eval_f1": 0.7844736198320149, |
|
"eval_loss": 0.13490867614746094, |
|
"eval_precision": 0.7609555450087011, |
|
"eval_recall": 0.8094917536183104, |
|
"eval_runtime": 21.4103, |
|
"eval_samples_per_second": 151.796, |
|
"eval_steps_per_second": 4.764, |
|
"step": 125 |
|
}, |
|
{ |
|
"epoch": 0.34, |
|
"eval_accuracy": 0.9693547759043651, |
|
"eval_f1": 0.8115174582161179, |
|
"eval_loss": 0.12301833927631378, |
|
"eval_precision": 0.7981770833333334, |
|
"eval_recall": 0.8253113429821609, |
|
"eval_runtime": 21.3799, |
|
"eval_samples_per_second": 152.012, |
|
"eval_steps_per_second": 4.771, |
|
"step": 150 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"eval_accuracy": 0.97272302480433, |
|
"eval_f1": 0.8234421364985163, |
|
"eval_loss": 0.0997077226638794, |
|
"eval_precision": 0.8069466882067852, |
|
"eval_recall": 0.8406260518343992, |
|
"eval_runtime": 21.0809, |
|
"eval_samples_per_second": 154.168, |
|
"eval_steps_per_second": 4.839, |
|
"step": 175 |
|
}, |
|
{ |
|
"epoch": 0.46, |
|
"eval_accuracy": 0.9731902963280246, |
|
"eval_f1": 0.8308945793149318, |
|
"eval_loss": 0.10443305224180222, |
|
"eval_precision": 0.8210647387446599, |
|
"eval_recall": 0.8409626388421407, |
|
"eval_runtime": 21.7924, |
|
"eval_samples_per_second": 149.135, |
|
"eval_steps_per_second": 4.681, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.51, |
|
"eval_accuracy": 0.9759939254701919, |
|
"eval_f1": 0.8507239141288069, |
|
"eval_loss": 0.08712451159954071, |
|
"eval_precision": 0.8413429888084266, |
|
"eval_recall": 0.860316391787277, |
|
"eval_runtime": 21.6266, |
|
"eval_samples_per_second": 150.278, |
|
"eval_steps_per_second": 4.716, |
|
"step": 225 |
|
}, |
|
{ |
|
"epoch": 0.57, |
|
"eval_accuracy": 0.9732876445621277, |
|
"eval_f1": 0.8375655648988427, |
|
"eval_loss": 0.10657607018947601, |
|
"eval_precision": 0.8288021090789257, |
|
"eval_recall": 0.8465163244698755, |
|
"eval_runtime": 21.4498, |
|
"eval_samples_per_second": 151.517, |
|
"eval_steps_per_second": 4.755, |
|
"step": 250 |
|
}, |
|
{ |
|
"epoch": 0.63, |
|
"eval_accuracy": 0.9765780148748102, |
|
"eval_f1": 0.8623576691225721, |
|
"eval_loss": 0.08719414472579956, |
|
"eval_precision": 0.8580473175608131, |
|
"eval_recall": 0.8667115449343655, |
|
"eval_runtime": 21.04, |
|
"eval_samples_per_second": 154.468, |
|
"eval_steps_per_second": 4.848, |
|
"step": 275 |
|
}, |
|
{ |
|
"epoch": 0.68, |
|
"eval_accuracy": 0.9773178614539932, |
|
"eval_f1": 0.8613053613053614, |
|
"eval_loss": 0.08342944085597992, |
|
"eval_precision": 0.8522240527182866, |
|
"eval_recall": 0.8705822955233928, |
|
"eval_runtime": 20.9406, |
|
"eval_samples_per_second": 155.201, |
|
"eval_steps_per_second": 4.871, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"eval_accuracy": 0.9782718741482029, |
|
"eval_f1": 0.868680182043856, |
|
"eval_loss": 0.08315661549568176, |
|
"eval_precision": 0.8544685007325411, |
|
"eval_recall": 0.8833726018175698, |
|
"eval_runtime": 21.3907, |
|
"eval_samples_per_second": 151.935, |
|
"eval_steps_per_second": 4.768, |
|
"step": 325 |
|
}, |
|
{ |
|
"epoch": 0.8, |
|
"eval_accuracy": 0.9787002063782563, |
|
"eval_f1": 0.8685364441135103, |
|
"eval_loss": 0.07756651937961578, |
|
"eval_precision": 0.8541903986981285, |
|
"eval_recall": 0.8833726018175698, |
|
"eval_runtime": 21.9914, |
|
"eval_samples_per_second": 147.785, |
|
"eval_steps_per_second": 4.638, |
|
"step": 350 |
|
}, |
|
{ |
|
"epoch": 0.85, |
|
"eval_accuracy": 0.98010202094934, |
|
"eval_f1": 0.8760357971494862, |
|
"eval_loss": 0.07601791620254517, |
|
"eval_precision": 0.8628795298726738, |
|
"eval_recall": 0.8895994614607876, |
|
"eval_runtime": 21.6439, |
|
"eval_samples_per_second": 150.158, |
|
"eval_steps_per_second": 4.713, |
|
"step": 375 |
|
}, |
|
{ |
|
"epoch": 0.91, |
|
"eval_accuracy": 0.9823994392741716, |
|
"eval_f1": 0.8887781377190795, |
|
"eval_loss": 0.06729913502931595, |
|
"eval_precision": 0.8774807282269969, |
|
"eval_recall": 0.9003702457085156, |
|
"eval_runtime": 20.8932, |
|
"eval_samples_per_second": 155.553, |
|
"eval_steps_per_second": 4.882, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 0.97, |
|
"eval_accuracy": 0.9816595926949885, |
|
"eval_f1": 0.8882013546283134, |
|
"eval_loss": 0.06811415404081345, |
|
"eval_precision": 0.8826657802891806, |
|
"eval_recall": 0.8938067990575563, |
|
"eval_runtime": 21.516, |
|
"eval_samples_per_second": 151.051, |
|
"eval_steps_per_second": 4.741, |
|
"step": 425 |
|
}, |
|
{ |
|
"epoch": 1.03, |
|
"eval_accuracy": 0.9824189089209922, |
|
"eval_f1": 0.8896695943120033, |
|
"eval_loss": 0.06585536897182465, |
|
"eval_precision": 0.8844170962913687, |
|
"eval_recall": 0.8949848535846516, |
|
"eval_runtime": 21.1661, |
|
"eval_samples_per_second": 153.547, |
|
"eval_steps_per_second": 4.819, |
|
"step": 450 |
|
}, |
|
{ |
|
"epoch": 1.08, |
|
"eval_accuracy": 0.9831587555001752, |
|
"eval_f1": 0.8923128175231116, |
|
"eval_loss": 0.06903570890426636, |
|
"eval_precision": 0.8832646331409728, |
|
"eval_recall": 0.9015483002356109, |
|
"eval_runtime": 21.4553, |
|
"eval_samples_per_second": 151.478, |
|
"eval_steps_per_second": 4.754, |
|
"step": 475 |
|
}, |
|
{ |
|
"epoch": 1.14, |
|
"learning_rate": 2.152619589977221e-05, |
|
"loss": 0.1399, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.14, |
|
"eval_accuracy": 0.983217164440637, |
|
"eval_f1": 0.8968406938741306, |
|
"eval_loss": 0.0666249617934227, |
|
"eval_precision": 0.8931730929727926, |
|
"eval_recall": 0.9005385392123864, |
|
"eval_runtime": 21.9318, |
|
"eval_samples_per_second": 148.187, |
|
"eval_steps_per_second": 4.651, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 1.2, |
|
"eval_accuracy": 0.982477317861454, |
|
"eval_f1": 0.8943538268506901, |
|
"eval_loss": 0.06665532290935516, |
|
"eval_precision": 0.8890736737069682, |
|
"eval_recall": 0.8996970716930327, |
|
"eval_runtime": 21.7087, |
|
"eval_samples_per_second": 149.71, |
|
"eval_steps_per_second": 4.699, |
|
"step": 525 |
|
}, |
|
{ |
|
"epoch": 1.25, |
|
"eval_accuracy": 0.9820100463377595, |
|
"eval_f1": 0.8851177106729889, |
|
"eval_loss": 0.0698634684085846, |
|
"eval_precision": 0.8751439381477216, |
|
"eval_recall": 0.8953214405923932, |
|
"eval_runtime": 21.8836, |
|
"eval_samples_per_second": 148.513, |
|
"eval_steps_per_second": 4.661, |
|
"step": 550 |
|
}, |
|
{ |
|
"epoch": 1.31, |
|
"eval_accuracy": 0.984015419960282, |
|
"eval_f1": 0.900702106318957, |
|
"eval_loss": 0.06173388287425041, |
|
"eval_precision": 0.8947193623380937, |
|
"eval_recall": 0.9067653988556041, |
|
"eval_runtime": 21.5086, |
|
"eval_samples_per_second": 151.102, |
|
"eval_steps_per_second": 4.742, |
|
"step": 575 |
|
}, |
|
{ |
|
"epoch": 1.37, |
|
"eval_accuracy": 0.9840543592539231, |
|
"eval_f1": 0.9028686462003019, |
|
"eval_loss": 0.06334252655506134, |
|
"eval_precision": 0.9, |
|
"eval_recall": 0.9057556378323797, |
|
"eval_runtime": 21.1745, |
|
"eval_samples_per_second": 153.487, |
|
"eval_steps_per_second": 4.817, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 1.42, |
|
"eval_accuracy": 0.9843269343094116, |
|
"eval_f1": 0.9040387182910546, |
|
"eval_loss": 0.06390959024429321, |
|
"eval_precision": 0.8965574313141343, |
|
"eval_recall": 0.9116459104678559, |
|
"eval_runtime": 21.7996, |
|
"eval_samples_per_second": 149.086, |
|
"eval_steps_per_second": 4.679, |
|
"step": 625 |
|
}, |
|
{ |
|
"epoch": 1.48, |
|
"eval_accuracy": 0.9845021611307971, |
|
"eval_f1": 0.9040501043841336, |
|
"eval_loss": 0.06244850531220436, |
|
"eval_precision": 0.8972318912647108, |
|
"eval_recall": 0.910972736452373, |
|
"eval_runtime": 21.6575, |
|
"eval_samples_per_second": 150.064, |
|
"eval_steps_per_second": 4.71, |
|
"step": 650 |
|
}, |
|
{ |
|
"epoch": 1.54, |
|
"eval_accuracy": 0.9841517074880262, |
|
"eval_f1": 0.90302066772655, |
|
"eval_loss": 0.06191794201731682, |
|
"eval_precision": 0.8979863538026294, |
|
"eval_recall": 0.9081117468865701, |
|
"eval_runtime": 21.8896, |
|
"eval_samples_per_second": 148.473, |
|
"eval_steps_per_second": 4.66, |
|
"step": 675 |
|
}, |
|
{ |
|
"epoch": 1.59, |
|
"eval_accuracy": 0.9842685253689498, |
|
"eval_f1": 0.904538603249037, |
|
"eval_loss": 0.06151856482028961, |
|
"eval_precision": 0.9001666666666667, |
|
"eval_recall": 0.9089532144059239, |
|
"eval_runtime": 21.9582, |
|
"eval_samples_per_second": 148.008, |
|
"eval_steps_per_second": 4.645, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 1.65, |
|
"eval_accuracy": 0.9849889023013123, |
|
"eval_f1": 0.9082384460817148, |
|
"eval_loss": 0.060051579028367996, |
|
"eval_precision": 0.9036987670776407, |
|
"eval_recall": 0.9128239649949512, |
|
"eval_runtime": 21.5715, |
|
"eval_samples_per_second": 150.661, |
|
"eval_steps_per_second": 4.728, |
|
"step": 725 |
|
}, |
|
{ |
|
"epoch": 1.71, |
|
"eval_accuracy": 0.984949963007671, |
|
"eval_f1": 0.9085891109810152, |
|
"eval_loss": 0.058469709008932114, |
|
"eval_precision": 0.9030756442227764, |
|
"eval_recall": 0.9141703130259172, |
|
"eval_runtime": 21.259, |
|
"eval_samples_per_second": 152.877, |
|
"eval_steps_per_second": 4.798, |
|
"step": 750 |
|
}, |
|
{ |
|
"epoch": 1.77, |
|
"eval_accuracy": 0.9850862505354153, |
|
"eval_f1": 0.9089084065244667, |
|
"eval_loss": 0.05824408307671547, |
|
"eval_precision": 0.903542324962581, |
|
"eval_recall": 0.9143386065297879, |
|
"eval_runtime": 21.7846, |
|
"eval_samples_per_second": 149.188, |
|
"eval_steps_per_second": 4.682, |
|
"step": 775 |
|
}, |
|
{ |
|
"epoch": 1.82, |
|
"eval_accuracy": 0.9852809470036213, |
|
"eval_f1": 0.9100183977253721, |
|
"eval_loss": 0.0580282025039196, |
|
"eval_precision": 0.9044215425531915, |
|
"eval_recall": 0.9156849545607539, |
|
"eval_runtime": 21.4108, |
|
"eval_samples_per_second": 151.792, |
|
"eval_steps_per_second": 4.764, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 1.88, |
|
"eval_accuracy": 0.9851446594758771, |
|
"eval_f1": 0.9096682543661736, |
|
"eval_loss": 0.058311279863119125, |
|
"eval_precision": 0.903402489626556, |
|
"eval_recall": 0.9160215415684955, |
|
"eval_runtime": 21.1305, |
|
"eval_samples_per_second": 153.806, |
|
"eval_steps_per_second": 4.827, |
|
"step": 825 |
|
}, |
|
{ |
|
"epoch": 1.94, |
|
"eval_accuracy": 0.9853782952377244, |
|
"eval_f1": 0.9113564141160729, |
|
"eval_loss": 0.05776725709438324, |
|
"eval_precision": 0.905751329787234, |
|
"eval_recall": 0.9170313025917199, |
|
"eval_runtime": 21.1284, |
|
"eval_samples_per_second": 153.821, |
|
"eval_steps_per_second": 4.828, |
|
"step": 850 |
|
}, |
|
{ |
|
"epoch": 1.99, |
|
"eval_accuracy": 0.9852420077099802, |
|
"eval_f1": 0.9112356730527901, |
|
"eval_loss": 0.05755457654595375, |
|
"eval_precision": 0.9060056562967892, |
|
"eval_recall": 0.9165264220801077, |
|
"eval_runtime": 21.4936, |
|
"eval_samples_per_second": 151.208, |
|
"eval_steps_per_second": 4.746, |
|
"step": 875 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"step": 878, |
|
"total_flos": 913386421477854.0, |
|
"train_loss": 0.09878404265384196, |
|
"train_runtime": 1144.6421, |
|
"train_samples_per_second": 24.533, |
|
"train_steps_per_second": 0.767 |
|
} |
|
], |
|
"max_steps": 878, |
|
"num_train_epochs": 2, |
|
"total_flos": 913386421477854.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|