|
{ |
|
"best_metric": 0.9824828636709825, |
|
"best_model_checkpoint": "/content/drive/Shareddrives/Data Science Team folder-open/Clients/Rhenus Documents/attachments_batch7_20231027_SELECTED/Thermorossi/pdf2img/processedimg/0-60 THERMOROSSI/model/PickupReq_combined_RNS_Dec23_EEB_v4/checkpoint-4500", |
|
"epoch": 78.125, |
|
"global_step": 5000, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.56, |
|
"eval_accuracy": 0.9868951612903226, |
|
"eval_f1": 0.942878903274943, |
|
"eval_loss": 0.06447841972112656, |
|
"eval_precision": 0.9435975609756098, |
|
"eval_recall": 0.9421613394216134, |
|
"eval_runtime": 1.2198, |
|
"eval_samples_per_second": 10.658, |
|
"eval_steps_per_second": 5.739, |
|
"step": 100 |
|
}, |
|
{ |
|
"epoch": 3.12, |
|
"eval_accuracy": 0.9914314516129032, |
|
"eval_f1": 0.9573170731707317, |
|
"eval_loss": 0.04372543469071388, |
|
"eval_precision": 0.9587786259541985, |
|
"eval_recall": 0.9558599695585996, |
|
"eval_runtime": 1.2728, |
|
"eval_samples_per_second": 10.213, |
|
"eval_steps_per_second": 5.5, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 4.69, |
|
"eval_accuracy": 0.9924395161290323, |
|
"eval_f1": 0.966360856269113, |
|
"eval_loss": 0.04766829311847687, |
|
"eval_precision": 0.9708141321044547, |
|
"eval_recall": 0.9619482496194824, |
|
"eval_runtime": 1.224, |
|
"eval_samples_per_second": 10.621, |
|
"eval_steps_per_second": 5.719, |
|
"step": 300 |
|
}, |
|
{ |
|
"epoch": 6.25, |
|
"eval_accuracy": 0.9939516129032258, |
|
"eval_f1": 0.9786585365853657, |
|
"eval_loss": 0.050641875714063644, |
|
"eval_precision": 0.9801526717557252, |
|
"eval_recall": 0.9771689497716894, |
|
"eval_runtime": 1.2177, |
|
"eval_samples_per_second": 10.676, |
|
"eval_steps_per_second": 5.749, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 7.81, |
|
"learning_rate": 9e-06, |
|
"loss": 0.145, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 7.81, |
|
"eval_accuracy": 0.9939516129032258, |
|
"eval_f1": 0.9733434881949734, |
|
"eval_loss": 0.03310808911919594, |
|
"eval_precision": 0.9740853658536586, |
|
"eval_recall": 0.9726027397260274, |
|
"eval_runtime": 1.2766, |
|
"eval_samples_per_second": 10.183, |
|
"eval_steps_per_second": 5.483, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 9.38, |
|
"eval_accuracy": 0.9939516129032258, |
|
"eval_f1": 0.9718202589489718, |
|
"eval_loss": 0.04493210092186928, |
|
"eval_precision": 0.9725609756097561, |
|
"eval_recall": 0.9710806697108066, |
|
"eval_runtime": 1.2123, |
|
"eval_samples_per_second": 10.724, |
|
"eval_steps_per_second": 5.774, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 10.94, |
|
"eval_accuracy": 0.9939516129032258, |
|
"eval_f1": 0.9702970297029704, |
|
"eval_loss": 0.038082972168922424, |
|
"eval_precision": 0.9710365853658537, |
|
"eval_recall": 0.969558599695586, |
|
"eval_runtime": 1.2843, |
|
"eval_samples_per_second": 10.122, |
|
"eval_steps_per_second": 5.45, |
|
"step": 700 |
|
}, |
|
{ |
|
"epoch": 12.5, |
|
"eval_accuracy": 0.9939516129032258, |
|
"eval_f1": 0.9702970297029704, |
|
"eval_loss": 0.03552929311990738, |
|
"eval_precision": 0.9710365853658537, |
|
"eval_recall": 0.969558599695586, |
|
"eval_runtime": 1.2169, |
|
"eval_samples_per_second": 10.683, |
|
"eval_steps_per_second": 5.752, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 14.06, |
|
"eval_accuracy": 0.9919354838709677, |
|
"eval_f1": 0.9672505712109674, |
|
"eval_loss": 0.03628508001565933, |
|
"eval_precision": 0.9679878048780488, |
|
"eval_recall": 0.9665144596651446, |
|
"eval_runtime": 1.2161, |
|
"eval_samples_per_second": 10.69, |
|
"eval_steps_per_second": 5.756, |
|
"step": 900 |
|
}, |
|
{ |
|
"epoch": 15.62, |
|
"learning_rate": 8.000000000000001e-06, |
|
"loss": 0.0076, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 15.62, |
|
"eval_accuracy": 0.9919354838709677, |
|
"eval_f1": 0.9642041127189643, |
|
"eval_loss": 0.041032299399375916, |
|
"eval_precision": 0.9649390243902439, |
|
"eval_recall": 0.9634703196347032, |
|
"eval_runtime": 1.2046, |
|
"eval_samples_per_second": 10.792, |
|
"eval_steps_per_second": 5.811, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 17.19, |
|
"eval_accuracy": 0.9939516129032258, |
|
"eval_f1": 0.9763899466869764, |
|
"eval_loss": 0.025884319096803665, |
|
"eval_precision": 0.9771341463414634, |
|
"eval_recall": 0.9756468797564688, |
|
"eval_runtime": 1.2178, |
|
"eval_samples_per_second": 10.675, |
|
"eval_steps_per_second": 5.748, |
|
"step": 1100 |
|
}, |
|
{ |
|
"epoch": 18.75, |
|
"eval_accuracy": 0.9949596774193549, |
|
"eval_f1": 0.9764258555133081, |
|
"eval_loss": 0.03205409273505211, |
|
"eval_precision": 0.9756838905775076, |
|
"eval_recall": 0.9771689497716894, |
|
"eval_runtime": 1.2104, |
|
"eval_samples_per_second": 10.74, |
|
"eval_steps_per_second": 5.783, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 20.31, |
|
"eval_accuracy": 0.9949596774193549, |
|
"eval_f1": 0.9764258555133081, |
|
"eval_loss": 0.03990120440721512, |
|
"eval_precision": 0.9756838905775076, |
|
"eval_recall": 0.9771689497716894, |
|
"eval_runtime": 1.2848, |
|
"eval_samples_per_second": 10.118, |
|
"eval_steps_per_second": 5.448, |
|
"step": 1300 |
|
}, |
|
{ |
|
"epoch": 21.88, |
|
"eval_accuracy": 0.9959677419354839, |
|
"eval_f1": 0.9824828636709825, |
|
"eval_loss": 0.026920977979898453, |
|
"eval_precision": 0.9832317073170732, |
|
"eval_recall": 0.9817351598173516, |
|
"eval_runtime": 1.2238, |
|
"eval_samples_per_second": 10.623, |
|
"eval_steps_per_second": 5.72, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 23.44, |
|
"learning_rate": 7e-06, |
|
"loss": 0.0034, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 23.44, |
|
"eval_accuracy": 0.9944556451612904, |
|
"eval_f1": 0.9763899466869764, |
|
"eval_loss": 0.03660265728831291, |
|
"eval_precision": 0.9771341463414634, |
|
"eval_recall": 0.9756468797564688, |
|
"eval_runtime": 1.2067, |
|
"eval_samples_per_second": 10.773, |
|
"eval_steps_per_second": 5.801, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 25.0, |
|
"eval_accuracy": 0.9969758064516129, |
|
"eval_f1": 0.9855293221629856, |
|
"eval_loss": 0.0368938222527504, |
|
"eval_precision": 0.9862804878048781, |
|
"eval_recall": 0.984779299847793, |
|
"eval_runtime": 1.2163, |
|
"eval_samples_per_second": 10.688, |
|
"eval_steps_per_second": 5.755, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 26.56, |
|
"eval_accuracy": 0.9954637096774194, |
|
"eval_f1": 0.9794364051789796, |
|
"eval_loss": 0.03973403945565224, |
|
"eval_precision": 0.9801829268292683, |
|
"eval_recall": 0.9786910197869102, |
|
"eval_runtime": 1.2199, |
|
"eval_samples_per_second": 10.657, |
|
"eval_steps_per_second": 5.738, |
|
"step": 1700 |
|
}, |
|
{ |
|
"epoch": 28.12, |
|
"eval_accuracy": 0.9964717741935484, |
|
"eval_f1": 0.9824828636709825, |
|
"eval_loss": 0.027732405811548233, |
|
"eval_precision": 0.9832317073170732, |
|
"eval_recall": 0.9817351598173516, |
|
"eval_runtime": 1.2739, |
|
"eval_samples_per_second": 10.205, |
|
"eval_steps_per_second": 5.495, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 29.69, |
|
"eval_accuracy": 0.9964717741935484, |
|
"eval_f1": 0.9855293221629856, |
|
"eval_loss": 0.03053249605000019, |
|
"eval_precision": 0.9862804878048781, |
|
"eval_recall": 0.984779299847793, |
|
"eval_runtime": 1.2239, |
|
"eval_samples_per_second": 10.621, |
|
"eval_steps_per_second": 5.719, |
|
"step": 1900 |
|
}, |
|
{ |
|
"epoch": 31.25, |
|
"learning_rate": 6e-06, |
|
"loss": 0.0021, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 31.25, |
|
"eval_accuracy": 0.9954637096774194, |
|
"eval_f1": 0.9763899466869764, |
|
"eval_loss": 0.04148135706782341, |
|
"eval_precision": 0.9771341463414634, |
|
"eval_recall": 0.9756468797564688, |
|
"eval_runtime": 1.2182, |
|
"eval_samples_per_second": 10.672, |
|
"eval_steps_per_second": 5.746, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 32.81, |
|
"eval_accuracy": 0.9964717741935484, |
|
"eval_f1": 0.9855293221629856, |
|
"eval_loss": 0.03434097394347191, |
|
"eval_precision": 0.9862804878048781, |
|
"eval_recall": 0.984779299847793, |
|
"eval_runtime": 1.2192, |
|
"eval_samples_per_second": 10.663, |
|
"eval_steps_per_second": 5.742, |
|
"step": 2100 |
|
}, |
|
{ |
|
"epoch": 34.38, |
|
"eval_accuracy": 0.9964717741935484, |
|
"eval_f1": 0.9824828636709825, |
|
"eval_loss": 0.036329954862594604, |
|
"eval_precision": 0.9832317073170732, |
|
"eval_recall": 0.9817351598173516, |
|
"eval_runtime": 1.2759, |
|
"eval_samples_per_second": 10.189, |
|
"eval_steps_per_second": 5.486, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 35.94, |
|
"eval_accuracy": 0.9959677419354839, |
|
"eval_f1": 0.9824828636709825, |
|
"eval_loss": 0.0368308424949646, |
|
"eval_precision": 0.9832317073170732, |
|
"eval_recall": 0.9817351598173516, |
|
"eval_runtime": 1.215, |
|
"eval_samples_per_second": 10.7, |
|
"eval_steps_per_second": 5.762, |
|
"step": 2300 |
|
}, |
|
{ |
|
"epoch": 37.5, |
|
"eval_accuracy": 0.9964717741935484, |
|
"eval_f1": 0.9824828636709825, |
|
"eval_loss": 0.03690670430660248, |
|
"eval_precision": 0.9832317073170732, |
|
"eval_recall": 0.9817351598173516, |
|
"eval_runtime": 1.2077, |
|
"eval_samples_per_second": 10.764, |
|
"eval_steps_per_second": 5.796, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 39.06, |
|
"learning_rate": 5e-06, |
|
"loss": 0.0016, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 39.06, |
|
"eval_accuracy": 0.9954637096774194, |
|
"eval_f1": 0.9794364051789796, |
|
"eval_loss": 0.03333241119980812, |
|
"eval_precision": 0.9801829268292683, |
|
"eval_recall": 0.9786910197869102, |
|
"eval_runtime": 1.2147, |
|
"eval_samples_per_second": 10.703, |
|
"eval_steps_per_second": 5.763, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 40.62, |
|
"eval_accuracy": 0.9979838709677419, |
|
"eval_f1": 0.9916222391469918, |
|
"eval_loss": 0.03542204946279526, |
|
"eval_precision": 0.9923780487804879, |
|
"eval_recall": 0.9908675799086758, |
|
"eval_runtime": 1.2122, |
|
"eval_samples_per_second": 10.725, |
|
"eval_steps_per_second": 5.775, |
|
"step": 2600 |
|
}, |
|
{ |
|
"epoch": 42.19, |
|
"eval_accuracy": 0.9964717741935484, |
|
"eval_f1": 0.9824828636709825, |
|
"eval_loss": 0.03290965408086777, |
|
"eval_precision": 0.9832317073170732, |
|
"eval_recall": 0.9817351598173516, |
|
"eval_runtime": 1.2189, |
|
"eval_samples_per_second": 10.665, |
|
"eval_steps_per_second": 5.743, |
|
"step": 2700 |
|
}, |
|
{ |
|
"epoch": 43.75, |
|
"eval_accuracy": 0.9969758064516129, |
|
"eval_f1": 0.9855293221629856, |
|
"eval_loss": 0.03801412135362625, |
|
"eval_precision": 0.9862804878048781, |
|
"eval_recall": 0.984779299847793, |
|
"eval_runtime": 1.2022, |
|
"eval_samples_per_second": 10.813, |
|
"eval_steps_per_second": 5.823, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 45.31, |
|
"eval_accuracy": 0.9959677419354839, |
|
"eval_f1": 0.9794364051789796, |
|
"eval_loss": 0.03737560659646988, |
|
"eval_precision": 0.9801829268292683, |
|
"eval_recall": 0.9786910197869102, |
|
"eval_runtime": 1.2805, |
|
"eval_samples_per_second": 10.152, |
|
"eval_steps_per_second": 5.467, |
|
"step": 2900 |
|
}, |
|
{ |
|
"epoch": 46.88, |
|
"learning_rate": 4.000000000000001e-06, |
|
"loss": 0.0008, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 46.88, |
|
"eval_accuracy": 0.9959677419354839, |
|
"eval_f1": 0.9794364051789796, |
|
"eval_loss": 0.03473510965704918, |
|
"eval_precision": 0.9801829268292683, |
|
"eval_recall": 0.9786910197869102, |
|
"eval_runtime": 1.2112, |
|
"eval_samples_per_second": 10.733, |
|
"eval_steps_per_second": 5.779, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 48.44, |
|
"eval_accuracy": 0.9959677419354839, |
|
"eval_f1": 0.9794364051789796, |
|
"eval_loss": 0.03780585899949074, |
|
"eval_precision": 0.9801829268292683, |
|
"eval_recall": 0.9786910197869102, |
|
"eval_runtime": 1.2093, |
|
"eval_samples_per_second": 10.75, |
|
"eval_steps_per_second": 5.788, |
|
"step": 3100 |
|
}, |
|
{ |
|
"epoch": 50.0, |
|
"eval_accuracy": 0.9964717741935484, |
|
"eval_f1": 0.9824828636709825, |
|
"eval_loss": 0.03984608128666878, |
|
"eval_precision": 0.9832317073170732, |
|
"eval_recall": 0.9817351598173516, |
|
"eval_runtime": 1.2798, |
|
"eval_samples_per_second": 10.157, |
|
"eval_steps_per_second": 5.469, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 51.56, |
|
"eval_accuracy": 0.9959677419354839, |
|
"eval_f1": 0.9794364051789796, |
|
"eval_loss": 0.03601069748401642, |
|
"eval_precision": 0.9801829268292683, |
|
"eval_recall": 0.9786910197869102, |
|
"eval_runtime": 1.2064, |
|
"eval_samples_per_second": 10.776, |
|
"eval_steps_per_second": 5.802, |
|
"step": 3300 |
|
}, |
|
{ |
|
"epoch": 53.12, |
|
"eval_accuracy": 0.9954637096774194, |
|
"eval_f1": 0.9779131759329779, |
|
"eval_loss": 0.04352593794465065, |
|
"eval_precision": 0.9786585365853658, |
|
"eval_recall": 0.9771689497716894, |
|
"eval_runtime": 1.2834, |
|
"eval_samples_per_second": 10.129, |
|
"eval_steps_per_second": 5.454, |
|
"step": 3400 |
|
}, |
|
{ |
|
"epoch": 54.69, |
|
"learning_rate": 3e-06, |
|
"loss": 0.0006, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 54.69, |
|
"eval_accuracy": 0.9959677419354839, |
|
"eval_f1": 0.9794364051789796, |
|
"eval_loss": 0.044929005205631256, |
|
"eval_precision": 0.9801829268292683, |
|
"eval_recall": 0.9786910197869102, |
|
"eval_runtime": 1.2158, |
|
"eval_samples_per_second": 10.693, |
|
"eval_steps_per_second": 5.758, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 56.25, |
|
"eval_accuracy": 0.9959677419354839, |
|
"eval_f1": 0.9794364051789796, |
|
"eval_loss": 0.04337146133184433, |
|
"eval_precision": 0.9801829268292683, |
|
"eval_recall": 0.9786910197869102, |
|
"eval_runtime": 1.3027, |
|
"eval_samples_per_second": 9.979, |
|
"eval_steps_per_second": 5.373, |
|
"step": 3600 |
|
}, |
|
{ |
|
"epoch": 57.81, |
|
"eval_accuracy": 0.9959677419354839, |
|
"eval_f1": 0.9794364051789796, |
|
"eval_loss": 0.042894065380096436, |
|
"eval_precision": 0.9801829268292683, |
|
"eval_recall": 0.9786910197869102, |
|
"eval_runtime": 1.2493, |
|
"eval_samples_per_second": 10.406, |
|
"eval_steps_per_second": 5.603, |
|
"step": 3700 |
|
}, |
|
{ |
|
"epoch": 59.38, |
|
"eval_accuracy": 0.9969758064516129, |
|
"eval_f1": 0.9855293221629856, |
|
"eval_loss": 0.04019169509410858, |
|
"eval_precision": 0.9862804878048781, |
|
"eval_recall": 0.984779299847793, |
|
"eval_runtime": 1.2664, |
|
"eval_samples_per_second": 10.265, |
|
"eval_steps_per_second": 5.527, |
|
"step": 3800 |
|
}, |
|
{ |
|
"epoch": 60.94, |
|
"eval_accuracy": 0.9964717741935484, |
|
"eval_f1": 0.9824828636709825, |
|
"eval_loss": 0.041059188544750214, |
|
"eval_precision": 0.9832317073170732, |
|
"eval_recall": 0.9817351598173516, |
|
"eval_runtime": 1.2339, |
|
"eval_samples_per_second": 10.536, |
|
"eval_steps_per_second": 5.673, |
|
"step": 3900 |
|
}, |
|
{ |
|
"epoch": 62.5, |
|
"learning_rate": 2.0000000000000003e-06, |
|
"loss": 0.0003, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 62.5, |
|
"eval_accuracy": 0.9959677419354839, |
|
"eval_f1": 0.9794364051789796, |
|
"eval_loss": 0.04345503821969032, |
|
"eval_precision": 0.9801829268292683, |
|
"eval_recall": 0.9786910197869102, |
|
"eval_runtime": 1.2758, |
|
"eval_samples_per_second": 10.189, |
|
"eval_steps_per_second": 5.487, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 64.06, |
|
"eval_accuracy": 0.9959677419354839, |
|
"eval_f1": 0.9794364051789796, |
|
"eval_loss": 0.043661847710609436, |
|
"eval_precision": 0.9801829268292683, |
|
"eval_recall": 0.9786910197869102, |
|
"eval_runtime": 1.2235, |
|
"eval_samples_per_second": 10.625, |
|
"eval_steps_per_second": 5.721, |
|
"step": 4100 |
|
}, |
|
{ |
|
"epoch": 65.62, |
|
"eval_accuracy": 0.9964717741935484, |
|
"eval_f1": 0.9824828636709825, |
|
"eval_loss": 0.04225226491689682, |
|
"eval_precision": 0.9832317073170732, |
|
"eval_recall": 0.9817351598173516, |
|
"eval_runtime": 1.2314, |
|
"eval_samples_per_second": 10.557, |
|
"eval_steps_per_second": 5.685, |
|
"step": 4200 |
|
}, |
|
{ |
|
"epoch": 67.19, |
|
"eval_accuracy": 0.9969758064516129, |
|
"eval_f1": 0.9855293221629856, |
|
"eval_loss": 0.04165039211511612, |
|
"eval_precision": 0.9862804878048781, |
|
"eval_recall": 0.984779299847793, |
|
"eval_runtime": 1.2205, |
|
"eval_samples_per_second": 10.651, |
|
"eval_steps_per_second": 5.735, |
|
"step": 4300 |
|
}, |
|
{ |
|
"epoch": 68.75, |
|
"eval_accuracy": 0.9964717741935484, |
|
"eval_f1": 0.9824828636709825, |
|
"eval_loss": 0.04333154484629631, |
|
"eval_precision": 0.9832317073170732, |
|
"eval_recall": 0.9817351598173516, |
|
"eval_runtime": 1.2885, |
|
"eval_samples_per_second": 10.089, |
|
"eval_steps_per_second": 5.433, |
|
"step": 4400 |
|
}, |
|
{ |
|
"epoch": 70.31, |
|
"learning_rate": 1.0000000000000002e-06, |
|
"loss": 0.0003, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 70.31, |
|
"eval_accuracy": 0.9964717741935484, |
|
"eval_f1": 0.9824828636709825, |
|
"eval_loss": 0.043314892798662186, |
|
"eval_precision": 0.9832317073170732, |
|
"eval_recall": 0.9817351598173516, |
|
"eval_runtime": 1.2238, |
|
"eval_samples_per_second": 10.623, |
|
"eval_steps_per_second": 5.72, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 71.88, |
|
"eval_accuracy": 0.9964717741935484, |
|
"eval_f1": 0.9824828636709825, |
|
"eval_loss": 0.043683238327503204, |
|
"eval_precision": 0.9832317073170732, |
|
"eval_recall": 0.9817351598173516, |
|
"eval_runtime": 1.2463, |
|
"eval_samples_per_second": 10.431, |
|
"eval_steps_per_second": 5.616, |
|
"step": 4600 |
|
}, |
|
{ |
|
"epoch": 73.44, |
|
"eval_accuracy": 0.9969758064516129, |
|
"eval_f1": 0.9855293221629856, |
|
"eval_loss": 0.043529048562049866, |
|
"eval_precision": 0.9862804878048781, |
|
"eval_recall": 0.984779299847793, |
|
"eval_runtime": 1.2409, |
|
"eval_samples_per_second": 10.476, |
|
"eval_steps_per_second": 5.641, |
|
"step": 4700 |
|
}, |
|
{ |
|
"epoch": 75.0, |
|
"eval_accuracy": 0.9964717741935484, |
|
"eval_f1": 0.9824828636709825, |
|
"eval_loss": 0.043888889253139496, |
|
"eval_precision": 0.9832317073170732, |
|
"eval_recall": 0.9817351598173516, |
|
"eval_runtime": 1.2665, |
|
"eval_samples_per_second": 10.265, |
|
"eval_steps_per_second": 5.527, |
|
"step": 4800 |
|
}, |
|
{ |
|
"epoch": 76.56, |
|
"eval_accuracy": 0.9964717741935484, |
|
"eval_f1": 0.9824828636709825, |
|
"eval_loss": 0.04420410841703415, |
|
"eval_precision": 0.9832317073170732, |
|
"eval_recall": 0.9817351598173516, |
|
"eval_runtime": 1.2292, |
|
"eval_samples_per_second": 10.576, |
|
"eval_steps_per_second": 5.695, |
|
"step": 4900 |
|
}, |
|
{ |
|
"epoch": 78.12, |
|
"learning_rate": 0.0, |
|
"loss": 0.0002, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 78.12, |
|
"eval_accuracy": 0.9964717741935484, |
|
"eval_f1": 0.9824828636709825, |
|
"eval_loss": 0.043921105563640594, |
|
"eval_precision": 0.9832317073170732, |
|
"eval_recall": 0.9817351598173516, |
|
"eval_runtime": 1.2477, |
|
"eval_samples_per_second": 10.419, |
|
"eval_steps_per_second": 5.61, |
|
"step": 5000 |
|
} |
|
], |
|
"max_steps": 5000, |
|
"num_train_epochs": 79, |
|
"total_flos": 2634149990123520.0, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|