diff --git "a/trainer_state.json" "b/trainer_state.json" --- "a/trainer_state.json" +++ "b/trainer_state.json" @@ -1,409 +1,3929 @@ { "best_metric": null, "best_model_checkpoint": null, - "epoch": 20.0, + "epoch": 100.0, "eval_steps": 500, - "global_step": 2120, + "global_step": 10600, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 1.0, - "grad_norm": 3.486544132232666, - "learning_rate": 4.75e-05, - "loss": 0.3438, + "grad_norm": 4.555638790130615, + "learning_rate": 4.9500000000000004e-05, + "loss": 0.3502, "step": 106 }, { "epoch": 1.0, - "eval_accuracy": 0.9492119089316988, - "eval_f1": 0.7840440165061899, - "eval_loss": 0.16529129445552826, - "eval_precision": 0.7345360824742269, - "eval_recall": 0.8407079646017699, - "eval_runtime": 0.8917, - "eval_samples_per_second": 209.705, - "eval_steps_per_second": 3.364, + "eval_LOCATION_f1": 0.751592356687898, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.6941176470588235, + "eval_LOCATION_recall": 0.8194444444444444, + "eval_ORGANIZATION_f1": 0.7305389221556886, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.6630434782608695, + "eval_ORGANIZATION_recall": 0.8133333333333334, + "eval_PERSON_f1": 0.8976897689768978, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.85, + "eval_PERSON_recall": 0.951048951048951, + "eval_QUANTITY_f1": 0.5423728813559322, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.4444444444444444, + "eval_QUANTITY_recall": 0.6956521739130435, + "eval_TIME_f1": 0.6779661016949152, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.6060606060606061, + "eval_TIME_recall": 0.7692307692307693, + "eval_loss": 0.16481448709964752, + "eval_overall_accuracy": 0.9522141606204654, + "eval_overall_f1": 0.7838926174496645, + "eval_overall_precision": 0.7192118226600985, + "eval_overall_recall": 0.8613569321533924, + "eval_runtime": 0.8792, + "eval_samples_per_second": 212.683, + "eval_steps_per_second": 3.412, "step": 106 }, { "epoch": 2.0, - "grad_norm": 2.105318307876587, - "learning_rate": 4.5e-05, - "loss": 0.1133, + "grad_norm": 3.0741477012634277, + "learning_rate": 4.9e-05, + "loss": 0.1178, "step": 212 }, { "epoch": 2.0, - "eval_accuracy": 0.9569677257943457, - "eval_f1": 0.8272108843537416, - "eval_loss": 0.13404884934425354, - "eval_precision": 0.7676767676767676, - "eval_recall": 0.8967551622418879, - "eval_runtime": 0.9428, - "eval_samples_per_second": 198.343, - "eval_steps_per_second": 3.182, + "eval_LOCATION_f1": 0.8289473684210527, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7875, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.7100000000000001, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.568, + "eval_ORGANIZATION_recall": 0.9466666666666667, + "eval_PERSON_f1": 0.9047619047619047, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8807947019867549, + "eval_PERSON_recall": 0.9300699300699301, + "eval_QUANTITY_f1": 0.5614035087719297, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.47058823529411764, + "eval_QUANTITY_recall": 0.6956521739130435, + "eval_TIME_f1": 0.8461538461538461, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8461538461538461, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.14857080578804016, + "eval_overall_accuracy": 0.9537152864648486, + "eval_overall_f1": 0.8079470198675497, + "eval_overall_precision": 0.7331730769230769, + "eval_overall_recall": 0.8997050147492626, + "eval_runtime": 0.9505, + "eval_samples_per_second": 196.731, + "eval_steps_per_second": 3.156, "step": 212 }, { "epoch": 3.0, - "grad_norm": 2.1835291385650635, - "learning_rate": 4.25e-05, - "loss": 0.0736, + "grad_norm": 2.83402419090271, + "learning_rate": 4.85e-05, + "loss": 0.0781, "step": 318 }, { "epoch": 3.0, - "eval_accuracy": 0.9589692269201902, - "eval_f1": 0.8222222222222222, - "eval_loss": 0.1448056399822235, - "eval_precision": 0.7769028871391076, - "eval_recall": 0.8731563421828908, - "eval_runtime": 0.893, - "eval_samples_per_second": 209.417, - "eval_steps_per_second": 3.36, + "eval_LOCATION_f1": 0.8299319727891157, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8133333333333334, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.7777777777777778, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.6666666666666666, + "eval_ORGANIZATION_recall": 0.9333333333333333, + "eval_PERSON_f1": 0.8933333333333333, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8535031847133758, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7083333333333334, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.68, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.8461538461538461, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8461538461538461, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.15726295113563538, + "eval_overall_accuracy": 0.9552164123092319, + "eval_overall_f1": 0.8363136176066025, + "eval_overall_precision": 0.7835051546391752, + "eval_overall_recall": 0.8967551622418879, + "eval_runtime": 0.8869, + "eval_samples_per_second": 210.857, + "eval_steps_per_second": 3.383, "step": 318 }, { "epoch": 4.0, - "grad_norm": 4.041090965270996, - "learning_rate": 4e-05, - "loss": 0.0473, + "grad_norm": 2.320517063140869, + "learning_rate": 4.8e-05, + "loss": 0.0572, "step": 424 }, { "epoch": 4.0, - "eval_accuracy": 0.961220915686765, - "eval_f1": 0.8274894810659187, - "eval_loss": 0.158503457903862, - "eval_precision": 0.7887700534759359, - "eval_recall": 0.8702064896755162, - "eval_runtime": 0.9078, - "eval_samples_per_second": 206.001, - "eval_steps_per_second": 3.305, + "eval_LOCATION_f1": 0.816326530612245, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8, + "eval_LOCATION_recall": 0.8333333333333334, + "eval_ORGANIZATION_f1": 0.7651006711409396, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7702702702702703, + "eval_ORGANIZATION_recall": 0.76, + "eval_PERSON_f1": 0.9019607843137255, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8466257668711656, + "eval_PERSON_recall": 0.965034965034965, + "eval_QUANTITY_f1": 0.6415094339622641, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.5666666666666667, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.7368421052631579, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.6774193548387096, + "eval_TIME_recall": 0.8076923076923077, + "eval_loss": 0.17222364246845245, + "eval_overall_accuracy": 0.957968476357268, + "eval_overall_f1": 0.8230337078651685, + "eval_overall_precision": 0.7855227882037533, + "eval_overall_recall": 0.8643067846607669, + "eval_runtime": 0.9001, + "eval_samples_per_second": 207.754, + "eval_steps_per_second": 3.333, "step": 424 }, { "epoch": 5.0, - "grad_norm": 2.1877193450927734, - "learning_rate": 3.7500000000000003e-05, - "loss": 0.0311, + "grad_norm": 0.44582077860832214, + "learning_rate": 4.75e-05, + "loss": 0.0359, "step": 530 }, { "epoch": 5.0, - "eval_accuracy": 0.9604703527645734, - "eval_f1": 0.8344923504867873, - "eval_loss": 0.18446023762226105, - "eval_precision": 0.7894736842105263, - "eval_recall": 0.8849557522123894, - "eval_runtime": 0.911, - "eval_samples_per_second": 205.279, - "eval_steps_per_second": 3.293, + "eval_LOCATION_f1": 0.8258064516129032, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7710843373493976, + "eval_LOCATION_recall": 0.8888888888888888, + "eval_ORGANIZATION_f1": 0.7951807228915663, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7252747252747253, + "eval_ORGANIZATION_recall": 0.88, + "eval_PERSON_f1": 0.9152542372881356, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8881578947368421, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.7450980392156864, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6785714285714286, + "eval_QUANTITY_recall": 0.8260869565217391, + "eval_TIME_f1": 0.8799999999999999, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.9166666666666666, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.15475203096866608, + "eval_overall_accuracy": 0.9642231673755316, + "eval_overall_f1": 0.8535564853556487, + "eval_overall_precision": 0.8095238095238095, + "eval_overall_recall": 0.9026548672566371, + "eval_runtime": 0.9396, + "eval_samples_per_second": 199.021, + "eval_steps_per_second": 3.193, "step": 530 }, { "epoch": 6.0, - "grad_norm": 2.7992465496063232, - "learning_rate": 3.5e-05, - "loss": 0.0179, + "grad_norm": 0.24779094755649567, + "learning_rate": 4.7e-05, + "loss": 0.0236, "step": 636 }, { "epoch": 6.0, - "eval_accuracy": 0.9602201651238429, - "eval_f1": 0.8263305322128851, - "eval_loss": 0.21451354026794434, - "eval_precision": 0.7866666666666666, - "eval_recall": 0.8702064896755162, - "eval_runtime": 0.9051, - "eval_samples_per_second": 206.598, - "eval_steps_per_second": 3.314, + "eval_LOCATION_f1": 0.7808219178082192, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7702702702702703, + "eval_LOCATION_recall": 0.7916666666666666, + "eval_ORGANIZATION_f1": 0.7564102564102564, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7283950617283951, + "eval_ORGANIZATION_recall": 0.7866666666666666, + "eval_PERSON_f1": 0.888888888888889, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8571428571428571, + "eval_PERSON_recall": 0.9230769230769231, + "eval_QUANTITY_f1": 0.72, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6666666666666666, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8148148148148148, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.7857142857142857, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.18202847242355347, + "eval_overall_accuracy": 0.9604703527645734, + "eval_overall_f1": 0.8193456614509247, + "eval_overall_precision": 0.7912087912087912, + "eval_overall_recall": 0.8495575221238938, + "eval_runtime": 0.9076, + "eval_samples_per_second": 206.029, + "eval_steps_per_second": 3.305, "step": 636 }, { "epoch": 7.0, - "grad_norm": 0.3002428412437439, - "learning_rate": 3.2500000000000004e-05, - "loss": 0.0126, + "grad_norm": 0.0966544821858406, + "learning_rate": 4.6500000000000005e-05, + "loss": 0.0164, "step": 742 }, { "epoch": 7.0, - "eval_accuracy": 0.9567175381536153, - "eval_f1": 0.82336578581363, - "eval_loss": 0.22246094048023224, - "eval_precision": 0.7789473684210526, - "eval_recall": 0.8731563421828908, - "eval_runtime": 0.9044, - "eval_samples_per_second": 206.757, - "eval_steps_per_second": 3.317, + "eval_LOCATION_f1": 0.8181818181818181, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7682926829268293, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.744186046511628, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.6597938144329897, + "eval_ORGANIZATION_recall": 0.8533333333333334, + "eval_PERSON_f1": 0.9072847682119206, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8616352201257862, + "eval_PERSON_recall": 0.958041958041958, + "eval_QUANTITY_f1": 0.7547169811320754, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6666666666666666, + "eval_QUANTITY_recall": 0.8695652173913043, + "eval_TIME_f1": 0.7719298245614036, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.7096774193548387, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.2388230413198471, + "eval_overall_accuracy": 0.9567175381536153, + "eval_overall_f1": 0.8292682926829268, + "eval_overall_precision": 0.7669172932330827, + "eval_overall_recall": 0.9026548672566371, + "eval_runtime": 0.9186, + "eval_samples_per_second": 203.564, + "eval_steps_per_second": 3.266, "step": 742 }, { "epoch": 8.0, - "grad_norm": 0.2764192223548889, - "learning_rate": 3e-05, - "loss": 0.0091, + "grad_norm": 6.724938869476318, + "learning_rate": 4.600000000000001e-05, + "loss": 0.0131, "step": 848 }, { "epoch": 8.0, - "eval_accuracy": 0.9582186639979985, - "eval_f1": 0.8326417704011065, - "eval_loss": 0.2556192874908447, - "eval_precision": 0.7838541666666666, - "eval_recall": 0.887905604719764, - "eval_runtime": 0.9143, - "eval_samples_per_second": 204.535, - "eval_steps_per_second": 3.281, + "eval_LOCATION_f1": 0.8157894736842106, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.775, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.7341772151898734, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.6987951807228916, + "eval_ORGANIZATION_recall": 0.7733333333333333, + "eval_PERSON_f1": 0.8754208754208753, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8441558441558441, + "eval_PERSON_recall": 0.9090909090909091, + "eval_QUANTITY_f1": 0.6923076923076923, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6206896551724138, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.6779661016949152, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.6060606060606061, + "eval_TIME_recall": 0.7692307692307693, + "eval_loss": 0.21797136962413788, + "eval_overall_accuracy": 0.9582186639979985, + "eval_overall_f1": 0.8022284122562674, + "eval_overall_precision": 0.7598944591029023, + "eval_overall_recall": 0.8495575221238938, + "eval_runtime": 0.906, + "eval_samples_per_second": 206.4, + "eval_steps_per_second": 3.311, "step": 848 }, { "epoch": 9.0, - "grad_norm": 0.3533385396003723, - "learning_rate": 2.7500000000000004e-05, - "loss": 0.0041, + "grad_norm": 1.854614019393921, + "learning_rate": 4.55e-05, + "loss": 0.0091, "step": 954 }, { "epoch": 9.0, - "eval_accuracy": 0.9609707280460346, - "eval_f1": 0.8321579689703806, - "eval_loss": 0.2573556900024414, - "eval_precision": 0.7972972972972973, - "eval_recall": 0.8702064896755162, - "eval_runtime": 0.9137, - "eval_samples_per_second": 204.666, - "eval_steps_per_second": 3.283, + "eval_LOCATION_f1": 0.8435374149659863, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8266666666666667, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.788235294117647, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7052631578947368, + "eval_ORGANIZATION_recall": 0.8933333333333333, + "eval_PERSON_f1": 0.8837209302325583, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8417721518987342, + "eval_PERSON_recall": 0.9300699300699301, + "eval_QUANTITY_f1": 0.6923076923076923, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6206896551724138, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.7777777777777779, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.75, + "eval_TIME_recall": 0.8076923076923077, + "eval_loss": 0.26150327920913696, + "eval_overall_accuracy": 0.9589692269201902, + "eval_overall_f1": 0.8314917127071824, + "eval_overall_precision": 0.7818181818181819, + "eval_overall_recall": 0.887905604719764, + "eval_runtime": 0.9105, + "eval_samples_per_second": 205.388, + "eval_steps_per_second": 3.295, "step": 954 }, { "epoch": 10.0, - "grad_norm": 3.1199791431427, - "learning_rate": 2.5e-05, - "loss": 0.0036, + "grad_norm": 1.278331995010376, + "learning_rate": 4.5e-05, + "loss": 0.0099, "step": 1060 }, { "epoch": 10.0, - "eval_accuracy": 0.9554665999499625, - "eval_f1": 0.817174515235457, - "eval_loss": 0.3124300241470337, - "eval_precision": 0.7702349869451697, - "eval_recall": 0.8702064896755162, - "eval_runtime": 0.9012, - "eval_samples_per_second": 207.51, - "eval_steps_per_second": 3.329, + "eval_LOCATION_f1": 0.816326530612245, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8, + "eval_LOCATION_recall": 0.8333333333333334, + "eval_ORGANIZATION_f1": 0.7500000000000001, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7058823529411765, + "eval_ORGANIZATION_recall": 0.8, + "eval_PERSON_f1": 0.9183673469387755, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8940397350993378, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.6923076923076923, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6206896551724138, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8214285714285715, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.7666666666666667, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.24217499792575836, + "eval_overall_accuracy": 0.9619714786089567, + "eval_overall_f1": 0.8349788434414668, + "eval_overall_precision": 0.8, + "eval_overall_recall": 0.8731563421828908, + "eval_runtime": 0.9185, + "eval_samples_per_second": 203.602, + "eval_steps_per_second": 3.266, "step": 1060 }, { "epoch": 11.0, - "grad_norm": 0.014265856705605984, - "learning_rate": 2.25e-05, - "loss": 0.0038, + "grad_norm": 0.09772255271673203, + "learning_rate": 4.4500000000000004e-05, + "loss": 0.0059, "step": 1166 }, { "epoch": 11.0, - "eval_accuracy": 0.960720540405304, - "eval_f1": 0.8324022346368715, - "eval_loss": 0.2836814224720001, - "eval_precision": 0.7904509283819628, - "eval_recall": 0.8790560471976401, - "eval_runtime": 0.916, - "eval_samples_per_second": 204.138, - "eval_steps_per_second": 3.275, + "eval_LOCATION_f1": 0.7972972972972973, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7763157894736842, + "eval_LOCATION_recall": 0.8194444444444444, + "eval_ORGANIZATION_f1": 0.7619047619047621, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.6881720430107527, + "eval_ORGANIZATION_recall": 0.8533333333333334, + "eval_PERSON_f1": 0.907849829351536, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8866666666666667, + "eval_PERSON_recall": 0.9300699300699301, + "eval_QUANTITY_f1": 0.6923076923076923, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6206896551724138, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.2546893060207367, + "eval_overall_accuracy": 0.9589692269201902, + "eval_overall_f1": 0.8307692307692307, + "eval_overall_precision": 0.7898936170212766, + "eval_overall_recall": 0.8761061946902655, + "eval_runtime": 0.9121, + "eval_samples_per_second": 205.026, + "eval_steps_per_second": 3.289, "step": 1166 }, { "epoch": 12.0, - "grad_norm": 1.1654541492462158, - "learning_rate": 2e-05, - "loss": 0.0017, + "grad_norm": 0.023314962163567543, + "learning_rate": 4.4000000000000006e-05, + "loss": 0.0062, "step": 1272 }, { "epoch": 12.0, - "eval_accuracy": 0.9574681010758068, - "eval_f1": 0.825, - "eval_loss": 0.3034752905368805, - "eval_precision": 0.7795275590551181, - "eval_recall": 0.8761061946902655, - "eval_runtime": 0.91, - "eval_samples_per_second": 205.506, - "eval_steps_per_second": 3.297, + "eval_LOCATION_f1": 0.7945205479452055, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7837837837837838, + "eval_LOCATION_recall": 0.8055555555555556, + "eval_ORGANIZATION_f1": 0.8074534161490684, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7558139534883721, + "eval_ORGANIZATION_recall": 0.8666666666666667, + "eval_PERSON_f1": 0.8829431438127091, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8461538461538461, + "eval_PERSON_recall": 0.9230769230769231, + "eval_QUANTITY_f1": 0.6538461538461539, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.5862068965517241, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.8363636363636363, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.7931034482758621, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.2780083119869232, + "eval_overall_accuracy": 0.9602201651238429, + "eval_overall_f1": 0.8274894810659187, + "eval_overall_precision": 0.7887700534759359, + "eval_overall_recall": 0.8702064896755162, + "eval_runtime": 0.9675, + "eval_samples_per_second": 193.282, + "eval_steps_per_second": 3.101, "step": 1272 }, { "epoch": 13.0, - "grad_norm": 0.017983168363571167, - "learning_rate": 1.75e-05, - "loss": 0.0015, + "grad_norm": 3.4945220947265625, + "learning_rate": 4.35e-05, + "loss": 0.0037, "step": 1378 }, { "epoch": 13.0, - "eval_accuracy": 0.9604703527645734, - "eval_f1": 0.8333333333333335, - "eval_loss": 0.3068053126335144, - "eval_precision": 0.7874015748031497, - "eval_recall": 0.8849557522123894, - "eval_runtime": 0.902, - "eval_samples_per_second": 207.324, - "eval_steps_per_second": 3.326, + "eval_LOCATION_f1": 0.782051282051282, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7261904761904762, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.7417218543046358, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7368421052631579, + "eval_ORGANIZATION_recall": 0.7466666666666667, + "eval_PERSON_f1": 0.9163879598662208, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8782051282051282, + "eval_PERSON_recall": 0.958041958041958, + "eval_QUANTITY_f1": 0.72, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6666666666666666, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8727272727272727, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8275862068965517, + "eval_TIME_recall": 0.9230769230769231, + "eval_loss": 0.2757226526737213, + "eval_overall_accuracy": 0.9627220415311484, + "eval_overall_f1": 0.8326300984528833, + "eval_overall_precision": 0.7956989247311828, + "eval_overall_recall": 0.8731563421828908, + "eval_runtime": 0.9689, + "eval_samples_per_second": 193.003, + "eval_steps_per_second": 3.096, "step": 1378 }, { "epoch": 14.0, - "grad_norm": 0.011942153796553612, - "learning_rate": 1.5e-05, - "loss": 0.0012, + "grad_norm": 0.025552373379468918, + "learning_rate": 4.3e-05, + "loss": 0.005, "step": 1484 }, { "epoch": 14.0, - "eval_accuracy": 0.9577182887165374, - "eval_f1": 0.8326417704011065, - "eval_loss": 0.32863807678222656, - "eval_precision": 0.7838541666666666, - "eval_recall": 0.887905604719764, - "eval_runtime": 0.8986, - "eval_samples_per_second": 208.111, - "eval_steps_per_second": 3.339, + "eval_LOCATION_f1": 0.8243243243243243, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8026315789473685, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.7341772151898734, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.6987951807228916, + "eval_ORGANIZATION_recall": 0.7733333333333333, + "eval_PERSON_f1": 0.9023569023569024, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8701298701298701, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7169811320754716, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6333333333333333, + "eval_QUANTITY_recall": 0.8260869565217391, + "eval_TIME_f1": 0.8461538461538461, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8461538461538461, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.280028760433197, + "eval_overall_accuracy": 0.9594696022016512, + "eval_overall_f1": 0.8305084745762712, + "eval_overall_precision": 0.7967479674796748, + "eval_overall_recall": 0.8672566371681416, + "eval_runtime": 0.9073, + "eval_samples_per_second": 206.107, + "eval_steps_per_second": 3.307, "step": 1484 }, { "epoch": 15.0, - "grad_norm": 0.0062804995104670525, - "learning_rate": 1.25e-05, - "loss": 0.0006, + "grad_norm": 0.192918598651886, + "learning_rate": 4.25e-05, + "loss": 0.0058, "step": 1590 }, { "epoch": 15.0, - "eval_accuracy": 0.960720540405304, - "eval_f1": 0.840782122905028, - "eval_loss": 0.3137037754058838, - "eval_precision": 0.7984084880636605, - "eval_recall": 0.887905604719764, - "eval_runtime": 0.9082, - "eval_samples_per_second": 205.909, - "eval_steps_per_second": 3.303, + "eval_LOCATION_f1": 0.8356164383561645, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8243243243243243, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.7784431137724551, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7065217391304348, + "eval_ORGANIZATION_recall": 0.8666666666666667, + "eval_PERSON_f1": 0.8963210702341137, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8589743589743589, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.6666666666666666, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.64, + "eval_QUANTITY_recall": 0.6956521739130435, + "eval_TIME_f1": 0.8070175438596492, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.7419354838709677, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.2716998755931854, + "eval_overall_accuracy": 0.9629722291718789, + "eval_overall_f1": 0.8340306834030684, + "eval_overall_precision": 0.791005291005291, + "eval_overall_recall": 0.8820058997050148, + "eval_runtime": 0.91, + "eval_samples_per_second": 205.503, + "eval_steps_per_second": 3.297, "step": 1590 }, { "epoch": 16.0, - "grad_norm": 0.2206662893295288, - "learning_rate": 1e-05, - "loss": 0.0008, + "grad_norm": 0.09364385157823563, + "learning_rate": 4.2e-05, + "loss": 0.0046, "step": 1696 }, { "epoch": 16.0, - "eval_accuracy": 0.9617212909682261, - "eval_f1": 0.8382559774964837, - "eval_loss": 0.3065112233161926, - "eval_precision": 0.8010752688172043, - "eval_recall": 0.8790560471976401, - "eval_runtime": 0.9053, - "eval_samples_per_second": 206.56, - "eval_steps_per_second": 3.314, + "eval_LOCATION_f1": 0.816326530612245, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8, + "eval_LOCATION_recall": 0.8333333333333334, + "eval_ORGANIZATION_f1": 0.735632183908046, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.6464646464646465, + "eval_ORGANIZATION_recall": 0.8533333333333334, + "eval_PERSON_f1": 0.8993288590604027, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.864516129032258, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.6545454545454547, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.5625, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.7931034482758621, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.71875, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.30642953515052795, + "eval_overall_accuracy": 0.9539654741055792, + "eval_overall_f1": 0.8169398907103824, + "eval_overall_precision": 0.7608142493638677, + "eval_overall_recall": 0.8820058997050148, + "eval_runtime": 0.9036, + "eval_samples_per_second": 206.952, + "eval_steps_per_second": 3.32, "step": 1696 }, { "epoch": 17.0, - "grad_norm": 0.00254653743468225, - "learning_rate": 7.5e-06, - "loss": 0.0014, + "grad_norm": 4.5664825439453125, + "learning_rate": 4.15e-05, + "loss": 0.0063, "step": 1802 }, { "epoch": 17.0, - "eval_accuracy": 0.9589692269201902, - "eval_f1": 0.8365650969529086, - "eval_loss": 0.33052197098731995, - "eval_precision": 0.7885117493472585, - "eval_recall": 0.8908554572271387, - "eval_runtime": 0.9027, - "eval_samples_per_second": 207.161, - "eval_steps_per_second": 3.323, + "eval_LOCATION_f1": 0.7763157894736842, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7375, + "eval_LOCATION_recall": 0.8194444444444444, + "eval_ORGANIZATION_f1": 0.7922077922077922, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7721518987341772, + "eval_ORGANIZATION_recall": 0.8133333333333334, + "eval_PERSON_f1": 0.8940397350993377, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8490566037735849, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.6792452830188679, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.28576722741127014, + "eval_overall_accuracy": 0.9617212909682261, + "eval_overall_f1": 0.8263305322128851, + "eval_overall_precision": 0.7866666666666666, + "eval_overall_recall": 0.8702064896755162, + "eval_runtime": 0.9045, + "eval_samples_per_second": 206.753, + "eval_steps_per_second": 3.317, "step": 1802 }, { "epoch": 18.0, - "grad_norm": 0.0013508679112419486, - "learning_rate": 5e-06, - "loss": 0.0005, + "grad_norm": 0.04714202508330345, + "learning_rate": 4.1e-05, + "loss": 0.0033, "step": 1908 }, { "epoch": 18.0, - "eval_accuracy": 0.9597197898423818, - "eval_f1": 0.8344923504867873, - "eval_loss": 0.3244776129722595, - "eval_precision": 0.7894736842105263, - "eval_recall": 0.8849557522123894, - "eval_runtime": 0.8996, - "eval_samples_per_second": 207.879, - "eval_steps_per_second": 3.335, + "eval_LOCATION_f1": 0.8, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7692307692307693, + "eval_LOCATION_recall": 0.8333333333333334, + "eval_ORGANIZATION_f1": 0.779874213836478, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7380952380952381, + "eval_ORGANIZATION_recall": 0.8266666666666667, + "eval_PERSON_f1": 0.9006622516556291, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8553459119496856, + "eval_PERSON_recall": 0.951048951048951, + "eval_QUANTITY_f1": 0.6923076923076923, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6206896551724138, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8421052631578947, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.7741935483870968, + "eval_TIME_recall": 0.9230769230769231, + "eval_loss": 0.30405738949775696, + "eval_overall_accuracy": 0.9619714786089567, + "eval_overall_f1": 0.8333333333333335, + "eval_overall_precision": 0.7874015748031497, + "eval_overall_recall": 0.8849557522123894, + "eval_runtime": 0.903, + "eval_samples_per_second": 207.088, + "eval_steps_per_second": 3.322, "step": 1908 }, { "epoch": 19.0, - "grad_norm": 0.0013845202047377825, - "learning_rate": 2.5e-06, - "loss": 0.0004, + "grad_norm": 0.008477783761918545, + "learning_rate": 4.05e-05, + "loss": 0.0033, "step": 2014 }, { "epoch": 19.0, - "eval_accuracy": 0.9602201651238429, - "eval_f1": 0.8372739916550764, - "eval_loss": 0.32481154799461365, - "eval_precision": 0.7921052631578948, - "eval_recall": 0.887905604719764, - "eval_runtime": 0.9114, - "eval_samples_per_second": 205.168, - "eval_steps_per_second": 3.291, + "eval_LOCATION_f1": 0.8413793103448277, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8356164383561644, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.8101265822784811, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7710843373493976, + "eval_ORGANIZATION_recall": 0.8533333333333334, + "eval_PERSON_f1": 0.8979591836734694, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8741721854304636, + "eval_PERSON_recall": 0.9230769230769231, + "eval_QUANTITY_f1": 0.6923076923076923, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6206896551724138, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8148148148148148, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.7857142857142857, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3013346493244171, + "eval_overall_accuracy": 0.960720540405304, + "eval_overall_f1": 0.844950213371266, + "eval_overall_precision": 0.8159340659340659, + "eval_overall_recall": 0.8761061946902655, + "eval_runtime": 0.9229, + "eval_samples_per_second": 202.623, + "eval_steps_per_second": 3.251, "step": 2014 }, { "epoch": 20.0, - "grad_norm": 0.003232144983485341, - "learning_rate": 0.0, - "loss": 0.0003, + "grad_norm": 0.0049218675121665, + "learning_rate": 4e-05, + "loss": 0.0036, "step": 2120 }, { "epoch": 20.0, - "eval_accuracy": 0.9604703527645734, - "eval_f1": 0.8384401114206128, - "eval_loss": 0.3243328630924225, - "eval_precision": 0.7941952506596306, - "eval_recall": 0.887905604719764, - "eval_runtime": 0.9046, - "eval_samples_per_second": 206.727, - "eval_steps_per_second": 3.316, + "eval_LOCATION_f1": 0.8219178082191781, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8108108108108109, + "eval_LOCATION_recall": 0.8333333333333334, + "eval_ORGANIZATION_f1": 0.8, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7333333333333333, + "eval_ORGANIZATION_recall": 0.88, + "eval_PERSON_f1": 0.9023569023569024, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8701298701298701, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.6538461538461539, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.5862068965517241, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.2967695891857147, + "eval_overall_accuracy": 0.9609707280460346, + "eval_overall_f1": 0.8387096774193548, + "eval_overall_precision": 0.7994652406417112, + "eval_overall_recall": 0.8820058997050148, + "eval_runtime": 0.9818, + "eval_samples_per_second": 190.457, + "eval_steps_per_second": 3.055, "step": 2120 }, { - "epoch": 20.0, - "step": 2120, - "total_flos": 898035701398080.0, - "train_loss": 0.03343723254489168, - "train_runtime": 509.8629, - "train_samples_per_second": 66.175, - "train_steps_per_second": 4.158 + "epoch": 21.0, + "grad_norm": 0.03995713219046593, + "learning_rate": 3.9500000000000005e-05, + "loss": 0.0038, + "step": 2226 + }, + { + "epoch": 21.0, + "eval_LOCATION_f1": 0.7625899280575541, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7910447761194029, + "eval_LOCATION_recall": 0.7361111111111112, + "eval_ORGANIZATION_f1": 0.7374999999999999, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.6941176470588235, + "eval_ORGANIZATION_recall": 0.7866666666666666, + "eval_PERSON_f1": 0.9047619047619047, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8807947019867549, + "eval_PERSON_recall": 0.9300699300699301, + "eval_QUANTITY_f1": 0.7058823529411765, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6428571428571429, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.2894110381603241, + "eval_overall_accuracy": 0.9577182887165374, + "eval_overall_f1": 0.8177905308464849, + "eval_overall_precision": 0.7960893854748603, + "eval_overall_recall": 0.8407079646017699, + "eval_runtime": 0.9338, + "eval_samples_per_second": 200.266, + "eval_steps_per_second": 3.213, + "step": 2226 + }, + { + "epoch": 22.0, + "grad_norm": 0.001287546823732555, + "learning_rate": 3.9000000000000006e-05, + "loss": 0.004, + "step": 2332 + }, + { + "epoch": 22.0, + "eval_LOCATION_f1": 0.8266666666666667, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7948717948717948, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.7051282051282051, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.6790123456790124, + "eval_ORGANIZATION_recall": 0.7333333333333333, + "eval_PERSON_f1": 0.8986486486486487, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.869281045751634, + "eval_PERSON_recall": 0.9300699300699301, + "eval_QUANTITY_f1": 0.6792452830188679, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8461538461538461, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8461538461538461, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.29990673065185547, + "eval_overall_accuracy": 0.9554665999499625, + "eval_overall_f1": 0.8203677510608203, + "eval_overall_precision": 0.7880434782608695, + "eval_overall_recall": 0.855457227138643, + "eval_runtime": 0.9065, + "eval_samples_per_second": 206.288, + "eval_steps_per_second": 3.309, + "step": 2332 + }, + { + "epoch": 23.0, + "grad_norm": 0.01974656991660595, + "learning_rate": 3.85e-05, + "loss": 0.003, + "step": 2438 + }, + { + "epoch": 23.0, + "eval_LOCATION_f1": 0.8211920529801324, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7848101265822784, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.8074534161490684, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7558139534883721, + "eval_ORGANIZATION_recall": 0.8666666666666667, + "eval_PERSON_f1": 0.9084745762711864, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.881578947368421, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.6792452830188679, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3059156537055969, + "eval_overall_accuracy": 0.9622216662496873, + "eval_overall_f1": 0.8443197755960731, + "eval_overall_precision": 0.8048128342245989, + "eval_overall_recall": 0.887905604719764, + "eval_runtime": 0.9125, + "eval_samples_per_second": 204.922, + "eval_steps_per_second": 3.288, + "step": 2438 + }, + { + "epoch": 24.0, + "grad_norm": 2.60111141204834, + "learning_rate": 3.8e-05, + "loss": 0.0038, + "step": 2544 + }, + { + "epoch": 24.0, + "eval_LOCATION_f1": 0.8133333333333332, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.782051282051282, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.7471264367816093, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.6565656565656566, + "eval_ORGANIZATION_recall": 0.8666666666666667, + "eval_PERSON_f1": 0.9152542372881356, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8881578947368421, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.6792452830188679, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.7586206896551724, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3071446716785431, + "eval_overall_accuracy": 0.9582186639979985, + "eval_overall_f1": 0.828060522696011, + "eval_overall_precision": 0.7757731958762887, + "eval_overall_recall": 0.887905604719764, + "eval_runtime": 0.9115, + "eval_samples_per_second": 205.145, + "eval_steps_per_second": 3.291, + "step": 2544 + }, + { + "epoch": 25.0, + "grad_norm": 5.347325801849365, + "learning_rate": 3.7500000000000003e-05, + "loss": 0.0039, + "step": 2650 + }, + { + "epoch": 25.0, + "eval_LOCATION_f1": 0.7792207792207793, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7317073170731707, + "eval_LOCATION_recall": 0.8333333333333334, + "eval_ORGANIZATION_f1": 0.729559748427673, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.6904761904761905, + "eval_ORGANIZATION_recall": 0.7733333333333333, + "eval_PERSON_f1": 0.8993288590604027, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.864516129032258, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.6792452830188679, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8148148148148148, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.7857142857142857, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3066267967224121, + "eval_overall_accuracy": 0.9572179134350763, + "eval_overall_f1": 0.8133704735376045, + "eval_overall_precision": 0.7704485488126649, + "eval_overall_recall": 0.8613569321533924, + "eval_runtime": 0.909, + "eval_samples_per_second": 205.719, + "eval_steps_per_second": 3.3, + "step": 2650 + }, + { + "epoch": 26.0, + "grad_norm": 0.00547376973554492, + "learning_rate": 3.7e-05, + "loss": 0.0031, + "step": 2756 + }, + { + "epoch": 26.0, + "eval_LOCATION_f1": 0.8137931034482759, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8082191780821918, + "eval_LOCATION_recall": 0.8194444444444444, + "eval_ORGANIZATION_f1": 0.7701863354037267, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7209302325581395, + "eval_ORGANIZATION_recall": 0.8266666666666667, + "eval_PERSON_f1": 0.8837209302325583, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8417721518987342, + "eval_PERSON_recall": 0.9300699300699301, + "eval_QUANTITY_f1": 0.6923076923076923, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6206896551724138, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8679245283018868, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8518518518518519, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3245824873447418, + "eval_overall_accuracy": 0.9597197898423818, + "eval_overall_f1": 0.8286516853932584, + "eval_overall_precision": 0.7908847184986595, + "eval_overall_recall": 0.8702064896755162, + "eval_runtime": 0.9241, + "eval_samples_per_second": 202.35, + "eval_steps_per_second": 3.246, + "step": 2756 + }, + { + "epoch": 27.0, + "grad_norm": 0.009228230454027653, + "learning_rate": 3.65e-05, + "loss": 0.0026, + "step": 2862 + }, + { + "epoch": 27.0, + "eval_LOCATION_f1": 0.8219178082191781, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8108108108108109, + "eval_LOCATION_recall": 0.8333333333333334, + "eval_ORGANIZATION_f1": 0.7407407407407408, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.6896551724137931, + "eval_ORGANIZATION_recall": 0.8, + "eval_PERSON_f1": 0.903654485049834, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8607594936708861, + "eval_PERSON_recall": 0.951048951048951, + "eval_QUANTITY_f1": 0.7169811320754716, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6333333333333333, + "eval_QUANTITY_recall": 0.8260869565217391, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.32465118169784546, + "eval_overall_accuracy": 0.9584688516387291, + "eval_overall_f1": 0.8324022346368715, + "eval_overall_precision": 0.7904509283819628, + "eval_overall_recall": 0.8790560471976401, + "eval_runtime": 0.8984, + "eval_samples_per_second": 208.15, + "eval_steps_per_second": 3.339, + "step": 2862 + }, + { + "epoch": 28.0, + "grad_norm": 3.7562034130096436, + "learning_rate": 3.6e-05, + "loss": 0.0041, + "step": 2968 + }, + { + "epoch": 28.0, + "eval_LOCATION_f1": 0.8082191780821918, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7972972972972973, + "eval_LOCATION_recall": 0.8194444444444444, + "eval_ORGANIZATION_f1": 0.7469879518072289, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.6813186813186813, + "eval_ORGANIZATION_recall": 0.8266666666666667, + "eval_PERSON_f1": 0.9084745762711864, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.881578947368421, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.6923076923076923, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6206896551724138, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3042037785053253, + "eval_overall_accuracy": 0.9592194145609206, + "eval_overall_f1": 0.8286516853932584, + "eval_overall_precision": 0.7908847184986595, + "eval_overall_recall": 0.8702064896755162, + "eval_runtime": 0.9162, + "eval_samples_per_second": 204.094, + "eval_steps_per_second": 3.274, + "step": 2968 + }, + { + "epoch": 29.0, + "grad_norm": 5.308003902435303, + "learning_rate": 3.55e-05, + "loss": 0.0034, + "step": 3074 + }, + { + "epoch": 29.0, + "eval_LOCATION_f1": 0.8413793103448277, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8356164383561644, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.7975460122699386, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7386363636363636, + "eval_ORGANIZATION_recall": 0.8666666666666667, + "eval_PERSON_f1": 0.9146757679180888, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8933333333333333, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.6923076923076923, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6206896551724138, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8461538461538461, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8461538461538461, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3232886493206024, + "eval_overall_accuracy": 0.9609707280460346, + "eval_overall_f1": 0.851063829787234, + "eval_overall_precision": 0.819672131147541, + "eval_overall_recall": 0.8849557522123894, + "eval_runtime": 0.9849, + "eval_samples_per_second": 189.867, + "eval_steps_per_second": 3.046, + "step": 3074 + }, + { + "epoch": 30.0, + "grad_norm": 0.0021002369467169046, + "learning_rate": 3.5e-05, + "loss": 0.0027, + "step": 3180 + }, + { + "epoch": 30.0, + "eval_LOCATION_f1": 0.8356164383561645, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8243243243243243, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.732919254658385, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.686046511627907, + "eval_ORGANIZATION_recall": 0.7866666666666666, + "eval_PERSON_f1": 0.9121621621621621, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8823529411764706, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.7272727272727273, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.625, + "eval_QUANTITY_recall": 0.8695652173913043, + "eval_TIME_f1": 0.7586206896551724, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.6875, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.34255892038345337, + "eval_overall_accuracy": 0.9577182887165374, + "eval_overall_f1": 0.8296089385474861, + "eval_overall_precision": 0.7877984084880637, + "eval_overall_recall": 0.8761061946902655, + "eval_runtime": 0.9051, + "eval_samples_per_second": 206.618, + "eval_steps_per_second": 3.315, + "step": 3180 + }, + { + "epoch": 31.0, + "grad_norm": 0.00587083725258708, + "learning_rate": 3.45e-05, + "loss": 0.0049, + "step": 3286 + }, + { + "epoch": 31.0, + "eval_LOCATION_f1": 0.8219178082191781, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8108108108108109, + "eval_LOCATION_recall": 0.8333333333333334, + "eval_ORGANIZATION_f1": 0.7305389221556886, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.6630434782608695, + "eval_ORGANIZATION_recall": 0.8133333333333334, + "eval_PERSON_f1": 0.9152542372881356, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8881578947368421, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.6923076923076923, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6206896551724138, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8461538461538461, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8461538461538461, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.31757453083992004, + "eval_overall_accuracy": 0.9584688516387291, + "eval_overall_f1": 0.8314606741573034, + "eval_overall_precision": 0.7935656836461126, + "eval_overall_recall": 0.8731563421828908, + "eval_runtime": 0.9036, + "eval_samples_per_second": 206.959, + "eval_steps_per_second": 3.32, + "step": 3286 + }, + { + "epoch": 32.0, + "grad_norm": 0.03227420523762703, + "learning_rate": 3.4000000000000007e-05, + "loss": 0.0027, + "step": 3392 + }, + { + "epoch": 32.0, + "eval_LOCATION_f1": 0.8243243243243243, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8026315789473685, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.7625, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7176470588235294, + "eval_ORGANIZATION_recall": 0.8133333333333334, + "eval_PERSON_f1": 0.9215017064846417, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.9, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.7083333333333334, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.68, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.8846153846153846, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8846153846153846, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.29548466205596924, + "eval_overall_accuracy": 0.9627220415311484, + "eval_overall_f1": 0.8473609129814551, + "eval_overall_precision": 0.8204419889502762, + "eval_overall_recall": 0.8761061946902655, + "eval_runtime": 0.9155, + "eval_samples_per_second": 204.26, + "eval_steps_per_second": 3.277, + "step": 3392 + }, + { + "epoch": 33.0, + "grad_norm": 0.016770539805293083, + "learning_rate": 3.35e-05, + "loss": 0.0017, + "step": 3498 + }, + { + "epoch": 33.0, + "eval_LOCATION_f1": 0.8, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7692307692307693, + "eval_LOCATION_recall": 0.8333333333333334, + "eval_ORGANIZATION_f1": 0.7974683544303797, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7590361445783133, + "eval_ORGANIZATION_recall": 0.84, + "eval_PERSON_f1": 0.9054054054054055, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8758169934640523, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.6666666666666667, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.5806451612903226, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3393411338329315, + "eval_overall_accuracy": 0.9592194145609206, + "eval_overall_f1": 0.8354430379746836, + "eval_overall_precision": 0.7983870967741935, + "eval_overall_recall": 0.8761061946902655, + "eval_runtime": 0.9082, + "eval_samples_per_second": 205.908, + "eval_steps_per_second": 3.303, + "step": 3498 + }, + { + "epoch": 34.0, + "grad_norm": 0.003996172454208136, + "learning_rate": 3.3e-05, + "loss": 0.0017, + "step": 3604 + }, + { + "epoch": 34.0, + "eval_LOCATION_f1": 0.8243243243243243, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8026315789473685, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.8227848101265823, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7831325301204819, + "eval_ORGANIZATION_recall": 0.8666666666666667, + "eval_PERSON_f1": 0.910958904109589, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8926174496644296, + "eval_PERSON_recall": 0.9300699300699301, + "eval_QUANTITY_f1": 0.7555555555555555, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.7727272727272727, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.8461538461538461, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8461538461538461, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3279131352901459, + "eval_overall_accuracy": 0.9644733550162622, + "eval_overall_f1": 0.8575539568345324, + "eval_overall_precision": 0.8370786516853933, + "eval_overall_recall": 0.8790560471976401, + "eval_runtime": 0.9098, + "eval_samples_per_second": 205.55, + "eval_steps_per_second": 3.298, + "step": 3604 + }, + { + "epoch": 35.0, + "grad_norm": 0.0200356375426054, + "learning_rate": 3.2500000000000004e-05, + "loss": 0.002, + "step": 3710 + }, + { + "epoch": 35.0, + "eval_LOCATION_f1": 0.8108108108108109, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7894736842105263, + "eval_LOCATION_recall": 0.8333333333333334, + "eval_ORGANIZATION_f1": 0.8, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7333333333333333, + "eval_ORGANIZATION_recall": 0.88, + "eval_PERSON_f1": 0.9016949152542374, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.875, + "eval_PERSON_recall": 0.9300699300699301, + "eval_QUANTITY_f1": 0.6923076923076923, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6206896551724138, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8461538461538461, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8461538461538461, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.33025962114334106, + "eval_overall_accuracy": 0.9597197898423818, + "eval_overall_f1": 0.8398876404494382, + "eval_overall_precision": 0.8016085790884718, + "eval_overall_recall": 0.8820058997050148, + "eval_runtime": 0.9088, + "eval_samples_per_second": 205.758, + "eval_steps_per_second": 3.301, + "step": 3710 + }, + { + "epoch": 36.0, + "grad_norm": 0.04783305525779724, + "learning_rate": 3.2000000000000005e-05, + "loss": 0.0012, + "step": 3816 + }, + { + "epoch": 36.0, + "eval_LOCATION_f1": 0.8344370860927153, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7974683544303798, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.7875000000000001, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7411764705882353, + "eval_ORGANIZATION_recall": 0.84, + "eval_PERSON_f1": 0.9010238907849829, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.88, + "eval_PERSON_recall": 0.9230769230769231, + "eval_QUANTITY_f1": 0.72, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6666666666666666, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8461538461538461, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8461538461538461, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.33322834968566895, + "eval_overall_accuracy": 0.9637227920940705, + "eval_overall_f1": 0.8441926345609065, + "eval_overall_precision": 0.8119891008174387, + "eval_overall_recall": 0.8790560471976401, + "eval_runtime": 0.9959, + "eval_samples_per_second": 187.774, + "eval_steps_per_second": 3.012, + "step": 3816 + }, + { + "epoch": 37.0, + "grad_norm": 0.0011351928114891052, + "learning_rate": 3.15e-05, + "loss": 0.001, + "step": 3922 + }, + { + "epoch": 37.0, + "eval_LOCATION_f1": 0.816326530612245, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8, + "eval_LOCATION_recall": 0.8333333333333334, + "eval_ORGANIZATION_f1": 0.7710843373493976, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7032967032967034, + "eval_ORGANIZATION_recall": 0.8533333333333334, + "eval_PERSON_f1": 0.910958904109589, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8926174496644296, + "eval_PERSON_recall": 0.9300699300699301, + "eval_QUANTITY_f1": 0.72, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6666666666666666, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8235294117647058, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.84, + "eval_TIME_recall": 0.8076923076923077, + "eval_loss": 0.33810704946517944, + "eval_overall_accuracy": 0.9604703527645734, + "eval_overall_f1": 0.8385269121813032, + "eval_overall_precision": 0.8065395095367848, + "eval_overall_recall": 0.8731563421828908, + "eval_runtime": 0.9038, + "eval_samples_per_second": 206.905, + "eval_steps_per_second": 3.319, + "step": 3922 + }, + { + "epoch": 38.0, + "grad_norm": 12.923250198364258, + "learning_rate": 3.1e-05, + "loss": 0.0021, + "step": 4028 + }, + { + "epoch": 38.0, + "eval_LOCATION_f1": 0.816326530612245, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8, + "eval_LOCATION_recall": 0.8333333333333334, + "eval_ORGANIZATION_f1": 0.7721518987341773, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7349397590361446, + "eval_ORGANIZATION_recall": 0.8133333333333334, + "eval_PERSON_f1": 0.9158249158249158, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8831168831168831, + "eval_PERSON_recall": 0.951048951048951, + "eval_QUANTITY_f1": 0.7058823529411765, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6428571428571429, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8461538461538461, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8461538461538461, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3416782021522522, + "eval_overall_accuracy": 0.960720540405304, + "eval_overall_f1": 0.8425531914893618, + "eval_overall_precision": 0.8114754098360656, + "eval_overall_recall": 0.8761061946902655, + "eval_runtime": 0.9052, + "eval_samples_per_second": 206.591, + "eval_steps_per_second": 3.314, + "step": 4028 + }, + { + "epoch": 39.0, + "grad_norm": 0.05247601494193077, + "learning_rate": 3.05e-05, + "loss": 0.0026, + "step": 4134 + }, + { + "epoch": 39.0, + "eval_LOCATION_f1": 0.7891156462585034, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7733333333333333, + "eval_LOCATION_recall": 0.8055555555555556, + "eval_ORGANIZATION_f1": 0.7974683544303797, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7590361445783133, + "eval_ORGANIZATION_recall": 0.84, + "eval_PERSON_f1": 0.8963210702341137, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8589743589743589, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7169811320754716, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6333333333333333, + "eval_QUANTITY_recall": 0.8260869565217391, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.37723416090011597, + "eval_overall_accuracy": 0.9587190392794596, + "eval_overall_f1": 0.8338028169014085, + "eval_overall_precision": 0.7978436657681941, + "eval_overall_recall": 0.8731563421828908, + "eval_runtime": 0.9093, + "eval_samples_per_second": 205.644, + "eval_steps_per_second": 3.299, + "step": 4134 + }, + { + "epoch": 40.0, + "grad_norm": 0.0038078853394836187, + "learning_rate": 3e-05, + "loss": 0.0021, + "step": 4240 + }, + { + "epoch": 40.0, + "eval_LOCATION_f1": 0.7891156462585034, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7733333333333333, + "eval_LOCATION_recall": 0.8055555555555556, + "eval_ORGANIZATION_f1": 0.7894736842105264, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7792207792207793, + "eval_ORGANIZATION_recall": 0.8, + "eval_PERSON_f1": 0.9146757679180888, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8933333333333333, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7272727272727272, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.7619047619047619, + "eval_QUANTITY_recall": 0.6956521739130435, + "eval_TIME_f1": 0.8, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.7586206896551724, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.331974595785141, + "eval_overall_accuracy": 0.960720540405304, + "eval_overall_f1": 0.8393632416787264, + "eval_overall_precision": 0.8238636363636364, + "eval_overall_recall": 0.855457227138643, + "eval_runtime": 0.902, + "eval_samples_per_second": 207.323, + "eval_steps_per_second": 3.326, + "step": 4240 + }, + { + "epoch": 41.0, + "grad_norm": 0.0014568913029506803, + "learning_rate": 2.95e-05, + "loss": 0.0013, + "step": 4346 + }, + { + "epoch": 41.0, + "eval_LOCATION_f1": 0.8187919463087249, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7922077922077922, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.7425149700598803, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.6739130434782609, + "eval_ORGANIZATION_recall": 0.8266666666666667, + "eval_PERSON_f1": 0.9090909090909092, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8766233766233766, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.76, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.7037037037037037, + "eval_QUANTITY_recall": 0.8260869565217391, + "eval_TIME_f1": 0.8627450980392156, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.88, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3371780812740326, + "eval_overall_accuracy": 0.9619714786089567, + "eval_overall_f1": 0.8375350140056023, + "eval_overall_precision": 0.7973333333333333, + "eval_overall_recall": 0.8820058997050148, + "eval_runtime": 0.9175, + "eval_samples_per_second": 203.81, + "eval_steps_per_second": 3.27, + "step": 4346 + }, + { + "epoch": 42.0, + "grad_norm": 0.01008665468543768, + "learning_rate": 2.9e-05, + "loss": 0.0013, + "step": 4452 + }, + { + "epoch": 42.0, + "eval_LOCATION_f1": 0.7837837837837838, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7631578947368421, + "eval_LOCATION_recall": 0.8055555555555556, + "eval_ORGANIZATION_f1": 0.779874213836478, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7380952380952381, + "eval_ORGANIZATION_recall": 0.8266666666666667, + "eval_PERSON_f1": 0.9023569023569024, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8701298701298701, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.72, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6666666666666666, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3549456298351288, + "eval_overall_accuracy": 0.9602201651238429, + "eval_overall_f1": 0.8333333333333334, + "eval_overall_precision": 0.7994579945799458, + "eval_overall_recall": 0.8702064896755162, + "eval_runtime": 0.9061, + "eval_samples_per_second": 206.389, + "eval_steps_per_second": 3.311, + "step": 4452 + }, + { + "epoch": 43.0, + "grad_norm": 0.0012029644567519426, + "learning_rate": 2.8499999999999998e-05, + "loss": 0.0003, + "step": 4558 + }, + { + "epoch": 43.0, + "eval_LOCATION_f1": 0.8, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7469879518072289, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.7682926829268292, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7078651685393258, + "eval_ORGANIZATION_recall": 0.84, + "eval_PERSON_f1": 0.9060402684563759, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8709677419354839, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.7058823529411765, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6428571428571429, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8846153846153846, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8846153846153846, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.36216506361961365, + "eval_overall_accuracy": 0.9604703527645734, + "eval_overall_f1": 0.836111111111111, + "eval_overall_precision": 0.7900262467191601, + "eval_overall_recall": 0.887905604719764, + "eval_runtime": 0.9049, + "eval_samples_per_second": 206.658, + "eval_steps_per_second": 3.315, + "step": 4558 + }, + { + "epoch": 44.0, + "grad_norm": 0.04154082387685776, + "learning_rate": 2.8000000000000003e-05, + "loss": 0.0032, + "step": 4664 + }, + { + "epoch": 44.0, + "eval_LOCATION_f1": 0.8026315789473685, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7625, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.7619047619047621, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.6881720430107527, + "eval_ORGANIZATION_recall": 0.8533333333333334, + "eval_PERSON_f1": 0.9060402684563759, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8709677419354839, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.7307692307692308, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6551724137931034, + "eval_QUANTITY_recall": 0.8260869565217391, + "eval_TIME_f1": 0.8148148148148148, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.7857142857142857, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.35855501890182495, + "eval_overall_accuracy": 0.957968476357268, + "eval_overall_f1": 0.8314917127071824, + "eval_overall_precision": 0.7818181818181819, + "eval_overall_recall": 0.887905604719764, + "eval_runtime": 0.9082, + "eval_samples_per_second": 205.905, + "eval_steps_per_second": 3.303, + "step": 4664 + }, + { + "epoch": 45.0, + "grad_norm": 0.002047579735517502, + "learning_rate": 2.7500000000000004e-05, + "loss": 0.001, + "step": 4770 + }, + { + "epoch": 45.0, + "eval_LOCATION_f1": 0.8133333333333332, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.782051282051282, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.7950310559006211, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7441860465116279, + "eval_ORGANIZATION_recall": 0.8533333333333334, + "eval_PERSON_f1": 0.9158249158249158, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8831168831168831, + "eval_PERSON_recall": 0.951048951048951, + "eval_QUANTITY_f1": 0.7307692307692308, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6551724137931034, + "eval_QUANTITY_recall": 0.8260869565217391, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.36997854709625244, + "eval_overall_accuracy": 0.9619714786089567, + "eval_overall_f1": 0.847124824684432, + "eval_overall_precision": 0.8074866310160428, + "eval_overall_recall": 0.8908554572271387, + "eval_runtime": 0.9062, + "eval_samples_per_second": 206.36, + "eval_steps_per_second": 3.311, + "step": 4770 + }, + { + "epoch": 46.0, + "grad_norm": 0.0037038603331893682, + "learning_rate": 2.7000000000000002e-05, + "loss": 0.0034, + "step": 4876 + }, + { + "epoch": 46.0, + "eval_LOCATION_f1": 0.8333333333333334, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8333333333333334, + "eval_LOCATION_recall": 0.8333333333333334, + "eval_ORGANIZATION_f1": 0.7924528301886793, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.75, + "eval_ORGANIZATION_recall": 0.84, + "eval_PERSON_f1": 0.9121621621621621, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8823529411764706, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.7307692307692308, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6551724137931034, + "eval_QUANTITY_recall": 0.8260869565217391, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.33895859122276306, + "eval_overall_accuracy": 0.9602201651238429, + "eval_overall_f1": 0.8494318181818181, + "eval_overall_precision": 0.8191780821917808, + "eval_overall_recall": 0.8820058997050148, + "eval_runtime": 0.9121, + "eval_samples_per_second": 205.028, + "eval_steps_per_second": 3.289, + "step": 4876 + }, + { + "epoch": 47.0, + "grad_norm": 0.0005634190747514367, + "learning_rate": 2.6500000000000004e-05, + "loss": 0.0018, + "step": 4982 + }, + { + "epoch": 47.0, + "eval_LOCATION_f1": 0.8211920529801324, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7848101265822784, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.7564102564102564, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7283950617283951, + "eval_ORGANIZATION_recall": 0.7866666666666666, + "eval_PERSON_f1": 0.9060402684563759, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8709677419354839, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.72, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6666666666666666, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8461538461538461, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8461538461538461, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3375060260295868, + "eval_overall_accuracy": 0.9632224168126094, + "eval_overall_f1": 0.8373408769448375, + "eval_overall_precision": 0.8043478260869565, + "eval_overall_recall": 0.8731563421828908, + "eval_runtime": 0.9199, + "eval_samples_per_second": 203.274, + "eval_steps_per_second": 3.261, + "step": 4982 + }, + { + "epoch": 48.0, + "grad_norm": 0.0028315193485468626, + "learning_rate": 2.6000000000000002e-05, + "loss": 0.0017, + "step": 5088 + }, + { + "epoch": 48.0, + "eval_LOCATION_f1": 0.802721088435374, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7866666666666666, + "eval_LOCATION_recall": 0.8194444444444444, + "eval_ORGANIZATION_f1": 0.7974683544303797, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7590361445783133, + "eval_ORGANIZATION_recall": 0.84, + "eval_PERSON_f1": 0.9183673469387755, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8940397350993378, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.72, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6666666666666666, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8461538461538461, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8461538461538461, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.33102044463157654, + "eval_overall_accuracy": 0.9632224168126094, + "eval_overall_f1": 0.8473609129814551, + "eval_overall_precision": 0.8204419889502762, + "eval_overall_recall": 0.8761061946902655, + "eval_runtime": 0.9017, + "eval_samples_per_second": 207.378, + "eval_steps_per_second": 3.327, + "step": 5088 + }, + { + "epoch": 49.0, + "grad_norm": 0.009939000010490417, + "learning_rate": 2.5500000000000003e-05, + "loss": 0.0014, + "step": 5194 + }, + { + "epoch": 49.0, + "eval_LOCATION_f1": 0.8299319727891157, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8133333333333334, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.8074534161490684, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7558139534883721, + "eval_ORGANIZATION_recall": 0.8666666666666667, + "eval_PERSON_f1": 0.9121621621621621, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8823529411764706, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.7450980392156864, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6785714285714286, + "eval_QUANTITY_recall": 0.8260869565217391, + "eval_TIME_f1": 0.8627450980392156, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.88, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.32123759388923645, + "eval_overall_accuracy": 0.9624718538904178, + "eval_overall_f1": 0.8555240793201133, + "eval_overall_precision": 0.8228882833787466, + "eval_overall_recall": 0.8908554572271387, + "eval_runtime": 0.9187, + "eval_samples_per_second": 203.539, + "eval_steps_per_second": 3.265, + "step": 5194 + }, + { + "epoch": 50.0, + "grad_norm": 0.7588798403739929, + "learning_rate": 2.5e-05, + "loss": 0.0011, + "step": 5300 + }, + { + "epoch": 50.0, + "eval_LOCATION_f1": 0.802721088435374, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7866666666666666, + "eval_LOCATION_recall": 0.8194444444444444, + "eval_ORGANIZATION_f1": 0.7924528301886793, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.75, + "eval_ORGANIZATION_recall": 0.84, + "eval_PERSON_f1": 0.9152542372881356, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8881578947368421, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.72, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6666666666666666, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3109734356403351, + "eval_overall_accuracy": 0.9622216662496873, + "eval_overall_f1": 0.8453900709219858, + "eval_overall_precision": 0.8142076502732241, + "eval_overall_recall": 0.8790560471976401, + "eval_runtime": 0.9093, + "eval_samples_per_second": 205.655, + "eval_steps_per_second": 3.299, + "step": 5300 + }, + { + "epoch": 51.0, + "grad_norm": 0.0009810138726606965, + "learning_rate": 2.45e-05, + "loss": 0.0005, + "step": 5406 + }, + { + "epoch": 51.0, + "eval_LOCATION_f1": 0.8299319727891157, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8133333333333334, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.825, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7764705882352941, + "eval_ORGANIZATION_recall": 0.88, + "eval_PERSON_f1": 0.9246575342465754, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.9060402684563759, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.7058823529411765, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6428571428571429, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.30816784501075745, + "eval_overall_accuracy": 0.9659744808606455, + "eval_overall_f1": 0.8607954545454546, + "eval_overall_precision": 0.8301369863013699, + "eval_overall_recall": 0.8938053097345132, + "eval_runtime": 0.914, + "eval_samples_per_second": 204.601, + "eval_steps_per_second": 3.282, + "step": 5406 + }, + { + "epoch": 52.0, + "grad_norm": 0.0026644645258784294, + "learning_rate": 2.4e-05, + "loss": 0.0003, + "step": 5512 + }, + { + "epoch": 52.0, + "eval_LOCATION_f1": 0.8157894736842106, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.775, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.8024691358024691, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7471264367816092, + "eval_ORGANIZATION_recall": 0.8666666666666667, + "eval_PERSON_f1": 0.9183673469387755, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8940397350993378, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.693877551020408, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6538461538461539, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3176332414150238, + "eval_overall_accuracy": 0.9647235426569928, + "eval_overall_f1": 0.849507735583685, + "eval_overall_precision": 0.8118279569892473, + "eval_overall_recall": 0.8908554572271387, + "eval_runtime": 0.9767, + "eval_samples_per_second": 191.467, + "eval_steps_per_second": 3.072, + "step": 5512 + }, + { + "epoch": 53.0, + "grad_norm": 0.0603233277797699, + "learning_rate": 2.35e-05, + "loss": 0.0004, + "step": 5618 + }, + { + "epoch": 53.0, + "eval_LOCATION_f1": 0.8356164383561645, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8243243243243243, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.8121212121212122, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7444444444444445, + "eval_ORGANIZATION_recall": 0.8933333333333333, + "eval_PERSON_f1": 0.9215017064846417, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.9, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.68, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6296296296296297, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3314068019390106, + "eval_overall_accuracy": 0.9647235426569928, + "eval_overall_f1": 0.8559322033898304, + "eval_overall_precision": 0.8211382113821138, + "eval_overall_recall": 0.8938053097345132, + "eval_runtime": 0.9085, + "eval_samples_per_second": 205.826, + "eval_steps_per_second": 3.302, + "step": 5618 + }, + { + "epoch": 54.0, + "grad_norm": 0.00044817946036346257, + "learning_rate": 2.3000000000000003e-05, + "loss": 0.0002, + "step": 5724 + }, + { + "epoch": 54.0, + "eval_LOCATION_f1": 0.8211920529801324, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7848101265822784, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.8050314465408804, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7619047619047619, + "eval_ORGANIZATION_recall": 0.8533333333333334, + "eval_PERSON_f1": 0.925170068027211, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.9006622516556292, + "eval_PERSON_recall": 0.951048951048951, + "eval_QUANTITY_f1": 0.693877551020408, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6538461538461539, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3241828978061676, + "eval_overall_accuracy": 0.9657242932199149, + "eval_overall_f1": 0.8543140028288544, + "eval_overall_precision": 0.8206521739130435, + "eval_overall_recall": 0.8908554572271387, + "eval_runtime": 0.9117, + "eval_samples_per_second": 205.114, + "eval_steps_per_second": 3.291, + "step": 5724 + }, + { + "epoch": 55.0, + "grad_norm": 0.0010649035684764385, + "learning_rate": 2.25e-05, + "loss": 0.0005, + "step": 5830 + }, + { + "epoch": 55.0, + "eval_LOCATION_f1": 0.8289473684210527, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7875, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.7875000000000001, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7411764705882353, + "eval_ORGANIZATION_recall": 0.84, + "eval_PERSON_f1": 0.9220338983050849, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8947368421052632, + "eval_PERSON_recall": 0.951048951048951, + "eval_QUANTITY_f1": 0.68, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6296296296296297, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.33954718708992004, + "eval_overall_accuracy": 0.9627220415311484, + "eval_overall_f1": 0.849507735583685, + "eval_overall_precision": 0.8118279569892473, + "eval_overall_recall": 0.8908554572271387, + "eval_runtime": 0.9361, + "eval_samples_per_second": 199.766, + "eval_steps_per_second": 3.205, + "step": 5830 + }, + { + "epoch": 56.0, + "grad_norm": 0.0006854601670056581, + "learning_rate": 2.2000000000000003e-05, + "loss": 0.0001, + "step": 5936 + }, + { + "epoch": 56.0, + "eval_LOCATION_f1": 0.8289473684210527, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7875, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.7826086956521738, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7325581395348837, + "eval_ORGANIZATION_recall": 0.84, + "eval_PERSON_f1": 0.925170068027211, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.9006622516556292, + "eval_PERSON_recall": 0.951048951048951, + "eval_QUANTITY_f1": 0.7083333333333334, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.68, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3326149582862854, + "eval_overall_accuracy": 0.9647235426569928, + "eval_overall_f1": 0.8519040902679831, + "eval_overall_precision": 0.8162162162162162, + "eval_overall_recall": 0.8908554572271387, + "eval_runtime": 0.9055, + "eval_samples_per_second": 206.509, + "eval_steps_per_second": 3.313, + "step": 5936 + }, + { + "epoch": 57.0, + "grad_norm": 0.0004171407490503043, + "learning_rate": 2.15e-05, + "loss": 0.0008, + "step": 6042 + }, + { + "epoch": 57.0, + "eval_LOCATION_f1": 0.8211920529801324, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7848101265822784, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.7950310559006211, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7441860465116279, + "eval_ORGANIZATION_recall": 0.8533333333333334, + "eval_PERSON_f1": 0.9090909090909092, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8766233766233766, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.68, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6296296296296297, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.8679245283018868, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8518518518518519, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3388373553752899, + "eval_overall_accuracy": 0.9639729797348011, + "eval_overall_f1": 0.8455056179775281, + "eval_overall_precision": 0.806970509383378, + "eval_overall_recall": 0.887905604719764, + "eval_runtime": 0.9161, + "eval_samples_per_second": 204.134, + "eval_steps_per_second": 3.275, + "step": 6042 + }, + { + "epoch": 58.0, + "grad_norm": 0.000792400271166116, + "learning_rate": 2.1e-05, + "loss": 0.0005, + "step": 6148 + }, + { + "epoch": 58.0, + "eval_LOCATION_f1": 0.8344370860927153, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7974683544303798, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.8121212121212122, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7444444444444445, + "eval_ORGANIZATION_recall": 0.8933333333333333, + "eval_PERSON_f1": 0.8993288590604027, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.864516129032258, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.693877551020408, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6538461538461539, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3484926223754883, + "eval_overall_accuracy": 0.9622216662496873, + "eval_overall_f1": 0.8479776847977685, + "eval_overall_precision": 0.8042328042328042, + "eval_overall_recall": 0.8967551622418879, + "eval_runtime": 0.9061, + "eval_samples_per_second": 206.382, + "eval_steps_per_second": 3.311, + "step": 6148 + }, + { + "epoch": 59.0, + "grad_norm": 0.0005213640397414565, + "learning_rate": 2.05e-05, + "loss": 0.0004, + "step": 6254 + }, + { + "epoch": 59.0, + "eval_LOCATION_f1": 0.8211920529801324, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7848101265822784, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.7950310559006211, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7441860465116279, + "eval_ORGANIZATION_recall": 0.8533333333333334, + "eval_PERSON_f1": 0.9215017064846417, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.9, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.6666666666666666, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6071428571428571, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.8627450980392156, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.88, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.34474921226501465, + "eval_overall_accuracy": 0.9627220415311484, + "eval_overall_f1": 0.8486562942008488, + "eval_overall_precision": 0.8152173913043478, + "eval_overall_recall": 0.8849557522123894, + "eval_runtime": 0.9086, + "eval_samples_per_second": 205.807, + "eval_steps_per_second": 3.302, + "step": 6254 + }, + { + "epoch": 60.0, + "grad_norm": 0.0031596734188497066, + "learning_rate": 2e-05, + "loss": 0.0017, + "step": 6360 + }, + { + "epoch": 60.0, + "eval_LOCATION_f1": 0.8289473684210527, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7875, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.783625730994152, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.6979166666666666, + "eval_ORGANIZATION_recall": 0.8933333333333333, + "eval_PERSON_f1": 0.8993288590604027, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.864516129032258, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.6666666666666667, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.5806451612903226, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8461538461538461, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8461538461538461, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3943552076816559, + "eval_overall_accuracy": 0.9559669752314236, + "eval_overall_f1": 0.8363136176066025, + "eval_overall_precision": 0.7835051546391752, + "eval_overall_recall": 0.8967551622418879, + "eval_runtime": 0.9068, + "eval_samples_per_second": 206.222, + "eval_steps_per_second": 3.308, + "step": 6360 + }, + { + "epoch": 61.0, + "grad_norm": 0.0038910319563001394, + "learning_rate": 1.9500000000000003e-05, + "loss": 0.0002, + "step": 6466 + }, + { + "epoch": 61.0, + "eval_LOCATION_f1": 0.8322147651006712, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8051948051948052, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.8, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7333333333333333, + "eval_ORGANIZATION_recall": 0.88, + "eval_PERSON_f1": 0.8963210702341137, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8589743589743589, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7346938775510203, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6923076923076923, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.38600656390190125, + "eval_overall_accuracy": 0.9599699774831123, + "eval_overall_f1": 0.8447552447552448, + "eval_overall_precision": 0.8031914893617021, + "eval_overall_recall": 0.8908554572271387, + "eval_runtime": 0.9064, + "eval_samples_per_second": 206.303, + "eval_steps_per_second": 3.31, + "step": 6466 + }, + { + "epoch": 62.0, + "grad_norm": 0.008979488164186478, + "learning_rate": 1.9e-05, + "loss": 0.0001, + "step": 6572 + }, + { + "epoch": 62.0, + "eval_LOCATION_f1": 0.8187919463087249, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7922077922077922, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.8176100628930819, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7738095238095238, + "eval_ORGANIZATION_recall": 0.8666666666666667, + "eval_PERSON_f1": 0.9047619047619047, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8807947019867549, + "eval_PERSON_recall": 0.9300699300699301, + "eval_QUANTITY_f1": 0.7083333333333334, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.68, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3512948453426361, + "eval_overall_accuracy": 0.9629722291718789, + "eval_overall_f1": 0.8477951635846371, + "eval_overall_precision": 0.8186813186813187, + "eval_overall_recall": 0.8790560471976401, + "eval_runtime": 0.9032, + "eval_samples_per_second": 207.035, + "eval_steps_per_second": 3.321, + "step": 6572 + }, + { + "epoch": 63.0, + "grad_norm": 0.00276816263794899, + "learning_rate": 1.85e-05, + "loss": 0.0013, + "step": 6678 + }, + { + "epoch": 63.0, + "eval_LOCATION_f1": 0.8289473684210527, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7875, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.7904191616766466, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.717391304347826, + "eval_ORGANIZATION_recall": 0.88, + "eval_PERSON_f1": 0.9060402684563759, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8709677419354839, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.7083333333333334, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.68, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3540952205657959, + "eval_overall_accuracy": 0.9629722291718789, + "eval_overall_f1": 0.8440111420612812, + "eval_overall_precision": 0.7994722955145118, + "eval_overall_recall": 0.8938053097345132, + "eval_runtime": 0.9089, + "eval_samples_per_second": 205.74, + "eval_steps_per_second": 3.301, + "step": 6678 + }, + { + "epoch": 64.0, + "grad_norm": 0.010789873078465462, + "learning_rate": 1.8e-05, + "loss": 0.0007, + "step": 6784 + }, + { + "epoch": 64.0, + "eval_LOCATION_f1": 0.779874213836478, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7126436781609196, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.7848101265822784, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7469879518072289, + "eval_ORGANIZATION_recall": 0.8266666666666667, + "eval_PERSON_f1": 0.9090909090909092, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8766233766233766, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.7058823529411765, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6428571428571429, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.34456735849380493, + "eval_overall_accuracy": 0.9619714786089567, + "eval_overall_f1": 0.8344923504867873, + "eval_overall_precision": 0.7894736842105263, + "eval_overall_recall": 0.8849557522123894, + "eval_runtime": 0.9096, + "eval_samples_per_second": 205.587, + "eval_steps_per_second": 3.298, + "step": 6784 + }, + { + "epoch": 65.0, + "grad_norm": 0.0003090931277256459, + "learning_rate": 1.75e-05, + "loss": 0.0008, + "step": 6890 + }, + { + "epoch": 65.0, + "eval_LOCATION_f1": 0.8181818181818181, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7682926829268293, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.782051282051282, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7530864197530864, + "eval_ORGANIZATION_recall": 0.8133333333333334, + "eval_PERSON_f1": 0.9084745762711864, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.881578947368421, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7346938775510203, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6923076923076923, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3443866968154907, + "eval_overall_accuracy": 0.9629722291718789, + "eval_overall_f1": 0.8429985855728431, + "eval_overall_precision": 0.8097826086956522, + "eval_overall_recall": 0.8790560471976401, + "eval_runtime": 0.906, + "eval_samples_per_second": 206.397, + "eval_steps_per_second": 3.311, + "step": 6890 + }, + { + "epoch": 66.0, + "grad_norm": 0.008000018075108528, + "learning_rate": 1.7000000000000003e-05, + "loss": 0.0007, + "step": 6996 + }, + { + "epoch": 66.0, + "eval_LOCATION_f1": 0.823529411764706, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7777777777777778, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.7564102564102564, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7283950617283951, + "eval_ORGANIZATION_recall": 0.7866666666666666, + "eval_PERSON_f1": 0.9121621621621621, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8823529411764706, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.7083333333333334, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.68, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3399989902973175, + "eval_overall_accuracy": 0.9627220415311484, + "eval_overall_f1": 0.8385269121813032, + "eval_overall_precision": 0.8065395095367848, + "eval_overall_recall": 0.8731563421828908, + "eval_runtime": 0.9215, + "eval_samples_per_second": 202.925, + "eval_steps_per_second": 3.255, + "step": 6996 + }, + { + "epoch": 67.0, + "grad_norm": 0.00037926252116449177, + "learning_rate": 1.65e-05, + "loss": 0.0004, + "step": 7102 + }, + { + "epoch": 67.0, + "eval_LOCATION_f1": 0.8289473684210527, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7875, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.8148148148148148, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7586206896551724, + "eval_ORGANIZATION_recall": 0.88, + "eval_PERSON_f1": 0.9090909090909092, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8766233766233766, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3691372275352478, + "eval_overall_accuracy": 0.96347260445334, + "eval_overall_f1": 0.853932584269663, + "eval_overall_precision": 0.8150134048257373, + "eval_overall_recall": 0.8967551622418879, + "eval_runtime": 0.9131, + "eval_samples_per_second": 204.802, + "eval_steps_per_second": 3.286, + "step": 7102 + }, + { + "epoch": 68.0, + "grad_norm": 0.0003724870621226728, + "learning_rate": 1.6000000000000003e-05, + "loss": 0.0012, + "step": 7208 + }, + { + "epoch": 68.0, + "eval_LOCATION_f1": 0.8322147651006712, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8051948051948052, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.8280254777070064, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7926829268292683, + "eval_ORGANIZATION_recall": 0.8666666666666667, + "eval_PERSON_f1": 0.9121621621621621, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8823529411764706, + "eval_PERSON_recall": 0.9440559440559441, + "eval_QUANTITY_f1": 0.7083333333333334, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.68, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.8627450980392156, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.88, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.33306267857551575, + "eval_overall_accuracy": 0.9654741055791843, + "eval_overall_f1": 0.8587731811697574, + "eval_overall_precision": 0.8314917127071824, + "eval_overall_recall": 0.887905604719764, + "eval_runtime": 0.9838, + "eval_samples_per_second": 190.074, + "eval_steps_per_second": 3.049, + "step": 7208 + }, + { + "epoch": 69.0, + "grad_norm": 0.0002074290969176218, + "learning_rate": 1.55e-05, + "loss": 0.0003, + "step": 7314 + }, + { + "epoch": 69.0, + "eval_LOCATION_f1": 0.8344370860927153, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7974683544303798, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.8170731707317072, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7528089887640449, + "eval_ORGANIZATION_recall": 0.8933333333333333, + "eval_PERSON_f1": 0.9054054054054055, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8758169934640523, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8461538461538461, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8461538461538461, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.373975545167923, + "eval_overall_accuracy": 0.96347260445334, + "eval_overall_f1": 0.8551336146272857, + "eval_overall_precision": 0.8172043010752689, + "eval_overall_recall": 0.8967551622418879, + "eval_runtime": 0.9156, + "eval_samples_per_second": 204.238, + "eval_steps_per_second": 3.277, + "step": 7314 + }, + { + "epoch": 70.0, + "grad_norm": 0.00042664690408855677, + "learning_rate": 1.5e-05, + "loss": 0.0001, + "step": 7420 + }, + { + "epoch": 70.0, + "eval_LOCATION_f1": 0.8211920529801324, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7848101265822784, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.8025477707006369, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7682926829268293, + "eval_ORGANIZATION_recall": 0.84, + "eval_PERSON_f1": 0.9054054054054055, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8758169934640523, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8461538461538461, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8461538461538461, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.37100422382354736, + "eval_overall_accuracy": 0.96347260445334, + "eval_overall_f1": 0.8494318181818181, + "eval_overall_precision": 0.8191780821917808, + "eval_overall_recall": 0.8820058997050148, + "eval_runtime": 0.9101, + "eval_samples_per_second": 205.482, + "eval_steps_per_second": 3.297, + "step": 7420 + }, + { + "epoch": 71.0, + "grad_norm": 0.0007093641324900091, + "learning_rate": 1.45e-05, + "loss": 0.0002, + "step": 7526 + }, + { + "epoch": 71.0, + "eval_LOCATION_f1": 0.8266666666666667, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7948717948717948, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.8101265822784811, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7710843373493976, + "eval_ORGANIZATION_recall": 0.8533333333333334, + "eval_PERSON_f1": 0.91156462585034, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8874172185430463, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7083333333333334, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.68, + "eval_QUANTITY_recall": 0.7391304347826086, + "eval_TIME_f1": 0.8461538461538461, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8461538461538461, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3477381467819214, + "eval_overall_accuracy": 0.9647235426569928, + "eval_overall_f1": 0.8518518518518517, + "eval_overall_precision": 0.8236914600550964, + "eval_overall_recall": 0.8820058997050148, + "eval_runtime": 0.9072, + "eval_samples_per_second": 206.129, + "eval_steps_per_second": 3.307, + "step": 7526 + }, + { + "epoch": 72.0, + "grad_norm": 0.00021990617096889764, + "learning_rate": 1.4000000000000001e-05, + "loss": 0.0002, + "step": 7632 + }, + { + "epoch": 72.0, + "eval_LOCATION_f1": 0.823529411764706, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7777777777777778, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.7950310559006211, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7441860465116279, + "eval_ORGANIZATION_recall": 0.8533333333333334, + "eval_PERSON_f1": 0.9084745762711864, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.881578947368421, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.36287015676498413, + "eval_overall_accuracy": 0.9642231673755316, + "eval_overall_f1": 0.8478873239436621, + "eval_overall_precision": 0.8113207547169812, + "eval_overall_recall": 0.887905604719764, + "eval_runtime": 0.9141, + "eval_samples_per_second": 204.572, + "eval_steps_per_second": 3.282, + "step": 7632 + }, + { + "epoch": 73.0, + "grad_norm": 0.00021961626771371812, + "learning_rate": 1.3500000000000001e-05, + "loss": 0.0002, + "step": 7738 + }, + { + "epoch": 73.0, + "eval_LOCATION_f1": 0.8181818181818181, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7682926829268293, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.7643312101910827, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7317073170731707, + "eval_ORGANIZATION_recall": 0.8, + "eval_PERSON_f1": 0.91156462585034, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8874172185430463, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3637426495552063, + "eval_overall_accuracy": 0.9639729797348011, + "eval_overall_f1": 0.8413597733711049, + "eval_overall_precision": 0.8092643051771117, + "eval_overall_recall": 0.8761061946902655, + "eval_runtime": 0.909, + "eval_samples_per_second": 205.714, + "eval_steps_per_second": 3.3, + "step": 7738 + }, + { + "epoch": 74.0, + "grad_norm": 0.00018741752137430012, + "learning_rate": 1.3000000000000001e-05, + "loss": 0.0001, + "step": 7844 + }, + { + "epoch": 74.0, + "eval_LOCATION_f1": 0.8181818181818181, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7682926829268293, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.751592356687898, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7195121951219512, + "eval_ORGANIZATION_recall": 0.7866666666666666, + "eval_PERSON_f1": 0.9047619047619047, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8807947019867549, + "eval_PERSON_recall": 0.9300699300699301, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3637796938419342, + "eval_overall_accuracy": 0.9632224168126094, + "eval_overall_f1": 0.8356940509915013, + "eval_overall_precision": 0.8038147138964578, + "eval_overall_recall": 0.8702064896755162, + "eval_runtime": 0.9145, + "eval_samples_per_second": 204.477, + "eval_steps_per_second": 3.28, + "step": 7844 + }, + { + "epoch": 75.0, + "grad_norm": 0.0007877243915572762, + "learning_rate": 1.25e-05, + "loss": 0.0001, + "step": 7950 + }, + { + "epoch": 75.0, + "eval_LOCATION_f1": 0.8289473684210527, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7875, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.7919463087248321, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7972972972972973, + "eval_ORGANIZATION_recall": 0.7866666666666666, + "eval_PERSON_f1": 0.9084745762711864, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.881578947368421, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3778810501098633, + "eval_overall_accuracy": 0.9649737302977233, + "eval_overall_f1": 0.8493543758967002, + "eval_overall_precision": 0.8268156424581006, + "eval_overall_recall": 0.8731563421828908, + "eval_runtime": 0.9077, + "eval_samples_per_second": 206.004, + "eval_steps_per_second": 3.305, + "step": 7950 + }, + { + "epoch": 76.0, + "grad_norm": 0.005742947105318308, + "learning_rate": 1.2e-05, + "loss": 0.0001, + "step": 8056 + }, + { + "epoch": 76.0, + "eval_LOCATION_f1": 0.8289473684210527, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7875, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.7894736842105264, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7792207792207793, + "eval_ORGANIZATION_recall": 0.8, + "eval_PERSON_f1": 0.9054054054054055, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8758169934640523, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7346938775510203, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6923076923076923, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.3797122836112976, + "eval_overall_accuracy": 0.9644733550162622, + "eval_overall_f1": 0.8461538461538463, + "eval_overall_precision": 0.8181818181818182, + "eval_overall_recall": 0.8761061946902655, + "eval_runtime": 0.9011, + "eval_samples_per_second": 207.522, + "eval_steps_per_second": 3.329, + "step": 8056 + }, + { + "epoch": 77.0, + "grad_norm": 0.00030839102691970766, + "learning_rate": 1.1500000000000002e-05, + "loss": 0.0004, + "step": 8162 + }, + { + "epoch": 77.0, + "eval_LOCATION_f1": 0.8344370860927153, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7974683544303798, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.8024691358024691, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7471264367816092, + "eval_ORGANIZATION_recall": 0.8666666666666667, + "eval_PERSON_f1": 0.8963210702341137, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8589743589743589, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.76, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.7037037037037037, + "eval_QUANTITY_recall": 0.8260869565217391, + "eval_TIME_f1": 0.830188679245283, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8148148148148148, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.40759775042533875, + "eval_overall_accuracy": 0.9614711033274956, + "eval_overall_f1": 0.8475524475524475, + "eval_overall_precision": 0.8058510638297872, + "eval_overall_recall": 0.8938053097345132, + "eval_runtime": 0.9103, + "eval_samples_per_second": 205.428, + "eval_steps_per_second": 3.296, + "step": 8162 + }, + { + "epoch": 78.0, + "grad_norm": 0.00025188998552039266, + "learning_rate": 1.1000000000000001e-05, + "loss": 0.0005, + "step": 8268 + }, + { + "epoch": 78.0, + "eval_LOCATION_f1": 0.8400000000000001, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8076923076923077, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.7950310559006211, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7441860465116279, + "eval_ORGANIZATION_recall": 0.8533333333333334, + "eval_PERSON_f1": 0.8993288590604027, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.864516129032258, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7346938775510203, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6923076923076923, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8679245283018868, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8518518518518519, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.39274299144744873, + "eval_overall_accuracy": 0.9624718538904178, + "eval_overall_f1": 0.849507735583685, + "eval_overall_precision": 0.8118279569892473, + "eval_overall_recall": 0.8908554572271387, + "eval_runtime": 0.9103, + "eval_samples_per_second": 205.436, + "eval_steps_per_second": 3.296, + "step": 8268 + }, + { + "epoch": 79.0, + "grad_norm": 0.00023670213704463094, + "learning_rate": 1.05e-05, + "loss": 0.0003, + "step": 8374 + }, + { + "epoch": 79.0, + "eval_LOCATION_f1": 0.823529411764706, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7777777777777778, + "eval_LOCATION_recall": 0.875, + "eval_ORGANIZATION_f1": 0.7468354430379747, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7108433734939759, + "eval_ORGANIZATION_recall": 0.7866666666666666, + "eval_PERSON_f1": 0.9023569023569024, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8701298701298701, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7450980392156864, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6785714285714286, + "eval_QUANTITY_recall": 0.8260869565217391, + "eval_TIME_f1": 0.8148148148148148, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.7857142857142857, + "eval_TIME_recall": 0.8461538461538461, + "eval_loss": 0.4000164866447449, + "eval_overall_accuracy": 0.960720540405304, + "eval_overall_f1": 0.8330995792426367, + "eval_overall_precision": 0.7941176470588235, + "eval_overall_recall": 0.8761061946902655, + "eval_runtime": 0.9149, + "eval_samples_per_second": 204.395, + "eval_steps_per_second": 3.279, + "step": 8374 + }, + { + "epoch": 80.0, + "grad_norm": 0.000326380948536098, + "learning_rate": 1e-05, + "loss": 0.0001, + "step": 8480 + }, + { + "epoch": 80.0, + "eval_LOCATION_f1": 0.8266666666666667, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7948717948717948, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.7483870967741936, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.725, + "eval_ORGANIZATION_recall": 0.7733333333333333, + "eval_PERSON_f1": 0.9084745762711864, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.881578947368421, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8679245283018868, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8518518518518519, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3888261020183563, + "eval_overall_accuracy": 0.9629722291718789, + "eval_overall_f1": 0.8416547788873039, + "eval_overall_precision": 0.8149171270718232, + "eval_overall_recall": 0.8702064896755162, + "eval_runtime": 0.9033, + "eval_samples_per_second": 207.02, + "eval_steps_per_second": 3.321, + "step": 8480 + }, + { + "epoch": 81.0, + "grad_norm": 0.0005148330819793046, + "learning_rate": 9.5e-06, + "loss": 0.0001, + "step": 8586 + }, + { + "epoch": 81.0, + "eval_LOCATION_f1": 0.8211920529801324, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7848101265822784, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.7643312101910827, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7317073170731707, + "eval_ORGANIZATION_recall": 0.8, + "eval_PERSON_f1": 0.8993288590604027, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.864516129032258, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.72, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6666666666666666, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3981935977935791, + "eval_overall_accuracy": 0.9614711033274956, + "eval_overall_f1": 0.836619718309859, + "eval_overall_precision": 0.8005390835579514, + "eval_overall_recall": 0.8761061946902655, + "eval_runtime": 0.9078, + "eval_samples_per_second": 205.981, + "eval_steps_per_second": 3.305, + "step": 8586 + }, + { + "epoch": 82.0, + "grad_norm": 0.0001784728665370494, + "learning_rate": 9e-06, + "loss": 0.0003, + "step": 8692 + }, + { + "epoch": 82.0, + "eval_LOCATION_f1": 0.8378378378378377, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8157894736842105, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.7870967741935484, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7625, + "eval_ORGANIZATION_recall": 0.8133333333333334, + "eval_PERSON_f1": 0.91156462585034, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8874172185430463, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8679245283018868, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8518518518518519, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3737158179283142, + "eval_overall_accuracy": 0.9647235426569928, + "eval_overall_f1": 0.8538681948424068, + "eval_overall_precision": 0.83008356545961, + "eval_overall_recall": 0.8790560471976401, + "eval_runtime": 0.9108, + "eval_samples_per_second": 205.324, + "eval_steps_per_second": 3.294, + "step": 8692 + }, + { + "epoch": 83.0, + "grad_norm": 0.00012157092714915052, + "learning_rate": 8.500000000000002e-06, + "loss": 0.0002, + "step": 8798 + }, + { + "epoch": 83.0, + "eval_LOCATION_f1": 0.8322147651006712, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8051948051948052, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.7975460122699386, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7386363636363636, + "eval_ORGANIZATION_recall": 0.8666666666666667, + "eval_PERSON_f1": 0.9047619047619047, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8807947019867549, + "eval_PERSON_recall": 0.9300699300699301, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3761243224143982, + "eval_overall_accuracy": 0.9632224168126094, + "eval_overall_f1": 0.8502824858757062, + "eval_overall_precision": 0.8157181571815718, + "eval_overall_recall": 0.887905604719764, + "eval_runtime": 0.9121, + "eval_samples_per_second": 205.019, + "eval_steps_per_second": 3.289, + "step": 8798 + }, + { + "epoch": 84.0, + "grad_norm": 0.01326628215610981, + "learning_rate": 8.000000000000001e-06, + "loss": 0.0001, + "step": 8904 + }, + { + "epoch": 84.0, + "eval_LOCATION_f1": 0.8322147651006712, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8051948051948052, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.8025477707006369, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7682926829268293, + "eval_ORGANIZATION_recall": 0.84, + "eval_PERSON_f1": 0.9047619047619047, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8807947019867549, + "eval_PERSON_recall": 0.9300699300699301, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8679245283018868, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8518518518518519, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.37578248977661133, + "eval_overall_accuracy": 0.9639729797348011, + "eval_overall_f1": 0.8530670470756063, + "eval_overall_precision": 0.8259668508287292, + "eval_overall_recall": 0.8820058997050148, + "eval_runtime": 0.9306, + "eval_samples_per_second": 200.941, + "eval_steps_per_second": 3.224, + "step": 8904 + }, + { + "epoch": 85.0, + "grad_norm": 0.006039230152964592, + "learning_rate": 7.5e-06, + "loss": 0.0004, + "step": 9010 + }, + { + "epoch": 85.0, + "eval_LOCATION_f1": 0.8322147651006712, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8051948051948052, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.7975460122699386, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7386363636363636, + "eval_ORGANIZATION_recall": 0.8666666666666667, + "eval_PERSON_f1": 0.9016949152542374, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.875, + "eval_PERSON_recall": 0.9300699300699301, + "eval_QUANTITY_f1": 0.7346938775510203, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6923076923076923, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3836413621902466, + "eval_overall_accuracy": 0.9629722291718789, + "eval_overall_f1": 0.8478873239436621, + "eval_overall_precision": 0.8113207547169812, + "eval_overall_recall": 0.887905604719764, + "eval_runtime": 0.9049, + "eval_samples_per_second": 206.647, + "eval_steps_per_second": 3.315, + "step": 9010 + }, + { + "epoch": 86.0, + "grad_norm": 0.00042766937986016273, + "learning_rate": 7.000000000000001e-06, + "loss": 0.0005, + "step": 9116 + }, + { + "epoch": 86.0, + "eval_LOCATION_f1": 0.8322147651006712, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8051948051948052, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.8076923076923077, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7777777777777778, + "eval_ORGANIZATION_recall": 0.84, + "eval_PERSON_f1": 0.9016949152542374, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.875, + "eval_PERSON_recall": 0.9300699300699301, + "eval_QUANTITY_f1": 0.7346938775510203, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6923076923076923, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3791405260562897, + "eval_overall_accuracy": 0.9642231673755316, + "eval_overall_f1": 0.8506401137980086, + "eval_overall_precision": 0.8214285714285714, + "eval_overall_recall": 0.8820058997050148, + "eval_runtime": 0.904, + "eval_samples_per_second": 206.855, + "eval_steps_per_second": 3.319, + "step": 9116 + }, + { + "epoch": 87.0, + "grad_norm": 0.0006120882462710142, + "learning_rate": 6.5000000000000004e-06, + "loss": 0.0004, + "step": 9222 + }, + { + "epoch": 87.0, + "eval_LOCATION_f1": 0.8266666666666667, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7948717948717948, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.8025477707006369, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7682926829268293, + "eval_ORGANIZATION_recall": 0.84, + "eval_PERSON_f1": 0.9023569023569024, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8701298701298701, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7346938775510203, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6923076923076923, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.888888888888889, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8571428571428571, + "eval_TIME_recall": 0.9230769230769231, + "eval_loss": 0.38632336258888245, + "eval_overall_accuracy": 0.9639729797348011, + "eval_overall_f1": 0.8514851485148515, + "eval_overall_precision": 0.8179347826086957, + "eval_overall_recall": 0.887905604719764, + "eval_runtime": 0.9113, + "eval_samples_per_second": 205.193, + "eval_steps_per_second": 3.292, + "step": 9222 + }, + { + "epoch": 88.0, + "grad_norm": 0.0006923701730556786, + "learning_rate": 6e-06, + "loss": 0.0004, + "step": 9328 + }, + { + "epoch": 88.0, + "eval_LOCATION_f1": 0.8211920529801324, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7848101265822784, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.7875000000000001, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7411764705882353, + "eval_ORGANIZATION_recall": 0.84, + "eval_PERSON_f1": 0.907849829351536, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8866666666666667, + "eval_PERSON_recall": 0.9300699300699301, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.9056603773584906, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8888888888888888, + "eval_TIME_recall": 0.9230769230769231, + "eval_loss": 0.3742952346801758, + "eval_overall_accuracy": 0.9647235426569928, + "eval_overall_f1": 0.851063829787234, + "eval_overall_precision": 0.819672131147541, + "eval_overall_recall": 0.8849557522123894, + "eval_runtime": 0.9099, + "eval_samples_per_second": 205.512, + "eval_steps_per_second": 3.297, + "step": 9328 + }, + { + "epoch": 89.0, + "grad_norm": 0.0163017176091671, + "learning_rate": 5.500000000000001e-06, + "loss": 0.0006, + "step": 9434 + }, + { + "epoch": 89.0, + "eval_LOCATION_f1": 0.816326530612245, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.8, + "eval_LOCATION_recall": 0.8333333333333334, + "eval_ORGANIZATION_f1": 0.7894736842105264, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7792207792207793, + "eval_ORGANIZATION_recall": 0.8, + "eval_PERSON_f1": 0.907849829351536, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8866666666666667, + "eval_PERSON_recall": 0.9300699300699301, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.9056603773584906, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8888888888888888, + "eval_TIME_recall": 0.9230769230769231, + "eval_loss": 0.3696248233318329, + "eval_overall_accuracy": 0.966224668501376, + "eval_overall_f1": 0.8513708513708513, + "eval_overall_precision": 0.8333333333333334, + "eval_overall_recall": 0.8702064896755162, + "eval_runtime": 0.9099, + "eval_samples_per_second": 205.507, + "eval_steps_per_second": 3.297, + "step": 9434 + }, + { + "epoch": 90.0, + "grad_norm": 15.17189884185791, + "learning_rate": 5e-06, + "loss": 0.0002, + "step": 9540 + }, + { + "epoch": 90.0, + "eval_LOCATION_f1": 0.8, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7692307692307693, + "eval_LOCATION_recall": 0.8333333333333334, + "eval_ORGANIZATION_f1": 0.7894736842105264, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7792207792207793, + "eval_ORGANIZATION_recall": 0.8, + "eval_PERSON_f1": 0.907849829351536, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8866666666666667, + "eval_PERSON_recall": 0.9300699300699301, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.9056603773584906, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8888888888888888, + "eval_TIME_recall": 0.9230769230769231, + "eval_loss": 0.3719424605369568, + "eval_overall_accuracy": 0.966224668501376, + "eval_overall_f1": 0.8477011494252874, + "eval_overall_precision": 0.8263305322128851, + "eval_overall_recall": 0.8702064896755162, + "eval_runtime": 0.9059, + "eval_samples_per_second": 206.432, + "eval_steps_per_second": 3.312, + "step": 9540 + }, + { + "epoch": 91.0, + "grad_norm": 0.00020513041818048805, + "learning_rate": 4.5e-06, + "loss": 0.0002, + "step": 9646 + }, + { + "epoch": 91.0, + "eval_LOCATION_f1": 0.8187919463087249, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7922077922077922, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.8205128205128205, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7901234567901234, + "eval_ORGANIZATION_recall": 0.8533333333333334, + "eval_PERSON_f1": 0.9084745762711864, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.881578947368421, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.9056603773584906, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8888888888888888, + "eval_TIME_recall": 0.9230769230769231, + "eval_loss": 0.3863327205181122, + "eval_overall_accuracy": 0.9642231673755316, + "eval_overall_f1": 0.8587731811697574, + "eval_overall_precision": 0.8314917127071824, + "eval_overall_recall": 0.887905604719764, + "eval_runtime": 0.9044, + "eval_samples_per_second": 206.761, + "eval_steps_per_second": 3.317, + "step": 9646 + }, + { + "epoch": 92.0, + "grad_norm": 0.0004068514099344611, + "learning_rate": 4.000000000000001e-06, + "loss": 0.0004, + "step": 9752 + }, + { + "epoch": 92.0, + "eval_LOCATION_f1": 0.8187919463087249, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7922077922077922, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.8129032258064516, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7875, + "eval_ORGANIZATION_recall": 0.84, + "eval_PERSON_f1": 0.91156462585034, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.8874172185430463, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.9056603773584906, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8888888888888888, + "eval_TIME_recall": 0.9230769230769231, + "eval_loss": 0.38287997245788574, + "eval_overall_accuracy": 0.9644733550162622, + "eval_overall_f1": 0.8583690987124464, + "eval_overall_precision": 0.8333333333333334, + "eval_overall_recall": 0.8849557522123894, + "eval_runtime": 0.9043, + "eval_samples_per_second": 206.779, + "eval_steps_per_second": 3.317, + "step": 9752 + }, + { + "epoch": 93.0, + "grad_norm": 0.00010082097287522629, + "learning_rate": 3.5000000000000004e-06, + "loss": 0.0002, + "step": 9858 + }, + { + "epoch": 93.0, + "eval_LOCATION_f1": 0.8187919463087249, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7922077922077922, + "eval_LOCATION_recall": 0.8472222222222222, + "eval_ORGANIZATION_f1": 0.8104575163398693, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7948717948717948, + "eval_ORGANIZATION_recall": 0.8266666666666667, + "eval_PERSON_f1": 0.9084745762711864, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.881578947368421, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.9056603773584906, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8888888888888888, + "eval_TIME_recall": 0.9230769230769231, + "eval_loss": 0.37826383113861084, + "eval_overall_accuracy": 0.9652239179384539, + "eval_overall_f1": 0.8567335243553009, + "eval_overall_precision": 0.8328690807799443, + "eval_overall_recall": 0.8820058997050148, + "eval_runtime": 0.918, + "eval_samples_per_second": 203.7, + "eval_steps_per_second": 3.268, + "step": 9858 + }, + { + "epoch": 94.0, + "grad_norm": 0.000542107445653528, + "learning_rate": 3e-06, + "loss": 0.0001, + "step": 9964 + }, + { + "epoch": 94.0, + "eval_LOCATION_f1": 0.8266666666666667, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7948717948717948, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.8076923076923077, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7777777777777778, + "eval_ORGANIZATION_recall": 0.84, + "eval_PERSON_f1": 0.9084745762711864, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.881578947368421, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.9056603773584906, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8888888888888888, + "eval_TIME_recall": 0.9230769230769231, + "eval_loss": 0.38576415181159973, + "eval_overall_accuracy": 0.9642231673755316, + "eval_overall_f1": 0.8575498575498576, + "eval_overall_precision": 0.8292011019283747, + "eval_overall_recall": 0.887905604719764, + "eval_runtime": 0.9111, + "eval_samples_per_second": 205.24, + "eval_steps_per_second": 3.293, + "step": 9964 + }, + { + "epoch": 95.0, + "grad_norm": 0.044874146580696106, + "learning_rate": 2.5e-06, + "loss": 0.0001, + "step": 10070 + }, + { + "epoch": 95.0, + "eval_LOCATION_f1": 0.8266666666666667, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7948717948717948, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.8076923076923077, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7777777777777778, + "eval_ORGANIZATION_recall": 0.84, + "eval_PERSON_f1": 0.9084745762711864, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.881578947368421, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.7499999999999999, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.72, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.888888888888889, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8571428571428571, + "eval_TIME_recall": 0.9230769230769231, + "eval_loss": 0.38630810379981995, + "eval_overall_accuracy": 0.9639729797348011, + "eval_overall_f1": 0.856330014224751, + "eval_overall_precision": 0.8269230769230769, + "eval_overall_recall": 0.887905604719764, + "eval_runtime": 0.8986, + "eval_samples_per_second": 208.113, + "eval_steps_per_second": 3.339, + "step": 10070 + }, + { + "epoch": 96.0, + "grad_norm": 0.0001308424398303032, + "learning_rate": 2.0000000000000003e-06, + "loss": 0.0001, + "step": 10176 + }, + { + "epoch": 96.0, + "eval_LOCATION_f1": 0.8266666666666667, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7948717948717948, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.8076923076923077, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7777777777777778, + "eval_ORGANIZATION_recall": 0.84, + "eval_PERSON_f1": 0.9084745762711864, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.881578947368421, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.76, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.7037037037037037, + "eval_QUANTITY_recall": 0.8260869565217391, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3916187286376953, + "eval_overall_accuracy": 0.9637227920940705, + "eval_overall_f1": 0.8539007092198581, + "eval_overall_precision": 0.8224043715846995, + "eval_overall_recall": 0.887905604719764, + "eval_runtime": 0.9154, + "eval_samples_per_second": 204.278, + "eval_steps_per_second": 3.277, + "step": 10176 + }, + { + "epoch": 97.0, + "grad_norm": 0.00018677054322324693, + "learning_rate": 1.5e-06, + "loss": 0.0001, + "step": 10282 + }, + { + "epoch": 97.0, + "eval_LOCATION_f1": 0.8266666666666667, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7948717948717948, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.8101265822784811, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7710843373493976, + "eval_ORGANIZATION_recall": 0.8533333333333334, + "eval_PERSON_f1": 0.9084745762711864, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.881578947368421, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.76, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.7037037037037037, + "eval_QUANTITY_recall": 0.8260869565217391, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3897801339626312, + "eval_overall_accuracy": 0.9642231673755316, + "eval_overall_f1": 0.8543140028288544, + "eval_overall_precision": 0.8206521739130435, + "eval_overall_recall": 0.8908554572271387, + "eval_runtime": 0.9174, + "eval_samples_per_second": 203.839, + "eval_steps_per_second": 3.27, + "step": 10282 + }, + { + "epoch": 98.0, + "grad_norm": 0.004196417052298784, + "learning_rate": 1.0000000000000002e-06, + "loss": 0.0001, + "step": 10388 + }, + { + "epoch": 98.0, + "eval_LOCATION_f1": 0.8266666666666667, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7948717948717948, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.8101265822784811, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7710843373493976, + "eval_ORGANIZATION_recall": 0.8533333333333334, + "eval_PERSON_f1": 0.9084745762711864, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.881578947368421, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.76, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.7037037037037037, + "eval_QUANTITY_recall": 0.8260869565217391, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.38807475566864014, + "eval_overall_accuracy": 0.9644733550162622, + "eval_overall_f1": 0.8543140028288544, + "eval_overall_precision": 0.8206521739130435, + "eval_overall_recall": 0.8908554572271387, + "eval_runtime": 0.9056, + "eval_samples_per_second": 206.492, + "eval_steps_per_second": 3.313, + "step": 10388 + }, + { + "epoch": 99.0, + "grad_norm": 0.0001258315023733303, + "learning_rate": 5.000000000000001e-07, + "loss": 0.0001, + "step": 10494 + }, + { + "epoch": 99.0, + "eval_LOCATION_f1": 0.8266666666666667, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7948717948717948, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.8101265822784811, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7710843373493976, + "eval_ORGANIZATION_recall": 0.8533333333333334, + "eval_PERSON_f1": 0.9084745762711864, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.881578947368421, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.72, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6666666666666666, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3856855630874634, + "eval_overall_accuracy": 0.9642231673755316, + "eval_overall_f1": 0.8514851485148515, + "eval_overall_precision": 0.8179347826086957, + "eval_overall_recall": 0.887905604719764, + "eval_runtime": 0.9072, + "eval_samples_per_second": 206.127, + "eval_steps_per_second": 3.307, + "step": 10494 + }, + { + "epoch": 100.0, + "grad_norm": 0.00010668273171177134, + "learning_rate": 0.0, + "loss": 0.0001, + "step": 10600 + }, + { + "epoch": 100.0, + "eval_LOCATION_f1": 0.8266666666666667, + "eval_LOCATION_number": 72, + "eval_LOCATION_precision": 0.7948717948717948, + "eval_LOCATION_recall": 0.8611111111111112, + "eval_ORGANIZATION_f1": 0.8101265822784811, + "eval_ORGANIZATION_number": 75, + "eval_ORGANIZATION_precision": 0.7710843373493976, + "eval_ORGANIZATION_recall": 0.8533333333333334, + "eval_PERSON_f1": 0.9084745762711864, + "eval_PERSON_number": 143, + "eval_PERSON_precision": 0.881578947368421, + "eval_PERSON_recall": 0.9370629370629371, + "eval_QUANTITY_f1": 0.72, + "eval_QUANTITY_number": 23, + "eval_QUANTITY_precision": 0.6666666666666666, + "eval_QUANTITY_recall": 0.782608695652174, + "eval_TIME_f1": 0.8518518518518519, + "eval_TIME_number": 26, + "eval_TIME_precision": 0.8214285714285714, + "eval_TIME_recall": 0.8846153846153846, + "eval_loss": 0.3857269287109375, + "eval_overall_accuracy": 0.9642231673755316, + "eval_overall_f1": 0.8514851485148515, + "eval_overall_precision": 0.8179347826086957, + "eval_overall_recall": 0.887905604719764, + "eval_runtime": 0.9906, + "eval_samples_per_second": 188.783, + "eval_steps_per_second": 3.029, + "step": 10600 + }, + { + "epoch": 100.0, + "step": 10600, + "total_flos": 4502314993613766.0, + "train_loss": 0.008494841067761815, + "train_runtime": 2623.6324, + "train_samples_per_second": 64.3, + "train_steps_per_second": 4.04 } ], "logging_steps": 500, - "max_steps": 2120, + "max_steps": 10600, "num_input_tokens_seen": 0, - "num_train_epochs": 20, + "num_train_epochs": 100, "save_steps": 500, - "total_flos": 898035701398080.0, + "total_flos": 4502314993613766.0, "train_batch_size": 16, "trial_name": null, "trial_params": null