twitter-roberta-base-CoNLL / trainer_state.json
emilys's picture
End of training
a673706
raw
history blame
33.4 kB
{
"best_metric": 0.9571847507331379,
"best_model_checkpoint": "twitter-roberta-base-CoNLL/checkpoint-2000",
"epoch": 10.0,
"global_step": 2200,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.11,
"eval_accuracy": 0.9385927339278065,
"eval_f1": 0.6587314799400699,
"eval_loss": 0.2062799483537674,
"eval_precision": 0.6516798418972332,
"eval_recall": 0.6659373948165601,
"eval_runtime": 5.976,
"eval_samples_per_second": 544.011,
"eval_steps_per_second": 0.669,
"step": 25
},
{
"epoch": 0.23,
"eval_accuracy": 0.9771231649857871,
"eval_f1": 0.8565321055660609,
"eval_loss": 0.08096875995397568,
"eval_precision": 0.8373251888763864,
"eval_recall": 0.8766408616627398,
"eval_runtime": 6.2407,
"eval_samples_per_second": 520.938,
"eval_steps_per_second": 0.641,
"step": 50
},
{
"epoch": 0.34,
"eval_accuracy": 0.9826914839764807,
"eval_f1": 0.8996990972918756,
"eval_loss": 0.06511491537094116,
"eval_precision": 0.8937230156094321,
"eval_recall": 0.9057556378323797,
"eval_runtime": 6.0069,
"eval_samples_per_second": 541.208,
"eval_steps_per_second": 0.666,
"step": 75
},
{
"epoch": 0.45,
"eval_accuracy": 0.9849110237140298,
"eval_f1": 0.907388833166165,
"eval_loss": 0.05366199463605881,
"eval_precision": 0.9013616738625041,
"eval_recall": 0.9134971390104342,
"eval_runtime": 6.3828,
"eval_samples_per_second": 509.335,
"eval_steps_per_second": 0.627,
"step": 100
},
{
"epoch": 0.57,
"eval_accuracy": 0.986682761574705,
"eval_f1": 0.9170283806343906,
"eval_loss": 0.04637985676527023,
"eval_precision": 0.9097383239483272,
"eval_recall": 0.924436216762033,
"eval_runtime": 6.0475,
"eval_samples_per_second": 537.576,
"eval_steps_per_second": 0.661,
"step": 125
},
{
"epoch": 0.68,
"eval_accuracy": 0.9884544994353802,
"eval_f1": 0.9296410942859533,
"eval_loss": 0.042301442474126816,
"eval_precision": 0.9243054400266179,
"eval_recall": 0.9350387075058902,
"eval_runtime": 6.0733,
"eval_samples_per_second": 535.298,
"eval_steps_per_second": 0.659,
"step": 150
},
{
"epoch": 0.8,
"eval_accuracy": 0.9899731318873876,
"eval_f1": 0.934277384423157,
"eval_loss": 0.038059305399656296,
"eval_precision": 0.9249546429160481,
"eval_recall": 0.9437899697071693,
"eval_runtime": 6.3028,
"eval_samples_per_second": 515.805,
"eval_steps_per_second": 0.635,
"step": 175
},
{
"epoch": 0.91,
"eval_accuracy": 0.9895642693041549,
"eval_f1": 0.9354220481626531,
"eval_loss": 0.038840554654598236,
"eval_precision": 0.9263904934807724,
"eval_recall": 0.9446314372265231,
"eval_runtime": 6.0497,
"eval_samples_per_second": 537.384,
"eval_steps_per_second": 0.661,
"step": 200
},
{
"epoch": 1.02,
"eval_accuracy": 0.9898368443596434,
"eval_f1": 0.9384409501505521,
"eval_loss": 0.03943933546543121,
"eval_precision": 0.9328234120385767,
"eval_recall": 0.9441265567149109,
"eval_runtime": 6.4439,
"eval_samples_per_second": 504.505,
"eval_steps_per_second": 0.621,
"step": 225
},
{
"epoch": 1.14,
"eval_accuracy": 0.9895837389509754,
"eval_f1": 0.9402710389827672,
"eval_loss": 0.042259786278009415,
"eval_precision": 0.9347970725216235,
"eval_recall": 0.9458094917536183,
"eval_runtime": 6.16,
"eval_samples_per_second": 527.761,
"eval_steps_per_second": 0.649,
"step": 250
},
{
"epoch": 1.25,
"eval_accuracy": 0.9892138156613839,
"eval_f1": 0.9354757720311323,
"eval_loss": 0.04323225095868111,
"eval_precision": 0.9304145163975363,
"eval_recall": 0.9405923931336251,
"eval_runtime": 6.3592,
"eval_samples_per_second": 511.225,
"eval_steps_per_second": 0.629,
"step": 275
},
{
"epoch": 1.36,
"eval_accuracy": 0.9900899497683112,
"eval_f1": 0.9432760787599497,
"eval_loss": 0.03824295476078987,
"eval_precision": 0.9392624728850325,
"eval_recall": 0.9473241332884551,
"eval_runtime": 6.1034,
"eval_samples_per_second": 532.654,
"eval_steps_per_second": 0.655,
"step": 300
},
{
"epoch": 1.48,
"eval_accuracy": 0.99005101047467,
"eval_f1": 0.9414020171709594,
"eval_loss": 0.0380987711250782,
"eval_precision": 0.932617671345995,
"eval_recall": 0.9503534163581285,
"eval_runtime": 6.1204,
"eval_samples_per_second": 531.176,
"eval_steps_per_second": 0.654,
"step": 325
},
{
"epoch": 1.59,
"eval_accuracy": 0.9902262372960554,
"eval_f1": 0.9429309339331834,
"eval_loss": 0.03868376836180687,
"eval_precision": 0.933674311169774,
"eval_recall": 0.9523729384045776,
"eval_runtime": 6.3273,
"eval_samples_per_second": 513.801,
"eval_steps_per_second": 0.632,
"step": 350
},
{
"epoch": 1.7,
"eval_accuracy": 0.990148358708773,
"eval_f1": 0.9439181825802665,
"eval_loss": 0.03645554929971695,
"eval_precision": 0.9403708034073827,
"eval_recall": 0.9474924267923258,
"eval_runtime": 6.2492,
"eval_samples_per_second": 520.224,
"eval_steps_per_second": 0.64,
"step": 375
},
{
"epoch": 1.82,
"eval_accuracy": 0.9905182819983646,
"eval_f1": 0.9473948735131512,
"eval_loss": 0.0382225401699543,
"eval_precision": 0.9431287525016678,
"eval_recall": 0.9516997643890945,
"eval_runtime": 6.4588,
"eval_samples_per_second": 503.348,
"eval_steps_per_second": 0.619,
"step": 400
},
{
"epoch": 1.93,
"eval_accuracy": 0.9903235855301585,
"eval_f1": 0.9460837582546184,
"eval_loss": 0.03733981028199196,
"eval_precision": 0.9398770968277694,
"eval_recall": 0.9523729384045776,
"eval_runtime": 6.1594,
"eval_samples_per_second": 527.813,
"eval_steps_per_second": 0.649,
"step": 425
},
{
"epoch": 2.05,
"eval_accuracy": 0.9910439624625209,
"eval_f1": 0.9497365559923059,
"eval_loss": 0.03666611388325691,
"eval_precision": 0.943973399833749,
"eval_recall": 0.9555705149781218,
"eval_runtime": 6.4014,
"eval_samples_per_second": 507.859,
"eval_steps_per_second": 0.625,
"step": 450
},
{
"epoch": 2.16,
"eval_accuracy": 0.99069350881975,
"eval_f1": 0.9474914433592119,
"eval_loss": 0.03960287570953369,
"eval_precision": 0.9400364419413616,
"eval_recall": 0.9550656344665096,
"eval_runtime": 6.2344,
"eval_samples_per_second": 521.465,
"eval_steps_per_second": 0.642,
"step": 475
},
{
"epoch": 2.27,
"learning_rate": 4.636363636363636e-05,
"loss": 0.0771,
"step": 500
},
{
"epoch": 2.27,
"eval_accuracy": 0.991238658930727,
"eval_f1": 0.9507813152836967,
"eval_loss": 0.035283163189888,
"eval_precision": 0.9442323651452282,
"eval_recall": 0.9574217435207001,
"eval_runtime": 6.1631,
"eval_samples_per_second": 527.493,
"eval_steps_per_second": 0.649,
"step": 500
},
{
"epoch": 2.39,
"eval_accuracy": 0.9905572212920057,
"eval_f1": 0.9453602209020165,
"eval_loss": 0.03937030956149101,
"eval_precision": 0.9400898652021967,
"eval_recall": 0.9506900033658701,
"eval_runtime": 6.243,
"eval_samples_per_second": 520.742,
"eval_steps_per_second": 0.641,
"step": 525
},
{
"epoch": 2.5,
"eval_accuracy": 0.9909660838752385,
"eval_f1": 0.9484536082474228,
"eval_loss": 0.036998968571424484,
"eval_precision": 0.9447320086825848,
"eval_recall": 0.9522046449007069,
"eval_runtime": 6.0773,
"eval_samples_per_second": 534.945,
"eval_steps_per_second": 0.658,
"step": 550
},
{
"epoch": 2.61,
"eval_accuracy": 0.9908492659943149,
"eval_f1": 0.9472013366750209,
"eval_loss": 0.035233963280916214,
"eval_precision": 0.940444591904446,
"eval_recall": 0.9540558734432851,
"eval_runtime": 6.3038,
"eval_samples_per_second": 515.72,
"eval_steps_per_second": 0.635,
"step": 575
},
{
"epoch": 2.73,
"eval_accuracy": 0.9908103267006737,
"eval_f1": 0.9448281601065159,
"eval_loss": 0.0385683998465538,
"eval_precision": 0.9344855967078189,
"eval_recall": 0.9554022214742511,
"eval_runtime": 6.1499,
"eval_samples_per_second": 528.629,
"eval_steps_per_second": 0.65,
"step": 600
},
{
"epoch": 2.84,
"eval_accuracy": 0.9916280518671391,
"eval_f1": 0.9501544627202138,
"eval_loss": 0.036591168493032455,
"eval_precision": 0.9428334714167357,
"eval_recall": 0.9575900370245709,
"eval_runtime": 6.1996,
"eval_samples_per_second": 524.389,
"eval_steps_per_second": 0.645,
"step": 625
},
{
"epoch": 2.95,
"eval_accuracy": 0.9913360071648301,
"eval_f1": 0.948574295509658,
"eval_loss": 0.035347189754247665,
"eval_precision": 0.9426624563736081,
"eval_recall": 0.9545607539548974,
"eval_runtime": 6.4287,
"eval_samples_per_second": 505.702,
"eval_steps_per_second": 0.622,
"step": 650
},
{
"epoch": 3.07,
"eval_accuracy": 0.9911023714029827,
"eval_f1": 0.9477730425336343,
"eval_loss": 0.035899706184864044,
"eval_precision": 0.9412448132780084,
"eval_recall": 0.9543924604510265,
"eval_runtime": 6.1591,
"eval_samples_per_second": 527.837,
"eval_steps_per_second": 0.649,
"step": 675
},
{
"epoch": 3.18,
"eval_accuracy": 0.9919979751567306,
"eval_f1": 0.9534164087981936,
"eval_loss": 0.0355631485581398,
"eval_precision": 0.9476309226932669,
"eval_recall": 0.9592729720632783,
"eval_runtime": 6.1923,
"eval_samples_per_second": 525.005,
"eval_steps_per_second": 0.646,
"step": 700
},
{
"epoch": 3.3,
"eval_accuracy": 0.9918422179821658,
"eval_f1": 0.953465015065283,
"eval_loss": 0.03445196524262428,
"eval_precision": 0.9483849483849484,
"eval_recall": 0.9585997980477954,
"eval_runtime": 6.3335,
"eval_samples_per_second": 513.302,
"eval_steps_per_second": 0.632,
"step": 725
},
{
"epoch": 3.41,
"eval_accuracy": 0.9915696429266773,
"eval_f1": 0.9491893698813304,
"eval_loss": 0.03445504605770111,
"eval_precision": 0.9427290836653387,
"eval_recall": 0.9557388084819926,
"eval_runtime": 6.1661,
"eval_samples_per_second": 527.234,
"eval_steps_per_second": 0.649,
"step": 750
},
{
"epoch": 3.52,
"eval_accuracy": 0.9913944161052919,
"eval_f1": 0.9478246374395733,
"eval_loss": 0.03635535016655922,
"eval_precision": 0.9389035667107001,
"eval_recall": 0.9569168630090878,
"eval_runtime": 6.4373,
"eval_samples_per_second": 505.028,
"eval_steps_per_second": 0.621,
"step": 775
},
{
"epoch": 3.64,
"eval_accuracy": 0.9914917643393949,
"eval_f1": 0.95067189717052,
"eval_loss": 0.03599384054541588,
"eval_precision": 0.943036926643484,
"eval_recall": 0.9584315045439246,
"eval_runtime": 6.1546,
"eval_samples_per_second": 528.219,
"eval_steps_per_second": 0.65,
"step": 800
},
{
"epoch": 3.75,
"eval_accuracy": 0.9914528250457537,
"eval_f1": 0.950514945993469,
"eval_loss": 0.03866244852542877,
"eval_precision": 0.9458423596067322,
"eval_recall": 0.9552339279703803,
"eval_runtime": 6.3798,
"eval_samples_per_second": 509.575,
"eval_steps_per_second": 0.627,
"step": 825
},
{
"epoch": 3.86,
"eval_accuracy": 0.9917059304544216,
"eval_f1": 0.9521419009370816,
"eval_loss": 0.034695982933044434,
"eval_precision": 0.9467554076539102,
"eval_recall": 0.9575900370245709,
"eval_runtime": 6.175,
"eval_samples_per_second": 526.482,
"eval_steps_per_second": 0.648,
"step": 850
},
{
"epoch": 3.98,
"eval_accuracy": 0.9915307036330361,
"eval_f1": 0.9509402423735897,
"eval_loss": 0.03567422926425934,
"eval_precision": 0.9445459073551387,
"eval_recall": 0.9574217435207001,
"eval_runtime": 6.2028,
"eval_samples_per_second": 524.119,
"eval_steps_per_second": 0.645,
"step": 875
},
{
"epoch": 4.09,
"eval_accuracy": 0.9918032786885246,
"eval_f1": 0.9520702634880803,
"eval_loss": 0.03815401718020439,
"eval_precision": 0.9464493597206054,
"eval_recall": 0.9577583305284416,
"eval_runtime": 6.4111,
"eval_samples_per_second": 507.091,
"eval_steps_per_second": 0.624,
"step": 900
},
{
"epoch": 4.2,
"eval_accuracy": 0.9917643393948834,
"eval_f1": 0.9518385124382277,
"eval_loss": 0.03912338241934776,
"eval_precision": 0.9474737368684342,
"eval_recall": 0.9562436889936049,
"eval_runtime": 6.1023,
"eval_samples_per_second": 532.748,
"eval_steps_per_second": 0.655,
"step": 925
},
{
"epoch": 4.32,
"eval_accuracy": 0.9911802499902652,
"eval_f1": 0.9506493506493505,
"eval_loss": 0.0428401380777359,
"eval_precision": 0.9466043717670616,
"eval_recall": 0.9547290474587681,
"eval_runtime": 6.3492,
"eval_samples_per_second": 512.03,
"eval_steps_per_second": 0.63,
"step": 950
},
{
"epoch": 4.43,
"eval_accuracy": 0.9913360071648301,
"eval_f1": 0.9506028131279304,
"eval_loss": 0.04035865515470505,
"eval_precision": 0.9458513828723759,
"eval_recall": 0.9554022214742511,
"eval_runtime": 6.1625,
"eval_samples_per_second": 527.542,
"eval_steps_per_second": 0.649,
"step": 975
},
{
"epoch": 4.55,
"learning_rate": 3.2727272727272725e-05,
"loss": 0.0118,
"step": 1000
},
{
"epoch": 4.55,
"eval_accuracy": 0.9908687356411354,
"eval_f1": 0.9461397365349341,
"eval_loss": 0.04028761386871338,
"eval_precision": 0.9375413086582948,
"eval_recall": 0.9548973409626389,
"eval_runtime": 6.261,
"eval_samples_per_second": 519.243,
"eval_steps_per_second": 0.639,
"step": 1000
},
{
"epoch": 4.66,
"eval_accuracy": 0.9919200965694482,
"eval_f1": 0.9533852205205458,
"eval_loss": 0.036938250064849854,
"eval_precision": 0.9482270684201765,
"eval_recall": 0.9585997980477954,
"eval_runtime": 6.1962,
"eval_samples_per_second": 524.674,
"eval_steps_per_second": 0.646,
"step": 1025
},
{
"epoch": 4.77,
"eval_accuracy": 0.9918032786885246,
"eval_f1": 0.9520227348712804,
"eval_loss": 0.037420712411403656,
"eval_precision": 0.9456991032879442,
"eval_recall": 0.9584315045439246,
"eval_runtime": 5.9766,
"eval_samples_per_second": 543.958,
"eval_steps_per_second": 0.669,
"step": 1050
},
{
"epoch": 4.89,
"eval_accuracy": 0.9922900198590398,
"eval_f1": 0.9538745387453874,
"eval_loss": 0.035940222442150116,
"eval_precision": 0.9506853895018389,
"eval_recall": 0.9570851565129586,
"eval_runtime": 6.2768,
"eval_samples_per_second": 517.943,
"eval_steps_per_second": 0.637,
"step": 1075
},
{
"epoch": 5.0,
"eval_accuracy": 0.9919006269226276,
"eval_f1": 0.9523093627328155,
"eval_loss": 0.03730743005871773,
"eval_precision": 0.9452827060189023,
"eval_recall": 0.9594412655671491,
"eval_runtime": 6.0853,
"eval_samples_per_second": 534.236,
"eval_steps_per_second": 0.657,
"step": 1100
},
{
"epoch": 5.11,
"eval_accuracy": 0.9923873680931428,
"eval_f1": 0.9546215673141327,
"eval_loss": 0.037039875984191895,
"eval_precision": 0.9498500499833389,
"eval_recall": 0.9594412655671491,
"eval_runtime": 6.3128,
"eval_samples_per_second": 514.986,
"eval_steps_per_second": 0.634,
"step": 1125
},
{
"epoch": 5.23,
"eval_accuracy": 0.9922316109185779,
"eval_f1": 0.9555313625324512,
"eval_loss": 0.038839343935251236,
"eval_precision": 0.9509918319719953,
"eval_recall": 0.9601144395826321,
"eval_runtime": 6.1584,
"eval_samples_per_second": 527.897,
"eval_steps_per_second": 0.65,
"step": 1150
},
{
"epoch": 5.34,
"eval_accuracy": 0.9919785055099101,
"eval_f1": 0.9522212908633696,
"eval_loss": 0.03950090706348419,
"eval_precision": 0.948563794255177,
"eval_recall": 0.9559071019858634,
"eval_runtime": 6.084,
"eval_samples_per_second": 534.349,
"eval_steps_per_second": 0.657,
"step": 1175
},
{
"epoch": 5.45,
"eval_accuracy": 0.9923678984463222,
"eval_f1": 0.9542866711319491,
"eval_loss": 0.03910110890865326,
"eval_precision": 0.949516827724092,
"eval_recall": 0.9591046785594076,
"eval_runtime": 6.3281,
"eval_samples_per_second": 513.744,
"eval_steps_per_second": 0.632,
"step": 1200
},
{
"epoch": 5.57,
"eval_accuracy": 0.9923289591526809,
"eval_f1": 0.9552313883299799,
"eval_loss": 0.037824589759111404,
"eval_precision": 0.9517206815903776,
"eval_recall": 0.9587680915516661,
"eval_runtime": 6.1901,
"eval_samples_per_second": 525.192,
"eval_steps_per_second": 0.646,
"step": 1225
},
{
"epoch": 5.68,
"eval_accuracy": 0.9923678984463222,
"eval_f1": 0.956470785200067,
"eval_loss": 0.038752481341362,
"eval_precision": 0.9515323117921386,
"eval_recall": 0.9614607876135981,
"eval_runtime": 6.178,
"eval_samples_per_second": 526.219,
"eval_steps_per_second": 0.647,
"step": 1250
},
{
"epoch": 5.8,
"eval_accuracy": 0.9924457770336046,
"eval_f1": 0.9560485558811219,
"eval_loss": 0.03838498517870903,
"eval_precision": 0.9511910711311011,
"eval_recall": 0.9609559071019859,
"eval_runtime": 6.3664,
"eval_samples_per_second": 510.65,
"eval_steps_per_second": 0.628,
"step": 1275
},
{
"epoch": 5.91,
"eval_accuracy": 0.9924068377399634,
"eval_f1": 0.9571045576407506,
"eval_loss": 0.03946718946099281,
"eval_precision": 0.9529529529529529,
"eval_recall": 0.9612924941097274,
"eval_runtime": 6.1196,
"eval_samples_per_second": 531.242,
"eval_steps_per_second": 0.654,
"step": 1300
},
{
"epoch": 6.02,
"eval_accuracy": 0.9919200965694482,
"eval_f1": 0.9533869885982562,
"eval_loss": 0.04075756296515465,
"eval_precision": 0.9498830604744404,
"eval_recall": 0.9569168630090878,
"eval_runtime": 6.1927,
"eval_samples_per_second": 524.974,
"eval_steps_per_second": 0.646,
"step": 1325
},
{
"epoch": 6.14,
"eval_accuracy": 0.9921732019781161,
"eval_f1": 0.9547998997409975,
"eval_loss": 0.04120802879333496,
"eval_precision": 0.948067031690725,
"eval_recall": 0.9616290811174689,
"eval_runtime": 6.3552,
"eval_samples_per_second": 511.548,
"eval_steps_per_second": 0.629,
"step": 1350
},
{
"epoch": 6.25,
"eval_accuracy": 0.9923873680931428,
"eval_f1": 0.9555667337357477,
"eval_loss": 0.0413355678319931,
"eval_precision": 0.952054794520548,
"eval_recall": 0.9591046785594076,
"eval_runtime": 6.2847,
"eval_samples_per_second": 517.288,
"eval_steps_per_second": 0.636,
"step": 1375
},
{
"epoch": 6.36,
"eval_accuracy": 0.9917448697480628,
"eval_f1": 0.9525004181301221,
"eval_loss": 0.04124680161476135,
"eval_precision": 0.9466422872340425,
"eval_recall": 0.9584315045439246,
"eval_runtime": 6.4524,
"eval_samples_per_second": 503.841,
"eval_steps_per_second": 0.62,
"step": 1400
},
{
"epoch": 6.48,
"eval_accuracy": 0.9920953233908337,
"eval_f1": 0.9555611348229978,
"eval_loss": 0.040540654212236404,
"eval_precision": 0.9503912102547029,
"eval_recall": 0.9607876135981152,
"eval_runtime": 6.1266,
"eval_samples_per_second": 530.638,
"eval_steps_per_second": 0.653,
"step": 1425
},
{
"epoch": 6.59,
"eval_accuracy": 0.9925041859740664,
"eval_f1": 0.9565508580996233,
"eval_loss": 0.04004018381237984,
"eval_precision": 0.9516908212560387,
"eval_recall": 0.9614607876135981,
"eval_runtime": 6.4161,
"eval_samples_per_second": 506.697,
"eval_steps_per_second": 0.623,
"step": 1450
},
{
"epoch": 6.7,
"eval_accuracy": 0.9922900198590398,
"eval_f1": 0.9551813688531458,
"eval_loss": 0.039815619587898254,
"eval_precision": 0.9509591326105088,
"eval_recall": 0.9594412655671491,
"eval_runtime": 6.2578,
"eval_samples_per_second": 519.511,
"eval_steps_per_second": 0.639,
"step": 1475
},
{
"epoch": 6.82,
"learning_rate": 1.909090909090909e-05,
"loss": 0.0049,
"step": 1500
},
{
"epoch": 6.82,
"eval_accuracy": 0.9925431252677076,
"eval_f1": 0.956871283812076,
"eval_loss": 0.03951007500290871,
"eval_precision": 0.9523253875645941,
"eval_recall": 0.9614607876135981,
"eval_runtime": 6.2854,
"eval_samples_per_second": 517.232,
"eval_steps_per_second": 0.636,
"step": 1500
},
{
"epoch": 6.93,
"eval_accuracy": 0.9927183520890931,
"eval_f1": 0.9571476397723468,
"eval_loss": 0.03918459266424179,
"eval_precision": 0.952047952047952,
"eval_recall": 0.9623022551329519,
"eval_runtime": 6.1825,
"eval_samples_per_second": 525.837,
"eval_steps_per_second": 0.647,
"step": 1525
},
{
"epoch": 7.05,
"eval_accuracy": 0.9923484287995016,
"eval_f1": 0.9551738583996647,
"eval_loss": 0.03897989168763161,
"eval_precision": 0.9511096278992157,
"eval_recall": 0.9592729720632783,
"eval_runtime": 6.0468,
"eval_samples_per_second": 537.641,
"eval_steps_per_second": 0.662,
"step": 1550
},
{
"epoch": 7.16,
"eval_accuracy": 0.9925431252677076,
"eval_f1": 0.9565363034921699,
"eval_loss": 0.03931865468621254,
"eval_precision": 0.9519919986664445,
"eval_recall": 0.9611242006058566,
"eval_runtime": 6.2528,
"eval_samples_per_second": 519.93,
"eval_steps_per_second": 0.64,
"step": 1575
},
{
"epoch": 7.27,
"eval_accuracy": 0.9925236556208871,
"eval_f1": 0.9562233196618398,
"eval_loss": 0.03892602398991585,
"eval_precision": 0.9512073272273106,
"eval_recall": 0.9612924941097274,
"eval_runtime": 6.0818,
"eval_samples_per_second": 534.544,
"eval_steps_per_second": 0.658,
"step": 1600
},
{
"epoch": 7.39,
"eval_accuracy": 0.9923678984463222,
"eval_f1": 0.9565435820145692,
"eval_loss": 0.0404973067343235,
"eval_precision": 0.9518413597733711,
"eval_recall": 0.9612924941097274,
"eval_runtime": 6.1086,
"eval_samples_per_second": 532.197,
"eval_steps_per_second": 0.655,
"step": 1625
},
{
"epoch": 7.5,
"eval_accuracy": 0.9924847163272458,
"eval_f1": 0.9558737335677803,
"eval_loss": 0.04104885458946228,
"eval_precision": 0.9511748041993001,
"eval_recall": 0.9606193200942443,
"eval_runtime": 6.3603,
"eval_samples_per_second": 511.14,
"eval_steps_per_second": 0.629,
"step": 1650
},
{
"epoch": 7.61,
"eval_accuracy": 0.9925431252677076,
"eval_f1": 0.9569442117607639,
"eval_loss": 0.04079214483499527,
"eval_precision": 0.95263509006004,
"eval_recall": 0.9612924941097274,
"eval_runtime": 6.0876,
"eval_samples_per_second": 534.04,
"eval_steps_per_second": 0.657,
"step": 1675
},
{
"epoch": 7.73,
"eval_accuracy": 0.9921732019781161,
"eval_f1": 0.9545302574389837,
"eval_loss": 0.043598320335149765,
"eval_precision": 0.9481899701095982,
"eval_recall": 0.9609559071019859,
"eval_runtime": 6.3314,
"eval_samples_per_second": 513.469,
"eval_steps_per_second": 0.632,
"step": 1700
},
{
"epoch": 7.84,
"eval_accuracy": 0.9924068377399634,
"eval_f1": 0.9559548683660676,
"eval_loss": 0.0419035442173481,
"eval_precision": 0.9495268138801262,
"eval_recall": 0.9624705486368226,
"eval_runtime": 6.237,
"eval_samples_per_second": 521.246,
"eval_steps_per_second": 0.641,
"step": 1725
},
{
"epoch": 7.95,
"eval_accuracy": 0.9925625949145283,
"eval_f1": 0.957126109529392,
"eval_loss": 0.04293340817093849,
"eval_precision": 0.9525,
"eval_recall": 0.9617973746213396,
"eval_runtime": 6.1487,
"eval_samples_per_second": 528.734,
"eval_steps_per_second": 0.651,
"step": 1750
},
{
"epoch": 8.07,
"eval_accuracy": 0.9924068377399634,
"eval_f1": 0.9561506276150629,
"eval_loss": 0.041886329650878906,
"eval_precision": 0.9508988015978695,
"eval_recall": 0.9614607876135981,
"eval_runtime": 6.3754,
"eval_samples_per_second": 509.93,
"eval_steps_per_second": 0.627,
"step": 1775
},
{
"epoch": 8.18,
"eval_accuracy": 0.9922900198590398,
"eval_f1": 0.9555313625324512,
"eval_loss": 0.04220963269472122,
"eval_precision": 0.9509918319719953,
"eval_recall": 0.9601144395826321,
"eval_runtime": 6.1129,
"eval_samples_per_second": 531.828,
"eval_steps_per_second": 0.654,
"step": 1800
},
{
"epoch": 8.3,
"eval_accuracy": 0.9923873680931428,
"eval_f1": 0.9561793045664014,
"eval_loss": 0.041702426970005035,
"eval_precision": 0.9521107959285834,
"eval_recall": 0.9602827330865029,
"eval_runtime": 6.3543,
"eval_samples_per_second": 511.618,
"eval_steps_per_second": 0.629,
"step": 1825
},
{
"epoch": 8.41,
"eval_accuracy": 0.9924652466804252,
"eval_f1": 0.9570171763720151,
"eval_loss": 0.04150727763772011,
"eval_precision": 0.952945102619723,
"eval_recall": 0.9611242006058566,
"eval_runtime": 6.1032,
"eval_samples_per_second": 532.671,
"eval_steps_per_second": 0.655,
"step": 1850
},
{
"epoch": 8.52,
"eval_accuracy": 0.9924263073867841,
"eval_f1": 0.9566965407488064,
"eval_loss": 0.04162871465086937,
"eval_precision": 0.952309488077372,
"eval_recall": 0.9611242006058566,
"eval_runtime": 6.1162,
"eval_samples_per_second": 531.542,
"eval_steps_per_second": 0.654,
"step": 1875
},
{
"epoch": 8.64,
"eval_accuracy": 0.9922316109185779,
"eval_f1": 0.9555611348229978,
"eval_loss": 0.04189736768603325,
"eval_precision": 0.9503912102547029,
"eval_recall": 0.9607876135981152,
"eval_runtime": 6.4808,
"eval_samples_per_second": 501.634,
"eval_steps_per_second": 0.617,
"step": 1900
},
{
"epoch": 8.75,
"eval_accuracy": 0.9923873680931428,
"eval_f1": 0.9564489112227805,
"eval_loss": 0.04165585711598396,
"eval_precision": 0.9519839946648883,
"eval_recall": 0.9609559071019859,
"eval_runtime": 6.2132,
"eval_samples_per_second": 523.242,
"eval_steps_per_second": 0.644,
"step": 1925
},
{
"epoch": 8.86,
"eval_accuracy": 0.9926015342081694,
"eval_f1": 0.9577818730105546,
"eval_loss": 0.041886311024427414,
"eval_precision": 0.9534689793195463,
"eval_recall": 0.9621339616290812,
"eval_runtime": 6.5243,
"eval_samples_per_second": 498.291,
"eval_steps_per_second": 0.613,
"step": 1950
},
{
"epoch": 8.98,
"eval_accuracy": 0.9926599431486313,
"eval_f1": 0.9575341318368372,
"eval_loss": 0.04215257614850998,
"eval_precision": 0.9531432382858096,
"eval_recall": 0.9619656681252103,
"eval_runtime": 6.2104,
"eval_samples_per_second": 523.476,
"eval_steps_per_second": 0.644,
"step": 1975
},
{
"epoch": 9.09,
"learning_rate": 5.4545454545454545e-06,
"loss": 0.0022,
"step": 2000
},
{
"epoch": 9.09,
"eval_accuracy": 0.9925820645613489,
"eval_f1": 0.9571847507331379,
"eval_loss": 0.04227477312088013,
"eval_precision": 0.953111963957951,
"eval_recall": 0.9612924941097274,
"eval_runtime": 6.1893,
"eval_samples_per_second": 525.265,
"eval_steps_per_second": 0.646,
"step": 2000
},
{
"epoch": 9.2,
"eval_accuracy": 0.9925431252677076,
"eval_f1": 0.9567110441262665,
"eval_loss": 0.042577099055051804,
"eval_precision": 0.9520079986668889,
"eval_recall": 0.9614607876135981,
"eval_runtime": 6.2434,
"eval_samples_per_second": 520.71,
"eval_steps_per_second": 0.641,
"step": 2025
},
{
"epoch": 9.32,
"eval_accuracy": 0.9924652466804252,
"eval_f1": 0.9560338330123105,
"eval_loss": 0.04250513017177582,
"eval_precision": 0.9514919153192198,
"eval_recall": 0.9606193200942443,
"eval_runtime": 5.9913,
"eval_samples_per_second": 542.619,
"eval_steps_per_second": 0.668,
"step": 2050
},
{
"epoch": 9.43,
"eval_accuracy": 0.9925431252677076,
"eval_f1": 0.956463496316142,
"eval_loss": 0.0422191396355629,
"eval_precision": 0.951682772409197,
"eval_recall": 0.9612924941097274,
"eval_runtime": 6.2812,
"eval_samples_per_second": 517.58,
"eval_steps_per_second": 0.637,
"step": 2075
},
{
"epoch": 9.55,
"eval_accuracy": 0.9924847163272458,
"eval_f1": 0.9559537765868363,
"eval_loss": 0.0423436276614666,
"eval_precision": 0.9513333333333334,
"eval_recall": 0.9606193200942443,
"eval_runtime": 6.0529,
"eval_samples_per_second": 537.095,
"eval_steps_per_second": 0.661,
"step": 2100
},
{
"epoch": 9.66,
"eval_accuracy": 0.9924652466804252,
"eval_f1": 0.9558663428523575,
"eval_loss": 0.04235740005970001,
"eval_precision": 0.951325220870145,
"eval_recall": 0.9604510265903736,
"eval_runtime": 6.0731,
"eval_samples_per_second": 535.315,
"eval_steps_per_second": 0.659,
"step": 2125
},
{
"epoch": 9.77,
"eval_accuracy": 0.9924652466804252,
"eval_f1": 0.9566164154103852,
"eval_loss": 0.042295120656490326,
"eval_precision": 0.9521507169056352,
"eval_recall": 0.9611242006058566,
"eval_runtime": 6.3348,
"eval_samples_per_second": 513.197,
"eval_steps_per_second": 0.631,
"step": 2150
},
{
"epoch": 9.89,
"eval_accuracy": 0.9924847163272458,
"eval_f1": 0.9567037936521229,
"eval_loss": 0.04226445034146309,
"eval_precision": 0.9521586931155193,
"eval_recall": 0.9612924941097274,
"eval_runtime": 6.1145,
"eval_samples_per_second": 531.688,
"eval_steps_per_second": 0.654,
"step": 2175
},
{
"epoch": 10.0,
"eval_accuracy": 0.9925236556208871,
"eval_f1": 0.9570387739720292,
"eval_loss": 0.04224075376987457,
"eval_precision": 0.952492082013669,
"eval_recall": 0.9616290811174689,
"eval_runtime": 6.3677,
"eval_samples_per_second": 510.543,
"eval_steps_per_second": 0.628,
"step": 2200
},
{
"epoch": 10.0,
"step": 2200,
"total_flos": 4144211411102244.0,
"train_loss": 0.021953743980689482,
"train_runtime": 1324.4932,
"train_samples_per_second": 106.018,
"train_steps_per_second": 1.661
}
],
"max_steps": 2200,
"num_train_epochs": 10,
"total_flos": 4144211411102244.0,
"trial_name": null,
"trial_params": null
}