{ "best_metric": 0.6934678744913757, "best_model_checkpoint": "sloberta_sentinews_sentence_2e-05_10e_lr2e-05/checkpoint-3560", "epoch": 2.9966329966329965, "global_step": 3560, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.03, "learning_rate": 1.9932659932659936e-05, "loss": 0.9684, "step": 40 }, { "epoch": 0.03, "eval_accuracy": 0.5901716992303138, "eval_f1_macro": 0.3290637211523573, "eval_f1_negative": 0.25811001410437234, "eval_f1_neutral": 0.7290811493526997, "eval_f1_positive": 0.0, "eval_loss": 0.9020117521286011, "eval_precision_negative": 0.6455026455026455, "eval_precision_neutral": 0.5861893881695862, "eval_precision_positive": 0.0, "eval_recall_negative": 0.16130453944468928, "eval_recall_neutral": 0.9640918580375782, "eval_recall_positive": 0.0, "eval_runtime": 13.6446, "eval_samples_per_second": 618.928, "eval_steps_per_second": 3.225, "step": 40 }, { "epoch": 0.07, "learning_rate": 1.9865319865319866e-05, "loss": 0.8398, "step": 80 }, { "epoch": 0.07, "eval_accuracy": 0.6470100651272943, "eval_f1_macro": 0.5536698584230076, "eval_f1_negative": 0.5115520521880946, "eval_f1_neutral": 0.7385869565217391, "eval_f1_positive": 0.4108705665591893, "eval_loss": 0.7759891152381897, "eval_precision_negative": 0.6673758865248227, "eval_precision_neutral": 0.65232, "eval_precision_positive": 0.5681528662420382, "eval_recall_negative": 0.41472014103129134, "eval_recall_neutral": 0.8511482254697286, "eval_recall_positive": 0.3217893217893218, "eval_runtime": 13.475, "eval_samples_per_second": 626.715, "eval_steps_per_second": 3.265, "step": 80 }, { "epoch": 0.1, "learning_rate": 1.97979797979798e-05, "loss": 0.7748, "step": 120 }, { "epoch": 0.1, "eval_accuracy": 0.6824156305506217, "eval_f1_macro": 0.6410968890440648, "eval_f1_negative": 0.6465890942276981, "eval_f1_neutral": 0.7394423944239442, "eval_f1_positive": 0.5372591784805524, "eval_loss": 0.7227517366409302, "eval_precision_negative": 0.6702932828760644, "eval_precision_neutral": 0.7263391059202577, "eval_precision_positive": 0.5413919413919414, "eval_recall_negative": 0.624504186866461, "eval_recall_neutral": 0.753027139874739, "eval_recall_positive": 0.5331890331890332, "eval_runtime": 13.5517, "eval_samples_per_second": 623.169, "eval_steps_per_second": 3.247, "step": 120 }, { "epoch": 0.13, "learning_rate": 1.973063973063973e-05, "loss": 0.7661, "step": 160 }, { "epoch": 0.13, "eval_accuracy": 0.6966252220248668, "eval_f1_macro": 0.6402639165706846, "eval_f1_negative": 0.6606451612903226, "eval_f1_neutral": 0.755861518507433, "eval_f1_positive": 0.5042850699142984, "eval_loss": 0.6990944147109985, "eval_precision_negative": 0.6451070978580429, "eval_precision_neutral": 0.7238677622778521, "eval_precision_positive": 0.6726835138387485, "eval_recall_negative": 0.6769501983252534, "eval_recall_neutral": 0.7908141962421712, "eval_recall_positive": 0.4033189033189033, "eval_runtime": 13.529, "eval_samples_per_second": 624.216, "eval_steps_per_second": 3.252, "step": 160 }, { "epoch": 0.17, "learning_rate": 1.9663299663299665e-05, "loss": 0.7329, "step": 200 }, { "epoch": 0.17, "eval_accuracy": 0.6814683244523386, "eval_f1_macro": 0.6584553155124641, "eval_f1_negative": 0.6805819101834283, "eval_f1_neutral": 0.7180338757887746, "eval_f1_positive": 0.5767501605651895, "eval_loss": 0.7035245299339294, "eval_precision_negative": 0.6523848019401779, "eval_precision_neutral": 0.7643176997407495, "eval_precision_positive": 0.5196759259259259, "eval_recall_negative": 0.7113265755839577, "eval_recall_neutral": 0.677035490605428, "eval_recall_positive": 0.6479076479076479, "eval_runtime": 13.5578, "eval_samples_per_second": 622.89, "eval_steps_per_second": 3.245, "step": 200 }, { "epoch": 0.2, "learning_rate": 1.9595959595959596e-05, "loss": 0.7084, "step": 240 }, { "epoch": 0.2, "eval_accuracy": 0.7044404973357016, "eval_f1_macro": 0.6484202003006585, "eval_f1_negative": 0.6737166776823088, "eval_f1_neutral": 0.7610199644198458, "eval_f1_positive": 0.5105239587998209, "eval_loss": 0.6696082353591919, "eval_precision_negative": 0.673568281938326, "eval_precision_neutral": 0.7225975975975976, "eval_precision_positive": 0.6729634002361276, "eval_recall_negative": 0.6738651388276774, "eval_recall_neutral": 0.8037578288100209, "eval_recall_positive": 0.41125541125541126, "eval_runtime": 13.468, "eval_samples_per_second": 627.04, "eval_steps_per_second": 3.267, "step": 240 }, { "epoch": 0.24, "learning_rate": 1.952861952861953e-05, "loss": 0.6878, "step": 280 }, { "epoch": 0.24, "eval_accuracy": 0.6889283599763173, "eval_f1_macro": 0.6646815029633141, "eval_f1_negative": 0.6859417557091976, "eval_f1_neutral": 0.7256559446701065, "eval_f1_positive": 0.5824468085106382, "eval_loss": 0.6821370720863342, "eval_precision_negative": 0.6537539936102237, "eval_precision_neutral": 0.7652234313498495, "eval_precision_positive": 0.5400739827373613, "eval_recall_negative": 0.7214631996474218, "eval_recall_neutral": 0.6899791231732777, "eval_recall_positive": 0.6320346320346321, "eval_runtime": 13.4239, "eval_samples_per_second": 629.1, "eval_steps_per_second": 3.278, "step": 280 }, { "epoch": 0.27, "learning_rate": 1.9461279461279464e-05, "loss": 0.7059, "step": 320 }, { "epoch": 0.27, "eval_accuracy": 0.7119005328596802, "eval_f1_macro": 0.6649492798540481, "eval_f1_negative": 0.6837046745303625, "eval_f1_neutral": 0.763837267704671, "eval_f1_positive": 0.5473058973271108, "eval_loss": 0.662620484828949, "eval_precision_negative": 0.6777825898657427, "eval_precision_neutral": 0.736108422071636, "eval_precision_positive": 0.6642636457260556, "eval_recall_negative": 0.6897311591009255, "eval_recall_neutral": 0.7937369519832985, "eval_recall_positive": 0.4653679653679654, "eval_runtime": 13.4494, "eval_samples_per_second": 627.911, "eval_steps_per_second": 3.272, "step": 320 }, { "epoch": 0.3, "learning_rate": 1.9393939393939395e-05, "loss": 0.6745, "step": 360 }, { "epoch": 0.3, "eval_accuracy": 0.709295441089402, "eval_f1_macro": 0.6599969904410593, "eval_f1_negative": 0.6773485513608428, "eval_f1_neutral": 0.7627118644067796, "eval_f1_positive": 0.5399305555555556, "eval_loss": 0.6554310917854309, "eval_precision_negative": 0.674682990817665, "eval_precision_neutral": 0.7299618320610687, "eval_precision_positive": 0.6775599128540305, "eval_recall_negative": 0.6800352578228295, "eval_recall_neutral": 0.7985386221294363, "eval_recall_positive": 0.44877344877344877, "eval_runtime": 13.4392, "eval_samples_per_second": 628.385, "eval_steps_per_second": 3.274, "step": 360 }, { "epoch": 0.34, "learning_rate": 1.932659932659933e-05, "loss": 0.6824, "step": 400 }, { "epoch": 0.34, "eval_accuracy": 0.7095322676139728, "eval_f1_macro": 0.6638552526690601, "eval_f1_negative": 0.6730469619407968, "eval_f1_neutral": 0.7641443071048136, "eval_f1_positive": 0.5543744889615698, "eval_loss": 0.6521803736686707, "eval_precision_negative": 0.6798561151079137, "eval_precision_neutral": 0.7366789381902732, "eval_precision_positive": 0.6396226415094339, "eval_recall_negative": 0.6663728514764213, "eval_recall_neutral": 0.7937369519832985, "eval_recall_positive": 0.48917748917748916, "eval_runtime": 13.4346, "eval_samples_per_second": 628.599, "eval_steps_per_second": 3.275, "step": 400 }, { "epoch": 0.37, "learning_rate": 1.925925925925926e-05, "loss": 0.669, "step": 440 }, { "epoch": 0.37, "eval_accuracy": 0.713084665482534, "eval_f1_macro": 0.6622007799006476, "eval_f1_negative": 0.6819873057561829, "eval_f1_neutral": 0.7671314741035858, "eval_f1_positive": 0.5374835598421743, "eval_loss": 0.6492008566856384, "eval_precision_negative": 0.6773913043478261, "eval_precision_neutral": 0.7335238095238096, "eval_precision_positive": 0.6849162011173184, "eval_recall_negative": 0.6866460996033495, "eval_recall_neutral": 0.8039665970772443, "eval_recall_positive": 0.4422799422799423, "eval_runtime": 13.4531, "eval_samples_per_second": 627.738, "eval_steps_per_second": 3.271, "step": 440 }, { "epoch": 0.4, "learning_rate": 1.9191919191919194e-05, "loss": 0.6835, "step": 480 }, { "epoch": 0.4, "eval_accuracy": 0.7045589105979869, "eval_f1_macro": 0.6620625908815416, "eval_f1_negative": 0.6357811729916215, "eval_f1_neutral": 0.7631345490389355, "eval_f1_positive": 0.5872720506140677, "eval_loss": 0.6506330966949463, "eval_precision_negative": 0.7210732252655114, "eval_precision_neutral": 0.722875816993464, "eval_precision_positive": 0.606456571867794, "eval_recall_negative": 0.5685323931247246, "eval_recall_neutral": 0.8081419624217119, "eval_recall_positive": 0.5692640692640693, "eval_runtime": 13.434, "eval_samples_per_second": 628.63, "eval_steps_per_second": 3.275, "step": 480 }, { "epoch": 0.44, "learning_rate": 1.9124579124579125e-05, "loss": 0.659, "step": 520 }, { "epoch": 0.44, "eval_accuracy": 0.7040852575488454, "eval_f1_macro": 0.6783997964045833, "eval_f1_negative": 0.699721226602947, "eval_f1_neutral": 0.7399162442142384, "eval_f1_positive": 0.595561918396564, "eval_loss": 0.6650780439376831, "eval_precision_negative": 0.6382128586996004, "eval_precision_neutral": 0.7836134453781513, "eval_precision_positive": 0.5909090909090909, "eval_recall_negative": 0.7743499338915822, "eval_recall_neutral": 0.7008350730688935, "eval_recall_positive": 0.6002886002886003, "eval_runtime": 13.4366, "eval_samples_per_second": 628.508, "eval_steps_per_second": 3.275, "step": 520 }, { "epoch": 0.47, "learning_rate": 1.905723905723906e-05, "loss": 0.6554, "step": 560 }, { "epoch": 0.47, "eval_accuracy": 0.7166370633510953, "eval_f1_macro": 0.6722586905255515, "eval_f1_negative": 0.6801165657924232, "eval_f1_neutral": 0.7694463910301331, "eval_f1_positive": 0.5672131147540983, "eval_loss": 0.6467012763023376, "eval_precision_negative": 0.6920620437956204, "eval_precision_neutral": 0.7391806116560877, "eval_precision_positive": 0.6565464895635673, "eval_recall_negative": 0.6685764654032613, "eval_recall_neutral": 0.8022964509394572, "eval_recall_positive": 0.49927849927849927, "eval_runtime": 13.4494, "eval_samples_per_second": 627.909, "eval_steps_per_second": 3.272, "step": 560 }, { "epoch": 0.51, "learning_rate": 1.8989898989898993e-05, "loss": 0.659, "step": 600 }, { "epoch": 0.51, "eval_accuracy": 0.712137359384251, "eval_f1_macro": 0.6705187144410446, "eval_f1_negative": 0.6719478098788444, "eval_f1_neutral": 0.7654419861848032, "eval_f1_positive": 0.5741663472594865, "eval_loss": 0.6443530917167664, "eval_precision_negative": 0.71280276816609, "eval_precision_neutral": 0.7353337180226966, "eval_precision_positive": 0.6124284546197875, "eval_recall_negative": 0.6355222565006611, "eval_recall_neutral": 0.7981210855949895, "eval_recall_positive": 0.5404040404040404, "eval_runtime": 13.4345, "eval_samples_per_second": 628.604, "eval_steps_per_second": 3.275, "step": 600 }, { "epoch": 0.54, "learning_rate": 1.8922558922558924e-05, "loss": 0.6692, "step": 640 }, { "epoch": 0.54, "eval_accuracy": 0.7047957371225577, "eval_f1_macro": 0.6746517865902923, "eval_f1_negative": 0.6761710794297353, "eval_f1_neutral": 0.7508104151416919, "eval_f1_positive": 0.5969738651994497, "eval_loss": 0.6483765244483948, "eval_precision_negative": 0.6948837209302325, "eval_precision_neutral": 0.7521474963335428, "eval_precision_positive": 0.5703022339027596, "eval_recall_negative": 0.6584398413397973, "eval_recall_neutral": 0.7494780793319415, "eval_recall_positive": 0.6262626262626263, "eval_runtime": 13.5781, "eval_samples_per_second": 621.958, "eval_steps_per_second": 3.241, "step": 640 }, { "epoch": 0.57, "learning_rate": 1.8855218855218858e-05, "loss": 0.6343, "step": 680 }, { "epoch": 0.57, "eval_accuracy": 0.7084665482534044, "eval_f1_macro": 0.6745823109427566, "eval_f1_negative": 0.6674407803065491, "eval_f1_neutral": 0.7580216636010628, "eval_f1_positive": 0.5982844889206576, "eval_loss": 0.6420348286628723, "eval_precision_negative": 0.7054491899852725, "eval_precision_neutral": 0.7423939151321057, "eval_precision_positive": 0.5927762039660056, "eval_recall_negative": 0.6333186425738211, "eval_recall_neutral": 0.774321503131524, "eval_recall_positive": 0.6038961038961039, "eval_runtime": 13.5238, "eval_samples_per_second": 624.455, "eval_steps_per_second": 3.254, "step": 680 }, { "epoch": 0.61, "learning_rate": 1.8787878787878792e-05, "loss": 0.6707, "step": 720 }, { "epoch": 0.61, "eval_accuracy": 0.7161634103019539, "eval_f1_macro": 0.6635859690261697, "eval_f1_negative": 0.6552984165651644, "eval_f1_neutral": 0.7757296466973886, "eval_f1_positive": 0.5597298438159561, "eval_loss": 0.630727231502533, "eval_precision_negative": 0.7325708061002179, "eval_precision_neutral": 0.7180945609669392, "eval_precision_positive": 0.6744659206510681, "eval_recall_negative": 0.5927721463199648, "eval_recall_neutral": 0.8434237995824635, "eval_recall_positive": 0.47835497835497837, "eval_runtime": 13.5358, "eval_samples_per_second": 623.902, "eval_steps_per_second": 3.251, "step": 720 }, { "epoch": 0.64, "learning_rate": 1.8720538720538723e-05, "loss": 0.6555, "step": 760 }, { "epoch": 0.64, "eval_accuracy": 0.7173475429248076, "eval_f1_macro": 0.6760934295779212, "eval_f1_negative": 0.6785469499657298, "eval_f1_neutral": 0.7685231476852316, "eval_f1_positive": 0.5812101910828025, "eval_loss": 0.6327303051948547, "eval_precision_negative": 0.7044592030360531, "eval_precision_neutral": 0.7374784110535406, "eval_precision_positive": 0.6483126110124334, "eval_recall_negative": 0.6544733362714852, "eval_recall_neutral": 0.8022964509394572, "eval_recall_positive": 0.5266955266955267, "eval_runtime": 13.5283, "eval_samples_per_second": 624.249, "eval_steps_per_second": 3.252, "step": 760 }, { "epoch": 0.67, "learning_rate": 1.8653198653198653e-05, "loss": 0.6539, "step": 800 }, { "epoch": 0.67, "eval_accuracy": 0.713676731793961, "eval_f1_macro": 0.6798716085872009, "eval_f1_negative": 0.6834306241580603, "eval_f1_neutral": 0.7602507450416196, "eval_f1_positive": 0.5959334565619224, "eval_loss": 0.63933926820755, "eval_precision_negative": 0.6965675057208238, "eval_precision_neutral": 0.7486338797814208, "eval_precision_positive": 0.6110689916603488, "eval_recall_negative": 0.6707800793301014, "eval_recall_neutral": 0.7722338204592902, "eval_recall_positive": 0.5815295815295816, "eval_runtime": 13.556, "eval_samples_per_second": 622.971, "eval_steps_per_second": 3.246, "step": 800 }, { "epoch": 0.71, "learning_rate": 1.8585858585858588e-05, "loss": 0.6586, "step": 840 }, { "epoch": 0.71, "eval_accuracy": 0.7122557726465364, "eval_f1_macro": 0.6643997026372683, "eval_f1_negative": 0.6466569058077111, "eval_f1_neutral": 0.7709443099273607, "eval_f1_positive": 0.575597892176733, "eval_loss": 0.6333789229393005, "eval_precision_negative": 0.7244395844723893, "eval_precision_neutral": 0.7190605239385727, "eval_precision_positive": 0.6567992599444958, "eval_recall_negative": 0.5839576906126047, "eval_recall_neutral": 0.8308977035490606, "eval_recall_positive": 0.5122655122655123, "eval_runtime": 13.615, "eval_samples_per_second": 620.272, "eval_steps_per_second": 3.232, "step": 840 }, { "epoch": 0.74, "learning_rate": 1.851851851851852e-05, "loss": 0.6579, "step": 880 }, { "epoch": 0.74, "eval_accuracy": 0.7187685020722321, "eval_f1_macro": 0.6807447825123648, "eval_f1_negative": 0.6873633581110626, "eval_f1_neutral": 0.7675631455159013, "eval_f1_positive": 0.5873078439101301, "eval_loss": 0.6417641639709473, "eval_precision_negative": 0.6819956616052061, "eval_precision_neutral": 0.7522549609140108, "eval_precision_positive": 0.6472632493483927, "eval_recall_negative": 0.6928162185985015, "eval_recall_neutral": 0.7835073068893528, "eval_recall_positive": 0.5375180375180375, "eval_runtime": 13.429, "eval_samples_per_second": 628.863, "eval_steps_per_second": 3.276, "step": 880 }, { "epoch": 0.77, "learning_rate": 1.8451178451178452e-05, "loss": 0.6408, "step": 920 }, { "epoch": 0.77, "eval_accuracy": 0.7156897572528124, "eval_f1_macro": 0.6733312463576527, "eval_f1_negative": 0.6765443355368133, "eval_f1_neutral": 0.7680304091227369, "eval_f1_positive": 0.5754189944134079, "eval_loss": 0.6319063901901245, "eval_precision_negative": 0.7006610009442871, "eval_precision_neutral": 0.7372767428461686, "eval_precision_positive": 0.64375, "eval_recall_negative": 0.6540326134861172, "eval_recall_neutral": 0.8014613778705637, "eval_recall_positive": 0.5202020202020202, "eval_runtime": 13.4319, "eval_samples_per_second": 628.725, "eval_steps_per_second": 3.276, "step": 920 }, { "epoch": 0.81, "learning_rate": 1.8383838383838387e-05, "loss": 0.6458, "step": 960 }, { "epoch": 0.81, "eval_accuracy": 0.7116637063351096, "eval_f1_macro": 0.6808189121483205, "eval_f1_negative": 0.6855624446412755, "eval_f1_neutral": 0.7558841907935847, "eval_f1_positive": 0.601010101010101, "eval_loss": 0.6365010142326355, "eval_precision_negative": 0.6889185580774366, "eval_precision_neutral": 0.7541562759767249, "eval_precision_positive": 0.601010101010101, "eval_recall_negative": 0.6822388717496695, "eval_recall_neutral": 0.7576200417536535, "eval_recall_positive": 0.601010101010101, "eval_runtime": 13.4342, "eval_samples_per_second": 628.619, "eval_steps_per_second": 3.275, "step": 960 }, { "epoch": 0.84, "learning_rate": 1.831649831649832e-05, "loss": 0.6663, "step": 1000 }, { "epoch": 0.84, "eval_accuracy": 0.7177027827116637, "eval_f1_macro": 0.6745871543495067, "eval_f1_negative": 0.6834215167548501, "eval_f1_neutral": 0.7686739720518749, "eval_f1_positive": 0.5716659742417948, "eval_loss": 0.6319110989570618, "eval_precision_negative": 0.6837229819144244, "eval_precision_neutral": 0.7413224743067675, "eval_precision_positive": 0.67384916748286, "eval_recall_negative": 0.6831203173204055, "eval_recall_neutral": 0.7981210855949895, "eval_recall_positive": 0.4963924963924964, "eval_runtime": 13.4422, "eval_samples_per_second": 628.246, "eval_steps_per_second": 3.273, "step": 1000 }, { "epoch": 0.88, "learning_rate": 1.824915824915825e-05, "loss": 0.6456, "step": 1040 }, { "epoch": 0.88, "eval_accuracy": 0.7104795737122558, "eval_f1_macro": 0.6846884030136478, "eval_f1_negative": 0.6933867735470942, "eval_f1_neutral": 0.7508249068653539, "eval_f1_positive": 0.6098535286284953, "eval_loss": 0.6414014101028442, "eval_precision_negative": 0.7007200720072008, "eval_precision_neutral": 0.7659066232356134, "eval_precision_positive": 0.5661310259579728, "eval_recall_negative": 0.6862053768179814, "eval_recall_neutral": 0.7363256784968685, "eval_recall_positive": 0.6608946608946609, "eval_runtime": 13.4341, "eval_samples_per_second": 628.625, "eval_steps_per_second": 3.275, "step": 1040 }, { "epoch": 0.91, "learning_rate": 1.8181818181818182e-05, "loss": 0.6416, "step": 1080 }, { "epoch": 0.91, "eval_accuracy": 0.7153345174659562, "eval_f1_macro": 0.6849725647884108, "eval_f1_negative": 0.6939308244507288, "eval_f1_neutral": 0.7585337674614012, "eval_f1_positive": 0.6024531024531025, "eval_loss": 0.6341109871864319, "eval_precision_negative": 0.6851374570446735, "eval_precision_neutral": 0.7632635806383429, "eval_precision_positive": 0.6024531024531025, "eval_recall_negative": 0.7029528426619657, "eval_recall_neutral": 0.7538622129436325, "eval_recall_positive": 0.6024531024531025, "eval_runtime": 13.5517, "eval_samples_per_second": 623.169, "eval_steps_per_second": 3.247, "step": 1080 }, { "epoch": 0.94, "learning_rate": 1.8114478114478116e-05, "loss": 0.6387, "step": 1120 }, { "epoch": 0.94, "eval_accuracy": 0.7132030787448195, "eval_f1_macro": 0.6812920768310707, "eval_f1_negative": 0.6735266604303087, "eval_f1_neutral": 0.7610456176319835, "eval_f1_positive": 0.60930395243092, "eval_loss": 0.6404346227645874, "eval_precision_negative": 0.7174887892376681, "eval_precision_neutral": 0.7476334340382679, "eval_precision_positive": 0.5913102511880516, "eval_recall_negative": 0.6346408109299251, "eval_recall_neutral": 0.7749478079331942, "eval_recall_positive": 0.6284271284271284, "eval_runtime": 13.5098, "eval_samples_per_second": 625.102, "eval_steps_per_second": 3.257, "step": 1120 }, { "epoch": 0.98, "learning_rate": 1.804713804713805e-05, "loss": 0.6483, "step": 1160 }, { "epoch": 0.98, "eval_accuracy": 0.7200710479573712, "eval_f1_macro": 0.6806619404824857, "eval_f1_negative": 0.6825213576541214, "eval_f1_neutral": 0.7708228674771426, "eval_f1_positive": 0.5886415963161934, "eval_loss": 0.6273576021194458, "eval_precision_negative": 0.7167798254122212, "eval_precision_neutral": 0.7429788882432694, "eval_precision_positive": 0.6286885245901639, "eval_recall_negative": 0.6513882767739092, "eval_recall_neutral": 0.8008350730688936, "eval_recall_positive": 0.5533910533910534, "eval_runtime": 13.5101, "eval_samples_per_second": 625.087, "eval_steps_per_second": 3.257, "step": 1160 }, { "epoch": 1.01, "learning_rate": 1.797979797979798e-05, "loss": 0.6418, "step": 1200 }, { "epoch": 1.01, "eval_accuracy": 0.7216104203670811, "eval_f1_macro": 0.6749026822057264, "eval_f1_negative": 0.6914728682170542, "eval_f1_neutral": 0.7730991818000399, "eval_f1_positive": 0.560135996600085, "eval_loss": 0.6303337812423706, "eval_precision_negative": 0.695013357079252, "eval_precision_neutral": 0.7404434250764526, "eval_precision_positive": 0.6814891416752844, "eval_recall_negative": 0.6879682679594535, "eval_recall_neutral": 0.808768267223382, "eval_recall_positive": 0.4754689754689755, "eval_runtime": 14.4031, "eval_samples_per_second": 586.332, "eval_steps_per_second": 3.055, "step": 1200 }, { "epoch": 1.04, "learning_rate": 1.7912457912457915e-05, "loss": 0.6201, "step": 1240 }, { "epoch": 1.04, "eval_accuracy": 0.7193605683836589, "eval_f1_macro": 0.6783071530429613, "eval_f1_negative": 0.6780135229657263, "eval_f1_neutral": 0.7719368378972615, "eval_f1_positive": 0.584971098265896, "eval_loss": 0.6306412220001221, "eval_precision_negative": 0.7198019801980198, "eval_precision_neutral": 0.7404141104294478, "eval_precision_positive": 0.6277915632754343, "eval_recall_negative": 0.6408109299250772, "eval_recall_neutral": 0.8062630480167015, "eval_recall_positive": 0.5476190476190477, "eval_runtime": 13.6129, "eval_samples_per_second": 620.369, "eval_steps_per_second": 3.232, "step": 1240 }, { "epoch": 1.08, "learning_rate": 1.7845117845117846e-05, "loss": 0.5971, "step": 1280 }, { "epoch": 1.08, "eval_accuracy": 0.7166370633510953, "eval_f1_macro": 0.6745910338462799, "eval_f1_negative": 0.6869394005688033, "eval_f1_neutral": 0.7662285136501515, "eval_f1_positive": 0.5706051873198847, "eval_loss": 0.6360566020011902, "eval_precision_negative": 0.682015638575152, "eval_precision_neutral": 0.7429411764705882, "eval_precision_positive": 0.6644295302013423, "eval_recall_negative": 0.6919347730277655, "eval_recall_neutral": 0.7910229645093946, "eval_recall_positive": 0.5, "eval_runtime": 13.5493, "eval_samples_per_second": 623.278, "eval_steps_per_second": 3.247, "step": 1280 }, { "epoch": 1.11, "learning_rate": 1.7777777777777777e-05, "loss": 0.6101, "step": 1320 }, { "epoch": 1.11, "eval_accuracy": 0.7226761397276495, "eval_f1_macro": 0.6791712549911954, "eval_f1_negative": 0.6990124516960068, "eval_f1_neutral": 0.7709451929895654, "eval_f1_positive": 0.5675561202880136, "eval_loss": 0.6358277201652527, "eval_precision_negative": 0.6814566764336543, "eval_precision_neutral": 0.748868333005314, "eval_precision_positive": 0.6871794871794872, "eval_recall_negative": 0.7174966945791097, "eval_recall_neutral": 0.7943632567849687, "eval_recall_positive": 0.4834054834054834, "eval_runtime": 13.4061, "eval_samples_per_second": 629.938, "eval_steps_per_second": 3.282, "step": 1320 }, { "epoch": 1.14, "learning_rate": 1.771043771043771e-05, "loss": 0.5977, "step": 1360 }, { "epoch": 1.14, "eval_accuracy": 0.7124925991711072, "eval_f1_macro": 0.6812595953156201, "eval_f1_negative": 0.6902101028162717, "eval_f1_neutral": 0.756903198916328, "eval_f1_positive": 0.5966654842142604, "eval_loss": 0.640369713306427, "eval_precision_negative": 0.7002267573696145, "eval_precision_neutral": 0.7555648013313917, "eval_precision_positive": 0.586880669923238, "eval_recall_negative": 0.6804759806081975, "eval_recall_neutral": 0.7582463465553236, "eval_recall_positive": 0.6067821067821068, "eval_runtime": 13.458, "eval_samples_per_second": 627.51, "eval_steps_per_second": 3.269, "step": 1360 }, { "epoch": 1.18, "learning_rate": 1.7643097643097645e-05, "loss": 0.6229, "step": 1400 }, { "epoch": 1.18, "eval_accuracy": 0.720307874481942, "eval_f1_macro": 0.6787577486913711, "eval_f1_negative": 0.6789838337182449, "eval_f1_neutral": 0.7721746063384493, "eval_f1_positive": 0.5851148060174189, "eval_loss": 0.625924825668335, "eval_precision_negative": 0.7132459970887919, "eval_precision_neutral": 0.7387490465293669, "eval_precision_positive": 0.6482456140350877, "eval_recall_negative": 0.6478624944909652, "eval_recall_neutral": 0.808768267223382, "eval_recall_positive": 0.5331890331890332, "eval_runtime": 13.413, "eval_samples_per_second": 629.615, "eval_steps_per_second": 3.28, "step": 1400 }, { "epoch": 1.21, "learning_rate": 1.7575757575757576e-05, "loss": 0.5971, "step": 1440 }, { "epoch": 1.21, "eval_accuracy": 0.7111900532859681, "eval_f1_macro": 0.685070727390424, "eval_f1_negative": 0.6965195246179966, "eval_f1_neutral": 0.7495985440530993, "eval_f1_positive": 0.6090941135001762, "eval_loss": 0.6486834287643433, "eval_precision_negative": 0.6717151043798608, "eval_precision_neutral": 0.7692814765985497, "eval_precision_positive": 0.5954514128187457, "eval_recall_negative": 0.7232260907888938, "eval_recall_neutral": 0.7308977035490606, "eval_recall_positive": 0.6233766233766234, "eval_runtime": 13.4217, "eval_samples_per_second": 629.204, "eval_steps_per_second": 3.278, "step": 1440 }, { "epoch": 1.25, "learning_rate": 1.750841750841751e-05, "loss": 0.6006, "step": 1480 }, { "epoch": 1.25, "eval_accuracy": 0.7155713439905269, "eval_f1_macro": 0.683204217410409, "eval_f1_negative": 0.6757380073800737, "eval_f1_neutral": 0.7631821439541312, "eval_f1_positive": 0.6106925008970219, "eval_loss": 0.6353930830955505, "eval_precision_negative": 0.7087566521528785, "eval_precision_neutral": 0.7488446855535463, "eval_precision_positive": 0.6074232690935046, "eval_recall_negative": 0.6456588805641251, "eval_recall_neutral": 0.7780793319415449, "eval_recall_positive": 0.613997113997114, "eval_runtime": 13.4559, "eval_samples_per_second": 627.605, "eval_steps_per_second": 3.27, "step": 1480 }, { "epoch": 1.28, "learning_rate": 1.7441077441077444e-05, "loss": 0.6104, "step": 1520 }, { "epoch": 1.28, "eval_accuracy": 0.7127294256956779, "eval_f1_macro": 0.6839464489013288, "eval_f1_negative": 0.6825213576541214, "eval_f1_neutral": 0.7576642335766423, "eval_f1_positive": 0.6116537554732233, "eval_loss": 0.6454949975013733, "eval_precision_negative": 0.7167798254122212, "eval_precision_neutral": 0.756875, "eval_precision_positive": 0.5735944409349337, "eval_recall_negative": 0.6513882767739092, "eval_recall_neutral": 0.758455114822547, "eval_recall_positive": 0.6551226551226551, "eval_runtime": 13.4867, "eval_samples_per_second": 626.174, "eval_steps_per_second": 3.262, "step": 1520 }, { "epoch": 1.31, "learning_rate": 1.7373737373737375e-05, "loss": 0.6101, "step": 1560 }, { "epoch": 1.31, "eval_accuracy": 0.7206631142687981, "eval_f1_macro": 0.6779869326137852, "eval_f1_negative": 0.6807543740059078, "eval_f1_neutral": 0.772482552342971, "eval_f1_positive": 0.5807238714924766, "eval_loss": 0.6268090605735779, "eval_precision_negative": 0.702626641651032, "eval_precision_neutral": 0.7393129770992366, "eval_precision_positive": 0.6654240447343895, "eval_recall_negative": 0.6602027324812693, "eval_recall_neutral": 0.808768267223382, "eval_recall_positive": 0.5151515151515151, "eval_runtime": 13.4458, "eval_samples_per_second": 628.077, "eval_steps_per_second": 3.272, "step": 1560 }, { "epoch": 1.35, "learning_rate": 1.7306397306397305e-05, "loss": 0.6022, "step": 1600 }, { "epoch": 1.35, "eval_accuracy": 0.7143872113676731, "eval_f1_macro": 0.6836129674253361, "eval_f1_negative": 0.6836007130124777, "eval_f1_neutral": 0.7594515995014541, "eval_f1_positive": 0.6077865897620764, "eval_loss": 0.6394125819206238, "eval_precision_negative": 0.6913023884632717, "eval_precision_neutral": 0.7556841670111616, "eval_precision_positive": 0.6073487031700289, "eval_recall_negative": 0.6760687527545174, "eval_recall_neutral": 0.7632567849686848, "eval_recall_positive": 0.6082251082251082, "eval_runtime": 13.4382, "eval_samples_per_second": 628.432, "eval_steps_per_second": 3.274, "step": 1600 }, { "epoch": 1.38, "learning_rate": 1.723905723905724e-05, "loss": 0.6236, "step": 1640 }, { "epoch": 1.38, "eval_accuracy": 0.7134399052693902, "eval_f1_macro": 0.6861857480530462, "eval_f1_negative": 0.683572710951526, "eval_f1_neutral": 0.7565409267626353, "eval_f1_positive": 0.6184436064449776, "eval_loss": 0.6394263505935669, "eval_precision_negative": 0.6963877457704618, "eval_precision_neutral": 0.7615823989845568, "eval_precision_positive": 0.589157413455258, "eval_recall_negative": 0.6712208021154694, "eval_recall_neutral": 0.7515657620041754, "eval_recall_positive": 0.6507936507936508, "eval_runtime": 13.4189, "eval_samples_per_second": 629.337, "eval_steps_per_second": 3.279, "step": 1640 }, { "epoch": 1.41, "learning_rate": 1.7171717171717173e-05, "loss": 0.6039, "step": 1680 }, { "epoch": 1.41, "eval_accuracy": 0.7182948490230906, "eval_f1_macro": 0.6829107741796993, "eval_f1_negative": 0.6881057268722467, "eval_f1_neutral": 0.7655158240854912, "eval_f1_positive": 0.5951107715813598, "eval_loss": 0.6307365298271179, "eval_precision_negative": 0.6878027300748569, "eval_precision_neutral": 0.7537434237150951, "eval_precision_positive": 0.6323051948051948, "eval_recall_negative": 0.6884089907448215, "eval_recall_neutral": 0.7776617954070981, "eval_recall_positive": 0.562049062049062, "eval_runtime": 13.423, "eval_samples_per_second": 629.145, "eval_steps_per_second": 3.278, "step": 1680 }, { "epoch": 1.45, "learning_rate": 1.7104377104377104e-05, "loss": 0.6059, "step": 1720 }, { "epoch": 1.45, "eval_accuracy": 0.7173475429248076, "eval_f1_macro": 0.6865160173058559, "eval_f1_negative": 0.6937445699391833, "eval_f1_neutral": 0.7605015673981192, "eval_f1_positive": 0.6053019145802652, "eval_loss": 0.6336551904678345, "eval_precision_negative": 0.6839400428265524, "eval_precision_neutral": 0.7612970711297071, "eval_precision_positive": 0.6180451127819548, "eval_recall_negative": 0.7038342882327017, "eval_recall_neutral": 0.7597077244258873, "eval_recall_positive": 0.5930735930735931, "eval_runtime": 13.4767, "eval_samples_per_second": 626.636, "eval_steps_per_second": 3.265, "step": 1720 }, { "epoch": 1.48, "learning_rate": 1.7037037037037038e-05, "loss": 0.6042, "step": 1760 }, { "epoch": 1.48, "eval_accuracy": 0.7197158081705151, "eval_f1_macro": 0.685440373432607, "eval_f1_negative": 0.694493006993007, "eval_f1_neutral": 0.7645846217274789, "eval_f1_positive": 0.5972434915773354, "eval_loss": 0.63006192445755, "eval_precision_negative": 0.6887732986562636, "eval_precision_neutral": 0.7550895765472313, "eval_precision_positive": 0.636215334420881, "eval_recall_negative": 0.7003085059497576, "eval_recall_neutral": 0.774321503131524, "eval_recall_positive": 0.5627705627705628, "eval_runtime": 13.4204, "eval_samples_per_second": 629.266, "eval_steps_per_second": 3.279, "step": 1760 }, { "epoch": 1.52, "learning_rate": 1.6969696969696972e-05, "loss": 0.5907, "step": 1800 }, { "epoch": 1.52, "eval_accuracy": 0.7238602723505032, "eval_f1_macro": 0.6788816276493144, "eval_f1_negative": 0.6713483146067416, "eval_f1_neutral": 0.7784207945071114, "eval_f1_positive": 0.58687577383409, "eval_loss": 0.6279187202453613, "eval_precision_negative": 0.7159261108337494, "eval_precision_neutral": 0.7341350601295097, "eval_precision_positive": 0.6856316297010607, "eval_recall_negative": 0.6319964742177171, "eval_recall_neutral": 0.82839248434238, "eval_recall_positive": 0.512987012987013, "eval_runtime": 13.4379, "eval_samples_per_second": 628.446, "eval_steps_per_second": 3.274, "step": 1800 }, { "epoch": 1.55, "learning_rate": 1.6902356902356903e-05, "loss": 0.6135, "step": 1840 }, { "epoch": 1.55, "eval_accuracy": 0.7229129662522202, "eval_f1_macro": 0.6795419420133372, "eval_f1_negative": 0.6882803943044906, "eval_f1_neutral": 0.7737461051361945, "eval_f1_positive": 0.5765993265993266, "eval_loss": 0.6268677711486816, "eval_precision_negative": 0.6842334494773519, "eval_precision_neutral": 0.7460748207016864, "eval_precision_positive": 0.6919191919191919, "eval_recall_negative": 0.6923754958131335, "eval_recall_neutral": 0.8035490605427975, "eval_recall_positive": 0.49422799422799424, "eval_runtime": 13.44, "eval_samples_per_second": 628.349, "eval_steps_per_second": 3.274, "step": 1840 }, { "epoch": 1.58, "learning_rate": 1.6835016835016837e-05, "loss": 0.5996, "step": 1880 }, { "epoch": 1.58, "eval_accuracy": 0.7220840734162226, "eval_f1_macro": 0.6869855176473937, "eval_f1_negative": 0.6864864864864865, "eval_f1_neutral": 0.7696068445711958, "eval_f1_positive": 0.6048632218844986, "eval_loss": 0.6290135979652405, "eval_precision_negative": 0.7019806540764625, "eval_precision_neutral": 0.7513922036595068, "eval_precision_positive": 0.6388443017656501, "eval_recall_negative": 0.6716615249008374, "eval_recall_neutral": 0.7887265135699374, "eval_recall_positive": 0.5743145743145743, "eval_runtime": 13.4252, "eval_samples_per_second": 629.039, "eval_steps_per_second": 3.277, "step": 1880 }, { "epoch": 1.62, "learning_rate": 1.6767676767676768e-05, "loss": 0.6136, "step": 1920 }, { "epoch": 1.62, "eval_accuracy": 0.7223208999407934, "eval_f1_macro": 0.6908988856510865, "eval_f1_negative": 0.7006585935840238, "eval_f1_neutral": 0.7644044755829762, "eval_f1_positive": 0.6076335877862595, "eval_loss": 0.6263943910598755, "eval_precision_negative": 0.6763740771123872, "eval_precision_neutral": 0.7657657657657657, "eval_precision_positive": 0.6450567260940032, "eval_recall_negative": 0.7267518730718379, "eval_recall_neutral": 0.7630480167014614, "eval_recall_positive": 0.5743145743145743, "eval_runtime": 13.5533, "eval_samples_per_second": 623.095, "eval_steps_per_second": 3.246, "step": 1920 }, { "epoch": 1.65, "learning_rate": 1.6700336700336702e-05, "loss": 0.6036, "step": 1960 }, { "epoch": 1.65, "eval_accuracy": 0.7141503848431024, "eval_f1_macro": 0.6879732554886911, "eval_f1_negative": 0.6988408851422551, "eval_f1_neutral": 0.7530068728522336, "eval_f1_positive": 0.6120720084715848, "eval_loss": 0.6364882588386536, "eval_precision_negative": 0.6696284329563813, "eval_precision_neutral": 0.7753206545776206, "eval_precision_positive": 0.5991706979958535, "eval_recall_negative": 0.7307183781401498, "eval_recall_neutral": 0.7319415448851775, "eval_recall_positive": 0.6255411255411255, "eval_runtime": 13.4324, "eval_samples_per_second": 628.703, "eval_steps_per_second": 3.276, "step": 1960 }, { "epoch": 1.68, "learning_rate": 1.6632996632996633e-05, "loss": 0.6123, "step": 2000 }, { "epoch": 1.68, "eval_accuracy": 0.7198342214328005, "eval_f1_macro": 0.6811378179180303, "eval_f1_negative": 0.694331550802139, "eval_f1_neutral": 0.7660226924256361, "eval_f1_positive": 0.5830592105263157, "eval_loss": 0.6256130933761597, "eval_precision_negative": 0.6745635910224439, "eval_precision_neutral": 0.7504506308832365, "eval_precision_positive": 0.6778202676864244, "eval_recall_negative": 0.7152930806522697, "eval_recall_neutral": 0.7822546972860125, "eval_recall_positive": 0.5115440115440115, "eval_runtime": 13.4059, "eval_samples_per_second": 629.947, "eval_steps_per_second": 3.282, "step": 2000 }, { "epoch": 1.72, "learning_rate": 1.6565656565656567e-05, "loss": 0.5898, "step": 2040 }, { "epoch": 1.72, "eval_accuracy": 0.7255180580224985, "eval_f1_macro": 0.6783018381472949, "eval_f1_negative": 0.6911698789780368, "eval_f1_neutral": 0.777568611909244, "eval_f1_positive": 0.5661670235546039, "eval_loss": 0.6203241944313049, "eval_precision_negative": 0.7031463748290013, "eval_precision_neutral": 0.7399585140486518, "eval_precision_positive": 0.6965226554267651, "eval_recall_negative": 0.6795945350374615, "eval_recall_neutral": 0.8192066805845512, "eval_recall_positive": 0.4769119769119769, "eval_runtime": 13.429, "eval_samples_per_second": 628.864, "eval_steps_per_second": 3.276, "step": 2040 }, { "epoch": 1.75, "learning_rate": 1.64983164983165e-05, "loss": 0.585, "step": 2080 }, { "epoch": 1.75, "eval_accuracy": 0.7277679100059207, "eval_f1_macro": 0.6856054160655031, "eval_f1_negative": 0.6840989399293286, "eval_f1_neutral": 0.7798319327731092, "eval_f1_positive": 0.5928853754940712, "eval_loss": 0.62270188331604, "eval_precision_negative": 0.7348178137651822, "eval_precision_neutral": 0.7406572769953051, "eval_precision_positive": 0.6555944055944056, "eval_recall_negative": 0.6399294843543412, "eval_recall_neutral": 0.8233820459290188, "eval_recall_positive": 0.5411255411255411, "eval_runtime": 13.4336, "eval_samples_per_second": 628.646, "eval_steps_per_second": 3.275, "step": 2080 }, { "epoch": 1.78, "learning_rate": 1.6430976430976432e-05, "loss": 0.6092, "step": 2120 }, { "epoch": 1.78, "eval_accuracy": 0.7194789816459444, "eval_f1_macro": 0.691219851642046, "eval_f1_negative": 0.6904706700672385, "eval_f1_neutral": 0.7632427932146946, "eval_f1_positive": 0.6199460916442048, "eval_loss": 0.6305855512619019, "eval_precision_negative": 0.7284735812133072, "eval_precision_neutral": 0.7609462544096286, "eval_precision_positive": 0.5815423514538559, "eval_recall_negative": 0.6562362274129573, "eval_recall_neutral": 0.765553235908142, "eval_recall_positive": 0.6637806637806638, "eval_runtime": 13.4354, "eval_samples_per_second": 628.563, "eval_steps_per_second": 3.275, "step": 2120 }, { "epoch": 1.82, "learning_rate": 1.6363636363636366e-05, "loss": 0.5902, "step": 2160 }, { "epoch": 1.82, "eval_accuracy": 0.7217288336293665, "eval_f1_macro": 0.6903674148692266, "eval_f1_negative": 0.699802067297119, "eval_f1_neutral": 0.7650182196772514, "eval_f1_positive": 0.606281957633309, "eval_loss": 0.6268182992935181, "eval_precision_negative": 0.6984196663740123, "eval_precision_neutral": 0.7630321910695742, "eval_precision_positive": 0.613905325443787, "eval_recall_negative": 0.7011899515204936, "eval_recall_neutral": 0.7670146137787056, "eval_recall_positive": 0.5988455988455988, "eval_runtime": 13.453, "eval_samples_per_second": 627.739, "eval_steps_per_second": 3.271, "step": 2160 }, { "epoch": 1.85, "learning_rate": 1.6296296296296297e-05, "loss": 0.6077, "step": 2200 }, { "epoch": 1.85, "eval_accuracy": 0.7239786856127887, "eval_f1_macro": 0.6863881436307776, "eval_f1_negative": 0.6860517946388005, "eval_f1_neutral": 0.7731126362535325, "eval_f1_positive": 0.5999999999999999, "eval_loss": 0.6207541227340698, "eval_precision_negative": 0.7079231129864041, "eval_precision_neutral": 0.7483391949980461, "eval_precision_positive": 0.6482412060301508, "eval_recall_negative": 0.6654914059056853, "eval_recall_neutral": 0.7995824634655533, "eval_recall_positive": 0.5584415584415584, "eval_runtime": 13.4434, "eval_samples_per_second": 628.189, "eval_steps_per_second": 3.273, "step": 2200 }, { "epoch": 1.89, "learning_rate": 1.622895622895623e-05, "loss": 0.5971, "step": 2240 }, { "epoch": 1.89, "eval_accuracy": 0.7297809354647721, "eval_f1_macro": 0.6928803015060957, "eval_f1_negative": 0.6937485894831867, "eval_f1_neutral": 0.7777216213484281, "eval_f1_positive": 0.6071706936866719, "eval_loss": 0.6181867122650146, "eval_precision_negative": 0.7109158186864015, "eval_precision_neutral": 0.7538702723887909, "eval_precision_positive": 0.6601694915254237, "eval_recall_negative": 0.6773909211106214, "eval_recall_neutral": 0.8031315240083508, "eval_recall_positive": 0.562049062049062, "eval_runtime": 13.5165, "eval_samples_per_second": 624.792, "eval_steps_per_second": 3.255, "step": 2240 }, { "epoch": 1.92, "learning_rate": 1.616161616161616e-05, "loss": 0.6053, "step": 2280 }, { "epoch": 1.92, "eval_accuracy": 0.7235050325636472, "eval_f1_macro": 0.6869805131510361, "eval_f1_negative": 0.6891179839633448, "eval_f1_neutral": 0.7715961966417155, "eval_f1_positive": 0.6002273588480483, "eval_loss": 0.6221389174461365, "eval_precision_negative": 0.7175572519083969, "eval_precision_neutral": 0.7484301412872841, "eval_precision_positive": 0.6320830007980845, "eval_recall_negative": 0.6628470691934774, "eval_recall_neutral": 0.7962421711899791, "eval_recall_positive": 0.5714285714285714, "eval_runtime": 13.4474, "eval_samples_per_second": 628.005, "eval_steps_per_second": 3.272, "step": 2280 }, { "epoch": 1.95, "learning_rate": 1.6094276094276096e-05, "loss": 0.5959, "step": 2320 }, { "epoch": 1.95, "eval_accuracy": 0.7199526346950859, "eval_f1_macro": 0.682651116707718, "eval_f1_negative": 0.6665057915057916, "eval_f1_neutral": 0.7722100219604712, "eval_f1_positive": 0.6092375366568915, "eval_loss": 0.6313912272453308, "eval_precision_negative": 0.7365333333333334, "eval_precision_neutral": 0.7398622800306044, "eval_precision_positive": 0.6192250372578242, "eval_recall_negative": 0.6086381665932129, "eval_recall_neutral": 0.8075156576200417, "eval_recall_positive": 0.5995670995670995, "eval_runtime": 13.532, "eval_samples_per_second": 624.078, "eval_steps_per_second": 3.252, "step": 2320 }, { "epoch": 1.99, "learning_rate": 1.602693602693603e-05, "loss": 0.6196, "step": 2360 }, { "epoch": 1.99, "eval_accuracy": 0.709295441089402, "eval_f1_macro": 0.6881296895840747, "eval_f1_negative": 0.700795870079587, "eval_f1_neutral": 0.7440385036097135, "eval_f1_positive": 0.6195546950629235, "eval_loss": 0.6360026001930237, "eval_precision_negative": 0.684453781512605, "eval_precision_neutral": 0.7814797794117647, "eval_precision_positive": 0.5604203152364273, "eval_recall_negative": 0.7179374173644777, "eval_recall_neutral": 0.7100208768267223, "eval_recall_positive": 0.6926406926406926, "eval_runtime": 13.7523, "eval_samples_per_second": 614.079, "eval_steps_per_second": 3.199, "step": 2360 }, { "epoch": 2.02, "learning_rate": 1.595959595959596e-05, "loss": 0.5686, "step": 2400 }, { "epoch": 2.02, "eval_accuracy": 0.7191237418590882, "eval_f1_macro": 0.6870370031512542, "eval_f1_negative": 0.6933101650738488, "eval_f1_neutral": 0.7630622208372286, "eval_f1_positive": 0.6047386235426853, "eval_loss": 0.6405708193778992, "eval_precision_negative": 0.6835117773019272, "eval_precision_neutral": 0.7593549720901385, "eval_precision_positive": 0.631578947368421, "eval_recall_negative": 0.7033935654473337, "eval_recall_neutral": 0.7668058455114822, "eval_recall_positive": 0.5800865800865801, "eval_runtime": 13.5092, "eval_samples_per_second": 625.128, "eval_steps_per_second": 3.257, "step": 2400 }, { "epoch": 2.05, "learning_rate": 1.5892255892255895e-05, "loss": 0.5586, "step": 2440 }, { "epoch": 2.05, "eval_accuracy": 0.7223208999407934, "eval_f1_macro": 0.6862310990226811, "eval_f1_negative": 0.6942959001782532, "eval_f1_neutral": 0.7689950980392158, "eval_f1_positive": 0.5954022988505746, "eval_loss": 0.6309220790863037, "eval_precision_negative": 0.7021180712032447, "eval_precision_neutral": 0.7526989204318273, "eval_precision_positive": 0.6348039215686274, "eval_recall_negative": 0.6866460996033495, "eval_recall_neutral": 0.7860125260960334, "eval_recall_positive": 0.5606060606060606, "eval_runtime": 13.5411, "eval_samples_per_second": 623.656, "eval_steps_per_second": 3.249, "step": 2440 }, { "epoch": 2.09, "learning_rate": 1.5824915824915825e-05, "loss": 0.5671, "step": 2480 }, { "epoch": 2.09, "eval_accuracy": 0.7205447010065127, "eval_f1_macro": 0.683056392123643, "eval_f1_negative": 0.6914449087310313, "eval_f1_neutral": 0.7678189048638727, "eval_f1_positive": 0.5899053627760252, "eval_loss": 0.6297855377197266, "eval_precision_negative": 0.6900790166812993, "eval_precision_neutral": 0.7504484751843731, "eval_precision_positive": 0.6504347826086957, "eval_recall_negative": 0.6928162185985015, "eval_recall_neutral": 0.7860125260960334, "eval_recall_positive": 0.5396825396825397, "eval_runtime": 13.5165, "eval_samples_per_second": 624.793, "eval_steps_per_second": 3.255, "step": 2480 }, { "epoch": 2.12, "learning_rate": 1.575757575757576e-05, "loss": 0.5458, "step": 2520 }, { "epoch": 2.12, "eval_accuracy": 0.7214920071047958, "eval_f1_macro": 0.6872366815721698, "eval_f1_negative": 0.6905083220872694, "eval_f1_neutral": 0.7679083094555873, "eval_f1_positive": 0.6032934131736527, "eval_loss": 0.63502436876297, "eval_precision_negative": 0.7050987597611392, "eval_precision_neutral": 0.7531112003211562, "eval_precision_positive": 0.6267496111975117, "eval_recall_negative": 0.6765094755398854, "eval_recall_neutral": 0.7832985386221294, "eval_recall_positive": 0.5815295815295816, "eval_runtime": 13.5006, "eval_samples_per_second": 625.526, "eval_steps_per_second": 3.259, "step": 2520 }, { "epoch": 2.15, "learning_rate": 1.569023569023569e-05, "loss": 0.5617, "step": 2560 }, { "epoch": 2.15, "eval_accuracy": 0.7103611604499704, "eval_f1_macro": 0.6868863746975769, "eval_f1_negative": 0.7016379846568526, "eval_f1_neutral": 0.7452902101709682, "eval_f1_positive": 0.6137309292649098, "eval_loss": 0.6412296891212463, "eval_precision_negative": 0.6624902114330462, "eval_precision_neutral": 0.7789665376735716, "eval_precision_positive": 0.5907877169559412, "eval_recall_negative": 0.745702952842662, "eval_recall_neutral": 0.7144050104384133, "eval_recall_positive": 0.6385281385281385, "eval_runtime": 13.561, "eval_samples_per_second": 622.74, "eval_steps_per_second": 3.245, "step": 2560 }, { "epoch": 2.19, "learning_rate": 1.5622895622895624e-05, "loss": 0.5582, "step": 2600 }, { "epoch": 2.19, "eval_accuracy": 0.7085849615156897, "eval_f1_macro": 0.687474213023077, "eval_f1_negative": 0.699581589958159, "eval_f1_neutral": 0.7421052631578948, "eval_f1_positive": 0.6207357859531774, "eval_loss": 0.6525644659996033, "eval_precision_negative": 0.6658701712465154, "eval_precision_neutral": 0.7815242494226328, "eval_precision_positive": 0.5785536159600998, "eval_recall_negative": 0.7368884971353019, "eval_recall_neutral": 0.7064718162839249, "eval_recall_positive": 0.6695526695526696, "eval_runtime": 13.5361, "eval_samples_per_second": 623.888, "eval_steps_per_second": 3.251, "step": 2600 }, { "epoch": 2.22, "learning_rate": 1.555555555555556e-05, "loss": 0.5543, "step": 2640 }, { "epoch": 2.22, "eval_accuracy": 0.7201894612196567, "eval_f1_macro": 0.6869432555451471, "eval_f1_negative": 0.7009306260575296, "eval_f1_neutral": 0.762918885061071, "eval_f1_positive": 0.5969802555168409, "eval_loss": 0.640322744846344, "eval_precision_negative": 0.6738511590077267, "eval_precision_neutral": 0.7629985383169764, "eval_precision_positive": 0.6441102756892231, "eval_recall_negative": 0.7302776553547818, "eval_recall_neutral": 0.762839248434238, "eval_recall_positive": 0.5562770562770563, "eval_runtime": 13.5133, "eval_samples_per_second": 624.941, "eval_steps_per_second": 3.256, "step": 2640 }, { "epoch": 2.26, "learning_rate": 1.548821548821549e-05, "loss": 0.558, "step": 2680 }, { "epoch": 2.26, "eval_accuracy": 0.7206631142687981, "eval_f1_macro": 0.6874230644596926, "eval_f1_negative": 0.697239536954586, "eval_f1_neutral": 0.7653250773993808, "eval_f1_positive": 0.5997045790251108, "eval_loss": 0.6337417364120483, "eval_precision_negative": 0.7044534412955465, "eval_precision_neutral": 0.756734693877551, "eval_precision_positive": 0.6142208774583964, "eval_recall_negative": 0.6901718818862935, "eval_recall_neutral": 0.7741127348643007, "eval_recall_positive": 0.5858585858585859, "eval_runtime": 13.5113, "eval_samples_per_second": 625.032, "eval_steps_per_second": 3.257, "step": 2680 }, { "epoch": 2.29, "learning_rate": 1.5420875420875423e-05, "loss": 0.5506, "step": 2720 }, { "epoch": 2.29, "eval_accuracy": 0.7171107164002368, "eval_f1_macro": 0.6895025450757618, "eval_f1_negative": 0.7093775262732418, "eval_f1_neutral": 0.753454231433506, "eval_f1_positive": 0.6056758775205378, "eval_loss": 0.6484044194221497, "eval_precision_negative": 0.6550951847704367, "eval_precision_neutral": 0.7800625838176128, "eval_precision_positive": 0.6277089783281734, "eval_recall_negative": 0.7734684883208461, "eval_recall_neutral": 0.7286012526096033, "eval_recall_positive": 0.5851370851370852, "eval_runtime": 13.5135, "eval_samples_per_second": 624.931, "eval_steps_per_second": 3.256, "step": 2720 }, { "epoch": 2.32, "learning_rate": 1.5353535353535354e-05, "loss": 0.5569, "step": 2760 }, { "epoch": 2.32, "eval_accuracy": 0.7167554766133807, "eval_f1_macro": 0.6895340612929335, "eval_f1_negative": 0.7063525452250736, "eval_f1_neutral": 0.7544910179640718, "eval_f1_positive": 0.6077586206896551, "eval_loss": 0.6315791606903076, "eval_precision_negative": 0.6756539235412475, "eval_precision_neutral": 0.7733450241122315, "eval_precision_positive": 0.6051502145922747, "eval_recall_negative": 0.7399735566328779, "eval_recall_neutral": 0.7365344467640919, "eval_recall_positive": 0.6103896103896104, "eval_runtime": 13.5058, "eval_samples_per_second": 625.287, "eval_steps_per_second": 3.258, "step": 2760 }, { "epoch": 2.36, "learning_rate": 1.5286195286195288e-05, "loss": 0.5469, "step": 2800 }, { "epoch": 2.36, "eval_accuracy": 0.7182948490230906, "eval_f1_macro": 0.69129222470535, "eval_f1_negative": 0.7031543764361813, "eval_f1_neutral": 0.7562953478446436, "eval_f1_positive": 0.6144269498352252, "eval_loss": 0.6461361646652222, "eval_precision_negative": 0.6683876092136616, "eval_precision_neutral": 0.7734613705805325, "eval_precision_positive": 0.6237918215613383, "eval_recall_negative": 0.7417364477743499, "eval_recall_neutral": 0.7398747390396659, "eval_recall_positive": 0.6053391053391053, "eval_runtime": 13.5002, "eval_samples_per_second": 625.546, "eval_steps_per_second": 3.259, "step": 2800 }, { "epoch": 2.39, "learning_rate": 1.521885521885522e-05, "loss": 0.5497, "step": 2840 }, { "epoch": 2.39, "eval_accuracy": 0.7205447010065127, "eval_f1_macro": 0.6901740903513232, "eval_f1_negative": 0.6989695242271432, "eval_f1_neutral": 0.7628887497390942, "eval_f1_positive": 0.608663997087732, "eval_loss": 0.6306228041648865, "eval_precision_negative": 0.6954624781849913, "eval_precision_neutral": 0.7627295492487479, "eval_precision_positive": 0.6142542248346804, "eval_recall_negative": 0.7025121198765977, "eval_recall_neutral": 0.7630480167014614, "eval_recall_positive": 0.6031746031746031, "eval_runtime": 13.5161, "eval_samples_per_second": 624.81, "eval_steps_per_second": 3.255, "step": 2840 }, { "epoch": 2.42, "learning_rate": 1.5151515151515153e-05, "loss": 0.5577, "step": 2880 }, { "epoch": 2.42, "eval_accuracy": 0.7149792776791001, "eval_f1_macro": 0.686526091020862, "eval_f1_negative": 0.6968478950708694, "eval_f1_neutral": 0.7555225148683093, "eval_f1_positive": 0.6072078631234074, "eval_loss": 0.6409549713134766, "eval_precision_negative": 0.6700569568755086, "eval_precision_neutral": 0.7689148292261133, "eval_precision_positive": 0.6127847171197649, "eval_recall_negative": 0.7258704275011018, "eval_recall_neutral": 0.7425887265135699, "eval_recall_positive": 0.6017316017316018, "eval_runtime": 13.6855, "eval_samples_per_second": 617.076, "eval_steps_per_second": 3.215, "step": 2880 }, { "epoch": 2.46, "learning_rate": 1.5084175084175085e-05, "loss": 0.557, "step": 2920 }, { "epoch": 2.46, "eval_accuracy": 0.7225577264653641, "eval_f1_macro": 0.6876490677339296, "eval_f1_negative": 0.7071207430340557, "eval_f1_neutral": 0.7645151166440004, "eval_f1_positive": 0.5913113435237329, "eval_loss": 0.6443095803260803, "eval_precision_negative": 0.6649844720496895, "eval_precision_neutral": 0.7661983644369889, "eval_precision_positive": 0.6681818181818182, "eval_recall_negative": 0.75495813133539, "eval_recall_neutral": 0.762839248434238, "eval_recall_positive": 0.5303030303030303, "eval_runtime": 13.5647, "eval_samples_per_second": 622.57, "eval_steps_per_second": 3.244, "step": 2920 }, { "epoch": 2.49, "learning_rate": 1.5016835016835018e-05, "loss": 0.5542, "step": 2960 }, { "epoch": 2.49, "eval_accuracy": 0.7161634103019539, "eval_f1_macro": 0.687092758801656, "eval_f1_negative": 0.7009579341940858, "eval_f1_neutral": 0.7560144773259526, "eval_f1_positive": 0.6043058648849294, "eval_loss": 0.6480274796485901, "eval_precision_negative": 0.6644295302013423, "eval_precision_neutral": 0.7712858384013901, "eval_precision_positive": 0.6223241590214067, "eval_recall_negative": 0.7417364477743499, "eval_recall_neutral": 0.7413361169102296, "eval_recall_positive": 0.5873015873015873, "eval_runtime": 13.5134, "eval_samples_per_second": 624.935, "eval_steps_per_second": 3.256, "step": 2960 }, { "epoch": 2.53, "learning_rate": 1.4949494949494952e-05, "loss": 0.567, "step": 3000 }, { "epoch": 2.53, "eval_accuracy": 0.7079928952042629, "eval_f1_macro": 0.6865435263558487, "eval_f1_negative": 0.7025898078529658, "eval_f1_neutral": 0.7416051965209732, "eval_f1_positive": 0.6154355746936071, "eval_loss": 0.6429863572120667, "eval_precision_negative": 0.6677252878126241, "eval_precision_neutral": 0.7845329606335896, "eval_precision_positive": 0.5688916105327618, "eval_recall_negative": 0.7412957249889819, "eval_recall_neutral": 0.7031315240083508, "eval_recall_positive": 0.6702741702741702, "eval_runtime": 13.5159, "eval_samples_per_second": 624.818, "eval_steps_per_second": 3.255, "step": 3000 }, { "epoch": 2.56, "learning_rate": 1.4882154882154884e-05, "loss": 0.5606, "step": 3040 }, { "epoch": 2.56, "eval_accuracy": 0.7155713439905269, "eval_f1_macro": 0.6890929890491521, "eval_f1_negative": 0.7017241379310344, "eval_f1_neutral": 0.7549994652978291, "eval_f1_positive": 0.6105553639185926, "eval_loss": 0.6457778811454773, "eval_precision_negative": 0.6866301138760017, "eval_precision_neutral": 0.7739530804648104, "eval_precision_positive": 0.5849306014540647, "eval_recall_negative": 0.7174966945791097, "eval_recall_neutral": 0.7369519832985386, "eval_recall_positive": 0.6385281385281385, "eval_runtime": 13.5186, "eval_samples_per_second": 624.694, "eval_steps_per_second": 3.255, "step": 3040 }, { "epoch": 2.59, "learning_rate": 1.4814814814814815e-05, "loss": 0.5492, "step": 3080 }, { "epoch": 2.59, "eval_accuracy": 0.713676731793961, "eval_f1_macro": 0.687090376547261, "eval_f1_negative": 0.6999178981937603, "eval_f1_neutral": 0.7514812021975654, "eval_f1_positive": 0.6098720292504571, "eval_loss": 0.646338164806366, "eval_precision_negative": 0.6550134460238187, "eval_precision_neutral": 0.7763187180057868, "eval_precision_positive": 0.6182357301704967, "eval_recall_negative": 0.751432349052446, "eval_recall_neutral": 0.7281837160751565, "eval_recall_positive": 0.6017316017316018, "eval_runtime": 13.5425, "eval_samples_per_second": 623.591, "eval_steps_per_second": 3.249, "step": 3080 }, { "epoch": 2.63, "learning_rate": 1.4747474747474747e-05, "loss": 0.5509, "step": 3120 }, { "epoch": 2.63, "eval_accuracy": 0.7187685020722321, "eval_f1_macro": 0.6907132499480086, "eval_f1_negative": 0.7029375258585022, "eval_f1_neutral": 0.7576566001493972, "eval_f1_positive": 0.6115456238361267, "eval_loss": 0.6359885334968567, "eval_precision_negative": 0.6623781676413255, "eval_precision_neutral": 0.7749399694389871, "eval_precision_positive": 0.6320246343341032, "eval_recall_negative": 0.748788012340238, "eval_recall_neutral": 0.7411273486430062, "eval_recall_positive": 0.5923520923520924, "eval_runtime": 13.4528, "eval_samples_per_second": 627.753, "eval_steps_per_second": 3.271, "step": 3120 }, { "epoch": 2.66, "learning_rate": 1.4680134680134681e-05, "loss": 0.5626, "step": 3160 }, { "epoch": 2.66, "eval_accuracy": 0.7175843694493783, "eval_f1_macro": 0.6878133884212742, "eval_f1_negative": 0.7006661115736886, "eval_f1_neutral": 0.7580354301474488, "eval_f1_positive": 0.6047386235426853, "eval_loss": 0.6416473984718323, "eval_precision_negative": 0.663905325443787, "eval_precision_neutral": 0.770541298253181, "eval_precision_positive": 0.631578947368421, "eval_recall_negative": 0.7417364477743499, "eval_recall_neutral": 0.7459290187891441, "eval_recall_positive": 0.5800865800865801, "eval_runtime": 13.5444, "eval_samples_per_second": 623.505, "eval_steps_per_second": 3.249, "step": 3160 }, { "epoch": 2.69, "learning_rate": 1.4612794612794614e-05, "loss": 0.5589, "step": 3200 }, { "epoch": 2.69, "eval_accuracy": 0.7187685020722321, "eval_f1_macro": 0.6920386854465886, "eval_f1_negative": 0.706980691703798, "eval_f1_neutral": 0.7570633561643835, "eval_f1_positive": 0.6120720084715848, "eval_loss": 0.6367910504341125, "eval_precision_negative": 0.6816693944353519, "eval_precision_neutral": 0.7766798418972332, "eval_precision_positive": 0.5991706979958535, "eval_recall_negative": 0.7342441604230939, "eval_recall_neutral": 0.7384133611691023, "eval_recall_positive": 0.6255411255411255, "eval_runtime": 13.5341, "eval_samples_per_second": 623.979, "eval_steps_per_second": 3.251, "step": 3200 }, { "epoch": 2.73, "learning_rate": 1.4545454545454546e-05, "loss": 0.5499, "step": 3240 }, { "epoch": 2.73, "eval_accuracy": 0.7135583185316755, "eval_f1_macro": 0.6872354106917024, "eval_f1_negative": 0.7027480595762535, "eval_f1_neutral": 0.7509126046811251, "eval_f1_positive": 0.6080455678177287, "eval_loss": 0.6405165791511536, "eval_precision_negative": 0.6705364291433147, "eval_precision_neutral": 0.7729885057471264, "eval_precision_positive": 0.6001405481377372, "eval_recall_negative": 0.7382106654914059, "eval_recall_neutral": 0.7300626304801671, "eval_recall_positive": 0.6161616161616161, "eval_runtime": 13.5535, "eval_samples_per_second": 623.087, "eval_steps_per_second": 3.246, "step": 3240 }, { "epoch": 2.76, "learning_rate": 1.447811447811448e-05, "loss": 0.5431, "step": 3280 }, { "epoch": 2.76, "eval_accuracy": 0.7207815275310835, "eval_f1_macro": 0.6892335124121108, "eval_f1_negative": 0.7012817727568977, "eval_f1_neutral": 0.7629961454318157, "eval_f1_positive": 0.6034226190476191, "eval_loss": 0.6356926560401917, "eval_precision_negative": 0.6915167095115681, "eval_precision_neutral": 0.7614888750259929, "eval_precision_positive": 0.6228878648233487, "eval_recall_negative": 0.7113265755839577, "eval_recall_neutral": 0.764509394572025, "eval_recall_positive": 0.5851370851370852, "eval_runtime": 13.6103, "eval_samples_per_second": 620.484, "eval_steps_per_second": 3.233, "step": 3280 }, { "epoch": 2.79, "learning_rate": 1.4410774410774413e-05, "loss": 0.5388, "step": 3320 }, { "epoch": 2.79, "eval_accuracy": 0.7103611604499704, "eval_f1_macro": 0.6887331835620346, "eval_f1_negative": 0.7057600332709503, "eval_f1_neutral": 0.7435107787065551, "eval_f1_positive": 0.6169287387085982, "eval_loss": 0.6553226113319397, "eval_precision_negative": 0.6681102362204724, "eval_precision_neutral": 0.7856810785681079, "eval_precision_positive": 0.5751715533374921, "eval_recall_negative": 0.747906566769502, "eval_recall_neutral": 0.7056367432150313, "eval_recall_positive": 0.6652236652236653, "eval_runtime": 13.4151, "eval_samples_per_second": 629.514, "eval_steps_per_second": 3.28, "step": 3320 }, { "epoch": 2.83, "learning_rate": 1.4343434343434344e-05, "loss": 0.5613, "step": 3360 }, { "epoch": 2.83, "eval_accuracy": 0.7232682060390764, "eval_f1_macro": 0.6875059651526924, "eval_f1_negative": 0.7051926298157454, "eval_f1_neutral": 0.7659927423535511, "eval_f1_positive": 0.5913325232887808, "eval_loss": 0.6239017844200134, "eval_precision_negative": 0.6717191862784204, "eval_precision_neutral": 0.76086508753862, "eval_precision_positive": 0.6740535549399815, "eval_recall_negative": 0.742177170559718, "eval_recall_neutral": 0.7711899791231733, "eval_recall_positive": 0.5266955266955267, "eval_runtime": 13.4098, "eval_samples_per_second": 629.763, "eval_steps_per_second": 3.281, "step": 3360 }, { "epoch": 2.86, "learning_rate": 1.4276094276094276e-05, "loss": 0.556, "step": 3400 }, { "epoch": 2.86, "eval_accuracy": 0.7217288336293665, "eval_f1_macro": 0.6902285547620584, "eval_f1_negative": 0.7011167068097219, "eval_f1_neutral": 0.7648837451777708, "eval_f1_positive": 0.6046852122986822, "eval_loss": 0.6339342594146729, "eval_precision_negative": 0.696692776327241, "eval_precision_neutral": 0.7640074984378254, "eval_precision_positive": 0.6136701337295691, "eval_recall_negative": 0.7055971793741737, "eval_recall_neutral": 0.7657620041753653, "eval_recall_positive": 0.5959595959595959, "eval_runtime": 13.436, "eval_samples_per_second": 628.537, "eval_steps_per_second": 3.275, "step": 3400 }, { "epoch": 2.9, "learning_rate": 1.420875420875421e-05, "loss": 0.5536, "step": 3440 }, { "epoch": 2.9, "eval_accuracy": 0.7108348134991119, "eval_f1_macro": 0.6898151957724491, "eval_f1_negative": 0.7129761662253005, "eval_f1_neutral": 0.7415480427046264, "eval_f1_positive": 0.6149213783874204, "eval_loss": 0.659329891204834, "eval_precision_negative": 0.6628787878787878, "eval_precision_neutral": 0.7934316991908615, "eval_precision_positive": 0.5733000623830318, "eval_recall_negative": 0.7712648743940062, "eval_recall_neutral": 0.6960334029227557, "eval_recall_positive": 0.663059163059163, "eval_runtime": 13.4431, "eval_samples_per_second": 628.201, "eval_steps_per_second": 3.273, "step": 3440 }, { "epoch": 2.93, "learning_rate": 1.4141414141414143e-05, "loss": 0.5663, "step": 3480 }, { "epoch": 2.93, "eval_accuracy": 0.7154529307282416, "eval_f1_macro": 0.6878232234805552, "eval_f1_negative": 0.6974677920924034, "eval_f1_neutral": 0.7573062261753494, "eval_f1_positive": 0.6086956521739131, "eval_loss": 0.6353215575218201, "eval_precision_negative": 0.703090013434841, "eval_precision_neutral": 0.7683712935109583, "eval_precision_positive": 0.5750962772785623, "eval_recall_negative": 0.6919347730277655, "eval_recall_neutral": 0.7465553235908142, "eval_recall_positive": 0.6464646464646465, "eval_runtime": 13.4095, "eval_samples_per_second": 629.78, "eval_steps_per_second": 3.281, "step": 3480 }, { "epoch": 2.96, "learning_rate": 1.4074074074074075e-05, "loss": 0.5499, "step": 3520 }, { "epoch": 2.96, "eval_accuracy": 0.7143872113676731, "eval_f1_macro": 0.6899472024314622, "eval_f1_negative": 0.7078491335372069, "eval_f1_neutral": 0.7488017429193901, "eval_f1_positive": 0.6131907308377897, "eval_loss": 0.6429401636123657, "eval_precision_negative": 0.6585735963581184, "eval_precision_neutral": 0.7829157175398633, "eval_precision_positive": 0.6060606060606061, "eval_recall_negative": 0.7650947553988541, "eval_recall_neutral": 0.7175365344467641, "eval_recall_positive": 0.6204906204906205, "eval_runtime": 13.4298, "eval_samples_per_second": 628.824, "eval_steps_per_second": 3.276, "step": 3520 }, { "epoch": 3.0, "learning_rate": 1.4006734006734009e-05, "loss": 0.5619, "step": 3560 }, { "epoch": 3.0, "eval_accuracy": 0.7207815275310835, "eval_f1_macro": 0.6934678744913757, "eval_f1_negative": 0.7042136003337507, "eval_f1_neutral": 0.759215853398679, "eval_f1_positive": 0.6169741697416974, "eval_loss": 0.6337869167327881, "eval_precision_negative": 0.6685148514851486, "eval_precision_neutral": 0.7752393385552655, "eval_precision_positive": 0.6314199395770392, "eval_recall_negative": 0.74394006170119, "eval_recall_neutral": 0.7438413361169103, "eval_recall_positive": 0.6031746031746031, "eval_runtime": 13.4185, "eval_samples_per_second": 629.354, "eval_steps_per_second": 3.279, "step": 3560 } ], "max_steps": 11880, "num_train_epochs": 10, "total_flos": 1.849503866686182e+16, "trial_name": null, "trial_params": null }