|
{ |
|
"best_metric": 0.6934678744913757, |
|
"best_model_checkpoint": "sloberta_sentinews_sentence_2e-05_10e_lr2e-05/checkpoint-3560", |
|
"epoch": 2.9966329966329965, |
|
"global_step": 3560, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.03, |
|
"learning_rate": 1.9932659932659936e-05, |
|
"loss": 0.9684, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 0.03, |
|
"eval_accuracy": 0.5901716992303138, |
|
"eval_f1_macro": 0.3290637211523573, |
|
"eval_f1_negative": 0.25811001410437234, |
|
"eval_f1_neutral": 0.7290811493526997, |
|
"eval_f1_positive": 0.0, |
|
"eval_loss": 0.9020117521286011, |
|
"eval_precision_negative": 0.6455026455026455, |
|
"eval_precision_neutral": 0.5861893881695862, |
|
"eval_precision_positive": 0.0, |
|
"eval_recall_negative": 0.16130453944468928, |
|
"eval_recall_neutral": 0.9640918580375782, |
|
"eval_recall_positive": 0.0, |
|
"eval_runtime": 13.6446, |
|
"eval_samples_per_second": 618.928, |
|
"eval_steps_per_second": 3.225, |
|
"step": 40 |
|
}, |
|
{ |
|
"epoch": 0.07, |
|
"learning_rate": 1.9865319865319866e-05, |
|
"loss": 0.8398, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 0.07, |
|
"eval_accuracy": 0.6470100651272943, |
|
"eval_f1_macro": 0.5536698584230076, |
|
"eval_f1_negative": 0.5115520521880946, |
|
"eval_f1_neutral": 0.7385869565217391, |
|
"eval_f1_positive": 0.4108705665591893, |
|
"eval_loss": 0.7759891152381897, |
|
"eval_precision_negative": 0.6673758865248227, |
|
"eval_precision_neutral": 0.65232, |
|
"eval_precision_positive": 0.5681528662420382, |
|
"eval_recall_negative": 0.41472014103129134, |
|
"eval_recall_neutral": 0.8511482254697286, |
|
"eval_recall_positive": 0.3217893217893218, |
|
"eval_runtime": 13.475, |
|
"eval_samples_per_second": 626.715, |
|
"eval_steps_per_second": 3.265, |
|
"step": 80 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"learning_rate": 1.97979797979798e-05, |
|
"loss": 0.7748, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 0.1, |
|
"eval_accuracy": 0.6824156305506217, |
|
"eval_f1_macro": 0.6410968890440648, |
|
"eval_f1_negative": 0.6465890942276981, |
|
"eval_f1_neutral": 0.7394423944239442, |
|
"eval_f1_positive": 0.5372591784805524, |
|
"eval_loss": 0.7227517366409302, |
|
"eval_precision_negative": 0.6702932828760644, |
|
"eval_precision_neutral": 0.7263391059202577, |
|
"eval_precision_positive": 0.5413919413919414, |
|
"eval_recall_negative": 0.624504186866461, |
|
"eval_recall_neutral": 0.753027139874739, |
|
"eval_recall_positive": 0.5331890331890332, |
|
"eval_runtime": 13.5517, |
|
"eval_samples_per_second": 623.169, |
|
"eval_steps_per_second": 3.247, |
|
"step": 120 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"learning_rate": 1.973063973063973e-05, |
|
"loss": 0.7661, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 0.13, |
|
"eval_accuracy": 0.6966252220248668, |
|
"eval_f1_macro": 0.6402639165706846, |
|
"eval_f1_negative": 0.6606451612903226, |
|
"eval_f1_neutral": 0.755861518507433, |
|
"eval_f1_positive": 0.5042850699142984, |
|
"eval_loss": 0.6990944147109985, |
|
"eval_precision_negative": 0.6451070978580429, |
|
"eval_precision_neutral": 0.7238677622778521, |
|
"eval_precision_positive": 0.6726835138387485, |
|
"eval_recall_negative": 0.6769501983252534, |
|
"eval_recall_neutral": 0.7908141962421712, |
|
"eval_recall_positive": 0.4033189033189033, |
|
"eval_runtime": 13.529, |
|
"eval_samples_per_second": 624.216, |
|
"eval_steps_per_second": 3.252, |
|
"step": 160 |
|
}, |
|
{ |
|
"epoch": 0.17, |
|
"learning_rate": 1.9663299663299665e-05, |
|
"loss": 0.7329, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.17, |
|
"eval_accuracy": 0.6814683244523386, |
|
"eval_f1_macro": 0.6584553155124641, |
|
"eval_f1_negative": 0.6805819101834283, |
|
"eval_f1_neutral": 0.7180338757887746, |
|
"eval_f1_positive": 0.5767501605651895, |
|
"eval_loss": 0.7035245299339294, |
|
"eval_precision_negative": 0.6523848019401779, |
|
"eval_precision_neutral": 0.7643176997407495, |
|
"eval_precision_positive": 0.5196759259259259, |
|
"eval_recall_negative": 0.7113265755839577, |
|
"eval_recall_neutral": 0.677035490605428, |
|
"eval_recall_positive": 0.6479076479076479, |
|
"eval_runtime": 13.5578, |
|
"eval_samples_per_second": 622.89, |
|
"eval_steps_per_second": 3.245, |
|
"step": 200 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"learning_rate": 1.9595959595959596e-05, |
|
"loss": 0.7084, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 0.2, |
|
"eval_accuracy": 0.7044404973357016, |
|
"eval_f1_macro": 0.6484202003006585, |
|
"eval_f1_negative": 0.6737166776823088, |
|
"eval_f1_neutral": 0.7610199644198458, |
|
"eval_f1_positive": 0.5105239587998209, |
|
"eval_loss": 0.6696082353591919, |
|
"eval_precision_negative": 0.673568281938326, |
|
"eval_precision_neutral": 0.7225975975975976, |
|
"eval_precision_positive": 0.6729634002361276, |
|
"eval_recall_negative": 0.6738651388276774, |
|
"eval_recall_neutral": 0.8037578288100209, |
|
"eval_recall_positive": 0.41125541125541126, |
|
"eval_runtime": 13.468, |
|
"eval_samples_per_second": 627.04, |
|
"eval_steps_per_second": 3.267, |
|
"step": 240 |
|
}, |
|
{ |
|
"epoch": 0.24, |
|
"learning_rate": 1.952861952861953e-05, |
|
"loss": 0.6878, |
|
"step": 280 |
|
}, |
|
{ |
|
"epoch": 0.24, |
|
"eval_accuracy": 0.6889283599763173, |
|
"eval_f1_macro": 0.6646815029633141, |
|
"eval_f1_negative": 0.6859417557091976, |
|
"eval_f1_neutral": 0.7256559446701065, |
|
"eval_f1_positive": 0.5824468085106382, |
|
"eval_loss": 0.6821370720863342, |
|
"eval_precision_negative": 0.6537539936102237, |
|
"eval_precision_neutral": 0.7652234313498495, |
|
"eval_precision_positive": 0.5400739827373613, |
|
"eval_recall_negative": 0.7214631996474218, |
|
"eval_recall_neutral": 0.6899791231732777, |
|
"eval_recall_positive": 0.6320346320346321, |
|
"eval_runtime": 13.4239, |
|
"eval_samples_per_second": 629.1, |
|
"eval_steps_per_second": 3.278, |
|
"step": 280 |
|
}, |
|
{ |
|
"epoch": 0.27, |
|
"learning_rate": 1.9461279461279464e-05, |
|
"loss": 0.7059, |
|
"step": 320 |
|
}, |
|
{ |
|
"epoch": 0.27, |
|
"eval_accuracy": 0.7119005328596802, |
|
"eval_f1_macro": 0.6649492798540481, |
|
"eval_f1_negative": 0.6837046745303625, |
|
"eval_f1_neutral": 0.763837267704671, |
|
"eval_f1_positive": 0.5473058973271108, |
|
"eval_loss": 0.662620484828949, |
|
"eval_precision_negative": 0.6777825898657427, |
|
"eval_precision_neutral": 0.736108422071636, |
|
"eval_precision_positive": 0.6642636457260556, |
|
"eval_recall_negative": 0.6897311591009255, |
|
"eval_recall_neutral": 0.7937369519832985, |
|
"eval_recall_positive": 0.4653679653679654, |
|
"eval_runtime": 13.4494, |
|
"eval_samples_per_second": 627.911, |
|
"eval_steps_per_second": 3.272, |
|
"step": 320 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"learning_rate": 1.9393939393939395e-05, |
|
"loss": 0.6745, |
|
"step": 360 |
|
}, |
|
{ |
|
"epoch": 0.3, |
|
"eval_accuracy": 0.709295441089402, |
|
"eval_f1_macro": 0.6599969904410593, |
|
"eval_f1_negative": 0.6773485513608428, |
|
"eval_f1_neutral": 0.7627118644067796, |
|
"eval_f1_positive": 0.5399305555555556, |
|
"eval_loss": 0.6554310917854309, |
|
"eval_precision_negative": 0.674682990817665, |
|
"eval_precision_neutral": 0.7299618320610687, |
|
"eval_precision_positive": 0.6775599128540305, |
|
"eval_recall_negative": 0.6800352578228295, |
|
"eval_recall_neutral": 0.7985386221294363, |
|
"eval_recall_positive": 0.44877344877344877, |
|
"eval_runtime": 13.4392, |
|
"eval_samples_per_second": 628.385, |
|
"eval_steps_per_second": 3.274, |
|
"step": 360 |
|
}, |
|
{ |
|
"epoch": 0.34, |
|
"learning_rate": 1.932659932659933e-05, |
|
"loss": 0.6824, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 0.34, |
|
"eval_accuracy": 0.7095322676139728, |
|
"eval_f1_macro": 0.6638552526690601, |
|
"eval_f1_negative": 0.6730469619407968, |
|
"eval_f1_neutral": 0.7641443071048136, |
|
"eval_f1_positive": 0.5543744889615698, |
|
"eval_loss": 0.6521803736686707, |
|
"eval_precision_negative": 0.6798561151079137, |
|
"eval_precision_neutral": 0.7366789381902732, |
|
"eval_precision_positive": 0.6396226415094339, |
|
"eval_recall_negative": 0.6663728514764213, |
|
"eval_recall_neutral": 0.7937369519832985, |
|
"eval_recall_positive": 0.48917748917748916, |
|
"eval_runtime": 13.4346, |
|
"eval_samples_per_second": 628.599, |
|
"eval_steps_per_second": 3.275, |
|
"step": 400 |
|
}, |
|
{ |
|
"epoch": 0.37, |
|
"learning_rate": 1.925925925925926e-05, |
|
"loss": 0.669, |
|
"step": 440 |
|
}, |
|
{ |
|
"epoch": 0.37, |
|
"eval_accuracy": 0.713084665482534, |
|
"eval_f1_macro": 0.6622007799006476, |
|
"eval_f1_negative": 0.6819873057561829, |
|
"eval_f1_neutral": 0.7671314741035858, |
|
"eval_f1_positive": 0.5374835598421743, |
|
"eval_loss": 0.6492008566856384, |
|
"eval_precision_negative": 0.6773913043478261, |
|
"eval_precision_neutral": 0.7335238095238096, |
|
"eval_precision_positive": 0.6849162011173184, |
|
"eval_recall_negative": 0.6866460996033495, |
|
"eval_recall_neutral": 0.8039665970772443, |
|
"eval_recall_positive": 0.4422799422799423, |
|
"eval_runtime": 13.4531, |
|
"eval_samples_per_second": 627.738, |
|
"eval_steps_per_second": 3.271, |
|
"step": 440 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"learning_rate": 1.9191919191919194e-05, |
|
"loss": 0.6835, |
|
"step": 480 |
|
}, |
|
{ |
|
"epoch": 0.4, |
|
"eval_accuracy": 0.7045589105979869, |
|
"eval_f1_macro": 0.6620625908815416, |
|
"eval_f1_negative": 0.6357811729916215, |
|
"eval_f1_neutral": 0.7631345490389355, |
|
"eval_f1_positive": 0.5872720506140677, |
|
"eval_loss": 0.6506330966949463, |
|
"eval_precision_negative": 0.7210732252655114, |
|
"eval_precision_neutral": 0.722875816993464, |
|
"eval_precision_positive": 0.606456571867794, |
|
"eval_recall_negative": 0.5685323931247246, |
|
"eval_recall_neutral": 0.8081419624217119, |
|
"eval_recall_positive": 0.5692640692640693, |
|
"eval_runtime": 13.434, |
|
"eval_samples_per_second": 628.63, |
|
"eval_steps_per_second": 3.275, |
|
"step": 480 |
|
}, |
|
{ |
|
"epoch": 0.44, |
|
"learning_rate": 1.9124579124579125e-05, |
|
"loss": 0.659, |
|
"step": 520 |
|
}, |
|
{ |
|
"epoch": 0.44, |
|
"eval_accuracy": 0.7040852575488454, |
|
"eval_f1_macro": 0.6783997964045833, |
|
"eval_f1_negative": 0.699721226602947, |
|
"eval_f1_neutral": 0.7399162442142384, |
|
"eval_f1_positive": 0.595561918396564, |
|
"eval_loss": 0.6650780439376831, |
|
"eval_precision_negative": 0.6382128586996004, |
|
"eval_precision_neutral": 0.7836134453781513, |
|
"eval_precision_positive": 0.5909090909090909, |
|
"eval_recall_negative": 0.7743499338915822, |
|
"eval_recall_neutral": 0.7008350730688935, |
|
"eval_recall_positive": 0.6002886002886003, |
|
"eval_runtime": 13.4366, |
|
"eval_samples_per_second": 628.508, |
|
"eval_steps_per_second": 3.275, |
|
"step": 520 |
|
}, |
|
{ |
|
"epoch": 0.47, |
|
"learning_rate": 1.905723905723906e-05, |
|
"loss": 0.6554, |
|
"step": 560 |
|
}, |
|
{ |
|
"epoch": 0.47, |
|
"eval_accuracy": 0.7166370633510953, |
|
"eval_f1_macro": 0.6722586905255515, |
|
"eval_f1_negative": 0.6801165657924232, |
|
"eval_f1_neutral": 0.7694463910301331, |
|
"eval_f1_positive": 0.5672131147540983, |
|
"eval_loss": 0.6467012763023376, |
|
"eval_precision_negative": 0.6920620437956204, |
|
"eval_precision_neutral": 0.7391806116560877, |
|
"eval_precision_positive": 0.6565464895635673, |
|
"eval_recall_negative": 0.6685764654032613, |
|
"eval_recall_neutral": 0.8022964509394572, |
|
"eval_recall_positive": 0.49927849927849927, |
|
"eval_runtime": 13.4494, |
|
"eval_samples_per_second": 627.909, |
|
"eval_steps_per_second": 3.272, |
|
"step": 560 |
|
}, |
|
{ |
|
"epoch": 0.51, |
|
"learning_rate": 1.8989898989898993e-05, |
|
"loss": 0.659, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 0.51, |
|
"eval_accuracy": 0.712137359384251, |
|
"eval_f1_macro": 0.6705187144410446, |
|
"eval_f1_negative": 0.6719478098788444, |
|
"eval_f1_neutral": 0.7654419861848032, |
|
"eval_f1_positive": 0.5741663472594865, |
|
"eval_loss": 0.6443530917167664, |
|
"eval_precision_negative": 0.71280276816609, |
|
"eval_precision_neutral": 0.7353337180226966, |
|
"eval_precision_positive": 0.6124284546197875, |
|
"eval_recall_negative": 0.6355222565006611, |
|
"eval_recall_neutral": 0.7981210855949895, |
|
"eval_recall_positive": 0.5404040404040404, |
|
"eval_runtime": 13.4345, |
|
"eval_samples_per_second": 628.604, |
|
"eval_steps_per_second": 3.275, |
|
"step": 600 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"learning_rate": 1.8922558922558924e-05, |
|
"loss": 0.6692, |
|
"step": 640 |
|
}, |
|
{ |
|
"epoch": 0.54, |
|
"eval_accuracy": 0.7047957371225577, |
|
"eval_f1_macro": 0.6746517865902923, |
|
"eval_f1_negative": 0.6761710794297353, |
|
"eval_f1_neutral": 0.7508104151416919, |
|
"eval_f1_positive": 0.5969738651994497, |
|
"eval_loss": 0.6483765244483948, |
|
"eval_precision_negative": 0.6948837209302325, |
|
"eval_precision_neutral": 0.7521474963335428, |
|
"eval_precision_positive": 0.5703022339027596, |
|
"eval_recall_negative": 0.6584398413397973, |
|
"eval_recall_neutral": 0.7494780793319415, |
|
"eval_recall_positive": 0.6262626262626263, |
|
"eval_runtime": 13.5781, |
|
"eval_samples_per_second": 621.958, |
|
"eval_steps_per_second": 3.241, |
|
"step": 640 |
|
}, |
|
{ |
|
"epoch": 0.57, |
|
"learning_rate": 1.8855218855218858e-05, |
|
"loss": 0.6343, |
|
"step": 680 |
|
}, |
|
{ |
|
"epoch": 0.57, |
|
"eval_accuracy": 0.7084665482534044, |
|
"eval_f1_macro": 0.6745823109427566, |
|
"eval_f1_negative": 0.6674407803065491, |
|
"eval_f1_neutral": 0.7580216636010628, |
|
"eval_f1_positive": 0.5982844889206576, |
|
"eval_loss": 0.6420348286628723, |
|
"eval_precision_negative": 0.7054491899852725, |
|
"eval_precision_neutral": 0.7423939151321057, |
|
"eval_precision_positive": 0.5927762039660056, |
|
"eval_recall_negative": 0.6333186425738211, |
|
"eval_recall_neutral": 0.774321503131524, |
|
"eval_recall_positive": 0.6038961038961039, |
|
"eval_runtime": 13.5238, |
|
"eval_samples_per_second": 624.455, |
|
"eval_steps_per_second": 3.254, |
|
"step": 680 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"learning_rate": 1.8787878787878792e-05, |
|
"loss": 0.6707, |
|
"step": 720 |
|
}, |
|
{ |
|
"epoch": 0.61, |
|
"eval_accuracy": 0.7161634103019539, |
|
"eval_f1_macro": 0.6635859690261697, |
|
"eval_f1_negative": 0.6552984165651644, |
|
"eval_f1_neutral": 0.7757296466973886, |
|
"eval_f1_positive": 0.5597298438159561, |
|
"eval_loss": 0.630727231502533, |
|
"eval_precision_negative": 0.7325708061002179, |
|
"eval_precision_neutral": 0.7180945609669392, |
|
"eval_precision_positive": 0.6744659206510681, |
|
"eval_recall_negative": 0.5927721463199648, |
|
"eval_recall_neutral": 0.8434237995824635, |
|
"eval_recall_positive": 0.47835497835497837, |
|
"eval_runtime": 13.5358, |
|
"eval_samples_per_second": 623.902, |
|
"eval_steps_per_second": 3.251, |
|
"step": 720 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"learning_rate": 1.8720538720538723e-05, |
|
"loss": 0.6555, |
|
"step": 760 |
|
}, |
|
{ |
|
"epoch": 0.64, |
|
"eval_accuracy": 0.7173475429248076, |
|
"eval_f1_macro": 0.6760934295779212, |
|
"eval_f1_negative": 0.6785469499657298, |
|
"eval_f1_neutral": 0.7685231476852316, |
|
"eval_f1_positive": 0.5812101910828025, |
|
"eval_loss": 0.6327303051948547, |
|
"eval_precision_negative": 0.7044592030360531, |
|
"eval_precision_neutral": 0.7374784110535406, |
|
"eval_precision_positive": 0.6483126110124334, |
|
"eval_recall_negative": 0.6544733362714852, |
|
"eval_recall_neutral": 0.8022964509394572, |
|
"eval_recall_positive": 0.5266955266955267, |
|
"eval_runtime": 13.5283, |
|
"eval_samples_per_second": 624.249, |
|
"eval_steps_per_second": 3.252, |
|
"step": 760 |
|
}, |
|
{ |
|
"epoch": 0.67, |
|
"learning_rate": 1.8653198653198653e-05, |
|
"loss": 0.6539, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 0.67, |
|
"eval_accuracy": 0.713676731793961, |
|
"eval_f1_macro": 0.6798716085872009, |
|
"eval_f1_negative": 0.6834306241580603, |
|
"eval_f1_neutral": 0.7602507450416196, |
|
"eval_f1_positive": 0.5959334565619224, |
|
"eval_loss": 0.63933926820755, |
|
"eval_precision_negative": 0.6965675057208238, |
|
"eval_precision_neutral": 0.7486338797814208, |
|
"eval_precision_positive": 0.6110689916603488, |
|
"eval_recall_negative": 0.6707800793301014, |
|
"eval_recall_neutral": 0.7722338204592902, |
|
"eval_recall_positive": 0.5815295815295816, |
|
"eval_runtime": 13.556, |
|
"eval_samples_per_second": 622.971, |
|
"eval_steps_per_second": 3.246, |
|
"step": 800 |
|
}, |
|
{ |
|
"epoch": 0.71, |
|
"learning_rate": 1.8585858585858588e-05, |
|
"loss": 0.6586, |
|
"step": 840 |
|
}, |
|
{ |
|
"epoch": 0.71, |
|
"eval_accuracy": 0.7122557726465364, |
|
"eval_f1_macro": 0.6643997026372683, |
|
"eval_f1_negative": 0.6466569058077111, |
|
"eval_f1_neutral": 0.7709443099273607, |
|
"eval_f1_positive": 0.575597892176733, |
|
"eval_loss": 0.6333789229393005, |
|
"eval_precision_negative": 0.7244395844723893, |
|
"eval_precision_neutral": 0.7190605239385727, |
|
"eval_precision_positive": 0.6567992599444958, |
|
"eval_recall_negative": 0.5839576906126047, |
|
"eval_recall_neutral": 0.8308977035490606, |
|
"eval_recall_positive": 0.5122655122655123, |
|
"eval_runtime": 13.615, |
|
"eval_samples_per_second": 620.272, |
|
"eval_steps_per_second": 3.232, |
|
"step": 840 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"learning_rate": 1.851851851851852e-05, |
|
"loss": 0.6579, |
|
"step": 880 |
|
}, |
|
{ |
|
"epoch": 0.74, |
|
"eval_accuracy": 0.7187685020722321, |
|
"eval_f1_macro": 0.6807447825123648, |
|
"eval_f1_negative": 0.6873633581110626, |
|
"eval_f1_neutral": 0.7675631455159013, |
|
"eval_f1_positive": 0.5873078439101301, |
|
"eval_loss": 0.6417641639709473, |
|
"eval_precision_negative": 0.6819956616052061, |
|
"eval_precision_neutral": 0.7522549609140108, |
|
"eval_precision_positive": 0.6472632493483927, |
|
"eval_recall_negative": 0.6928162185985015, |
|
"eval_recall_neutral": 0.7835073068893528, |
|
"eval_recall_positive": 0.5375180375180375, |
|
"eval_runtime": 13.429, |
|
"eval_samples_per_second": 628.863, |
|
"eval_steps_per_second": 3.276, |
|
"step": 880 |
|
}, |
|
{ |
|
"epoch": 0.77, |
|
"learning_rate": 1.8451178451178452e-05, |
|
"loss": 0.6408, |
|
"step": 920 |
|
}, |
|
{ |
|
"epoch": 0.77, |
|
"eval_accuracy": 0.7156897572528124, |
|
"eval_f1_macro": 0.6733312463576527, |
|
"eval_f1_negative": 0.6765443355368133, |
|
"eval_f1_neutral": 0.7680304091227369, |
|
"eval_f1_positive": 0.5754189944134079, |
|
"eval_loss": 0.6319063901901245, |
|
"eval_precision_negative": 0.7006610009442871, |
|
"eval_precision_neutral": 0.7372767428461686, |
|
"eval_precision_positive": 0.64375, |
|
"eval_recall_negative": 0.6540326134861172, |
|
"eval_recall_neutral": 0.8014613778705637, |
|
"eval_recall_positive": 0.5202020202020202, |
|
"eval_runtime": 13.4319, |
|
"eval_samples_per_second": 628.725, |
|
"eval_steps_per_second": 3.276, |
|
"step": 920 |
|
}, |
|
{ |
|
"epoch": 0.81, |
|
"learning_rate": 1.8383838383838387e-05, |
|
"loss": 0.6458, |
|
"step": 960 |
|
}, |
|
{ |
|
"epoch": 0.81, |
|
"eval_accuracy": 0.7116637063351096, |
|
"eval_f1_macro": 0.6808189121483205, |
|
"eval_f1_negative": 0.6855624446412755, |
|
"eval_f1_neutral": 0.7558841907935847, |
|
"eval_f1_positive": 0.601010101010101, |
|
"eval_loss": 0.6365010142326355, |
|
"eval_precision_negative": 0.6889185580774366, |
|
"eval_precision_neutral": 0.7541562759767249, |
|
"eval_precision_positive": 0.601010101010101, |
|
"eval_recall_negative": 0.6822388717496695, |
|
"eval_recall_neutral": 0.7576200417536535, |
|
"eval_recall_positive": 0.601010101010101, |
|
"eval_runtime": 13.4342, |
|
"eval_samples_per_second": 628.619, |
|
"eval_steps_per_second": 3.275, |
|
"step": 960 |
|
}, |
|
{ |
|
"epoch": 0.84, |
|
"learning_rate": 1.831649831649832e-05, |
|
"loss": 0.6663, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.84, |
|
"eval_accuracy": 0.7177027827116637, |
|
"eval_f1_macro": 0.6745871543495067, |
|
"eval_f1_negative": 0.6834215167548501, |
|
"eval_f1_neutral": 0.7686739720518749, |
|
"eval_f1_positive": 0.5716659742417948, |
|
"eval_loss": 0.6319110989570618, |
|
"eval_precision_negative": 0.6837229819144244, |
|
"eval_precision_neutral": 0.7413224743067675, |
|
"eval_precision_positive": 0.67384916748286, |
|
"eval_recall_negative": 0.6831203173204055, |
|
"eval_recall_neutral": 0.7981210855949895, |
|
"eval_recall_positive": 0.4963924963924964, |
|
"eval_runtime": 13.4422, |
|
"eval_samples_per_second": 628.246, |
|
"eval_steps_per_second": 3.273, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.88, |
|
"learning_rate": 1.824915824915825e-05, |
|
"loss": 0.6456, |
|
"step": 1040 |
|
}, |
|
{ |
|
"epoch": 0.88, |
|
"eval_accuracy": 0.7104795737122558, |
|
"eval_f1_macro": 0.6846884030136478, |
|
"eval_f1_negative": 0.6933867735470942, |
|
"eval_f1_neutral": 0.7508249068653539, |
|
"eval_f1_positive": 0.6098535286284953, |
|
"eval_loss": 0.6414014101028442, |
|
"eval_precision_negative": 0.7007200720072008, |
|
"eval_precision_neutral": 0.7659066232356134, |
|
"eval_precision_positive": 0.5661310259579728, |
|
"eval_recall_negative": 0.6862053768179814, |
|
"eval_recall_neutral": 0.7363256784968685, |
|
"eval_recall_positive": 0.6608946608946609, |
|
"eval_runtime": 13.4341, |
|
"eval_samples_per_second": 628.625, |
|
"eval_steps_per_second": 3.275, |
|
"step": 1040 |
|
}, |
|
{ |
|
"epoch": 0.91, |
|
"learning_rate": 1.8181818181818182e-05, |
|
"loss": 0.6416, |
|
"step": 1080 |
|
}, |
|
{ |
|
"epoch": 0.91, |
|
"eval_accuracy": 0.7153345174659562, |
|
"eval_f1_macro": 0.6849725647884108, |
|
"eval_f1_negative": 0.6939308244507288, |
|
"eval_f1_neutral": 0.7585337674614012, |
|
"eval_f1_positive": 0.6024531024531025, |
|
"eval_loss": 0.6341109871864319, |
|
"eval_precision_negative": 0.6851374570446735, |
|
"eval_precision_neutral": 0.7632635806383429, |
|
"eval_precision_positive": 0.6024531024531025, |
|
"eval_recall_negative": 0.7029528426619657, |
|
"eval_recall_neutral": 0.7538622129436325, |
|
"eval_recall_positive": 0.6024531024531025, |
|
"eval_runtime": 13.5517, |
|
"eval_samples_per_second": 623.169, |
|
"eval_steps_per_second": 3.247, |
|
"step": 1080 |
|
}, |
|
{ |
|
"epoch": 0.94, |
|
"learning_rate": 1.8114478114478116e-05, |
|
"loss": 0.6387, |
|
"step": 1120 |
|
}, |
|
{ |
|
"epoch": 0.94, |
|
"eval_accuracy": 0.7132030787448195, |
|
"eval_f1_macro": 0.6812920768310707, |
|
"eval_f1_negative": 0.6735266604303087, |
|
"eval_f1_neutral": 0.7610456176319835, |
|
"eval_f1_positive": 0.60930395243092, |
|
"eval_loss": 0.6404346227645874, |
|
"eval_precision_negative": 0.7174887892376681, |
|
"eval_precision_neutral": 0.7476334340382679, |
|
"eval_precision_positive": 0.5913102511880516, |
|
"eval_recall_negative": 0.6346408109299251, |
|
"eval_recall_neutral": 0.7749478079331942, |
|
"eval_recall_positive": 0.6284271284271284, |
|
"eval_runtime": 13.5098, |
|
"eval_samples_per_second": 625.102, |
|
"eval_steps_per_second": 3.257, |
|
"step": 1120 |
|
}, |
|
{ |
|
"epoch": 0.98, |
|
"learning_rate": 1.804713804713805e-05, |
|
"loss": 0.6483, |
|
"step": 1160 |
|
}, |
|
{ |
|
"epoch": 0.98, |
|
"eval_accuracy": 0.7200710479573712, |
|
"eval_f1_macro": 0.6806619404824857, |
|
"eval_f1_negative": 0.6825213576541214, |
|
"eval_f1_neutral": 0.7708228674771426, |
|
"eval_f1_positive": 0.5886415963161934, |
|
"eval_loss": 0.6273576021194458, |
|
"eval_precision_negative": 0.7167798254122212, |
|
"eval_precision_neutral": 0.7429788882432694, |
|
"eval_precision_positive": 0.6286885245901639, |
|
"eval_recall_negative": 0.6513882767739092, |
|
"eval_recall_neutral": 0.8008350730688936, |
|
"eval_recall_positive": 0.5533910533910534, |
|
"eval_runtime": 13.5101, |
|
"eval_samples_per_second": 625.087, |
|
"eval_steps_per_second": 3.257, |
|
"step": 1160 |
|
}, |
|
{ |
|
"epoch": 1.01, |
|
"learning_rate": 1.797979797979798e-05, |
|
"loss": 0.6418, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 1.01, |
|
"eval_accuracy": 0.7216104203670811, |
|
"eval_f1_macro": 0.6749026822057264, |
|
"eval_f1_negative": 0.6914728682170542, |
|
"eval_f1_neutral": 0.7730991818000399, |
|
"eval_f1_positive": 0.560135996600085, |
|
"eval_loss": 0.6303337812423706, |
|
"eval_precision_negative": 0.695013357079252, |
|
"eval_precision_neutral": 0.7404434250764526, |
|
"eval_precision_positive": 0.6814891416752844, |
|
"eval_recall_negative": 0.6879682679594535, |
|
"eval_recall_neutral": 0.808768267223382, |
|
"eval_recall_positive": 0.4754689754689755, |
|
"eval_runtime": 14.4031, |
|
"eval_samples_per_second": 586.332, |
|
"eval_steps_per_second": 3.055, |
|
"step": 1200 |
|
}, |
|
{ |
|
"epoch": 1.04, |
|
"learning_rate": 1.7912457912457915e-05, |
|
"loss": 0.6201, |
|
"step": 1240 |
|
}, |
|
{ |
|
"epoch": 1.04, |
|
"eval_accuracy": 0.7193605683836589, |
|
"eval_f1_macro": 0.6783071530429613, |
|
"eval_f1_negative": 0.6780135229657263, |
|
"eval_f1_neutral": 0.7719368378972615, |
|
"eval_f1_positive": 0.584971098265896, |
|
"eval_loss": 0.6306412220001221, |
|
"eval_precision_negative": 0.7198019801980198, |
|
"eval_precision_neutral": 0.7404141104294478, |
|
"eval_precision_positive": 0.6277915632754343, |
|
"eval_recall_negative": 0.6408109299250772, |
|
"eval_recall_neutral": 0.8062630480167015, |
|
"eval_recall_positive": 0.5476190476190477, |
|
"eval_runtime": 13.6129, |
|
"eval_samples_per_second": 620.369, |
|
"eval_steps_per_second": 3.232, |
|
"step": 1240 |
|
}, |
|
{ |
|
"epoch": 1.08, |
|
"learning_rate": 1.7845117845117846e-05, |
|
"loss": 0.5971, |
|
"step": 1280 |
|
}, |
|
{ |
|
"epoch": 1.08, |
|
"eval_accuracy": 0.7166370633510953, |
|
"eval_f1_macro": 0.6745910338462799, |
|
"eval_f1_negative": 0.6869394005688033, |
|
"eval_f1_neutral": 0.7662285136501515, |
|
"eval_f1_positive": 0.5706051873198847, |
|
"eval_loss": 0.6360566020011902, |
|
"eval_precision_negative": 0.682015638575152, |
|
"eval_precision_neutral": 0.7429411764705882, |
|
"eval_precision_positive": 0.6644295302013423, |
|
"eval_recall_negative": 0.6919347730277655, |
|
"eval_recall_neutral": 0.7910229645093946, |
|
"eval_recall_positive": 0.5, |
|
"eval_runtime": 13.5493, |
|
"eval_samples_per_second": 623.278, |
|
"eval_steps_per_second": 3.247, |
|
"step": 1280 |
|
}, |
|
{ |
|
"epoch": 1.11, |
|
"learning_rate": 1.7777777777777777e-05, |
|
"loss": 0.6101, |
|
"step": 1320 |
|
}, |
|
{ |
|
"epoch": 1.11, |
|
"eval_accuracy": 0.7226761397276495, |
|
"eval_f1_macro": 0.6791712549911954, |
|
"eval_f1_negative": 0.6990124516960068, |
|
"eval_f1_neutral": 0.7709451929895654, |
|
"eval_f1_positive": 0.5675561202880136, |
|
"eval_loss": 0.6358277201652527, |
|
"eval_precision_negative": 0.6814566764336543, |
|
"eval_precision_neutral": 0.748868333005314, |
|
"eval_precision_positive": 0.6871794871794872, |
|
"eval_recall_negative": 0.7174966945791097, |
|
"eval_recall_neutral": 0.7943632567849687, |
|
"eval_recall_positive": 0.4834054834054834, |
|
"eval_runtime": 13.4061, |
|
"eval_samples_per_second": 629.938, |
|
"eval_steps_per_second": 3.282, |
|
"step": 1320 |
|
}, |
|
{ |
|
"epoch": 1.14, |
|
"learning_rate": 1.771043771043771e-05, |
|
"loss": 0.5977, |
|
"step": 1360 |
|
}, |
|
{ |
|
"epoch": 1.14, |
|
"eval_accuracy": 0.7124925991711072, |
|
"eval_f1_macro": 0.6812595953156201, |
|
"eval_f1_negative": 0.6902101028162717, |
|
"eval_f1_neutral": 0.756903198916328, |
|
"eval_f1_positive": 0.5966654842142604, |
|
"eval_loss": 0.640369713306427, |
|
"eval_precision_negative": 0.7002267573696145, |
|
"eval_precision_neutral": 0.7555648013313917, |
|
"eval_precision_positive": 0.586880669923238, |
|
"eval_recall_negative": 0.6804759806081975, |
|
"eval_recall_neutral": 0.7582463465553236, |
|
"eval_recall_positive": 0.6067821067821068, |
|
"eval_runtime": 13.458, |
|
"eval_samples_per_second": 627.51, |
|
"eval_steps_per_second": 3.269, |
|
"step": 1360 |
|
}, |
|
{ |
|
"epoch": 1.18, |
|
"learning_rate": 1.7643097643097645e-05, |
|
"loss": 0.6229, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 1.18, |
|
"eval_accuracy": 0.720307874481942, |
|
"eval_f1_macro": 0.6787577486913711, |
|
"eval_f1_negative": 0.6789838337182449, |
|
"eval_f1_neutral": 0.7721746063384493, |
|
"eval_f1_positive": 0.5851148060174189, |
|
"eval_loss": 0.625924825668335, |
|
"eval_precision_negative": 0.7132459970887919, |
|
"eval_precision_neutral": 0.7387490465293669, |
|
"eval_precision_positive": 0.6482456140350877, |
|
"eval_recall_negative": 0.6478624944909652, |
|
"eval_recall_neutral": 0.808768267223382, |
|
"eval_recall_positive": 0.5331890331890332, |
|
"eval_runtime": 13.413, |
|
"eval_samples_per_second": 629.615, |
|
"eval_steps_per_second": 3.28, |
|
"step": 1400 |
|
}, |
|
{ |
|
"epoch": 1.21, |
|
"learning_rate": 1.7575757575757576e-05, |
|
"loss": 0.5971, |
|
"step": 1440 |
|
}, |
|
{ |
|
"epoch": 1.21, |
|
"eval_accuracy": 0.7111900532859681, |
|
"eval_f1_macro": 0.685070727390424, |
|
"eval_f1_negative": 0.6965195246179966, |
|
"eval_f1_neutral": 0.7495985440530993, |
|
"eval_f1_positive": 0.6090941135001762, |
|
"eval_loss": 0.6486834287643433, |
|
"eval_precision_negative": 0.6717151043798608, |
|
"eval_precision_neutral": 0.7692814765985497, |
|
"eval_precision_positive": 0.5954514128187457, |
|
"eval_recall_negative": 0.7232260907888938, |
|
"eval_recall_neutral": 0.7308977035490606, |
|
"eval_recall_positive": 0.6233766233766234, |
|
"eval_runtime": 13.4217, |
|
"eval_samples_per_second": 629.204, |
|
"eval_steps_per_second": 3.278, |
|
"step": 1440 |
|
}, |
|
{ |
|
"epoch": 1.25, |
|
"learning_rate": 1.750841750841751e-05, |
|
"loss": 0.6006, |
|
"step": 1480 |
|
}, |
|
{ |
|
"epoch": 1.25, |
|
"eval_accuracy": 0.7155713439905269, |
|
"eval_f1_macro": 0.683204217410409, |
|
"eval_f1_negative": 0.6757380073800737, |
|
"eval_f1_neutral": 0.7631821439541312, |
|
"eval_f1_positive": 0.6106925008970219, |
|
"eval_loss": 0.6353930830955505, |
|
"eval_precision_negative": 0.7087566521528785, |
|
"eval_precision_neutral": 0.7488446855535463, |
|
"eval_precision_positive": 0.6074232690935046, |
|
"eval_recall_negative": 0.6456588805641251, |
|
"eval_recall_neutral": 0.7780793319415449, |
|
"eval_recall_positive": 0.613997113997114, |
|
"eval_runtime": 13.4559, |
|
"eval_samples_per_second": 627.605, |
|
"eval_steps_per_second": 3.27, |
|
"step": 1480 |
|
}, |
|
{ |
|
"epoch": 1.28, |
|
"learning_rate": 1.7441077441077444e-05, |
|
"loss": 0.6104, |
|
"step": 1520 |
|
}, |
|
{ |
|
"epoch": 1.28, |
|
"eval_accuracy": 0.7127294256956779, |
|
"eval_f1_macro": 0.6839464489013288, |
|
"eval_f1_negative": 0.6825213576541214, |
|
"eval_f1_neutral": 0.7576642335766423, |
|
"eval_f1_positive": 0.6116537554732233, |
|
"eval_loss": 0.6454949975013733, |
|
"eval_precision_negative": 0.7167798254122212, |
|
"eval_precision_neutral": 0.756875, |
|
"eval_precision_positive": 0.5735944409349337, |
|
"eval_recall_negative": 0.6513882767739092, |
|
"eval_recall_neutral": 0.758455114822547, |
|
"eval_recall_positive": 0.6551226551226551, |
|
"eval_runtime": 13.4867, |
|
"eval_samples_per_second": 626.174, |
|
"eval_steps_per_second": 3.262, |
|
"step": 1520 |
|
}, |
|
{ |
|
"epoch": 1.31, |
|
"learning_rate": 1.7373737373737375e-05, |
|
"loss": 0.6101, |
|
"step": 1560 |
|
}, |
|
{ |
|
"epoch": 1.31, |
|
"eval_accuracy": 0.7206631142687981, |
|
"eval_f1_macro": 0.6779869326137852, |
|
"eval_f1_negative": 0.6807543740059078, |
|
"eval_f1_neutral": 0.772482552342971, |
|
"eval_f1_positive": 0.5807238714924766, |
|
"eval_loss": 0.6268090605735779, |
|
"eval_precision_negative": 0.702626641651032, |
|
"eval_precision_neutral": 0.7393129770992366, |
|
"eval_precision_positive": 0.6654240447343895, |
|
"eval_recall_negative": 0.6602027324812693, |
|
"eval_recall_neutral": 0.808768267223382, |
|
"eval_recall_positive": 0.5151515151515151, |
|
"eval_runtime": 13.4458, |
|
"eval_samples_per_second": 628.077, |
|
"eval_steps_per_second": 3.272, |
|
"step": 1560 |
|
}, |
|
{ |
|
"epoch": 1.35, |
|
"learning_rate": 1.7306397306397305e-05, |
|
"loss": 0.6022, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 1.35, |
|
"eval_accuracy": 0.7143872113676731, |
|
"eval_f1_macro": 0.6836129674253361, |
|
"eval_f1_negative": 0.6836007130124777, |
|
"eval_f1_neutral": 0.7594515995014541, |
|
"eval_f1_positive": 0.6077865897620764, |
|
"eval_loss": 0.6394125819206238, |
|
"eval_precision_negative": 0.6913023884632717, |
|
"eval_precision_neutral": 0.7556841670111616, |
|
"eval_precision_positive": 0.6073487031700289, |
|
"eval_recall_negative": 0.6760687527545174, |
|
"eval_recall_neutral": 0.7632567849686848, |
|
"eval_recall_positive": 0.6082251082251082, |
|
"eval_runtime": 13.4382, |
|
"eval_samples_per_second": 628.432, |
|
"eval_steps_per_second": 3.274, |
|
"step": 1600 |
|
}, |
|
{ |
|
"epoch": 1.38, |
|
"learning_rate": 1.723905723905724e-05, |
|
"loss": 0.6236, |
|
"step": 1640 |
|
}, |
|
{ |
|
"epoch": 1.38, |
|
"eval_accuracy": 0.7134399052693902, |
|
"eval_f1_macro": 0.6861857480530462, |
|
"eval_f1_negative": 0.683572710951526, |
|
"eval_f1_neutral": 0.7565409267626353, |
|
"eval_f1_positive": 0.6184436064449776, |
|
"eval_loss": 0.6394263505935669, |
|
"eval_precision_negative": 0.6963877457704618, |
|
"eval_precision_neutral": 0.7615823989845568, |
|
"eval_precision_positive": 0.589157413455258, |
|
"eval_recall_negative": 0.6712208021154694, |
|
"eval_recall_neutral": 0.7515657620041754, |
|
"eval_recall_positive": 0.6507936507936508, |
|
"eval_runtime": 13.4189, |
|
"eval_samples_per_second": 629.337, |
|
"eval_steps_per_second": 3.279, |
|
"step": 1640 |
|
}, |
|
{ |
|
"epoch": 1.41, |
|
"learning_rate": 1.7171717171717173e-05, |
|
"loss": 0.6039, |
|
"step": 1680 |
|
}, |
|
{ |
|
"epoch": 1.41, |
|
"eval_accuracy": 0.7182948490230906, |
|
"eval_f1_macro": 0.6829107741796993, |
|
"eval_f1_negative": 0.6881057268722467, |
|
"eval_f1_neutral": 0.7655158240854912, |
|
"eval_f1_positive": 0.5951107715813598, |
|
"eval_loss": 0.6307365298271179, |
|
"eval_precision_negative": 0.6878027300748569, |
|
"eval_precision_neutral": 0.7537434237150951, |
|
"eval_precision_positive": 0.6323051948051948, |
|
"eval_recall_negative": 0.6884089907448215, |
|
"eval_recall_neutral": 0.7776617954070981, |
|
"eval_recall_positive": 0.562049062049062, |
|
"eval_runtime": 13.423, |
|
"eval_samples_per_second": 629.145, |
|
"eval_steps_per_second": 3.278, |
|
"step": 1680 |
|
}, |
|
{ |
|
"epoch": 1.45, |
|
"learning_rate": 1.7104377104377104e-05, |
|
"loss": 0.6059, |
|
"step": 1720 |
|
}, |
|
{ |
|
"epoch": 1.45, |
|
"eval_accuracy": 0.7173475429248076, |
|
"eval_f1_macro": 0.6865160173058559, |
|
"eval_f1_negative": 0.6937445699391833, |
|
"eval_f1_neutral": 0.7605015673981192, |
|
"eval_f1_positive": 0.6053019145802652, |
|
"eval_loss": 0.6336551904678345, |
|
"eval_precision_negative": 0.6839400428265524, |
|
"eval_precision_neutral": 0.7612970711297071, |
|
"eval_precision_positive": 0.6180451127819548, |
|
"eval_recall_negative": 0.7038342882327017, |
|
"eval_recall_neutral": 0.7597077244258873, |
|
"eval_recall_positive": 0.5930735930735931, |
|
"eval_runtime": 13.4767, |
|
"eval_samples_per_second": 626.636, |
|
"eval_steps_per_second": 3.265, |
|
"step": 1720 |
|
}, |
|
{ |
|
"epoch": 1.48, |
|
"learning_rate": 1.7037037037037038e-05, |
|
"loss": 0.6042, |
|
"step": 1760 |
|
}, |
|
{ |
|
"epoch": 1.48, |
|
"eval_accuracy": 0.7197158081705151, |
|
"eval_f1_macro": 0.685440373432607, |
|
"eval_f1_negative": 0.694493006993007, |
|
"eval_f1_neutral": 0.7645846217274789, |
|
"eval_f1_positive": 0.5972434915773354, |
|
"eval_loss": 0.63006192445755, |
|
"eval_precision_negative": 0.6887732986562636, |
|
"eval_precision_neutral": 0.7550895765472313, |
|
"eval_precision_positive": 0.636215334420881, |
|
"eval_recall_negative": 0.7003085059497576, |
|
"eval_recall_neutral": 0.774321503131524, |
|
"eval_recall_positive": 0.5627705627705628, |
|
"eval_runtime": 13.4204, |
|
"eval_samples_per_second": 629.266, |
|
"eval_steps_per_second": 3.279, |
|
"step": 1760 |
|
}, |
|
{ |
|
"epoch": 1.52, |
|
"learning_rate": 1.6969696969696972e-05, |
|
"loss": 0.5907, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 1.52, |
|
"eval_accuracy": 0.7238602723505032, |
|
"eval_f1_macro": 0.6788816276493144, |
|
"eval_f1_negative": 0.6713483146067416, |
|
"eval_f1_neutral": 0.7784207945071114, |
|
"eval_f1_positive": 0.58687577383409, |
|
"eval_loss": 0.6279187202453613, |
|
"eval_precision_negative": 0.7159261108337494, |
|
"eval_precision_neutral": 0.7341350601295097, |
|
"eval_precision_positive": 0.6856316297010607, |
|
"eval_recall_negative": 0.6319964742177171, |
|
"eval_recall_neutral": 0.82839248434238, |
|
"eval_recall_positive": 0.512987012987013, |
|
"eval_runtime": 13.4379, |
|
"eval_samples_per_second": 628.446, |
|
"eval_steps_per_second": 3.274, |
|
"step": 1800 |
|
}, |
|
{ |
|
"epoch": 1.55, |
|
"learning_rate": 1.6902356902356903e-05, |
|
"loss": 0.6135, |
|
"step": 1840 |
|
}, |
|
{ |
|
"epoch": 1.55, |
|
"eval_accuracy": 0.7229129662522202, |
|
"eval_f1_macro": 0.6795419420133372, |
|
"eval_f1_negative": 0.6882803943044906, |
|
"eval_f1_neutral": 0.7737461051361945, |
|
"eval_f1_positive": 0.5765993265993266, |
|
"eval_loss": 0.6268677711486816, |
|
"eval_precision_negative": 0.6842334494773519, |
|
"eval_precision_neutral": 0.7460748207016864, |
|
"eval_precision_positive": 0.6919191919191919, |
|
"eval_recall_negative": 0.6923754958131335, |
|
"eval_recall_neutral": 0.8035490605427975, |
|
"eval_recall_positive": 0.49422799422799424, |
|
"eval_runtime": 13.44, |
|
"eval_samples_per_second": 628.349, |
|
"eval_steps_per_second": 3.274, |
|
"step": 1840 |
|
}, |
|
{ |
|
"epoch": 1.58, |
|
"learning_rate": 1.6835016835016837e-05, |
|
"loss": 0.5996, |
|
"step": 1880 |
|
}, |
|
{ |
|
"epoch": 1.58, |
|
"eval_accuracy": 0.7220840734162226, |
|
"eval_f1_macro": 0.6869855176473937, |
|
"eval_f1_negative": 0.6864864864864865, |
|
"eval_f1_neutral": 0.7696068445711958, |
|
"eval_f1_positive": 0.6048632218844986, |
|
"eval_loss": 0.6290135979652405, |
|
"eval_precision_negative": 0.7019806540764625, |
|
"eval_precision_neutral": 0.7513922036595068, |
|
"eval_precision_positive": 0.6388443017656501, |
|
"eval_recall_negative": 0.6716615249008374, |
|
"eval_recall_neutral": 0.7887265135699374, |
|
"eval_recall_positive": 0.5743145743145743, |
|
"eval_runtime": 13.4252, |
|
"eval_samples_per_second": 629.039, |
|
"eval_steps_per_second": 3.277, |
|
"step": 1880 |
|
}, |
|
{ |
|
"epoch": 1.62, |
|
"learning_rate": 1.6767676767676768e-05, |
|
"loss": 0.6136, |
|
"step": 1920 |
|
}, |
|
{ |
|
"epoch": 1.62, |
|
"eval_accuracy": 0.7223208999407934, |
|
"eval_f1_macro": 0.6908988856510865, |
|
"eval_f1_negative": 0.7006585935840238, |
|
"eval_f1_neutral": 0.7644044755829762, |
|
"eval_f1_positive": 0.6076335877862595, |
|
"eval_loss": 0.6263943910598755, |
|
"eval_precision_negative": 0.6763740771123872, |
|
"eval_precision_neutral": 0.7657657657657657, |
|
"eval_precision_positive": 0.6450567260940032, |
|
"eval_recall_negative": 0.7267518730718379, |
|
"eval_recall_neutral": 0.7630480167014614, |
|
"eval_recall_positive": 0.5743145743145743, |
|
"eval_runtime": 13.5533, |
|
"eval_samples_per_second": 623.095, |
|
"eval_steps_per_second": 3.246, |
|
"step": 1920 |
|
}, |
|
{ |
|
"epoch": 1.65, |
|
"learning_rate": 1.6700336700336702e-05, |
|
"loss": 0.6036, |
|
"step": 1960 |
|
}, |
|
{ |
|
"epoch": 1.65, |
|
"eval_accuracy": 0.7141503848431024, |
|
"eval_f1_macro": 0.6879732554886911, |
|
"eval_f1_negative": 0.6988408851422551, |
|
"eval_f1_neutral": 0.7530068728522336, |
|
"eval_f1_positive": 0.6120720084715848, |
|
"eval_loss": 0.6364882588386536, |
|
"eval_precision_negative": 0.6696284329563813, |
|
"eval_precision_neutral": 0.7753206545776206, |
|
"eval_precision_positive": 0.5991706979958535, |
|
"eval_recall_negative": 0.7307183781401498, |
|
"eval_recall_neutral": 0.7319415448851775, |
|
"eval_recall_positive": 0.6255411255411255, |
|
"eval_runtime": 13.4324, |
|
"eval_samples_per_second": 628.703, |
|
"eval_steps_per_second": 3.276, |
|
"step": 1960 |
|
}, |
|
{ |
|
"epoch": 1.68, |
|
"learning_rate": 1.6632996632996633e-05, |
|
"loss": 0.6123, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 1.68, |
|
"eval_accuracy": 0.7198342214328005, |
|
"eval_f1_macro": 0.6811378179180303, |
|
"eval_f1_negative": 0.694331550802139, |
|
"eval_f1_neutral": 0.7660226924256361, |
|
"eval_f1_positive": 0.5830592105263157, |
|
"eval_loss": 0.6256130933761597, |
|
"eval_precision_negative": 0.6745635910224439, |
|
"eval_precision_neutral": 0.7504506308832365, |
|
"eval_precision_positive": 0.6778202676864244, |
|
"eval_recall_negative": 0.7152930806522697, |
|
"eval_recall_neutral": 0.7822546972860125, |
|
"eval_recall_positive": 0.5115440115440115, |
|
"eval_runtime": 13.4059, |
|
"eval_samples_per_second": 629.947, |
|
"eval_steps_per_second": 3.282, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 1.72, |
|
"learning_rate": 1.6565656565656567e-05, |
|
"loss": 0.5898, |
|
"step": 2040 |
|
}, |
|
{ |
|
"epoch": 1.72, |
|
"eval_accuracy": 0.7255180580224985, |
|
"eval_f1_macro": 0.6783018381472949, |
|
"eval_f1_negative": 0.6911698789780368, |
|
"eval_f1_neutral": 0.777568611909244, |
|
"eval_f1_positive": 0.5661670235546039, |
|
"eval_loss": 0.6203241944313049, |
|
"eval_precision_negative": 0.7031463748290013, |
|
"eval_precision_neutral": 0.7399585140486518, |
|
"eval_precision_positive": 0.6965226554267651, |
|
"eval_recall_negative": 0.6795945350374615, |
|
"eval_recall_neutral": 0.8192066805845512, |
|
"eval_recall_positive": 0.4769119769119769, |
|
"eval_runtime": 13.429, |
|
"eval_samples_per_second": 628.864, |
|
"eval_steps_per_second": 3.276, |
|
"step": 2040 |
|
}, |
|
{ |
|
"epoch": 1.75, |
|
"learning_rate": 1.64983164983165e-05, |
|
"loss": 0.585, |
|
"step": 2080 |
|
}, |
|
{ |
|
"epoch": 1.75, |
|
"eval_accuracy": 0.7277679100059207, |
|
"eval_f1_macro": 0.6856054160655031, |
|
"eval_f1_negative": 0.6840989399293286, |
|
"eval_f1_neutral": 0.7798319327731092, |
|
"eval_f1_positive": 0.5928853754940712, |
|
"eval_loss": 0.62270188331604, |
|
"eval_precision_negative": 0.7348178137651822, |
|
"eval_precision_neutral": 0.7406572769953051, |
|
"eval_precision_positive": 0.6555944055944056, |
|
"eval_recall_negative": 0.6399294843543412, |
|
"eval_recall_neutral": 0.8233820459290188, |
|
"eval_recall_positive": 0.5411255411255411, |
|
"eval_runtime": 13.4336, |
|
"eval_samples_per_second": 628.646, |
|
"eval_steps_per_second": 3.275, |
|
"step": 2080 |
|
}, |
|
{ |
|
"epoch": 1.78, |
|
"learning_rate": 1.6430976430976432e-05, |
|
"loss": 0.6092, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 1.78, |
|
"eval_accuracy": 0.7194789816459444, |
|
"eval_f1_macro": 0.691219851642046, |
|
"eval_f1_negative": 0.6904706700672385, |
|
"eval_f1_neutral": 0.7632427932146946, |
|
"eval_f1_positive": 0.6199460916442048, |
|
"eval_loss": 0.6305855512619019, |
|
"eval_precision_negative": 0.7284735812133072, |
|
"eval_precision_neutral": 0.7609462544096286, |
|
"eval_precision_positive": 0.5815423514538559, |
|
"eval_recall_negative": 0.6562362274129573, |
|
"eval_recall_neutral": 0.765553235908142, |
|
"eval_recall_positive": 0.6637806637806638, |
|
"eval_runtime": 13.4354, |
|
"eval_samples_per_second": 628.563, |
|
"eval_steps_per_second": 3.275, |
|
"step": 2120 |
|
}, |
|
{ |
|
"epoch": 1.82, |
|
"learning_rate": 1.6363636363636366e-05, |
|
"loss": 0.5902, |
|
"step": 2160 |
|
}, |
|
{ |
|
"epoch": 1.82, |
|
"eval_accuracy": 0.7217288336293665, |
|
"eval_f1_macro": 0.6903674148692266, |
|
"eval_f1_negative": 0.699802067297119, |
|
"eval_f1_neutral": 0.7650182196772514, |
|
"eval_f1_positive": 0.606281957633309, |
|
"eval_loss": 0.6268182992935181, |
|
"eval_precision_negative": 0.6984196663740123, |
|
"eval_precision_neutral": 0.7630321910695742, |
|
"eval_precision_positive": 0.613905325443787, |
|
"eval_recall_negative": 0.7011899515204936, |
|
"eval_recall_neutral": 0.7670146137787056, |
|
"eval_recall_positive": 0.5988455988455988, |
|
"eval_runtime": 13.453, |
|
"eval_samples_per_second": 627.739, |
|
"eval_steps_per_second": 3.271, |
|
"step": 2160 |
|
}, |
|
{ |
|
"epoch": 1.85, |
|
"learning_rate": 1.6296296296296297e-05, |
|
"loss": 0.6077, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 1.85, |
|
"eval_accuracy": 0.7239786856127887, |
|
"eval_f1_macro": 0.6863881436307776, |
|
"eval_f1_negative": 0.6860517946388005, |
|
"eval_f1_neutral": 0.7731126362535325, |
|
"eval_f1_positive": 0.5999999999999999, |
|
"eval_loss": 0.6207541227340698, |
|
"eval_precision_negative": 0.7079231129864041, |
|
"eval_precision_neutral": 0.7483391949980461, |
|
"eval_precision_positive": 0.6482412060301508, |
|
"eval_recall_negative": 0.6654914059056853, |
|
"eval_recall_neutral": 0.7995824634655533, |
|
"eval_recall_positive": 0.5584415584415584, |
|
"eval_runtime": 13.4434, |
|
"eval_samples_per_second": 628.189, |
|
"eval_steps_per_second": 3.273, |
|
"step": 2200 |
|
}, |
|
{ |
|
"epoch": 1.89, |
|
"learning_rate": 1.622895622895623e-05, |
|
"loss": 0.5971, |
|
"step": 2240 |
|
}, |
|
{ |
|
"epoch": 1.89, |
|
"eval_accuracy": 0.7297809354647721, |
|
"eval_f1_macro": 0.6928803015060957, |
|
"eval_f1_negative": 0.6937485894831867, |
|
"eval_f1_neutral": 0.7777216213484281, |
|
"eval_f1_positive": 0.6071706936866719, |
|
"eval_loss": 0.6181867122650146, |
|
"eval_precision_negative": 0.7109158186864015, |
|
"eval_precision_neutral": 0.7538702723887909, |
|
"eval_precision_positive": 0.6601694915254237, |
|
"eval_recall_negative": 0.6773909211106214, |
|
"eval_recall_neutral": 0.8031315240083508, |
|
"eval_recall_positive": 0.562049062049062, |
|
"eval_runtime": 13.5165, |
|
"eval_samples_per_second": 624.792, |
|
"eval_steps_per_second": 3.255, |
|
"step": 2240 |
|
}, |
|
{ |
|
"epoch": 1.92, |
|
"learning_rate": 1.616161616161616e-05, |
|
"loss": 0.6053, |
|
"step": 2280 |
|
}, |
|
{ |
|
"epoch": 1.92, |
|
"eval_accuracy": 0.7235050325636472, |
|
"eval_f1_macro": 0.6869805131510361, |
|
"eval_f1_negative": 0.6891179839633448, |
|
"eval_f1_neutral": 0.7715961966417155, |
|
"eval_f1_positive": 0.6002273588480483, |
|
"eval_loss": 0.6221389174461365, |
|
"eval_precision_negative": 0.7175572519083969, |
|
"eval_precision_neutral": 0.7484301412872841, |
|
"eval_precision_positive": 0.6320830007980845, |
|
"eval_recall_negative": 0.6628470691934774, |
|
"eval_recall_neutral": 0.7962421711899791, |
|
"eval_recall_positive": 0.5714285714285714, |
|
"eval_runtime": 13.4474, |
|
"eval_samples_per_second": 628.005, |
|
"eval_steps_per_second": 3.272, |
|
"step": 2280 |
|
}, |
|
{ |
|
"epoch": 1.95, |
|
"learning_rate": 1.6094276094276096e-05, |
|
"loss": 0.5959, |
|
"step": 2320 |
|
}, |
|
{ |
|
"epoch": 1.95, |
|
"eval_accuracy": 0.7199526346950859, |
|
"eval_f1_macro": 0.682651116707718, |
|
"eval_f1_negative": 0.6665057915057916, |
|
"eval_f1_neutral": 0.7722100219604712, |
|
"eval_f1_positive": 0.6092375366568915, |
|
"eval_loss": 0.6313912272453308, |
|
"eval_precision_negative": 0.7365333333333334, |
|
"eval_precision_neutral": 0.7398622800306044, |
|
"eval_precision_positive": 0.6192250372578242, |
|
"eval_recall_negative": 0.6086381665932129, |
|
"eval_recall_neutral": 0.8075156576200417, |
|
"eval_recall_positive": 0.5995670995670995, |
|
"eval_runtime": 13.532, |
|
"eval_samples_per_second": 624.078, |
|
"eval_steps_per_second": 3.252, |
|
"step": 2320 |
|
}, |
|
{ |
|
"epoch": 1.99, |
|
"learning_rate": 1.602693602693603e-05, |
|
"loss": 0.6196, |
|
"step": 2360 |
|
}, |
|
{ |
|
"epoch": 1.99, |
|
"eval_accuracy": 0.709295441089402, |
|
"eval_f1_macro": 0.6881296895840747, |
|
"eval_f1_negative": 0.700795870079587, |
|
"eval_f1_neutral": 0.7440385036097135, |
|
"eval_f1_positive": 0.6195546950629235, |
|
"eval_loss": 0.6360026001930237, |
|
"eval_precision_negative": 0.684453781512605, |
|
"eval_precision_neutral": 0.7814797794117647, |
|
"eval_precision_positive": 0.5604203152364273, |
|
"eval_recall_negative": 0.7179374173644777, |
|
"eval_recall_neutral": 0.7100208768267223, |
|
"eval_recall_positive": 0.6926406926406926, |
|
"eval_runtime": 13.7523, |
|
"eval_samples_per_second": 614.079, |
|
"eval_steps_per_second": 3.199, |
|
"step": 2360 |
|
}, |
|
{ |
|
"epoch": 2.02, |
|
"learning_rate": 1.595959595959596e-05, |
|
"loss": 0.5686, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 2.02, |
|
"eval_accuracy": 0.7191237418590882, |
|
"eval_f1_macro": 0.6870370031512542, |
|
"eval_f1_negative": 0.6933101650738488, |
|
"eval_f1_neutral": 0.7630622208372286, |
|
"eval_f1_positive": 0.6047386235426853, |
|
"eval_loss": 0.6405708193778992, |
|
"eval_precision_negative": 0.6835117773019272, |
|
"eval_precision_neutral": 0.7593549720901385, |
|
"eval_precision_positive": 0.631578947368421, |
|
"eval_recall_negative": 0.7033935654473337, |
|
"eval_recall_neutral": 0.7668058455114822, |
|
"eval_recall_positive": 0.5800865800865801, |
|
"eval_runtime": 13.5092, |
|
"eval_samples_per_second": 625.128, |
|
"eval_steps_per_second": 3.257, |
|
"step": 2400 |
|
}, |
|
{ |
|
"epoch": 2.05, |
|
"learning_rate": 1.5892255892255895e-05, |
|
"loss": 0.5586, |
|
"step": 2440 |
|
}, |
|
{ |
|
"epoch": 2.05, |
|
"eval_accuracy": 0.7223208999407934, |
|
"eval_f1_macro": 0.6862310990226811, |
|
"eval_f1_negative": 0.6942959001782532, |
|
"eval_f1_neutral": 0.7689950980392158, |
|
"eval_f1_positive": 0.5954022988505746, |
|
"eval_loss": 0.6309220790863037, |
|
"eval_precision_negative": 0.7021180712032447, |
|
"eval_precision_neutral": 0.7526989204318273, |
|
"eval_precision_positive": 0.6348039215686274, |
|
"eval_recall_negative": 0.6866460996033495, |
|
"eval_recall_neutral": 0.7860125260960334, |
|
"eval_recall_positive": 0.5606060606060606, |
|
"eval_runtime": 13.5411, |
|
"eval_samples_per_second": 623.656, |
|
"eval_steps_per_second": 3.249, |
|
"step": 2440 |
|
}, |
|
{ |
|
"epoch": 2.09, |
|
"learning_rate": 1.5824915824915825e-05, |
|
"loss": 0.5671, |
|
"step": 2480 |
|
}, |
|
{ |
|
"epoch": 2.09, |
|
"eval_accuracy": 0.7205447010065127, |
|
"eval_f1_macro": 0.683056392123643, |
|
"eval_f1_negative": 0.6914449087310313, |
|
"eval_f1_neutral": 0.7678189048638727, |
|
"eval_f1_positive": 0.5899053627760252, |
|
"eval_loss": 0.6297855377197266, |
|
"eval_precision_negative": 0.6900790166812993, |
|
"eval_precision_neutral": 0.7504484751843731, |
|
"eval_precision_positive": 0.6504347826086957, |
|
"eval_recall_negative": 0.6928162185985015, |
|
"eval_recall_neutral": 0.7860125260960334, |
|
"eval_recall_positive": 0.5396825396825397, |
|
"eval_runtime": 13.5165, |
|
"eval_samples_per_second": 624.793, |
|
"eval_steps_per_second": 3.255, |
|
"step": 2480 |
|
}, |
|
{ |
|
"epoch": 2.12, |
|
"learning_rate": 1.575757575757576e-05, |
|
"loss": 0.5458, |
|
"step": 2520 |
|
}, |
|
{ |
|
"epoch": 2.12, |
|
"eval_accuracy": 0.7214920071047958, |
|
"eval_f1_macro": 0.6872366815721698, |
|
"eval_f1_negative": 0.6905083220872694, |
|
"eval_f1_neutral": 0.7679083094555873, |
|
"eval_f1_positive": 0.6032934131736527, |
|
"eval_loss": 0.63502436876297, |
|
"eval_precision_negative": 0.7050987597611392, |
|
"eval_precision_neutral": 0.7531112003211562, |
|
"eval_precision_positive": 0.6267496111975117, |
|
"eval_recall_negative": 0.6765094755398854, |
|
"eval_recall_neutral": 0.7832985386221294, |
|
"eval_recall_positive": 0.5815295815295816, |
|
"eval_runtime": 13.5006, |
|
"eval_samples_per_second": 625.526, |
|
"eval_steps_per_second": 3.259, |
|
"step": 2520 |
|
}, |
|
{ |
|
"epoch": 2.15, |
|
"learning_rate": 1.569023569023569e-05, |
|
"loss": 0.5617, |
|
"step": 2560 |
|
}, |
|
{ |
|
"epoch": 2.15, |
|
"eval_accuracy": 0.7103611604499704, |
|
"eval_f1_macro": 0.6868863746975769, |
|
"eval_f1_negative": 0.7016379846568526, |
|
"eval_f1_neutral": 0.7452902101709682, |
|
"eval_f1_positive": 0.6137309292649098, |
|
"eval_loss": 0.6412296891212463, |
|
"eval_precision_negative": 0.6624902114330462, |
|
"eval_precision_neutral": 0.7789665376735716, |
|
"eval_precision_positive": 0.5907877169559412, |
|
"eval_recall_negative": 0.745702952842662, |
|
"eval_recall_neutral": 0.7144050104384133, |
|
"eval_recall_positive": 0.6385281385281385, |
|
"eval_runtime": 13.561, |
|
"eval_samples_per_second": 622.74, |
|
"eval_steps_per_second": 3.245, |
|
"step": 2560 |
|
}, |
|
{ |
|
"epoch": 2.19, |
|
"learning_rate": 1.5622895622895624e-05, |
|
"loss": 0.5582, |
|
"step": 2600 |
|
}, |
|
{ |
|
"epoch": 2.19, |
|
"eval_accuracy": 0.7085849615156897, |
|
"eval_f1_macro": 0.687474213023077, |
|
"eval_f1_negative": 0.699581589958159, |
|
"eval_f1_neutral": 0.7421052631578948, |
|
"eval_f1_positive": 0.6207357859531774, |
|
"eval_loss": 0.6525644659996033, |
|
"eval_precision_negative": 0.6658701712465154, |
|
"eval_precision_neutral": 0.7815242494226328, |
|
"eval_precision_positive": 0.5785536159600998, |
|
"eval_recall_negative": 0.7368884971353019, |
|
"eval_recall_neutral": 0.7064718162839249, |
|
"eval_recall_positive": 0.6695526695526696, |
|
"eval_runtime": 13.5361, |
|
"eval_samples_per_second": 623.888, |
|
"eval_steps_per_second": 3.251, |
|
"step": 2600 |
|
}, |
|
{ |
|
"epoch": 2.22, |
|
"learning_rate": 1.555555555555556e-05, |
|
"loss": 0.5543, |
|
"step": 2640 |
|
}, |
|
{ |
|
"epoch": 2.22, |
|
"eval_accuracy": 0.7201894612196567, |
|
"eval_f1_macro": 0.6869432555451471, |
|
"eval_f1_negative": 0.7009306260575296, |
|
"eval_f1_neutral": 0.762918885061071, |
|
"eval_f1_positive": 0.5969802555168409, |
|
"eval_loss": 0.640322744846344, |
|
"eval_precision_negative": 0.6738511590077267, |
|
"eval_precision_neutral": 0.7629985383169764, |
|
"eval_precision_positive": 0.6441102756892231, |
|
"eval_recall_negative": 0.7302776553547818, |
|
"eval_recall_neutral": 0.762839248434238, |
|
"eval_recall_positive": 0.5562770562770563, |
|
"eval_runtime": 13.5133, |
|
"eval_samples_per_second": 624.941, |
|
"eval_steps_per_second": 3.256, |
|
"step": 2640 |
|
}, |
|
{ |
|
"epoch": 2.26, |
|
"learning_rate": 1.548821548821549e-05, |
|
"loss": 0.558, |
|
"step": 2680 |
|
}, |
|
{ |
|
"epoch": 2.26, |
|
"eval_accuracy": 0.7206631142687981, |
|
"eval_f1_macro": 0.6874230644596926, |
|
"eval_f1_negative": 0.697239536954586, |
|
"eval_f1_neutral": 0.7653250773993808, |
|
"eval_f1_positive": 0.5997045790251108, |
|
"eval_loss": 0.6337417364120483, |
|
"eval_precision_negative": 0.7044534412955465, |
|
"eval_precision_neutral": 0.756734693877551, |
|
"eval_precision_positive": 0.6142208774583964, |
|
"eval_recall_negative": 0.6901718818862935, |
|
"eval_recall_neutral": 0.7741127348643007, |
|
"eval_recall_positive": 0.5858585858585859, |
|
"eval_runtime": 13.5113, |
|
"eval_samples_per_second": 625.032, |
|
"eval_steps_per_second": 3.257, |
|
"step": 2680 |
|
}, |
|
{ |
|
"epoch": 2.29, |
|
"learning_rate": 1.5420875420875423e-05, |
|
"loss": 0.5506, |
|
"step": 2720 |
|
}, |
|
{ |
|
"epoch": 2.29, |
|
"eval_accuracy": 0.7171107164002368, |
|
"eval_f1_macro": 0.6895025450757618, |
|
"eval_f1_negative": 0.7093775262732418, |
|
"eval_f1_neutral": 0.753454231433506, |
|
"eval_f1_positive": 0.6056758775205378, |
|
"eval_loss": 0.6484044194221497, |
|
"eval_precision_negative": 0.6550951847704367, |
|
"eval_precision_neutral": 0.7800625838176128, |
|
"eval_precision_positive": 0.6277089783281734, |
|
"eval_recall_negative": 0.7734684883208461, |
|
"eval_recall_neutral": 0.7286012526096033, |
|
"eval_recall_positive": 0.5851370851370852, |
|
"eval_runtime": 13.5135, |
|
"eval_samples_per_second": 624.931, |
|
"eval_steps_per_second": 3.256, |
|
"step": 2720 |
|
}, |
|
{ |
|
"epoch": 2.32, |
|
"learning_rate": 1.5353535353535354e-05, |
|
"loss": 0.5569, |
|
"step": 2760 |
|
}, |
|
{ |
|
"epoch": 2.32, |
|
"eval_accuracy": 0.7167554766133807, |
|
"eval_f1_macro": 0.6895340612929335, |
|
"eval_f1_negative": 0.7063525452250736, |
|
"eval_f1_neutral": 0.7544910179640718, |
|
"eval_f1_positive": 0.6077586206896551, |
|
"eval_loss": 0.6315791606903076, |
|
"eval_precision_negative": 0.6756539235412475, |
|
"eval_precision_neutral": 0.7733450241122315, |
|
"eval_precision_positive": 0.6051502145922747, |
|
"eval_recall_negative": 0.7399735566328779, |
|
"eval_recall_neutral": 0.7365344467640919, |
|
"eval_recall_positive": 0.6103896103896104, |
|
"eval_runtime": 13.5058, |
|
"eval_samples_per_second": 625.287, |
|
"eval_steps_per_second": 3.258, |
|
"step": 2760 |
|
}, |
|
{ |
|
"epoch": 2.36, |
|
"learning_rate": 1.5286195286195288e-05, |
|
"loss": 0.5469, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 2.36, |
|
"eval_accuracy": 0.7182948490230906, |
|
"eval_f1_macro": 0.69129222470535, |
|
"eval_f1_negative": 0.7031543764361813, |
|
"eval_f1_neutral": 0.7562953478446436, |
|
"eval_f1_positive": 0.6144269498352252, |
|
"eval_loss": 0.6461361646652222, |
|
"eval_precision_negative": 0.6683876092136616, |
|
"eval_precision_neutral": 0.7734613705805325, |
|
"eval_precision_positive": 0.6237918215613383, |
|
"eval_recall_negative": 0.7417364477743499, |
|
"eval_recall_neutral": 0.7398747390396659, |
|
"eval_recall_positive": 0.6053391053391053, |
|
"eval_runtime": 13.5002, |
|
"eval_samples_per_second": 625.546, |
|
"eval_steps_per_second": 3.259, |
|
"step": 2800 |
|
}, |
|
{ |
|
"epoch": 2.39, |
|
"learning_rate": 1.521885521885522e-05, |
|
"loss": 0.5497, |
|
"step": 2840 |
|
}, |
|
{ |
|
"epoch": 2.39, |
|
"eval_accuracy": 0.7205447010065127, |
|
"eval_f1_macro": 0.6901740903513232, |
|
"eval_f1_negative": 0.6989695242271432, |
|
"eval_f1_neutral": 0.7628887497390942, |
|
"eval_f1_positive": 0.608663997087732, |
|
"eval_loss": 0.6306228041648865, |
|
"eval_precision_negative": 0.6954624781849913, |
|
"eval_precision_neutral": 0.7627295492487479, |
|
"eval_precision_positive": 0.6142542248346804, |
|
"eval_recall_negative": 0.7025121198765977, |
|
"eval_recall_neutral": 0.7630480167014614, |
|
"eval_recall_positive": 0.6031746031746031, |
|
"eval_runtime": 13.5161, |
|
"eval_samples_per_second": 624.81, |
|
"eval_steps_per_second": 3.255, |
|
"step": 2840 |
|
}, |
|
{ |
|
"epoch": 2.42, |
|
"learning_rate": 1.5151515151515153e-05, |
|
"loss": 0.5577, |
|
"step": 2880 |
|
}, |
|
{ |
|
"epoch": 2.42, |
|
"eval_accuracy": 0.7149792776791001, |
|
"eval_f1_macro": 0.686526091020862, |
|
"eval_f1_negative": 0.6968478950708694, |
|
"eval_f1_neutral": 0.7555225148683093, |
|
"eval_f1_positive": 0.6072078631234074, |
|
"eval_loss": 0.6409549713134766, |
|
"eval_precision_negative": 0.6700569568755086, |
|
"eval_precision_neutral": 0.7689148292261133, |
|
"eval_precision_positive": 0.6127847171197649, |
|
"eval_recall_negative": 0.7258704275011018, |
|
"eval_recall_neutral": 0.7425887265135699, |
|
"eval_recall_positive": 0.6017316017316018, |
|
"eval_runtime": 13.6855, |
|
"eval_samples_per_second": 617.076, |
|
"eval_steps_per_second": 3.215, |
|
"step": 2880 |
|
}, |
|
{ |
|
"epoch": 2.46, |
|
"learning_rate": 1.5084175084175085e-05, |
|
"loss": 0.557, |
|
"step": 2920 |
|
}, |
|
{ |
|
"epoch": 2.46, |
|
"eval_accuracy": 0.7225577264653641, |
|
"eval_f1_macro": 0.6876490677339296, |
|
"eval_f1_negative": 0.7071207430340557, |
|
"eval_f1_neutral": 0.7645151166440004, |
|
"eval_f1_positive": 0.5913113435237329, |
|
"eval_loss": 0.6443095803260803, |
|
"eval_precision_negative": 0.6649844720496895, |
|
"eval_precision_neutral": 0.7661983644369889, |
|
"eval_precision_positive": 0.6681818181818182, |
|
"eval_recall_negative": 0.75495813133539, |
|
"eval_recall_neutral": 0.762839248434238, |
|
"eval_recall_positive": 0.5303030303030303, |
|
"eval_runtime": 13.5647, |
|
"eval_samples_per_second": 622.57, |
|
"eval_steps_per_second": 3.244, |
|
"step": 2920 |
|
}, |
|
{ |
|
"epoch": 2.49, |
|
"learning_rate": 1.5016835016835018e-05, |
|
"loss": 0.5542, |
|
"step": 2960 |
|
}, |
|
{ |
|
"epoch": 2.49, |
|
"eval_accuracy": 0.7161634103019539, |
|
"eval_f1_macro": 0.687092758801656, |
|
"eval_f1_negative": 0.7009579341940858, |
|
"eval_f1_neutral": 0.7560144773259526, |
|
"eval_f1_positive": 0.6043058648849294, |
|
"eval_loss": 0.6480274796485901, |
|
"eval_precision_negative": 0.6644295302013423, |
|
"eval_precision_neutral": 0.7712858384013901, |
|
"eval_precision_positive": 0.6223241590214067, |
|
"eval_recall_negative": 0.7417364477743499, |
|
"eval_recall_neutral": 0.7413361169102296, |
|
"eval_recall_positive": 0.5873015873015873, |
|
"eval_runtime": 13.5134, |
|
"eval_samples_per_second": 624.935, |
|
"eval_steps_per_second": 3.256, |
|
"step": 2960 |
|
}, |
|
{ |
|
"epoch": 2.53, |
|
"learning_rate": 1.4949494949494952e-05, |
|
"loss": 0.567, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 2.53, |
|
"eval_accuracy": 0.7079928952042629, |
|
"eval_f1_macro": 0.6865435263558487, |
|
"eval_f1_negative": 0.7025898078529658, |
|
"eval_f1_neutral": 0.7416051965209732, |
|
"eval_f1_positive": 0.6154355746936071, |
|
"eval_loss": 0.6429863572120667, |
|
"eval_precision_negative": 0.6677252878126241, |
|
"eval_precision_neutral": 0.7845329606335896, |
|
"eval_precision_positive": 0.5688916105327618, |
|
"eval_recall_negative": 0.7412957249889819, |
|
"eval_recall_neutral": 0.7031315240083508, |
|
"eval_recall_positive": 0.6702741702741702, |
|
"eval_runtime": 13.5159, |
|
"eval_samples_per_second": 624.818, |
|
"eval_steps_per_second": 3.255, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 2.56, |
|
"learning_rate": 1.4882154882154884e-05, |
|
"loss": 0.5606, |
|
"step": 3040 |
|
}, |
|
{ |
|
"epoch": 2.56, |
|
"eval_accuracy": 0.7155713439905269, |
|
"eval_f1_macro": 0.6890929890491521, |
|
"eval_f1_negative": 0.7017241379310344, |
|
"eval_f1_neutral": 0.7549994652978291, |
|
"eval_f1_positive": 0.6105553639185926, |
|
"eval_loss": 0.6457778811454773, |
|
"eval_precision_negative": 0.6866301138760017, |
|
"eval_precision_neutral": 0.7739530804648104, |
|
"eval_precision_positive": 0.5849306014540647, |
|
"eval_recall_negative": 0.7174966945791097, |
|
"eval_recall_neutral": 0.7369519832985386, |
|
"eval_recall_positive": 0.6385281385281385, |
|
"eval_runtime": 13.5186, |
|
"eval_samples_per_second": 624.694, |
|
"eval_steps_per_second": 3.255, |
|
"step": 3040 |
|
}, |
|
{ |
|
"epoch": 2.59, |
|
"learning_rate": 1.4814814814814815e-05, |
|
"loss": 0.5492, |
|
"step": 3080 |
|
}, |
|
{ |
|
"epoch": 2.59, |
|
"eval_accuracy": 0.713676731793961, |
|
"eval_f1_macro": 0.687090376547261, |
|
"eval_f1_negative": 0.6999178981937603, |
|
"eval_f1_neutral": 0.7514812021975654, |
|
"eval_f1_positive": 0.6098720292504571, |
|
"eval_loss": 0.646338164806366, |
|
"eval_precision_negative": 0.6550134460238187, |
|
"eval_precision_neutral": 0.7763187180057868, |
|
"eval_precision_positive": 0.6182357301704967, |
|
"eval_recall_negative": 0.751432349052446, |
|
"eval_recall_neutral": 0.7281837160751565, |
|
"eval_recall_positive": 0.6017316017316018, |
|
"eval_runtime": 13.5425, |
|
"eval_samples_per_second": 623.591, |
|
"eval_steps_per_second": 3.249, |
|
"step": 3080 |
|
}, |
|
{ |
|
"epoch": 2.63, |
|
"learning_rate": 1.4747474747474747e-05, |
|
"loss": 0.5509, |
|
"step": 3120 |
|
}, |
|
{ |
|
"epoch": 2.63, |
|
"eval_accuracy": 0.7187685020722321, |
|
"eval_f1_macro": 0.6907132499480086, |
|
"eval_f1_negative": 0.7029375258585022, |
|
"eval_f1_neutral": 0.7576566001493972, |
|
"eval_f1_positive": 0.6115456238361267, |
|
"eval_loss": 0.6359885334968567, |
|
"eval_precision_negative": 0.6623781676413255, |
|
"eval_precision_neutral": 0.7749399694389871, |
|
"eval_precision_positive": 0.6320246343341032, |
|
"eval_recall_negative": 0.748788012340238, |
|
"eval_recall_neutral": 0.7411273486430062, |
|
"eval_recall_positive": 0.5923520923520924, |
|
"eval_runtime": 13.4528, |
|
"eval_samples_per_second": 627.753, |
|
"eval_steps_per_second": 3.271, |
|
"step": 3120 |
|
}, |
|
{ |
|
"epoch": 2.66, |
|
"learning_rate": 1.4680134680134681e-05, |
|
"loss": 0.5626, |
|
"step": 3160 |
|
}, |
|
{ |
|
"epoch": 2.66, |
|
"eval_accuracy": 0.7175843694493783, |
|
"eval_f1_macro": 0.6878133884212742, |
|
"eval_f1_negative": 0.7006661115736886, |
|
"eval_f1_neutral": 0.7580354301474488, |
|
"eval_f1_positive": 0.6047386235426853, |
|
"eval_loss": 0.6416473984718323, |
|
"eval_precision_negative": 0.663905325443787, |
|
"eval_precision_neutral": 0.770541298253181, |
|
"eval_precision_positive": 0.631578947368421, |
|
"eval_recall_negative": 0.7417364477743499, |
|
"eval_recall_neutral": 0.7459290187891441, |
|
"eval_recall_positive": 0.5800865800865801, |
|
"eval_runtime": 13.5444, |
|
"eval_samples_per_second": 623.505, |
|
"eval_steps_per_second": 3.249, |
|
"step": 3160 |
|
}, |
|
{ |
|
"epoch": 2.69, |
|
"learning_rate": 1.4612794612794614e-05, |
|
"loss": 0.5589, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 2.69, |
|
"eval_accuracy": 0.7187685020722321, |
|
"eval_f1_macro": 0.6920386854465886, |
|
"eval_f1_negative": 0.706980691703798, |
|
"eval_f1_neutral": 0.7570633561643835, |
|
"eval_f1_positive": 0.6120720084715848, |
|
"eval_loss": 0.6367910504341125, |
|
"eval_precision_negative": 0.6816693944353519, |
|
"eval_precision_neutral": 0.7766798418972332, |
|
"eval_precision_positive": 0.5991706979958535, |
|
"eval_recall_negative": 0.7342441604230939, |
|
"eval_recall_neutral": 0.7384133611691023, |
|
"eval_recall_positive": 0.6255411255411255, |
|
"eval_runtime": 13.5341, |
|
"eval_samples_per_second": 623.979, |
|
"eval_steps_per_second": 3.251, |
|
"step": 3200 |
|
}, |
|
{ |
|
"epoch": 2.73, |
|
"learning_rate": 1.4545454545454546e-05, |
|
"loss": 0.5499, |
|
"step": 3240 |
|
}, |
|
{ |
|
"epoch": 2.73, |
|
"eval_accuracy": 0.7135583185316755, |
|
"eval_f1_macro": 0.6872354106917024, |
|
"eval_f1_negative": 0.7027480595762535, |
|
"eval_f1_neutral": 0.7509126046811251, |
|
"eval_f1_positive": 0.6080455678177287, |
|
"eval_loss": 0.6405165791511536, |
|
"eval_precision_negative": 0.6705364291433147, |
|
"eval_precision_neutral": 0.7729885057471264, |
|
"eval_precision_positive": 0.6001405481377372, |
|
"eval_recall_negative": 0.7382106654914059, |
|
"eval_recall_neutral": 0.7300626304801671, |
|
"eval_recall_positive": 0.6161616161616161, |
|
"eval_runtime": 13.5535, |
|
"eval_samples_per_second": 623.087, |
|
"eval_steps_per_second": 3.246, |
|
"step": 3240 |
|
}, |
|
{ |
|
"epoch": 2.76, |
|
"learning_rate": 1.447811447811448e-05, |
|
"loss": 0.5431, |
|
"step": 3280 |
|
}, |
|
{ |
|
"epoch": 2.76, |
|
"eval_accuracy": 0.7207815275310835, |
|
"eval_f1_macro": 0.6892335124121108, |
|
"eval_f1_negative": 0.7012817727568977, |
|
"eval_f1_neutral": 0.7629961454318157, |
|
"eval_f1_positive": 0.6034226190476191, |
|
"eval_loss": 0.6356926560401917, |
|
"eval_precision_negative": 0.6915167095115681, |
|
"eval_precision_neutral": 0.7614888750259929, |
|
"eval_precision_positive": 0.6228878648233487, |
|
"eval_recall_negative": 0.7113265755839577, |
|
"eval_recall_neutral": 0.764509394572025, |
|
"eval_recall_positive": 0.5851370851370852, |
|
"eval_runtime": 13.6103, |
|
"eval_samples_per_second": 620.484, |
|
"eval_steps_per_second": 3.233, |
|
"step": 3280 |
|
}, |
|
{ |
|
"epoch": 2.79, |
|
"learning_rate": 1.4410774410774413e-05, |
|
"loss": 0.5388, |
|
"step": 3320 |
|
}, |
|
{ |
|
"epoch": 2.79, |
|
"eval_accuracy": 0.7103611604499704, |
|
"eval_f1_macro": 0.6887331835620346, |
|
"eval_f1_negative": 0.7057600332709503, |
|
"eval_f1_neutral": 0.7435107787065551, |
|
"eval_f1_positive": 0.6169287387085982, |
|
"eval_loss": 0.6553226113319397, |
|
"eval_precision_negative": 0.6681102362204724, |
|
"eval_precision_neutral": 0.7856810785681079, |
|
"eval_precision_positive": 0.5751715533374921, |
|
"eval_recall_negative": 0.747906566769502, |
|
"eval_recall_neutral": 0.7056367432150313, |
|
"eval_recall_positive": 0.6652236652236653, |
|
"eval_runtime": 13.4151, |
|
"eval_samples_per_second": 629.514, |
|
"eval_steps_per_second": 3.28, |
|
"step": 3320 |
|
}, |
|
{ |
|
"epoch": 2.83, |
|
"learning_rate": 1.4343434343434344e-05, |
|
"loss": 0.5613, |
|
"step": 3360 |
|
}, |
|
{ |
|
"epoch": 2.83, |
|
"eval_accuracy": 0.7232682060390764, |
|
"eval_f1_macro": 0.6875059651526924, |
|
"eval_f1_negative": 0.7051926298157454, |
|
"eval_f1_neutral": 0.7659927423535511, |
|
"eval_f1_positive": 0.5913325232887808, |
|
"eval_loss": 0.6239017844200134, |
|
"eval_precision_negative": 0.6717191862784204, |
|
"eval_precision_neutral": 0.76086508753862, |
|
"eval_precision_positive": 0.6740535549399815, |
|
"eval_recall_negative": 0.742177170559718, |
|
"eval_recall_neutral": 0.7711899791231733, |
|
"eval_recall_positive": 0.5266955266955267, |
|
"eval_runtime": 13.4098, |
|
"eval_samples_per_second": 629.763, |
|
"eval_steps_per_second": 3.281, |
|
"step": 3360 |
|
}, |
|
{ |
|
"epoch": 2.86, |
|
"learning_rate": 1.4276094276094276e-05, |
|
"loss": 0.556, |
|
"step": 3400 |
|
}, |
|
{ |
|
"epoch": 2.86, |
|
"eval_accuracy": 0.7217288336293665, |
|
"eval_f1_macro": 0.6902285547620584, |
|
"eval_f1_negative": 0.7011167068097219, |
|
"eval_f1_neutral": 0.7648837451777708, |
|
"eval_f1_positive": 0.6046852122986822, |
|
"eval_loss": 0.6339342594146729, |
|
"eval_precision_negative": 0.696692776327241, |
|
"eval_precision_neutral": 0.7640074984378254, |
|
"eval_precision_positive": 0.6136701337295691, |
|
"eval_recall_negative": 0.7055971793741737, |
|
"eval_recall_neutral": 0.7657620041753653, |
|
"eval_recall_positive": 0.5959595959595959, |
|
"eval_runtime": 13.436, |
|
"eval_samples_per_second": 628.537, |
|
"eval_steps_per_second": 3.275, |
|
"step": 3400 |
|
}, |
|
{ |
|
"epoch": 2.9, |
|
"learning_rate": 1.420875420875421e-05, |
|
"loss": 0.5536, |
|
"step": 3440 |
|
}, |
|
{ |
|
"epoch": 2.9, |
|
"eval_accuracy": 0.7108348134991119, |
|
"eval_f1_macro": 0.6898151957724491, |
|
"eval_f1_negative": 0.7129761662253005, |
|
"eval_f1_neutral": 0.7415480427046264, |
|
"eval_f1_positive": 0.6149213783874204, |
|
"eval_loss": 0.659329891204834, |
|
"eval_precision_negative": 0.6628787878787878, |
|
"eval_precision_neutral": 0.7934316991908615, |
|
"eval_precision_positive": 0.5733000623830318, |
|
"eval_recall_negative": 0.7712648743940062, |
|
"eval_recall_neutral": 0.6960334029227557, |
|
"eval_recall_positive": 0.663059163059163, |
|
"eval_runtime": 13.4431, |
|
"eval_samples_per_second": 628.201, |
|
"eval_steps_per_second": 3.273, |
|
"step": 3440 |
|
}, |
|
{ |
|
"epoch": 2.93, |
|
"learning_rate": 1.4141414141414143e-05, |
|
"loss": 0.5663, |
|
"step": 3480 |
|
}, |
|
{ |
|
"epoch": 2.93, |
|
"eval_accuracy": 0.7154529307282416, |
|
"eval_f1_macro": 0.6878232234805552, |
|
"eval_f1_negative": 0.6974677920924034, |
|
"eval_f1_neutral": 0.7573062261753494, |
|
"eval_f1_positive": 0.6086956521739131, |
|
"eval_loss": 0.6353215575218201, |
|
"eval_precision_negative": 0.703090013434841, |
|
"eval_precision_neutral": 0.7683712935109583, |
|
"eval_precision_positive": 0.5750962772785623, |
|
"eval_recall_negative": 0.6919347730277655, |
|
"eval_recall_neutral": 0.7465553235908142, |
|
"eval_recall_positive": 0.6464646464646465, |
|
"eval_runtime": 13.4095, |
|
"eval_samples_per_second": 629.78, |
|
"eval_steps_per_second": 3.281, |
|
"step": 3480 |
|
}, |
|
{ |
|
"epoch": 2.96, |
|
"learning_rate": 1.4074074074074075e-05, |
|
"loss": 0.5499, |
|
"step": 3520 |
|
}, |
|
{ |
|
"epoch": 2.96, |
|
"eval_accuracy": 0.7143872113676731, |
|
"eval_f1_macro": 0.6899472024314622, |
|
"eval_f1_negative": 0.7078491335372069, |
|
"eval_f1_neutral": 0.7488017429193901, |
|
"eval_f1_positive": 0.6131907308377897, |
|
"eval_loss": 0.6429401636123657, |
|
"eval_precision_negative": 0.6585735963581184, |
|
"eval_precision_neutral": 0.7829157175398633, |
|
"eval_precision_positive": 0.6060606060606061, |
|
"eval_recall_negative": 0.7650947553988541, |
|
"eval_recall_neutral": 0.7175365344467641, |
|
"eval_recall_positive": 0.6204906204906205, |
|
"eval_runtime": 13.4298, |
|
"eval_samples_per_second": 628.824, |
|
"eval_steps_per_second": 3.276, |
|
"step": 3520 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"learning_rate": 1.4006734006734009e-05, |
|
"loss": 0.5619, |
|
"step": 3560 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.7207815275310835, |
|
"eval_f1_macro": 0.6934678744913757, |
|
"eval_f1_negative": 0.7042136003337507, |
|
"eval_f1_neutral": 0.759215853398679, |
|
"eval_f1_positive": 0.6169741697416974, |
|
"eval_loss": 0.6337869167327881, |
|
"eval_precision_negative": 0.6685148514851486, |
|
"eval_precision_neutral": 0.7752393385552655, |
|
"eval_precision_positive": 0.6314199395770392, |
|
"eval_recall_negative": 0.74394006170119, |
|
"eval_recall_neutral": 0.7438413361169103, |
|
"eval_recall_positive": 0.6031746031746031, |
|
"eval_runtime": 13.4185, |
|
"eval_samples_per_second": 629.354, |
|
"eval_steps_per_second": 3.279, |
|
"step": 3560 |
|
} |
|
], |
|
"max_steps": 11880, |
|
"num_train_epochs": 10, |
|
"total_flos": 1.849503866686182e+16, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|