lombardata's picture
🍻 cheers
0722a99
{
"best_metric": 0.08124219626188278,
"best_model_checkpoint": "/home1/datawork/mcontini/models/multilabel/huggingface/dinov2-large-2024_01_05-kornia_img-size518_batch-size32_epochs70_freeze/checkpoint-28496",
"epoch": 114.0,
"eval_steps": 500,
"global_step": 31236,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.44556873691556176,
"eval_f1_macro": 0.5755948244574681,
"eval_f1_micro": 0.7376394107473012,
"eval_loss": 0.13577787578105927,
"eval_roc_auc": 0.8276012534175776,
"eval_runtime": 686.0469,
"eval_samples_per_second": 4.178,
"eval_steps_per_second": 0.131,
"learning_rate": 0.01,
"step": 274
},
{
"epoch": 1.82,
"learning_rate": 0.01,
"loss": 0.1895,
"step": 500
},
{
"epoch": 2.0,
"eval_accuracy": 0.4357990230286113,
"eval_f1_macro": 0.6131029690652663,
"eval_f1_micro": 0.7463369963369964,
"eval_loss": 0.14224015176296234,
"eval_roc_auc": 0.8432701847378548,
"eval_runtime": 679.513,
"eval_samples_per_second": 4.218,
"eval_steps_per_second": 0.132,
"learning_rate": 0.01,
"step": 548
},
{
"epoch": 3.0,
"eval_accuracy": 0.38415910676901605,
"eval_f1_macro": 0.5242425898328716,
"eval_f1_micro": 0.7273147345925026,
"eval_loss": 0.21337130665779114,
"eval_roc_auc": 0.8305454415797603,
"eval_runtime": 681.6164,
"eval_samples_per_second": 4.205,
"eval_steps_per_second": 0.132,
"learning_rate": 0.01,
"step": 822
},
{
"epoch": 3.65,
"learning_rate": 0.01,
"loss": 0.1668,
"step": 1000
},
{
"epoch": 4.0,
"eval_accuracy": 0.4438241451500349,
"eval_f1_macro": 0.5474301561230492,
"eval_f1_micro": 0.7034210860994532,
"eval_loss": 0.14501234889030457,
"eval_roc_auc": 0.7947377699358407,
"eval_runtime": 676.7895,
"eval_samples_per_second": 4.235,
"eval_steps_per_second": 0.133,
"learning_rate": 0.01,
"step": 1096
},
{
"epoch": 5.0,
"eval_accuracy": 0.4438241451500349,
"eval_f1_macro": 0.6194844495540315,
"eval_f1_micro": 0.7611423380457615,
"eval_loss": 0.13293854892253876,
"eval_roc_auc": 0.8535844928345971,
"eval_runtime": 676.1205,
"eval_samples_per_second": 4.239,
"eval_steps_per_second": 0.133,
"learning_rate": 0.01,
"step": 1370
},
{
"epoch": 5.47,
"learning_rate": 0.01,
"loss": 0.1666,
"step": 1500
},
{
"epoch": 6.0,
"eval_accuracy": 0.44452198185624564,
"eval_f1_macro": 0.5624987041776927,
"eval_f1_micro": 0.752847713067352,
"eval_loss": 0.13243332505226135,
"eval_roc_auc": 0.8411441150969292,
"eval_runtime": 676.3907,
"eval_samples_per_second": 4.237,
"eval_steps_per_second": 0.133,
"learning_rate": 0.01,
"step": 1644
},
{
"epoch": 7.0,
"eval_accuracy": 0.43126308443824146,
"eval_f1_macro": 0.5689553622505643,
"eval_f1_micro": 0.7496488764044945,
"eval_loss": 0.13447266817092896,
"eval_roc_auc": 0.838952950800037,
"eval_runtime": 675.7851,
"eval_samples_per_second": 4.241,
"eval_steps_per_second": 0.133,
"learning_rate": 0.01,
"step": 1918
},
{
"epoch": 7.3,
"learning_rate": 0.01,
"loss": 0.1664,
"step": 2000
},
{
"epoch": 8.0,
"eval_accuracy": 0.4323098394975576,
"eval_f1_macro": 0.5627920395195278,
"eval_f1_micro": 0.7502482911725186,
"eval_loss": 0.13808754086494446,
"eval_roc_auc": 0.8397325865953646,
"eval_runtime": 681.8119,
"eval_samples_per_second": 4.204,
"eval_steps_per_second": 0.132,
"learning_rate": 0.01,
"step": 2192
},
{
"epoch": 9.0,
"eval_accuracy": 0.44033496161898117,
"eval_f1_macro": 0.5492251158735639,
"eval_f1_micro": 0.7395667604944316,
"eval_loss": 0.13694943487644196,
"eval_roc_auc": 0.8219722316265465,
"eval_runtime": 674.9771,
"eval_samples_per_second": 4.246,
"eval_steps_per_second": 0.133,
"learning_rate": 0.01,
"step": 2466
},
{
"epoch": 9.12,
"learning_rate": 0.01,
"loss": 0.1656,
"step": 2500
},
{
"epoch": 10.0,
"eval_accuracy": 0.4424284717376134,
"eval_f1_macro": 0.528180519175626,
"eval_f1_micro": 0.7326552851434799,
"eval_loss": 0.13609227538108826,
"eval_roc_auc": 0.821178691278072,
"eval_runtime": 674.2621,
"eval_samples_per_second": 4.251,
"eval_steps_per_second": 0.133,
"learning_rate": 0.01,
"step": 2740
},
{
"epoch": 10.95,
"learning_rate": 0.01,
"loss": 0.166,
"step": 3000
},
{
"epoch": 11.0,
"eval_accuracy": 0.4277739009071877,
"eval_f1_macro": 0.5428317486981787,
"eval_f1_micro": 0.7434225844004656,
"eval_loss": 0.1380929797887802,
"eval_roc_auc": 0.8371006883503846,
"eval_runtime": 676.158,
"eval_samples_per_second": 4.239,
"eval_steps_per_second": 0.133,
"learning_rate": 0.01,
"step": 3014
},
{
"epoch": 12.0,
"eval_accuracy": 0.444870900209351,
"eval_f1_macro": 0.5618568055480317,
"eval_f1_micro": 0.7354685646500594,
"eval_loss": 0.1344844251871109,
"eval_roc_auc": 0.827911942291835,
"eval_runtime": 683.7162,
"eval_samples_per_second": 4.192,
"eval_steps_per_second": 0.132,
"learning_rate": 0.01,
"step": 3288
},
{
"epoch": 12.77,
"learning_rate": 0.001,
"loss": 0.1585,
"step": 3500
},
{
"epoch": 13.0,
"eval_accuracy": 0.49023028611304953,
"eval_f1_macro": 0.650060261894195,
"eval_f1_micro": 0.8009333029820168,
"eval_loss": 0.11546628922224045,
"eval_roc_auc": 0.8745955707824836,
"eval_runtime": 679.0864,
"eval_samples_per_second": 4.22,
"eval_steps_per_second": 0.133,
"learning_rate": 0.001,
"step": 3562
},
{
"epoch": 14.0,
"eval_accuracy": 0.5041870202372645,
"eval_f1_macro": 0.6697333276095331,
"eval_f1_micro": 0.8079378774805867,
"eval_loss": 0.11155486851930618,
"eval_roc_auc": 0.8750976636196655,
"eval_runtime": 676.6891,
"eval_samples_per_second": 4.235,
"eval_steps_per_second": 0.133,
"learning_rate": 0.001,
"step": 3836
},
{
"epoch": 14.6,
"learning_rate": 0.001,
"loss": 0.133,
"step": 4000
},
{
"epoch": 15.0,
"eval_accuracy": 0.5181437543614794,
"eval_f1_macro": 0.6736053030113935,
"eval_f1_micro": 0.814943326393708,
"eval_loss": 0.10734836012125015,
"eval_roc_auc": 0.877205285207194,
"eval_runtime": 677.4924,
"eval_samples_per_second": 4.23,
"eval_steps_per_second": 0.133,
"learning_rate": 0.001,
"step": 4110
},
{
"epoch": 16.0,
"eval_accuracy": 0.5083740404745289,
"eval_f1_macro": 0.7055616874566738,
"eval_f1_micro": 0.8238276299112801,
"eval_loss": 0.10476414114236832,
"eval_roc_auc": 0.8975418625131631,
"eval_runtime": 687.0217,
"eval_samples_per_second": 4.172,
"eval_steps_per_second": 0.131,
"learning_rate": 0.001,
"step": 4384
},
{
"epoch": 16.42,
"learning_rate": 0.001,
"loss": 0.1289,
"step": 4500
},
{
"epoch": 17.0,
"eval_accuracy": 0.5244242847173761,
"eval_f1_macro": 0.6896485755961196,
"eval_f1_micro": 0.820858825547487,
"eval_loss": 0.10253454744815826,
"eval_roc_auc": 0.8839468587595108,
"eval_runtime": 684.6037,
"eval_samples_per_second": 4.186,
"eval_steps_per_second": 0.131,
"learning_rate": 0.001,
"step": 4658
},
{
"epoch": 18.0,
"eval_accuracy": 0.5321004884856944,
"eval_f1_macro": 0.7045003592264228,
"eval_f1_micro": 0.8289563051845145,
"eval_loss": 0.10259302705526352,
"eval_roc_auc": 0.8916264271206406,
"eval_runtime": 685.7262,
"eval_samples_per_second": 4.18,
"eval_steps_per_second": 0.131,
"learning_rate": 0.001,
"step": 4932
},
{
"epoch": 18.25,
"learning_rate": 0.001,
"loss": 0.1227,
"step": 5000
},
{
"epoch": 19.0,
"eval_accuracy": 0.5279134682484299,
"eval_f1_macro": 0.6905367219275804,
"eval_f1_micro": 0.8306010928961749,
"eval_loss": 0.10123815387487411,
"eval_roc_auc": 0.8940566516497492,
"eval_runtime": 685.5377,
"eval_samples_per_second": 4.181,
"eval_steps_per_second": 0.131,
"learning_rate": 0.001,
"step": 5206
},
{
"epoch": 20.0,
"eval_accuracy": 0.5216329378925332,
"eval_f1_macro": 0.6830881274898382,
"eval_f1_micro": 0.8280441143371596,
"eval_loss": 0.09970748424530029,
"eval_roc_auc": 0.8930346669934526,
"eval_runtime": 686.9199,
"eval_samples_per_second": 4.172,
"eval_steps_per_second": 0.131,
"learning_rate": 0.001,
"step": 5480
},
{
"epoch": 20.07,
"learning_rate": 0.001,
"loss": 0.1202,
"step": 5500
},
{
"epoch": 21.0,
"eval_accuracy": 0.5352407536636427,
"eval_f1_macro": 0.6926783323821563,
"eval_f1_micro": 0.8300336623495178,
"eval_loss": 0.09886988252401352,
"eval_roc_auc": 0.8896211857387517,
"eval_runtime": 684.9162,
"eval_samples_per_second": 4.184,
"eval_steps_per_second": 0.131,
"learning_rate": 0.001,
"step": 5754
},
{
"epoch": 21.9,
"learning_rate": 0.001,
"loss": 0.12,
"step": 6000
},
{
"epoch": 22.0,
"eval_accuracy": 0.5209351011863224,
"eval_f1_macro": 0.6961228606859606,
"eval_f1_micro": 0.8279826958105646,
"eval_loss": 0.09963646531105042,
"eval_roc_auc": 0.8892587586568824,
"eval_runtime": 686.1389,
"eval_samples_per_second": 4.177,
"eval_steps_per_second": 0.131,
"learning_rate": 0.001,
"step": 6028
},
{
"epoch": 23.0,
"eval_accuracy": 0.5195394277739009,
"eval_f1_macro": 0.6958628426894405,
"eval_f1_micro": 0.831919078392807,
"eval_loss": 0.09720779210329056,
"eval_roc_auc": 0.8955944894582717,
"eval_runtime": 693.3459,
"eval_samples_per_second": 4.134,
"eval_steps_per_second": 0.13,
"learning_rate": 0.001,
"step": 6302
},
{
"epoch": 23.72,
"learning_rate": 0.001,
"loss": 0.1179,
"step": 6500
},
{
"epoch": 24.0,
"eval_accuracy": 0.5212840195394278,
"eval_f1_macro": 0.6881053152313114,
"eval_f1_micro": 0.8270608813406306,
"eval_loss": 0.10082241147756577,
"eval_roc_auc": 0.8915954736236973,
"eval_runtime": 682.9894,
"eval_samples_per_second": 4.196,
"eval_steps_per_second": 0.132,
"learning_rate": 0.001,
"step": 6576
},
{
"epoch": 25.0,
"eval_accuracy": 0.5268667131891137,
"eval_f1_macro": 0.6859679989625925,
"eval_f1_micro": 0.8283316086006668,
"eval_loss": 0.09828384965658188,
"eval_roc_auc": 0.8862551588199984,
"eval_runtime": 673.7378,
"eval_samples_per_second": 4.254,
"eval_steps_per_second": 0.134,
"learning_rate": 0.001,
"step": 6850
},
{
"epoch": 25.55,
"learning_rate": 0.001,
"loss": 0.1166,
"step": 7000
},
{
"epoch": 26.0,
"eval_accuracy": 0.5310537334263782,
"eval_f1_macro": 0.6805616825898689,
"eval_f1_micro": 0.8284274424464553,
"eval_loss": 0.09853371977806091,
"eval_roc_auc": 0.8875551335725609,
"eval_runtime": 679.0226,
"eval_samples_per_second": 4.221,
"eval_steps_per_second": 0.133,
"learning_rate": 0.001,
"step": 7124
},
{
"epoch": 27.0,
"eval_accuracy": 0.5324494068387997,
"eval_f1_macro": 0.6901040821549612,
"eval_f1_micro": 0.8305464575073264,
"eval_loss": 0.09571811556816101,
"eval_roc_auc": 0.887615396252071,
"eval_runtime": 672.1908,
"eval_samples_per_second": 4.264,
"eval_steps_per_second": 0.134,
"learning_rate": 0.001,
"step": 7398
},
{
"epoch": 27.37,
"learning_rate": 0.001,
"loss": 0.1158,
"step": 7500
},
{
"epoch": 28.0,
"eval_accuracy": 0.5177948360083741,
"eval_f1_macro": 0.7054421966314011,
"eval_f1_micro": 0.8292325882551658,
"eval_loss": 0.09954769909381866,
"eval_roc_auc": 0.8934873150088631,
"eval_runtime": 681.7881,
"eval_samples_per_second": 4.204,
"eval_steps_per_second": 0.132,
"learning_rate": 0.001,
"step": 7672
},
{
"epoch": 29.0,
"eval_accuracy": 0.5334961618981159,
"eval_f1_macro": 0.7026467347883069,
"eval_f1_micro": 0.8363861804655357,
"eval_loss": 0.09332505613565445,
"eval_roc_auc": 0.8970916521216963,
"eval_runtime": 684.6938,
"eval_samples_per_second": 4.186,
"eval_steps_per_second": 0.131,
"learning_rate": 0.001,
"step": 7946
},
{
"epoch": 29.2,
"learning_rate": 0.001,
"loss": 0.114,
"step": 8000
},
{
"epoch": 30.0,
"eval_accuracy": 0.5258199581297976,
"eval_f1_macro": 0.7109768073155117,
"eval_f1_micro": 0.8351258454374099,
"eval_loss": 0.09473367780447006,
"eval_roc_auc": 0.901874991489952,
"eval_runtime": 677.918,
"eval_samples_per_second": 4.228,
"eval_steps_per_second": 0.133,
"learning_rate": 0.001,
"step": 8220
},
{
"epoch": 31.0,
"eval_accuracy": 0.5331472435450104,
"eval_f1_macro": 0.7175382540523837,
"eval_f1_micro": 0.8365119611950171,
"eval_loss": 0.09674925357103348,
"eval_roc_auc": 0.9045853985344947,
"eval_runtime": 675.0971,
"eval_samples_per_second": 4.245,
"eval_steps_per_second": 0.133,
"learning_rate": 0.001,
"step": 8494
},
{
"epoch": 31.02,
"learning_rate": 0.001,
"loss": 0.1134,
"step": 8500
},
{
"epoch": 32.0,
"eval_accuracy": 0.5324494068387997,
"eval_f1_macro": 0.6932594476375145,
"eval_f1_micro": 0.8353541076487252,
"eval_loss": 0.09490892291069031,
"eval_roc_auc": 0.8947967085095635,
"eval_runtime": 677.2028,
"eval_samples_per_second": 4.232,
"eval_steps_per_second": 0.133,
"learning_rate": 0.001,
"step": 8768
},
{
"epoch": 32.85,
"learning_rate": 0.001,
"loss": 0.113,
"step": 9000
},
{
"epoch": 33.0,
"eval_accuracy": 0.5362875087229588,
"eval_f1_macro": 0.6973292248077614,
"eval_f1_micro": 0.8367208672086721,
"eval_loss": 0.09511947631835938,
"eval_roc_auc": 0.8966987186810037,
"eval_runtime": 679.2015,
"eval_samples_per_second": 4.22,
"eval_steps_per_second": 0.133,
"learning_rate": 0.001,
"step": 9042
},
{
"epoch": 34.0,
"eval_accuracy": 0.5380321004884857,
"eval_f1_macro": 0.6878227037845351,
"eval_f1_micro": 0.8334680679062246,
"eval_loss": 0.09364539384841919,
"eval_roc_auc": 0.8876181367760314,
"eval_runtime": 675.0346,
"eval_samples_per_second": 4.246,
"eval_steps_per_second": 0.133,
"learning_rate": 0.001,
"step": 9316
},
{
"epoch": 34.67,
"learning_rate": 0.001,
"loss": 0.1124,
"step": 9500
},
{
"epoch": 35.0,
"eval_accuracy": 0.5310537334263782,
"eval_f1_macro": 0.6856042645068489,
"eval_f1_micro": 0.833974649162517,
"eval_loss": 0.09358564764261246,
"eval_roc_auc": 0.8944494841237697,
"eval_runtime": 678.2782,
"eval_samples_per_second": 4.225,
"eval_steps_per_second": 0.133,
"learning_rate": 0.001,
"step": 9590
},
{
"epoch": 36.0,
"eval_accuracy": 0.5453593859036985,
"eval_f1_macro": 0.729828782855425,
"eval_f1_micro": 0.8455960879096174,
"eval_loss": 0.09342356771230698,
"eval_roc_auc": 0.9030647539078717,
"eval_runtime": 674.7512,
"eval_samples_per_second": 4.247,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 9864
},
{
"epoch": 36.5,
"learning_rate": 0.0001,
"loss": 0.1083,
"step": 10000
},
{
"epoch": 37.0,
"eval_accuracy": 0.54675505931612,
"eval_f1_macro": 0.7188765655113909,
"eval_f1_micro": 0.8456650022696323,
"eval_loss": 0.09240464121103287,
"eval_roc_auc": 0.8999478550409371,
"eval_runtime": 674.676,
"eval_samples_per_second": 4.248,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 10138
},
{
"epoch": 38.0,
"eval_accuracy": 0.5450104675505931,
"eval_f1_macro": 0.7089159960142193,
"eval_f1_micro": 0.8449173647271904,
"eval_loss": 0.09147636592388153,
"eval_roc_auc": 0.9003695495594045,
"eval_runtime": 675.4085,
"eval_samples_per_second": 4.243,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 10412
},
{
"epoch": 38.32,
"learning_rate": 0.0001,
"loss": 0.1034,
"step": 10500
},
{
"epoch": 39.0,
"eval_accuracy": 0.5484996510816469,
"eval_f1_macro": 0.725215575661352,
"eval_f1_micro": 0.8487853799866281,
"eval_loss": 0.09022974222898483,
"eval_roc_auc": 0.9078051247451889,
"eval_runtime": 672.7306,
"eval_samples_per_second": 4.26,
"eval_steps_per_second": 0.134,
"learning_rate": 0.0001,
"step": 10686
},
{
"epoch": 40.0,
"eval_accuracy": 0.5495464061409631,
"eval_f1_macro": 0.7182446688615595,
"eval_f1_micro": 0.8458797579322437,
"eval_loss": 0.09058264642953873,
"eval_roc_auc": 0.9011424061638826,
"eval_runtime": 678.9298,
"eval_samples_per_second": 4.221,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 10960
},
{
"epoch": 40.15,
"learning_rate": 0.0001,
"loss": 0.1024,
"step": 11000
},
{
"epoch": 41.0,
"eval_accuracy": 0.5505931612002791,
"eval_f1_macro": 0.7130026819185953,
"eval_f1_micro": 0.8481005491705826,
"eval_loss": 0.08943015336990356,
"eval_roc_auc": 0.902018393012137,
"eval_runtime": 676.4356,
"eval_samples_per_second": 4.237,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 11234
},
{
"epoch": 41.97,
"learning_rate": 0.0001,
"loss": 0.1004,
"step": 11500
},
{
"epoch": 42.0,
"eval_accuracy": 0.5519888346127007,
"eval_f1_macro": 0.7148190184347656,
"eval_f1_micro": 0.8457012282205084,
"eval_loss": 0.08726447820663452,
"eval_roc_auc": 0.8977194051943719,
"eval_runtime": 677.9496,
"eval_samples_per_second": 4.227,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 11508
},
{
"epoch": 43.0,
"eval_accuracy": 0.5537334263782275,
"eval_f1_macro": 0.71816969331258,
"eval_f1_micro": 0.8494563389754511,
"eval_loss": 0.08699071407318115,
"eval_roc_auc": 0.906163507621426,
"eval_runtime": 676.5268,
"eval_samples_per_second": 4.236,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 11782
},
{
"epoch": 43.8,
"learning_rate": 0.0001,
"loss": 0.0998,
"step": 12000
},
{
"epoch": 44.0,
"eval_accuracy": 0.5498953244940684,
"eval_f1_macro": 0.7261208407998851,
"eval_f1_micro": 0.8486114247008355,
"eval_loss": 0.08676985651254654,
"eval_roc_auc": 0.9033042612782081,
"eval_runtime": 674.6536,
"eval_samples_per_second": 4.248,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 12056
},
{
"epoch": 45.0,
"eval_accuracy": 0.555129099790649,
"eval_f1_macro": 0.7235580263821535,
"eval_f1_micro": 0.8493258426966293,
"eval_loss": 0.08680889010429382,
"eval_roc_auc": 0.9052931027877648,
"eval_runtime": 688.2557,
"eval_samples_per_second": 4.164,
"eval_steps_per_second": 0.131,
"learning_rate": 0.0001,
"step": 12330
},
{
"epoch": 45.62,
"learning_rate": 0.0001,
"loss": 0.0975,
"step": 12500
},
{
"epoch": 46.0,
"eval_accuracy": 0.5512909979064898,
"eval_f1_macro": 0.7317716716296281,
"eval_f1_micro": 0.8489586241554526,
"eval_loss": 0.0865492969751358,
"eval_roc_auc": 0.9071607698668371,
"eval_runtime": 684.0678,
"eval_samples_per_second": 4.19,
"eval_steps_per_second": 0.132,
"learning_rate": 0.0001,
"step": 12604
},
{
"epoch": 47.0,
"eval_accuracy": 0.5547801814375436,
"eval_f1_macro": 0.7390020274567815,
"eval_f1_micro": 0.8512299882858259,
"eval_loss": 0.08599700033664703,
"eval_roc_auc": 0.908765101440927,
"eval_runtime": 688.2365,
"eval_samples_per_second": 4.164,
"eval_steps_per_second": 0.131,
"learning_rate": 0.0001,
"step": 12878
},
{
"epoch": 47.45,
"learning_rate": 0.0001,
"loss": 0.099,
"step": 13000
},
{
"epoch": 48.0,
"eval_accuracy": 0.5558269364968598,
"eval_f1_macro": 0.7360003523455093,
"eval_f1_micro": 0.8509512552065742,
"eval_loss": 0.08596429973840714,
"eval_roc_auc": 0.9055422308395834,
"eval_runtime": 686.3198,
"eval_samples_per_second": 4.176,
"eval_steps_per_second": 0.131,
"learning_rate": 0.0001,
"step": 13152
},
{
"epoch": 49.0,
"eval_accuracy": 0.5547801814375436,
"eval_f1_macro": 0.7361919298080869,
"eval_f1_micro": 0.849985959000281,
"eval_loss": 0.08584348857402802,
"eval_roc_auc": 0.9057525299940252,
"eval_runtime": 688.3813,
"eval_samples_per_second": 4.163,
"eval_steps_per_second": 0.131,
"learning_rate": 0.0001,
"step": 13426
},
{
"epoch": 49.27,
"learning_rate": 0.0001,
"loss": 0.0972,
"step": 13500
},
{
"epoch": 50.0,
"eval_accuracy": 0.5586182833217027,
"eval_f1_macro": 0.725712332481399,
"eval_f1_micro": 0.8505096262740656,
"eval_loss": 0.08557379245758057,
"eval_roc_auc": 0.9032805341102342,
"eval_runtime": 685.8179,
"eval_samples_per_second": 4.179,
"eval_steps_per_second": 0.131,
"learning_rate": 0.0001,
"step": 13700
},
{
"epoch": 51.0,
"eval_accuracy": 0.557920446615492,
"eval_f1_macro": 0.7408593608052999,
"eval_f1_micro": 0.8500254194204373,
"eval_loss": 0.08562461286783218,
"eval_roc_auc": 0.9038335718454608,
"eval_runtime": 683.3234,
"eval_samples_per_second": 4.194,
"eval_steps_per_second": 0.132,
"learning_rate": 0.0001,
"step": 13974
},
{
"epoch": 51.09,
"learning_rate": 0.0001,
"loss": 0.0957,
"step": 14000
},
{
"epoch": 52.0,
"eval_accuracy": 0.5568736915561758,
"eval_f1_macro": 0.7232142709265429,
"eval_f1_micro": 0.8507868221442318,
"eval_loss": 0.08591117709875107,
"eval_roc_auc": 0.9035466101391771,
"eval_runtime": 693.4248,
"eval_samples_per_second": 4.133,
"eval_steps_per_second": 0.13,
"learning_rate": 0.0001,
"step": 14248
},
{
"epoch": 52.92,
"learning_rate": 0.0001,
"loss": 0.0964,
"step": 14500
},
{
"epoch": 53.0,
"eval_accuracy": 0.5628053035589672,
"eval_f1_macro": 0.7275870481420489,
"eval_f1_micro": 0.852056338028169,
"eval_loss": 0.08490145951509476,
"eval_roc_auc": 0.9058454914515268,
"eval_runtime": 691.5127,
"eval_samples_per_second": 4.145,
"eval_steps_per_second": 0.13,
"learning_rate": 0.0001,
"step": 14522
},
{
"epoch": 54.0,
"eval_accuracy": 0.5537334263782275,
"eval_f1_macro": 0.7394514344990791,
"eval_f1_micro": 0.85390386218394,
"eval_loss": 0.08516541868448257,
"eval_roc_auc": 0.9115532672468961,
"eval_runtime": 698.0325,
"eval_samples_per_second": 4.106,
"eval_steps_per_second": 0.129,
"learning_rate": 0.0001,
"step": 14796
},
{
"epoch": 54.74,
"learning_rate": 0.0001,
"loss": 0.0955,
"step": 15000
},
{
"epoch": 55.0,
"eval_accuracy": 0.5565247732030705,
"eval_f1_macro": 0.7354184764103003,
"eval_f1_micro": 0.8511167656205825,
"eval_loss": 0.08514942973852158,
"eval_roc_auc": 0.904089479088129,
"eval_runtime": 681.3519,
"eval_samples_per_second": 4.206,
"eval_steps_per_second": 0.132,
"learning_rate": 0.0001,
"step": 15070
},
{
"epoch": 56.0,
"eval_accuracy": 0.5572226099092812,
"eval_f1_macro": 0.736739641327092,
"eval_f1_micro": 0.8529461421576904,
"eval_loss": 0.08491206169128418,
"eval_roc_auc": 0.9066984002032717,
"eval_runtime": 677.9791,
"eval_samples_per_second": 4.227,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 15344
},
{
"epoch": 56.57,
"learning_rate": 0.0001,
"loss": 0.095,
"step": 15500
},
{
"epoch": 57.0,
"eval_accuracy": 0.5537334263782275,
"eval_f1_macro": 0.7241830253482859,
"eval_f1_micro": 0.8493824336688013,
"eval_loss": 0.0848437026143074,
"eval_roc_auc": 0.8993941682342463,
"eval_runtime": 677.1333,
"eval_samples_per_second": 4.233,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 15618
},
{
"epoch": 58.0,
"eval_accuracy": 0.5593161200279134,
"eval_f1_macro": 0.7363418087082886,
"eval_f1_micro": 0.8511604153662826,
"eval_loss": 0.08454328030347824,
"eval_roc_auc": 0.9029315644433922,
"eval_runtime": 675.3593,
"eval_samples_per_second": 4.244,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 15892
},
{
"epoch": 58.39,
"learning_rate": 0.0001,
"loss": 0.093,
"step": 16000
},
{
"epoch": 59.0,
"eval_accuracy": 0.560711793440335,
"eval_f1_macro": 0.73901392865669,
"eval_f1_micro": 0.8530955471527739,
"eval_loss": 0.08396653085947037,
"eval_roc_auc": 0.9058246057741859,
"eval_runtime": 679.8275,
"eval_samples_per_second": 4.216,
"eval_steps_per_second": 0.132,
"learning_rate": 0.0001,
"step": 16166
},
{
"epoch": 60.0,
"eval_accuracy": 0.5561758548499651,
"eval_f1_macro": 0.7472770304573509,
"eval_f1_micro": 0.852848189028787,
"eval_loss": 0.08474517613649368,
"eval_roc_auc": 0.9116141789978706,
"eval_runtime": 679.8207,
"eval_samples_per_second": 4.216,
"eval_steps_per_second": 0.132,
"learning_rate": 0.0001,
"step": 16440
},
{
"epoch": 60.22,
"learning_rate": 0.0001,
"loss": 0.0936,
"step": 16500
},
{
"epoch": 61.0,
"eval_accuracy": 0.552337752965806,
"eval_f1_macro": 0.7425280881449604,
"eval_f1_micro": 0.8516569637259293,
"eval_loss": 0.08434043824672699,
"eval_roc_auc": 0.9078005379735077,
"eval_runtime": 678.8837,
"eval_samples_per_second": 4.222,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 16714
},
{
"epoch": 62.0,
"eval_accuracy": 0.5540823447313329,
"eval_f1_macro": 0.7455853496732745,
"eval_f1_micro": 0.8515365097265295,
"eval_loss": 0.08436089754104614,
"eval_roc_auc": 0.905273313320008,
"eval_runtime": 684.8061,
"eval_samples_per_second": 4.185,
"eval_steps_per_second": 0.131,
"learning_rate": 0.0001,
"step": 16988
},
{
"epoch": 62.04,
"learning_rate": 0.0001,
"loss": 0.0932,
"step": 17000
},
{
"epoch": 63.0,
"eval_accuracy": 0.5575715282623867,
"eval_f1_macro": 0.7344319075168565,
"eval_f1_micro": 0.8535319341006545,
"eval_loss": 0.0839960053563118,
"eval_roc_auc": 0.9061600170593289,
"eval_runtime": 676.8011,
"eval_samples_per_second": 4.235,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 17262
},
{
"epoch": 63.87,
"learning_rate": 0.0001,
"loss": 0.0933,
"step": 17500
},
{
"epoch": 64.0,
"eval_accuracy": 0.5614096301465457,
"eval_f1_macro": 0.7405199466064576,
"eval_f1_micro": 0.8543109759531453,
"eval_loss": 0.08395348489284515,
"eval_roc_auc": 0.907220383474883,
"eval_runtime": 676.0097,
"eval_samples_per_second": 4.24,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 17536
},
{
"epoch": 65.0,
"eval_accuracy": 0.557920446615492,
"eval_f1_macro": 0.7354221702015719,
"eval_f1_micro": 0.8506689439225733,
"eval_loss": 0.08403661847114563,
"eval_roc_auc": 0.9015583167344123,
"eval_runtime": 675.0487,
"eval_samples_per_second": 4.246,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 17810
},
{
"epoch": 65.69,
"learning_rate": 0.0001,
"loss": 0.0921,
"step": 18000
},
{
"epoch": 66.0,
"eval_accuracy": 0.5568736915561758,
"eval_f1_macro": 0.7296578358578595,
"eval_f1_micro": 0.852865023077789,
"eval_loss": 0.08408054709434509,
"eval_roc_auc": 0.9065963661690798,
"eval_runtime": 680.0166,
"eval_samples_per_second": 4.215,
"eval_steps_per_second": 0.132,
"learning_rate": 0.0001,
"step": 18084
},
{
"epoch": 67.0,
"eval_accuracy": 0.5540823447313329,
"eval_f1_macro": 0.7392975848141861,
"eval_f1_micro": 0.8539689628223736,
"eval_loss": 0.08376849442720413,
"eval_roc_auc": 0.9100385075348831,
"eval_runtime": 675.941,
"eval_samples_per_second": 4.24,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 18358
},
{
"epoch": 67.52,
"learning_rate": 0.0001,
"loss": 0.0913,
"step": 18500
},
{
"epoch": 68.0,
"eval_accuracy": 0.5572226099092812,
"eval_f1_macro": 0.7403483881006915,
"eval_f1_micro": 0.854102492299076,
"eval_loss": 0.08355987071990967,
"eval_roc_auc": 0.9089826269243382,
"eval_runtime": 676.7975,
"eval_samples_per_second": 4.235,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 18632
},
{
"epoch": 69.0,
"eval_accuracy": 0.5582693649685974,
"eval_f1_macro": 0.7494443807338856,
"eval_f1_micro": 0.8547792062604807,
"eval_loss": 0.08346723765134811,
"eval_roc_auc": 0.9100283387486087,
"eval_runtime": 675.2406,
"eval_samples_per_second": 4.244,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 18906
},
{
"epoch": 69.34,
"learning_rate": 0.0001,
"loss": 0.0911,
"step": 19000
},
{
"epoch": 70.0,
"eval_accuracy": 0.5561758548499651,
"eval_f1_macro": 0.7486606655073544,
"eval_f1_micro": 0.8551793496480055,
"eval_loss": 0.08306006342172623,
"eval_roc_auc": 0.9104037761073852,
"eval_runtime": 675.6626,
"eval_samples_per_second": 4.242,
"eval_steps_per_second": 0.133,
"learning_rate": 0.0001,
"step": 19180
},
{
"epoch": 71.0,
"eval_accuracy": 0.557920446615492,
"eval_f1_macro": 0.74841480686329,
"eval_f1_micro": 0.8557041347283614,
"eval_loss": 0.08348394185304642,
"eval_roc_auc": 0.9102149107350765,
"eval_runtime": 688.9991,
"eval_samples_per_second": 4.16,
"eval_steps_per_second": 0.131,
"learning_rate": 0.0001,
"step": 19454
},
{
"epoch": 71.17,
"learning_rate": 0.0001,
"loss": 0.0907,
"step": 19500
},
{
"epoch": 72.0,
"eval_accuracy": 0.5610607117934403,
"eval_f1_macro": 0.7445560004670461,
"eval_f1_micro": 0.8531667140017041,
"eval_loss": 0.08317266404628754,
"eval_roc_auc": 0.9036835353705291,
"eval_runtime": 686.0467,
"eval_samples_per_second": 4.178,
"eval_steps_per_second": 0.131,
"learning_rate": 0.0001,
"step": 19728
},
{
"epoch": 72.99,
"learning_rate": 0.0001,
"loss": 0.0905,
"step": 20000
},
{
"epoch": 73.0,
"eval_accuracy": 0.5575715282623867,
"eval_f1_macro": 0.7511661878734329,
"eval_f1_micro": 0.8557848235754626,
"eval_loss": 0.0826636552810669,
"eval_roc_auc": 0.9104516775814524,
"eval_runtime": 696.2462,
"eval_samples_per_second": 4.116,
"eval_steps_per_second": 0.129,
"learning_rate": 0.0001,
"step": 20002
},
{
"epoch": 74.0,
"eval_accuracy": 0.5589672016748081,
"eval_f1_macro": 0.7519078199055363,
"eval_f1_micro": 0.8547880690737834,
"eval_loss": 0.08345863223075867,
"eval_roc_auc": 0.9089978296204139,
"eval_runtime": 684.5044,
"eval_samples_per_second": 4.187,
"eval_steps_per_second": 0.131,
"learning_rate": 0.0001,
"step": 20276
},
{
"epoch": 74.82,
"learning_rate": 0.0001,
"loss": 0.0896,
"step": 20500
},
{
"epoch": 75.0,
"eval_accuracy": 0.5565247732030705,
"eval_f1_macro": 0.7427640048071817,
"eval_f1_micro": 0.8535384963511908,
"eval_loss": 0.08291995525360107,
"eval_roc_auc": 0.9052642407433178,
"eval_runtime": 693.0369,
"eval_samples_per_second": 4.135,
"eval_steps_per_second": 0.13,
"learning_rate": 0.0001,
"step": 20550
},
{
"epoch": 76.0,
"eval_accuracy": 0.5642009769713887,
"eval_f1_macro": 0.7449358839801685,
"eval_f1_micro": 0.8560516708789666,
"eval_loss": 0.08278567343950272,
"eval_roc_auc": 0.9091009598641902,
"eval_runtime": 689.5027,
"eval_samples_per_second": 4.157,
"eval_steps_per_second": 0.131,
"learning_rate": 0.0001,
"step": 20824
},
{
"epoch": 76.64,
"learning_rate": 0.0001,
"loss": 0.089,
"step": 21000
},
{
"epoch": 77.0,
"eval_accuracy": 0.5603628750872296,
"eval_f1_macro": 0.7507123347472292,
"eval_f1_micro": 0.8567585743106928,
"eval_loss": 0.08268015086650848,
"eval_roc_auc": 0.9102413784270108,
"eval_runtime": 691.3385,
"eval_samples_per_second": 4.146,
"eval_steps_per_second": 0.13,
"learning_rate": 0.0001,
"step": 21098
},
{
"epoch": 78.0,
"eval_accuracy": 0.557920446615492,
"eval_f1_macro": 0.7435504236075495,
"eval_f1_micro": 0.8528667079277555,
"eval_loss": 0.0833190307021141,
"eval_roc_auc": 0.9067310989812636,
"eval_runtime": 698.1968,
"eval_samples_per_second": 4.105,
"eval_steps_per_second": 0.129,
"learning_rate": 0.0001,
"step": 21372
},
{
"epoch": 78.47,
"learning_rate": 0.0001,
"loss": 0.0892,
"step": 21500
},
{
"epoch": 79.0,
"eval_accuracy": 0.5589672016748081,
"eval_f1_macro": 0.7501683098189544,
"eval_f1_micro": 0.8540393754243042,
"eval_loss": 0.08301213383674622,
"eval_roc_auc": 0.905519599881194,
"eval_runtime": 693.3725,
"eval_samples_per_second": 4.133,
"eval_steps_per_second": 0.13,
"learning_rate": 0.0001,
"step": 21646
},
{
"epoch": 80.0,
"eval_accuracy": 0.5600139567341242,
"eval_f1_macro": 0.7461247141006309,
"eval_f1_micro": 0.8548240635641317,
"eval_loss": 0.08266153186559677,
"eval_roc_auc": 0.9048757931076342,
"eval_runtime": 692.1533,
"eval_samples_per_second": 4.141,
"eval_steps_per_second": 0.13,
"learning_rate": 1e-05,
"step": 21920
},
{
"epoch": 80.29,
"learning_rate": 1e-05,
"loss": 0.0879,
"step": 22000
},
{
"epoch": 81.0,
"eval_accuracy": 0.560711793440335,
"eval_f1_macro": 0.7542778186740821,
"eval_f1_micro": 0.8576379185065117,
"eval_loss": 0.08230110257863998,
"eval_roc_auc": 0.9116332184274908,
"eval_runtime": 691.9752,
"eval_samples_per_second": 4.142,
"eval_steps_per_second": 0.13,
"learning_rate": 1e-05,
"step": 22194
},
{
"epoch": 82.0,
"eval_accuracy": 0.5631542219120725,
"eval_f1_macro": 0.7536111063550082,
"eval_f1_micro": 0.8576225654801881,
"eval_loss": 0.08222728967666626,
"eval_roc_auc": 0.9111816666216643,
"eval_runtime": 688.2687,
"eval_samples_per_second": 4.164,
"eval_steps_per_second": 0.131,
"learning_rate": 1e-05,
"step": 22468
},
{
"epoch": 82.12,
"learning_rate": 1e-05,
"loss": 0.0867,
"step": 22500
},
{
"epoch": 83.0,
"eval_accuracy": 0.5624563852058618,
"eval_f1_macro": 0.7519980936807484,
"eval_f1_micro": 0.8553623024191264,
"eval_loss": 0.08224428445100784,
"eval_roc_auc": 0.9057647902327958,
"eval_runtime": 675.1087,
"eval_samples_per_second": 4.245,
"eval_steps_per_second": 0.133,
"learning_rate": 1e-05,
"step": 22742
},
{
"epoch": 83.94,
"learning_rate": 1e-05,
"loss": 0.0864,
"step": 23000
},
{
"epoch": 84.0,
"eval_accuracy": 0.5638520586182834,
"eval_f1_macro": 0.751088987860079,
"eval_f1_micro": 0.8550642905481616,
"eval_loss": 0.08214889466762543,
"eval_roc_auc": 0.9071555340236915,
"eval_runtime": 684.6287,
"eval_samples_per_second": 4.186,
"eval_steps_per_second": 0.131,
"learning_rate": 1e-05,
"step": 23016
},
{
"epoch": 85.0,
"eval_accuracy": 0.5617585484996511,
"eval_f1_macro": 0.7532850236770345,
"eval_f1_micro": 0.8560117633751838,
"eval_loss": 0.08197268098592758,
"eval_roc_auc": 0.9067157953185159,
"eval_runtime": 685.9962,
"eval_samples_per_second": 4.178,
"eval_steps_per_second": 0.131,
"learning_rate": 1e-05,
"step": 23290
},
{
"epoch": 85.77,
"learning_rate": 1e-05,
"loss": 0.0865,
"step": 23500
},
{
"epoch": 86.0,
"eval_accuracy": 0.5600139567341242,
"eval_f1_macro": 0.7495768803790436,
"eval_f1_micro": 0.8553152949167893,
"eval_loss": 0.0821395218372345,
"eval_roc_auc": 0.9060269285615214,
"eval_runtime": 676.0683,
"eval_samples_per_second": 4.239,
"eval_steps_per_second": 0.133,
"learning_rate": 1e-05,
"step": 23564
},
{
"epoch": 87.0,
"eval_accuracy": 0.5586182833217027,
"eval_f1_macro": 0.7518865385404515,
"eval_f1_micro": 0.8558878188883257,
"eval_loss": 0.08169202506542206,
"eval_roc_auc": 0.9080884949227034,
"eval_runtime": 683.932,
"eval_samples_per_second": 4.19,
"eval_steps_per_second": 0.132,
"learning_rate": 1e-05,
"step": 23838
},
{
"epoch": 87.59,
"learning_rate": 1e-05,
"loss": 0.0868,
"step": 24000
},
{
"epoch": 88.0,
"eval_accuracy": 0.5621074668527565,
"eval_f1_macro": 0.7526313975322289,
"eval_f1_micro": 0.8558239036198839,
"eval_loss": 0.08171343803405762,
"eval_roc_auc": 0.9081685470699702,
"eval_runtime": 687.6304,
"eval_samples_per_second": 4.168,
"eval_steps_per_second": 0.131,
"learning_rate": 1e-05,
"step": 24112
},
{
"epoch": 89.0,
"eval_accuracy": 0.5638520586182834,
"eval_f1_macro": 0.7535945449960157,
"eval_f1_micro": 0.8569978572234127,
"eval_loss": 0.08180436491966248,
"eval_roc_auc": 0.9082570227224631,
"eval_runtime": 685.8987,
"eval_samples_per_second": 4.178,
"eval_steps_per_second": 0.131,
"learning_rate": 1e-05,
"step": 24386
},
{
"epoch": 89.42,
"learning_rate": 1e-05,
"loss": 0.0857,
"step": 24500
},
{
"epoch": 90.0,
"eval_accuracy": 0.5617585484996511,
"eval_f1_macro": 0.7521712775972677,
"eval_f1_micro": 0.8557914296976182,
"eval_loss": 0.08184907585382462,
"eval_roc_auc": 0.9080738403314199,
"eval_runtime": 2199.2107,
"eval_samples_per_second": 1.303,
"eval_steps_per_second": 0.041,
"learning_rate": 1e-05,
"step": 24660
},
{
"epoch": 91.0,
"eval_accuracy": 0.5631542219120725,
"eval_f1_macro": 0.7496381590553177,
"eval_f1_micro": 0.856868937514099,
"eval_loss": 0.08175913989543915,
"eval_roc_auc": 0.9081476613926293,
"eval_runtime": 685.7142,
"eval_samples_per_second": 4.18,
"eval_steps_per_second": 0.131,
"learning_rate": 1e-05,
"step": 24934
},
{
"epoch": 91.24,
"learning_rate": 1e-05,
"loss": 0.0862,
"step": 25000
},
{
"epoch": 92.0,
"eval_accuracy": 0.5648988136775994,
"eval_f1_macro": 0.7551884126903309,
"eval_f1_micro": 0.8566131025957974,
"eval_loss": 0.08205177634954453,
"eval_roc_auc": 0.9092762668547993,
"eval_runtime": 688.0975,
"eval_samples_per_second": 4.165,
"eval_steps_per_second": 0.131,
"learning_rate": 1e-05,
"step": 25208
},
{
"epoch": 93.0,
"eval_accuracy": 0.5628053035589672,
"eval_f1_macro": 0.7579638727848569,
"eval_f1_micro": 0.8588642195693407,
"eval_loss": 0.08153587579727173,
"eval_roc_auc": 0.9129889700545543,
"eval_runtime": 686.4355,
"eval_samples_per_second": 4.175,
"eval_steps_per_second": 0.131,
"learning_rate": 1e-05,
"step": 25482
},
{
"epoch": 93.07,
"learning_rate": 1e-05,
"loss": 0.0851,
"step": 25500
},
{
"epoch": 94.0,
"eval_accuracy": 0.5600139567341242,
"eval_f1_macro": 0.7565755790887538,
"eval_f1_micro": 0.8570630932439977,
"eval_loss": 0.0816139355301857,
"eval_roc_auc": 0.911680023691974,
"eval_runtime": 686.9681,
"eval_samples_per_second": 4.172,
"eval_steps_per_second": 0.131,
"learning_rate": 1e-05,
"step": 25756
},
{
"epoch": 94.89,
"learning_rate": 1e-05,
"loss": 0.0854,
"step": 26000
},
{
"epoch": 95.0,
"eval_accuracy": 0.5631542219120725,
"eval_f1_macro": 0.7553215815461111,
"eval_f1_micro": 0.8563582357226924,
"eval_loss": 0.08153104782104492,
"eval_roc_auc": 0.9100006738804182,
"eval_runtime": 792.6719,
"eval_samples_per_second": 3.616,
"eval_steps_per_second": 0.114,
"learning_rate": 1e-05,
"step": 26030
},
{
"epoch": 96.0,
"eval_accuracy": 0.5621074668527565,
"eval_f1_macro": 0.7584737150271473,
"eval_f1_micro": 0.8576208800401539,
"eval_loss": 0.081536203622818,
"eval_roc_auc": 0.9123942619313182,
"eval_runtime": 689.1211,
"eval_samples_per_second": 4.159,
"eval_steps_per_second": 0.131,
"learning_rate": 1e-05,
"step": 26304
},
{
"epoch": 96.72,
"learning_rate": 1e-05,
"loss": 0.0854,
"step": 26500
},
{
"epoch": 97.0,
"eval_accuracy": 0.5628053035589672,
"eval_f1_macro": 0.7578675241138624,
"eval_f1_micro": 0.8575591168889387,
"eval_loss": 0.0817214846611023,
"eval_roc_auc": 0.9107227875201963,
"eval_runtime": 791.8215,
"eval_samples_per_second": 3.62,
"eval_steps_per_second": 0.114,
"learning_rate": 1e-05,
"step": 26578
},
{
"epoch": 98.0,
"eval_accuracy": 0.5638520586182834,
"eval_f1_macro": 0.7526862577512524,
"eval_f1_micro": 0.8570947651910453,
"eval_loss": 0.08161807805299759,
"eval_roc_auc": 0.9100232038721354,
"eval_runtime": 689.7672,
"eval_samples_per_second": 4.155,
"eval_steps_per_second": 0.13,
"learning_rate": 1e-05,
"step": 26852
},
{
"epoch": 98.54,
"learning_rate": 1e-05,
"loss": 0.0855,
"step": 27000
},
{
"epoch": 99.0,
"eval_accuracy": 0.5642009769713887,
"eval_f1_macro": 0.7556285126609241,
"eval_f1_micro": 0.8578035986237239,
"eval_loss": 0.08184286206960678,
"eval_roc_auc": 0.9086036990034648,
"eval_runtime": 685.3364,
"eval_samples_per_second": 4.182,
"eval_steps_per_second": 0.131,
"learning_rate": 1e-05,
"step": 27126
},
{
"epoch": 100.0,
"eval_accuracy": 0.5631542219120725,
"eval_f1_macro": 0.753319281703831,
"eval_f1_micro": 0.857062242537103,
"eval_loss": 0.08161789923906326,
"eval_roc_auc": 0.9080422377630124,
"eval_runtime": 680.1579,
"eval_samples_per_second": 4.214,
"eval_steps_per_second": 0.132,
"learning_rate": 1.0000000000000002e-06,
"step": 27400
},
{
"epoch": 100.36,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0837,
"step": 27500
},
{
"epoch": 101.0,
"eval_accuracy": 0.5645498953244941,
"eval_f1_macro": 0.7553159980269647,
"eval_f1_micro": 0.8575286968264686,
"eval_loss": 0.08142262697219849,
"eval_roc_auc": 0.9092807526598085,
"eval_runtime": 693.9432,
"eval_samples_per_second": 4.13,
"eval_steps_per_second": 0.13,
"learning_rate": 1.0000000000000002e-06,
"step": 27674
},
{
"epoch": 102.0,
"eval_accuracy": 0.5652477320307048,
"eval_f1_macro": 0.7559444477928223,
"eval_f1_micro": 0.8571749382438806,
"eval_loss": 0.08143333345651627,
"eval_roc_auc": 0.9098557722819599,
"eval_runtime": 695.0171,
"eval_samples_per_second": 4.124,
"eval_steps_per_second": 0.129,
"learning_rate": 1.0000000000000002e-06,
"step": 27948
},
{
"epoch": 102.19,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.085,
"step": 28000
},
{
"epoch": 103.0,
"eval_accuracy": 0.5645498953244941,
"eval_f1_macro": 0.7565514506209431,
"eval_f1_micro": 0.8570462613399448,
"eval_loss": 0.08157742768526077,
"eval_roc_auc": 0.9085338156424723,
"eval_runtime": 710.2061,
"eval_samples_per_second": 4.035,
"eval_steps_per_second": 0.127,
"learning_rate": 1.0000000000000002e-06,
"step": 28222
},
{
"epoch": 104.0,
"eval_accuracy": 0.5645498953244941,
"eval_f1_macro": 0.7572978759334409,
"eval_f1_micro": 0.857623884617543,
"eval_loss": 0.08124219626188278,
"eval_roc_auc": 0.9102385369363781,
"eval_runtime": 703.8703,
"eval_samples_per_second": 4.072,
"eval_steps_per_second": 0.128,
"learning_rate": 1.0000000000000002e-06,
"step": 28496
},
{
"epoch": 104.01,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0844,
"step": 28500
},
{
"epoch": 105.0,
"eval_accuracy": 0.5603628750872296,
"eval_f1_macro": 0.7588882568234135,
"eval_f1_micro": 0.8571747004736696,
"eval_loss": 0.08170615136623383,
"eval_roc_auc": 0.9124156957134514,
"eval_runtime": 693.4706,
"eval_samples_per_second": 4.133,
"eval_steps_per_second": 0.13,
"learning_rate": 1.0000000000000002e-06,
"step": 28770
},
{
"epoch": 105.84,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0845,
"step": 29000
},
{
"epoch": 106.0,
"eval_accuracy": 0.5628053035589672,
"eval_f1_macro": 0.7514055460147794,
"eval_f1_micro": 0.8562891131532955,
"eval_loss": 0.08144387602806091,
"eval_roc_auc": 0.9079250010327448,
"eval_runtime": 693.924,
"eval_samples_per_second": 4.13,
"eval_steps_per_second": 0.13,
"learning_rate": 1.0000000000000002e-06,
"step": 29044
},
{
"epoch": 107.0,
"eval_accuracy": 0.5635031402651779,
"eval_f1_macro": 0.7490061784836257,
"eval_f1_micro": 0.8557823129251702,
"eval_loss": 0.08168599754571915,
"eval_roc_auc": 0.9057833825242961,
"eval_runtime": 697.3665,
"eval_samples_per_second": 4.11,
"eval_steps_per_second": 0.129,
"learning_rate": 1.0000000000000002e-06,
"step": 29318
},
{
"epoch": 107.66,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0854,
"step": 29500
},
{
"epoch": 108.0,
"eval_accuracy": 0.5642009769713887,
"eval_f1_macro": 0.7569164155873785,
"eval_f1_micro": 0.8569341425039335,
"eval_loss": 0.08160943537950516,
"eval_roc_auc": 0.9094149373671999,
"eval_runtime": 692.7895,
"eval_samples_per_second": 4.137,
"eval_steps_per_second": 0.13,
"learning_rate": 1.0000000000000002e-06,
"step": 29592
},
{
"epoch": 109.0,
"eval_accuracy": 0.5652477320307048,
"eval_f1_macro": 0.7558234898859766,
"eval_f1_micro": 0.8573669467787115,
"eval_loss": 0.08135490119457245,
"eval_roc_auc": 0.9106934783376293,
"eval_runtime": 695.7903,
"eval_samples_per_second": 4.119,
"eval_steps_per_second": 0.129,
"learning_rate": 1.0000000000000002e-06,
"step": 29866
},
{
"epoch": 109.49,
"learning_rate": 1.0000000000000002e-06,
"loss": 0.0854,
"step": 30000
},
{
"epoch": 110.0,
"eval_accuracy": 0.5638520586182834,
"eval_f1_macro": 0.7564667466516518,
"eval_f1_micro": 0.8577973962116557,
"eval_loss": 0.08132224529981613,
"eval_roc_auc": 0.9118372864958749,
"eval_runtime": 682.0266,
"eval_samples_per_second": 4.202,
"eval_steps_per_second": 0.132,
"learning_rate": 1.0000000000000002e-06,
"step": 30140
},
{
"epoch": 111.0,
"eval_accuracy": 0.5638520586182834,
"eval_f1_macro": 0.7579481466413214,
"eval_f1_micro": 0.8576381122791322,
"eval_loss": 0.0814104825258255,
"eval_roc_auc": 0.911498485615307,
"eval_runtime": 686.5544,
"eval_samples_per_second": 4.174,
"eval_steps_per_second": 0.131,
"learning_rate": 1.0000000000000002e-07,
"step": 30414
},
{
"epoch": 111.31,
"learning_rate": 1.0000000000000002e-07,
"loss": 0.0851,
"step": 30500
},
{
"epoch": 112.0,
"eval_accuracy": 0.5631542219120725,
"eval_f1_macro": 0.7575801018117111,
"eval_f1_micro": 0.8580721134974485,
"eval_loss": 0.08170080929994583,
"eval_roc_auc": 0.91075603440298,
"eval_runtime": 746.778,
"eval_samples_per_second": 3.838,
"eval_steps_per_second": 0.121,
"learning_rate": 1.0000000000000002e-07,
"step": 30688
},
{
"epoch": 113.0,
"eval_accuracy": 0.5614096301465457,
"eval_f1_macro": 0.7562692232145891,
"eval_f1_micro": 0.8583059164668487,
"eval_loss": 0.081505186855793,
"eval_roc_auc": 0.912813663063945,
"eval_runtime": 687.4479,
"eval_samples_per_second": 4.169,
"eval_steps_per_second": 0.131,
"learning_rate": 1.0000000000000002e-07,
"step": 30962
},
{
"epoch": 113.14,
"learning_rate": 1.0000000000000002e-07,
"loss": 0.0848,
"step": 31000
},
{
"epoch": 114.0,
"eval_accuracy": 0.5655966503838102,
"eval_f1_macro": 0.7560403631861836,
"eval_f1_micro": 0.8563654914408797,
"eval_loss": 0.08186182379722595,
"eval_roc_auc": 0.9061407756963643,
"eval_runtime": 731.2304,
"eval_samples_per_second": 3.919,
"eval_steps_per_second": 0.123,
"learning_rate": 1.0000000000000002e-07,
"step": 31236
},
{
"epoch": 114.0,
"learning_rate": 1.0000000000000002e-07,
"step": 31236,
"total_flos": 1.4819663325231928e+21,
"train_loss": 0.033337813025782426,
"train_runtime": 131818.0427,
"train_samples_per_second": 9.311,
"train_steps_per_second": 0.291
}
],
"logging_steps": 500,
"max_steps": 38360,
"num_train_epochs": 140,
"save_steps": 500,
"total_flos": 1.4819663325231928e+21,
"trial_name": null,
"trial_params": null
}