deberta-v3-large-nli-v1 / trainer_state.json
sjrhuschlee's picture
Upload folder using huggingface_hub
6bb6b05
{
"best_metric": 0.71900826446281,
"best_model_checkpoint": "models/single_label/deberta-v3-large/exp5/checkpoint-1500",
"epoch": 0.07913166189678593,
"global_step": 1500,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.01,
"learning_rate": 3.1645569620253166e-08,
"loss": 1.4101,
"step": 100
},
{
"epoch": 0.01,
"learning_rate": 6.329113924050633e-08,
"loss": 1.4037,
"step": 200
},
{
"epoch": 0.01,
"eval_osu_accuracy": 0.5289256198347108,
"eval_osu_loss": 1.3296300172805786,
"eval_osu_matthews_correlation": 0.08430984949814109,
"eval_osu_runtime": 4.6863,
"eval_osu_samples_per_second": 51.64,
"eval_osu_steps_per_second": 3.414,
"step": 250
},
{
"epoch": 0.01,
"eval_deepset_1_accuracy": 0.42016806722689076,
"eval_deepset_1_loss": 1.3601003885269165,
"eval_deepset_1_matthews_correlation": 0.007340018855649166,
"eval_deepset_1_runtime": 1.0598,
"eval_deepset_1_samples_per_second": 112.29,
"eval_deepset_1_steps_per_second": 7.549,
"step": 250
},
{
"epoch": 0.01,
"eval_deepset_2_accuracy": 0.5128205128205128,
"eval_deepset_2_loss": 1.341286540031433,
"eval_deepset_2_matthews_correlation": 0.09702062677085851,
"eval_deepset_2_runtime": 1.5595,
"eval_deepset_2_samples_per_second": 100.032,
"eval_deepset_2_steps_per_second": 6.412,
"step": 250
},
{
"epoch": 0.01,
"eval_deepset_3_accuracy": 0.5260115606936416,
"eval_deepset_3_loss": 1.3386189937591553,
"eval_deepset_3_matthews_correlation": 0.13147932110355937,
"eval_deepset_3_runtime": 3.0465,
"eval_deepset_3_samples_per_second": 113.572,
"eval_deepset_3_steps_per_second": 7.221,
"step": 250
},
{
"epoch": 0.01,
"eval_deepset_4_accuracy": 0.46601941747572817,
"eval_deepset_4_loss": 1.354163646697998,
"eval_deepset_4_matthews_correlation": 0.04602315745107765,
"eval_deepset_4_runtime": 1.7129,
"eval_deepset_4_samples_per_second": 120.262,
"eval_deepset_4_steps_per_second": 7.589,
"step": 250
},
{
"epoch": 0.01,
"eval_anli_accuracy": 0.314,
"eval_anli_loss": 1.3443490266799927,
"eval_anli_matthews_correlation": -0.03669996966921473,
"eval_anli_runtime": 5.1544,
"eval_anli_samples_per_second": 194.01,
"eval_anli_steps_per_second": 12.223,
"step": 250
},
{
"epoch": 0.02,
"learning_rate": 9.462025316455696e-08,
"loss": 1.381,
"step": 300
},
{
"epoch": 0.02,
"learning_rate": 1.2626582278481014e-07,
"loss": 1.3016,
"step": 400
},
{
"epoch": 0.03,
"learning_rate": 1.5791139240506326e-07,
"loss": 1.1103,
"step": 500
},
{
"epoch": 0.03,
"eval_osu_accuracy": 0.3677685950413223,
"eval_osu_loss": 1.2251540422439575,
"eval_osu_matthews_correlation": 0.009389673632694094,
"eval_osu_runtime": 4.6743,
"eval_osu_samples_per_second": 51.773,
"eval_osu_steps_per_second": 3.423,
"step": 500
},
{
"epoch": 0.03,
"eval_deepset_1_accuracy": 0.2605042016806723,
"eval_deepset_1_loss": 1.498146414756775,
"eval_deepset_1_matthews_correlation": -0.12070085589088507,
"eval_deepset_1_runtime": 1.0684,
"eval_deepset_1_samples_per_second": 111.378,
"eval_deepset_1_steps_per_second": 7.488,
"step": 500
},
{
"epoch": 0.03,
"eval_deepset_2_accuracy": 0.3076923076923077,
"eval_deepset_2_loss": 1.3761013746261597,
"eval_deepset_2_matthews_correlation": -0.08397491442025497,
"eval_deepset_2_runtime": 1.5607,
"eval_deepset_2_samples_per_second": 99.953,
"eval_deepset_2_steps_per_second": 6.407,
"step": 500
},
{
"epoch": 0.03,
"eval_deepset_3_accuracy": 0.31213872832369943,
"eval_deepset_3_loss": 1.4205697774887085,
"eval_deepset_3_matthews_correlation": -0.06528708661392457,
"eval_deepset_3_runtime": 3.0447,
"eval_deepset_3_samples_per_second": 113.639,
"eval_deepset_3_steps_per_second": 7.226,
"step": 500
},
{
"epoch": 0.03,
"eval_deepset_4_accuracy": 0.25728155339805825,
"eval_deepset_4_loss": 1.5763508081436157,
"eval_deepset_4_matthews_correlation": -0.11908261162663966,
"eval_deepset_4_runtime": 1.7183,
"eval_deepset_4_samples_per_second": 119.883,
"eval_deepset_4_steps_per_second": 7.565,
"step": 500
},
{
"epoch": 0.03,
"eval_anli_accuracy": 0.33,
"eval_anli_loss": 1.1667168140411377,
"eval_anli_matthews_correlation": 0.0012307081400291311,
"eval_anli_runtime": 5.1504,
"eval_anli_samples_per_second": 194.161,
"eval_anli_steps_per_second": 12.232,
"step": 500
},
{
"epoch": 0.03,
"learning_rate": 1.8955696202531644e-07,
"loss": 0.8892,
"step": 600
},
{
"epoch": 0.04,
"learning_rate": 2.2120253164556962e-07,
"loss": 0.7838,
"step": 700
},
{
"epoch": 0.04,
"eval_osu_accuracy": 0.6942148760330579,
"eval_osu_loss": 0.9712508916854858,
"eval_osu_matthews_correlation": 0.4897642238477718,
"eval_osu_runtime": 4.6823,
"eval_osu_samples_per_second": 51.684,
"eval_osu_steps_per_second": 3.417,
"step": 750
},
{
"epoch": 0.04,
"eval_deepset_1_accuracy": 0.6134453781512605,
"eval_deepset_1_loss": 1.6580817699432373,
"eval_deepset_1_matthews_correlation": 0.41985911107813456,
"eval_deepset_1_runtime": 1.0652,
"eval_deepset_1_samples_per_second": 111.721,
"eval_deepset_1_steps_per_second": 7.511,
"step": 750
},
{
"epoch": 0.04,
"eval_deepset_2_accuracy": 0.7051282051282052,
"eval_deepset_2_loss": 1.3619518280029297,
"eval_deepset_2_matthews_correlation": 0.5328568142577198,
"eval_deepset_2_runtime": 1.5605,
"eval_deepset_2_samples_per_second": 99.966,
"eval_deepset_2_steps_per_second": 6.408,
"step": 750
},
{
"epoch": 0.04,
"eval_deepset_3_accuracy": 0.5578034682080925,
"eval_deepset_3_loss": 1.4653511047363281,
"eval_deepset_3_matthews_correlation": 0.2932617859503659,
"eval_deepset_3_runtime": 3.0504,
"eval_deepset_3_samples_per_second": 113.429,
"eval_deepset_3_steps_per_second": 7.212,
"step": 750
},
{
"epoch": 0.04,
"eval_deepset_4_accuracy": 0.529126213592233,
"eval_deepset_4_loss": 1.7414307594299316,
"eval_deepset_4_matthews_correlation": 0.3054166536717615,
"eval_deepset_4_runtime": 1.7235,
"eval_deepset_4_samples_per_second": 119.522,
"eval_deepset_4_steps_per_second": 7.543,
"step": 750
},
{
"epoch": 0.04,
"eval_anli_accuracy": 0.351,
"eval_anli_loss": 1.1338268518447876,
"eval_anli_matthews_correlation": 0.030305510765310642,
"eval_anli_runtime": 5.1432,
"eval_anli_samples_per_second": 194.432,
"eval_anli_steps_per_second": 12.249,
"step": 750
},
{
"epoch": 0.04,
"learning_rate": 2.5284810126582275e-07,
"loss": 0.6807,
"step": 800
},
{
"epoch": 0.05,
"learning_rate": 2.844936708860759e-07,
"loss": 0.502,
"step": 900
},
{
"epoch": 0.05,
"learning_rate": 2.991503304270561e-07,
"loss": 0.4006,
"step": 1000
},
{
"epoch": 0.05,
"eval_osu_accuracy": 0.7024793388429752,
"eval_osu_loss": 0.7255080938339233,
"eval_osu_matthews_correlation": 0.4761839486992106,
"eval_osu_runtime": 4.6909,
"eval_osu_samples_per_second": 51.589,
"eval_osu_steps_per_second": 3.411,
"step": 1000
},
{
"epoch": 0.05,
"eval_deepset_1_accuracy": 0.6134453781512605,
"eval_deepset_1_loss": 1.6959413290023804,
"eval_deepset_1_matthews_correlation": 0.42105052198193255,
"eval_deepset_1_runtime": 1.0672,
"eval_deepset_1_samples_per_second": 111.505,
"eval_deepset_1_steps_per_second": 7.496,
"step": 1000
},
{
"epoch": 0.05,
"eval_deepset_2_accuracy": 0.7243589743589743,
"eval_deepset_2_loss": 1.2153555154800415,
"eval_deepset_2_matthews_correlation": 0.5466918371684817,
"eval_deepset_2_runtime": 1.556,
"eval_deepset_2_samples_per_second": 100.254,
"eval_deepset_2_steps_per_second": 6.427,
"step": 1000
},
{
"epoch": 0.05,
"eval_deepset_3_accuracy": 0.6473988439306358,
"eval_deepset_3_loss": 1.4247812032699585,
"eval_deepset_3_matthews_correlation": 0.4017768477834457,
"eval_deepset_3_runtime": 3.045,
"eval_deepset_3_samples_per_second": 113.628,
"eval_deepset_3_steps_per_second": 7.225,
"step": 1000
},
{
"epoch": 0.05,
"eval_deepset_4_accuracy": 0.6504854368932039,
"eval_deepset_4_loss": 1.7334672212600708,
"eval_deepset_4_matthews_correlation": 0.4508615553005039,
"eval_deepset_4_runtime": 1.7091,
"eval_deepset_4_samples_per_second": 120.534,
"eval_deepset_4_steps_per_second": 7.606,
"step": 1000
},
{
"epoch": 0.05,
"eval_anli_accuracy": 0.477,
"eval_anli_loss": 1.3187198638916016,
"eval_anli_matthews_correlation": 0.218035345395415,
"eval_anli_runtime": 5.1567,
"eval_anli_samples_per_second": 193.922,
"eval_anli_steps_per_second": 12.217,
"step": 1000
},
{
"epoch": 0.06,
"learning_rate": 2.9748431165657797e-07,
"loss": 0.3456,
"step": 1100
},
{
"epoch": 0.06,
"learning_rate": 2.9581829288609986e-07,
"loss": 0.3098,
"step": 1200
},
{
"epoch": 0.07,
"eval_osu_accuracy": 0.6900826446280992,
"eval_osu_loss": 0.794772207736969,
"eval_osu_matthews_correlation": 0.4632054751499522,
"eval_osu_runtime": 4.6759,
"eval_osu_samples_per_second": 51.755,
"eval_osu_steps_per_second": 3.422,
"step": 1250
},
{
"epoch": 0.07,
"eval_deepset_1_accuracy": 0.5882352941176471,
"eval_deepset_1_loss": 1.9199906587600708,
"eval_deepset_1_matthews_correlation": 0.3787987593817238,
"eval_deepset_1_runtime": 1.0581,
"eval_deepset_1_samples_per_second": 112.466,
"eval_deepset_1_steps_per_second": 7.561,
"step": 1250
},
{
"epoch": 0.07,
"eval_deepset_2_accuracy": 0.6923076923076923,
"eval_deepset_2_loss": 1.3611226081848145,
"eval_deepset_2_matthews_correlation": 0.5007307553834116,
"eval_deepset_2_runtime": 1.5603,
"eval_deepset_2_samples_per_second": 99.978,
"eval_deepset_2_steps_per_second": 6.409,
"step": 1250
},
{
"epoch": 0.07,
"eval_deepset_3_accuracy": 0.630057803468208,
"eval_deepset_3_loss": 1.5691180229187012,
"eval_deepset_3_matthews_correlation": 0.38258183358832687,
"eval_deepset_3_runtime": 3.052,
"eval_deepset_3_samples_per_second": 113.37,
"eval_deepset_3_steps_per_second": 7.208,
"step": 1250
},
{
"epoch": 0.07,
"eval_deepset_4_accuracy": 0.5922330097087378,
"eval_deepset_4_loss": 1.946365237236023,
"eval_deepset_4_matthews_correlation": 0.36618144302865463,
"eval_deepset_4_runtime": 1.7085,
"eval_deepset_4_samples_per_second": 120.574,
"eval_deepset_4_steps_per_second": 7.609,
"step": 1250
},
{
"epoch": 0.07,
"eval_anli_accuracy": 0.577,
"eval_anli_loss": 1.1495600938796997,
"eval_anli_matthews_correlation": 0.36758926218287485,
"eval_anli_runtime": 5.1325,
"eval_anli_samples_per_second": 194.837,
"eval_anli_steps_per_second": 12.275,
"step": 1250
},
{
"epoch": 0.07,
"learning_rate": 2.941522741156217e-07,
"loss": 0.2936,
"step": 1300
},
{
"epoch": 0.07,
"learning_rate": 2.9248625534514355e-07,
"loss": 0.275,
"step": 1400
},
{
"epoch": 0.08,
"learning_rate": 2.9083689676237014e-07,
"loss": 0.2711,
"step": 1500
},
{
"epoch": 0.08,
"eval_osu_accuracy": 0.71900826446281,
"eval_osu_loss": 0.8360257744789124,
"eval_osu_matthews_correlation": 0.5055263088346037,
"eval_osu_runtime": 4.6825,
"eval_osu_samples_per_second": 51.682,
"eval_osu_steps_per_second": 3.417,
"step": 1500
},
{
"epoch": 0.08,
"eval_deepset_1_accuracy": 0.6302521008403361,
"eval_deepset_1_loss": 2.0135045051574707,
"eval_deepset_1_matthews_correlation": 0.43404618683091417,
"eval_deepset_1_runtime": 1.0652,
"eval_deepset_1_samples_per_second": 111.718,
"eval_deepset_1_steps_per_second": 7.51,
"step": 1500
},
{
"epoch": 0.08,
"eval_deepset_2_accuracy": 0.7115384615384616,
"eval_deepset_2_loss": 1.3997838497161865,
"eval_deepset_2_matthews_correlation": 0.5105532533477752,
"eval_deepset_2_runtime": 1.5611,
"eval_deepset_2_samples_per_second": 99.928,
"eval_deepset_2_steps_per_second": 6.406,
"step": 1500
},
{
"epoch": 0.08,
"eval_deepset_3_accuracy": 0.6676300578034682,
"eval_deepset_3_loss": 1.5432208776474,
"eval_deepset_3_matthews_correlation": 0.42876096695199906,
"eval_deepset_3_runtime": 3.0533,
"eval_deepset_3_samples_per_second": 113.322,
"eval_deepset_3_steps_per_second": 7.205,
"step": 1500
},
{
"epoch": 0.08,
"eval_deepset_4_accuracy": 0.6359223300970874,
"eval_deepset_4_loss": 1.9390015602111816,
"eval_deepset_4_matthews_correlation": 0.4108775577859797,
"eval_deepset_4_runtime": 1.7173,
"eval_deepset_4_samples_per_second": 119.953,
"eval_deepset_4_steps_per_second": 7.57,
"step": 1500
},
{
"epoch": 0.08,
"eval_anli_accuracy": 0.609,
"eval_anli_loss": 1.042230486869812,
"eval_anli_matthews_correlation": 0.42100205280404024,
"eval_anli_runtime": 5.1501,
"eval_anli_samples_per_second": 194.17,
"eval_anli_steps_per_second": 12.233,
"step": 1500
}
],
"max_steps": 18955,
"num_train_epochs": 1,
"total_flos": 2.042867740823347e+16,
"trial_name": null,
"trial_params": null
}