diff --git "a/trainer_state.json" "b/trainer_state.json" --- "a/trainer_state.json" +++ "b/trainer_state.json" @@ -1,254440 +1,16816 @@ { "best_metric": null, "best_model_checkpoint": null, - "epoch": 0.9992431561435143, - "global_step": 573000, + "epoch": 0.9994610049580405, + "global_step": 280000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, - "learning_rate": 4.9956403003658664e-05, - "loss": 6.6229, - "step": 500 - }, - { - "epoch": 0.0, - "learning_rate": 4.991280600731732e-05, - "loss": 5.5184, - "step": 1000 - }, - { - "epoch": 0.0, - "learning_rate": 4.986920901097598e-05, - "loss": 5.1215, - "step": 1500 - }, - { - "epoch": 0.0, - "learning_rate": 4.982561201463464e-05, - "loss": 4.8658, - "step": 2000 - }, - { - "epoch": 0.0, - "learning_rate": 4.97820150182933e-05, - "loss": 4.6479, - "step": 2500 - }, - { - "epoch": 0.01, - "learning_rate": 4.973841802195196e-05, - "loss": 4.5154, - "step": 3000 - }, - { - "epoch": 0.01, - "learning_rate": 4.969482102561062e-05, - "loss": 4.3856, - "step": 3500 - }, - { - "epoch": 0.01, - "learning_rate": 4.965122402926928e-05, - "loss": 4.2794, - "step": 4000 - }, - { - "epoch": 0.01, - "learning_rate": 4.960762703292794e-05, - "loss": 4.1869, - "step": 4500 - }, - { - "epoch": 0.01, - "learning_rate": 4.95640300365866e-05, - "loss": 4.1061, - "step": 5000 - }, - { - "epoch": 0.01, - "learning_rate": 4.9520433040245264e-05, - "loss": 4.0322, - "step": 5500 - }, - { - "epoch": 0.01, - "learning_rate": 4.9476836043903926e-05, - "loss": 3.9469, - "step": 6000 - }, - { - "epoch": 0.01, - "learning_rate": 4.943323904756258e-05, - "loss": 3.8693, - "step": 6500 - }, - { - "epoch": 0.01, - "learning_rate": 4.938964205122124e-05, - "loss": 3.8154, - "step": 7000 - }, - { - "epoch": 0.01, - "learning_rate": 4.93460450548799e-05, - "loss": 3.7452, - "step": 7500 - }, - { - "epoch": 0.01, - "learning_rate": 4.9302448058538564e-05, - "loss": 3.6877, - "step": 8000 - }, - { - "epoch": 0.01, - "learning_rate": 4.925885106219722e-05, - "loss": 3.6377, - "step": 8500 - }, - { - "epoch": 0.02, - "learning_rate": 4.921525406585588e-05, - "loss": 3.5988, - "step": 9000 - }, - { - "epoch": 0.02, - "learning_rate": 4.917165706951454e-05, - "loss": 3.5531, - "step": 9500 - }, - { - "epoch": 0.02, - "learning_rate": 4.9128060073173196e-05, - "loss": 3.5133, - "step": 10000 - }, - { - "epoch": 0.02, - "learning_rate": 4.908446307683186e-05, - "loss": 3.4781, - "step": 10500 - }, - { - "epoch": 0.02, - "learning_rate": 4.904086608049052e-05, - "loss": 3.4556, - "step": 11000 - }, - { - "epoch": 0.02, - "learning_rate": 4.899726908414918e-05, - "loss": 3.4205, - "step": 11500 - }, - { - "epoch": 0.02, - "learning_rate": 4.895367208780784e-05, - "loss": 3.4049, - "step": 12000 - }, - { - "epoch": 0.02, - "learning_rate": 4.89100750914665e-05, - "loss": 3.3677, - "step": 12500 - }, - { - "epoch": 0.02, - "learning_rate": 4.8866478095125165e-05, - "loss": 3.3676, - "step": 13000 - }, - { - "epoch": 0.02, - "learning_rate": 4.882288109878382e-05, - "loss": 3.3316, - "step": 13500 - }, - { - "epoch": 0.02, - "learning_rate": 4.877928410244248e-05, - "loss": 3.3093, - "step": 14000 - }, - { - "epoch": 0.03, - "learning_rate": 4.873568710610114e-05, - "loss": 3.311, - "step": 14500 - }, - { - "epoch": 0.03, - "learning_rate": 4.8692090109759803e-05, - "loss": 3.248, - "step": 15000 - }, - { - "epoch": 0.03, - "learning_rate": 4.864849311341846e-05, - "loss": 3.258, - "step": 15500 - }, - { - "epoch": 0.03, - "learning_rate": 4.860489611707712e-05, - "loss": 3.2311, - "step": 16000 - }, - { - "epoch": 0.03, - "learning_rate": 4.856129912073578e-05, - "loss": 3.2173, - "step": 16500 - }, - { - "epoch": 0.03, - "learning_rate": 4.8517702124394435e-05, - "loss": 3.2002, - "step": 17000 - }, - { - "epoch": 0.03, - "learning_rate": 4.84741051280531e-05, - "loss": 3.1813, - "step": 17500 - }, - { - "epoch": 0.03, - "learning_rate": 4.843050813171176e-05, - "loss": 3.1847, - "step": 18000 - }, - { - "epoch": 0.03, - "learning_rate": 4.838691113537042e-05, - "loss": 3.1575, - "step": 18500 - }, - { - "epoch": 0.03, - "learning_rate": 4.834331413902908e-05, - "loss": 3.1634, - "step": 19000 - }, - { - "epoch": 0.03, - "learning_rate": 4.829971714268774e-05, - "loss": 3.1104, - "step": 19500 - }, - { - "epoch": 0.03, - "learning_rate": 4.8256120146346404e-05, - "loss": 3.1243, - "step": 20000 - }, - { - "epoch": 0.04, - "learning_rate": 4.8212523150005065e-05, - "loss": 3.1088, - "step": 20500 - }, - { - "epoch": 0.04, - "learning_rate": 4.816892615366372e-05, - "loss": 3.1038, - "step": 21000 - }, - { - "epoch": 0.04, - "learning_rate": 4.812532915732238e-05, - "loss": 3.0727, - "step": 21500 - }, - { - "epoch": 0.04, - "learning_rate": 4.808173216098104e-05, - "loss": 3.0702, - "step": 22000 - }, - { - "epoch": 0.04, - "learning_rate": 4.80381351646397e-05, - "loss": 3.0794, - "step": 22500 - }, - { - "epoch": 0.04, - "learning_rate": 4.799453816829836e-05, - "loss": 3.0593, - "step": 23000 - }, - { - "epoch": 0.04, - "learning_rate": 4.795094117195702e-05, - "loss": 3.044, - "step": 23500 - }, - { - "epoch": 0.04, - "learning_rate": 4.790734417561568e-05, - "loss": 3.0237, - "step": 24000 - }, - { - "epoch": 0.04, - "learning_rate": 4.7863747179274336e-05, - "loss": 3.0296, - "step": 24500 - }, - { - "epoch": 0.04, - "learning_rate": 4.7820150182933e-05, - "loss": 3.024, - "step": 25000 - }, - { - "epoch": 0.04, - "learning_rate": 4.777655318659166e-05, - "loss": 3.0292, - "step": 25500 - }, - { - "epoch": 0.05, - "learning_rate": 4.773295619025031e-05, - "loss": 3.006, - "step": 26000 - }, - { - "epoch": 0.05, - "learning_rate": 4.7689359193908975e-05, - "loss": 2.996, - "step": 26500 - }, - { - "epoch": 0.05, - "learning_rate": 4.7645762197567636e-05, - "loss": 2.9869, - "step": 27000 - }, - { - "epoch": 0.05, - "learning_rate": 4.76021652012263e-05, - "loss": 2.9667, - "step": 27500 - }, - { - "epoch": 0.05, - "learning_rate": 4.755856820488496e-05, - "loss": 2.9537, - "step": 28000 - }, - { - "epoch": 0.05, - "learning_rate": 4.751497120854362e-05, - "loss": 2.9679, - "step": 28500 - }, - { - "epoch": 0.05, - "learning_rate": 4.747137421220228e-05, - "loss": 2.9606, - "step": 29000 - }, - { - "epoch": 0.05, - "learning_rate": 4.7427777215860936e-05, - "loss": 2.9225, - "step": 29500 - }, - { - "epoch": 0.05, - "learning_rate": 4.73841802195196e-05, - "loss": 2.9253, - "step": 30000 - }, - { - "epoch": 0.05, - "learning_rate": 4.734058322317826e-05, - "loss": 2.945, - "step": 30500 - }, - { - "epoch": 0.05, - "learning_rate": 4.729698622683692e-05, - "loss": 2.9421, - "step": 31000 - }, - { - "epoch": 0.05, - "learning_rate": 4.7253389230495575e-05, - "loss": 2.9291, - "step": 31500 - }, - { - "epoch": 0.06, - "learning_rate": 4.7209792234154237e-05, - "loss": 2.9093, - "step": 32000 - }, - { - "epoch": 0.06, - "learning_rate": 4.71661952378129e-05, - "loss": 2.914, - "step": 32500 - }, - { - "epoch": 0.06, - "learning_rate": 4.712259824147156e-05, - "loss": 2.9038, - "step": 33000 - }, - { - "epoch": 0.06, - "learning_rate": 4.7079001245130214e-05, - "loss": 2.8911, - "step": 33500 - }, - { - "epoch": 0.06, - "learning_rate": 4.7035404248788875e-05, - "loss": 2.8811, - "step": 34000 - }, - { - "epoch": 0.06, - "learning_rate": 4.699180725244754e-05, - "loss": 2.8962, - "step": 34500 - }, - { - "epoch": 0.06, - "learning_rate": 4.69482102561062e-05, - "loss": 2.8896, - "step": 35000 - }, - { - "epoch": 0.06, - "learning_rate": 4.690461325976486e-05, - "loss": 2.886, - "step": 35500 - }, - { - "epoch": 0.06, - "learning_rate": 4.686101626342352e-05, - "loss": 2.8664, - "step": 36000 - }, - { - "epoch": 0.06, - "learning_rate": 4.681741926708218e-05, - "loss": 2.8638, - "step": 36500 - }, - { - "epoch": 0.06, - "learning_rate": 4.677382227074084e-05, - "loss": 2.8561, - "step": 37000 - }, - { - "epoch": 0.07, - "learning_rate": 4.67302252743995e-05, - "loss": 2.8694, - "step": 37500 - }, - { - "epoch": 0.07, - "learning_rate": 4.668662827805816e-05, - "loss": 2.8585, - "step": 38000 - }, - { - "epoch": 0.07, - "learning_rate": 4.6643031281716814e-05, - "loss": 2.8377, - "step": 38500 - }, - { - "epoch": 0.07, - "learning_rate": 4.6599434285375476e-05, - "loss": 2.8471, - "step": 39000 - }, - { - "epoch": 0.07, - "learning_rate": 4.655583728903414e-05, - "loss": 2.855, - "step": 39500 - }, - { - "epoch": 0.07, - "learning_rate": 4.65122402926928e-05, - "loss": 2.8583, - "step": 40000 - }, - { - "epoch": 0.07, - "learning_rate": 4.646864329635145e-05, - "loss": 2.8162, - "step": 40500 - }, - { - "epoch": 0.07, - "learning_rate": 4.6425046300010114e-05, - "loss": 2.8341, - "step": 41000 - }, - { - "epoch": 0.07, - "learning_rate": 4.6381449303668776e-05, - "loss": 2.8176, - "step": 41500 - }, - { - "epoch": 0.07, - "learning_rate": 4.633785230732744e-05, - "loss": 2.8046, - "step": 42000 - }, - { - "epoch": 0.07, - "learning_rate": 4.62942553109861e-05, - "loss": 2.8167, - "step": 42500 - }, - { - "epoch": 0.07, - "learning_rate": 4.625065831464476e-05, - "loss": 2.7942, - "step": 43000 - }, - { - "epoch": 0.08, - "learning_rate": 4.620706131830342e-05, - "loss": 2.8192, - "step": 43500 - }, - { - "epoch": 0.08, - "learning_rate": 4.6163464321962076e-05, - "loss": 2.8207, - "step": 44000 - }, - { - "epoch": 0.08, - "learning_rate": 4.611986732562074e-05, - "loss": 2.7887, - "step": 44500 - }, - { - "epoch": 0.08, - "learning_rate": 4.60762703292794e-05, - "loss": 2.8046, - "step": 45000 - }, - { - "epoch": 0.08, - "learning_rate": 4.603267333293806e-05, - "loss": 2.7617, - "step": 45500 - }, - { - "epoch": 0.08, - "learning_rate": 4.5989076336596715e-05, - "loss": 2.7807, - "step": 46000 - }, - { - "epoch": 0.08, - "learning_rate": 4.5945479340255376e-05, - "loss": 2.7942, - "step": 46500 - }, - { - "epoch": 0.08, - "learning_rate": 4.590188234391404e-05, - "loss": 2.7787, - "step": 47000 - }, - { - "epoch": 0.08, - "learning_rate": 4.585828534757269e-05, - "loss": 2.7708, - "step": 47500 - }, - { - "epoch": 0.08, - "learning_rate": 4.5814688351231354e-05, - "loss": 2.7828, - "step": 48000 - }, - { - "epoch": 0.08, - "learning_rate": 4.5771091354890015e-05, - "loss": 2.7828, - "step": 48500 - }, - { - "epoch": 0.09, - "learning_rate": 4.5727494358548676e-05, - "loss": 2.7639, - "step": 49000 - }, - { - "epoch": 0.09, - "learning_rate": 4.568389736220733e-05, - "loss": 2.7538, - "step": 49500 - }, - { - "epoch": 0.09, - "learning_rate": 4.564030036586599e-05, - "loss": 2.7618, - "step": 50000 - }, - { - "epoch": 0.09, - "learning_rate": 4.5596703369524654e-05, - "loss": 2.7534, - "step": 50500 - }, - { - "epoch": 0.09, - "learning_rate": 4.5553106373183315e-05, - "loss": 2.759, - "step": 51000 - }, - { - "epoch": 0.09, - "learning_rate": 4.5509509376841977e-05, - "loss": 2.7616, - "step": 51500 - }, - { - "epoch": 0.09, - "learning_rate": 4.546591238050064e-05, - "loss": 2.7393, - "step": 52000 - }, - { - "epoch": 0.09, - "learning_rate": 4.54223153841593e-05, - "loss": 2.7513, - "step": 52500 - }, - { - "epoch": 0.09, - "learning_rate": 4.5378718387817954e-05, - "loss": 2.7386, - "step": 53000 - }, - { - "epoch": 0.09, - "learning_rate": 4.5335121391476615e-05, - "loss": 2.7542, - "step": 53500 - }, - { - "epoch": 0.09, - "learning_rate": 4.529152439513528e-05, - "loss": 2.7503, - "step": 54000 - }, - { - "epoch": 0.1, - "learning_rate": 4.524792739879393e-05, - "loss": 2.7396, - "step": 54500 - }, - { - "epoch": 0.1, - "learning_rate": 4.520433040245259e-05, - "loss": 2.7056, - "step": 55000 - }, - { - "epoch": 0.1, - "learning_rate": 4.5160733406111254e-05, - "loss": 2.7219, - "step": 55500 - }, - { - "epoch": 0.1, - "learning_rate": 4.5117136409769915e-05, - "loss": 2.7176, - "step": 56000 - }, - { - "epoch": 0.1, - "learning_rate": 4.507353941342857e-05, - "loss": 2.7235, - "step": 56500 - }, - { - "epoch": 0.1, - "learning_rate": 4.502994241708723e-05, - "loss": 2.7279, - "step": 57000 - }, - { - "epoch": 0.1, - "learning_rate": 4.498634542074589e-05, - "loss": 2.7177, - "step": 57500 - }, - { - "epoch": 0.1, - "learning_rate": 4.4942748424404554e-05, - "loss": 2.7252, - "step": 58000 - }, - { - "epoch": 0.1, - "learning_rate": 4.4899151428063216e-05, - "loss": 2.7003, - "step": 58500 - }, - { - "epoch": 0.1, - "learning_rate": 4.485555443172188e-05, - "loss": 2.7073, - "step": 59000 - }, - { - "epoch": 0.1, - "learning_rate": 4.481195743538054e-05, - "loss": 2.6908, - "step": 59500 - }, - { - "epoch": 0.1, - "learning_rate": 4.476836043903919e-05, - "loss": 2.7133, - "step": 60000 - }, - { - "epoch": 0.11, - "learning_rate": 4.4724763442697854e-05, - "loss": 2.7251, - "step": 60500 - }, - { - "epoch": 0.11, - "learning_rate": 4.4681166446356516e-05, - "loss": 2.6973, - "step": 61000 - }, - { - "epoch": 0.11, - "learning_rate": 4.463756945001518e-05, - "loss": 2.7148, - "step": 61500 - }, - { - "epoch": 0.11, - "learning_rate": 4.459397245367383e-05, - "loss": 2.6953, - "step": 62000 - }, - { - "epoch": 0.11, - "learning_rate": 4.455037545733249e-05, - "loss": 2.6877, - "step": 62500 - }, - { - "epoch": 0.11, - "learning_rate": 4.4506778460991155e-05, - "loss": 2.7098, - "step": 63000 - }, - { - "epoch": 0.11, - "learning_rate": 4.446318146464981e-05, - "loss": 2.6791, - "step": 63500 - }, - { - "epoch": 0.11, - "learning_rate": 4.441958446830847e-05, - "loss": 2.688, - "step": 64000 - }, - { - "epoch": 0.11, - "learning_rate": 4.437598747196713e-05, - "loss": 2.6947, - "step": 64500 - }, - { - "epoch": 0.11, - "learning_rate": 4.4332390475625793e-05, - "loss": 2.6871, - "step": 65000 - }, - { - "epoch": 0.11, - "learning_rate": 4.4288793479284455e-05, - "loss": 2.6713, - "step": 65500 - }, - { - "epoch": 0.12, - "learning_rate": 4.4245196482943116e-05, - "loss": 2.6781, - "step": 66000 - }, - { - "epoch": 0.12, - "learning_rate": 4.420159948660178e-05, - "loss": 2.6799, - "step": 66500 - }, - { - "epoch": 0.12, - "learning_rate": 4.415800249026043e-05, - "loss": 2.6627, - "step": 67000 - }, - { - "epoch": 0.12, - "learning_rate": 4.4114405493919094e-05, - "loss": 2.6837, - "step": 67500 - }, - { - "epoch": 0.12, - "learning_rate": 4.4070808497577755e-05, - "loss": 2.6745, - "step": 68000 - }, - { - "epoch": 0.12, - "learning_rate": 4.4027211501236416e-05, - "loss": 2.6741, - "step": 68500 - }, - { - "epoch": 0.12, - "learning_rate": 4.398361450489507e-05, - "loss": 2.6666, - "step": 69000 - }, - { - "epoch": 0.12, - "learning_rate": 4.394001750855373e-05, - "loss": 2.6748, - "step": 69500 - }, - { - "epoch": 0.12, - "learning_rate": 4.3896420512212394e-05, - "loss": 2.6532, - "step": 70000 - }, - { - "epoch": 0.12, - "learning_rate": 4.3852823515871055e-05, - "loss": 2.6596, - "step": 70500 - }, - { - "epoch": 0.12, - "learning_rate": 4.380922651952971e-05, - "loss": 2.6524, - "step": 71000 - }, - { - "epoch": 0.12, - "learning_rate": 4.376562952318837e-05, - "loss": 2.64, - "step": 71500 - }, - { - "epoch": 0.13, - "learning_rate": 4.372203252684703e-05, - "loss": 2.6664, - "step": 72000 - }, - { - "epoch": 0.13, - "learning_rate": 4.367843553050569e-05, - "loss": 2.6496, - "step": 72500 - }, - { - "epoch": 0.13, - "learning_rate": 4.363483853416435e-05, - "loss": 2.6401, - "step": 73000 - }, - { - "epoch": 0.13, - "learning_rate": 4.359124153782301e-05, - "loss": 2.6422, - "step": 73500 - }, - { - "epoch": 0.13, - "learning_rate": 4.354764454148167e-05, - "loss": 2.6466, - "step": 74000 - }, - { - "epoch": 0.13, - "learning_rate": 4.350404754514033e-05, - "loss": 2.6331, - "step": 74500 - }, - { - "epoch": 0.13, - "learning_rate": 4.3460450548798994e-05, - "loss": 2.6435, - "step": 75000 - }, - { - "epoch": 0.13, - "learning_rate": 4.3416853552457656e-05, - "loss": 2.6557, - "step": 75500 - }, - { - "epoch": 0.13, - "learning_rate": 4.337325655611631e-05, - "loss": 2.6306, - "step": 76000 - }, - { - "epoch": 0.13, - "learning_rate": 4.332965955977497e-05, - "loss": 2.631, - "step": 76500 - }, - { - "epoch": 0.13, - "learning_rate": 4.328606256343363e-05, - "loss": 2.6575, - "step": 77000 - }, - { - "epoch": 0.14, - "learning_rate": 4.3242465567092294e-05, - "loss": 2.6436, - "step": 77500 - }, - { - "epoch": 0.14, - "learning_rate": 4.319886857075095e-05, - "loss": 2.6248, - "step": 78000 - }, - { - "epoch": 0.14, - "learning_rate": 4.315527157440961e-05, - "loss": 2.6213, - "step": 78500 - }, - { - "epoch": 0.14, - "learning_rate": 4.311167457806827e-05, - "loss": 2.6431, - "step": 79000 - }, - { - "epoch": 0.14, - "learning_rate": 4.3068077581726926e-05, - "loss": 2.6397, - "step": 79500 - }, - { - "epoch": 0.14, - "learning_rate": 4.302448058538559e-05, - "loss": 2.6158, - "step": 80000 - }, - { - "epoch": 0.14, - "learning_rate": 4.298088358904425e-05, - "loss": 2.6327, - "step": 80500 - }, - { - "epoch": 0.14, - "learning_rate": 4.293728659270291e-05, - "loss": 2.6201, - "step": 81000 - }, - { - "epoch": 0.14, - "learning_rate": 4.289368959636157e-05, - "loss": 2.6227, - "step": 81500 - }, - { - "epoch": 0.14, - "learning_rate": 4.285009260002023e-05, - "loss": 2.6222, - "step": 82000 - }, - { - "epoch": 0.14, - "learning_rate": 4.2806495603678895e-05, - "loss": 2.6215, - "step": 82500 - }, - { - "epoch": 0.14, - "learning_rate": 4.276289860733755e-05, - "loss": 2.6115, - "step": 83000 - }, - { - "epoch": 0.15, - "learning_rate": 4.271930161099621e-05, - "loss": 2.6067, - "step": 83500 - }, - { - "epoch": 0.15, - "learning_rate": 4.267570461465487e-05, - "loss": 2.6234, - "step": 84000 - }, - { - "epoch": 0.15, - "learning_rate": 4.2632107618313533e-05, - "loss": 2.6084, - "step": 84500 - }, - { - "epoch": 0.15, - "learning_rate": 4.258851062197219e-05, - "loss": 2.6051, - "step": 85000 - }, - { - "epoch": 0.15, - "learning_rate": 4.254491362563085e-05, - "loss": 2.6035, - "step": 85500 - }, - { - "epoch": 0.15, - "learning_rate": 4.250131662928951e-05, - "loss": 2.6023, - "step": 86000 - }, - { - "epoch": 0.15, - "learning_rate": 4.245771963294817e-05, - "loss": 2.5975, - "step": 86500 - }, - { - "epoch": 0.15, - "learning_rate": 4.241412263660683e-05, - "loss": 2.5987, - "step": 87000 - }, - { - "epoch": 0.15, - "learning_rate": 4.237052564026549e-05, - "loss": 2.5887, - "step": 87500 - }, - { - "epoch": 0.15, - "learning_rate": 4.232692864392415e-05, - "loss": 2.617, - "step": 88000 - }, - { - "epoch": 0.15, - "learning_rate": 4.228333164758281e-05, - "loss": 2.5967, - "step": 88500 - }, - { - "epoch": 0.16, - "learning_rate": 4.223973465124147e-05, - "loss": 2.6002, - "step": 89000 - }, - { - "epoch": 0.16, - "learning_rate": 4.2196137654900134e-05, - "loss": 2.5859, - "step": 89500 - }, - { - "epoch": 0.16, - "learning_rate": 4.2152540658558795e-05, - "loss": 2.605, - "step": 90000 - }, - { - "epoch": 0.16, - "learning_rate": 4.210894366221745e-05, - "loss": 2.5834, - "step": 90500 - }, - { - "epoch": 0.16, - "learning_rate": 4.206534666587611e-05, - "loss": 2.5869, - "step": 91000 - }, - { - "epoch": 0.16, - "learning_rate": 4.202174966953477e-05, - "loss": 2.5856, - "step": 91500 - }, - { - "epoch": 0.16, - "learning_rate": 4.197815267319343e-05, - "loss": 2.5791, - "step": 92000 - }, - { - "epoch": 0.16, - "learning_rate": 4.193455567685209e-05, - "loss": 2.5899, - "step": 92500 - }, - { - "epoch": 0.16, - "learning_rate": 4.189095868051075e-05, - "loss": 2.5982, - "step": 93000 - }, - { - "epoch": 0.16, - "learning_rate": 4.184736168416941e-05, - "loss": 2.5828, - "step": 93500 - }, - { - "epoch": 0.16, - "learning_rate": 4.1803764687828066e-05, - "loss": 2.5874, - "step": 94000 - }, - { - "epoch": 0.16, - "learning_rate": 4.176016769148673e-05, - "loss": 2.5749, - "step": 94500 - }, - { - "epoch": 0.17, - "learning_rate": 4.171657069514539e-05, - "loss": 2.5809, - "step": 95000 - }, - { - "epoch": 0.17, - "learning_rate": 4.167297369880404e-05, - "loss": 2.5824, - "step": 95500 - }, - { - "epoch": 0.17, - "learning_rate": 4.1629376702462705e-05, - "loss": 2.584, - "step": 96000 - }, - { - "epoch": 0.17, - "learning_rate": 4.1585779706121366e-05, - "loss": 2.5837, - "step": 96500 - }, - { - "epoch": 0.17, - "learning_rate": 4.154218270978003e-05, - "loss": 2.5784, - "step": 97000 - }, - { - "epoch": 0.17, - "learning_rate": 4.149858571343869e-05, - "loss": 2.5895, - "step": 97500 - }, - { - "epoch": 0.17, - "learning_rate": 4.145498871709735e-05, - "loss": 2.571, - "step": 98000 - }, - { - "epoch": 0.17, - "learning_rate": 4.141139172075601e-05, - "loss": 2.5712, - "step": 98500 - }, - { - "epoch": 0.17, - "learning_rate": 4.136779472441467e-05, - "loss": 2.5636, - "step": 99000 - }, - { - "epoch": 0.17, - "learning_rate": 4.132419772807333e-05, - "loss": 2.5699, - "step": 99500 - }, - { - "epoch": 0.17, - "learning_rate": 4.128060073173199e-05, - "loss": 2.5768, - "step": 100000 - }, - { - "epoch": 0.18, - "learning_rate": 4.123700373539065e-05, - "loss": 2.5644, - "step": 100500 - }, - { - "epoch": 0.18, - "learning_rate": 4.1193406739049305e-05, - "loss": 2.5699, - "step": 101000 - }, - { - "epoch": 0.18, - "learning_rate": 4.1149809742707966e-05, - "loss": 2.5651, - "step": 101500 - }, - { - "epoch": 0.18, - "learning_rate": 4.110621274636663e-05, - "loss": 2.5625, - "step": 102000 - }, - { - "epoch": 0.18, - "learning_rate": 4.106261575002529e-05, - "loss": 2.5617, - "step": 102500 - }, - { - "epoch": 0.18, - "learning_rate": 4.1019018753683944e-05, - "loss": 2.5593, - "step": 103000 - }, - { - "epoch": 0.18, - "learning_rate": 4.0975421757342605e-05, - "loss": 2.5751, - "step": 103500 - }, - { - "epoch": 0.18, - "learning_rate": 4.093182476100127e-05, - "loss": 2.554, - "step": 104000 - }, - { - "epoch": 0.18, - "learning_rate": 4.088822776465993e-05, - "loss": 2.5473, - "step": 104500 - }, - { - "epoch": 0.18, - "learning_rate": 4.084463076831859e-05, - "loss": 2.5546, - "step": 105000 - }, - { - "epoch": 0.18, - "learning_rate": 4.080103377197725e-05, - "loss": 2.5567, - "step": 105500 - }, - { - "epoch": 0.18, - "learning_rate": 4.075743677563591e-05, - "loss": 2.5422, - "step": 106000 - }, - { - "epoch": 0.19, - "learning_rate": 4.071383977929457e-05, - "loss": 2.5428, - "step": 106500 - }, - { - "epoch": 0.19, - "learning_rate": 4.067024278295323e-05, - "loss": 2.5522, - "step": 107000 - }, - { - "epoch": 0.19, - "learning_rate": 4.062664578661189e-05, - "loss": 2.5447, - "step": 107500 - }, - { - "epoch": 0.19, - "learning_rate": 4.0583048790270544e-05, - "loss": 2.5577, - "step": 108000 - }, - { - "epoch": 0.19, - "learning_rate": 4.0539451793929206e-05, - "loss": 2.5512, - "step": 108500 - }, - { - "epoch": 0.19, - "learning_rate": 4.049585479758787e-05, - "loss": 2.5744, - "step": 109000 - }, - { - "epoch": 0.19, - "learning_rate": 4.045225780124653e-05, - "loss": 2.5468, - "step": 109500 - }, - { - "epoch": 0.19, - "learning_rate": 4.040866080490518e-05, - "loss": 2.5397, - "step": 110000 - }, - { - "epoch": 0.19, - "learning_rate": 4.0365063808563844e-05, - "loss": 2.5598, - "step": 110500 - }, - { - "epoch": 0.19, - "learning_rate": 4.0321466812222506e-05, - "loss": 2.5554, - "step": 111000 - }, - { - "epoch": 0.19, - "learning_rate": 4.027786981588117e-05, - "loss": 2.545, - "step": 111500 - }, - { - "epoch": 0.2, - "learning_rate": 4.023427281953983e-05, - "loss": 2.5403, - "step": 112000 - }, - { - "epoch": 0.2, - "learning_rate": 4.019067582319849e-05, - "loss": 2.5293, - "step": 112500 - }, - { - "epoch": 0.2, - "learning_rate": 4.014707882685715e-05, - "loss": 2.557, - "step": 113000 - }, - { - "epoch": 0.2, - "learning_rate": 4.0103481830515806e-05, - "loss": 2.5597, - "step": 113500 - }, - { - "epoch": 0.2, - "learning_rate": 4.005988483417447e-05, - "loss": 2.5351, - "step": 114000 - }, - { - "epoch": 0.2, - "learning_rate": 4.001628783783313e-05, - "loss": 2.5318, - "step": 114500 - }, - { - "epoch": 0.2, - "learning_rate": 3.997269084149179e-05, - "loss": 2.5601, - "step": 115000 - }, - { - "epoch": 0.2, - "learning_rate": 3.9929093845150445e-05, - "loss": 2.5203, - "step": 115500 - }, - { - "epoch": 0.2, - "learning_rate": 3.9885496848809106e-05, - "loss": 2.5251, - "step": 116000 - }, - { - "epoch": 0.2, - "learning_rate": 3.984189985246777e-05, - "loss": 2.5424, - "step": 116500 - }, - { - "epoch": 0.2, - "learning_rate": 3.979830285612642e-05, - "loss": 2.5324, - "step": 117000 - }, - { - "epoch": 0.2, - "learning_rate": 3.9754705859785084e-05, - "loss": 2.5238, - "step": 117500 - }, - { - "epoch": 0.21, - "learning_rate": 3.9711108863443745e-05, - "loss": 2.5231, - "step": 118000 - }, - { - "epoch": 0.21, - "learning_rate": 3.9667511867102406e-05, - "loss": 2.5361, - "step": 118500 - }, - { - "epoch": 0.21, - "learning_rate": 3.962391487076106e-05, - "loss": 2.5367, - "step": 119000 - }, - { - "epoch": 0.21, - "learning_rate": 3.958031787441972e-05, - "loss": 2.5504, - "step": 119500 - }, - { - "epoch": 0.21, - "learning_rate": 3.9536720878078384e-05, - "loss": 2.5164, - "step": 120000 - }, - { - "epoch": 0.21, - "learning_rate": 3.9493123881737045e-05, - "loss": 2.5362, - "step": 120500 - }, - { - "epoch": 0.21, - "learning_rate": 3.9449526885395707e-05, - "loss": 2.5249, - "step": 121000 - }, - { - "epoch": 0.21, - "learning_rate": 3.940592988905437e-05, - "loss": 2.5258, - "step": 121500 - }, - { - "epoch": 0.21, - "learning_rate": 3.936233289271303e-05, - "loss": 2.5254, - "step": 122000 - }, - { - "epoch": 0.21, - "learning_rate": 3.9318735896371684e-05, - "loss": 2.5352, - "step": 122500 - }, - { - "epoch": 0.21, - "learning_rate": 3.9275138900030345e-05, - "loss": 2.516, - "step": 123000 - }, - { - "epoch": 0.22, - "learning_rate": 3.923154190368901e-05, - "loss": 2.5314, - "step": 123500 - }, - { - "epoch": 0.22, - "learning_rate": 3.918794490734767e-05, - "loss": 2.5212, - "step": 124000 - }, - { - "epoch": 0.22, - "learning_rate": 3.914434791100632e-05, - "loss": 2.5217, - "step": 124500 - }, - { - "epoch": 0.22, - "learning_rate": 3.9100750914664984e-05, - "loss": 2.5368, - "step": 125000 - }, - { - "epoch": 0.22, - "learning_rate": 3.9057153918323645e-05, - "loss": 2.5083, - "step": 125500 - }, - { - "epoch": 0.22, - "learning_rate": 3.90135569219823e-05, - "loss": 2.5115, - "step": 126000 - }, - { - "epoch": 0.22, - "learning_rate": 3.896995992564096e-05, - "loss": 2.5327, - "step": 126500 - }, - { - "epoch": 0.22, - "learning_rate": 3.892636292929962e-05, - "loss": 2.4913, - "step": 127000 - }, - { - "epoch": 0.22, - "learning_rate": 3.8882765932958284e-05, - "loss": 2.4975, - "step": 127500 - }, - { - "epoch": 0.22, - "learning_rate": 3.8839168936616946e-05, - "loss": 2.511, - "step": 128000 - }, - { - "epoch": 0.22, - "learning_rate": 3.879557194027561e-05, - "loss": 2.5149, - "step": 128500 - }, - { - "epoch": 0.22, - "learning_rate": 3.875197494393427e-05, - "loss": 2.502, - "step": 129000 - }, - { - "epoch": 0.23, - "learning_rate": 3.870837794759292e-05, - "loss": 2.4992, - "step": 129500 - }, - { - "epoch": 0.23, - "learning_rate": 3.8664780951251584e-05, - "loss": 2.5071, - "step": 130000 - }, - { - "epoch": 0.23, - "learning_rate": 3.8621183954910246e-05, - "loss": 2.5123, - "step": 130500 - }, - { - "epoch": 0.23, - "learning_rate": 3.857758695856891e-05, - "loss": 2.4968, - "step": 131000 - }, - { - "epoch": 0.23, - "learning_rate": 3.853398996222756e-05, - "loss": 2.5091, - "step": 131500 - }, - { - "epoch": 0.23, - "learning_rate": 3.849039296588622e-05, - "loss": 2.5059, - "step": 132000 - }, - { - "epoch": 0.23, - "learning_rate": 3.8446795969544885e-05, - "loss": 2.501, - "step": 132500 - }, - { - "epoch": 0.23, - "learning_rate": 3.840319897320354e-05, - "loss": 2.5034, - "step": 133000 - }, - { - "epoch": 0.23, - "learning_rate": 3.83596019768622e-05, - "loss": 2.5065, - "step": 133500 - }, - { - "epoch": 0.23, - "learning_rate": 3.831600498052086e-05, - "loss": 2.4937, - "step": 134000 - }, - { - "epoch": 0.23, - "learning_rate": 3.8272407984179523e-05, - "loss": 2.5109, - "step": 134500 - }, - { - "epoch": 0.24, - "learning_rate": 3.8228810987838185e-05, - "loss": 2.4983, - "step": 135000 - }, - { - "epoch": 0.24, - "learning_rate": 3.8185213991496846e-05, - "loss": 2.4944, - "step": 135500 - }, - { - "epoch": 0.24, - "learning_rate": 3.814161699515551e-05, - "loss": 2.4964, - "step": 136000 - }, - { - "epoch": 0.24, - "learning_rate": 3.809801999881417e-05, - "loss": 2.4916, - "step": 136500 - }, - { - "epoch": 0.24, - "learning_rate": 3.8054423002472824e-05, - "loss": 2.5128, - "step": 137000 - }, - { - "epoch": 0.24, - "learning_rate": 3.8010826006131485e-05, - "loss": 2.4886, - "step": 137500 - }, - { - "epoch": 0.24, - "learning_rate": 3.7967229009790146e-05, - "loss": 2.4835, - "step": 138000 - }, - { - "epoch": 0.24, - "learning_rate": 3.79236320134488e-05, - "loss": 2.4954, - "step": 138500 - }, - { - "epoch": 0.24, - "learning_rate": 3.788003501710746e-05, - "loss": 2.4935, - "step": 139000 - }, - { - "epoch": 0.24, - "learning_rate": 3.7836438020766124e-05, - "loss": 2.4825, - "step": 139500 - }, - { - "epoch": 0.24, - "learning_rate": 3.7792841024424785e-05, - "loss": 2.5103, - "step": 140000 - }, - { - "epoch": 0.25, - "learning_rate": 3.774924402808344e-05, - "loss": 2.4995, - "step": 140500 - }, - { - "epoch": 0.25, - "learning_rate": 3.77056470317421e-05, - "loss": 2.4935, - "step": 141000 - }, - { - "epoch": 0.25, - "learning_rate": 3.766205003540076e-05, - "loss": 2.5006, - "step": 141500 - }, - { - "epoch": 0.25, - "learning_rate": 3.761845303905942e-05, - "loss": 2.4913, - "step": 142000 - }, - { - "epoch": 0.25, - "learning_rate": 3.757485604271808e-05, - "loss": 2.4799, - "step": 142500 - }, - { - "epoch": 0.25, - "learning_rate": 3.753125904637674e-05, - "loss": 2.4833, - "step": 143000 - }, - { - "epoch": 0.25, - "learning_rate": 3.748766205003541e-05, - "loss": 2.495, - "step": 143500 - }, - { - "epoch": 0.25, - "learning_rate": 3.744406505369406e-05, - "loss": 2.4815, - "step": 144000 - }, - { - "epoch": 0.25, - "learning_rate": 3.7400468057352724e-05, - "loss": 2.4914, - "step": 144500 - }, - { - "epoch": 0.25, - "learning_rate": 3.7356871061011385e-05, - "loss": 2.4826, - "step": 145000 - }, - { - "epoch": 0.25, - "learning_rate": 3.731327406467004e-05, - "loss": 2.4923, - "step": 145500 - }, - { - "epoch": 0.25, - "learning_rate": 3.72696770683287e-05, - "loss": 2.4838, - "step": 146000 - }, - { - "epoch": 0.26, - "learning_rate": 3.722608007198736e-05, - "loss": 2.4831, - "step": 146500 - }, - { - "epoch": 0.26, - "learning_rate": 3.7182483075646024e-05, - "loss": 2.4867, - "step": 147000 - }, - { - "epoch": 0.26, - "learning_rate": 3.713888607930468e-05, - "loss": 2.4856, - "step": 147500 - }, - { - "epoch": 0.26, - "learning_rate": 3.709528908296334e-05, - "loss": 2.4846, - "step": 148000 - }, - { - "epoch": 0.26, - "learning_rate": 3.7051692086622e-05, - "loss": 2.4948, - "step": 148500 - }, - { - "epoch": 0.26, - "learning_rate": 3.700809509028066e-05, - "loss": 2.4816, - "step": 149000 - }, - { - "epoch": 0.26, - "learning_rate": 3.696449809393932e-05, - "loss": 2.4807, - "step": 149500 - }, - { - "epoch": 0.26, - "learning_rate": 3.692090109759798e-05, - "loss": 2.4847, - "step": 150000 - }, - { - "epoch": 0.26, - "learning_rate": 3.687730410125664e-05, - "loss": 2.4854, - "step": 150500 - }, - { - "epoch": 0.26, - "learning_rate": 3.68337071049153e-05, - "loss": 2.45, - "step": 151000 - }, - { - "epoch": 0.26, - "learning_rate": 3.679011010857396e-05, - "loss": 2.467, - "step": 151500 - }, - { - "epoch": 0.27, - "learning_rate": 3.6746513112232625e-05, - "loss": 2.489, - "step": 152000 - }, - { - "epoch": 0.27, - "learning_rate": 3.6745641172305795e-05, - "loss": 2.4486, - "step": 152010 - }, - { - "epoch": 0.27, - "learning_rate": 3.6744769232378965e-05, - "loss": 2.5418, - "step": 152020 - }, - { - "epoch": 0.27, - "learning_rate": 3.674389729245214e-05, - "loss": 2.487, - "step": 152030 - }, - { - "epoch": 0.27, - "learning_rate": 3.674302535252531e-05, - "loss": 2.5183, - "step": 152040 - }, - { - "epoch": 0.27, - "learning_rate": 3.674215341259849e-05, - "loss": 2.5454, - "step": 152050 - }, - { - "epoch": 0.27, - "learning_rate": 3.674128147267166e-05, - "loss": 2.5318, - "step": 152060 - }, - { - "epoch": 0.27, - "learning_rate": 3.674040953274484e-05, - "loss": 2.6745, - "step": 152070 - }, - { - "epoch": 0.27, - "learning_rate": 3.673953759281801e-05, - "loss": 2.539, - "step": 152080 - }, - { - "epoch": 0.27, - "learning_rate": 3.673866565289118e-05, - "loss": 2.5846, - "step": 152090 - }, - { - "epoch": 0.27, - "learning_rate": 3.6737793712964356e-05, - "loss": 2.4039, - "step": 152100 - }, - { - "epoch": 0.27, - "learning_rate": 3.6736921773037526e-05, - "loss": 2.4249, - "step": 152110 - }, - { - "epoch": 0.27, - "learning_rate": 3.6736049833110696e-05, - "loss": 2.4787, - "step": 152120 - }, - { - "epoch": 0.27, - "learning_rate": 3.6735177893183873e-05, - "loss": 2.5389, - "step": 152130 - }, - { - "epoch": 0.27, - "learning_rate": 3.673430595325705e-05, - "loss": 2.4451, - "step": 152140 - }, - { - "epoch": 0.27, - "learning_rate": 3.673343401333022e-05, - "loss": 2.438, - "step": 152150 - }, - { - "epoch": 0.27, - "learning_rate": 3.673256207340339e-05, - "loss": 2.4797, - "step": 152160 - }, - { - "epoch": 0.27, - "learning_rate": 3.673169013347656e-05, - "loss": 2.531, - "step": 152170 - }, - { - "epoch": 0.27, - "learning_rate": 3.673081819354974e-05, - "loss": 2.4701, - "step": 152180 - }, - { - "epoch": 0.27, - "learning_rate": 3.672994625362291e-05, - "loss": 2.347, - "step": 152190 - }, - { - "epoch": 0.27, - "learning_rate": 3.6729074313696086e-05, - "loss": 2.521, - "step": 152200 - }, - { - "epoch": 0.27, - "learning_rate": 3.6728202373769264e-05, - "loss": 2.4582, - "step": 152210 - }, - { - "epoch": 0.27, - "learning_rate": 3.6727330433842434e-05, - "loss": 2.457, - "step": 152220 - }, - { - "epoch": 0.27, - "learning_rate": 3.6726458493915604e-05, - "loss": 2.4437, - "step": 152230 - }, - { - "epoch": 0.27, - "learning_rate": 3.6725586553988775e-05, - "loss": 2.4435, - "step": 152240 - }, - { - "epoch": 0.27, - "learning_rate": 3.672471461406195e-05, - "loss": 2.5245, - "step": 152250 - }, - { - "epoch": 0.27, - "learning_rate": 3.672384267413512e-05, - "loss": 2.4433, - "step": 152260 - }, - { - "epoch": 0.27, - "learning_rate": 3.672297073420829e-05, - "loss": 2.4936, - "step": 152270 - }, - { - "epoch": 0.27, - "learning_rate": 3.672209879428147e-05, - "loss": 2.3041, - "step": 152280 - }, - { - "epoch": 0.27, - "learning_rate": 3.672122685435465e-05, - "loss": 2.3409, - "step": 152290 - }, - { - "epoch": 0.27, - "learning_rate": 3.672035491442782e-05, - "loss": 2.4557, - "step": 152300 - }, - { - "epoch": 0.27, - "learning_rate": 3.671948297450099e-05, - "loss": 2.4309, - "step": 152310 - }, - { - "epoch": 0.27, - "learning_rate": 3.6718611034574165e-05, - "loss": 2.4952, - "step": 152320 - }, - { - "epoch": 0.27, - "learning_rate": 3.6717739094647335e-05, - "loss": 2.4949, - "step": 152330 - }, - { - "epoch": 0.27, - "learning_rate": 3.6716867154720506e-05, - "loss": 2.4713, - "step": 152340 - }, - { - "epoch": 0.27, - "learning_rate": 3.671599521479368e-05, - "loss": 2.3882, - "step": 152350 - }, - { - "epoch": 0.27, - "learning_rate": 3.671512327486686e-05, - "loss": 2.5458, - "step": 152360 - }, - { - "epoch": 0.27, - "learning_rate": 3.671425133494003e-05, - "loss": 2.5279, - "step": 152370 - }, - { - "epoch": 0.27, - "learning_rate": 3.67133793950132e-05, - "loss": 2.5048, - "step": 152380 - }, - { - "epoch": 0.27, - "learning_rate": 3.671250745508638e-05, - "loss": 2.3942, - "step": 152390 - }, - { - "epoch": 0.27, - "learning_rate": 3.671163551515955e-05, - "loss": 2.5749, - "step": 152400 - }, - { - "epoch": 0.27, - "learning_rate": 3.671076357523272e-05, - "loss": 2.4163, - "step": 152410 - }, - { - "epoch": 0.27, - "learning_rate": 3.6709891635305896e-05, - "loss": 2.5594, - "step": 152420 - }, - { - "epoch": 0.27, - "learning_rate": 3.670901969537907e-05, - "loss": 2.5412, - "step": 152430 - }, - { - "epoch": 0.27, - "learning_rate": 3.6708147755452243e-05, - "loss": 2.4455, - "step": 152440 - }, - { - "epoch": 0.27, - "learning_rate": 3.6707275815525414e-05, - "loss": 2.5134, - "step": 152450 - }, - { - "epoch": 0.27, - "learning_rate": 3.670640387559859e-05, - "loss": 2.4105, - "step": 152460 - }, - { - "epoch": 0.27, - "learning_rate": 3.670553193567176e-05, - "loss": 2.4572, - "step": 152470 - }, - { - "epoch": 0.27, - "learning_rate": 3.670465999574493e-05, - "loss": 2.4765, - "step": 152480 - }, - { - "epoch": 0.27, - "learning_rate": 3.670378805581811e-05, - "loss": 2.5432, - "step": 152490 - }, - { - "epoch": 0.27, - "learning_rate": 3.6702916115891286e-05, - "loss": 2.5638, - "step": 152500 - }, - { - "epoch": 0.27, - "learning_rate": 3.6702044175964456e-05, - "loss": 2.4502, - "step": 152510 - }, - { - "epoch": 0.27, - "learning_rate": 3.670117223603763e-05, - "loss": 2.448, - "step": 152520 - }, - { - "epoch": 0.27, - "learning_rate": 3.6700300296110804e-05, - "loss": 2.4897, - "step": 152530 - }, - { - "epoch": 0.27, - "learning_rate": 3.6699428356183974e-05, - "loss": 2.4653, - "step": 152540 - }, - { - "epoch": 0.27, - "learning_rate": 3.6698556416257145e-05, - "loss": 2.3926, - "step": 152550 - }, - { - "epoch": 0.27, - "learning_rate": 3.6697684476330315e-05, - "loss": 2.3552, - "step": 152560 - }, - { - "epoch": 0.27, - "learning_rate": 3.66968125364035e-05, - "loss": 2.475, - "step": 152570 - }, - { - "epoch": 0.27, - "learning_rate": 3.669594059647667e-05, - "loss": 2.6209, - "step": 152580 - }, - { - "epoch": 0.27, - "learning_rate": 3.669506865654984e-05, - "loss": 2.4461, - "step": 152590 - }, - { - "epoch": 0.27, - "learning_rate": 3.669419671662302e-05, - "loss": 2.4276, - "step": 152600 - }, - { - "epoch": 0.27, - "learning_rate": 3.669332477669619e-05, - "loss": 2.4866, - "step": 152610 - }, - { - "epoch": 0.27, - "learning_rate": 3.669245283676936e-05, - "loss": 2.5518, - "step": 152620 - }, - { - "epoch": 0.27, - "learning_rate": 3.669158089684253e-05, - "loss": 2.4193, - "step": 152630 - }, - { - "epoch": 0.27, - "learning_rate": 3.6690708956915705e-05, - "loss": 2.4557, - "step": 152640 - }, - { - "epoch": 0.27, - "learning_rate": 3.668983701698888e-05, - "loss": 2.5545, - "step": 152650 - }, - { - "epoch": 0.27, - "learning_rate": 3.668896507706205e-05, - "loss": 2.4605, - "step": 152660 - }, - { - "epoch": 0.27, - "learning_rate": 3.668809313713522e-05, - "loss": 2.5508, - "step": 152670 - }, - { - "epoch": 0.27, - "learning_rate": 3.66872211972084e-05, - "loss": 2.3837, - "step": 152680 - }, - { - "epoch": 0.27, - "learning_rate": 3.668634925728157e-05, - "loss": 2.5232, - "step": 152690 - }, - { - "epoch": 0.27, - "learning_rate": 3.668547731735474e-05, - "loss": 2.451, - "step": 152700 - }, - { - "epoch": 0.27, - "learning_rate": 3.668460537742792e-05, - "loss": 2.5399, - "step": 152710 - }, - { - "epoch": 0.27, - "learning_rate": 3.6683733437501095e-05, - "loss": 2.4515, - "step": 152720 - }, - { - "epoch": 0.27, - "learning_rate": 3.6682861497574266e-05, - "loss": 2.523, - "step": 152730 - }, - { - "epoch": 0.27, - "learning_rate": 3.6681989557647436e-05, - "loss": 2.3892, - "step": 152740 - }, - { - "epoch": 0.27, - "learning_rate": 3.668111761772061e-05, - "loss": 2.5305, - "step": 152750 - }, - { - "epoch": 0.27, - "learning_rate": 3.6680245677793784e-05, - "loss": 2.4433, - "step": 152760 - }, - { - "epoch": 0.27, - "learning_rate": 3.6679373737866954e-05, - "loss": 2.2944, - "step": 152770 - }, - { - "epoch": 0.27, - "learning_rate": 3.667850179794013e-05, - "loss": 2.4241, - "step": 152780 - }, - { - "epoch": 0.27, - "learning_rate": 3.66776298580133e-05, - "loss": 2.5217, - "step": 152790 - }, - { - "epoch": 0.27, - "learning_rate": 3.667675791808648e-05, - "loss": 2.4226, - "step": 152800 - }, - { - "epoch": 0.27, - "learning_rate": 3.667588597815965e-05, - "loss": 2.3673, - "step": 152810 - }, - { - "epoch": 0.27, - "learning_rate": 3.6675014038232826e-05, - "loss": 2.446, - "step": 152820 - }, - { - "epoch": 0.27, - "learning_rate": 3.6674142098306e-05, - "loss": 2.5055, - "step": 152830 - }, - { - "epoch": 0.27, - "learning_rate": 3.667327015837917e-05, - "loss": 2.4555, - "step": 152840 - }, - { - "epoch": 0.27, - "learning_rate": 3.6672398218452344e-05, - "loss": 2.3256, - "step": 152850 - }, - { - "epoch": 0.27, - "learning_rate": 3.6671526278525515e-05, - "loss": 2.5913, - "step": 152860 - }, - { - "epoch": 0.27, - "learning_rate": 3.667065433859869e-05, - "loss": 2.5243, - "step": 152870 - }, - { - "epoch": 0.27, - "learning_rate": 3.666978239867186e-05, - "loss": 2.518, - "step": 152880 - }, - { - "epoch": 0.27, - "learning_rate": 3.666891045874504e-05, - "loss": 2.3962, - "step": 152890 - }, - { - "epoch": 0.27, - "learning_rate": 3.666803851881821e-05, - "loss": 2.5183, - "step": 152900 - }, - { - "epoch": 0.27, - "learning_rate": 3.666716657889138e-05, - "loss": 2.4048, - "step": 152910 - }, - { - "epoch": 0.27, - "learning_rate": 3.666629463896456e-05, - "loss": 2.4158, - "step": 152920 - }, - { - "epoch": 0.27, - "learning_rate": 3.666542269903773e-05, - "loss": 2.5343, - "step": 152930 - }, - { - "epoch": 0.27, - "learning_rate": 3.66645507591109e-05, - "loss": 2.5247, - "step": 152940 - }, - { - "epoch": 0.27, - "learning_rate": 3.6663678819184075e-05, - "loss": 2.586, - "step": 152950 - }, - { - "epoch": 0.27, - "learning_rate": 3.666280687925725e-05, - "loss": 2.4529, - "step": 152960 - }, - { - "epoch": 0.27, - "learning_rate": 3.666193493933042e-05, - "loss": 2.4641, - "step": 152970 - }, - { - "epoch": 0.27, - "learning_rate": 3.666106299940359e-05, - "loss": 2.473, - "step": 152980 - }, - { - "epoch": 0.27, - "learning_rate": 3.666019105947677e-05, - "loss": 2.6165, - "step": 152990 - }, - { - "epoch": 0.27, - "learning_rate": 3.665931911954994e-05, - "loss": 2.438, - "step": 153000 - }, - { - "epoch": 0.27, - "learning_rate": 3.665844717962311e-05, - "loss": 2.5722, - "step": 153010 - }, - { - "epoch": 0.27, - "learning_rate": 3.665757523969629e-05, - "loss": 2.3216, - "step": 153020 - }, - { - "epoch": 0.27, - "learning_rate": 3.6656703299769465e-05, - "loss": 2.4708, - "step": 153030 - }, - { - "epoch": 0.27, - "learning_rate": 3.6655831359842636e-05, - "loss": 2.4548, - "step": 153040 - }, - { - "epoch": 0.27, - "learning_rate": 3.6654959419915806e-05, - "loss": 2.553, - "step": 153050 - }, - { - "epoch": 0.27, - "learning_rate": 3.665408747998898e-05, - "loss": 2.3702, - "step": 153060 - }, - { - "epoch": 0.27, - "learning_rate": 3.6653215540062154e-05, - "loss": 2.4696, - "step": 153070 - }, - { - "epoch": 0.27, - "learning_rate": 3.6652343600135324e-05, - "loss": 2.4943, - "step": 153080 - }, - { - "epoch": 0.27, - "learning_rate": 3.6651471660208494e-05, - "loss": 2.4602, - "step": 153090 - }, - { - "epoch": 0.27, - "learning_rate": 3.665059972028168e-05, - "loss": 2.5162, - "step": 153100 - }, - { - "epoch": 0.27, - "learning_rate": 3.664972778035485e-05, - "loss": 2.5272, - "step": 153110 - }, - { - "epoch": 0.27, - "learning_rate": 3.664885584042802e-05, - "loss": 2.5137, - "step": 153120 - }, - { - "epoch": 0.27, - "learning_rate": 3.664798390050119e-05, - "loss": 2.4247, - "step": 153130 - }, - { - "epoch": 0.27, - "learning_rate": 3.664711196057437e-05, - "loss": 2.5762, - "step": 153140 - }, - { - "epoch": 0.27, - "learning_rate": 3.664624002064754e-05, - "loss": 2.3815, - "step": 153150 - }, - { - "epoch": 0.27, - "learning_rate": 3.664536808072071e-05, - "loss": 2.5058, - "step": 153160 - }, - { - "epoch": 0.27, - "learning_rate": 3.664449614079389e-05, - "loss": 2.5451, - "step": 153170 - }, - { - "epoch": 0.27, - "learning_rate": 3.664362420086706e-05, - "loss": 2.4483, - "step": 153180 - }, - { - "epoch": 0.27, - "learning_rate": 3.664275226094023e-05, - "loss": 2.5478, - "step": 153190 - }, - { - "epoch": 0.27, - "learning_rate": 3.66418803210134e-05, - "loss": 2.47, - "step": 153200 - }, - { - "epoch": 0.27, - "learning_rate": 3.664100838108658e-05, - "loss": 2.5263, - "step": 153210 - }, - { - "epoch": 0.27, - "learning_rate": 3.664013644115975e-05, - "loss": 2.4633, - "step": 153220 - }, - { - "epoch": 0.27, - "learning_rate": 3.663926450123292e-05, - "loss": 2.4284, - "step": 153230 - }, - { - "epoch": 0.27, - "learning_rate": 3.66383925613061e-05, - "loss": 2.5113, - "step": 153240 - }, - { - "epoch": 0.27, - "learning_rate": 3.6637520621379275e-05, - "loss": 2.5383, - "step": 153250 - }, - { - "epoch": 0.27, - "learning_rate": 3.6636648681452445e-05, - "loss": 2.5392, - "step": 153260 - }, - { - "epoch": 0.27, - "learning_rate": 3.6635776741525615e-05, - "loss": 2.4705, - "step": 153270 - }, - { - "epoch": 0.27, - "learning_rate": 3.663490480159879e-05, - "loss": 2.4512, - "step": 153280 - }, - { - "epoch": 0.27, - "learning_rate": 3.663403286167196e-05, - "loss": 2.4616, - "step": 153290 - }, - { - "epoch": 0.27, - "learning_rate": 3.6633160921745133e-05, - "loss": 2.586, - "step": 153300 - }, - { - "epoch": 0.27, - "learning_rate": 3.663228898181831e-05, - "loss": 2.5649, - "step": 153310 - }, - { - "epoch": 0.27, - "learning_rate": 3.663141704189149e-05, - "loss": 2.3707, - "step": 153320 - }, - { - "epoch": 0.27, - "learning_rate": 3.663054510196466e-05, - "loss": 2.3424, - "step": 153330 - }, - { - "epoch": 0.27, - "learning_rate": 3.662967316203783e-05, - "loss": 2.4832, - "step": 153340 - }, - { - "epoch": 0.27, - "learning_rate": 3.6628801222111006e-05, - "loss": 2.4943, - "step": 153350 - }, - { - "epoch": 0.27, - "learning_rate": 3.6627929282184176e-05, - "loss": 2.4926, - "step": 153360 - }, - { - "epoch": 0.27, - "learning_rate": 3.6627057342257346e-05, - "loss": 2.4588, - "step": 153370 - }, - { - "epoch": 0.27, - "learning_rate": 3.6626185402330524e-05, - "loss": 2.4157, - "step": 153380 - }, - { - "epoch": 0.27, - "learning_rate": 3.66253134624037e-05, - "loss": 2.3983, - "step": 153390 - }, - { - "epoch": 0.27, - "learning_rate": 3.662444152247687e-05, - "loss": 2.5982, - "step": 153400 - }, - { - "epoch": 0.27, - "learning_rate": 3.662356958255004e-05, - "loss": 2.5575, - "step": 153410 - }, - { - "epoch": 0.27, - "learning_rate": 3.662269764262322e-05, - "loss": 2.5491, - "step": 153420 - }, - { - "epoch": 0.27, - "learning_rate": 3.662182570269639e-05, - "loss": 2.6, - "step": 153430 - }, - { - "epoch": 0.27, - "learning_rate": 3.662095376276956e-05, - "loss": 2.4442, - "step": 153440 - }, - { - "epoch": 0.27, - "learning_rate": 3.6620081822842737e-05, - "loss": 2.4518, - "step": 153450 - }, - { - "epoch": 0.27, - "learning_rate": 3.661920988291591e-05, - "loss": 2.4971, - "step": 153460 - }, - { - "epoch": 0.27, - "learning_rate": 3.6618337942989084e-05, - "loss": 2.5864, - "step": 153470 - }, - { - "epoch": 0.27, - "learning_rate": 3.6617466003062254e-05, - "loss": 2.4505, - "step": 153480 - }, - { - "epoch": 0.27, - "learning_rate": 3.661659406313543e-05, - "loss": 2.4895, - "step": 153490 - }, - { - "epoch": 0.27, - "learning_rate": 3.66157221232086e-05, - "loss": 2.4581, - "step": 153500 - }, - { - "epoch": 0.27, - "learning_rate": 3.661485018328177e-05, - "loss": 2.508, - "step": 153510 - }, - { - "epoch": 0.27, - "learning_rate": 3.661397824335494e-05, - "loss": 2.4373, - "step": 153520 - }, - { - "epoch": 0.27, - "learning_rate": 3.661310630342812e-05, - "loss": 2.4385, - "step": 153530 - }, - { - "epoch": 0.27, - "learning_rate": 3.66122343635013e-05, - "loss": 2.4961, - "step": 153540 - }, - { - "epoch": 0.27, - "learning_rate": 3.661136242357447e-05, - "loss": 2.5488, - "step": 153550 - }, - { - "epoch": 0.27, - "learning_rate": 3.6610490483647645e-05, - "loss": 2.5372, - "step": 153560 - }, - { - "epoch": 0.27, - "learning_rate": 3.6609618543720815e-05, - "loss": 2.435, - "step": 153570 - }, - { - "epoch": 0.27, - "learning_rate": 3.6608746603793985e-05, - "loss": 2.477, - "step": 153580 - }, - { - "epoch": 0.27, - "learning_rate": 3.6607874663867156e-05, - "loss": 2.513, - "step": 153590 - }, - { - "epoch": 0.27, - "learning_rate": 3.660700272394033e-05, - "loss": 2.5042, - "step": 153600 - }, - { - "epoch": 0.27, - "learning_rate": 3.66061307840135e-05, - "loss": 2.3907, - "step": 153610 - }, - { - "epoch": 0.27, - "learning_rate": 3.660525884408668e-05, - "loss": 2.3942, - "step": 153620 - }, - { - "epoch": 0.27, - "learning_rate": 3.660438690415985e-05, - "loss": 2.5732, - "step": 153630 - }, - { - "epoch": 0.27, - "learning_rate": 3.660351496423303e-05, - "loss": 2.4726, - "step": 153640 - }, - { - "epoch": 0.27, - "learning_rate": 3.66026430243062e-05, - "loss": 2.6508, - "step": 153650 - }, - { - "epoch": 0.27, - "learning_rate": 3.660177108437937e-05, - "loss": 2.561, - "step": 153660 - }, - { - "epoch": 0.27, - "learning_rate": 3.6600899144452546e-05, - "loss": 2.4914, - "step": 153670 - }, - { - "epoch": 0.27, - "learning_rate": 3.6600027204525716e-05, - "loss": 2.5237, - "step": 153680 - }, - { - "epoch": 0.27, - "learning_rate": 3.6599155264598893e-05, - "loss": 2.5076, - "step": 153690 - }, - { - "epoch": 0.27, - "learning_rate": 3.6598283324672064e-05, - "loss": 2.5305, - "step": 153700 - }, - { - "epoch": 0.27, - "learning_rate": 3.659741138474524e-05, - "loss": 2.4579, - "step": 153710 - }, - { - "epoch": 0.27, - "learning_rate": 3.659653944481841e-05, - "loss": 2.514, - "step": 153720 - }, - { - "epoch": 0.27, - "learning_rate": 3.659566750489158e-05, - "loss": 2.4739, - "step": 153730 - }, - { - "epoch": 0.27, - "learning_rate": 3.659479556496476e-05, - "loss": 2.4183, - "step": 153740 - }, - { - "epoch": 0.27, - "learning_rate": 3.659392362503793e-05, - "loss": 2.5075, - "step": 153750 - }, - { - "epoch": 0.27, - "learning_rate": 3.65930516851111e-05, - "loss": 2.3852, - "step": 153760 - }, - { - "epoch": 0.27, - "learning_rate": 3.659217974518428e-05, - "loss": 2.4561, - "step": 153770 - }, - { - "epoch": 0.27, - "learning_rate": 3.6591307805257454e-05, - "loss": 2.5005, - "step": 153780 - }, - { - "epoch": 0.27, - "learning_rate": 3.6590435865330624e-05, - "loss": 2.4754, - "step": 153790 - }, - { - "epoch": 0.27, - "learning_rate": 3.6589563925403795e-05, - "loss": 2.4185, - "step": 153800 - }, - { - "epoch": 0.27, - "learning_rate": 3.658869198547697e-05, - "loss": 2.4837, - "step": 153810 - }, - { - "epoch": 0.27, - "learning_rate": 3.658782004555014e-05, - "loss": 2.5526, - "step": 153820 - }, - { - "epoch": 0.27, - "learning_rate": 3.658694810562331e-05, - "loss": 2.3712, - "step": 153830 - }, - { - "epoch": 0.27, - "learning_rate": 3.658607616569649e-05, - "loss": 2.5492, - "step": 153840 - }, - { - "epoch": 0.27, - "learning_rate": 3.658520422576967e-05, - "loss": 2.5242, - "step": 153850 - }, - { - "epoch": 0.27, - "learning_rate": 3.658433228584284e-05, - "loss": 2.3864, - "step": 153860 - }, - { - "epoch": 0.27, - "learning_rate": 3.658346034591601e-05, - "loss": 2.5395, - "step": 153870 - }, - { - "epoch": 0.27, - "learning_rate": 3.6582588405989185e-05, - "loss": 2.444, - "step": 153880 - }, - { - "epoch": 0.27, - "learning_rate": 3.6581716466062355e-05, - "loss": 2.5091, - "step": 153890 - }, - { - "epoch": 0.27, - "learning_rate": 3.6580844526135526e-05, - "loss": 2.356, - "step": 153900 - }, - { - "epoch": 0.27, - "learning_rate": 3.65799725862087e-05, - "loss": 2.5168, - "step": 153910 - }, - { - "epoch": 0.27, - "learning_rate": 3.657910064628188e-05, - "loss": 2.5785, - "step": 153920 - }, - { - "epoch": 0.27, - "learning_rate": 3.657822870635505e-05, - "loss": 2.4682, - "step": 153930 - }, - { - "epoch": 0.27, - "learning_rate": 3.657735676642822e-05, - "loss": 2.4289, - "step": 153940 - }, - { - "epoch": 0.27, - "learning_rate": 3.65764848265014e-05, - "loss": 2.5931, - "step": 153950 - }, - { - "epoch": 0.27, - "learning_rate": 3.657561288657457e-05, - "loss": 2.4355, - "step": 153960 - }, - { - "epoch": 0.27, - "learning_rate": 3.657474094664774e-05, - "loss": 2.4306, - "step": 153970 - }, - { - "epoch": 0.27, - "learning_rate": 3.657386900672091e-05, - "loss": 2.421, - "step": 153980 - }, - { - "epoch": 0.27, - "learning_rate": 3.657299706679409e-05, - "loss": 2.4914, - "step": 153990 - }, - { - "epoch": 0.27, - "learning_rate": 3.6572125126867263e-05, - "loss": 2.4436, - "step": 154000 - }, - { - "epoch": 0.27, - "learning_rate": 3.6571253186940434e-05, - "loss": 2.4277, - "step": 154010 - }, - { - "epoch": 0.27, - "learning_rate": 3.657038124701361e-05, - "loss": 2.5265, - "step": 154020 - }, - { - "epoch": 0.27, - "learning_rate": 3.656950930708678e-05, - "loss": 2.3525, - "step": 154030 - }, - { - "epoch": 0.27, - "learning_rate": 3.656863736715995e-05, - "loss": 2.4789, - "step": 154040 - }, - { - "epoch": 0.27, - "learning_rate": 3.656776542723312e-05, - "loss": 2.4033, - "step": 154050 - }, - { - "epoch": 0.27, - "learning_rate": 3.6566893487306306e-05, - "loss": 2.4459, - "step": 154060 - }, - { - "epoch": 0.27, - "learning_rate": 3.6566021547379476e-05, - "loss": 2.5555, - "step": 154070 - }, - { - "epoch": 0.27, - "learning_rate": 3.656514960745265e-05, - "loss": 2.4849, - "step": 154080 - }, - { - "epoch": 0.27, - "learning_rate": 3.656427766752582e-05, - "loss": 2.5541, - "step": 154090 - }, - { - "epoch": 0.27, - "learning_rate": 3.6563405727598994e-05, - "loss": 2.4857, - "step": 154100 - }, - { - "epoch": 0.27, - "learning_rate": 3.6562533787672165e-05, - "loss": 2.5062, - "step": 154110 - }, - { - "epoch": 0.27, - "learning_rate": 3.6561661847745335e-05, - "loss": 2.5225, - "step": 154120 - }, - { - "epoch": 0.27, - "learning_rate": 3.656078990781851e-05, - "loss": 2.5021, - "step": 154130 - }, - { - "epoch": 0.27, - "learning_rate": 3.655991796789169e-05, - "loss": 2.4613, - "step": 154140 - }, - { - "epoch": 0.27, - "learning_rate": 3.655904602796486e-05, - "loss": 2.4709, - "step": 154150 - }, - { - "epoch": 0.27, - "learning_rate": 3.655817408803803e-05, - "loss": 2.432, - "step": 154160 - }, - { - "epoch": 0.27, - "learning_rate": 3.655730214811121e-05, - "loss": 2.444, - "step": 154170 - }, - { - "epoch": 0.27, - "learning_rate": 3.655643020818438e-05, - "loss": 2.4323, - "step": 154180 - }, - { - "epoch": 0.27, - "learning_rate": 3.655555826825755e-05, - "loss": 2.4727, - "step": 154190 - }, - { - "epoch": 0.27, - "learning_rate": 3.6554686328330725e-05, - "loss": 2.4011, - "step": 154200 - }, - { - "epoch": 0.27, - "learning_rate": 3.65538143884039e-05, - "loss": 2.4264, - "step": 154210 - }, - { - "epoch": 0.27, - "learning_rate": 3.655294244847707e-05, - "loss": 2.5412, - "step": 154220 - }, - { - "epoch": 0.27, - "learning_rate": 3.655207050855024e-05, - "loss": 2.4666, - "step": 154230 - }, - { - "epoch": 0.27, - "learning_rate": 3.655119856862342e-05, - "loss": 2.4731, - "step": 154240 - }, - { - "epoch": 0.27, - "learning_rate": 3.655032662869659e-05, - "loss": 2.3906, - "step": 154250 - }, - { - "epoch": 0.27, - "learning_rate": 3.654945468876976e-05, - "loss": 2.4348, - "step": 154260 - }, - { - "epoch": 0.27, - "learning_rate": 3.654858274884294e-05, - "loss": 2.4669, - "step": 154270 - }, - { - "epoch": 0.27, - "learning_rate": 3.654771080891611e-05, - "loss": 2.4968, - "step": 154280 - }, - { - "epoch": 0.27, - "learning_rate": 3.6546838868989286e-05, - "loss": 2.4301, - "step": 154290 - }, - { - "epoch": 0.27, - "learning_rate": 3.6545966929062456e-05, - "loss": 2.54, - "step": 154300 - }, - { - "epoch": 0.27, - "learning_rate": 3.654509498913563e-05, - "loss": 2.5115, - "step": 154310 - }, - { - "epoch": 0.27, - "learning_rate": 3.6544223049208804e-05, - "loss": 2.4678, - "step": 154320 - }, - { - "epoch": 0.27, - "learning_rate": 3.6543351109281974e-05, - "loss": 2.5372, - "step": 154330 - }, - { - "epoch": 0.27, - "learning_rate": 3.654247916935515e-05, - "loss": 2.422, - "step": 154340 - }, - { - "epoch": 0.27, - "learning_rate": 3.654160722942832e-05, - "loss": 2.4744, - "step": 154350 - }, - { - "epoch": 0.27, - "learning_rate": 3.65407352895015e-05, - "loss": 2.571, - "step": 154360 - }, - { - "epoch": 0.27, - "learning_rate": 3.653986334957467e-05, - "loss": 2.4502, - "step": 154370 - }, - { - "epoch": 0.27, - "learning_rate": 3.6538991409647846e-05, - "loss": 2.4257, - "step": 154380 - }, - { - "epoch": 0.27, - "learning_rate": 3.653811946972102e-05, - "loss": 2.5118, - "step": 154390 - }, - { - "epoch": 0.27, - "learning_rate": 3.653724752979419e-05, - "loss": 2.372, - "step": 154400 - }, - { - "epoch": 0.27, - "learning_rate": 3.6536375589867364e-05, - "loss": 2.4393, - "step": 154410 - }, - { - "epoch": 0.27, - "learning_rate": 3.6535503649940535e-05, - "loss": 2.3996, - "step": 154420 - }, - { - "epoch": 0.27, - "learning_rate": 3.6534631710013705e-05, - "loss": 2.534, - "step": 154430 - }, - { - "epoch": 0.27, - "learning_rate": 3.653375977008688e-05, - "loss": 2.4919, - "step": 154440 - }, - { - "epoch": 0.27, - "learning_rate": 3.653288783016006e-05, - "loss": 2.5061, - "step": 154450 - }, - { - "epoch": 0.27, - "learning_rate": 3.653201589023323e-05, - "loss": 2.3938, - "step": 154460 - }, - { - "epoch": 0.27, - "learning_rate": 3.65311439503064e-05, - "loss": 2.3806, - "step": 154470 - }, - { - "epoch": 0.27, - "learning_rate": 3.653027201037957e-05, - "loss": 2.4858, - "step": 154480 - }, - { - "epoch": 0.27, - "learning_rate": 3.652940007045275e-05, - "loss": 2.3837, - "step": 154490 - }, - { - "epoch": 0.27, - "learning_rate": 3.652852813052592e-05, - "loss": 2.5549, - "step": 154500 - }, - { - "epoch": 0.27, - "learning_rate": 3.6527656190599095e-05, - "loss": 2.5551, - "step": 154510 - }, - { - "epoch": 0.27, - "learning_rate": 3.652678425067227e-05, - "loss": 2.4959, - "step": 154520 - }, - { - "epoch": 0.27, - "learning_rate": 3.652591231074544e-05, - "loss": 2.4661, - "step": 154530 - }, - { - "epoch": 0.27, - "learning_rate": 3.652504037081861e-05, - "loss": 2.4459, - "step": 154540 - }, - { - "epoch": 0.27, - "learning_rate": 3.6524168430891783e-05, - "loss": 2.4684, - "step": 154550 - }, - { - "epoch": 0.27, - "learning_rate": 3.652329649096496e-05, - "loss": 2.5005, - "step": 154560 - }, - { - "epoch": 0.27, - "learning_rate": 3.652242455103813e-05, - "loss": 2.4378, - "step": 154570 - }, - { - "epoch": 0.27, - "learning_rate": 3.652155261111131e-05, - "loss": 2.3806, - "step": 154580 - }, - { - "epoch": 0.27, - "learning_rate": 3.652068067118448e-05, - "loss": 2.4518, - "step": 154590 - }, - { - "epoch": 0.27, - "learning_rate": 3.6519808731257656e-05, - "loss": 2.4433, - "step": 154600 - }, - { - "epoch": 0.27, - "learning_rate": 3.6518936791330826e-05, - "loss": 2.4036, - "step": 154610 - }, - { - "epoch": 0.27, - "learning_rate": 3.6518064851403996e-05, - "loss": 2.4838, - "step": 154620 - }, - { - "epoch": 0.27, - "learning_rate": 3.6517192911477174e-05, - "loss": 2.5261, - "step": 154630 - }, - { - "epoch": 0.27, - "learning_rate": 3.6516320971550344e-05, - "loss": 2.4718, - "step": 154640 - }, - { - "epoch": 0.27, - "learning_rate": 3.6515449031623514e-05, - "loss": 2.4859, - "step": 154650 - }, - { - "epoch": 0.27, - "learning_rate": 3.651457709169669e-05, - "loss": 2.4945, - "step": 154660 - }, - { - "epoch": 0.27, - "learning_rate": 3.651370515176987e-05, - "loss": 2.5331, - "step": 154670 - }, - { - "epoch": 0.27, - "learning_rate": 3.651283321184304e-05, - "loss": 2.552, - "step": 154680 - }, - { - "epoch": 0.27, - "learning_rate": 3.651196127191621e-05, - "loss": 2.4628, - "step": 154690 - }, - { - "epoch": 0.27, - "learning_rate": 3.651108933198939e-05, - "loss": 2.4445, - "step": 154700 - }, - { - "epoch": 0.27, - "learning_rate": 3.651021739206256e-05, - "loss": 2.4283, - "step": 154710 - }, - { - "epoch": 0.27, - "learning_rate": 3.650934545213573e-05, - "loss": 2.4362, - "step": 154720 - }, - { - "epoch": 0.27, - "learning_rate": 3.6508473512208905e-05, - "loss": 2.5159, - "step": 154730 - }, - { - "epoch": 0.27, - "learning_rate": 3.650760157228208e-05, - "loss": 2.4871, - "step": 154740 - }, - { - "epoch": 0.27, - "learning_rate": 3.650672963235525e-05, - "loss": 2.5108, - "step": 154750 - }, - { - "epoch": 0.27, - "learning_rate": 3.650585769242842e-05, - "loss": 2.3753, - "step": 154760 - }, - { - "epoch": 0.27, - "learning_rate": 3.65049857525016e-05, - "loss": 2.4486, - "step": 154770 - }, - { - "epoch": 0.27, - "learning_rate": 3.650411381257477e-05, - "loss": 2.5333, - "step": 154780 - }, - { - "epoch": 0.27, - "learning_rate": 3.650324187264794e-05, - "loss": 2.4196, - "step": 154790 - }, - { - "epoch": 0.27, - "learning_rate": 3.650236993272112e-05, - "loss": 2.4526, - "step": 154800 - }, - { - "epoch": 0.27, - "learning_rate": 3.6501497992794295e-05, - "loss": 2.4811, - "step": 154810 - }, - { - "epoch": 0.27, - "learning_rate": 3.6500626052867465e-05, - "loss": 2.4955, - "step": 154820 - }, - { - "epoch": 0.27, - "learning_rate": 3.6499754112940635e-05, - "loss": 2.3906, - "step": 154830 - }, - { - "epoch": 0.27, - "learning_rate": 3.649888217301381e-05, - "loss": 2.4716, - "step": 154840 - }, - { - "epoch": 0.27, - "learning_rate": 3.649801023308698e-05, - "loss": 2.5367, - "step": 154850 - }, - { - "epoch": 0.27, - "learning_rate": 3.6497138293160153e-05, - "loss": 2.4541, - "step": 154860 - }, - { - "epoch": 0.27, - "learning_rate": 3.6496266353233324e-05, - "loss": 2.448, - "step": 154870 - }, - { - "epoch": 0.27, - "learning_rate": 3.649539441330651e-05, - "loss": 2.3652, - "step": 154880 - }, - { - "epoch": 0.27, - "learning_rate": 3.649452247337968e-05, - "loss": 2.4605, - "step": 154890 - }, - { - "epoch": 0.27, - "learning_rate": 3.649365053345285e-05, - "loss": 2.4749, - "step": 154900 - }, - { - "epoch": 0.27, - "learning_rate": 3.6492778593526026e-05, - "loss": 2.4812, - "step": 154910 - }, - { - "epoch": 0.27, - "learning_rate": 3.6491906653599196e-05, - "loss": 2.5383, - "step": 154920 - }, - { - "epoch": 0.27, - "learning_rate": 3.6491034713672366e-05, - "loss": 2.4793, - "step": 154930 - }, - { - "epoch": 0.27, - "learning_rate": 3.649016277374554e-05, - "loss": 2.4586, - "step": 154940 - }, - { - "epoch": 0.27, - "learning_rate": 3.6489290833818714e-05, - "loss": 2.4967, - "step": 154950 - }, - { - "epoch": 0.27, - "learning_rate": 3.648841889389189e-05, - "loss": 2.5468, - "step": 154960 - }, - { - "epoch": 0.27, - "learning_rate": 3.648754695396506e-05, - "loss": 2.5512, - "step": 154970 - }, - { - "epoch": 0.27, - "learning_rate": 3.648667501403823e-05, - "loss": 2.5069, - "step": 154980 - }, - { - "epoch": 0.27, - "learning_rate": 3.648580307411141e-05, - "loss": 2.4701, - "step": 154990 - }, - { - "epoch": 0.27, - "learning_rate": 3.648493113418458e-05, - "loss": 2.5543, - "step": 155000 - }, - { - "epoch": 0.27, - "learning_rate": 3.648405919425775e-05, - "loss": 2.4378, - "step": 155010 - }, - { - "epoch": 0.27, - "learning_rate": 3.648318725433093e-05, - "loss": 2.4965, - "step": 155020 - }, - { - "epoch": 0.27, - "learning_rate": 3.6482315314404104e-05, - "loss": 2.5626, - "step": 155030 - }, - { - "epoch": 0.27, - "learning_rate": 3.6481443374477275e-05, - "loss": 2.4642, - "step": 155040 - }, - { - "epoch": 0.27, - "learning_rate": 3.6480571434550445e-05, - "loss": 2.4567, - "step": 155050 - }, - { - "epoch": 0.27, - "learning_rate": 3.647969949462362e-05, - "loss": 2.6072, - "step": 155060 - }, - { - "epoch": 0.27, - "learning_rate": 3.647882755469679e-05, - "loss": 2.4729, - "step": 155070 - }, - { - "epoch": 0.27, - "learning_rate": 3.647795561476996e-05, - "loss": 2.4355, - "step": 155080 - }, - { - "epoch": 0.27, - "learning_rate": 3.647708367484314e-05, - "loss": 2.437, - "step": 155090 - }, - { - "epoch": 0.27, - "learning_rate": 3.647621173491632e-05, - "loss": 2.3747, - "step": 155100 - }, - { - "epoch": 0.27, - "learning_rate": 3.647533979498949e-05, - "loss": 2.3842, - "step": 155110 - }, - { - "epoch": 0.27, - "learning_rate": 3.647446785506266e-05, - "loss": 2.4239, - "step": 155120 - }, - { - "epoch": 0.27, - "learning_rate": 3.6473595915135835e-05, - "loss": 2.3532, - "step": 155130 - }, - { - "epoch": 0.27, - "learning_rate": 3.6472723975209005e-05, - "loss": 2.4949, - "step": 155140 - }, - { - "epoch": 0.27, - "learning_rate": 3.6471852035282176e-05, - "loss": 2.4654, - "step": 155150 - }, - { - "epoch": 0.27, - "learning_rate": 3.647098009535535e-05, - "loss": 2.4049, - "step": 155160 - }, - { - "epoch": 0.27, - "learning_rate": 3.647010815542852e-05, - "loss": 2.3882, - "step": 155170 - }, - { - "epoch": 0.27, - "learning_rate": 3.64692362155017e-05, - "loss": 2.514, - "step": 155180 - }, - { - "epoch": 0.27, - "learning_rate": 3.646836427557487e-05, - "loss": 2.4248, - "step": 155190 - }, - { - "epoch": 0.27, - "learning_rate": 3.646749233564805e-05, - "loss": 2.5609, - "step": 155200 - }, - { - "epoch": 0.27, - "learning_rate": 3.646662039572122e-05, - "loss": 2.4598, - "step": 155210 - }, - { - "epoch": 0.27, - "learning_rate": 3.646574845579439e-05, - "loss": 2.4837, - "step": 155220 - }, - { - "epoch": 0.27, - "learning_rate": 3.6464876515867566e-05, - "loss": 2.5123, - "step": 155230 - }, - { - "epoch": 0.27, - "learning_rate": 3.6464004575940736e-05, - "loss": 2.4236, - "step": 155240 - }, - { - "epoch": 0.27, - "learning_rate": 3.6463132636013914e-05, - "loss": 2.4939, - "step": 155250 - }, - { - "epoch": 0.27, - "learning_rate": 3.6462260696087084e-05, - "loss": 2.4721, - "step": 155260 - }, - { - "epoch": 0.27, - "learning_rate": 3.646138875616026e-05, - "loss": 2.5476, - "step": 155270 - }, - { - "epoch": 0.27, - "learning_rate": 3.646051681623343e-05, - "loss": 2.4465, - "step": 155280 - }, - { - "epoch": 0.27, - "learning_rate": 3.64596448763066e-05, - "loss": 2.3279, - "step": 155290 - }, - { - "epoch": 0.27, - "learning_rate": 3.645877293637978e-05, - "loss": 2.3808, - "step": 155300 - }, - { - "epoch": 0.27, - "learning_rate": 3.645790099645295e-05, - "loss": 2.3918, - "step": 155310 - }, - { - "epoch": 0.27, - "learning_rate": 3.645702905652612e-05, - "loss": 2.4104, - "step": 155320 - }, - { - "epoch": 0.27, - "learning_rate": 3.64561571165993e-05, - "loss": 2.5214, - "step": 155330 - }, - { - "epoch": 0.27, - "learning_rate": 3.6455285176672474e-05, - "loss": 2.5854, - "step": 155340 - }, - { - "epoch": 0.27, - "learning_rate": 3.6454413236745644e-05, - "loss": 2.4914, - "step": 155350 - }, - { - "epoch": 0.27, - "learning_rate": 3.6453541296818815e-05, - "loss": 2.3887, - "step": 155360 - }, - { - "epoch": 0.27, - "learning_rate": 3.645266935689199e-05, - "loss": 2.4305, - "step": 155370 - }, - { - "epoch": 0.27, - "learning_rate": 3.645179741696516e-05, - "loss": 2.4562, - "step": 155380 - }, - { - "epoch": 0.27, - "learning_rate": 3.645092547703833e-05, - "loss": 2.3466, - "step": 155390 - }, - { - "epoch": 0.27, - "learning_rate": 3.645005353711151e-05, - "loss": 2.2605, - "step": 155400 - }, - { - "epoch": 0.27, - "learning_rate": 3.644918159718469e-05, - "loss": 2.5322, - "step": 155410 - }, - { - "epoch": 0.27, - "learning_rate": 3.644830965725786e-05, - "loss": 2.4933, - "step": 155420 - }, - { - "epoch": 0.27, - "learning_rate": 3.644743771733103e-05, - "loss": 2.5813, - "step": 155430 - }, - { - "epoch": 0.27, - "learning_rate": 3.64465657774042e-05, - "loss": 2.5314, - "step": 155440 - }, - { - "epoch": 0.27, - "learning_rate": 3.6445693837477375e-05, - "loss": 2.5212, - "step": 155450 - }, - { - "epoch": 0.27, - "learning_rate": 3.6444821897550546e-05, - "loss": 2.4556, - "step": 155460 - }, - { - "epoch": 0.27, - "learning_rate": 3.6443949957623716e-05, - "loss": 2.4274, - "step": 155470 - }, - { - "epoch": 0.27, - "learning_rate": 3.64430780176969e-05, - "loss": 2.4236, - "step": 155480 - }, - { - "epoch": 0.27, - "learning_rate": 3.644220607777007e-05, - "loss": 2.4665, - "step": 155490 - }, - { - "epoch": 0.27, - "learning_rate": 3.644133413784324e-05, - "loss": 2.4957, - "step": 155500 - }, - { - "epoch": 0.27, - "learning_rate": 3.644046219791641e-05, - "loss": 2.5674, - "step": 155510 - }, - { - "epoch": 0.27, - "learning_rate": 3.643959025798959e-05, - "loss": 2.4107, - "step": 155520 - }, - { - "epoch": 0.27, - "learning_rate": 3.643871831806276e-05, - "loss": 2.5169, - "step": 155530 - }, - { - "epoch": 0.27, - "learning_rate": 3.643784637813593e-05, - "loss": 2.552, - "step": 155540 - }, - { - "epoch": 0.27, - "learning_rate": 3.6436974438209106e-05, - "loss": 2.5274, - "step": 155550 - }, - { - "epoch": 0.27, - "learning_rate": 3.6436102498282283e-05, - "loss": 2.3424, - "step": 155560 - }, - { - "epoch": 0.27, - "learning_rate": 3.6435230558355454e-05, - "loss": 2.5219, - "step": 155570 - }, - { - "epoch": 0.27, - "learning_rate": 3.6434358618428624e-05, - "loss": 2.4806, - "step": 155580 - }, - { - "epoch": 0.27, - "learning_rate": 3.64334866785018e-05, - "loss": 2.3758, - "step": 155590 - }, - { - "epoch": 0.27, - "learning_rate": 3.643261473857497e-05, - "loss": 2.4223, - "step": 155600 - }, - { - "epoch": 0.27, - "learning_rate": 3.643174279864814e-05, - "loss": 2.494, - "step": 155610 - }, - { - "epoch": 0.27, - "learning_rate": 3.643087085872132e-05, - "loss": 2.4317, - "step": 155620 - }, - { - "epoch": 0.27, - "learning_rate": 3.6429998918794496e-05, - "loss": 2.4989, - "step": 155630 - }, - { - "epoch": 0.27, - "learning_rate": 3.642912697886767e-05, - "loss": 2.418, - "step": 155640 - }, - { - "epoch": 0.27, - "learning_rate": 3.642825503894084e-05, - "loss": 2.5125, - "step": 155650 - }, - { - "epoch": 0.27, - "learning_rate": 3.6427383099014014e-05, - "loss": 2.4109, - "step": 155660 - }, - { - "epoch": 0.27, - "learning_rate": 3.6426511159087185e-05, - "loss": 2.4724, - "step": 155670 - }, - { - "epoch": 0.27, - "learning_rate": 3.6425639219160355e-05, - "loss": 2.5436, - "step": 155680 - }, - { - "epoch": 0.27, - "learning_rate": 3.642476727923353e-05, - "loss": 2.3952, - "step": 155690 - }, - { - "epoch": 0.27, - "learning_rate": 3.642389533930671e-05, - "loss": 2.5672, - "step": 155700 - }, - { - "epoch": 0.27, - "learning_rate": 3.642302339937988e-05, - "loss": 2.4518, - "step": 155710 - }, - { - "epoch": 0.27, - "learning_rate": 3.642215145945305e-05, - "loss": 2.5465, - "step": 155720 - }, - { - "epoch": 0.27, - "learning_rate": 3.642127951952623e-05, - "loss": 2.501, - "step": 155730 - }, - { - "epoch": 0.27, - "learning_rate": 3.64204075795994e-05, - "loss": 2.5318, - "step": 155740 - }, - { - "epoch": 0.27, - "learning_rate": 3.641953563967257e-05, - "loss": 2.4314, - "step": 155750 - }, - { - "epoch": 0.27, - "learning_rate": 3.6418663699745745e-05, - "loss": 2.5144, - "step": 155760 - }, - { - "epoch": 0.27, - "learning_rate": 3.641779175981892e-05, - "loss": 2.4561, - "step": 155770 - }, - { - "epoch": 0.27, - "learning_rate": 3.641691981989209e-05, - "loss": 2.5109, - "step": 155780 - }, - { - "epoch": 0.27, - "learning_rate": 3.641604787996526e-05, - "loss": 2.4761, - "step": 155790 - }, - { - "epoch": 0.27, - "learning_rate": 3.641517594003844e-05, - "loss": 2.4298, - "step": 155800 - }, - { - "epoch": 0.27, - "learning_rate": 3.641430400011161e-05, - "loss": 2.5636, - "step": 155810 - }, - { - "epoch": 0.27, - "learning_rate": 3.641343206018478e-05, - "loss": 2.4865, - "step": 155820 - }, - { - "epoch": 0.27, - "learning_rate": 3.641256012025795e-05, - "loss": 2.4705, - "step": 155830 - }, - { - "epoch": 0.27, - "learning_rate": 3.641168818033113e-05, - "loss": 2.3615, - "step": 155840 - }, - { - "epoch": 0.27, - "learning_rate": 3.6410816240404306e-05, - "loss": 2.3725, - "step": 155850 - }, - { - "epoch": 0.27, - "learning_rate": 3.6409944300477476e-05, - "loss": 2.662, - "step": 155860 - }, - { - "epoch": 0.27, - "learning_rate": 3.640907236055065e-05, - "loss": 2.3241, - "step": 155870 - }, - { - "epoch": 0.27, - "learning_rate": 3.6408200420623824e-05, - "loss": 2.483, - "step": 155880 - }, - { - "epoch": 0.27, - "learning_rate": 3.6407328480696994e-05, - "loss": 2.4559, - "step": 155890 - }, - { - "epoch": 0.27, - "learning_rate": 3.6406456540770165e-05, - "loss": 2.5119, - "step": 155900 - }, - { - "epoch": 0.27, - "learning_rate": 3.640558460084334e-05, - "loss": 2.4485, - "step": 155910 - }, - { - "epoch": 0.27, - "learning_rate": 3.640471266091652e-05, - "loss": 2.3782, - "step": 155920 - }, - { - "epoch": 0.27, - "learning_rate": 3.640384072098969e-05, - "loss": 2.3632, - "step": 155930 - }, - { - "epoch": 0.27, - "learning_rate": 3.640296878106286e-05, - "loss": 2.4593, - "step": 155940 - }, - { - "epoch": 0.27, - "learning_rate": 3.640209684113604e-05, - "loss": 2.5489, - "step": 155950 - }, - { - "epoch": 0.27, - "learning_rate": 3.640122490120921e-05, - "loss": 2.4247, - "step": 155960 - }, - { - "epoch": 0.27, - "learning_rate": 3.640035296128238e-05, - "loss": 2.4403, - "step": 155970 - }, - { - "epoch": 0.27, - "learning_rate": 3.6399481021355555e-05, - "loss": 2.5107, - "step": 155980 - }, - { - "epoch": 0.27, - "learning_rate": 3.6398609081428725e-05, - "loss": 2.4828, - "step": 155990 - }, - { - "epoch": 0.27, - "learning_rate": 3.63977371415019e-05, - "loss": 2.5713, - "step": 156000 - }, - { - "epoch": 0.27, - "learning_rate": 3.639686520157507e-05, - "loss": 2.4321, - "step": 156010 - }, - { - "epoch": 0.27, - "learning_rate": 3.639599326164825e-05, - "loss": 2.5822, - "step": 156020 - }, - { - "epoch": 0.27, - "learning_rate": 3.639512132172142e-05, - "loss": 2.4153, - "step": 156030 - }, - { - "epoch": 0.27, - "learning_rate": 3.639424938179459e-05, - "loss": 2.3516, - "step": 156040 - }, - { - "epoch": 0.27, - "learning_rate": 3.639337744186777e-05, - "loss": 2.3746, - "step": 156050 - }, - { - "epoch": 0.27, - "learning_rate": 3.639250550194094e-05, - "loss": 2.4728, - "step": 156060 - }, - { - "epoch": 0.27, - "learning_rate": 3.6391633562014115e-05, - "loss": 2.5447, - "step": 156070 - }, - { - "epoch": 0.27, - "learning_rate": 3.6390761622087286e-05, - "loss": 2.4828, - "step": 156080 - }, - { - "epoch": 0.27, - "learning_rate": 3.638988968216046e-05, - "loss": 2.5017, - "step": 156090 - }, - { - "epoch": 0.27, - "learning_rate": 3.638901774223363e-05, - "loss": 2.5204, - "step": 156100 - }, - { - "epoch": 0.27, - "learning_rate": 3.6388145802306804e-05, - "loss": 2.4672, - "step": 156110 - }, - { - "epoch": 0.27, - "learning_rate": 3.638727386237998e-05, - "loss": 2.5459, - "step": 156120 - }, - { - "epoch": 0.27, - "learning_rate": 3.638640192245315e-05, - "loss": 2.4295, - "step": 156130 - }, - { - "epoch": 0.27, - "learning_rate": 3.638552998252632e-05, - "loss": 2.5147, - "step": 156140 - }, - { - "epoch": 0.27, - "learning_rate": 3.63846580425995e-05, - "loss": 2.5548, - "step": 156150 - }, - { - "epoch": 0.27, - "learning_rate": 3.6383786102672676e-05, - "loss": 2.4305, - "step": 156160 - }, - { - "epoch": 0.27, - "learning_rate": 3.6382914162745846e-05, - "loss": 2.4602, - "step": 156170 - }, - { - "epoch": 0.27, - "learning_rate": 3.6382042222819017e-05, - "loss": 2.4771, - "step": 156180 - }, - { - "epoch": 0.27, - "learning_rate": 3.6381170282892194e-05, - "loss": 2.4165, - "step": 156190 - }, - { - "epoch": 0.27, - "learning_rate": 3.6380298342965364e-05, - "loss": 2.5503, - "step": 156200 - }, - { - "epoch": 0.27, - "learning_rate": 3.6379426403038534e-05, - "loss": 2.4572, - "step": 156210 - }, - { - "epoch": 0.27, - "learning_rate": 3.637855446311171e-05, - "loss": 2.4384, - "step": 156220 - }, - { - "epoch": 0.27, - "learning_rate": 3.637768252318489e-05, - "loss": 2.3908, - "step": 156230 - }, - { - "epoch": 0.27, - "learning_rate": 3.637681058325806e-05, - "loss": 2.4969, - "step": 156240 - }, - { - "epoch": 0.27, - "learning_rate": 3.637593864333123e-05, - "loss": 2.367, - "step": 156250 - }, - { - "epoch": 0.27, - "learning_rate": 3.637506670340441e-05, - "loss": 2.5095, - "step": 156260 - }, - { - "epoch": 0.27, - "learning_rate": 3.637419476347758e-05, - "loss": 2.4504, - "step": 156270 - }, - { - "epoch": 0.27, - "learning_rate": 3.637332282355075e-05, - "loss": 2.5414, - "step": 156280 - }, - { - "epoch": 0.27, - "learning_rate": 3.637245088362392e-05, - "loss": 2.4773, - "step": 156290 - }, - { - "epoch": 0.27, - "learning_rate": 3.63715789436971e-05, - "loss": 2.4729, - "step": 156300 - }, - { - "epoch": 0.27, - "learning_rate": 3.637070700377027e-05, - "loss": 2.5452, - "step": 156310 - }, - { - "epoch": 0.27, - "learning_rate": 3.636983506384344e-05, - "loss": 2.4456, - "step": 156320 - }, - { - "epoch": 0.27, - "learning_rate": 3.636896312391661e-05, - "loss": 2.5955, - "step": 156330 - }, - { - "epoch": 0.27, - "learning_rate": 3.636809118398979e-05, - "loss": 2.5142, - "step": 156340 - }, - { - "epoch": 0.27, - "learning_rate": 3.636721924406296e-05, - "loss": 2.5174, - "step": 156350 - }, - { - "epoch": 0.27, - "learning_rate": 3.636634730413613e-05, - "loss": 2.5109, - "step": 156360 - }, - { - "epoch": 0.27, - "learning_rate": 3.6365475364209315e-05, - "loss": 2.3371, - "step": 156370 - }, - { - "epoch": 0.27, - "learning_rate": 3.6364603424282485e-05, - "loss": 2.4786, - "step": 156380 - }, - { - "epoch": 0.27, - "learning_rate": 3.6363731484355656e-05, - "loss": 2.513, - "step": 156390 - }, - { - "epoch": 0.27, - "learning_rate": 3.6362859544428826e-05, - "loss": 2.4422, - "step": 156400 - }, - { - "epoch": 0.27, - "learning_rate": 3.6361987604502e-05, - "loss": 2.525, - "step": 156410 - }, - { - "epoch": 0.27, - "learning_rate": 3.6361115664575173e-05, - "loss": 2.4383, - "step": 156420 - }, - { - "epoch": 0.27, - "learning_rate": 3.6360243724648344e-05, - "loss": 2.4084, - "step": 156430 - }, - { - "epoch": 0.27, - "learning_rate": 3.635937178472152e-05, - "loss": 2.5718, - "step": 156440 - }, - { - "epoch": 0.27, - "learning_rate": 3.63584998447947e-05, - "loss": 2.4003, - "step": 156450 - }, - { - "epoch": 0.27, - "learning_rate": 3.635762790486787e-05, - "loss": 2.6099, - "step": 156460 - }, - { - "epoch": 0.27, - "learning_rate": 3.635675596494104e-05, - "loss": 2.506, - "step": 156470 - }, - { - "epoch": 0.27, - "learning_rate": 3.6355884025014216e-05, - "loss": 2.447, - "step": 156480 - }, - { - "epoch": 0.27, - "learning_rate": 3.6355012085087386e-05, - "loss": 2.4893, - "step": 156490 - }, - { - "epoch": 0.27, - "learning_rate": 3.635414014516056e-05, - "loss": 2.4426, - "step": 156500 - }, - { - "epoch": 0.27, - "learning_rate": 3.6353268205233734e-05, - "loss": 2.4573, - "step": 156510 - }, - { - "epoch": 0.27, - "learning_rate": 3.635239626530691e-05, - "loss": 2.4118, - "step": 156520 - }, - { - "epoch": 0.27, - "learning_rate": 3.635152432538008e-05, - "loss": 2.4635, - "step": 156530 - }, - { - "epoch": 0.27, - "learning_rate": 3.635065238545325e-05, - "loss": 2.3155, - "step": 156540 - }, - { - "epoch": 0.27, - "learning_rate": 3.634978044552643e-05, - "loss": 2.4393, - "step": 156550 - }, - { - "epoch": 0.27, - "learning_rate": 3.63489085055996e-05, - "loss": 2.5061, - "step": 156560 - }, - { - "epoch": 0.27, - "learning_rate": 3.634803656567277e-05, - "loss": 2.494, - "step": 156570 - }, - { - "epoch": 0.27, - "learning_rate": 3.634716462574595e-05, - "loss": 2.3617, - "step": 156580 - }, - { - "epoch": 0.27, - "learning_rate": 3.6346292685819124e-05, - "loss": 2.3667, - "step": 156590 - }, - { - "epoch": 0.27, - "learning_rate": 3.6345420745892295e-05, - "loss": 2.4048, - "step": 156600 - }, - { - "epoch": 0.27, - "learning_rate": 3.6344548805965465e-05, - "loss": 2.477, - "step": 156610 - }, - { - "epoch": 0.27, - "learning_rate": 3.634367686603864e-05, - "loss": 2.5504, - "step": 156620 - }, - { - "epoch": 0.27, - "learning_rate": 3.634280492611181e-05, - "loss": 2.5258, - "step": 156630 - }, - { - "epoch": 0.27, - "learning_rate": 3.634193298618498e-05, - "loss": 2.3471, - "step": 156640 - }, - { - "epoch": 0.27, - "learning_rate": 3.634106104625816e-05, - "loss": 2.4454, - "step": 156650 - }, - { - "epoch": 0.27, - "learning_rate": 3.634018910633133e-05, - "loss": 2.6074, - "step": 156660 - }, - { - "epoch": 0.27, - "learning_rate": 3.633931716640451e-05, - "loss": 2.4111, - "step": 156670 - }, - { - "epoch": 0.27, - "learning_rate": 3.633844522647768e-05, - "loss": 2.5251, - "step": 156680 - }, - { - "epoch": 0.27, - "learning_rate": 3.6337573286550855e-05, - "loss": 2.434, - "step": 156690 - }, - { - "epoch": 0.27, - "learning_rate": 3.6336701346624025e-05, - "loss": 2.5038, - "step": 156700 - }, - { - "epoch": 0.27, - "learning_rate": 3.6335829406697196e-05, - "loss": 2.3842, - "step": 156710 - }, - { - "epoch": 0.27, - "learning_rate": 3.633495746677037e-05, - "loss": 2.536, - "step": 156720 - }, - { - "epoch": 0.27, - "learning_rate": 3.633408552684354e-05, - "loss": 2.6134, - "step": 156730 - }, - { - "epoch": 0.27, - "learning_rate": 3.633321358691672e-05, - "loss": 2.4007, - "step": 156740 - }, - { - "epoch": 0.27, - "learning_rate": 3.633234164698989e-05, - "loss": 2.3886, - "step": 156750 - }, - { - "epoch": 0.27, - "learning_rate": 3.633146970706307e-05, - "loss": 2.3241, - "step": 156760 - }, - { - "epoch": 0.27, - "learning_rate": 3.633059776713624e-05, - "loss": 2.5102, - "step": 156770 - }, - { - "epoch": 0.27, - "learning_rate": 3.632972582720941e-05, - "loss": 2.4743, - "step": 156780 - }, - { - "epoch": 0.27, - "learning_rate": 3.632885388728258e-05, - "loss": 2.482, - "step": 156790 - }, - { - "epoch": 0.27, - "learning_rate": 3.6327981947355756e-05, - "loss": 2.5374, - "step": 156800 - }, - { - "epoch": 0.27, - "learning_rate": 3.632711000742893e-05, - "loss": 2.4418, - "step": 156810 - }, - { - "epoch": 0.27, - "learning_rate": 3.6326238067502104e-05, - "loss": 2.3741, - "step": 156820 - }, - { - "epoch": 0.27, - "learning_rate": 3.632536612757528e-05, - "loss": 2.4014, - "step": 156830 - }, - { - "epoch": 0.27, - "learning_rate": 3.632449418764845e-05, - "loss": 2.5746, - "step": 156840 - }, - { - "epoch": 0.27, - "learning_rate": 3.632362224772162e-05, - "loss": 2.4703, - "step": 156850 - }, - { - "epoch": 0.27, - "learning_rate": 3.632275030779479e-05, - "loss": 2.5042, - "step": 156860 - }, - { - "epoch": 0.27, - "learning_rate": 3.632187836786797e-05, - "loss": 2.5316, - "step": 156870 - }, - { - "epoch": 0.27, - "learning_rate": 3.632100642794114e-05, - "loss": 2.3897, - "step": 156880 - }, - { - "epoch": 0.27, - "learning_rate": 3.632013448801432e-05, - "loss": 2.6795, - "step": 156890 - }, - { - "epoch": 0.27, - "learning_rate": 3.631926254808749e-05, - "loss": 2.4771, - "step": 156900 - }, - { - "epoch": 0.27, - "learning_rate": 3.6318390608160664e-05, - "loss": 2.4428, - "step": 156910 - }, - { - "epoch": 0.27, - "learning_rate": 3.6317518668233835e-05, - "loss": 2.5406, - "step": 156920 - }, - { - "epoch": 0.27, - "learning_rate": 3.6316646728307005e-05, - "loss": 2.5282, - "step": 156930 - }, - { - "epoch": 0.27, - "learning_rate": 3.631577478838018e-05, - "loss": 2.4702, - "step": 156940 - }, - { - "epoch": 0.27, - "learning_rate": 3.631490284845335e-05, - "loss": 2.4686, - "step": 156950 - }, - { - "epoch": 0.27, - "learning_rate": 3.631403090852653e-05, - "loss": 2.3784, - "step": 156960 - }, - { - "epoch": 0.27, - "learning_rate": 3.63131589685997e-05, - "loss": 2.4512, - "step": 156970 - }, - { - "epoch": 0.27, - "learning_rate": 3.631228702867288e-05, - "loss": 2.4713, - "step": 156980 - }, - { - "epoch": 0.27, - "learning_rate": 3.631141508874605e-05, - "loss": 2.4541, - "step": 156990 - }, - { - "epoch": 0.27, - "learning_rate": 3.631054314881922e-05, - "loss": 2.5669, - "step": 157000 - }, - { - "epoch": 0.27, - "learning_rate": 3.6309671208892395e-05, - "loss": 2.5455, - "step": 157010 - }, - { - "epoch": 0.27, - "learning_rate": 3.6308799268965566e-05, - "loss": 2.4095, - "step": 157020 - }, - { - "epoch": 0.27, - "learning_rate": 3.6307927329038736e-05, - "loss": 2.3543, - "step": 157030 - }, - { - "epoch": 0.27, - "learning_rate": 3.630705538911191e-05, - "loss": 2.4215, - "step": 157040 - }, - { - "epoch": 0.27, - "learning_rate": 3.630618344918509e-05, - "loss": 2.383, - "step": 157050 - }, - { - "epoch": 0.27, - "learning_rate": 3.630531150925826e-05, - "loss": 2.5181, - "step": 157060 - }, - { - "epoch": 0.27, - "learning_rate": 3.630443956933143e-05, - "loss": 2.5034, - "step": 157070 - }, - { - "epoch": 0.27, - "learning_rate": 3.630356762940461e-05, - "loss": 2.4443, - "step": 157080 - }, - { - "epoch": 0.27, - "learning_rate": 3.630269568947778e-05, - "loss": 2.4164, - "step": 157090 - }, - { - "epoch": 0.27, - "learning_rate": 3.630182374955095e-05, - "loss": 2.4502, - "step": 157100 - }, - { - "epoch": 0.27, - "learning_rate": 3.6300951809624126e-05, - "loss": 2.4662, - "step": 157110 - }, - { - "epoch": 0.27, - "learning_rate": 3.6300079869697303e-05, - "loss": 2.4841, - "step": 157120 - }, - { - "epoch": 0.27, - "learning_rate": 3.6299207929770474e-05, - "loss": 2.4678, - "step": 157130 - }, - { - "epoch": 0.27, - "learning_rate": 3.6298335989843644e-05, - "loss": 2.4524, - "step": 157140 - }, - { - "epoch": 0.27, - "learning_rate": 3.629746404991682e-05, - "loss": 2.4058, - "step": 157150 - }, - { - "epoch": 0.27, - "learning_rate": 3.629659210998999e-05, - "loss": 2.4994, - "step": 157160 - }, - { - "epoch": 0.27, - "learning_rate": 3.629572017006316e-05, - "loss": 2.5034, - "step": 157170 - }, - { - "epoch": 0.27, - "learning_rate": 3.629484823013633e-05, - "loss": 2.4819, - "step": 157180 - }, - { - "epoch": 0.27, - "learning_rate": 3.6293976290209516e-05, - "loss": 2.5782, - "step": 157190 - }, - { - "epoch": 0.27, - "learning_rate": 3.629310435028269e-05, - "loss": 2.3965, - "step": 157200 - }, - { - "epoch": 0.27, - "learning_rate": 3.629223241035586e-05, - "loss": 2.4526, - "step": 157210 - }, - { - "epoch": 0.27, - "learning_rate": 3.6291360470429034e-05, - "loss": 2.4886, - "step": 157220 - }, - { - "epoch": 0.27, - "learning_rate": 3.6290488530502205e-05, - "loss": 2.5081, - "step": 157230 - }, - { - "epoch": 0.27, - "learning_rate": 3.6289616590575375e-05, - "loss": 2.4405, - "step": 157240 - }, - { - "epoch": 0.27, - "learning_rate": 3.6288744650648546e-05, - "loss": 2.5502, - "step": 157250 - }, - { - "epoch": 0.27, - "learning_rate": 3.628787271072173e-05, - "loss": 2.4542, - "step": 157260 - }, - { - "epoch": 0.27, - "learning_rate": 3.62870007707949e-05, - "loss": 2.3706, - "step": 157270 - }, - { - "epoch": 0.27, - "learning_rate": 3.628612883086807e-05, - "loss": 2.5007, - "step": 157280 - }, - { - "epoch": 0.27, - "learning_rate": 3.628525689094124e-05, - "loss": 2.3579, - "step": 157290 - }, - { - "epoch": 0.27, - "learning_rate": 3.628438495101442e-05, - "loss": 2.3731, - "step": 157300 - }, - { - "epoch": 0.27, - "learning_rate": 3.628351301108759e-05, - "loss": 2.4236, - "step": 157310 - }, - { - "epoch": 0.27, - "learning_rate": 3.628264107116076e-05, - "loss": 2.3747, - "step": 157320 - }, - { - "epoch": 0.27, - "learning_rate": 3.6281769131233936e-05, - "loss": 2.4181, - "step": 157330 - }, - { - "epoch": 0.27, - "learning_rate": 3.628089719130711e-05, - "loss": 2.4565, - "step": 157340 - }, - { - "epoch": 0.27, - "learning_rate": 3.628002525138028e-05, - "loss": 2.4621, - "step": 157350 - }, - { - "epoch": 0.27, - "learning_rate": 3.6279153311453454e-05, - "loss": 2.4596, - "step": 157360 - }, - { - "epoch": 0.27, - "learning_rate": 3.627828137152663e-05, - "loss": 2.4082, - "step": 157370 - }, - { - "epoch": 0.27, - "learning_rate": 3.62774094315998e-05, - "loss": 2.4693, - "step": 157380 - }, - { - "epoch": 0.27, - "learning_rate": 3.627653749167297e-05, - "loss": 2.3981, - "step": 157390 - }, - { - "epoch": 0.27, - "learning_rate": 3.627566555174615e-05, - "loss": 2.5457, - "step": 157400 - }, - { - "epoch": 0.27, - "learning_rate": 3.6274793611819326e-05, - "loss": 2.4339, - "step": 157410 - }, - { - "epoch": 0.27, - "learning_rate": 3.6273921671892496e-05, - "loss": 2.4549, - "step": 157420 - }, - { - "epoch": 0.27, - "learning_rate": 3.6273049731965667e-05, - "loss": 2.4571, - "step": 157430 - }, - { - "epoch": 0.27, - "learning_rate": 3.6272177792038844e-05, - "loss": 2.3742, - "step": 157440 - }, - { - "epoch": 0.27, - "learning_rate": 3.6271305852112014e-05, - "loss": 2.6293, - "step": 157450 - }, - { - "epoch": 0.27, - "learning_rate": 3.6270433912185185e-05, - "loss": 2.4379, - "step": 157460 - }, - { - "epoch": 0.27, - "learning_rate": 3.626956197225836e-05, - "loss": 2.5224, - "step": 157470 - }, - { - "epoch": 0.27, - "learning_rate": 3.626869003233153e-05, - "loss": 2.3801, - "step": 157480 - }, - { - "epoch": 0.27, - "learning_rate": 3.626781809240471e-05, - "loss": 2.388, - "step": 157490 - }, - { - "epoch": 0.27, - "learning_rate": 3.626694615247788e-05, - "loss": 2.5315, - "step": 157500 - }, - { - "epoch": 0.27, - "learning_rate": 3.626607421255106e-05, - "loss": 2.4945, - "step": 157510 - }, - { - "epoch": 0.27, - "learning_rate": 3.626520227262423e-05, - "loss": 2.3014, - "step": 157520 - }, - { - "epoch": 0.27, - "learning_rate": 3.62643303326974e-05, - "loss": 2.431, - "step": 157530 - }, - { - "epoch": 0.27, - "learning_rate": 3.6263458392770575e-05, - "loss": 2.4098, - "step": 157540 - }, - { - "epoch": 0.27, - "learning_rate": 3.6262586452843745e-05, - "loss": 2.4461, - "step": 157550 - }, - { - "epoch": 0.27, - "learning_rate": 3.626171451291692e-05, - "loss": 2.5093, - "step": 157560 - }, - { - "epoch": 0.27, - "learning_rate": 3.626084257299009e-05, - "loss": 2.4942, - "step": 157570 - }, - { - "epoch": 0.27, - "learning_rate": 3.625997063306327e-05, - "loss": 2.4958, - "step": 157580 - }, - { - "epoch": 0.27, - "learning_rate": 3.625909869313644e-05, - "loss": 2.518, - "step": 157590 - }, - { - "epoch": 0.27, - "learning_rate": 3.625822675320961e-05, - "loss": 2.5571, - "step": 157600 - }, - { - "epoch": 0.27, - "learning_rate": 3.625735481328279e-05, - "loss": 2.3392, - "step": 157610 - }, - { - "epoch": 0.27, - "learning_rate": 3.625648287335596e-05, - "loss": 2.4738, - "step": 157620 - }, - { - "epoch": 0.27, - "learning_rate": 3.6255610933429135e-05, - "loss": 2.559, - "step": 157630 - }, - { - "epoch": 0.27, - "learning_rate": 3.6254738993502306e-05, - "loss": 2.4398, - "step": 157640 - }, - { - "epoch": 0.27, - "learning_rate": 3.625386705357548e-05, - "loss": 2.385, - "step": 157650 - }, - { - "epoch": 0.27, - "learning_rate": 3.625299511364865e-05, - "loss": 2.4164, - "step": 157660 - }, - { - "epoch": 0.27, - "learning_rate": 3.6252123173721824e-05, - "loss": 2.5259, - "step": 157670 - }, - { - "epoch": 0.27, - "learning_rate": 3.6251251233794994e-05, - "loss": 2.4383, - "step": 157680 - }, - { - "epoch": 0.27, - "learning_rate": 3.625037929386817e-05, - "loss": 2.5332, - "step": 157690 - }, - { - "epoch": 0.28, - "learning_rate": 3.624950735394134e-05, - "loss": 2.4792, - "step": 157700 - }, - { - "epoch": 0.28, - "learning_rate": 3.624863541401452e-05, - "loss": 2.5096, - "step": 157710 - }, - { - "epoch": 0.28, - "learning_rate": 3.6247763474087696e-05, - "loss": 2.4969, - "step": 157720 - }, - { - "epoch": 0.28, - "learning_rate": 3.6246891534160866e-05, - "loss": 2.3412, - "step": 157730 - }, - { - "epoch": 0.28, - "learning_rate": 3.6246019594234037e-05, - "loss": 2.5155, - "step": 157740 - }, - { - "epoch": 0.28, - "learning_rate": 3.624514765430721e-05, - "loss": 2.3689, - "step": 157750 - }, - { - "epoch": 0.28, - "learning_rate": 3.6244275714380384e-05, - "loss": 2.4016, - "step": 157760 - }, - { - "epoch": 0.28, - "learning_rate": 3.6243403774453554e-05, - "loss": 2.5478, - "step": 157770 - }, - { - "epoch": 0.28, - "learning_rate": 3.624253183452673e-05, - "loss": 2.5229, - "step": 157780 - }, - { - "epoch": 0.28, - "learning_rate": 3.62416598945999e-05, - "loss": 2.5097, - "step": 157790 - }, - { - "epoch": 0.28, - "learning_rate": 3.624078795467308e-05, - "loss": 2.3721, - "step": 157800 - }, - { - "epoch": 0.28, - "learning_rate": 3.623991601474625e-05, - "loss": 2.4563, - "step": 157810 - }, - { - "epoch": 0.28, - "learning_rate": 3.623904407481942e-05, - "loss": 2.4738, - "step": 157820 - }, - { - "epoch": 0.28, - "learning_rate": 3.62381721348926e-05, - "loss": 2.4515, - "step": 157830 - }, - { - "epoch": 0.28, - "learning_rate": 3.623730019496577e-05, - "loss": 2.456, - "step": 157840 - }, - { - "epoch": 0.28, - "learning_rate": 3.623642825503894e-05, - "loss": 2.5649, - "step": 157850 - }, - { - "epoch": 0.28, - "learning_rate": 3.6235556315112115e-05, - "loss": 2.5164, - "step": 157860 - }, - { - "epoch": 0.28, - "learning_rate": 3.623468437518529e-05, - "loss": 2.4528, - "step": 157870 - }, - { - "epoch": 0.28, - "learning_rate": 3.623381243525846e-05, - "loss": 2.4888, - "step": 157880 - }, - { - "epoch": 0.28, - "learning_rate": 3.623294049533163e-05, - "loss": 2.4247, - "step": 157890 - }, - { - "epoch": 0.28, - "learning_rate": 3.623206855540481e-05, - "loss": 2.4001, - "step": 157900 - }, - { - "epoch": 0.28, - "learning_rate": 3.623119661547798e-05, - "loss": 2.5063, - "step": 157910 - }, - { - "epoch": 0.28, - "learning_rate": 3.623032467555115e-05, - "loss": 2.4233, - "step": 157920 - }, - { - "epoch": 0.28, - "learning_rate": 3.622945273562433e-05, - "loss": 2.4055, - "step": 157930 - }, - { - "epoch": 0.28, - "learning_rate": 3.6228580795697505e-05, - "loss": 2.4862, - "step": 157940 - }, - { - "epoch": 0.28, - "learning_rate": 3.6227708855770676e-05, - "loss": 2.4465, - "step": 157950 - }, - { - "epoch": 0.28, - "learning_rate": 3.6226836915843846e-05, - "loss": 2.4754, - "step": 157960 - }, - { - "epoch": 0.28, - "learning_rate": 3.622596497591702e-05, - "loss": 2.4737, - "step": 157970 - }, - { - "epoch": 0.28, - "learning_rate": 3.6225093035990193e-05, - "loss": 2.3204, - "step": 157980 - }, - { - "epoch": 0.28, - "learning_rate": 3.6224221096063364e-05, - "loss": 2.5267, - "step": 157990 - }, - { - "epoch": 0.28, - "learning_rate": 3.622334915613654e-05, - "loss": 2.4259, - "step": 158000 - }, - { - "epoch": 0.28, - "learning_rate": 3.622247721620972e-05, - "loss": 2.3581, - "step": 158010 - }, - { - "epoch": 0.28, - "learning_rate": 3.622160527628289e-05, - "loss": 2.4394, - "step": 158020 - }, - { - "epoch": 0.28, - "learning_rate": 3.622073333635606e-05, - "loss": 2.4651, - "step": 158030 - }, - { - "epoch": 0.28, - "learning_rate": 3.6219861396429236e-05, - "loss": 2.4093, - "step": 158040 - }, - { - "epoch": 0.28, - "learning_rate": 3.6218989456502406e-05, - "loss": 2.3624, - "step": 158050 - }, - { - "epoch": 0.28, - "learning_rate": 3.621811751657558e-05, - "loss": 2.4489, - "step": 158060 - }, - { - "epoch": 0.28, - "learning_rate": 3.6217245576648754e-05, - "loss": 2.464, - "step": 158070 - }, - { - "epoch": 0.28, - "learning_rate": 3.621637363672193e-05, - "loss": 2.6171, - "step": 158080 - }, - { - "epoch": 0.28, - "learning_rate": 3.62155016967951e-05, - "loss": 2.4873, - "step": 158090 - }, - { - "epoch": 0.28, - "learning_rate": 3.621462975686827e-05, - "loss": 2.4508, - "step": 158100 - }, - { - "epoch": 0.28, - "learning_rate": 3.621375781694145e-05, - "loss": 2.5439, - "step": 158110 - }, - { - "epoch": 0.28, - "learning_rate": 3.621288587701462e-05, - "loss": 2.4547, - "step": 158120 - }, - { - "epoch": 0.28, - "learning_rate": 3.621201393708779e-05, - "loss": 2.5828, - "step": 158130 - }, - { - "epoch": 0.28, - "learning_rate": 3.621114199716096e-05, - "loss": 2.5051, - "step": 158140 - }, - { - "epoch": 0.28, - "learning_rate": 3.621027005723414e-05, - "loss": 2.4019, - "step": 158150 - }, - { - "epoch": 0.28, - "learning_rate": 3.6209398117307315e-05, - "loss": 2.4636, - "step": 158160 - }, - { - "epoch": 0.28, - "learning_rate": 3.6208526177380485e-05, - "loss": 2.5634, - "step": 158170 - }, - { - "epoch": 0.28, - "learning_rate": 3.620765423745366e-05, - "loss": 2.4104, - "step": 158180 - }, - { - "epoch": 0.28, - "learning_rate": 3.620678229752683e-05, - "loss": 2.4341, - "step": 158190 - }, - { - "epoch": 0.28, - "learning_rate": 3.62059103576e-05, - "loss": 2.555, - "step": 158200 - }, - { - "epoch": 0.28, - "learning_rate": 3.620503841767317e-05, - "loss": 2.4247, - "step": 158210 - }, - { - "epoch": 0.28, - "learning_rate": 3.620416647774635e-05, - "loss": 2.3986, - "step": 158220 - }, - { - "epoch": 0.28, - "learning_rate": 3.620329453781953e-05, - "loss": 2.3833, - "step": 158230 - }, - { - "epoch": 0.28, - "learning_rate": 3.62024225978927e-05, - "loss": 2.4761, - "step": 158240 - }, - { - "epoch": 0.28, - "learning_rate": 3.620155065796587e-05, - "loss": 2.4916, - "step": 158250 - }, - { - "epoch": 0.28, - "learning_rate": 3.6200678718039045e-05, - "loss": 2.4935, - "step": 158260 - }, - { - "epoch": 0.28, - "learning_rate": 3.6199806778112216e-05, - "loss": 2.4511, - "step": 158270 - }, - { - "epoch": 0.28, - "learning_rate": 3.6198934838185386e-05, - "loss": 2.4797, - "step": 158280 - }, - { - "epoch": 0.28, - "learning_rate": 3.619806289825856e-05, - "loss": 2.4778, - "step": 158290 - }, - { - "epoch": 0.28, - "learning_rate": 3.619719095833174e-05, - "loss": 2.4833, - "step": 158300 - }, - { - "epoch": 0.28, - "learning_rate": 3.619631901840491e-05, - "loss": 2.3816, - "step": 158310 - }, - { - "epoch": 0.28, - "learning_rate": 3.619544707847808e-05, - "loss": 2.4974, - "step": 158320 - }, - { - "epoch": 0.28, - "learning_rate": 3.619457513855126e-05, - "loss": 2.4197, - "step": 158330 - }, - { - "epoch": 0.28, - "learning_rate": 3.619370319862443e-05, - "loss": 2.3479, - "step": 158340 - }, - { - "epoch": 0.28, - "learning_rate": 3.61928312586976e-05, - "loss": 2.4866, - "step": 158350 - }, - { - "epoch": 0.28, - "learning_rate": 3.6191959318770776e-05, - "loss": 2.3751, - "step": 158360 - }, - { - "epoch": 0.28, - "learning_rate": 3.619108737884395e-05, - "loss": 2.5667, - "step": 158370 - }, - { - "epoch": 0.28, - "learning_rate": 3.6190215438917124e-05, - "loss": 2.5504, - "step": 158380 - }, - { - "epoch": 0.28, - "learning_rate": 3.6189343498990294e-05, - "loss": 2.4182, - "step": 158390 - }, - { - "epoch": 0.28, - "learning_rate": 3.618847155906347e-05, - "loss": 2.377, - "step": 158400 - }, - { - "epoch": 0.28, - "learning_rate": 3.618759961913664e-05, - "loss": 2.3578, - "step": 158410 - }, - { - "epoch": 0.28, - "learning_rate": 3.618672767920981e-05, - "loss": 2.572, - "step": 158420 - }, - { - "epoch": 0.28, - "learning_rate": 3.618585573928299e-05, - "loss": 2.3768, - "step": 158430 - }, - { - "epoch": 0.28, - "learning_rate": 3.618498379935616e-05, - "loss": 2.636, - "step": 158440 - }, - { - "epoch": 0.28, - "learning_rate": 3.618411185942934e-05, - "loss": 2.3853, - "step": 158450 - }, - { - "epoch": 0.28, - "learning_rate": 3.618323991950251e-05, - "loss": 2.5109, - "step": 158460 - }, - { - "epoch": 0.28, - "learning_rate": 3.6182367979575684e-05, - "loss": 2.3925, - "step": 158470 - }, - { - "epoch": 0.28, - "learning_rate": 3.6181496039648855e-05, - "loss": 2.5192, - "step": 158480 - }, - { - "epoch": 0.28, - "learning_rate": 3.6180624099722025e-05, - "loss": 2.4908, - "step": 158490 - }, - { - "epoch": 0.28, - "learning_rate": 3.61797521597952e-05, - "loss": 2.5071, - "step": 158500 - }, - { - "epoch": 0.28, - "learning_rate": 3.617888021986837e-05, - "loss": 2.382, - "step": 158510 - }, - { - "epoch": 0.28, - "learning_rate": 3.617800827994154e-05, - "loss": 2.4319, - "step": 158520 - }, - { - "epoch": 0.28, - "learning_rate": 3.617713634001472e-05, - "loss": 2.5312, - "step": 158530 - }, - { - "epoch": 0.28, - "learning_rate": 3.61762644000879e-05, - "loss": 2.3542, - "step": 158540 - }, - { - "epoch": 0.28, - "learning_rate": 3.617539246016107e-05, - "loss": 2.3892, - "step": 158550 - }, - { - "epoch": 0.28, - "learning_rate": 3.617452052023424e-05, - "loss": 2.4892, - "step": 158560 - }, - { - "epoch": 0.28, - "learning_rate": 3.6173648580307415e-05, - "loss": 2.5553, - "step": 158570 - }, - { - "epoch": 0.28, - "learning_rate": 3.6172776640380586e-05, - "loss": 2.5329, - "step": 158580 - }, - { - "epoch": 0.28, - "learning_rate": 3.6171904700453756e-05, - "loss": 2.4897, - "step": 158590 - }, - { - "epoch": 0.28, - "learning_rate": 3.617103276052693e-05, - "loss": 2.4238, - "step": 158600 - }, - { - "epoch": 0.28, - "learning_rate": 3.617016082060011e-05, - "loss": 2.5928, - "step": 158610 - }, - { - "epoch": 0.28, - "learning_rate": 3.616928888067328e-05, - "loss": 2.5827, - "step": 158620 - }, - { - "epoch": 0.28, - "learning_rate": 3.616841694074645e-05, - "loss": 2.4721, - "step": 158630 - }, - { - "epoch": 0.28, - "learning_rate": 3.616754500081962e-05, - "loss": 2.4641, - "step": 158640 - }, - { - "epoch": 0.28, - "learning_rate": 3.61666730608928e-05, - "loss": 2.4211, - "step": 158650 - }, - { - "epoch": 0.28, - "learning_rate": 3.616580112096597e-05, - "loss": 2.506, - "step": 158660 - }, - { - "epoch": 0.28, - "learning_rate": 3.616492918103914e-05, - "loss": 2.3982, - "step": 158670 - }, - { - "epoch": 0.28, - "learning_rate": 3.6164057241112323e-05, - "loss": 2.4974, - "step": 158680 - }, - { - "epoch": 0.28, - "learning_rate": 3.6163185301185494e-05, - "loss": 2.3699, - "step": 158690 - }, - { - "epoch": 0.28, - "learning_rate": 3.6162313361258664e-05, - "loss": 2.4624, - "step": 158700 - }, - { - "epoch": 0.28, - "learning_rate": 3.6161441421331835e-05, - "loss": 2.5034, - "step": 158710 - }, - { - "epoch": 0.28, - "learning_rate": 3.616056948140501e-05, - "loss": 2.3561, - "step": 158720 - }, - { - "epoch": 0.28, - "learning_rate": 3.615969754147818e-05, - "loss": 2.2772, - "step": 158730 - }, - { - "epoch": 0.28, - "learning_rate": 3.615882560155135e-05, - "loss": 2.3848, - "step": 158740 - }, - { - "epoch": 0.28, - "learning_rate": 3.615795366162453e-05, - "loss": 2.4483, - "step": 158750 - }, - { - "epoch": 0.28, - "learning_rate": 3.615708172169771e-05, - "loss": 2.4917, - "step": 158760 - }, - { - "epoch": 0.28, - "learning_rate": 3.615620978177088e-05, - "loss": 2.5059, - "step": 158770 - }, - { - "epoch": 0.28, - "learning_rate": 3.615533784184405e-05, - "loss": 2.4944, - "step": 158780 - }, - { - "epoch": 0.28, - "learning_rate": 3.6154465901917225e-05, - "loss": 2.5317, - "step": 158790 - }, - { - "epoch": 0.28, - "learning_rate": 3.6153593961990395e-05, - "loss": 2.5851, - "step": 158800 - }, - { - "epoch": 0.28, - "learning_rate": 3.6152722022063566e-05, - "loss": 2.4465, - "step": 158810 - }, - { - "epoch": 0.28, - "learning_rate": 3.615185008213674e-05, - "loss": 2.5491, - "step": 158820 - }, - { - "epoch": 0.28, - "learning_rate": 3.615097814220992e-05, - "loss": 2.5602, - "step": 158830 - }, - { - "epoch": 0.28, - "learning_rate": 3.615010620228309e-05, - "loss": 2.4775, - "step": 158840 - }, - { - "epoch": 0.28, - "learning_rate": 3.614923426235626e-05, - "loss": 2.2982, - "step": 158850 - }, - { - "epoch": 0.28, - "learning_rate": 3.614836232242944e-05, - "loss": 2.4727, - "step": 158860 - }, - { - "epoch": 0.28, - "learning_rate": 3.614749038250261e-05, - "loss": 2.4499, - "step": 158870 - }, - { - "epoch": 0.28, - "learning_rate": 3.614661844257578e-05, - "loss": 2.5835, - "step": 158880 - }, - { - "epoch": 0.28, - "learning_rate": 3.6145746502648956e-05, - "loss": 2.4609, - "step": 158890 - }, - { - "epoch": 0.28, - "learning_rate": 3.614487456272213e-05, - "loss": 2.4769, - "step": 158900 - }, - { - "epoch": 0.28, - "learning_rate": 3.61440026227953e-05, - "loss": 2.5274, - "step": 158910 - }, - { - "epoch": 0.28, - "learning_rate": 3.6143130682868474e-05, - "loss": 2.4963, - "step": 158920 - }, - { - "epoch": 0.28, - "learning_rate": 3.614225874294165e-05, - "loss": 2.508, - "step": 158930 - }, - { - "epoch": 0.28, - "learning_rate": 3.614138680301482e-05, - "loss": 2.5174, - "step": 158940 - }, - { - "epoch": 0.28, - "learning_rate": 3.614051486308799e-05, - "loss": 2.4868, - "step": 158950 - }, - { - "epoch": 0.28, - "learning_rate": 3.613964292316117e-05, - "loss": 2.5373, - "step": 158960 - }, - { - "epoch": 0.28, - "learning_rate": 3.6138770983234346e-05, - "loss": 2.479, - "step": 158970 - }, - { - "epoch": 0.28, - "learning_rate": 3.6137899043307516e-05, - "loss": 2.3461, - "step": 158980 - }, - { - "epoch": 0.28, - "learning_rate": 3.613702710338069e-05, - "loss": 2.4132, - "step": 158990 - }, - { - "epoch": 0.28, - "learning_rate": 3.6136155163453864e-05, - "loss": 2.6106, - "step": 159000 - }, - { - "epoch": 0.28, - "learning_rate": 3.6135283223527034e-05, - "loss": 2.4851, - "step": 159010 - }, - { - "epoch": 0.28, - "learning_rate": 3.6134411283600205e-05, - "loss": 2.5289, - "step": 159020 - }, - { - "epoch": 0.28, - "learning_rate": 3.6133539343673375e-05, - "loss": 2.4335, - "step": 159030 - }, - { - "epoch": 0.28, - "learning_rate": 3.613266740374655e-05, - "loss": 2.4513, - "step": 159040 - }, - { - "epoch": 0.28, - "learning_rate": 3.613179546381973e-05, - "loss": 2.4876, - "step": 159050 - }, - { - "epoch": 0.28, - "learning_rate": 3.61309235238929e-05, - "loss": 2.5026, - "step": 159060 - }, - { - "epoch": 0.28, - "learning_rate": 3.613005158396608e-05, - "loss": 2.4494, - "step": 159070 - }, - { - "epoch": 0.28, - "learning_rate": 3.612917964403925e-05, - "loss": 2.4427, - "step": 159080 - }, - { - "epoch": 0.28, - "learning_rate": 3.612830770411242e-05, - "loss": 2.4911, - "step": 159090 - }, - { - "epoch": 0.28, - "learning_rate": 3.612743576418559e-05, - "loss": 2.5413, - "step": 159100 - }, - { - "epoch": 0.28, - "learning_rate": 3.6126563824258765e-05, - "loss": 2.4199, - "step": 159110 - }, - { - "epoch": 0.28, - "learning_rate": 3.612569188433194e-05, - "loss": 2.3814, - "step": 159120 - }, - { - "epoch": 0.28, - "learning_rate": 3.612481994440511e-05, - "loss": 2.4526, - "step": 159130 - }, - { - "epoch": 0.28, - "learning_rate": 3.612394800447828e-05, - "loss": 2.4609, - "step": 159140 - }, - { - "epoch": 0.28, - "learning_rate": 3.612307606455146e-05, - "loss": 2.5237, - "step": 159150 - }, - { - "epoch": 0.28, - "learning_rate": 3.612220412462463e-05, - "loss": 2.4578, - "step": 159160 - }, - { - "epoch": 0.28, - "learning_rate": 3.61213321846978e-05, - "loss": 2.4745, - "step": 159170 - }, - { - "epoch": 0.28, - "learning_rate": 3.612046024477098e-05, - "loss": 2.5355, - "step": 159180 - }, - { - "epoch": 0.28, - "learning_rate": 3.611958830484415e-05, - "loss": 2.5195, - "step": 159190 - }, - { - "epoch": 0.28, - "learning_rate": 3.6118716364917326e-05, - "loss": 2.532, - "step": 159200 - }, - { - "epoch": 0.28, - "learning_rate": 3.6117844424990496e-05, - "loss": 2.517, - "step": 159210 - }, - { - "epoch": 0.28, - "learning_rate": 3.611697248506367e-05, - "loss": 2.4345, - "step": 159220 - }, - { - "epoch": 0.28, - "learning_rate": 3.6116100545136844e-05, - "loss": 2.4636, - "step": 159230 - }, - { - "epoch": 0.28, - "learning_rate": 3.6115228605210014e-05, - "loss": 2.4148, - "step": 159240 - }, - { - "epoch": 0.28, - "learning_rate": 3.611435666528319e-05, - "loss": 2.5263, - "step": 159250 - }, - { - "epoch": 0.28, - "learning_rate": 3.611348472535636e-05, - "loss": 2.5123, - "step": 159260 - }, - { - "epoch": 0.28, - "learning_rate": 3.611261278542954e-05, - "loss": 2.4818, - "step": 159270 - }, - { - "epoch": 0.28, - "learning_rate": 3.611174084550271e-05, - "loss": 2.4063, - "step": 159280 - }, - { - "epoch": 0.28, - "learning_rate": 3.6110868905575886e-05, - "loss": 2.4991, - "step": 159290 - }, - { - "epoch": 0.28, - "learning_rate": 3.6109996965649057e-05, - "loss": 2.4683, - "step": 159300 - }, - { - "epoch": 0.28, - "learning_rate": 3.610912502572223e-05, - "loss": 2.3689, - "step": 159310 - }, - { - "epoch": 0.28, - "learning_rate": 3.6108253085795404e-05, - "loss": 2.4414, - "step": 159320 - }, - { - "epoch": 0.28, - "learning_rate": 3.6107381145868574e-05, - "loss": 2.405, - "step": 159330 - }, - { - "epoch": 0.28, - "learning_rate": 3.6106509205941745e-05, - "loss": 2.5283, - "step": 159340 - }, - { - "epoch": 0.28, - "learning_rate": 3.610563726601492e-05, - "loss": 2.5163, - "step": 159350 - }, - { - "epoch": 0.28, - "learning_rate": 3.61047653260881e-05, - "loss": 2.4752, - "step": 159360 - }, - { - "epoch": 0.28, - "learning_rate": 3.610389338616127e-05, - "loss": 2.5769, - "step": 159370 - }, - { - "epoch": 0.28, - "learning_rate": 3.610302144623444e-05, - "loss": 2.4702, - "step": 159380 - }, - { - "epoch": 0.28, - "learning_rate": 3.610214950630762e-05, - "loss": 2.5041, - "step": 159390 - }, - { - "epoch": 0.28, - "learning_rate": 3.610127756638079e-05, - "loss": 2.4992, - "step": 159400 - }, - { - "epoch": 0.28, - "learning_rate": 3.610040562645396e-05, - "loss": 2.4641, - "step": 159410 - }, - { - "epoch": 0.28, - "learning_rate": 3.6099533686527135e-05, - "loss": 2.4176, - "step": 159420 - }, - { - "epoch": 0.28, - "learning_rate": 3.609866174660031e-05, - "loss": 2.502, - "step": 159430 - }, - { - "epoch": 0.28, - "learning_rate": 3.609778980667348e-05, - "loss": 2.4075, - "step": 159440 - }, - { - "epoch": 0.28, - "learning_rate": 3.609691786674665e-05, - "loss": 2.4912, - "step": 159450 - }, - { - "epoch": 0.28, - "learning_rate": 3.609604592681983e-05, - "loss": 2.5276, - "step": 159460 - }, - { - "epoch": 0.28, - "learning_rate": 3.6095173986893e-05, - "loss": 2.4742, - "step": 159470 - }, - { - "epoch": 0.28, - "learning_rate": 3.609430204696617e-05, - "loss": 2.475, - "step": 159480 - }, - { - "epoch": 0.28, - "learning_rate": 3.609343010703935e-05, - "loss": 2.405, - "step": 159490 - }, - { - "epoch": 0.28, - "learning_rate": 3.6092558167112525e-05, - "loss": 2.4384, - "step": 159500 - }, - { - "epoch": 0.28, - "learning_rate": 3.6091686227185696e-05, - "loss": 2.5349, - "step": 159510 - }, - { - "epoch": 0.28, - "learning_rate": 3.6090814287258866e-05, - "loss": 2.4869, - "step": 159520 - }, - { - "epoch": 0.28, - "learning_rate": 3.608994234733204e-05, - "loss": 2.4231, - "step": 159530 - }, - { - "epoch": 0.28, - "learning_rate": 3.6089070407405213e-05, - "loss": 2.5343, - "step": 159540 - }, - { - "epoch": 0.28, - "learning_rate": 3.6088198467478384e-05, - "loss": 2.4278, - "step": 159550 - }, - { - "epoch": 0.28, - "learning_rate": 3.6087326527551554e-05, - "loss": 2.3507, - "step": 159560 - }, - { - "epoch": 0.28, - "learning_rate": 3.608645458762474e-05, - "loss": 2.3748, - "step": 159570 - }, - { - "epoch": 0.28, - "learning_rate": 3.608558264769791e-05, - "loss": 2.3294, - "step": 159580 - }, - { - "epoch": 0.28, - "learning_rate": 3.608471070777108e-05, - "loss": 2.3537, - "step": 159590 - }, - { - "epoch": 0.28, - "learning_rate": 3.608383876784425e-05, - "loss": 2.4014, - "step": 159600 - }, - { - "epoch": 0.28, - "learning_rate": 3.6082966827917426e-05, - "loss": 2.4964, - "step": 159610 - }, - { - "epoch": 0.28, - "learning_rate": 3.60820948879906e-05, - "loss": 2.5006, - "step": 159620 - }, - { - "epoch": 0.28, - "learning_rate": 3.608122294806377e-05, - "loss": 2.3333, - "step": 159630 - }, - { - "epoch": 0.28, - "learning_rate": 3.608035100813695e-05, - "loss": 2.5203, - "step": 159640 - }, - { - "epoch": 0.28, - "learning_rate": 3.607947906821012e-05, - "loss": 2.4291, - "step": 159650 - }, - { - "epoch": 0.28, - "learning_rate": 3.607860712828329e-05, - "loss": 2.5787, - "step": 159660 - }, - { - "epoch": 0.28, - "learning_rate": 3.607773518835646e-05, - "loss": 2.5119, - "step": 159670 - }, - { - "epoch": 0.28, - "learning_rate": 3.607686324842964e-05, - "loss": 2.382, - "step": 159680 - }, - { - "epoch": 0.28, - "learning_rate": 3.607599130850281e-05, - "loss": 2.5071, - "step": 159690 - }, - { - "epoch": 0.28, - "learning_rate": 3.607511936857598e-05, - "loss": 2.5098, - "step": 159700 - }, - { - "epoch": 0.28, - "learning_rate": 3.607424742864916e-05, - "loss": 2.5453, - "step": 159710 - }, - { - "epoch": 0.28, - "learning_rate": 3.6073375488722335e-05, - "loss": 2.4523, - "step": 159720 - }, - { - "epoch": 0.28, - "learning_rate": 3.6072503548795505e-05, - "loss": 2.3715, - "step": 159730 - }, - { - "epoch": 0.28, - "learning_rate": 3.6071631608868675e-05, - "loss": 2.5125, - "step": 159740 - }, - { - "epoch": 0.28, - "learning_rate": 3.607075966894185e-05, - "loss": 2.4511, - "step": 159750 - }, - { - "epoch": 0.28, - "learning_rate": 3.606988772901502e-05, - "loss": 2.5003, - "step": 159760 - }, - { - "epoch": 0.28, - "learning_rate": 3.606901578908819e-05, - "loss": 2.4033, - "step": 159770 - }, - { - "epoch": 0.28, - "learning_rate": 3.606814384916137e-05, - "loss": 2.3536, - "step": 159780 - }, - { - "epoch": 0.28, - "learning_rate": 3.606727190923455e-05, - "loss": 2.3868, - "step": 159790 - }, - { - "epoch": 0.28, - "learning_rate": 3.606639996930772e-05, - "loss": 2.3987, - "step": 159800 - }, - { - "epoch": 0.28, - "learning_rate": 3.606552802938089e-05, - "loss": 2.5167, - "step": 159810 - }, - { - "epoch": 0.28, - "learning_rate": 3.6064656089454065e-05, - "loss": 2.5118, - "step": 159820 - }, - { - "epoch": 0.28, - "learning_rate": 3.6063784149527236e-05, - "loss": 2.4024, - "step": 159830 - }, - { - "epoch": 0.28, - "learning_rate": 3.6062912209600406e-05, - "loss": 2.4471, - "step": 159840 - }, - { - "epoch": 0.28, - "learning_rate": 3.6062040269673583e-05, - "loss": 2.4761, - "step": 159850 - }, - { - "epoch": 0.28, - "learning_rate": 3.6061168329746754e-05, - "loss": 2.566, - "step": 159860 - }, - { - "epoch": 0.28, - "learning_rate": 3.606029638981993e-05, - "loss": 2.4395, - "step": 159870 - }, - { - "epoch": 0.28, - "learning_rate": 3.60594244498931e-05, - "loss": 2.3773, - "step": 159880 - }, - { - "epoch": 0.28, - "learning_rate": 3.605855250996628e-05, - "loss": 2.5625, - "step": 159890 - }, - { - "epoch": 0.28, - "learning_rate": 3.605768057003945e-05, - "loss": 2.3982, - "step": 159900 - }, - { - "epoch": 0.28, - "learning_rate": 3.605680863011262e-05, - "loss": 2.5109, - "step": 159910 - }, - { - "epoch": 0.28, - "learning_rate": 3.6055936690185796e-05, - "loss": 2.4417, - "step": 159920 - }, - { - "epoch": 0.28, - "learning_rate": 3.605506475025897e-05, - "loss": 2.5569, - "step": 159930 - }, - { - "epoch": 0.28, - "learning_rate": 3.6054192810332144e-05, - "loss": 2.4019, - "step": 159940 - }, - { - "epoch": 0.28, - "learning_rate": 3.6053320870405314e-05, - "loss": 2.3759, - "step": 159950 - }, - { - "epoch": 0.28, - "learning_rate": 3.605244893047849e-05, - "loss": 2.5832, - "step": 159960 - }, - { - "epoch": 0.28, - "learning_rate": 3.605157699055166e-05, - "loss": 2.4822, - "step": 159970 - }, - { - "epoch": 0.28, - "learning_rate": 3.605070505062483e-05, - "loss": 2.5388, - "step": 159980 - }, - { - "epoch": 0.28, - "learning_rate": 3.6049833110698e-05, - "loss": 2.4319, - "step": 159990 - }, - { - "epoch": 0.28, - "learning_rate": 3.604896117077118e-05, - "loss": 2.4019, - "step": 160000 - }, - { - "epoch": 0.28, - "learning_rate": 3.604808923084435e-05, - "loss": 2.4911, - "step": 160010 - }, - { - "epoch": 0.28, - "learning_rate": 3.604721729091753e-05, - "loss": 2.3876, - "step": 160020 - }, - { - "epoch": 0.28, - "learning_rate": 3.6046345350990704e-05, - "loss": 2.6499, - "step": 160030 - }, - { - "epoch": 0.28, - "learning_rate": 3.6045473411063875e-05, - "loss": 2.5657, - "step": 160040 - }, - { - "epoch": 0.28, - "learning_rate": 3.6044601471137045e-05, - "loss": 2.4525, - "step": 160050 - }, - { - "epoch": 0.28, - "learning_rate": 3.6043729531210216e-05, - "loss": 2.527, - "step": 160060 - }, - { - "epoch": 0.28, - "learning_rate": 3.604285759128339e-05, - "loss": 2.5589, - "step": 160070 - }, - { - "epoch": 0.28, - "learning_rate": 3.604198565135656e-05, - "loss": 2.5113, - "step": 160080 - }, - { - "epoch": 0.28, - "learning_rate": 3.604111371142974e-05, - "loss": 2.5132, - "step": 160090 - }, - { - "epoch": 0.28, - "learning_rate": 3.604024177150291e-05, - "loss": 2.4847, - "step": 160100 - }, - { - "epoch": 0.28, - "learning_rate": 3.603936983157609e-05, - "loss": 2.365, - "step": 160110 - }, - { - "epoch": 0.28, - "learning_rate": 3.603849789164926e-05, - "loss": 2.5025, - "step": 160120 - }, - { - "epoch": 0.28, - "learning_rate": 3.603762595172243e-05, - "loss": 2.4683, - "step": 160130 - }, - { - "epoch": 0.28, - "learning_rate": 3.6036754011795606e-05, - "loss": 2.5249, - "step": 160140 - }, - { - "epoch": 0.28, - "learning_rate": 3.6035882071868776e-05, - "loss": 2.4792, - "step": 160150 - }, - { - "epoch": 0.28, - "learning_rate": 3.603501013194195e-05, - "loss": 2.5081, - "step": 160160 - }, - { - "epoch": 0.28, - "learning_rate": 3.6034138192015124e-05, - "loss": 2.3498, - "step": 160170 - }, - { - "epoch": 0.28, - "learning_rate": 3.60332662520883e-05, - "loss": 2.54, - "step": 160180 - }, - { - "epoch": 0.28, - "learning_rate": 3.603239431216147e-05, - "loss": 2.4053, - "step": 160190 - }, - { - "epoch": 0.28, - "learning_rate": 3.603152237223464e-05, - "loss": 2.4748, - "step": 160200 - }, - { - "epoch": 0.28, - "learning_rate": 3.603065043230782e-05, - "loss": 2.475, - "step": 160210 - }, - { - "epoch": 0.28, - "learning_rate": 3.602977849238099e-05, - "loss": 2.5056, - "step": 160220 - }, - { - "epoch": 0.28, - "learning_rate": 3.602890655245416e-05, - "loss": 2.533, - "step": 160230 - }, - { - "epoch": 0.28, - "learning_rate": 3.602803461252734e-05, - "loss": 2.509, - "step": 160240 - }, - { - "epoch": 0.28, - "learning_rate": 3.6027162672600514e-05, - "loss": 2.5158, - "step": 160250 - }, - { - "epoch": 0.28, - "learning_rate": 3.6026290732673684e-05, - "loss": 2.43, - "step": 160260 - }, - { - "epoch": 0.28, - "learning_rate": 3.6025418792746855e-05, - "loss": 2.3634, - "step": 160270 - }, - { - "epoch": 0.28, - "learning_rate": 3.602454685282003e-05, - "loss": 2.4561, - "step": 160280 - }, - { - "epoch": 0.28, - "learning_rate": 3.60236749128932e-05, - "loss": 2.4939, - "step": 160290 - }, - { - "epoch": 0.28, - "learning_rate": 3.602280297296637e-05, - "loss": 2.533, - "step": 160300 - }, - { - "epoch": 0.28, - "learning_rate": 3.602193103303955e-05, - "loss": 2.4733, - "step": 160310 - }, - { - "epoch": 0.28, - "learning_rate": 3.602105909311273e-05, - "loss": 2.5626, - "step": 160320 - }, - { - "epoch": 0.28, - "learning_rate": 3.60201871531859e-05, - "loss": 2.4411, - "step": 160330 - }, - { - "epoch": 0.28, - "learning_rate": 3.601931521325907e-05, - "loss": 2.4735, - "step": 160340 - }, - { - "epoch": 0.28, - "learning_rate": 3.6018443273332245e-05, - "loss": 2.5209, - "step": 160350 - }, - { - "epoch": 0.28, - "learning_rate": 3.6017571333405415e-05, - "loss": 2.3299, - "step": 160360 - }, - { - "epoch": 0.28, - "learning_rate": 3.6016699393478586e-05, - "loss": 2.6316, - "step": 160370 - }, - { - "epoch": 0.28, - "learning_rate": 3.6015827453551756e-05, - "loss": 2.5081, - "step": 160380 - }, - { - "epoch": 0.28, - "learning_rate": 3.601495551362494e-05, - "loss": 2.5134, - "step": 160390 - }, - { - "epoch": 0.28, - "learning_rate": 3.601408357369811e-05, - "loss": 2.39, - "step": 160400 - }, - { - "epoch": 0.28, - "learning_rate": 3.601321163377128e-05, - "loss": 2.4445, - "step": 160410 - }, - { - "epoch": 0.28, - "learning_rate": 3.601233969384446e-05, - "loss": 2.5235, - "step": 160420 - }, - { - "epoch": 0.28, - "learning_rate": 3.601146775391763e-05, - "loss": 2.5852, - "step": 160430 - }, - { - "epoch": 0.28, - "learning_rate": 3.60105958139908e-05, - "loss": 2.3619, - "step": 160440 - }, - { - "epoch": 0.28, - "learning_rate": 3.600972387406397e-05, - "loss": 2.5189, - "step": 160450 - }, - { - "epoch": 0.28, - "learning_rate": 3.600885193413715e-05, - "loss": 2.5251, - "step": 160460 - }, - { - "epoch": 0.28, - "learning_rate": 3.600797999421032e-05, - "loss": 2.5485, - "step": 160470 - }, - { - "epoch": 0.28, - "learning_rate": 3.6007108054283494e-05, - "loss": 2.5654, - "step": 160480 - }, - { - "epoch": 0.28, - "learning_rate": 3.6006236114356664e-05, - "loss": 2.5539, - "step": 160490 - }, - { - "epoch": 0.28, - "learning_rate": 3.600536417442984e-05, - "loss": 2.3799, - "step": 160500 - }, - { - "epoch": 0.28, - "learning_rate": 3.600449223450301e-05, - "loss": 2.4116, - "step": 160510 - }, - { - "epoch": 0.28, - "learning_rate": 3.600362029457618e-05, - "loss": 2.5031, - "step": 160520 - }, - { - "epoch": 0.28, - "learning_rate": 3.600274835464936e-05, - "loss": 2.5526, - "step": 160530 - }, - { - "epoch": 0.28, - "learning_rate": 3.6001876414722536e-05, - "loss": 2.501, - "step": 160540 - }, - { - "epoch": 0.28, - "learning_rate": 3.600100447479571e-05, - "loss": 2.5118, - "step": 160550 - }, - { - "epoch": 0.28, - "learning_rate": 3.600013253486888e-05, - "loss": 2.3993, - "step": 160560 - }, - { - "epoch": 0.28, - "learning_rate": 3.5999260594942054e-05, - "loss": 2.4398, - "step": 160570 - }, - { - "epoch": 0.28, - "learning_rate": 3.5998388655015225e-05, - "loss": 2.475, - "step": 160580 - }, - { - "epoch": 0.28, - "learning_rate": 3.5997516715088395e-05, - "loss": 2.4782, - "step": 160590 - }, - { - "epoch": 0.28, - "learning_rate": 3.599664477516157e-05, - "loss": 2.4373, - "step": 160600 - }, - { - "epoch": 0.28, - "learning_rate": 3.599577283523475e-05, - "loss": 2.4974, - "step": 160610 - }, - { - "epoch": 0.28, - "learning_rate": 3.599490089530792e-05, - "loss": 2.5432, - "step": 160620 - }, - { - "epoch": 0.28, - "learning_rate": 3.599402895538109e-05, - "loss": 2.4291, - "step": 160630 - }, - { - "epoch": 0.28, - "learning_rate": 3.599315701545427e-05, - "loss": 2.5297, - "step": 160640 - }, - { - "epoch": 0.28, - "learning_rate": 3.599228507552744e-05, - "loss": 2.428, - "step": 160650 - }, - { - "epoch": 0.28, - "learning_rate": 3.599141313560061e-05, - "loss": 2.5287, - "step": 160660 - }, - { - "epoch": 0.28, - "learning_rate": 3.5990541195673785e-05, - "loss": 2.489, - "step": 160670 - }, - { - "epoch": 0.28, - "learning_rate": 3.5989669255746955e-05, - "loss": 2.4336, - "step": 160680 - }, - { - "epoch": 0.28, - "learning_rate": 3.598879731582013e-05, - "loss": 2.4365, - "step": 160690 - }, - { - "epoch": 0.28, - "learning_rate": 3.59879253758933e-05, - "loss": 2.523, - "step": 160700 - }, - { - "epoch": 0.28, - "learning_rate": 3.598705343596648e-05, - "loss": 2.4898, - "step": 160710 - }, - { - "epoch": 0.28, - "learning_rate": 3.598618149603965e-05, - "loss": 2.51, - "step": 160720 - }, - { - "epoch": 0.28, - "learning_rate": 3.598530955611282e-05, - "loss": 2.3696, - "step": 160730 - }, - { - "epoch": 0.28, - "learning_rate": 3.5984437616186e-05, - "loss": 2.4365, - "step": 160740 - }, - { - "epoch": 0.28, - "learning_rate": 3.598356567625917e-05, - "loss": 2.5552, - "step": 160750 - }, - { - "epoch": 0.28, - "learning_rate": 3.5982693736332346e-05, - "loss": 2.373, - "step": 160760 - }, - { - "epoch": 0.28, - "learning_rate": 3.5981821796405516e-05, - "loss": 2.5448, - "step": 160770 - }, - { - "epoch": 0.28, - "learning_rate": 3.598094985647869e-05, - "loss": 2.4785, - "step": 160780 - }, - { - "epoch": 0.28, - "learning_rate": 3.5980077916551864e-05, - "loss": 2.4516, - "step": 160790 - }, - { - "epoch": 0.28, - "learning_rate": 3.5979205976625034e-05, - "loss": 2.4978, - "step": 160800 - }, - { - "epoch": 0.28, - "learning_rate": 3.597833403669821e-05, - "loss": 2.42, - "step": 160810 - }, - { - "epoch": 0.28, - "learning_rate": 3.597746209677138e-05, - "loss": 2.4461, - "step": 160820 - }, - { - "epoch": 0.28, - "learning_rate": 3.597659015684456e-05, - "loss": 2.45, - "step": 160830 - }, - { - "epoch": 0.28, - "learning_rate": 3.597571821691773e-05, - "loss": 2.371, - "step": 160840 - }, - { - "epoch": 0.28, - "learning_rate": 3.5974846276990906e-05, - "loss": 2.4641, - "step": 160850 - }, - { - "epoch": 0.28, - "learning_rate": 3.5973974337064077e-05, - "loss": 2.5072, - "step": 160860 - }, - { - "epoch": 0.28, - "learning_rate": 3.597310239713725e-05, - "loss": 2.5882, - "step": 160870 - }, - { - "epoch": 0.28, - "learning_rate": 3.5972230457210424e-05, - "loss": 2.512, - "step": 160880 - }, - { - "epoch": 0.28, - "learning_rate": 3.5971358517283594e-05, - "loss": 2.4811, - "step": 160890 - }, - { - "epoch": 0.28, - "learning_rate": 3.5970486577356765e-05, - "loss": 2.4684, - "step": 160900 - }, - { - "epoch": 0.28, - "learning_rate": 3.596961463742994e-05, - "loss": 2.4771, - "step": 160910 - }, - { - "epoch": 0.28, - "learning_rate": 3.596874269750312e-05, - "loss": 2.528, - "step": 160920 - }, - { - "epoch": 0.28, - "learning_rate": 3.596787075757629e-05, - "loss": 2.4297, - "step": 160930 - }, - { - "epoch": 0.28, - "learning_rate": 3.596699881764946e-05, - "loss": 2.5184, - "step": 160940 - }, - { - "epoch": 0.28, - "learning_rate": 3.596612687772263e-05, - "loss": 2.5246, - "step": 160950 - }, - { - "epoch": 0.28, - "learning_rate": 3.596525493779581e-05, - "loss": 2.3287, - "step": 160960 - }, - { - "epoch": 0.28, - "learning_rate": 3.596438299786898e-05, - "loss": 2.5457, - "step": 160970 - }, - { - "epoch": 0.28, - "learning_rate": 3.5963511057942155e-05, - "loss": 2.4036, - "step": 160980 - }, - { - "epoch": 0.28, - "learning_rate": 3.596263911801533e-05, - "loss": 2.5145, - "step": 160990 - }, - { - "epoch": 0.28, - "learning_rate": 3.59617671780885e-05, - "loss": 2.4885, - "step": 161000 - }, - { - "epoch": 0.28, - "learning_rate": 3.596089523816167e-05, - "loss": 2.6295, - "step": 161010 - }, - { - "epoch": 0.28, - "learning_rate": 3.596002329823484e-05, - "loss": 2.4541, - "step": 161020 - }, - { - "epoch": 0.28, - "learning_rate": 3.595915135830802e-05, - "loss": 2.4291, - "step": 161030 - }, - { - "epoch": 0.28, - "learning_rate": 3.595827941838119e-05, - "loss": 2.5297, - "step": 161040 - }, - { - "epoch": 0.28, - "learning_rate": 3.595740747845436e-05, - "loss": 2.3596, - "step": 161050 - }, - { - "epoch": 0.28, - "learning_rate": 3.595653553852754e-05, - "loss": 2.535, - "step": 161060 - }, - { - "epoch": 0.28, - "learning_rate": 3.5955663598600716e-05, - "loss": 2.4637, - "step": 161070 - }, - { - "epoch": 0.28, - "learning_rate": 3.5954791658673886e-05, - "loss": 2.4817, - "step": 161080 - }, - { - "epoch": 0.28, - "learning_rate": 3.5953919718747056e-05, - "loss": 2.3421, - "step": 161090 - }, - { - "epoch": 0.28, - "learning_rate": 3.5953047778820233e-05, - "loss": 2.4885, - "step": 161100 - }, - { - "epoch": 0.28, - "learning_rate": 3.5952175838893404e-05, - "loss": 2.4621, - "step": 161110 - }, - { - "epoch": 0.28, - "learning_rate": 3.5951303898966574e-05, - "loss": 2.5066, - "step": 161120 - }, - { - "epoch": 0.28, - "learning_rate": 3.595043195903975e-05, - "loss": 2.4639, - "step": 161130 - }, - { - "epoch": 0.28, - "learning_rate": 3.594956001911293e-05, - "loss": 2.3893, - "step": 161140 - }, - { - "epoch": 0.28, - "learning_rate": 3.59486880791861e-05, - "loss": 2.552, - "step": 161150 - }, - { - "epoch": 0.28, - "learning_rate": 3.594781613925927e-05, - "loss": 2.4569, - "step": 161160 - }, - { - "epoch": 0.28, - "learning_rate": 3.5946944199332446e-05, - "loss": 2.5544, - "step": 161170 - }, - { - "epoch": 0.28, - "learning_rate": 3.594607225940562e-05, - "loss": 2.4857, - "step": 161180 - }, - { - "epoch": 0.28, - "learning_rate": 3.594520031947879e-05, - "loss": 2.518, - "step": 161190 - }, - { - "epoch": 0.28, - "learning_rate": 3.5944328379551964e-05, - "loss": 2.5083, - "step": 161200 - }, - { - "epoch": 0.28, - "learning_rate": 3.594345643962514e-05, - "loss": 2.4356, - "step": 161210 - }, - { - "epoch": 0.28, - "learning_rate": 3.594258449969831e-05, - "loss": 2.4845, - "step": 161220 - }, - { - "epoch": 0.28, - "learning_rate": 3.594171255977148e-05, - "loss": 2.4358, - "step": 161230 - }, - { - "epoch": 0.28, - "learning_rate": 3.594084061984466e-05, - "loss": 2.4577, - "step": 161240 - }, - { - "epoch": 0.28, - "learning_rate": 3.593996867991783e-05, - "loss": 2.4873, - "step": 161250 - }, - { - "epoch": 0.28, - "learning_rate": 3.5939096739991e-05, - "loss": 2.5052, - "step": 161260 - }, - { - "epoch": 0.28, - "learning_rate": 3.593822480006418e-05, - "loss": 2.4967, - "step": 161270 - }, - { - "epoch": 0.28, - "learning_rate": 3.5937352860137355e-05, - "loss": 2.4035, - "step": 161280 - }, - { - "epoch": 0.28, - "learning_rate": 3.5936480920210525e-05, - "loss": 2.4148, - "step": 161290 - }, - { - "epoch": 0.28, - "learning_rate": 3.5935608980283695e-05, - "loss": 2.535, - "step": 161300 - }, - { - "epoch": 0.28, - "learning_rate": 3.593473704035687e-05, - "loss": 2.4256, - "step": 161310 - }, - { - "epoch": 0.28, - "learning_rate": 3.593386510043004e-05, - "loss": 2.4302, - "step": 161320 - }, - { - "epoch": 0.28, - "learning_rate": 3.593299316050321e-05, - "loss": 2.5056, - "step": 161330 - }, - { - "epoch": 0.28, - "learning_rate": 3.5932121220576384e-05, - "loss": 2.4575, - "step": 161340 - }, - { - "epoch": 0.28, - "learning_rate": 3.593124928064957e-05, - "loss": 2.3701, - "step": 161350 - }, - { - "epoch": 0.28, - "learning_rate": 3.593037734072274e-05, - "loss": 2.5588, - "step": 161360 - }, - { - "epoch": 0.28, - "learning_rate": 3.592950540079591e-05, - "loss": 2.3768, - "step": 161370 - }, - { - "epoch": 0.28, - "learning_rate": 3.5928633460869085e-05, - "loss": 2.516, - "step": 161380 - }, - { - "epoch": 0.28, - "learning_rate": 3.5927761520942256e-05, - "loss": 2.264, - "step": 161390 - }, - { - "epoch": 0.28, - "learning_rate": 3.5926889581015426e-05, - "loss": 2.5461, - "step": 161400 - }, - { - "epoch": 0.28, - "learning_rate": 3.59260176410886e-05, - "loss": 2.4103, - "step": 161410 - }, - { - "epoch": 0.28, - "learning_rate": 3.5925145701161774e-05, - "loss": 2.525, - "step": 161420 - }, - { - "epoch": 0.28, - "learning_rate": 3.592427376123495e-05, - "loss": 2.4775, - "step": 161430 - }, - { - "epoch": 0.28, - "learning_rate": 3.592340182130812e-05, - "loss": 2.4087, - "step": 161440 - }, - { - "epoch": 0.28, - "learning_rate": 3.592252988138129e-05, - "loss": 2.4634, - "step": 161450 - }, - { - "epoch": 0.28, - "learning_rate": 3.592165794145447e-05, - "loss": 2.5198, - "step": 161460 - }, - { - "epoch": 0.28, - "learning_rate": 3.592078600152764e-05, - "loss": 2.4963, - "step": 161470 - }, - { - "epoch": 0.28, - "learning_rate": 3.591991406160081e-05, - "loss": 2.4908, - "step": 161480 - }, - { - "epoch": 0.28, - "learning_rate": 3.591904212167399e-05, - "loss": 2.4373, - "step": 161490 - }, - { - "epoch": 0.28, - "learning_rate": 3.5918170181747164e-05, - "loss": 2.4841, - "step": 161500 - }, - { - "epoch": 0.28, - "learning_rate": 3.5917298241820334e-05, - "loss": 2.5065, - "step": 161510 - }, - { - "epoch": 0.28, - "learning_rate": 3.5916426301893505e-05, - "loss": 2.4846, - "step": 161520 - }, - { - "epoch": 0.28, - "learning_rate": 3.591555436196668e-05, - "loss": 2.4356, - "step": 161530 - }, - { - "epoch": 0.28, - "learning_rate": 3.591468242203985e-05, - "loss": 2.3448, - "step": 161540 - }, - { - "epoch": 0.28, - "learning_rate": 3.591381048211302e-05, - "loss": 2.4578, - "step": 161550 - }, - { - "epoch": 0.28, - "learning_rate": 3.59129385421862e-05, - "loss": 2.4142, - "step": 161560 - }, - { - "epoch": 0.28, - "learning_rate": 3.591206660225937e-05, - "loss": 2.4362, - "step": 161570 - }, - { - "epoch": 0.28, - "learning_rate": 3.591119466233255e-05, - "loss": 2.4127, - "step": 161580 - }, - { - "epoch": 0.28, - "learning_rate": 3.591032272240572e-05, - "loss": 2.4763, - "step": 161590 - }, - { - "epoch": 0.28, - "learning_rate": 3.5909450782478895e-05, - "loss": 2.4136, - "step": 161600 - }, - { - "epoch": 0.28, - "learning_rate": 3.5908578842552065e-05, - "loss": 2.4938, - "step": 161610 - }, - { - "epoch": 0.28, - "learning_rate": 3.5907706902625236e-05, - "loss": 2.4925, - "step": 161620 - }, - { - "epoch": 0.28, - "learning_rate": 3.590683496269841e-05, - "loss": 2.3786, - "step": 161630 - }, - { - "epoch": 0.28, - "learning_rate": 3.590596302277158e-05, - "loss": 2.4216, - "step": 161640 - }, - { - "epoch": 0.28, - "learning_rate": 3.590509108284476e-05, - "loss": 2.5383, - "step": 161650 - }, - { - "epoch": 0.28, - "learning_rate": 3.590421914291793e-05, - "loss": 2.4748, - "step": 161660 - }, - { - "epoch": 0.28, - "learning_rate": 3.590334720299111e-05, - "loss": 2.475, - "step": 161670 - }, - { - "epoch": 0.28, - "learning_rate": 3.590247526306428e-05, - "loss": 2.4389, - "step": 161680 - }, - { - "epoch": 0.28, - "learning_rate": 3.590160332313745e-05, - "loss": 2.3216, - "step": 161690 - }, - { - "epoch": 0.28, - "learning_rate": 3.5900731383210626e-05, - "loss": 2.4488, - "step": 161700 - }, - { - "epoch": 0.28, - "learning_rate": 3.5899859443283796e-05, - "loss": 2.4684, - "step": 161710 - }, - { - "epoch": 0.28, - "learning_rate": 3.5898987503356967e-05, - "loss": 2.3212, - "step": 161720 - }, - { - "epoch": 0.28, - "learning_rate": 3.5898115563430144e-05, - "loss": 2.3901, - "step": 161730 - }, - { - "epoch": 0.28, - "learning_rate": 3.589724362350332e-05, - "loss": 2.5628, - "step": 161740 - }, - { - "epoch": 0.28, - "learning_rate": 3.589637168357649e-05, - "loss": 2.4605, - "step": 161750 - }, - { - "epoch": 0.28, - "learning_rate": 3.589549974364966e-05, - "loss": 2.5451, - "step": 161760 - }, - { - "epoch": 0.28, - "learning_rate": 3.589462780372284e-05, - "loss": 2.3324, - "step": 161770 - }, - { - "epoch": 0.28, - "learning_rate": 3.589375586379601e-05, - "loss": 2.3672, - "step": 161780 - }, - { - "epoch": 0.28, - "learning_rate": 3.589288392386918e-05, - "loss": 2.4037, - "step": 161790 - }, - { - "epoch": 0.28, - "learning_rate": 3.589201198394236e-05, - "loss": 2.539, - "step": 161800 - }, - { - "epoch": 0.28, - "learning_rate": 3.5891140044015534e-05, - "loss": 2.4081, - "step": 161810 - }, - { - "epoch": 0.28, - "learning_rate": 3.5890268104088704e-05, - "loss": 2.5872, - "step": 161820 - }, - { - "epoch": 0.28, - "learning_rate": 3.5889396164161875e-05, - "loss": 2.5146, - "step": 161830 - }, - { - "epoch": 0.28, - "learning_rate": 3.5888524224235045e-05, - "loss": 2.562, - "step": 161840 - }, - { - "epoch": 0.28, - "learning_rate": 3.588765228430822e-05, - "loss": 2.5189, - "step": 161850 - }, - { - "epoch": 0.28, - "learning_rate": 3.588678034438139e-05, - "loss": 2.3453, - "step": 161860 - }, - { - "epoch": 0.28, - "learning_rate": 3.588590840445456e-05, - "loss": 2.4748, - "step": 161870 - }, - { - "epoch": 0.28, - "learning_rate": 3.588503646452775e-05, - "loss": 2.4053, - "step": 161880 - }, - { - "epoch": 0.28, - "learning_rate": 3.588416452460092e-05, - "loss": 2.4021, - "step": 161890 - }, - { - "epoch": 0.28, - "learning_rate": 3.588329258467409e-05, - "loss": 2.4935, - "step": 161900 - }, - { - "epoch": 0.28, - "learning_rate": 3.588242064474726e-05, - "loss": 2.581, - "step": 161910 - }, - { - "epoch": 0.28, - "learning_rate": 3.5881548704820435e-05, - "loss": 2.4478, - "step": 161920 - }, - { - "epoch": 0.28, - "learning_rate": 3.5880676764893606e-05, - "loss": 2.4383, - "step": 161930 - }, - { - "epoch": 0.28, - "learning_rate": 3.5879804824966776e-05, - "loss": 2.4971, - "step": 161940 - }, - { - "epoch": 0.28, - "learning_rate": 3.587893288503995e-05, - "loss": 2.4982, - "step": 161950 - }, - { - "epoch": 0.28, - "learning_rate": 3.587806094511313e-05, - "loss": 2.4975, - "step": 161960 - }, - { - "epoch": 0.28, - "learning_rate": 3.58771890051863e-05, - "loss": 2.4346, - "step": 161970 - }, - { - "epoch": 0.28, - "learning_rate": 3.587631706525947e-05, - "loss": 2.4912, - "step": 161980 - }, - { - "epoch": 0.28, - "learning_rate": 3.587544512533265e-05, - "loss": 2.373, - "step": 161990 - }, - { - "epoch": 0.28, - "learning_rate": 3.587457318540582e-05, - "loss": 2.5432, - "step": 162000 - }, - { - "epoch": 0.28, - "learning_rate": 3.587370124547899e-05, - "loss": 2.5072, - "step": 162010 - }, - { - "epoch": 0.28, - "learning_rate": 3.5872829305552166e-05, - "loss": 2.4547, - "step": 162020 - }, - { - "epoch": 0.28, - "learning_rate": 3.587195736562534e-05, - "loss": 2.5613, - "step": 162030 - }, - { - "epoch": 0.28, - "learning_rate": 3.5871085425698514e-05, - "loss": 2.4657, - "step": 162040 - }, - { - "epoch": 0.28, - "learning_rate": 3.5870213485771684e-05, - "loss": 2.5226, - "step": 162050 - }, - { - "epoch": 0.28, - "learning_rate": 3.586934154584486e-05, - "loss": 2.4084, - "step": 162060 - }, - { - "epoch": 0.28, - "learning_rate": 3.586846960591803e-05, - "loss": 2.3903, - "step": 162070 - }, - { - "epoch": 0.28, - "learning_rate": 3.58675976659912e-05, - "loss": 2.4147, - "step": 162080 - }, - { - "epoch": 0.28, - "learning_rate": 3.586672572606438e-05, - "loss": 2.5282, - "step": 162090 - }, - { - "epoch": 0.28, - "learning_rate": 3.5865853786137556e-05, - "loss": 2.4644, - "step": 162100 - }, - { - "epoch": 0.28, - "learning_rate": 3.586498184621073e-05, - "loss": 2.4641, - "step": 162110 - }, - { - "epoch": 0.28, - "learning_rate": 3.58641099062839e-05, - "loss": 2.4437, - "step": 162120 - }, - { - "epoch": 0.28, - "learning_rate": 3.5863237966357074e-05, - "loss": 2.3976, - "step": 162130 - }, - { - "epoch": 0.28, - "learning_rate": 3.5862366026430245e-05, - "loss": 2.5111, - "step": 162140 - }, - { - "epoch": 0.28, - "learning_rate": 3.5861494086503415e-05, - "loss": 2.4028, - "step": 162150 - }, - { - "epoch": 0.28, - "learning_rate": 3.586062214657659e-05, - "loss": 2.5139, - "step": 162160 - }, - { - "epoch": 0.28, - "learning_rate": 3.585975020664977e-05, - "loss": 2.5538, - "step": 162170 - }, - { - "epoch": 0.28, - "learning_rate": 3.585887826672294e-05, - "loss": 2.4415, - "step": 162180 - }, - { - "epoch": 0.28, - "learning_rate": 3.585800632679611e-05, - "loss": 2.4173, - "step": 162190 - }, - { - "epoch": 0.28, - "learning_rate": 3.585713438686929e-05, - "loss": 2.4297, - "step": 162200 - }, - { - "epoch": 0.28, - "learning_rate": 3.585626244694246e-05, - "loss": 2.3451, - "step": 162210 - }, - { - "epoch": 0.28, - "learning_rate": 3.585539050701563e-05, - "loss": 2.479, - "step": 162220 - }, - { - "epoch": 0.28, - "learning_rate": 3.5854518567088805e-05, - "loss": 2.4393, - "step": 162230 - }, - { - "epoch": 0.28, - "learning_rate": 3.5853646627161975e-05, - "loss": 2.4763, - "step": 162240 - }, - { - "epoch": 0.28, - "learning_rate": 3.585277468723515e-05, - "loss": 2.5125, - "step": 162250 - }, - { - "epoch": 0.28, - "learning_rate": 3.585190274730832e-05, - "loss": 2.595, - "step": 162260 - }, - { - "epoch": 0.28, - "learning_rate": 3.58510308073815e-05, - "loss": 2.4609, - "step": 162270 - }, - { - "epoch": 0.28, - "learning_rate": 3.585015886745467e-05, - "loss": 2.5116, - "step": 162280 - }, - { - "epoch": 0.28, - "learning_rate": 3.584928692752784e-05, - "loss": 2.4604, - "step": 162290 - }, - { - "epoch": 0.28, - "learning_rate": 3.584841498760101e-05, - "loss": 2.3033, - "step": 162300 - }, - { - "epoch": 0.28, - "learning_rate": 3.584754304767419e-05, - "loss": 2.575, - "step": 162310 - }, - { - "epoch": 0.28, - "learning_rate": 3.5846671107747366e-05, - "loss": 2.5025, - "step": 162320 - }, - { - "epoch": 0.28, - "learning_rate": 3.5845799167820536e-05, - "loss": 2.4327, - "step": 162330 - }, - { - "epoch": 0.28, - "learning_rate": 3.584492722789371e-05, - "loss": 2.5581, - "step": 162340 - }, - { - "epoch": 0.28, - "learning_rate": 3.5844055287966884e-05, - "loss": 2.5169, - "step": 162350 - }, - { - "epoch": 0.28, - "learning_rate": 3.5843183348040054e-05, - "loss": 2.485, - "step": 162360 - }, - { - "epoch": 0.28, - "learning_rate": 3.5842311408113224e-05, - "loss": 2.4712, - "step": 162370 - }, - { - "epoch": 0.28, - "learning_rate": 3.58414394681864e-05, - "loss": 2.4284, - "step": 162380 - }, - { - "epoch": 0.28, - "learning_rate": 3.584056752825957e-05, - "loss": 2.3953, - "step": 162390 - }, - { - "epoch": 0.28, - "learning_rate": 3.583969558833275e-05, - "loss": 2.4782, - "step": 162400 - }, - { - "epoch": 0.28, - "learning_rate": 3.583882364840592e-05, - "loss": 2.4561, - "step": 162410 - }, - { - "epoch": 0.28, - "learning_rate": 3.5837951708479097e-05, - "loss": 2.4739, - "step": 162420 - }, - { - "epoch": 0.28, - "learning_rate": 3.583707976855227e-05, - "loss": 2.4242, - "step": 162430 - }, - { - "epoch": 0.28, - "learning_rate": 3.583620782862544e-05, - "loss": 2.5245, - "step": 162440 - }, - { - "epoch": 0.28, - "learning_rate": 3.5835335888698614e-05, - "loss": 2.5443, - "step": 162450 - }, - { - "epoch": 0.28, - "learning_rate": 3.5834463948771785e-05, - "loss": 2.539, - "step": 162460 - }, - { - "epoch": 0.28, - "learning_rate": 3.583359200884496e-05, - "loss": 2.5217, - "step": 162470 - }, - { - "epoch": 0.28, - "learning_rate": 3.583272006891813e-05, - "loss": 2.3403, - "step": 162480 - }, - { - "epoch": 0.28, - "learning_rate": 3.583184812899131e-05, - "loss": 2.397, - "step": 162490 - }, - { - "epoch": 0.28, - "learning_rate": 3.583097618906448e-05, - "loss": 2.4368, - "step": 162500 - }, - { - "epoch": 0.28, - "learning_rate": 3.583010424913765e-05, - "loss": 2.5124, - "step": 162510 - }, - { - "epoch": 0.28, - "learning_rate": 3.582923230921083e-05, - "loss": 2.4834, - "step": 162520 - }, - { - "epoch": 0.28, - "learning_rate": 3.5828360369284e-05, - "loss": 2.3832, - "step": 162530 - }, - { - "epoch": 0.28, - "learning_rate": 3.582748842935717e-05, - "loss": 2.4137, - "step": 162540 - }, - { - "epoch": 0.28, - "learning_rate": 3.5826616489430345e-05, - "loss": 2.3535, - "step": 162550 - }, - { - "epoch": 0.28, - "learning_rate": 3.582574454950352e-05, - "loss": 2.4871, - "step": 162560 - }, - { - "epoch": 0.28, - "learning_rate": 3.582487260957669e-05, - "loss": 2.4627, - "step": 162570 - }, - { - "epoch": 0.28, - "learning_rate": 3.582400066964986e-05, - "loss": 2.3643, - "step": 162580 - }, - { - "epoch": 0.28, - "learning_rate": 3.582312872972304e-05, - "loss": 2.4921, - "step": 162590 - }, - { - "epoch": 0.28, - "learning_rate": 3.582225678979621e-05, - "loss": 2.4221, - "step": 162600 - }, - { - "epoch": 0.28, - "learning_rate": 3.582138484986938e-05, - "loss": 2.2779, - "step": 162610 - }, - { - "epoch": 0.28, - "learning_rate": 3.582051290994256e-05, - "loss": 2.4719, - "step": 162620 - }, - { - "epoch": 0.28, - "learning_rate": 3.5819640970015736e-05, - "loss": 2.4631, - "step": 162630 - }, - { - "epoch": 0.28, - "learning_rate": 3.5818769030088906e-05, - "loss": 2.5035, - "step": 162640 - }, - { - "epoch": 0.28, - "learning_rate": 3.5817897090162076e-05, - "loss": 2.4025, - "step": 162650 - }, - { - "epoch": 0.28, - "learning_rate": 3.5817025150235253e-05, - "loss": 2.3971, - "step": 162660 - }, - { - "epoch": 0.28, - "learning_rate": 3.5816153210308424e-05, - "loss": 2.4036, - "step": 162670 - }, - { - "epoch": 0.28, - "learning_rate": 3.5815281270381594e-05, - "loss": 2.401, - "step": 162680 - }, - { - "epoch": 0.28, - "learning_rate": 3.581440933045477e-05, - "loss": 2.4388, - "step": 162690 - }, - { - "epoch": 0.28, - "learning_rate": 3.581353739052795e-05, - "loss": 2.4638, - "step": 162700 - }, - { - "epoch": 0.28, - "learning_rate": 3.581266545060112e-05, - "loss": 2.527, - "step": 162710 - }, - { - "epoch": 0.28, - "learning_rate": 3.581179351067429e-05, - "loss": 2.5276, - "step": 162720 - }, - { - "epoch": 0.28, - "learning_rate": 3.5810921570747466e-05, - "loss": 2.5474, - "step": 162730 - }, - { - "epoch": 0.28, - "learning_rate": 3.581004963082064e-05, - "loss": 2.4129, - "step": 162740 - }, - { - "epoch": 0.28, - "learning_rate": 3.580917769089381e-05, - "loss": 2.4962, - "step": 162750 - }, - { - "epoch": 0.28, - "learning_rate": 3.580830575096698e-05, - "loss": 2.4513, - "step": 162760 - }, - { - "epoch": 0.28, - "learning_rate": 3.580743381104016e-05, - "loss": 2.5142, - "step": 162770 - }, - { - "epoch": 0.28, - "learning_rate": 3.580656187111333e-05, - "loss": 2.5034, - "step": 162780 - }, - { - "epoch": 0.28, - "learning_rate": 3.58056899311865e-05, - "loss": 2.5083, - "step": 162790 - }, - { - "epoch": 0.28, - "learning_rate": 3.580481799125967e-05, - "loss": 2.412, - "step": 162800 - }, - { - "epoch": 0.28, - "learning_rate": 3.580394605133285e-05, - "loss": 2.4903, - "step": 162810 - }, - { - "epoch": 0.28, - "learning_rate": 3.580307411140602e-05, - "loss": 2.5649, - "step": 162820 - }, - { - "epoch": 0.28, - "learning_rate": 3.580220217147919e-05, - "loss": 2.4464, - "step": 162830 - }, - { - "epoch": 0.28, - "learning_rate": 3.5801330231552375e-05, - "loss": 2.4823, - "step": 162840 - }, - { - "epoch": 0.28, - "learning_rate": 3.5800458291625545e-05, - "loss": 2.4688, - "step": 162850 - }, - { - "epoch": 0.28, - "learning_rate": 3.5799586351698715e-05, - "loss": 2.3645, - "step": 162860 - }, - { - "epoch": 0.28, - "learning_rate": 3.5798714411771886e-05, - "loss": 2.4538, - "step": 162870 - }, - { - "epoch": 0.28, - "learning_rate": 3.579784247184506e-05, - "loss": 2.4637, - "step": 162880 - }, - { - "epoch": 0.28, - "learning_rate": 3.579697053191823e-05, - "loss": 2.519, - "step": 162890 - }, - { - "epoch": 0.28, - "learning_rate": 3.5796098591991404e-05, - "loss": 2.515, - "step": 162900 - }, - { - "epoch": 0.28, - "learning_rate": 3.579522665206458e-05, - "loss": 2.3999, - "step": 162910 - }, - { - "epoch": 0.28, - "learning_rate": 3.579435471213776e-05, - "loss": 2.5164, - "step": 162920 - }, - { - "epoch": 0.28, - "learning_rate": 3.579348277221093e-05, - "loss": 2.3545, - "step": 162930 - }, - { - "epoch": 0.28, - "learning_rate": 3.57926108322841e-05, - "loss": 2.5532, - "step": 162940 - }, - { - "epoch": 0.28, - "learning_rate": 3.5791738892357276e-05, - "loss": 2.4029, - "step": 162950 - }, - { - "epoch": 0.28, - "learning_rate": 3.5790866952430446e-05, - "loss": 2.4644, - "step": 162960 - }, - { - "epoch": 0.28, - "learning_rate": 3.578999501250362e-05, - "loss": 2.4687, - "step": 162970 - }, - { - "epoch": 0.28, - "learning_rate": 3.5789123072576794e-05, - "loss": 2.5753, - "step": 162980 - }, - { - "epoch": 0.28, - "learning_rate": 3.578825113264997e-05, - "loss": 2.5615, - "step": 162990 - }, - { - "epoch": 0.28, - "learning_rate": 3.578737919272314e-05, - "loss": 2.4235, - "step": 163000 - }, - { - "epoch": 0.28, - "learning_rate": 3.578650725279631e-05, - "loss": 2.3957, - "step": 163010 - }, - { - "epoch": 0.28, - "learning_rate": 3.578563531286949e-05, - "loss": 2.6168, - "step": 163020 - }, - { - "epoch": 0.28, - "learning_rate": 3.578476337294266e-05, - "loss": 2.3729, - "step": 163030 - }, - { - "epoch": 0.28, - "learning_rate": 3.578389143301583e-05, - "loss": 2.6107, - "step": 163040 - }, - { - "epoch": 0.28, - "learning_rate": 3.578301949308901e-05, - "loss": 2.5027, - "step": 163050 - }, - { - "epoch": 0.28, - "learning_rate": 3.578214755316218e-05, - "loss": 2.4279, - "step": 163060 - }, - { - "epoch": 0.28, - "learning_rate": 3.5781275613235354e-05, - "loss": 2.5548, - "step": 163070 - }, - { - "epoch": 0.28, - "learning_rate": 3.5780403673308525e-05, - "loss": 2.3662, - "step": 163080 - }, - { - "epoch": 0.28, - "learning_rate": 3.57795317333817e-05, - "loss": 2.4031, - "step": 163090 - }, - { - "epoch": 0.28, - "learning_rate": 3.577865979345487e-05, - "loss": 2.4124, - "step": 163100 - }, - { - "epoch": 0.28, - "learning_rate": 3.577778785352804e-05, - "loss": 2.4811, - "step": 163110 - }, - { - "epoch": 0.28, - "learning_rate": 3.577691591360122e-05, - "loss": 2.4216, - "step": 163120 - }, - { - "epoch": 0.28, - "learning_rate": 3.577604397367439e-05, - "loss": 2.4655, - "step": 163130 - }, - { - "epoch": 0.28, - "learning_rate": 3.577517203374757e-05, - "loss": 2.4212, - "step": 163140 - }, - { - "epoch": 0.28, - "learning_rate": 3.577430009382074e-05, - "loss": 2.4961, - "step": 163150 - }, - { - "epoch": 0.28, - "learning_rate": 3.5773428153893915e-05, - "loss": 2.5018, - "step": 163160 - }, - { - "epoch": 0.28, - "learning_rate": 3.5772556213967085e-05, - "loss": 2.4043, - "step": 163170 - }, - { - "epoch": 0.28, - "learning_rate": 3.5771684274040256e-05, - "loss": 2.3424, - "step": 163180 - }, - { - "epoch": 0.28, - "learning_rate": 3.5770812334113426e-05, - "loss": 2.4613, - "step": 163190 - }, - { - "epoch": 0.28, - "learning_rate": 3.57699403941866e-05, - "loss": 2.5123, - "step": 163200 - }, - { - "epoch": 0.28, - "learning_rate": 3.5769068454259774e-05, - "loss": 2.5497, - "step": 163210 - }, - { - "epoch": 0.28, - "learning_rate": 3.576819651433295e-05, - "loss": 2.5294, - "step": 163220 - }, - { - "epoch": 0.28, - "learning_rate": 3.576732457440613e-05, - "loss": 2.3783, - "step": 163230 - }, - { - "epoch": 0.28, - "learning_rate": 3.57664526344793e-05, - "loss": 2.4957, - "step": 163240 - }, - { - "epoch": 0.28, - "learning_rate": 3.576558069455247e-05, - "loss": 2.4889, - "step": 163250 - }, - { - "epoch": 0.28, - "learning_rate": 3.576470875462564e-05, - "loss": 2.383, - "step": 163260 - }, - { - "epoch": 0.28, - "learning_rate": 3.5763836814698816e-05, - "loss": 2.3913, - "step": 163270 - }, - { - "epoch": 0.28, - "learning_rate": 3.5762964874771987e-05, - "loss": 2.3977, - "step": 163280 - }, - { - "epoch": 0.28, - "learning_rate": 3.5762092934845164e-05, - "loss": 2.4546, - "step": 163290 - }, - { - "epoch": 0.28, - "learning_rate": 3.5761220994918334e-05, - "loss": 2.5295, - "step": 163300 - }, - { - "epoch": 0.28, - "learning_rate": 3.576034905499151e-05, - "loss": 2.5171, - "step": 163310 - }, - { - "epoch": 0.28, - "learning_rate": 3.575947711506468e-05, - "loss": 2.443, - "step": 163320 - }, - { - "epoch": 0.28, - "learning_rate": 3.575860517513785e-05, - "loss": 2.4957, - "step": 163330 - }, - { - "epoch": 0.28, - "learning_rate": 3.575773323521103e-05, - "loss": 2.3504, - "step": 163340 - }, - { - "epoch": 0.28, - "learning_rate": 3.57568612952842e-05, - "loss": 2.49, - "step": 163350 - }, - { - "epoch": 0.28, - "learning_rate": 3.575598935535738e-05, - "loss": 2.4671, - "step": 163360 - }, - { - "epoch": 0.28, - "learning_rate": 3.575511741543055e-05, - "loss": 2.5163, - "step": 163370 - }, - { - "epoch": 0.28, - "learning_rate": 3.5754245475503724e-05, - "loss": 2.511, - "step": 163380 - }, - { - "epoch": 0.28, - "learning_rate": 3.5753373535576895e-05, - "loss": 2.4355, - "step": 163390 - }, - { - "epoch": 0.28, - "learning_rate": 3.5752501595650065e-05, - "loss": 2.3787, - "step": 163400 - }, - { - "epoch": 0.28, - "learning_rate": 3.575162965572324e-05, - "loss": 2.5262, - "step": 163410 - }, - { - "epoch": 0.28, - "learning_rate": 3.575075771579641e-05, - "loss": 2.4935, - "step": 163420 - }, - { - "epoch": 0.29, - "learning_rate": 3.574988577586958e-05, - "loss": 2.4503, - "step": 163430 - }, - { - "epoch": 0.29, - "learning_rate": 3.574901383594276e-05, - "loss": 2.3568, - "step": 163440 - }, - { - "epoch": 0.29, - "learning_rate": 3.574814189601594e-05, - "loss": 2.4373, - "step": 163450 - }, - { - "epoch": 0.29, - "learning_rate": 3.574726995608911e-05, - "loss": 2.4647, - "step": 163460 - }, - { - "epoch": 0.29, - "learning_rate": 3.574639801616228e-05, - "loss": 2.467, - "step": 163470 - }, - { - "epoch": 0.29, - "learning_rate": 3.5745526076235455e-05, - "loss": 2.4688, - "step": 163480 - }, - { - "epoch": 0.29, - "learning_rate": 3.5744654136308626e-05, - "loss": 2.5826, - "step": 163490 - }, - { - "epoch": 0.29, - "learning_rate": 3.5743782196381796e-05, - "loss": 2.4336, - "step": 163500 - }, - { - "epoch": 0.29, - "learning_rate": 3.574291025645497e-05, - "loss": 2.3839, - "step": 163510 - }, - { - "epoch": 0.29, - "learning_rate": 3.574203831652815e-05, - "loss": 2.4228, - "step": 163520 - }, - { - "epoch": 0.29, - "learning_rate": 3.574116637660132e-05, - "loss": 2.6131, - "step": 163530 - }, - { - "epoch": 0.29, - "learning_rate": 3.574029443667449e-05, - "loss": 2.38, - "step": 163540 - }, - { - "epoch": 0.29, - "learning_rate": 3.573942249674767e-05, - "loss": 2.5222, - "step": 163550 - }, - { - "epoch": 0.29, - "learning_rate": 3.573855055682084e-05, - "loss": 2.3964, - "step": 163560 - }, - { - "epoch": 0.29, - "learning_rate": 3.573767861689401e-05, - "loss": 2.5504, - "step": 163570 - }, - { - "epoch": 0.29, - "learning_rate": 3.5736806676967186e-05, - "loss": 2.3896, - "step": 163580 - }, - { - "epoch": 0.29, - "learning_rate": 3.573593473704036e-05, - "loss": 2.4043, - "step": 163590 - }, - { - "epoch": 0.29, - "learning_rate": 3.5735062797113534e-05, - "loss": 2.3889, - "step": 163600 - }, - { - "epoch": 0.29, - "learning_rate": 3.5734190857186704e-05, - "loss": 2.5412, - "step": 163610 - }, - { - "epoch": 0.29, - "learning_rate": 3.573331891725988e-05, - "loss": 2.484, - "step": 163620 - }, - { - "epoch": 0.29, - "learning_rate": 3.573244697733305e-05, - "loss": 2.5485, - "step": 163630 - }, - { - "epoch": 0.29, - "learning_rate": 3.573157503740622e-05, - "loss": 2.4472, - "step": 163640 - }, - { - "epoch": 0.29, - "learning_rate": 3.573070309747939e-05, - "loss": 2.4013, - "step": 163650 - }, - { - "epoch": 0.29, - "learning_rate": 3.5729831157552576e-05, - "loss": 2.5532, - "step": 163660 - }, - { - "epoch": 0.29, - "learning_rate": 3.572895921762575e-05, - "loss": 2.4734, - "step": 163670 - }, - { - "epoch": 0.29, - "learning_rate": 3.572808727769892e-05, - "loss": 2.381, - "step": 163680 - }, - { - "epoch": 0.29, - "learning_rate": 3.5727215337772094e-05, - "loss": 2.4884, - "step": 163690 - }, - { - "epoch": 0.29, - "learning_rate": 3.5726343397845265e-05, - "loss": 2.4463, - "step": 163700 - }, - { - "epoch": 0.29, - "learning_rate": 3.5725471457918435e-05, - "loss": 2.426, - "step": 163710 - }, - { - "epoch": 0.29, - "learning_rate": 3.5724599517991605e-05, - "loss": 2.4908, - "step": 163720 - }, - { - "epoch": 0.29, - "learning_rate": 3.572372757806478e-05, - "loss": 2.478, - "step": 163730 - }, - { - "epoch": 0.29, - "learning_rate": 3.572285563813796e-05, - "loss": 2.4896, - "step": 163740 - }, - { - "epoch": 0.29, - "learning_rate": 3.572198369821113e-05, - "loss": 2.3766, - "step": 163750 - }, - { - "epoch": 0.29, - "learning_rate": 3.57211117582843e-05, - "loss": 2.487, - "step": 163760 - }, - { - "epoch": 0.29, - "learning_rate": 3.572023981835748e-05, - "loss": 2.4702, - "step": 163770 - }, - { - "epoch": 0.29, - "learning_rate": 3.571936787843065e-05, - "loss": 2.4704, - "step": 163780 - }, - { - "epoch": 0.29, - "learning_rate": 3.571849593850382e-05, - "loss": 2.2693, - "step": 163790 - }, - { - "epoch": 0.29, - "learning_rate": 3.5717623998576995e-05, - "loss": 2.4605, - "step": 163800 - }, - { - "epoch": 0.29, - "learning_rate": 3.571675205865017e-05, - "loss": 2.5936, - "step": 163810 - }, - { - "epoch": 0.29, - "learning_rate": 3.571588011872334e-05, - "loss": 2.3992, - "step": 163820 - }, - { - "epoch": 0.29, - "learning_rate": 3.5715008178796513e-05, - "loss": 2.5256, - "step": 163830 - }, - { - "epoch": 0.29, - "learning_rate": 3.571413623886969e-05, - "loss": 2.4283, - "step": 163840 - }, - { - "epoch": 0.29, - "learning_rate": 3.571326429894286e-05, - "loss": 2.3965, - "step": 163850 - }, - { - "epoch": 0.29, - "learning_rate": 3.571239235901603e-05, - "loss": 2.3946, - "step": 163860 - }, - { - "epoch": 0.29, - "learning_rate": 3.571152041908921e-05, - "loss": 2.4976, - "step": 163870 - }, - { - "epoch": 0.29, - "learning_rate": 3.5710648479162386e-05, - "loss": 2.4436, - "step": 163880 - }, - { - "epoch": 0.29, - "learning_rate": 3.5709776539235556e-05, - "loss": 2.3958, - "step": 163890 - }, - { - "epoch": 0.29, - "learning_rate": 3.5708904599308726e-05, - "loss": 2.3972, - "step": 163900 - }, - { - "epoch": 0.29, - "learning_rate": 3.5708032659381904e-05, - "loss": 2.4612, - "step": 163910 - }, - { - "epoch": 0.29, - "learning_rate": 3.5707160719455074e-05, - "loss": 2.3444, - "step": 163920 - }, - { - "epoch": 0.29, - "learning_rate": 3.5706288779528244e-05, - "loss": 2.4478, - "step": 163930 - }, - { - "epoch": 0.29, - "learning_rate": 3.570541683960142e-05, - "loss": 2.4753, - "step": 163940 - }, - { - "epoch": 0.29, - "learning_rate": 3.570454489967459e-05, - "loss": 2.4726, - "step": 163950 - }, - { - "epoch": 0.29, - "learning_rate": 3.570367295974777e-05, - "loss": 2.3975, - "step": 163960 - }, - { - "epoch": 0.29, - "learning_rate": 3.570280101982094e-05, - "loss": 2.4568, - "step": 163970 - }, - { - "epoch": 0.29, - "learning_rate": 3.5701929079894117e-05, - "loss": 2.4907, - "step": 163980 - }, - { - "epoch": 0.29, - "learning_rate": 3.570105713996729e-05, - "loss": 2.4617, - "step": 163990 - }, - { - "epoch": 0.29, - "learning_rate": 3.570018520004046e-05, - "loss": 2.3885, - "step": 164000 - }, - { - "epoch": 0.29, - "learning_rate": 3.5699313260113635e-05, - "loss": 2.3687, - "step": 164010 - }, - { - "epoch": 0.29, - "learning_rate": 3.5698441320186805e-05, - "loss": 2.3566, - "step": 164020 - }, - { - "epoch": 0.29, - "learning_rate": 3.569756938025998e-05, - "loss": 2.4889, - "step": 164030 - }, - { - "epoch": 0.29, - "learning_rate": 3.569669744033315e-05, - "loss": 2.5355, - "step": 164040 - }, - { - "epoch": 0.29, - "learning_rate": 3.569582550040633e-05, - "loss": 2.4097, - "step": 164050 - }, - { - "epoch": 0.29, - "learning_rate": 3.56949535604795e-05, - "loss": 2.4413, - "step": 164060 - }, - { - "epoch": 0.29, - "learning_rate": 3.569408162055267e-05, - "loss": 2.5077, - "step": 164070 - }, - { - "epoch": 0.29, - "learning_rate": 3.569320968062585e-05, - "loss": 2.5464, - "step": 164080 - }, - { - "epoch": 0.29, - "learning_rate": 3.569233774069902e-05, - "loss": 2.5293, - "step": 164090 - }, - { - "epoch": 0.29, - "learning_rate": 3.569146580077219e-05, - "loss": 2.4624, - "step": 164100 - }, - { - "epoch": 0.29, - "learning_rate": 3.5690593860845365e-05, - "loss": 2.3749, - "step": 164110 - }, - { - "epoch": 0.29, - "learning_rate": 3.568972192091854e-05, - "loss": 2.4282, - "step": 164120 - }, - { - "epoch": 0.29, - "learning_rate": 3.568884998099171e-05, - "loss": 2.4281, - "step": 164130 - }, - { - "epoch": 0.29, - "learning_rate": 3.568797804106488e-05, - "loss": 2.394, - "step": 164140 - }, - { - "epoch": 0.29, - "learning_rate": 3.5687106101138054e-05, - "loss": 2.5526, - "step": 164150 - }, - { - "epoch": 0.29, - "learning_rate": 3.568623416121123e-05, - "loss": 2.4958, - "step": 164160 - }, - { - "epoch": 0.29, - "learning_rate": 3.56853622212844e-05, - "loss": 2.4447, - "step": 164170 - }, - { - "epoch": 0.29, - "learning_rate": 3.568449028135758e-05, - "loss": 2.3417, - "step": 164180 - }, - { - "epoch": 0.29, - "learning_rate": 3.5683618341430756e-05, - "loss": 2.4386, - "step": 164190 - }, - { - "epoch": 0.29, - "learning_rate": 3.5682746401503926e-05, - "loss": 2.5449, - "step": 164200 - }, - { - "epoch": 0.29, - "learning_rate": 3.5681874461577096e-05, - "loss": 2.4397, - "step": 164210 - }, - { - "epoch": 0.29, - "learning_rate": 3.568100252165027e-05, - "loss": 2.4285, - "step": 164220 - }, - { - "epoch": 0.29, - "learning_rate": 3.5680130581723444e-05, - "loss": 2.495, - "step": 164230 - }, - { - "epoch": 0.29, - "learning_rate": 3.5679258641796614e-05, - "loss": 2.424, - "step": 164240 - }, - { - "epoch": 0.29, - "learning_rate": 3.5678386701869785e-05, - "loss": 2.4263, - "step": 164250 - }, - { - "epoch": 0.29, - "learning_rate": 3.567751476194296e-05, - "loss": 2.4559, - "step": 164260 - }, - { - "epoch": 0.29, - "learning_rate": 3.567664282201614e-05, - "loss": 2.4739, - "step": 164270 - }, - { - "epoch": 0.29, - "learning_rate": 3.567577088208931e-05, - "loss": 2.2774, - "step": 164280 - }, - { - "epoch": 0.29, - "learning_rate": 3.567489894216248e-05, - "loss": 2.494, - "step": 164290 - }, - { - "epoch": 0.29, - "learning_rate": 3.567402700223566e-05, - "loss": 2.4299, - "step": 164300 - }, - { - "epoch": 0.29, - "learning_rate": 3.567315506230883e-05, - "loss": 2.3825, - "step": 164310 - }, - { - "epoch": 0.29, - "learning_rate": 3.5672283122382e-05, - "loss": 2.4311, - "step": 164320 - }, - { - "epoch": 0.29, - "learning_rate": 3.5671411182455175e-05, - "loss": 2.4683, - "step": 164330 - }, - { - "epoch": 0.29, - "learning_rate": 3.567053924252835e-05, - "loss": 2.4806, - "step": 164340 - }, - { - "epoch": 0.29, - "learning_rate": 3.566966730260152e-05, - "loss": 2.4548, - "step": 164350 - }, - { - "epoch": 0.29, - "learning_rate": 3.566879536267469e-05, - "loss": 2.544, - "step": 164360 - }, - { - "epoch": 0.29, - "learning_rate": 3.566792342274787e-05, - "loss": 2.3951, - "step": 164370 - }, - { - "epoch": 0.29, - "learning_rate": 3.566705148282104e-05, - "loss": 2.4092, - "step": 164380 - }, - { - "epoch": 0.29, - "learning_rate": 3.566617954289421e-05, - "loss": 2.4913, - "step": 164390 - }, - { - "epoch": 0.29, - "learning_rate": 3.566530760296739e-05, - "loss": 2.2802, - "step": 164400 - }, - { - "epoch": 0.29, - "learning_rate": 3.5664435663040565e-05, - "loss": 2.4012, - "step": 164410 - }, - { - "epoch": 0.29, - "learning_rate": 3.5663563723113735e-05, - "loss": 2.4172, - "step": 164420 - }, - { - "epoch": 0.29, - "learning_rate": 3.5662691783186906e-05, - "loss": 2.4683, - "step": 164430 - }, - { - "epoch": 0.29, - "learning_rate": 3.566181984326008e-05, - "loss": 2.4777, - "step": 164440 - }, - { - "epoch": 0.29, - "learning_rate": 3.566094790333325e-05, - "loss": 2.5168, - "step": 164450 - }, - { - "epoch": 0.29, - "learning_rate": 3.5660075963406424e-05, - "loss": 2.4752, - "step": 164460 - }, - { - "epoch": 0.29, - "learning_rate": 3.56592040234796e-05, - "loss": 2.4125, - "step": 164470 - }, - { - "epoch": 0.29, - "learning_rate": 3.565833208355278e-05, - "loss": 2.4447, - "step": 164480 - }, - { - "epoch": 0.29, - "learning_rate": 3.565746014362595e-05, - "loss": 2.3651, - "step": 164490 - }, - { - "epoch": 0.29, - "learning_rate": 3.565658820369912e-05, - "loss": 2.5025, - "step": 164500 - }, - { - "epoch": 0.29, - "learning_rate": 3.5655716263772296e-05, - "loss": 2.3765, - "step": 164510 - }, - { - "epoch": 0.29, - "learning_rate": 3.5654844323845466e-05, - "loss": 2.3971, - "step": 164520 - }, - { - "epoch": 0.29, - "learning_rate": 3.565397238391864e-05, - "loss": 2.4514, - "step": 164530 - }, - { - "epoch": 0.29, - "learning_rate": 3.565310044399181e-05, - "loss": 2.5132, - "step": 164540 - }, - { - "epoch": 0.29, - "learning_rate": 3.565222850406499e-05, - "loss": 2.4848, - "step": 164550 - }, - { - "epoch": 0.29, - "learning_rate": 3.565135656413816e-05, - "loss": 2.4414, - "step": 164560 - }, - { - "epoch": 0.29, - "learning_rate": 3.565048462421133e-05, - "loss": 2.4461, - "step": 164570 - }, - { - "epoch": 0.29, - "learning_rate": 3.564961268428451e-05, - "loss": 2.4283, - "step": 164580 - }, - { - "epoch": 0.29, - "learning_rate": 3.564874074435768e-05, - "loss": 2.4562, - "step": 164590 - }, - { - "epoch": 0.29, - "learning_rate": 3.564786880443085e-05, - "loss": 2.4519, - "step": 164600 - }, - { - "epoch": 0.29, - "learning_rate": 3.564699686450402e-05, - "loss": 2.393, - "step": 164610 - }, - { - "epoch": 0.29, - "learning_rate": 3.56461249245772e-05, - "loss": 2.4844, - "step": 164620 - }, - { - "epoch": 0.29, - "learning_rate": 3.5645252984650374e-05, - "loss": 2.3434, - "step": 164630 - }, - { - "epoch": 0.29, - "learning_rate": 3.5644381044723545e-05, - "loss": 2.5201, - "step": 164640 - }, - { - "epoch": 0.29, - "learning_rate": 3.5643509104796715e-05, - "loss": 2.4117, - "step": 164650 - }, - { - "epoch": 0.29, - "learning_rate": 3.564263716486989e-05, - "loss": 2.381, - "step": 164660 - }, - { - "epoch": 0.29, - "learning_rate": 3.564176522494306e-05, - "loss": 2.5044, - "step": 164670 - }, - { - "epoch": 0.29, - "learning_rate": 3.564089328501623e-05, - "loss": 2.5189, - "step": 164680 - }, - { - "epoch": 0.29, - "learning_rate": 3.564002134508941e-05, - "loss": 2.3945, - "step": 164690 - }, - { - "epoch": 0.29, - "learning_rate": 3.563914940516259e-05, - "loss": 2.4969, - "step": 164700 - }, - { - "epoch": 0.29, - "learning_rate": 3.563827746523576e-05, - "loss": 2.3678, - "step": 164710 - }, - { - "epoch": 0.29, - "learning_rate": 3.563740552530893e-05, - "loss": 2.4734, - "step": 164720 - }, - { - "epoch": 0.29, - "learning_rate": 3.5636533585382105e-05, - "loss": 2.4138, - "step": 164730 - }, - { - "epoch": 0.29, - "learning_rate": 3.5635661645455276e-05, - "loss": 2.5524, - "step": 164740 - }, - { - "epoch": 0.29, - "learning_rate": 3.5634789705528446e-05, - "loss": 2.4349, - "step": 164750 - }, - { - "epoch": 0.29, - "learning_rate": 3.563391776560162e-05, - "loss": 2.5142, - "step": 164760 - }, - { - "epoch": 0.29, - "learning_rate": 3.5633045825674794e-05, - "loss": 2.5149, - "step": 164770 - }, - { - "epoch": 0.29, - "learning_rate": 3.563217388574797e-05, - "loss": 2.3948, - "step": 164780 - }, - { - "epoch": 0.29, - "learning_rate": 3.563130194582114e-05, - "loss": 2.4952, - "step": 164790 - }, - { - "epoch": 0.29, - "learning_rate": 3.563043000589432e-05, - "loss": 2.3797, - "step": 164800 - }, - { - "epoch": 0.29, - "learning_rate": 3.562955806596749e-05, - "loss": 2.4534, - "step": 164810 - }, - { - "epoch": 0.29, - "learning_rate": 3.562868612604066e-05, - "loss": 2.5144, - "step": 164820 - }, - { - "epoch": 0.29, - "learning_rate": 3.5627814186113836e-05, - "loss": 2.4112, - "step": 164830 - }, - { - "epoch": 0.29, - "learning_rate": 3.5626942246187007e-05, - "loss": 2.4588, - "step": 164840 - }, - { - "epoch": 0.29, - "learning_rate": 3.5626070306260184e-05, - "loss": 2.4273, - "step": 164850 - }, - { - "epoch": 0.29, - "learning_rate": 3.5625198366333354e-05, - "loss": 2.4635, - "step": 164860 - }, - { - "epoch": 0.29, - "learning_rate": 3.562432642640653e-05, - "loss": 2.5639, - "step": 164870 - }, - { - "epoch": 0.29, - "learning_rate": 3.56234544864797e-05, - "loss": 2.4065, - "step": 164880 - }, - { - "epoch": 0.29, - "learning_rate": 3.562258254655287e-05, - "loss": 2.4314, - "step": 164890 - }, - { - "epoch": 0.29, - "learning_rate": 3.562171060662605e-05, - "loss": 2.4086, - "step": 164900 - }, - { - "epoch": 0.29, - "learning_rate": 3.562083866669922e-05, - "loss": 2.4424, - "step": 164910 - }, - { - "epoch": 0.29, - "learning_rate": 3.561996672677239e-05, - "loss": 2.4522, - "step": 164920 - }, - { - "epoch": 0.29, - "learning_rate": 3.561909478684557e-05, - "loss": 2.4733, - "step": 164930 - }, - { - "epoch": 0.29, - "learning_rate": 3.5618222846918744e-05, - "loss": 2.4848, - "step": 164940 - }, - { - "epoch": 0.29, - "learning_rate": 3.5617350906991915e-05, - "loss": 2.5818, - "step": 164950 - }, - { - "epoch": 0.29, - "learning_rate": 3.5616478967065085e-05, - "loss": 2.5364, - "step": 164960 - }, - { - "epoch": 0.29, - "learning_rate": 3.561560702713826e-05, - "loss": 2.4628, - "step": 164970 - }, - { - "epoch": 0.29, - "learning_rate": 3.561473508721143e-05, - "loss": 2.44, - "step": 164980 - }, - { - "epoch": 0.29, - "learning_rate": 3.56138631472846e-05, - "loss": 2.5132, - "step": 164990 - }, - { - "epoch": 0.29, - "learning_rate": 3.561299120735778e-05, - "loss": 2.4146, - "step": 165000 - }, - { - "epoch": 0.29, - "learning_rate": 3.561211926743096e-05, - "loss": 2.5654, - "step": 165010 - }, - { - "epoch": 0.29, - "learning_rate": 3.561124732750413e-05, - "loss": 2.4368, - "step": 165020 - }, - { - "epoch": 0.29, - "learning_rate": 3.56103753875773e-05, - "loss": 2.4794, - "step": 165030 - }, - { - "epoch": 0.29, - "learning_rate": 3.5609503447650475e-05, - "loss": 2.4145, - "step": 165040 - }, - { - "epoch": 0.29, - "learning_rate": 3.5608631507723646e-05, - "loss": 2.4795, - "step": 165050 - }, - { - "epoch": 0.29, - "learning_rate": 3.5607759567796816e-05, - "loss": 2.5096, - "step": 165060 - }, - { - "epoch": 0.29, - "learning_rate": 3.5606887627869986e-05, - "loss": 2.3871, - "step": 165070 - }, - { - "epoch": 0.29, - "learning_rate": 3.560601568794317e-05, - "loss": 2.4988, - "step": 165080 - }, - { - "epoch": 0.29, - "learning_rate": 3.560514374801634e-05, - "loss": 2.4883, - "step": 165090 - }, - { - "epoch": 0.29, - "learning_rate": 3.560427180808951e-05, - "loss": 2.5418, - "step": 165100 - }, - { - "epoch": 0.29, - "learning_rate": 3.560339986816268e-05, - "loss": 2.5093, - "step": 165110 - }, - { - "epoch": 0.29, - "learning_rate": 3.560252792823586e-05, - "loss": 2.5039, - "step": 165120 - }, - { - "epoch": 0.29, - "learning_rate": 3.560165598830903e-05, - "loss": 2.4575, - "step": 165130 - }, - { - "epoch": 0.29, - "learning_rate": 3.56007840483822e-05, - "loss": 2.3921, - "step": 165140 - }, - { - "epoch": 0.29, - "learning_rate": 3.559991210845538e-05, - "loss": 2.5532, - "step": 165150 - }, - { - "epoch": 0.29, - "learning_rate": 3.5599040168528554e-05, - "loss": 2.4609, - "step": 165160 - }, - { - "epoch": 0.29, - "learning_rate": 3.5598168228601724e-05, - "loss": 2.4985, - "step": 165170 - }, - { - "epoch": 0.29, - "learning_rate": 3.5597296288674894e-05, - "loss": 2.4029, - "step": 165180 - }, - { - "epoch": 0.29, - "learning_rate": 3.559642434874807e-05, - "loss": 2.451, - "step": 165190 - }, - { - "epoch": 0.29, - "learning_rate": 3.559555240882124e-05, - "loss": 2.4447, - "step": 165200 - }, - { - "epoch": 0.29, - "learning_rate": 3.559468046889441e-05, - "loss": 2.5557, - "step": 165210 - }, - { - "epoch": 0.29, - "learning_rate": 3.559380852896759e-05, - "loss": 2.4692, - "step": 165220 - }, - { - "epoch": 0.29, - "learning_rate": 3.559293658904077e-05, - "loss": 2.4048, - "step": 165230 - }, - { - "epoch": 0.29, - "learning_rate": 3.559206464911394e-05, - "loss": 2.5142, - "step": 165240 - }, - { - "epoch": 0.29, - "learning_rate": 3.559119270918711e-05, - "loss": 2.4792, - "step": 165250 - }, - { - "epoch": 0.29, - "learning_rate": 3.5590320769260285e-05, - "loss": 2.5196, - "step": 165260 - }, - { - "epoch": 0.29, - "learning_rate": 3.5589448829333455e-05, - "loss": 2.3687, - "step": 165270 - }, - { - "epoch": 0.29, - "learning_rate": 3.5588576889406625e-05, - "loss": 2.4878, - "step": 165280 - }, - { - "epoch": 0.29, - "learning_rate": 3.55877049494798e-05, - "loss": 2.5611, - "step": 165290 - }, - { - "epoch": 0.29, - "learning_rate": 3.558683300955298e-05, - "loss": 2.3713, - "step": 165300 - }, - { - "epoch": 0.29, - "learning_rate": 3.558596106962615e-05, - "loss": 2.4958, - "step": 165310 - }, - { - "epoch": 0.29, - "learning_rate": 3.558508912969932e-05, - "loss": 2.4929, - "step": 165320 - }, - { - "epoch": 0.29, - "learning_rate": 3.55842171897725e-05, - "loss": 2.5568, - "step": 165330 - }, - { - "epoch": 0.29, - "learning_rate": 3.558334524984567e-05, - "loss": 2.5188, - "step": 165340 - }, - { - "epoch": 0.29, - "learning_rate": 3.558247330991884e-05, - "loss": 2.489, - "step": 165350 - }, - { - "epoch": 0.29, - "learning_rate": 3.5581601369992016e-05, - "loss": 2.4606, - "step": 165360 - }, - { - "epoch": 0.29, - "learning_rate": 3.558072943006519e-05, - "loss": 2.5154, - "step": 165370 - }, - { - "epoch": 0.29, - "learning_rate": 3.557985749013836e-05, - "loss": 2.529, - "step": 165380 - }, - { - "epoch": 0.29, - "learning_rate": 3.5578985550211533e-05, - "loss": 2.4099, - "step": 165390 - }, - { - "epoch": 0.29, - "learning_rate": 3.557811361028471e-05, - "loss": 2.3799, - "step": 165400 - }, - { - "epoch": 0.29, - "learning_rate": 3.557724167035788e-05, - "loss": 2.4736, - "step": 165410 - }, - { - "epoch": 0.29, - "learning_rate": 3.557636973043105e-05, - "loss": 2.4705, - "step": 165420 - }, - { - "epoch": 0.29, - "learning_rate": 3.557549779050423e-05, - "loss": 2.4442, - "step": 165430 - }, - { - "epoch": 0.29, - "learning_rate": 3.55746258505774e-05, - "loss": 2.4921, - "step": 165440 - }, - { - "epoch": 0.29, - "learning_rate": 3.5573753910650576e-05, - "loss": 2.4556, - "step": 165450 - }, - { - "epoch": 0.29, - "learning_rate": 3.5572881970723746e-05, - "loss": 2.3888, - "step": 165460 - }, - { - "epoch": 0.29, - "learning_rate": 3.5572010030796924e-05, - "loss": 2.3655, - "step": 165470 - }, - { - "epoch": 0.29, - "learning_rate": 3.5571138090870094e-05, - "loss": 2.5085, - "step": 165480 - }, - { - "epoch": 0.29, - "learning_rate": 3.5570266150943264e-05, - "loss": 2.3582, - "step": 165490 - }, - { - "epoch": 0.29, - "learning_rate": 3.5569394211016435e-05, - "loss": 2.4073, - "step": 165500 - }, - { - "epoch": 0.29, - "learning_rate": 3.556852227108961e-05, - "loss": 2.5286, - "step": 165510 - }, - { - "epoch": 0.29, - "learning_rate": 3.556765033116279e-05, - "loss": 2.464, - "step": 165520 - }, - { - "epoch": 0.29, - "learning_rate": 3.556677839123596e-05, - "loss": 2.4177, - "step": 165530 - }, - { - "epoch": 0.29, - "learning_rate": 3.5565906451309137e-05, - "loss": 2.4397, - "step": 165540 - }, - { - "epoch": 0.29, - "learning_rate": 3.556503451138231e-05, - "loss": 2.4099, - "step": 165550 - }, - { - "epoch": 0.29, - "learning_rate": 3.556416257145548e-05, - "loss": 2.4783, - "step": 165560 - }, - { - "epoch": 0.29, - "learning_rate": 3.556329063152865e-05, - "loss": 2.5651, - "step": 165570 - }, - { - "epoch": 0.29, - "learning_rate": 3.5562418691601825e-05, - "loss": 2.5295, - "step": 165580 - }, - { - "epoch": 0.29, - "learning_rate": 3.5561546751674995e-05, - "loss": 2.474, - "step": 165590 - }, - { - "epoch": 0.29, - "learning_rate": 3.556067481174817e-05, - "loss": 2.4217, - "step": 165600 - }, - { - "epoch": 0.29, - "learning_rate": 3.555980287182134e-05, - "loss": 2.5536, - "step": 165610 - }, - { - "epoch": 0.29, - "learning_rate": 3.555893093189452e-05, - "loss": 2.3338, - "step": 165620 - }, - { - "epoch": 0.29, - "learning_rate": 3.555805899196769e-05, - "loss": 2.476, - "step": 165630 - }, - { - "epoch": 0.29, - "learning_rate": 3.555718705204086e-05, - "loss": 2.4061, - "step": 165640 - }, - { - "epoch": 0.29, - "learning_rate": 3.555631511211404e-05, - "loss": 2.4849, - "step": 165650 - }, - { - "epoch": 0.29, - "learning_rate": 3.555544317218721e-05, - "loss": 2.482, - "step": 165660 - }, - { - "epoch": 0.29, - "learning_rate": 3.5554571232260385e-05, - "loss": 2.5204, - "step": 165670 - }, - { - "epoch": 0.29, - "learning_rate": 3.5553699292333556e-05, - "loss": 2.4538, - "step": 165680 - }, - { - "epoch": 0.29, - "learning_rate": 3.555282735240673e-05, - "loss": 2.3613, - "step": 165690 - }, - { - "epoch": 0.29, - "learning_rate": 3.55519554124799e-05, - "loss": 2.4801, - "step": 165700 - }, - { - "epoch": 0.29, - "learning_rate": 3.5551083472553074e-05, - "loss": 2.4775, - "step": 165710 - }, - { - "epoch": 0.29, - "learning_rate": 3.555021153262625e-05, - "loss": 2.5998, - "step": 165720 - }, - { - "epoch": 0.29, - "learning_rate": 3.554933959269942e-05, - "loss": 2.5338, - "step": 165730 - }, - { - "epoch": 0.29, - "learning_rate": 3.55484676527726e-05, - "loss": 2.3647, - "step": 165740 - }, - { - "epoch": 0.29, - "learning_rate": 3.554759571284577e-05, - "loss": 2.4646, - "step": 165750 - }, - { - "epoch": 0.29, - "learning_rate": 3.5546723772918946e-05, - "loss": 2.5317, - "step": 165760 - }, - { - "epoch": 0.29, - "learning_rate": 3.5545851832992116e-05, - "loss": 2.4301, - "step": 165770 - }, - { - "epoch": 0.29, - "learning_rate": 3.554497989306529e-05, - "loss": 2.3837, - "step": 165780 - }, - { - "epoch": 0.29, - "learning_rate": 3.5544107953138464e-05, - "loss": 2.3855, - "step": 165790 - }, - { - "epoch": 0.29, - "learning_rate": 3.5543236013211634e-05, - "loss": 2.4639, - "step": 165800 - }, - { - "epoch": 0.29, - "learning_rate": 3.5542364073284805e-05, - "loss": 2.3749, - "step": 165810 - }, - { - "epoch": 0.29, - "learning_rate": 3.554149213335798e-05, - "loss": 2.4193, - "step": 165820 - }, - { - "epoch": 0.29, - "learning_rate": 3.554062019343116e-05, - "loss": 2.4932, - "step": 165830 - }, - { - "epoch": 0.29, - "learning_rate": 3.553974825350433e-05, - "loss": 2.5595, - "step": 165840 - }, - { - "epoch": 0.29, - "learning_rate": 3.55388763135775e-05, - "loss": 2.4528, - "step": 165850 - }, - { - "epoch": 0.29, - "learning_rate": 3.553800437365068e-05, - "loss": 2.46, - "step": 165860 - }, - { - "epoch": 0.29, - "learning_rate": 3.553713243372385e-05, - "loss": 2.5175, - "step": 165870 - }, - { - "epoch": 0.29, - "learning_rate": 3.553626049379702e-05, - "loss": 2.5066, - "step": 165880 - }, - { - "epoch": 0.29, - "learning_rate": 3.5535388553870195e-05, - "loss": 2.4617, - "step": 165890 - }, - { - "epoch": 0.29, - "learning_rate": 3.553451661394337e-05, - "loss": 2.4986, - "step": 165900 - }, - { - "epoch": 0.29, - "learning_rate": 3.553364467401654e-05, - "loss": 2.5352, - "step": 165910 - }, - { - "epoch": 0.29, - "learning_rate": 3.553277273408971e-05, - "loss": 2.5039, - "step": 165920 - }, - { - "epoch": 0.29, - "learning_rate": 3.553190079416289e-05, - "loss": 2.4456, - "step": 165930 - }, - { - "epoch": 0.29, - "learning_rate": 3.553102885423606e-05, - "loss": 2.4385, - "step": 165940 - }, - { - "epoch": 0.29, - "learning_rate": 3.553015691430923e-05, - "loss": 2.5003, - "step": 165950 - }, - { - "epoch": 0.29, - "learning_rate": 3.55292849743824e-05, - "loss": 2.4418, - "step": 165960 - }, - { - "epoch": 0.29, - "learning_rate": 3.5528413034455585e-05, - "loss": 2.4694, - "step": 165970 - }, - { - "epoch": 0.29, - "learning_rate": 3.5527541094528755e-05, - "loss": 2.4026, - "step": 165980 - }, - { - "epoch": 0.29, - "learning_rate": 3.5526669154601926e-05, - "loss": 2.4127, - "step": 165990 - }, - { - "epoch": 0.29, - "learning_rate": 3.5525797214675096e-05, - "loss": 2.4963, - "step": 166000 - }, - { - "epoch": 0.29, - "learning_rate": 3.552492527474827e-05, - "loss": 2.4053, - "step": 166010 - }, - { - "epoch": 0.29, - "learning_rate": 3.5524053334821444e-05, - "loss": 2.4972, - "step": 166020 - }, - { - "epoch": 0.29, - "learning_rate": 3.5523181394894614e-05, - "loss": 2.4792, - "step": 166030 - }, - { - "epoch": 0.29, - "learning_rate": 3.55223094549678e-05, - "loss": 2.502, - "step": 166040 - }, - { - "epoch": 0.29, - "learning_rate": 3.552143751504097e-05, - "loss": 2.4581, - "step": 166050 - }, - { - "epoch": 0.29, - "learning_rate": 3.552056557511414e-05, - "loss": 2.4615, - "step": 166060 - }, - { - "epoch": 0.29, - "learning_rate": 3.551969363518731e-05, - "loss": 2.4633, - "step": 166070 - }, - { - "epoch": 0.29, - "learning_rate": 3.5518821695260486e-05, - "loss": 2.528, - "step": 166080 - }, - { - "epoch": 0.29, - "learning_rate": 3.551794975533366e-05, - "loss": 2.4119, - "step": 166090 - }, - { - "epoch": 0.29, - "learning_rate": 3.551707781540683e-05, - "loss": 2.4505, - "step": 166100 - }, - { - "epoch": 0.29, - "learning_rate": 3.5516205875480004e-05, - "loss": 2.3717, - "step": 166110 - }, - { - "epoch": 0.29, - "learning_rate": 3.551533393555318e-05, - "loss": 2.4343, - "step": 166120 - }, - { - "epoch": 0.29, - "learning_rate": 3.551446199562635e-05, - "loss": 2.4637, - "step": 166130 - }, - { - "epoch": 0.29, - "learning_rate": 3.551359005569952e-05, - "loss": 2.5498, - "step": 166140 - }, - { - "epoch": 0.29, - "learning_rate": 3.55127181157727e-05, - "loss": 2.495, - "step": 166150 - }, - { - "epoch": 0.29, - "learning_rate": 3.551184617584587e-05, - "loss": 2.4986, - "step": 166160 - }, - { - "epoch": 0.29, - "learning_rate": 3.551097423591904e-05, - "loss": 2.4281, - "step": 166170 - }, - { - "epoch": 0.29, - "learning_rate": 3.551010229599222e-05, - "loss": 2.4873, - "step": 166180 - }, - { - "epoch": 0.29, - "learning_rate": 3.5509230356065394e-05, - "loss": 2.5315, - "step": 166190 - }, - { - "epoch": 0.29, - "learning_rate": 3.5508358416138565e-05, - "loss": 2.5263, - "step": 166200 - }, - { - "epoch": 0.29, - "learning_rate": 3.5507486476211735e-05, - "loss": 2.5171, - "step": 166210 - }, - { - "epoch": 0.29, - "learning_rate": 3.550661453628491e-05, - "loss": 2.408, - "step": 166220 - }, - { - "epoch": 0.29, - "learning_rate": 3.550574259635808e-05, - "loss": 2.3325, - "step": 166230 - }, - { - "epoch": 0.29, - "learning_rate": 3.550487065643125e-05, - "loss": 2.5064, - "step": 166240 - }, - { - "epoch": 0.29, - "learning_rate": 3.550399871650443e-05, - "loss": 2.531, - "step": 166250 - }, - { - "epoch": 0.29, - "learning_rate": 3.55031267765776e-05, - "loss": 2.4481, - "step": 166260 - }, - { - "epoch": 0.29, - "learning_rate": 3.550225483665078e-05, - "loss": 2.6393, - "step": 166270 - }, - { - "epoch": 0.29, - "learning_rate": 3.550138289672395e-05, - "loss": 2.3866, - "step": 166280 - }, - { - "epoch": 0.29, - "learning_rate": 3.5500510956797125e-05, - "loss": 2.4442, - "step": 166290 - }, - { - "epoch": 0.29, - "learning_rate": 3.5499639016870296e-05, - "loss": 2.3262, - "step": 166300 - }, - { - "epoch": 0.29, - "learning_rate": 3.5498767076943466e-05, - "loss": 2.3473, - "step": 166310 - }, - { - "epoch": 0.29, - "learning_rate": 3.549789513701664e-05, - "loss": 2.4574, - "step": 166320 - }, - { - "epoch": 0.29, - "learning_rate": 3.5497023197089814e-05, - "loss": 2.4369, - "step": 166330 - }, - { - "epoch": 0.29, - "learning_rate": 3.549615125716299e-05, - "loss": 2.4616, - "step": 166340 - }, - { - "epoch": 0.29, - "learning_rate": 3.549527931723616e-05, - "loss": 2.5159, - "step": 166350 - }, - { - "epoch": 0.29, - "learning_rate": 3.549440737730934e-05, - "loss": 2.2647, - "step": 166360 - }, - { - "epoch": 0.29, - "learning_rate": 3.549353543738251e-05, - "loss": 2.5083, - "step": 166370 - }, - { - "epoch": 0.29, - "learning_rate": 3.549266349745568e-05, - "loss": 2.4601, - "step": 166380 - }, - { - "epoch": 0.29, - "learning_rate": 3.5491791557528856e-05, - "loss": 2.4143, - "step": 166390 - }, - { - "epoch": 0.29, - "learning_rate": 3.5490919617602027e-05, - "loss": 2.3872, - "step": 166400 - }, - { - "epoch": 0.29, - "learning_rate": 3.5490047677675204e-05, - "loss": 2.4757, - "step": 166410 - }, - { - "epoch": 0.29, - "learning_rate": 3.5489175737748374e-05, - "loss": 2.426, - "step": 166420 - }, - { - "epoch": 0.29, - "learning_rate": 3.548830379782155e-05, - "loss": 2.4325, - "step": 166430 - }, - { - "epoch": 0.29, - "learning_rate": 3.548743185789472e-05, - "loss": 2.5182, - "step": 166440 - }, - { - "epoch": 0.29, - "learning_rate": 3.548655991796789e-05, - "loss": 2.4776, - "step": 166450 - }, - { - "epoch": 0.29, - "learning_rate": 3.548568797804106e-05, - "loss": 2.4819, - "step": 166460 - }, - { - "epoch": 0.29, - "learning_rate": 3.548481603811424e-05, - "loss": 2.4571, - "step": 166470 - }, - { - "epoch": 0.29, - "learning_rate": 3.548394409818741e-05, - "loss": 2.4906, - "step": 166480 - }, - { - "epoch": 0.29, - "learning_rate": 3.548307215826059e-05, - "loss": 2.3059, - "step": 166490 - }, - { - "epoch": 0.29, - "learning_rate": 3.5482200218333764e-05, - "loss": 2.5139, - "step": 166500 - }, - { - "epoch": 0.29, - "learning_rate": 3.5481328278406935e-05, - "loss": 2.4645, - "step": 166510 - }, - { - "epoch": 0.29, - "learning_rate": 3.5480456338480105e-05, - "loss": 2.4584, - "step": 166520 - }, - { - "epoch": 0.29, - "learning_rate": 3.5479584398553275e-05, - "loss": 2.5249, - "step": 166530 - }, - { - "epoch": 0.29, - "learning_rate": 3.547871245862645e-05, - "loss": 2.3972, - "step": 166540 - }, - { - "epoch": 0.29, - "learning_rate": 3.547784051869962e-05, - "loss": 2.5353, - "step": 166550 - }, - { - "epoch": 0.29, - "learning_rate": 3.54769685787728e-05, - "loss": 2.4966, - "step": 166560 - }, - { - "epoch": 0.29, - "learning_rate": 3.547609663884597e-05, - "loss": 2.5684, - "step": 166570 - }, - { - "epoch": 0.29, - "learning_rate": 3.547522469891915e-05, - "loss": 2.477, - "step": 166580 - }, - { - "epoch": 0.29, - "learning_rate": 3.547435275899232e-05, - "loss": 2.3517, - "step": 166590 - }, - { - "epoch": 0.29, - "learning_rate": 3.547348081906549e-05, - "loss": 2.3799, - "step": 166600 - }, - { - "epoch": 0.29, - "learning_rate": 3.5472608879138666e-05, - "loss": 2.5365, - "step": 166610 - }, - { - "epoch": 0.29, - "learning_rate": 3.5471736939211836e-05, - "loss": 2.448, - "step": 166620 - }, - { - "epoch": 0.29, - "learning_rate": 3.5470864999285006e-05, - "loss": 2.4269, - "step": 166630 - }, - { - "epoch": 0.29, - "learning_rate": 3.5469993059358184e-05, - "loss": 2.5941, - "step": 166640 - }, - { - "epoch": 0.29, - "learning_rate": 3.546912111943136e-05, - "loss": 2.466, - "step": 166650 - }, - { - "epoch": 0.29, - "learning_rate": 3.546824917950453e-05, - "loss": 2.3849, - "step": 166660 - }, - { - "epoch": 0.29, - "learning_rate": 3.54673772395777e-05, - "loss": 2.4722, - "step": 166670 - }, - { - "epoch": 0.29, - "learning_rate": 3.546650529965088e-05, - "loss": 2.534, - "step": 166680 - }, - { - "epoch": 0.29, - "learning_rate": 3.546563335972405e-05, - "loss": 2.551, - "step": 166690 - }, - { - "epoch": 0.29, - "learning_rate": 3.546476141979722e-05, - "loss": 2.3644, - "step": 166700 - }, - { - "epoch": 0.29, - "learning_rate": 3.5463889479870397e-05, - "loss": 2.3399, - "step": 166710 - }, - { - "epoch": 0.29, - "learning_rate": 3.5463017539943574e-05, - "loss": 2.4451, - "step": 166720 - }, - { - "epoch": 0.29, - "learning_rate": 3.5462145600016744e-05, - "loss": 2.4629, - "step": 166730 - }, - { - "epoch": 0.29, - "learning_rate": 3.5461273660089914e-05, - "loss": 2.4476, - "step": 166740 - }, - { - "epoch": 0.29, - "learning_rate": 3.546040172016309e-05, - "loss": 2.3844, - "step": 166750 - }, - { - "epoch": 0.29, - "learning_rate": 3.545952978023626e-05, - "loss": 2.4374, - "step": 166760 - }, - { - "epoch": 0.29, - "learning_rate": 3.545865784030943e-05, - "loss": 2.6131, - "step": 166770 - }, - { - "epoch": 0.29, - "learning_rate": 3.545778590038261e-05, - "loss": 2.4787, - "step": 166780 - }, - { - "epoch": 0.29, - "learning_rate": 3.545691396045579e-05, - "loss": 2.4375, - "step": 166790 - }, - { - "epoch": 0.29, - "learning_rate": 3.545604202052896e-05, - "loss": 2.4365, - "step": 166800 - }, - { - "epoch": 0.29, - "learning_rate": 3.545517008060213e-05, - "loss": 2.5628, - "step": 166810 - }, - { - "epoch": 0.29, - "learning_rate": 3.5454298140675305e-05, - "loss": 2.4755, - "step": 166820 - }, - { - "epoch": 0.29, - "learning_rate": 3.5453426200748475e-05, - "loss": 2.4974, - "step": 166830 - }, - { - "epoch": 0.29, - "learning_rate": 3.5452554260821645e-05, - "loss": 2.5527, - "step": 166840 - }, - { - "epoch": 0.29, - "learning_rate": 3.5451682320894816e-05, - "loss": 2.554, - "step": 166850 - }, - { - "epoch": 0.29, - "learning_rate": 3.5450810380968e-05, - "loss": 2.4496, - "step": 166860 - }, - { - "epoch": 0.29, - "learning_rate": 3.544993844104117e-05, - "loss": 2.4068, - "step": 166870 - }, - { - "epoch": 0.29, - "learning_rate": 3.544906650111434e-05, - "loss": 2.3906, - "step": 166880 - }, - { - "epoch": 0.29, - "learning_rate": 3.544819456118752e-05, - "loss": 2.4405, - "step": 166890 - }, - { - "epoch": 0.29, - "learning_rate": 3.544732262126069e-05, - "loss": 2.4183, - "step": 166900 - }, - { - "epoch": 0.29, - "learning_rate": 3.544645068133386e-05, - "loss": 2.4636, - "step": 166910 - }, - { - "epoch": 0.29, - "learning_rate": 3.544557874140703e-05, - "loss": 2.3897, - "step": 166920 - }, - { - "epoch": 0.29, - "learning_rate": 3.5444706801480206e-05, - "loss": 2.4287, - "step": 166930 - }, - { - "epoch": 0.29, - "learning_rate": 3.544383486155338e-05, - "loss": 2.5287, - "step": 166940 - }, - { - "epoch": 0.29, - "learning_rate": 3.5442962921626553e-05, - "loss": 2.5049, - "step": 166950 - }, - { - "epoch": 0.29, - "learning_rate": 3.5442090981699724e-05, - "loss": 2.4281, - "step": 166960 - }, - { - "epoch": 0.29, - "learning_rate": 3.54412190417729e-05, - "loss": 2.4498, - "step": 166970 - }, - { - "epoch": 0.29, - "learning_rate": 3.544034710184607e-05, - "loss": 2.3228, - "step": 166980 - }, - { - "epoch": 0.29, - "learning_rate": 3.543947516191924e-05, - "loss": 2.4957, - "step": 166990 - }, - { - "epoch": 0.29, - "learning_rate": 3.543860322199242e-05, - "loss": 2.5492, - "step": 167000 - }, - { - "epoch": 0.29, - "learning_rate": 3.5437731282065596e-05, - "loss": 2.5168, - "step": 167010 - }, - { - "epoch": 0.29, - "learning_rate": 3.5436859342138766e-05, - "loss": 2.5529, - "step": 167020 - }, - { - "epoch": 0.29, - "learning_rate": 3.543598740221194e-05, - "loss": 2.4013, - "step": 167030 - }, - { - "epoch": 0.29, - "learning_rate": 3.5435115462285114e-05, - "loss": 2.367, - "step": 167040 - }, - { - "epoch": 0.29, - "learning_rate": 3.5434243522358284e-05, - "loss": 2.5402, - "step": 167050 - }, - { - "epoch": 0.29, - "learning_rate": 3.5433371582431455e-05, - "loss": 2.5249, - "step": 167060 - }, - { - "epoch": 0.29, - "learning_rate": 3.543249964250463e-05, - "loss": 2.3472, - "step": 167070 - }, - { - "epoch": 0.29, - "learning_rate": 3.543162770257781e-05, - "loss": 2.3929, - "step": 167080 - }, - { - "epoch": 0.29, - "learning_rate": 3.543075576265098e-05, - "loss": 2.5685, - "step": 167090 - }, - { - "epoch": 0.29, - "learning_rate": 3.542988382272415e-05, - "loss": 2.3922, - "step": 167100 - }, - { - "epoch": 0.29, - "learning_rate": 3.542901188279733e-05, - "loss": 2.4528, - "step": 167110 - }, - { - "epoch": 0.29, - "learning_rate": 3.54281399428705e-05, - "loss": 2.4981, - "step": 167120 - }, - { - "epoch": 0.29, - "learning_rate": 3.542726800294367e-05, - "loss": 2.4471, - "step": 167130 - }, - { - "epoch": 0.29, - "learning_rate": 3.5426396063016845e-05, - "loss": 2.4437, - "step": 167140 - }, - { - "epoch": 0.29, - "learning_rate": 3.5425524123090015e-05, - "loss": 2.3641, - "step": 167150 - }, - { - "epoch": 0.29, - "learning_rate": 3.542465218316319e-05, - "loss": 2.4525, - "step": 167160 - }, - { - "epoch": 0.29, - "learning_rate": 3.542378024323636e-05, - "loss": 2.3183, - "step": 167170 - }, - { - "epoch": 0.29, - "learning_rate": 3.542290830330954e-05, - "loss": 2.5476, - "step": 167180 - }, - { - "epoch": 0.29, - "learning_rate": 3.542203636338271e-05, - "loss": 2.4978, - "step": 167190 - }, - { - "epoch": 0.29, - "learning_rate": 3.542116442345588e-05, - "loss": 2.5051, - "step": 167200 - }, - { - "epoch": 0.29, - "learning_rate": 3.542029248352906e-05, - "loss": 2.5498, - "step": 167210 - }, - { - "epoch": 0.29, - "learning_rate": 3.541942054360223e-05, - "loss": 2.3269, - "step": 167220 - }, - { - "epoch": 0.29, - "learning_rate": 3.5418548603675405e-05, - "loss": 2.4043, - "step": 167230 - }, - { - "epoch": 0.29, - "learning_rate": 3.5417676663748576e-05, - "loss": 2.4945, - "step": 167240 - }, - { - "epoch": 0.29, - "learning_rate": 3.541680472382175e-05, - "loss": 2.4872, - "step": 167250 - }, - { - "epoch": 0.29, - "learning_rate": 3.541593278389492e-05, - "loss": 2.4399, - "step": 167260 - }, - { - "epoch": 0.29, - "learning_rate": 3.5415060843968094e-05, - "loss": 2.4093, - "step": 167270 - }, - { - "epoch": 0.29, - "learning_rate": 3.541418890404127e-05, - "loss": 2.5422, - "step": 167280 - }, - { - "epoch": 0.29, - "learning_rate": 3.541331696411444e-05, - "loss": 2.4887, - "step": 167290 - }, - { - "epoch": 0.29, - "learning_rate": 3.541244502418761e-05, - "loss": 2.4559, - "step": 167300 - }, - { - "epoch": 0.29, - "learning_rate": 3.541157308426079e-05, - "loss": 2.4926, - "step": 167310 - }, - { - "epoch": 0.29, - "learning_rate": 3.5410701144333966e-05, - "loss": 2.5435, - "step": 167320 - }, - { - "epoch": 0.29, - "learning_rate": 3.5409829204407136e-05, - "loss": 2.5389, - "step": 167330 - }, - { - "epoch": 0.29, - "learning_rate": 3.540895726448031e-05, - "loss": 2.4541, - "step": 167340 - }, - { - "epoch": 0.29, - "learning_rate": 3.540808532455348e-05, - "loss": 2.3828, - "step": 167350 - }, - { - "epoch": 0.29, - "learning_rate": 3.5407213384626654e-05, - "loss": 2.4292, - "step": 167360 - }, - { - "epoch": 0.29, - "learning_rate": 3.5406341444699825e-05, - "loss": 2.4625, - "step": 167370 - }, - { - "epoch": 0.29, - "learning_rate": 3.5405469504773e-05, - "loss": 2.408, - "step": 167380 - }, - { - "epoch": 0.29, - "learning_rate": 3.540459756484618e-05, - "loss": 2.5149, - "step": 167390 - }, - { - "epoch": 0.29, - "learning_rate": 3.540372562491935e-05, - "loss": 2.4246, - "step": 167400 - }, - { - "epoch": 0.29, - "learning_rate": 3.540285368499252e-05, - "loss": 2.513, - "step": 167410 - }, - { - "epoch": 0.29, - "learning_rate": 3.540198174506569e-05, - "loss": 2.4599, - "step": 167420 - }, - { - "epoch": 0.29, - "learning_rate": 3.540110980513887e-05, - "loss": 2.5593, - "step": 167430 - }, - { - "epoch": 0.29, - "learning_rate": 3.540023786521204e-05, - "loss": 2.4391, - "step": 167440 - }, - { - "epoch": 0.29, - "learning_rate": 3.539936592528521e-05, - "loss": 2.3684, - "step": 167450 - }, - { - "epoch": 0.29, - "learning_rate": 3.5398493985358385e-05, - "loss": 2.4891, - "step": 167460 - }, - { - "epoch": 0.29, - "learning_rate": 3.539762204543156e-05, - "loss": 2.3801, - "step": 167470 - }, - { - "epoch": 0.29, - "learning_rate": 3.539675010550473e-05, - "loss": 2.4378, - "step": 167480 - }, - { - "epoch": 0.29, - "learning_rate": 3.53958781655779e-05, - "loss": 2.5027, - "step": 167490 - }, - { - "epoch": 0.29, - "learning_rate": 3.539500622565108e-05, - "loss": 2.5005, - "step": 167500 - }, - { - "epoch": 0.29, - "learning_rate": 3.539413428572425e-05, - "loss": 2.5704, - "step": 167510 - }, - { - "epoch": 0.29, - "learning_rate": 3.539326234579742e-05, - "loss": 2.4681, - "step": 167520 - }, - { - "epoch": 0.29, - "learning_rate": 3.53923904058706e-05, - "loss": 2.4243, - "step": 167530 - }, - { - "epoch": 0.29, - "learning_rate": 3.5391518465943775e-05, - "loss": 2.5039, - "step": 167540 - }, - { - "epoch": 0.29, - "learning_rate": 3.5390646526016946e-05, - "loss": 2.5044, - "step": 167550 - }, - { - "epoch": 0.29, - "learning_rate": 3.5389774586090116e-05, - "loss": 2.3394, - "step": 167560 - }, - { - "epoch": 0.29, - "learning_rate": 3.538890264616329e-05, - "loss": 2.6213, - "step": 167570 - }, - { - "epoch": 0.29, - "learning_rate": 3.5388030706236464e-05, - "loss": 2.3932, - "step": 167580 - }, - { - "epoch": 0.29, - "learning_rate": 3.5387158766309634e-05, - "loss": 2.4945, - "step": 167590 - }, - { - "epoch": 0.29, - "learning_rate": 3.538628682638281e-05, - "loss": 2.3556, - "step": 167600 - }, - { - "epoch": 0.29, - "learning_rate": 3.538541488645599e-05, - "loss": 2.3652, - "step": 167610 - }, - { - "epoch": 0.29, - "learning_rate": 3.538454294652916e-05, - "loss": 2.4347, - "step": 167620 - }, - { - "epoch": 0.29, - "learning_rate": 3.538367100660233e-05, - "loss": 2.5093, - "step": 167630 - }, - { - "epoch": 0.29, - "learning_rate": 3.5382799066675506e-05, - "loss": 2.4627, - "step": 167640 - }, - { - "epoch": 0.29, - "learning_rate": 3.538192712674868e-05, - "loss": 2.4024, - "step": 167650 - }, - { - "epoch": 0.29, - "learning_rate": 3.538105518682185e-05, - "loss": 2.5644, - "step": 167660 - }, - { - "epoch": 0.29, - "learning_rate": 3.5380183246895024e-05, - "loss": 2.3824, - "step": 167670 - }, - { - "epoch": 0.29, - "learning_rate": 3.53793113069682e-05, - "loss": 2.484, - "step": 167680 - }, - { - "epoch": 0.29, - "learning_rate": 3.537843936704137e-05, - "loss": 2.4867, - "step": 167690 - }, - { - "epoch": 0.29, - "learning_rate": 3.537756742711454e-05, - "loss": 2.3815, - "step": 167700 - }, - { - "epoch": 0.29, - "learning_rate": 3.537669548718772e-05, - "loss": 2.4159, - "step": 167710 - }, - { - "epoch": 0.29, - "learning_rate": 3.537582354726089e-05, - "loss": 2.4514, - "step": 167720 - }, - { - "epoch": 0.29, - "learning_rate": 3.537495160733406e-05, - "loss": 2.4168, - "step": 167730 - }, - { - "epoch": 0.29, - "learning_rate": 3.537407966740724e-05, - "loss": 2.516, - "step": 167740 - }, - { - "epoch": 0.29, - "learning_rate": 3.5373207727480414e-05, - "loss": 2.4593, - "step": 167750 - }, - { - "epoch": 0.29, - "learning_rate": 3.5372335787553585e-05, - "loss": 2.4126, - "step": 167760 - }, - { - "epoch": 0.29, - "learning_rate": 3.5371463847626755e-05, - "loss": 2.5254, - "step": 167770 - }, - { - "epoch": 0.29, - "learning_rate": 3.537059190769993e-05, - "loss": 2.4948, - "step": 167780 - }, - { - "epoch": 0.29, - "learning_rate": 3.53697199677731e-05, - "loss": 2.4072, - "step": 167790 - }, - { - "epoch": 0.29, - "learning_rate": 3.536884802784627e-05, - "loss": 2.4212, - "step": 167800 - }, - { - "epoch": 0.29, - "learning_rate": 3.5367976087919443e-05, - "loss": 2.5912, - "step": 167810 - }, - { - "epoch": 0.29, - "learning_rate": 3.536710414799262e-05, - "loss": 2.4645, - "step": 167820 - }, - { - "epoch": 0.29, - "learning_rate": 3.53662322080658e-05, - "loss": 2.4082, - "step": 167830 - }, - { - "epoch": 0.29, - "learning_rate": 3.536536026813897e-05, - "loss": 2.3787, - "step": 167840 - }, - { - "epoch": 0.29, - "learning_rate": 3.5364488328212145e-05, - "loss": 2.5597, - "step": 167850 - }, - { - "epoch": 0.29, - "learning_rate": 3.5363616388285316e-05, - "loss": 2.3858, - "step": 167860 - }, - { - "epoch": 0.29, - "learning_rate": 3.5362744448358486e-05, - "loss": 2.4648, - "step": 167870 - }, - { - "epoch": 0.29, - "learning_rate": 3.5361872508431656e-05, - "loss": 2.3653, - "step": 167880 - }, - { - "epoch": 0.29, - "learning_rate": 3.5361000568504834e-05, - "loss": 2.309, - "step": 167890 - }, - { - "epoch": 0.29, - "learning_rate": 3.536012862857801e-05, - "loss": 2.5142, - "step": 167900 - }, - { - "epoch": 0.29, - "learning_rate": 3.535925668865118e-05, - "loss": 2.5591, - "step": 167910 - }, - { - "epoch": 0.29, - "learning_rate": 3.535838474872435e-05, - "loss": 2.5658, - "step": 167920 - }, - { - "epoch": 0.29, - "learning_rate": 3.535751280879753e-05, - "loss": 2.4736, - "step": 167930 - }, - { - "epoch": 0.29, - "learning_rate": 3.53566408688707e-05, - "loss": 2.4847, - "step": 167940 - }, - { - "epoch": 0.29, - "learning_rate": 3.535576892894387e-05, - "loss": 2.4867, - "step": 167950 - }, - { - "epoch": 0.29, - "learning_rate": 3.535489698901705e-05, - "loss": 2.5061, - "step": 167960 - }, - { - "epoch": 0.29, - "learning_rate": 3.535402504909022e-05, - "loss": 2.4292, - "step": 167970 - }, - { - "epoch": 0.29, - "learning_rate": 3.5353153109163394e-05, - "loss": 2.4158, - "step": 167980 - }, - { - "epoch": 0.29, - "learning_rate": 3.5352281169236565e-05, - "loss": 2.3662, - "step": 167990 - }, - { - "epoch": 0.29, - "learning_rate": 3.535140922930974e-05, - "loss": 2.3809, - "step": 168000 - }, - { - "epoch": 0.29, - "learning_rate": 3.535053728938291e-05, - "loss": 2.4851, - "step": 168010 - }, - { - "epoch": 0.29, - "learning_rate": 3.534966534945608e-05, - "loss": 2.5539, - "step": 168020 - }, - { - "epoch": 0.29, - "learning_rate": 3.534879340952926e-05, - "loss": 2.4808, - "step": 168030 - }, - { - "epoch": 0.29, - "learning_rate": 3.534792146960243e-05, - "loss": 2.4078, - "step": 168040 - }, - { - "epoch": 0.29, - "learning_rate": 3.534704952967561e-05, - "loss": 2.4229, - "step": 168050 - }, - { - "epoch": 0.29, - "learning_rate": 3.534617758974878e-05, - "loss": 2.5643, - "step": 168060 - }, - { - "epoch": 0.29, - "learning_rate": 3.5345305649821955e-05, - "loss": 2.4597, - "step": 168070 - }, - { - "epoch": 0.29, - "learning_rate": 3.5344433709895125e-05, - "loss": 2.4128, - "step": 168080 - }, - { - "epoch": 0.29, - "learning_rate": 3.5343561769968295e-05, - "loss": 2.4249, - "step": 168090 - }, - { - "epoch": 0.29, - "learning_rate": 3.534268983004147e-05, - "loss": 2.4253, - "step": 168100 - }, - { - "epoch": 0.29, - "learning_rate": 3.534181789011464e-05, - "loss": 2.4292, - "step": 168110 - }, - { - "epoch": 0.29, - "learning_rate": 3.534094595018781e-05, - "loss": 2.3837, - "step": 168120 - }, - { - "epoch": 0.29, - "learning_rate": 3.534007401026099e-05, - "loss": 2.4647, - "step": 168130 - }, - { - "epoch": 0.29, - "learning_rate": 3.533920207033417e-05, - "loss": 2.3561, - "step": 168140 - }, - { - "epoch": 0.29, - "learning_rate": 3.533833013040734e-05, - "loss": 2.4867, - "step": 168150 - }, - { - "epoch": 0.29, - "learning_rate": 3.533745819048051e-05, - "loss": 2.4032, - "step": 168160 - }, - { - "epoch": 0.29, - "learning_rate": 3.5336586250553686e-05, - "loss": 2.5519, - "step": 168170 - }, - { - "epoch": 0.29, - "learning_rate": 3.5335714310626856e-05, - "loss": 2.3794, - "step": 168180 - }, - { - "epoch": 0.29, - "learning_rate": 3.5334842370700026e-05, - "loss": 2.3873, - "step": 168190 - }, - { - "epoch": 0.29, - "learning_rate": 3.5333970430773204e-05, - "loss": 2.427, - "step": 168200 - }, - { - "epoch": 0.29, - "learning_rate": 3.533309849084638e-05, - "loss": 2.3977, - "step": 168210 - }, - { - "epoch": 0.29, - "learning_rate": 3.533222655091955e-05, - "loss": 2.4215, - "step": 168220 - }, - { - "epoch": 0.29, - "learning_rate": 3.533135461099272e-05, - "loss": 2.4187, - "step": 168230 - }, - { - "epoch": 0.29, - "learning_rate": 3.53304826710659e-05, - "loss": 2.5239, - "step": 168240 - }, - { - "epoch": 0.29, - "learning_rate": 3.532961073113907e-05, - "loss": 2.4903, - "step": 168250 - }, - { - "epoch": 0.29, - "learning_rate": 3.532873879121224e-05, - "loss": 2.4396, - "step": 168260 - }, - { - "epoch": 0.29, - "learning_rate": 3.5327866851285417e-05, - "loss": 2.4269, - "step": 168270 - }, - { - "epoch": 0.29, - "learning_rate": 3.5326994911358594e-05, - "loss": 2.5431, - "step": 168280 - }, - { - "epoch": 0.29, - "learning_rate": 3.5326122971431764e-05, - "loss": 2.5244, - "step": 168290 - }, - { - "epoch": 0.29, - "learning_rate": 3.5325251031504934e-05, - "loss": 2.531, - "step": 168300 - }, - { - "epoch": 0.29, - "learning_rate": 3.5324379091578105e-05, - "loss": 2.3828, - "step": 168310 - }, - { - "epoch": 0.29, - "learning_rate": 3.532350715165128e-05, - "loss": 2.4002, - "step": 168320 - }, - { - "epoch": 0.29, - "learning_rate": 3.532263521172445e-05, - "loss": 2.4119, - "step": 168330 - }, - { - "epoch": 0.29, - "learning_rate": 3.532176327179762e-05, - "loss": 2.4092, - "step": 168340 - }, - { - "epoch": 0.29, - "learning_rate": 3.532089133187081e-05, - "loss": 2.4178, - "step": 168350 - }, - { - "epoch": 0.29, - "learning_rate": 3.532001939194398e-05, - "loss": 2.385, - "step": 168360 - }, - { - "epoch": 0.29, - "learning_rate": 3.531914745201715e-05, - "loss": 2.3948, - "step": 168370 - }, - { - "epoch": 0.29, - "learning_rate": 3.531827551209032e-05, - "loss": 2.44, - "step": 168380 - }, - { - "epoch": 0.29, - "learning_rate": 3.5317403572163495e-05, - "loss": 2.4606, - "step": 168390 - }, - { - "epoch": 0.29, - "learning_rate": 3.5316531632236665e-05, - "loss": 2.4639, - "step": 168400 - }, - { - "epoch": 0.29, - "learning_rate": 3.5315659692309836e-05, - "loss": 2.5539, - "step": 168410 - }, - { - "epoch": 0.29, - "learning_rate": 3.531478775238301e-05, - "loss": 2.3607, - "step": 168420 - }, - { - "epoch": 0.29, - "learning_rate": 3.531391581245619e-05, - "loss": 2.5212, - "step": 168430 - }, - { - "epoch": 0.29, - "learning_rate": 3.531304387252936e-05, - "loss": 2.504, - "step": 168440 - }, - { - "epoch": 0.29, - "learning_rate": 3.531217193260253e-05, - "loss": 2.3469, - "step": 168450 - }, - { - "epoch": 0.29, - "learning_rate": 3.531129999267571e-05, - "loss": 2.5591, - "step": 168460 - }, - { - "epoch": 0.29, - "learning_rate": 3.531042805274888e-05, - "loss": 2.4587, - "step": 168470 - }, - { - "epoch": 0.29, - "learning_rate": 3.530955611282205e-05, - "loss": 2.598, - "step": 168480 - }, - { - "epoch": 0.29, - "learning_rate": 3.5308684172895226e-05, - "loss": 2.4452, - "step": 168490 - }, - { - "epoch": 0.29, - "learning_rate": 3.53078122329684e-05, - "loss": 2.5471, - "step": 168500 - }, - { - "epoch": 0.29, - "learning_rate": 3.5306940293041573e-05, - "loss": 2.4438, - "step": 168510 - }, - { - "epoch": 0.29, - "learning_rate": 3.5306068353114744e-05, - "loss": 2.5603, - "step": 168520 - }, - { - "epoch": 0.29, - "learning_rate": 3.530519641318792e-05, - "loss": 2.4473, - "step": 168530 - }, - { - "epoch": 0.29, - "learning_rate": 3.530432447326109e-05, - "loss": 2.5166, - "step": 168540 - }, - { - "epoch": 0.29, - "learning_rate": 3.530345253333426e-05, - "loss": 2.3941, - "step": 168550 - }, - { - "epoch": 0.29, - "learning_rate": 3.530258059340744e-05, - "loss": 2.4741, - "step": 168560 - }, - { - "epoch": 0.29, - "learning_rate": 3.5301708653480616e-05, - "loss": 2.535, - "step": 168570 - }, - { - "epoch": 0.29, - "learning_rate": 3.5300836713553786e-05, - "loss": 2.4841, - "step": 168580 - }, - { - "epoch": 0.29, - "learning_rate": 3.529996477362696e-05, - "loss": 2.4588, - "step": 168590 - }, - { - "epoch": 0.29, - "learning_rate": 3.5299092833700134e-05, - "loss": 2.5207, - "step": 168600 - }, - { - "epoch": 0.29, - "learning_rate": 3.5298220893773304e-05, - "loss": 2.4895, - "step": 168610 - }, - { - "epoch": 0.29, - "learning_rate": 3.5297348953846475e-05, - "loss": 2.4612, - "step": 168620 - }, - { - "epoch": 0.29, - "learning_rate": 3.529647701391965e-05, - "loss": 2.4685, - "step": 168630 - }, - { - "epoch": 0.29, - "learning_rate": 3.529560507399282e-05, - "loss": 2.5118, - "step": 168640 - }, - { - "epoch": 0.29, - "learning_rate": 3.5294733134066e-05, - "loss": 2.3397, - "step": 168650 - }, - { - "epoch": 0.29, - "learning_rate": 3.529386119413917e-05, - "loss": 2.3591, - "step": 168660 - }, - { - "epoch": 0.29, - "learning_rate": 3.529298925421235e-05, - "loss": 2.5084, - "step": 168670 - }, - { - "epoch": 0.29, - "learning_rate": 3.529211731428552e-05, - "loss": 2.4749, - "step": 168680 - }, - { - "epoch": 0.29, - "learning_rate": 3.529124537435869e-05, - "loss": 2.5872, - "step": 168690 - }, - { - "epoch": 0.29, - "learning_rate": 3.529037343443186e-05, - "loss": 2.4919, - "step": 168700 - }, - { - "epoch": 0.29, - "learning_rate": 3.5289501494505035e-05, - "loss": 2.3341, - "step": 168710 - }, - { - "epoch": 0.29, - "learning_rate": 3.528862955457821e-05, - "loss": 2.3201, - "step": 168720 - }, - { - "epoch": 0.29, - "learning_rate": 3.528775761465138e-05, - "loss": 2.4643, - "step": 168730 - }, - { - "epoch": 0.29, - "learning_rate": 3.528688567472456e-05, - "loss": 2.4143, - "step": 168740 - }, - { - "epoch": 0.29, - "learning_rate": 3.528601373479773e-05, - "loss": 2.4467, - "step": 168750 - }, - { - "epoch": 0.29, - "learning_rate": 3.52851417948709e-05, - "loss": 2.4602, - "step": 168760 - }, - { - "epoch": 0.29, - "learning_rate": 3.528426985494407e-05, - "loss": 2.438, - "step": 168770 - }, - { - "epoch": 0.29, - "learning_rate": 3.528339791501725e-05, - "loss": 2.4321, - "step": 168780 - }, - { - "epoch": 0.29, - "learning_rate": 3.528252597509042e-05, - "loss": 2.336, - "step": 168790 - }, - { - "epoch": 0.29, - "learning_rate": 3.5281654035163596e-05, - "loss": 2.473, - "step": 168800 - }, - { - "epoch": 0.29, - "learning_rate": 3.5280782095236766e-05, - "loss": 2.5285, - "step": 168810 - }, - { - "epoch": 0.29, - "learning_rate": 3.5279910155309943e-05, - "loss": 2.4396, - "step": 168820 - }, - { - "epoch": 0.29, - "learning_rate": 3.5279038215383114e-05, - "loss": 2.5216, - "step": 168830 - }, - { - "epoch": 0.29, - "learning_rate": 3.5278166275456284e-05, - "loss": 2.4411, - "step": 168840 - }, - { - "epoch": 0.29, - "learning_rate": 3.527729433552946e-05, - "loss": 2.4334, - "step": 168850 - }, - { - "epoch": 0.29, - "learning_rate": 3.527642239560263e-05, - "loss": 2.4952, - "step": 168860 - }, - { - "epoch": 0.29, - "learning_rate": 3.527555045567581e-05, - "loss": 2.4104, - "step": 168870 - }, - { - "epoch": 0.29, - "learning_rate": 3.527467851574898e-05, - "loss": 2.4974, - "step": 168880 - }, - { - "epoch": 0.29, - "learning_rate": 3.5273806575822156e-05, - "loss": 2.5858, - "step": 168890 - }, - { - "epoch": 0.29, - "learning_rate": 3.527293463589533e-05, - "loss": 2.5843, - "step": 168900 - }, - { - "epoch": 0.29, - "learning_rate": 3.52720626959685e-05, - "loss": 2.5252, - "step": 168910 - }, - { - "epoch": 0.29, - "learning_rate": 3.5271190756041674e-05, - "loss": 2.4999, - "step": 168920 - }, - { - "epoch": 0.29, - "learning_rate": 3.5270318816114845e-05, - "loss": 2.5392, - "step": 168930 - }, - { - "epoch": 0.29, - "learning_rate": 3.526944687618802e-05, - "loss": 2.4938, - "step": 168940 - }, - { - "epoch": 0.29, - "learning_rate": 3.526857493626119e-05, - "loss": 2.4556, - "step": 168950 - }, - { - "epoch": 0.29, - "learning_rate": 3.526770299633437e-05, - "loss": 2.481, - "step": 168960 - }, - { - "epoch": 0.29, - "learning_rate": 3.526683105640754e-05, - "loss": 2.4818, - "step": 168970 - }, - { - "epoch": 0.29, - "learning_rate": 3.526595911648071e-05, - "loss": 2.5869, - "step": 168980 - }, - { - "epoch": 0.29, - "learning_rate": 3.526508717655389e-05, - "loss": 2.3808, - "step": 168990 - }, - { - "epoch": 0.29, - "learning_rate": 3.526421523662706e-05, - "loss": 2.3291, - "step": 169000 - }, - { - "epoch": 0.29, - "learning_rate": 3.526334329670023e-05, - "loss": 2.431, - "step": 169010 - }, - { - "epoch": 0.29, - "learning_rate": 3.5262471356773405e-05, - "loss": 2.3751, - "step": 169020 - }, - { - "epoch": 0.29, - "learning_rate": 3.526159941684658e-05, - "loss": 2.4939, - "step": 169030 - }, - { - "epoch": 0.29, - "learning_rate": 3.526072747691975e-05, - "loss": 2.4091, - "step": 169040 - }, - { - "epoch": 0.29, - "learning_rate": 3.525985553699292e-05, - "loss": 2.5762, - "step": 169050 - }, - { - "epoch": 0.29, - "learning_rate": 3.52589835970661e-05, - "loss": 2.4489, - "step": 169060 - }, - { - "epoch": 0.29, - "learning_rate": 3.525811165713927e-05, - "loss": 2.4814, - "step": 169070 - }, - { - "epoch": 0.29, - "learning_rate": 3.525723971721244e-05, - "loss": 2.5183, - "step": 169080 - }, - { - "epoch": 0.29, - "learning_rate": 3.525636777728562e-05, - "loss": 2.5138, - "step": 169090 - }, - { - "epoch": 0.29, - "learning_rate": 3.5255495837358795e-05, - "loss": 2.3706, - "step": 169100 - }, - { - "epoch": 0.29, - "learning_rate": 3.5254623897431966e-05, - "loss": 2.3754, - "step": 169110 - }, - { - "epoch": 0.29, - "learning_rate": 3.5253751957505136e-05, - "loss": 2.4297, - "step": 169120 - }, - { - "epoch": 0.29, - "learning_rate": 3.525288001757831e-05, - "loss": 2.4091, - "step": 169130 - }, - { - "epoch": 0.29, - "learning_rate": 3.5252008077651484e-05, - "loss": 2.5541, - "step": 169140 - }, - { - "epoch": 0.29, - "learning_rate": 3.5251136137724654e-05, - "loss": 2.518, - "step": 169150 - }, - { - "epoch": 0.29, - "learning_rate": 3.5250264197797824e-05, - "loss": 2.4313, - "step": 169160 - }, - { - "epoch": 0.3, - "learning_rate": 3.524939225787101e-05, - "loss": 2.4291, - "step": 169170 - }, - { - "epoch": 0.3, - "learning_rate": 3.524852031794418e-05, - "loss": 2.4187, - "step": 169180 - }, - { - "epoch": 0.3, - "learning_rate": 3.524764837801735e-05, - "loss": 2.3611, - "step": 169190 - }, - { - "epoch": 0.3, - "learning_rate": 3.5246776438090526e-05, - "loss": 2.5302, - "step": 169200 - }, - { - "epoch": 0.3, - "learning_rate": 3.52459044981637e-05, - "loss": 2.6025, - "step": 169210 - }, - { - "epoch": 0.3, - "learning_rate": 3.524503255823687e-05, - "loss": 2.4825, - "step": 169220 - }, - { - "epoch": 0.3, - "learning_rate": 3.524416061831004e-05, - "loss": 2.2108, - "step": 169230 - }, - { - "epoch": 0.3, - "learning_rate": 3.524328867838322e-05, - "loss": 2.4297, - "step": 169240 - }, - { - "epoch": 0.3, - "learning_rate": 3.524241673845639e-05, - "loss": 2.3878, - "step": 169250 - }, - { - "epoch": 0.3, - "learning_rate": 3.524154479852956e-05, - "loss": 2.4975, - "step": 169260 - }, - { - "epoch": 0.3, - "learning_rate": 3.524067285860273e-05, - "loss": 2.4923, - "step": 169270 - }, - { - "epoch": 0.3, - "learning_rate": 3.523980091867591e-05, - "loss": 2.4842, - "step": 169280 - }, - { - "epoch": 0.3, - "learning_rate": 3.523892897874908e-05, - "loss": 2.4116, - "step": 169290 - }, - { - "epoch": 0.3, - "learning_rate": 3.523805703882225e-05, - "loss": 2.4319, - "step": 169300 - }, - { - "epoch": 0.3, - "learning_rate": 3.523718509889543e-05, - "loss": 2.4734, - "step": 169310 - }, - { - "epoch": 0.3, - "learning_rate": 3.5236313158968605e-05, - "loss": 2.4038, - "step": 169320 - }, - { - "epoch": 0.3, - "learning_rate": 3.5235441219041775e-05, - "loss": 2.5087, - "step": 169330 - }, - { - "epoch": 0.3, - "learning_rate": 3.5234569279114946e-05, - "loss": 2.4814, - "step": 169340 - }, - { - "epoch": 0.3, - "learning_rate": 3.523369733918812e-05, - "loss": 2.4497, - "step": 169350 - }, - { - "epoch": 0.3, - "learning_rate": 3.523282539926129e-05, - "loss": 2.411, - "step": 169360 - }, - { - "epoch": 0.3, - "learning_rate": 3.5231953459334463e-05, - "loss": 2.4608, - "step": 169370 - }, - { - "epoch": 0.3, - "learning_rate": 3.523108151940764e-05, - "loss": 2.4122, - "step": 169380 - }, - { - "epoch": 0.3, - "learning_rate": 3.523020957948082e-05, - "loss": 2.5392, - "step": 169390 - }, - { - "epoch": 0.3, - "learning_rate": 3.522933763955399e-05, - "loss": 2.4991, - "step": 169400 - }, - { - "epoch": 0.3, - "learning_rate": 3.522846569962716e-05, - "loss": 2.4316, - "step": 169410 - }, - { - "epoch": 0.3, - "learning_rate": 3.5227593759700336e-05, - "loss": 2.4634, - "step": 169420 - }, - { - "epoch": 0.3, - "learning_rate": 3.5226721819773506e-05, - "loss": 2.3525, - "step": 169430 - }, - { - "epoch": 0.3, - "learning_rate": 3.5225849879846676e-05, - "loss": 2.4535, - "step": 169440 - }, - { - "epoch": 0.3, - "learning_rate": 3.5224977939919854e-05, - "loss": 2.4728, - "step": 169450 - }, - { - "epoch": 0.3, - "learning_rate": 3.5224105999993024e-05, - "loss": 2.4439, - "step": 169460 - }, - { - "epoch": 0.3, - "learning_rate": 3.52232340600662e-05, - "loss": 2.4124, - "step": 169470 - }, - { - "epoch": 0.3, - "learning_rate": 3.522236212013937e-05, - "loss": 2.5247, - "step": 169480 - }, - { - "epoch": 0.3, - "learning_rate": 3.522149018021255e-05, - "loss": 2.4999, - "step": 169490 - }, - { - "epoch": 0.3, - "learning_rate": 3.522061824028572e-05, - "loss": 2.4822, - "step": 169500 - }, - { - "epoch": 0.3, - "learning_rate": 3.521974630035889e-05, - "loss": 2.4564, - "step": 169510 - }, - { - "epoch": 0.3, - "learning_rate": 3.521887436043207e-05, - "loss": 2.548, - "step": 169520 - }, - { - "epoch": 0.3, - "learning_rate": 3.521800242050524e-05, - "loss": 2.4801, - "step": 169530 - }, - { - "epoch": 0.3, - "learning_rate": 3.5217130480578414e-05, - "loss": 2.4971, - "step": 169540 - }, - { - "epoch": 0.3, - "learning_rate": 3.5216258540651585e-05, - "loss": 2.428, - "step": 169550 - }, - { - "epoch": 0.3, - "learning_rate": 3.521538660072476e-05, - "loss": 2.4959, - "step": 169560 - }, - { - "epoch": 0.3, - "learning_rate": 3.521451466079793e-05, - "loss": 2.3543, - "step": 169570 - }, - { - "epoch": 0.3, - "learning_rate": 3.52136427208711e-05, - "loss": 2.4471, - "step": 169580 - }, - { - "epoch": 0.3, - "learning_rate": 3.521277078094428e-05, - "loss": 2.5954, - "step": 169590 - }, - { - "epoch": 0.3, - "learning_rate": 3.521189884101745e-05, - "loss": 2.4725, - "step": 169600 - }, - { - "epoch": 0.3, - "learning_rate": 3.521102690109063e-05, - "loss": 2.6089, - "step": 169610 - }, - { - "epoch": 0.3, - "learning_rate": 3.52101549611638e-05, - "loss": 2.514, - "step": 169620 - }, - { - "epoch": 0.3, - "learning_rate": 3.5209283021236975e-05, - "loss": 2.4704, - "step": 169630 - }, - { - "epoch": 0.3, - "learning_rate": 3.5208411081310145e-05, - "loss": 2.461, - "step": 169640 - }, - { - "epoch": 0.3, - "learning_rate": 3.5207539141383315e-05, - "loss": 2.4368, - "step": 169650 - }, - { - "epoch": 0.3, - "learning_rate": 3.5206667201456486e-05, - "loss": 2.4786, - "step": 169660 - }, - { - "epoch": 0.3, - "learning_rate": 3.520579526152966e-05, - "loss": 2.4035, - "step": 169670 - }, - { - "epoch": 0.3, - "learning_rate": 3.5204923321602833e-05, - "loss": 2.4433, - "step": 169680 - }, - { - "epoch": 0.3, - "learning_rate": 3.520405138167601e-05, - "loss": 2.4052, - "step": 169690 - }, - { - "epoch": 0.3, - "learning_rate": 3.520317944174919e-05, - "loss": 2.4469, - "step": 169700 - }, - { - "epoch": 0.3, - "learning_rate": 3.520230750182236e-05, - "loss": 2.584, - "step": 169710 - }, - { - "epoch": 0.3, - "learning_rate": 3.520143556189553e-05, - "loss": 2.4628, - "step": 169720 - }, - { - "epoch": 0.3, - "learning_rate": 3.52005636219687e-05, - "loss": 2.3857, - "step": 169730 - }, - { - "epoch": 0.3, - "learning_rate": 3.5199691682041876e-05, - "loss": 2.4345, - "step": 169740 - }, - { - "epoch": 0.3, - "learning_rate": 3.5198819742115046e-05, - "loss": 2.4244, - "step": 169750 - }, - { - "epoch": 0.3, - "learning_rate": 3.5197947802188224e-05, - "loss": 2.3823, - "step": 169760 - }, - { - "epoch": 0.3, - "learning_rate": 3.5197075862261394e-05, - "loss": 2.4318, - "step": 169770 - }, - { - "epoch": 0.3, - "learning_rate": 3.519620392233457e-05, - "loss": 2.562, - "step": 169780 - }, - { - "epoch": 0.3, - "learning_rate": 3.519533198240774e-05, - "loss": 2.5123, - "step": 169790 - }, - { - "epoch": 0.3, - "learning_rate": 3.519446004248091e-05, - "loss": 2.3934, - "step": 169800 - }, - { - "epoch": 0.3, - "learning_rate": 3.519358810255409e-05, - "loss": 2.4599, - "step": 169810 - }, - { - "epoch": 0.3, - "learning_rate": 3.519271616262726e-05, - "loss": 2.4926, - "step": 169820 - }, - { - "epoch": 0.3, - "learning_rate": 3.519184422270043e-05, - "loss": 2.4292, - "step": 169830 - }, - { - "epoch": 0.3, - "learning_rate": 3.519097228277361e-05, - "loss": 2.5683, - "step": 169840 - }, - { - "epoch": 0.3, - "learning_rate": 3.5190100342846784e-05, - "loss": 2.4025, - "step": 169850 - }, - { - "epoch": 0.3, - "learning_rate": 3.5189228402919954e-05, - "loss": 2.2624, - "step": 169860 - }, - { - "epoch": 0.3, - "learning_rate": 3.5188356462993125e-05, - "loss": 2.412, - "step": 169870 - }, - { - "epoch": 0.3, - "learning_rate": 3.51874845230663e-05, - "loss": 2.4542, - "step": 169880 - }, - { - "epoch": 0.3, - "learning_rate": 3.518661258313947e-05, - "loss": 2.506, - "step": 169890 - }, - { - "epoch": 0.3, - "learning_rate": 3.518574064321264e-05, - "loss": 2.4993, - "step": 169900 - }, - { - "epoch": 0.3, - "learning_rate": 3.518486870328582e-05, - "loss": 2.5845, - "step": 169910 - }, - { - "epoch": 0.3, - "learning_rate": 3.5183996763359e-05, - "loss": 2.4467, - "step": 169920 - }, - { - "epoch": 0.3, - "learning_rate": 3.518312482343217e-05, - "loss": 2.5103, - "step": 169930 - }, - { - "epoch": 0.3, - "learning_rate": 3.518225288350534e-05, - "loss": 2.4377, - "step": 169940 - }, - { - "epoch": 0.3, - "learning_rate": 3.5181380943578515e-05, - "loss": 2.4834, - "step": 169950 - }, - { - "epoch": 0.3, - "learning_rate": 3.5180509003651685e-05, - "loss": 2.4566, - "step": 169960 - }, - { - "epoch": 0.3, - "learning_rate": 3.5179637063724856e-05, - "loss": 2.5547, - "step": 169970 - }, - { - "epoch": 0.3, - "learning_rate": 3.517876512379803e-05, - "loss": 2.4644, - "step": 169980 - }, - { - "epoch": 0.3, - "learning_rate": 3.517789318387121e-05, - "loss": 2.4691, - "step": 169990 - }, - { - "epoch": 0.3, - "learning_rate": 3.517702124394438e-05, - "loss": 2.509, - "step": 170000 - }, - { - "epoch": 0.3, - "learning_rate": 3.517614930401755e-05, - "loss": 2.4427, - "step": 170010 - }, - { - "epoch": 0.3, - "learning_rate": 3.517527736409073e-05, - "loss": 2.3924, - "step": 170020 - }, - { - "epoch": 0.3, - "learning_rate": 3.51744054241639e-05, - "loss": 2.4402, - "step": 170030 - }, - { - "epoch": 0.3, - "learning_rate": 3.517353348423707e-05, - "loss": 2.2973, - "step": 170040 - }, - { - "epoch": 0.3, - "learning_rate": 3.517266154431024e-05, - "loss": 2.41, - "step": 170050 - }, - { - "epoch": 0.3, - "learning_rate": 3.517178960438342e-05, - "loss": 2.4829, - "step": 170060 - }, - { - "epoch": 0.3, - "learning_rate": 3.5170917664456593e-05, - "loss": 2.5026, - "step": 170070 - }, - { - "epoch": 0.3, - "learning_rate": 3.5170045724529764e-05, - "loss": 2.4643, - "step": 170080 - }, - { - "epoch": 0.3, - "learning_rate": 3.516917378460294e-05, - "loss": 2.4412, - "step": 170090 - }, - { - "epoch": 0.3, - "learning_rate": 3.516830184467611e-05, - "loss": 2.4897, - "step": 170100 - }, - { - "epoch": 0.3, - "learning_rate": 3.516742990474928e-05, - "loss": 2.4402, - "step": 170110 - }, - { - "epoch": 0.3, - "learning_rate": 3.516655796482245e-05, - "loss": 2.5482, - "step": 170120 - }, - { - "epoch": 0.3, - "learning_rate": 3.5165686024895636e-05, - "loss": 2.4534, - "step": 170130 - }, - { - "epoch": 0.3, - "learning_rate": 3.5164814084968806e-05, - "loss": 2.5417, - "step": 170140 - }, - { - "epoch": 0.3, - "learning_rate": 3.516394214504198e-05, - "loss": 2.4766, - "step": 170150 - }, - { - "epoch": 0.3, - "learning_rate": 3.516307020511515e-05, - "loss": 2.3702, - "step": 170160 - }, - { - "epoch": 0.3, - "learning_rate": 3.5162198265188324e-05, - "loss": 2.4652, - "step": 170170 - }, - { - "epoch": 0.3, - "learning_rate": 3.5161326325261495e-05, - "loss": 2.4069, - "step": 170180 - }, - { - "epoch": 0.3, - "learning_rate": 3.5160454385334665e-05, - "loss": 2.4813, - "step": 170190 - }, - { - "epoch": 0.3, - "learning_rate": 3.515958244540784e-05, - "loss": 2.506, - "step": 170200 - }, - { - "epoch": 0.3, - "learning_rate": 3.515871050548102e-05, - "loss": 2.4427, - "step": 170210 - }, - { - "epoch": 0.3, - "learning_rate": 3.515783856555419e-05, - "loss": 2.4545, - "step": 170220 - }, - { - "epoch": 0.3, - "learning_rate": 3.515696662562736e-05, - "loss": 2.4909, - "step": 170230 - }, - { - "epoch": 0.3, - "learning_rate": 3.515609468570054e-05, - "loss": 2.4418, - "step": 170240 - }, - { - "epoch": 0.3, - "learning_rate": 3.515522274577371e-05, - "loss": 2.4183, - "step": 170250 - }, - { - "epoch": 0.3, - "learning_rate": 3.515435080584688e-05, - "loss": 2.5243, - "step": 170260 - }, - { - "epoch": 0.3, - "learning_rate": 3.5153478865920055e-05, - "loss": 2.3377, - "step": 170270 - }, - { - "epoch": 0.3, - "learning_rate": 3.515260692599323e-05, - "loss": 2.4375, - "step": 170280 - }, - { - "epoch": 0.3, - "learning_rate": 3.51517349860664e-05, - "loss": 2.3941, - "step": 170290 - }, - { - "epoch": 0.3, - "learning_rate": 3.515086304613957e-05, - "loss": 2.4843, - "step": 170300 - }, - { - "epoch": 0.3, - "learning_rate": 3.514999110621275e-05, - "loss": 2.4441, - "step": 170310 - }, - { - "epoch": 0.3, - "learning_rate": 3.514911916628592e-05, - "loss": 2.5799, - "step": 170320 - }, - { - "epoch": 0.3, - "learning_rate": 3.514824722635909e-05, - "loss": 2.5459, - "step": 170330 - }, - { - "epoch": 0.3, - "learning_rate": 3.514737528643227e-05, - "loss": 2.5358, - "step": 170340 - }, - { - "epoch": 0.3, - "learning_rate": 3.514650334650544e-05, - "loss": 2.402, - "step": 170350 - }, - { - "epoch": 0.3, - "learning_rate": 3.5145631406578616e-05, - "loss": 2.5565, - "step": 170360 - }, - { - "epoch": 0.3, - "learning_rate": 3.5144759466651786e-05, - "loss": 2.4677, - "step": 170370 - }, - { - "epoch": 0.3, - "learning_rate": 3.5143887526724963e-05, - "loss": 2.3627, - "step": 170380 - }, - { - "epoch": 0.3, - "learning_rate": 3.5143015586798134e-05, - "loss": 2.3271, - "step": 170390 - }, - { - "epoch": 0.3, - "learning_rate": 3.5142143646871304e-05, - "loss": 2.4371, - "step": 170400 - }, - { - "epoch": 0.3, - "learning_rate": 3.514127170694448e-05, - "loss": 2.5496, - "step": 170410 - }, - { - "epoch": 0.3, - "learning_rate": 3.514039976701765e-05, - "loss": 2.4879, - "step": 170420 - }, - { - "epoch": 0.3, - "learning_rate": 3.513952782709083e-05, - "loss": 2.441, - "step": 170430 - }, - { - "epoch": 0.3, - "learning_rate": 3.5138655887164e-05, - "loss": 2.5028, - "step": 170440 - }, - { - "epoch": 0.3, - "learning_rate": 3.5137783947237176e-05, - "loss": 2.4815, - "step": 170450 - }, - { - "epoch": 0.3, - "learning_rate": 3.513691200731035e-05, - "loss": 2.4727, - "step": 170460 - }, - { - "epoch": 0.3, - "learning_rate": 3.513604006738352e-05, - "loss": 2.4404, - "step": 170470 - }, - { - "epoch": 0.3, - "learning_rate": 3.5135168127456694e-05, - "loss": 2.4508, - "step": 170480 - }, - { - "epoch": 0.3, - "learning_rate": 3.5134296187529865e-05, - "loss": 2.3534, - "step": 170490 - }, - { - "epoch": 0.3, - "learning_rate": 3.5133424247603035e-05, - "loss": 2.4178, - "step": 170500 - }, - { - "epoch": 0.3, - "learning_rate": 3.513255230767621e-05, - "loss": 2.3128, - "step": 170510 - }, - { - "epoch": 0.3, - "learning_rate": 3.513168036774939e-05, - "loss": 2.401, - "step": 170520 - }, - { - "epoch": 0.3, - "learning_rate": 3.513080842782256e-05, - "loss": 2.4872, - "step": 170530 - }, - { - "epoch": 0.3, - "learning_rate": 3.512993648789573e-05, - "loss": 2.4247, - "step": 170540 - }, - { - "epoch": 0.3, - "learning_rate": 3.512906454796891e-05, - "loss": 2.4046, - "step": 170550 - }, - { - "epoch": 0.3, - "learning_rate": 3.512819260804208e-05, - "loss": 2.3925, - "step": 170560 - }, - { - "epoch": 0.3, - "learning_rate": 3.512732066811525e-05, - "loss": 2.3637, - "step": 170570 - }, - { - "epoch": 0.3, - "learning_rate": 3.5126448728188425e-05, - "loss": 2.4699, - "step": 170580 - }, - { - "epoch": 0.3, - "learning_rate": 3.51255767882616e-05, - "loss": 2.5448, - "step": 170590 - }, - { - "epoch": 0.3, - "learning_rate": 3.512470484833477e-05, - "loss": 2.4501, - "step": 170600 - }, - { - "epoch": 0.3, - "learning_rate": 3.512383290840794e-05, - "loss": 2.4357, - "step": 170610 - }, - { - "epoch": 0.3, - "learning_rate": 3.5122960968481114e-05, - "loss": 2.4215, - "step": 170620 - }, - { - "epoch": 0.3, - "learning_rate": 3.512208902855429e-05, - "loss": 2.474, - "step": 170630 - }, - { - "epoch": 0.3, - "learning_rate": 3.512121708862746e-05, - "loss": 2.3257, - "step": 170640 - }, - { - "epoch": 0.3, - "learning_rate": 3.512034514870063e-05, - "loss": 2.4396, - "step": 170650 - }, - { - "epoch": 0.3, - "learning_rate": 3.5119473208773815e-05, - "loss": 2.5419, - "step": 170660 - }, - { - "epoch": 0.3, - "learning_rate": 3.5118601268846986e-05, - "loss": 2.4137, - "step": 170670 - }, - { - "epoch": 0.3, - "learning_rate": 3.5117729328920156e-05, - "loss": 2.4571, - "step": 170680 - }, - { - "epoch": 0.3, - "learning_rate": 3.5116857388993327e-05, - "loss": 2.3385, - "step": 170690 - }, - { - "epoch": 0.3, - "learning_rate": 3.5115985449066504e-05, - "loss": 2.5011, - "step": 170700 - }, - { - "epoch": 0.3, - "learning_rate": 3.5115113509139674e-05, - "loss": 2.5838, - "step": 170710 - }, - { - "epoch": 0.3, - "learning_rate": 3.5114241569212844e-05, - "loss": 2.4617, - "step": 170720 - }, - { - "epoch": 0.3, - "learning_rate": 3.511336962928602e-05, - "loss": 2.4591, - "step": 170730 - }, - { - "epoch": 0.3, - "learning_rate": 3.51124976893592e-05, - "loss": 2.4133, - "step": 170740 - }, - { - "epoch": 0.3, - "learning_rate": 3.511162574943237e-05, - "loss": 2.422, - "step": 170750 - }, - { - "epoch": 0.3, - "learning_rate": 3.511075380950554e-05, - "loss": 2.4892, - "step": 170760 - }, - { - "epoch": 0.3, - "learning_rate": 3.510988186957872e-05, - "loss": 2.4556, - "step": 170770 - }, - { - "epoch": 0.3, - "learning_rate": 3.510900992965189e-05, - "loss": 2.4703, - "step": 170780 - }, - { - "epoch": 0.3, - "learning_rate": 3.510813798972506e-05, - "loss": 2.4509, - "step": 170790 - }, - { - "epoch": 0.3, - "learning_rate": 3.5107266049798235e-05, - "loss": 2.4998, - "step": 170800 - }, - { - "epoch": 0.3, - "learning_rate": 3.510639410987141e-05, - "loss": 2.5058, - "step": 170810 - }, - { - "epoch": 0.3, - "learning_rate": 3.510552216994458e-05, - "loss": 2.34, - "step": 170820 - }, - { - "epoch": 0.3, - "learning_rate": 3.510465023001775e-05, - "loss": 2.3594, - "step": 170830 - }, - { - "epoch": 0.3, - "learning_rate": 3.510377829009093e-05, - "loss": 2.4802, - "step": 170840 - }, - { - "epoch": 0.3, - "learning_rate": 3.51029063501641e-05, - "loss": 2.4529, - "step": 170850 - }, - { - "epoch": 0.3, - "learning_rate": 3.510203441023727e-05, - "loss": 2.5129, - "step": 170860 - }, - { - "epoch": 0.3, - "learning_rate": 3.510116247031045e-05, - "loss": 2.4836, - "step": 170870 - }, - { - "epoch": 0.3, - "learning_rate": 3.5100290530383625e-05, - "loss": 2.3228, - "step": 170880 - }, - { - "epoch": 0.3, - "learning_rate": 3.5099418590456795e-05, - "loss": 2.5659, - "step": 170890 - }, - { - "epoch": 0.3, - "learning_rate": 3.5098546650529966e-05, - "loss": 2.3954, - "step": 170900 - }, - { - "epoch": 0.3, - "learning_rate": 3.509767471060314e-05, - "loss": 2.3909, - "step": 170910 - }, - { - "epoch": 0.3, - "learning_rate": 3.509680277067631e-05, - "loss": 2.4788, - "step": 170920 - }, - { - "epoch": 0.3, - "learning_rate": 3.5095930830749483e-05, - "loss": 2.5497, - "step": 170930 - }, - { - "epoch": 0.3, - "learning_rate": 3.509505889082266e-05, - "loss": 2.4048, - "step": 170940 - }, - { - "epoch": 0.3, - "learning_rate": 3.509418695089584e-05, - "loss": 2.4873, - "step": 170950 - }, - { - "epoch": 0.3, - "learning_rate": 3.509331501096901e-05, - "loss": 2.4359, - "step": 170960 - }, - { - "epoch": 0.3, - "learning_rate": 3.509244307104218e-05, - "loss": 2.5613, - "step": 170970 - }, - { - "epoch": 0.3, - "learning_rate": 3.5091571131115356e-05, - "loss": 2.3702, - "step": 170980 - }, - { - "epoch": 0.3, - "learning_rate": 3.5090699191188526e-05, - "loss": 2.5211, - "step": 170990 - }, - { - "epoch": 0.3, - "learning_rate": 3.5089827251261696e-05, - "loss": 2.4112, - "step": 171000 - }, - { - "epoch": 0.3, - "learning_rate": 3.508895531133487e-05, - "loss": 2.5257, - "step": 171010 - }, - { - "epoch": 0.3, - "learning_rate": 3.5088083371408044e-05, - "loss": 2.4561, - "step": 171020 - }, - { - "epoch": 0.3, - "learning_rate": 3.508721143148122e-05, - "loss": 2.5636, - "step": 171030 - }, - { - "epoch": 0.3, - "learning_rate": 3.508633949155439e-05, - "loss": 2.5467, - "step": 171040 - }, - { - "epoch": 0.3, - "learning_rate": 3.508546755162757e-05, - "loss": 2.4854, - "step": 171050 - }, - { - "epoch": 0.3, - "learning_rate": 3.508459561170074e-05, - "loss": 2.4307, - "step": 171060 - }, - { - "epoch": 0.3, - "learning_rate": 3.508372367177391e-05, - "loss": 2.4238, - "step": 171070 - }, - { - "epoch": 0.3, - "learning_rate": 3.508285173184708e-05, - "loss": 2.4302, - "step": 171080 - }, - { - "epoch": 0.3, - "learning_rate": 3.508197979192026e-05, - "loss": 2.4378, - "step": 171090 - }, - { - "epoch": 0.3, - "learning_rate": 3.5081107851993434e-05, - "loss": 2.3462, - "step": 171100 - }, - { - "epoch": 0.3, - "learning_rate": 3.5080235912066605e-05, - "loss": 2.4127, - "step": 171110 - }, - { - "epoch": 0.3, - "learning_rate": 3.5079363972139775e-05, - "loss": 2.3591, - "step": 171120 - }, - { - "epoch": 0.3, - "learning_rate": 3.507849203221295e-05, - "loss": 2.4109, - "step": 171130 - }, - { - "epoch": 0.3, - "learning_rate": 3.507762009228612e-05, - "loss": 2.4182, - "step": 171140 - }, - { - "epoch": 0.3, - "learning_rate": 3.507674815235929e-05, - "loss": 2.4908, - "step": 171150 - }, - { - "epoch": 0.3, - "learning_rate": 3.507587621243247e-05, - "loss": 2.4484, - "step": 171160 - }, - { - "epoch": 0.3, - "learning_rate": 3.507500427250564e-05, - "loss": 2.4686, - "step": 171170 - }, - { - "epoch": 0.3, - "learning_rate": 3.507413233257882e-05, - "loss": 2.3781, - "step": 171180 - }, - { - "epoch": 0.3, - "learning_rate": 3.507326039265199e-05, - "loss": 2.4609, - "step": 171190 - }, - { - "epoch": 0.3, - "learning_rate": 3.5072388452725165e-05, - "loss": 2.4689, - "step": 171200 - }, - { - "epoch": 0.3, - "learning_rate": 3.5071516512798335e-05, - "loss": 2.5941, - "step": 171210 - }, - { - "epoch": 0.3, - "learning_rate": 3.5070644572871506e-05, - "loss": 2.5562, - "step": 171220 - }, - { - "epoch": 0.3, - "learning_rate": 3.506977263294468e-05, - "loss": 2.5365, - "step": 171230 - }, - { - "epoch": 0.3, - "learning_rate": 3.5068900693017853e-05, - "loss": 2.4518, - "step": 171240 - }, - { - "epoch": 0.3, - "learning_rate": 3.506802875309103e-05, - "loss": 2.4065, - "step": 171250 - }, - { - "epoch": 0.3, - "learning_rate": 3.50671568131642e-05, - "loss": 2.4452, - "step": 171260 - }, - { - "epoch": 0.3, - "learning_rate": 3.506628487323738e-05, - "loss": 2.3516, - "step": 171270 - }, - { - "epoch": 0.3, - "learning_rate": 3.506541293331055e-05, - "loss": 2.5136, - "step": 171280 - }, - { - "epoch": 0.3, - "learning_rate": 3.506454099338372e-05, - "loss": 2.4296, - "step": 171290 - }, - { - "epoch": 0.3, - "learning_rate": 3.5063669053456896e-05, - "loss": 2.5232, - "step": 171300 - }, - { - "epoch": 0.3, - "learning_rate": 3.5062797113530066e-05, - "loss": 2.3535, - "step": 171310 - }, - { - "epoch": 0.3, - "learning_rate": 3.506192517360324e-05, - "loss": 2.3023, - "step": 171320 - }, - { - "epoch": 0.3, - "learning_rate": 3.5061053233676414e-05, - "loss": 2.5012, - "step": 171330 - }, - { - "epoch": 0.3, - "learning_rate": 3.506018129374959e-05, - "loss": 2.3717, - "step": 171340 - }, - { - "epoch": 0.3, - "learning_rate": 3.505930935382276e-05, - "loss": 2.3418, - "step": 171350 - }, - { - "epoch": 0.3, - "learning_rate": 3.505843741389593e-05, - "loss": 2.4048, - "step": 171360 - }, - { - "epoch": 0.3, - "learning_rate": 3.505756547396911e-05, - "loss": 2.495, - "step": 171370 - }, - { - "epoch": 0.3, - "learning_rate": 3.505669353404228e-05, - "loss": 2.4059, - "step": 171380 - }, - { - "epoch": 0.3, - "learning_rate": 3.505582159411545e-05, - "loss": 2.4908, - "step": 171390 - }, - { - "epoch": 0.3, - "learning_rate": 3.505494965418863e-05, - "loss": 2.4911, - "step": 171400 - }, - { - "epoch": 0.3, - "learning_rate": 3.5054077714261804e-05, - "loss": 2.4146, - "step": 171410 - }, - { - "epoch": 0.3, - "learning_rate": 3.5053205774334974e-05, - "loss": 2.4893, - "step": 171420 - }, - { - "epoch": 0.3, - "learning_rate": 3.5052333834408145e-05, - "loss": 2.5168, - "step": 171430 - }, - { - "epoch": 0.3, - "learning_rate": 3.505146189448132e-05, - "loss": 2.5788, - "step": 171440 - }, - { - "epoch": 0.3, - "learning_rate": 3.505058995455449e-05, - "loss": 2.4354, - "step": 171450 - }, - { - "epoch": 0.3, - "learning_rate": 3.504971801462766e-05, - "loss": 2.4416, - "step": 171460 - }, - { - "epoch": 0.3, - "learning_rate": 3.504884607470084e-05, - "loss": 2.3826, - "step": 171470 - }, - { - "epoch": 0.3, - "learning_rate": 3.504797413477402e-05, - "loss": 2.4962, - "step": 171480 - }, - { - "epoch": 0.3, - "learning_rate": 3.504710219484719e-05, - "loss": 2.4921, - "step": 171490 - }, - { - "epoch": 0.3, - "learning_rate": 3.504623025492036e-05, - "loss": 2.4196, - "step": 171500 - }, - { - "epoch": 0.3, - "learning_rate": 3.504535831499353e-05, - "loss": 2.4541, - "step": 171510 - }, - { - "epoch": 0.3, - "learning_rate": 3.5044486375066705e-05, - "loss": 2.4221, - "step": 171520 - }, - { - "epoch": 0.3, - "learning_rate": 3.5043614435139876e-05, - "loss": 2.4274, - "step": 171530 - }, - { - "epoch": 0.3, - "learning_rate": 3.5042742495213046e-05, - "loss": 2.4186, - "step": 171540 - }, - { - "epoch": 0.3, - "learning_rate": 3.504187055528623e-05, - "loss": 2.3856, - "step": 171550 - }, - { - "epoch": 0.3, - "learning_rate": 3.50409986153594e-05, - "loss": 2.4765, - "step": 171560 - }, - { - "epoch": 0.3, - "learning_rate": 3.504012667543257e-05, - "loss": 2.5352, - "step": 171570 - }, - { - "epoch": 0.3, - "learning_rate": 3.503925473550574e-05, - "loss": 2.4771, - "step": 171580 - }, - { - "epoch": 0.3, - "learning_rate": 3.503838279557892e-05, - "loss": 2.5548, - "step": 171590 - }, - { - "epoch": 0.3, - "learning_rate": 3.503751085565209e-05, - "loss": 2.3618, - "step": 171600 - }, - { - "epoch": 0.3, - "learning_rate": 3.503663891572526e-05, - "loss": 2.3714, - "step": 171610 - }, - { - "epoch": 0.3, - "learning_rate": 3.5035766975798436e-05, - "loss": 2.4445, - "step": 171620 - }, - { - "epoch": 0.3, - "learning_rate": 3.5034895035871613e-05, - "loss": 2.4638, - "step": 171630 - }, - { - "epoch": 0.3, - "learning_rate": 3.5034023095944784e-05, - "loss": 2.447, - "step": 171640 - }, - { - "epoch": 0.3, - "learning_rate": 3.5033151156017954e-05, - "loss": 2.4627, - "step": 171650 - }, - { - "epoch": 0.3, - "learning_rate": 3.503227921609113e-05, - "loss": 2.3996, - "step": 171660 - }, - { - "epoch": 0.3, - "learning_rate": 3.50314072761643e-05, - "loss": 2.3845, - "step": 171670 - }, - { - "epoch": 0.3, - "learning_rate": 3.503053533623747e-05, - "loss": 2.5237, - "step": 171680 - }, - { - "epoch": 0.3, - "learning_rate": 3.502966339631065e-05, - "loss": 2.441, - "step": 171690 - }, - { - "epoch": 0.3, - "learning_rate": 3.5028791456383826e-05, - "loss": 2.5339, - "step": 171700 - }, - { - "epoch": 0.3, - "learning_rate": 3.5027919516457e-05, - "loss": 2.3801, - "step": 171710 - }, - { - "epoch": 0.3, - "learning_rate": 3.502704757653017e-05, - "loss": 2.4769, - "step": 171720 - }, - { - "epoch": 0.3, - "learning_rate": 3.5026175636603344e-05, - "loss": 2.3532, - "step": 171730 - }, - { - "epoch": 0.3, - "learning_rate": 3.5025303696676515e-05, - "loss": 2.4735, - "step": 171740 - }, - { - "epoch": 0.3, - "learning_rate": 3.5024431756749685e-05, - "loss": 2.5605, - "step": 171750 - }, - { - "epoch": 0.3, - "learning_rate": 3.502355981682286e-05, - "loss": 2.4867, - "step": 171760 - }, - { - "epoch": 0.3, - "learning_rate": 3.502268787689604e-05, - "loss": 2.556, - "step": 171770 - }, - { - "epoch": 0.3, - "learning_rate": 3.502181593696921e-05, - "loss": 2.5071, - "step": 171780 - }, - { - "epoch": 0.3, - "learning_rate": 3.502094399704238e-05, - "loss": 2.4085, - "step": 171790 - }, - { - "epoch": 0.3, - "learning_rate": 3.502007205711556e-05, - "loss": 2.3597, - "step": 171800 - }, - { - "epoch": 0.3, - "learning_rate": 3.501920011718873e-05, - "loss": 2.4776, - "step": 171810 - }, - { - "epoch": 0.3, - "learning_rate": 3.50183281772619e-05, - "loss": 2.4976, - "step": 171820 - }, - { - "epoch": 0.3, - "learning_rate": 3.5017456237335075e-05, - "loss": 2.472, - "step": 171830 - }, - { - "epoch": 0.3, - "learning_rate": 3.5016584297408246e-05, - "loss": 2.5214, - "step": 171840 - }, - { - "epoch": 0.3, - "learning_rate": 3.501571235748142e-05, - "loss": 2.4435, - "step": 171850 - }, - { - "epoch": 0.3, - "learning_rate": 3.501484041755459e-05, - "loss": 2.4794, - "step": 171860 - }, - { - "epoch": 0.3, - "learning_rate": 3.501396847762777e-05, - "loss": 2.2727, - "step": 171870 - }, - { - "epoch": 0.3, - "learning_rate": 3.501309653770094e-05, - "loss": 2.4919, - "step": 171880 - }, - { - "epoch": 0.3, - "learning_rate": 3.501222459777411e-05, - "loss": 2.4122, - "step": 171890 - }, - { - "epoch": 0.3, - "learning_rate": 3.501135265784729e-05, - "loss": 2.4942, - "step": 171900 - }, - { - "epoch": 0.3, - "learning_rate": 3.501048071792046e-05, - "loss": 2.458, - "step": 171910 - }, - { - "epoch": 0.3, - "learning_rate": 3.5009608777993636e-05, - "loss": 2.4895, - "step": 171920 - }, - { - "epoch": 0.3, - "learning_rate": 3.5008736838066806e-05, - "loss": 2.4068, - "step": 171930 - }, - { - "epoch": 0.3, - "learning_rate": 3.5007864898139983e-05, - "loss": 2.4267, - "step": 171940 - }, - { - "epoch": 0.3, - "learning_rate": 3.5006992958213154e-05, - "loss": 2.5237, - "step": 171950 - }, - { - "epoch": 0.3, - "learning_rate": 3.5006121018286324e-05, - "loss": 2.5134, - "step": 171960 - }, - { - "epoch": 0.3, - "learning_rate": 3.5005249078359495e-05, - "loss": 2.6451, - "step": 171970 - }, - { - "epoch": 0.3, - "learning_rate": 3.500437713843267e-05, - "loss": 2.4712, - "step": 171980 - }, - { - "epoch": 0.3, - "learning_rate": 3.500350519850584e-05, - "loss": 2.4843, - "step": 171990 - }, - { - "epoch": 0.3, - "learning_rate": 3.500263325857902e-05, - "loss": 2.4127, - "step": 172000 - }, - { - "epoch": 0.3, - "learning_rate": 3.5001761318652196e-05, - "loss": 2.5146, - "step": 172010 - }, - { - "epoch": 0.3, - "learning_rate": 3.500088937872537e-05, - "loss": 2.3642, - "step": 172020 - }, - { - "epoch": 0.3, - "learning_rate": 3.500001743879854e-05, - "loss": 2.4779, - "step": 172030 - }, - { - "epoch": 0.3, - "learning_rate": 3.499914549887171e-05, - "loss": 2.4252, - "step": 172040 - }, - { - "epoch": 0.3, - "learning_rate": 3.4998273558944885e-05, - "loss": 2.5739, - "step": 172050 - }, - { - "epoch": 0.3, - "learning_rate": 3.4997401619018055e-05, - "loss": 2.4672, - "step": 172060 - }, - { - "epoch": 0.3, - "learning_rate": 3.499652967909123e-05, - "loss": 2.3631, - "step": 172070 - }, - { - "epoch": 0.3, - "learning_rate": 3.49956577391644e-05, - "loss": 2.4231, - "step": 172080 - }, - { - "epoch": 0.3, - "learning_rate": 3.499478579923758e-05, - "loss": 2.3321, - "step": 172090 - }, - { - "epoch": 0.3, - "learning_rate": 3.499391385931075e-05, - "loss": 2.4321, - "step": 172100 - }, - { - "epoch": 0.3, - "learning_rate": 3.499304191938392e-05, - "loss": 2.3201, - "step": 172110 - }, - { - "epoch": 0.3, - "learning_rate": 3.49921699794571e-05, - "loss": 2.4805, - "step": 172120 - }, - { - "epoch": 0.3, - "learning_rate": 3.499129803953027e-05, - "loss": 2.5232, - "step": 172130 - }, - { - "epoch": 0.3, - "learning_rate": 3.4990426099603445e-05, - "loss": 2.5427, - "step": 172140 - }, - { - "epoch": 0.3, - "learning_rate": 3.4989554159676616e-05, - "loss": 2.4634, - "step": 172150 - }, - { - "epoch": 0.3, - "learning_rate": 3.498868221974979e-05, - "loss": 2.4523, - "step": 172160 - }, - { - "epoch": 0.3, - "learning_rate": 3.498781027982296e-05, - "loss": 2.4458, - "step": 172170 - }, - { - "epoch": 0.3, - "learning_rate": 3.4986938339896134e-05, - "loss": 2.2425, - "step": 172180 - }, - { - "epoch": 0.3, - "learning_rate": 3.498606639996931e-05, - "loss": 2.4235, - "step": 172190 - }, - { - "epoch": 0.3, - "learning_rate": 3.498519446004248e-05, - "loss": 2.4964, - "step": 172200 - }, - { - "epoch": 0.3, - "learning_rate": 3.498432252011565e-05, - "loss": 2.4409, - "step": 172210 - }, - { - "epoch": 0.3, - "learning_rate": 3.498345058018883e-05, - "loss": 2.318, - "step": 172220 - }, - { - "epoch": 0.3, - "learning_rate": 3.4982578640262006e-05, - "loss": 2.4677, - "step": 172230 - }, - { - "epoch": 0.3, - "learning_rate": 3.4981706700335176e-05, - "loss": 2.4221, - "step": 172240 - }, - { - "epoch": 0.3, - "learning_rate": 3.4980834760408347e-05, - "loss": 2.484, - "step": 172250 - }, - { - "epoch": 0.3, - "learning_rate": 3.4979962820481524e-05, - "loss": 2.4463, - "step": 172260 - }, - { - "epoch": 0.3, - "learning_rate": 3.4979090880554694e-05, - "loss": 2.3864, - "step": 172270 - }, - { - "epoch": 0.3, - "learning_rate": 3.4978218940627864e-05, - "loss": 2.4007, - "step": 172280 - }, - { - "epoch": 0.3, - "learning_rate": 3.497734700070104e-05, - "loss": 2.5035, - "step": 172290 - }, - { - "epoch": 0.3, - "learning_rate": 3.497647506077422e-05, - "loss": 2.3414, - "step": 172300 - }, - { - "epoch": 0.3, - "learning_rate": 3.497560312084739e-05, - "loss": 2.4183, - "step": 172310 - }, - { - "epoch": 0.3, - "learning_rate": 3.497473118092056e-05, - "loss": 2.4935, - "step": 172320 - }, - { - "epoch": 0.3, - "learning_rate": 3.497385924099374e-05, - "loss": 2.4761, - "step": 172330 - }, - { - "epoch": 0.3, - "learning_rate": 3.497298730106691e-05, - "loss": 2.572, - "step": 172340 - }, - { - "epoch": 0.3, - "learning_rate": 3.497211536114008e-05, - "loss": 2.5572, - "step": 172350 - }, - { - "epoch": 0.3, - "learning_rate": 3.497124342121325e-05, - "loss": 2.4397, - "step": 172360 - }, - { - "epoch": 0.3, - "learning_rate": 3.497037148128643e-05, - "loss": 2.4417, - "step": 172370 - }, - { - "epoch": 0.3, - "learning_rate": 3.49694995413596e-05, - "loss": 2.5231, - "step": 172380 - }, - { - "epoch": 0.3, - "learning_rate": 3.496862760143277e-05, - "loss": 2.4672, - "step": 172390 - }, - { - "epoch": 0.3, - "learning_rate": 3.496775566150595e-05, - "loss": 2.5936, - "step": 172400 - }, - { - "epoch": 0.3, - "learning_rate": 3.496688372157912e-05, - "loss": 2.4218, - "step": 172410 - }, - { - "epoch": 0.3, - "learning_rate": 3.496601178165229e-05, - "loss": 2.4802, - "step": 172420 - }, - { - "epoch": 0.3, - "learning_rate": 3.496513984172546e-05, - "loss": 2.4744, - "step": 172430 - }, - { - "epoch": 0.3, - "learning_rate": 3.4964267901798645e-05, - "loss": 2.3543, - "step": 172440 - }, - { - "epoch": 0.3, - "learning_rate": 3.4963395961871815e-05, - "loss": 2.3905, - "step": 172450 - }, - { - "epoch": 0.3, - "learning_rate": 3.4962524021944986e-05, - "loss": 2.5011, - "step": 172460 - }, - { - "epoch": 0.3, - "learning_rate": 3.4961652082018156e-05, - "loss": 2.4851, - "step": 172470 - }, - { - "epoch": 0.3, - "learning_rate": 3.496078014209133e-05, - "loss": 2.443, - "step": 172480 - }, - { - "epoch": 0.3, - "learning_rate": 3.4959908202164503e-05, - "loss": 2.3522, - "step": 172490 - }, - { - "epoch": 0.3, - "learning_rate": 3.4959036262237674e-05, - "loss": 2.5204, - "step": 172500 - }, - { - "epoch": 0.3, - "learning_rate": 3.495816432231085e-05, - "loss": 2.5476, - "step": 172510 - }, - { - "epoch": 0.3, - "learning_rate": 3.495729238238403e-05, - "loss": 2.6021, - "step": 172520 - }, - { - "epoch": 0.3, - "learning_rate": 3.49564204424572e-05, - "loss": 2.6045, - "step": 172530 - }, - { - "epoch": 0.3, - "learning_rate": 3.495554850253037e-05, - "loss": 2.379, - "step": 172540 - }, - { - "epoch": 0.3, - "learning_rate": 3.4954676562603546e-05, - "loss": 2.4226, - "step": 172550 - }, - { - "epoch": 0.3, - "learning_rate": 3.4953804622676716e-05, - "loss": 2.5259, - "step": 172560 - }, - { - "epoch": 0.3, - "learning_rate": 3.495293268274989e-05, - "loss": 2.4543, - "step": 172570 - }, - { - "epoch": 0.3, - "learning_rate": 3.4952060742823064e-05, - "loss": 2.3957, - "step": 172580 - }, - { - "epoch": 0.3, - "learning_rate": 3.495118880289624e-05, - "loss": 2.4094, - "step": 172590 - }, - { - "epoch": 0.3, - "learning_rate": 3.495031686296941e-05, - "loss": 2.5011, - "step": 172600 - }, - { - "epoch": 0.3, - "learning_rate": 3.494944492304258e-05, - "loss": 2.4671, - "step": 172610 - }, - { - "epoch": 0.3, - "learning_rate": 3.494857298311576e-05, - "loss": 2.5067, - "step": 172620 - }, - { - "epoch": 0.3, - "learning_rate": 3.494770104318893e-05, - "loss": 2.471, - "step": 172630 - }, - { - "epoch": 0.3, - "learning_rate": 3.49468291032621e-05, - "loss": 2.4192, - "step": 172640 - }, - { - "epoch": 0.3, - "learning_rate": 3.494595716333528e-05, - "loss": 2.4633, - "step": 172650 - }, - { - "epoch": 0.3, - "learning_rate": 3.4945085223408454e-05, - "loss": 2.5677, - "step": 172660 - }, - { - "epoch": 0.3, - "learning_rate": 3.4944213283481625e-05, - "loss": 2.3439, - "step": 172670 - }, - { - "epoch": 0.3, - "learning_rate": 3.4943341343554795e-05, - "loss": 2.4964, - "step": 172680 - }, - { - "epoch": 0.3, - "learning_rate": 3.494246940362797e-05, - "loss": 2.515, - "step": 172690 - }, - { - "epoch": 0.3, - "learning_rate": 3.494159746370114e-05, - "loss": 2.5015, - "step": 172700 - }, - { - "epoch": 0.3, - "learning_rate": 3.494072552377431e-05, - "loss": 2.5017, - "step": 172710 - }, - { - "epoch": 0.3, - "learning_rate": 3.493985358384749e-05, - "loss": 2.512, - "step": 172720 - }, - { - "epoch": 0.3, - "learning_rate": 3.493898164392066e-05, - "loss": 2.3934, - "step": 172730 - }, - { - "epoch": 0.3, - "learning_rate": 3.493810970399384e-05, - "loss": 2.4473, - "step": 172740 - }, - { - "epoch": 0.3, - "learning_rate": 3.493723776406701e-05, - "loss": 2.4241, - "step": 172750 - }, - { - "epoch": 0.3, - "learning_rate": 3.4936365824140185e-05, - "loss": 2.4689, - "step": 172760 - }, - { - "epoch": 0.3, - "learning_rate": 3.4935493884213356e-05, - "loss": 2.411, - "step": 172770 - }, - { - "epoch": 0.3, - "learning_rate": 3.4934621944286526e-05, - "loss": 2.4489, - "step": 172780 - }, - { - "epoch": 0.3, - "learning_rate": 3.49337500043597e-05, - "loss": 2.4208, - "step": 172790 - }, - { - "epoch": 0.3, - "learning_rate": 3.4932878064432873e-05, - "loss": 2.4827, - "step": 172800 - }, - { - "epoch": 0.3, - "learning_rate": 3.493200612450605e-05, - "loss": 2.3382, - "step": 172810 - }, - { - "epoch": 0.3, - "learning_rate": 3.493113418457922e-05, - "loss": 2.4919, - "step": 172820 - }, - { - "epoch": 0.3, - "learning_rate": 3.49302622446524e-05, - "loss": 2.3415, - "step": 172830 - }, - { - "epoch": 0.3, - "learning_rate": 3.492939030472557e-05, - "loss": 2.3312, - "step": 172840 - }, - { - "epoch": 0.3, - "learning_rate": 3.492851836479874e-05, - "loss": 2.4628, - "step": 172850 - }, - { - "epoch": 0.3, - "learning_rate": 3.492764642487191e-05, - "loss": 2.3773, - "step": 172860 - }, - { - "epoch": 0.3, - "learning_rate": 3.4926774484945086e-05, - "loss": 2.4302, - "step": 172870 - }, - { - "epoch": 0.3, - "learning_rate": 3.492590254501826e-05, - "loss": 2.4348, - "step": 172880 - }, - { - "epoch": 0.3, - "learning_rate": 3.4925030605091434e-05, - "loss": 2.504, - "step": 172890 - }, - { - "epoch": 0.3, - "learning_rate": 3.492415866516461e-05, - "loss": 2.4739, - "step": 172900 - }, - { - "epoch": 0.3, - "learning_rate": 3.492328672523778e-05, - "loss": 2.4738, - "step": 172910 - }, - { - "epoch": 0.3, - "learning_rate": 3.492241478531095e-05, - "loss": 2.4861, - "step": 172920 - }, - { - "epoch": 0.3, - "learning_rate": 3.492154284538412e-05, - "loss": 2.465, - "step": 172930 - }, - { - "epoch": 0.3, - "learning_rate": 3.49206709054573e-05, - "loss": 2.5145, - "step": 172940 - }, - { - "epoch": 0.3, - "learning_rate": 3.491979896553047e-05, - "loss": 2.4295, - "step": 172950 - }, - { - "epoch": 0.3, - "learning_rate": 3.491892702560365e-05, - "loss": 2.4914, - "step": 172960 - }, - { - "epoch": 0.3, - "learning_rate": 3.491805508567682e-05, - "loss": 2.444, - "step": 172970 - }, - { - "epoch": 0.3, - "learning_rate": 3.4917183145749995e-05, - "loss": 2.5587, - "step": 172980 - }, - { - "epoch": 0.3, - "learning_rate": 3.4916311205823165e-05, - "loss": 2.5549, - "step": 172990 - }, - { - "epoch": 0.3, - "learning_rate": 3.4915439265896335e-05, - "loss": 2.4583, - "step": 173000 - }, - { - "epoch": 0.3, - "learning_rate": 3.491456732596951e-05, - "loss": 2.3826, - "step": 173010 - }, - { - "epoch": 0.3, - "learning_rate": 3.491369538604268e-05, - "loss": 2.4852, - "step": 173020 - }, - { - "epoch": 0.3, - "learning_rate": 3.491282344611585e-05, - "loss": 2.4781, - "step": 173030 - }, - { - "epoch": 0.3, - "learning_rate": 3.491195150618903e-05, - "loss": 2.472, - "step": 173040 - }, - { - "epoch": 0.3, - "learning_rate": 3.491107956626221e-05, - "loss": 2.484, - "step": 173050 - }, - { - "epoch": 0.3, - "learning_rate": 3.491020762633538e-05, - "loss": 2.2318, - "step": 173060 - }, - { - "epoch": 0.3, - "learning_rate": 3.490933568640855e-05, - "loss": 2.4088, - "step": 173070 - }, - { - "epoch": 0.3, - "learning_rate": 3.4908463746481725e-05, - "loss": 2.5226, - "step": 173080 - }, - { - "epoch": 0.3, - "learning_rate": 3.4907591806554896e-05, - "loss": 2.3705, - "step": 173090 - }, - { - "epoch": 0.3, - "learning_rate": 3.4906719866628066e-05, - "loss": 2.5224, - "step": 173100 - }, - { - "epoch": 0.3, - "learning_rate": 3.490584792670124e-05, - "loss": 2.392, - "step": 173110 - }, - { - "epoch": 0.3, - "learning_rate": 3.490497598677442e-05, - "loss": 2.3669, - "step": 173120 - }, - { - "epoch": 0.3, - "learning_rate": 3.490410404684759e-05, - "loss": 2.4271, - "step": 173130 - }, - { - "epoch": 0.3, - "learning_rate": 3.490323210692076e-05, - "loss": 2.5656, - "step": 173140 - }, - { - "epoch": 0.3, - "learning_rate": 3.490236016699394e-05, - "loss": 2.3506, - "step": 173150 - }, - { - "epoch": 0.3, - "learning_rate": 3.490148822706711e-05, - "loss": 2.5092, - "step": 173160 - }, - { - "epoch": 0.3, - "learning_rate": 3.490061628714028e-05, - "loss": 2.4334, - "step": 173170 - }, - { - "epoch": 0.3, - "learning_rate": 3.4899744347213456e-05, - "loss": 2.5404, - "step": 173180 - }, - { - "epoch": 0.3, - "learning_rate": 3.4898872407286634e-05, - "loss": 2.4191, - "step": 173190 - }, - { - "epoch": 0.3, - "learning_rate": 3.4898000467359804e-05, - "loss": 2.417, - "step": 173200 - }, - { - "epoch": 0.3, - "learning_rate": 3.4897128527432974e-05, - "loss": 2.4899, - "step": 173210 - }, - { - "epoch": 0.3, - "learning_rate": 3.489625658750615e-05, - "loss": 2.4811, - "step": 173220 - }, - { - "epoch": 0.3, - "learning_rate": 3.489538464757932e-05, - "loss": 2.3615, - "step": 173230 - }, - { - "epoch": 0.3, - "learning_rate": 3.489451270765249e-05, - "loss": 2.5496, - "step": 173240 - }, - { - "epoch": 0.3, - "learning_rate": 3.489364076772567e-05, - "loss": 2.4099, - "step": 173250 - }, - { - "epoch": 0.3, - "learning_rate": 3.4892768827798847e-05, - "loss": 2.5481, - "step": 173260 - }, - { - "epoch": 0.3, - "learning_rate": 3.489189688787202e-05, - "loss": 2.4822, - "step": 173270 - }, - { - "epoch": 0.3, - "learning_rate": 3.489102494794519e-05, - "loss": 2.4966, - "step": 173280 - }, - { - "epoch": 0.3, - "learning_rate": 3.4890153008018364e-05, - "loss": 2.5644, - "step": 173290 - }, - { - "epoch": 0.3, - "learning_rate": 3.4889281068091535e-05, - "loss": 2.4028, - "step": 173300 - }, - { - "epoch": 0.3, - "learning_rate": 3.4888409128164705e-05, - "loss": 2.4477, - "step": 173310 - }, - { - "epoch": 0.3, - "learning_rate": 3.4887537188237876e-05, - "loss": 2.5061, - "step": 173320 - }, - { - "epoch": 0.3, - "learning_rate": 3.488666524831106e-05, - "loss": 2.3554, - "step": 173330 - }, - { - "epoch": 0.3, - "learning_rate": 3.488579330838423e-05, - "loss": 2.5149, - "step": 173340 - }, - { - "epoch": 0.3, - "learning_rate": 3.48849213684574e-05, - "loss": 2.4374, - "step": 173350 - }, - { - "epoch": 0.3, - "learning_rate": 3.488404942853058e-05, - "loss": 2.2803, - "step": 173360 - }, - { - "epoch": 0.3, - "learning_rate": 3.488317748860375e-05, - "loss": 2.4691, - "step": 173370 - }, - { - "epoch": 0.3, - "learning_rate": 3.488230554867692e-05, - "loss": 2.2296, - "step": 173380 - }, - { - "epoch": 0.3, - "learning_rate": 3.488143360875009e-05, - "loss": 2.4108, - "step": 173390 - }, - { - "epoch": 0.3, - "learning_rate": 3.4880561668823266e-05, - "loss": 2.4885, - "step": 173400 - }, - { - "epoch": 0.3, - "learning_rate": 3.487968972889644e-05, - "loss": 2.5633, - "step": 173410 - }, - { - "epoch": 0.3, - "learning_rate": 3.487881778896961e-05, - "loss": 2.5516, - "step": 173420 - }, - { - "epoch": 0.3, - "learning_rate": 3.4877945849042784e-05, - "loss": 2.4711, - "step": 173430 - }, - { - "epoch": 0.3, - "learning_rate": 3.487707390911596e-05, - "loss": 2.4092, - "step": 173440 - }, - { - "epoch": 0.3, - "learning_rate": 3.487620196918913e-05, - "loss": 2.5631, - "step": 173450 - }, - { - "epoch": 0.3, - "learning_rate": 3.48753300292623e-05, - "loss": 2.4351, - "step": 173460 - }, - { - "epoch": 0.3, - "learning_rate": 3.487445808933548e-05, - "loss": 2.355, - "step": 173470 - }, - { - "epoch": 0.3, - "learning_rate": 3.4873586149408656e-05, - "loss": 2.5041, - "step": 173480 - }, - { - "epoch": 0.3, - "learning_rate": 3.4872714209481826e-05, - "loss": 2.4566, - "step": 173490 - }, - { - "epoch": 0.3, - "learning_rate": 3.4871842269555e-05, - "loss": 2.4446, - "step": 173500 - }, - { - "epoch": 0.3, - "learning_rate": 3.4870970329628174e-05, - "loss": 2.3408, - "step": 173510 - }, - { - "epoch": 0.3, - "learning_rate": 3.4870098389701344e-05, - "loss": 2.4805, - "step": 173520 - }, - { - "epoch": 0.3, - "learning_rate": 3.4869226449774515e-05, - "loss": 2.4147, - "step": 173530 - }, - { - "epoch": 0.3, - "learning_rate": 3.486835450984769e-05, - "loss": 2.4256, - "step": 173540 - }, - { - "epoch": 0.3, - "learning_rate": 3.486748256992086e-05, - "loss": 2.5505, - "step": 173550 - }, - { - "epoch": 0.3, - "learning_rate": 3.486661062999404e-05, - "loss": 2.3998, - "step": 173560 - }, - { - "epoch": 0.3, - "learning_rate": 3.486573869006721e-05, - "loss": 2.3542, - "step": 173570 - }, - { - "epoch": 0.3, - "learning_rate": 3.486486675014039e-05, - "loss": 2.4336, - "step": 173580 - }, - { - "epoch": 0.3, - "learning_rate": 3.486399481021356e-05, - "loss": 2.5114, - "step": 173590 - }, - { - "epoch": 0.3, - "learning_rate": 3.486312287028673e-05, - "loss": 2.3971, - "step": 173600 - }, - { - "epoch": 0.3, - "learning_rate": 3.4862250930359905e-05, - "loss": 2.4421, - "step": 173610 - }, - { - "epoch": 0.3, - "learning_rate": 3.4861378990433075e-05, - "loss": 2.4251, - "step": 173620 - }, - { - "epoch": 0.3, - "learning_rate": 3.486050705050625e-05, - "loss": 2.3288, - "step": 173630 - }, - { - "epoch": 0.3, - "learning_rate": 3.485963511057942e-05, - "loss": 2.3257, - "step": 173640 - }, - { - "epoch": 0.3, - "learning_rate": 3.48587631706526e-05, - "loss": 2.613, - "step": 173650 - }, - { - "epoch": 0.3, - "learning_rate": 3.485789123072577e-05, - "loss": 2.586, - "step": 173660 - }, - { - "epoch": 0.3, - "learning_rate": 3.485701929079894e-05, - "loss": 2.4779, - "step": 173670 - }, - { - "epoch": 0.3, - "learning_rate": 3.485614735087212e-05, - "loss": 2.4202, - "step": 173680 - }, - { - "epoch": 0.3, - "learning_rate": 3.485527541094529e-05, - "loss": 2.4837, - "step": 173690 - }, - { - "epoch": 0.3, - "learning_rate": 3.485440347101846e-05, - "loss": 2.3195, - "step": 173700 - }, - { - "epoch": 0.3, - "learning_rate": 3.4853531531091636e-05, - "loss": 2.4638, - "step": 173710 - }, - { - "epoch": 0.3, - "learning_rate": 3.485265959116481e-05, - "loss": 2.4716, - "step": 173720 - }, - { - "epoch": 0.3, - "learning_rate": 3.485178765123798e-05, - "loss": 2.3992, - "step": 173730 - }, - { - "epoch": 0.3, - "learning_rate": 3.4850915711311154e-05, - "loss": 2.5135, - "step": 173740 - }, - { - "epoch": 0.3, - "learning_rate": 3.485004377138433e-05, - "loss": 2.4338, - "step": 173750 - }, - { - "epoch": 0.3, - "learning_rate": 3.48491718314575e-05, - "loss": 2.3258, - "step": 173760 - }, - { - "epoch": 0.3, - "learning_rate": 3.484829989153067e-05, - "loss": 2.3267, - "step": 173770 - }, - { - "epoch": 0.3, - "learning_rate": 3.484742795160385e-05, - "loss": 2.569, - "step": 173780 - }, - { - "epoch": 0.3, - "learning_rate": 3.4846556011677026e-05, - "loss": 2.4554, - "step": 173790 - }, - { - "epoch": 0.3, - "learning_rate": 3.4845684071750196e-05, - "loss": 2.5476, - "step": 173800 - }, - { - "epoch": 0.3, - "learning_rate": 3.4844812131823367e-05, - "loss": 2.5154, - "step": 173810 - }, - { - "epoch": 0.3, - "learning_rate": 3.484394019189654e-05, - "loss": 2.353, - "step": 173820 - }, - { - "epoch": 0.3, - "learning_rate": 3.4843068251969714e-05, - "loss": 2.4405, - "step": 173830 - }, - { - "epoch": 0.3, - "learning_rate": 3.4842196312042885e-05, - "loss": 2.405, - "step": 173840 - }, - { - "epoch": 0.3, - "learning_rate": 3.4841324372116055e-05, - "loss": 2.4776, - "step": 173850 - }, - { - "epoch": 0.3, - "learning_rate": 3.484045243218924e-05, - "loss": 2.3168, - "step": 173860 - }, - { - "epoch": 0.3, - "learning_rate": 3.483958049226241e-05, - "loss": 2.4475, - "step": 173870 - }, - { - "epoch": 0.3, - "learning_rate": 3.483870855233558e-05, - "loss": 2.4341, - "step": 173880 - }, - { - "epoch": 0.3, - "learning_rate": 3.483783661240875e-05, - "loss": 2.4252, - "step": 173890 - }, - { - "epoch": 0.3, - "learning_rate": 3.483696467248193e-05, - "loss": 2.4537, - "step": 173900 - }, - { - "epoch": 0.3, - "learning_rate": 3.48360927325551e-05, - "loss": 2.4927, - "step": 173910 - }, - { - "epoch": 0.3, - "learning_rate": 3.483522079262827e-05, - "loss": 2.5147, - "step": 173920 - }, - { - "epoch": 0.3, - "learning_rate": 3.4834348852701445e-05, - "loss": 2.4302, - "step": 173930 - }, - { - "epoch": 0.3, - "learning_rate": 3.483347691277462e-05, - "loss": 2.4615, - "step": 173940 - }, - { - "epoch": 0.3, - "learning_rate": 3.483260497284779e-05, - "loss": 2.5192, - "step": 173950 - }, - { - "epoch": 0.3, - "learning_rate": 3.483173303292096e-05, - "loss": 2.4314, - "step": 173960 - }, - { - "epoch": 0.3, - "learning_rate": 3.483086109299414e-05, - "loss": 2.4989, - "step": 173970 - }, - { - "epoch": 0.3, - "learning_rate": 3.482998915306731e-05, - "loss": 2.5497, - "step": 173980 - }, - { - "epoch": 0.3, - "learning_rate": 3.482911721314048e-05, - "loss": 2.5144, - "step": 173990 - }, - { - "epoch": 0.3, - "learning_rate": 3.482824527321366e-05, - "loss": 2.4828, - "step": 174000 - }, - { - "epoch": 0.3, - "learning_rate": 3.4827373333286835e-05, - "loss": 2.5554, - "step": 174010 - }, - { - "epoch": 0.3, - "learning_rate": 3.4826501393360006e-05, - "loss": 2.374, - "step": 174020 - }, - { - "epoch": 0.3, - "learning_rate": 3.4825629453433176e-05, - "loss": 2.4285, - "step": 174030 - }, - { - "epoch": 0.3, - "learning_rate": 3.482475751350635e-05, - "loss": 2.363, - "step": 174040 - }, - { - "epoch": 0.3, - "learning_rate": 3.4823885573579524e-05, - "loss": 2.5932, - "step": 174050 - }, - { - "epoch": 0.3, - "learning_rate": 3.4823013633652694e-05, - "loss": 2.4809, - "step": 174060 - }, - { - "epoch": 0.3, - "learning_rate": 3.482214169372587e-05, - "loss": 2.4399, - "step": 174070 - }, - { - "epoch": 0.3, - "learning_rate": 3.482126975379905e-05, - "loss": 2.4875, - "step": 174080 - }, - { - "epoch": 0.3, - "learning_rate": 3.482039781387222e-05, - "loss": 2.4083, - "step": 174090 - }, - { - "epoch": 0.3, - "learning_rate": 3.481952587394539e-05, - "loss": 2.4835, - "step": 174100 - }, - { - "epoch": 0.3, - "learning_rate": 3.4818653934018566e-05, - "loss": 2.4701, - "step": 174110 - }, - { - "epoch": 0.3, - "learning_rate": 3.4817781994091737e-05, - "loss": 2.4823, - "step": 174120 - }, - { - "epoch": 0.3, - "learning_rate": 3.481691005416491e-05, - "loss": 2.479, - "step": 174130 - }, - { - "epoch": 0.3, - "learning_rate": 3.4816038114238084e-05, - "loss": 2.3501, - "step": 174140 - }, - { - "epoch": 0.3, - "learning_rate": 3.481516617431126e-05, - "loss": 2.4484, - "step": 174150 - }, - { - "epoch": 0.3, - "learning_rate": 3.481429423438443e-05, - "loss": 2.4404, - "step": 174160 - }, - { - "epoch": 0.3, - "learning_rate": 3.48134222944576e-05, - "loss": 2.4419, - "step": 174170 - }, - { - "epoch": 0.3, - "learning_rate": 3.481255035453078e-05, - "loss": 2.5225, - "step": 174180 - }, - { - "epoch": 0.3, - "learning_rate": 3.481167841460395e-05, - "loss": 2.3593, - "step": 174190 - }, - { - "epoch": 0.3, - "learning_rate": 3.481080647467712e-05, - "loss": 2.4979, - "step": 174200 - }, - { - "epoch": 0.3, - "learning_rate": 3.480993453475029e-05, - "loss": 2.4331, - "step": 174210 - }, - { - "epoch": 0.3, - "learning_rate": 3.480906259482347e-05, - "loss": 2.5201, - "step": 174220 - }, - { - "epoch": 0.3, - "learning_rate": 3.4808190654896645e-05, - "loss": 2.3525, - "step": 174230 - }, - { - "epoch": 0.3, - "learning_rate": 3.4807318714969815e-05, - "loss": 2.3253, - "step": 174240 - }, - { - "epoch": 0.3, - "learning_rate": 3.480644677504299e-05, - "loss": 2.4275, - "step": 174250 - }, - { - "epoch": 0.3, - "learning_rate": 3.480557483511616e-05, - "loss": 2.4007, - "step": 174260 - }, - { - "epoch": 0.3, - "learning_rate": 3.480470289518933e-05, - "loss": 2.3693, - "step": 174270 - }, - { - "epoch": 0.3, - "learning_rate": 3.48038309552625e-05, - "loss": 2.524, - "step": 174280 - }, - { - "epoch": 0.3, - "learning_rate": 3.480295901533568e-05, - "loss": 2.5016, - "step": 174290 - }, - { - "epoch": 0.3, - "learning_rate": 3.480208707540886e-05, - "loss": 2.5021, - "step": 174300 - }, - { - "epoch": 0.3, - "learning_rate": 3.480121513548203e-05, - "loss": 2.4369, - "step": 174310 - }, - { - "epoch": 0.3, - "learning_rate": 3.48003431955552e-05, - "loss": 2.525, - "step": 174320 - }, - { - "epoch": 0.3, - "learning_rate": 3.4799471255628376e-05, - "loss": 2.3806, - "step": 174330 - }, - { - "epoch": 0.3, - "learning_rate": 3.4798599315701546e-05, - "loss": 2.5232, - "step": 174340 - }, - { - "epoch": 0.3, - "learning_rate": 3.4797727375774716e-05, - "loss": 2.4216, - "step": 174350 - }, - { - "epoch": 0.3, - "learning_rate": 3.4796855435847893e-05, - "loss": 2.5351, - "step": 174360 - }, - { - "epoch": 0.3, - "learning_rate": 3.4795983495921064e-05, - "loss": 2.4246, - "step": 174370 - }, - { - "epoch": 0.3, - "learning_rate": 3.479511155599424e-05, - "loss": 2.4667, - "step": 174380 - }, - { - "epoch": 0.3, - "learning_rate": 3.479423961606741e-05, - "loss": 2.4235, - "step": 174390 - }, - { - "epoch": 0.3, - "learning_rate": 3.479336767614059e-05, - "loss": 2.4986, - "step": 174400 - }, - { - "epoch": 0.3, - "learning_rate": 3.479249573621376e-05, - "loss": 2.5107, - "step": 174410 - }, - { - "epoch": 0.3, - "learning_rate": 3.479162379628693e-05, - "loss": 2.5386, - "step": 174420 - }, - { - "epoch": 0.3, - "learning_rate": 3.4790751856360106e-05, - "loss": 2.5733, - "step": 174430 - }, - { - "epoch": 0.3, - "learning_rate": 3.478987991643328e-05, - "loss": 2.4199, - "step": 174440 - }, - { - "epoch": 0.3, - "learning_rate": 3.4789007976506454e-05, - "loss": 2.3961, - "step": 174450 - }, - { - "epoch": 0.3, - "learning_rate": 3.4788136036579624e-05, - "loss": 2.4946, - "step": 174460 - }, - { - "epoch": 0.3, - "learning_rate": 3.47872640966528e-05, - "loss": 2.4838, - "step": 174470 - }, - { - "epoch": 0.3, - "learning_rate": 3.478639215672597e-05, - "loss": 2.4738, - "step": 174480 - }, - { - "epoch": 0.3, - "learning_rate": 3.478552021679914e-05, - "loss": 2.4961, - "step": 174490 - }, - { - "epoch": 0.3, - "learning_rate": 3.478464827687232e-05, - "loss": 2.469, - "step": 174500 - }, - { - "epoch": 0.3, - "learning_rate": 3.478377633694549e-05, - "loss": 2.4876, - "step": 174510 - }, - { - "epoch": 0.3, - "learning_rate": 3.478290439701867e-05, - "loss": 2.5279, - "step": 174520 - }, - { - "epoch": 0.3, - "learning_rate": 3.478203245709184e-05, - "loss": 2.4916, - "step": 174530 - }, - { - "epoch": 0.3, - "learning_rate": 3.4781160517165015e-05, - "loss": 2.4571, - "step": 174540 - }, - { - "epoch": 0.3, - "learning_rate": 3.4780288577238185e-05, - "loss": 2.4274, - "step": 174550 - }, - { - "epoch": 0.3, - "learning_rate": 3.4779416637311355e-05, - "loss": 2.4681, - "step": 174560 - }, - { - "epoch": 0.3, - "learning_rate": 3.477854469738453e-05, - "loss": 2.4727, - "step": 174570 - }, - { - "epoch": 0.3, - "learning_rate": 3.47776727574577e-05, - "loss": 2.3817, - "step": 174580 - }, - { - "epoch": 0.3, - "learning_rate": 3.477680081753087e-05, - "loss": 2.5025, - "step": 174590 - }, - { - "epoch": 0.3, - "learning_rate": 3.477592887760405e-05, - "loss": 2.4287, - "step": 174600 - }, - { - "epoch": 0.3, - "learning_rate": 3.477505693767723e-05, - "loss": 2.4456, - "step": 174610 - }, - { - "epoch": 0.3, - "learning_rate": 3.47741849977504e-05, - "loss": 2.5446, - "step": 174620 - }, - { - "epoch": 0.3, - "learning_rate": 3.477331305782357e-05, - "loss": 2.5698, - "step": 174630 - }, - { - "epoch": 0.3, - "learning_rate": 3.4772441117896745e-05, - "loss": 2.5314, - "step": 174640 - }, - { - "epoch": 0.3, - "learning_rate": 3.4771569177969916e-05, - "loss": 2.4314, - "step": 174650 - }, - { - "epoch": 0.3, - "learning_rate": 3.4770697238043086e-05, - "loss": 2.5183, - "step": 174660 - }, - { - "epoch": 0.3, - "learning_rate": 3.476982529811626e-05, - "loss": 2.5006, - "step": 174670 - }, - { - "epoch": 0.3, - "learning_rate": 3.476895335818944e-05, - "loss": 2.3844, - "step": 174680 - }, - { - "epoch": 0.3, - "learning_rate": 3.476808141826261e-05, - "loss": 2.5086, - "step": 174690 - }, - { - "epoch": 0.3, - "learning_rate": 3.476720947833578e-05, - "loss": 2.4865, - "step": 174700 - }, - { - "epoch": 0.3, - "learning_rate": 3.476633753840896e-05, - "loss": 2.3941, - "step": 174710 - }, - { - "epoch": 0.3, - "learning_rate": 3.476546559848213e-05, - "loss": 2.4696, - "step": 174720 - }, - { - "epoch": 0.3, - "learning_rate": 3.47645936585553e-05, - "loss": 2.4036, - "step": 174730 - }, - { - "epoch": 0.3, - "learning_rate": 3.476372171862847e-05, - "loss": 2.3725, - "step": 174740 - }, - { - "epoch": 0.3, - "learning_rate": 3.4762849778701654e-05, - "loss": 2.4611, - "step": 174750 - }, - { - "epoch": 0.3, - "learning_rate": 3.4761977838774824e-05, - "loss": 2.3847, - "step": 174760 - }, - { - "epoch": 0.3, - "learning_rate": 3.4761105898847994e-05, - "loss": 2.559, - "step": 174770 - }, - { - "epoch": 0.3, - "learning_rate": 3.4760233958921165e-05, - "loss": 2.4422, - "step": 174780 - }, - { - "epoch": 0.3, - "learning_rate": 3.475936201899434e-05, - "loss": 2.5638, - "step": 174790 - }, - { - "epoch": 0.3, - "learning_rate": 3.475849007906751e-05, - "loss": 2.5028, - "step": 174800 - }, - { - "epoch": 0.3, - "learning_rate": 3.475761813914068e-05, - "loss": 2.532, - "step": 174810 - }, - { - "epoch": 0.3, - "learning_rate": 3.4756746199213867e-05, - "loss": 2.2778, - "step": 174820 - }, - { - "epoch": 0.3, - "learning_rate": 3.475587425928704e-05, - "loss": 2.4432, - "step": 174830 - }, - { - "epoch": 0.3, - "learning_rate": 3.475500231936021e-05, - "loss": 2.5242, - "step": 174840 - }, - { - "epoch": 0.3, - "learning_rate": 3.475413037943338e-05, - "loss": 2.3776, - "step": 174850 - }, - { - "epoch": 0.3, - "learning_rate": 3.4753258439506555e-05, - "loss": 2.5092, - "step": 174860 - }, - { - "epoch": 0.3, - "learning_rate": 3.4752386499579725e-05, - "loss": 2.3722, - "step": 174870 - }, - { - "epoch": 0.3, - "learning_rate": 3.4751514559652896e-05, - "loss": 2.491, - "step": 174880 - }, - { - "epoch": 0.3, - "learning_rate": 3.475064261972607e-05, - "loss": 2.5153, - "step": 174890 - }, - { - "epoch": 0.31, - "learning_rate": 3.474977067979925e-05, - "loss": 2.5439, - "step": 174900 - }, - { - "epoch": 0.31, - "learning_rate": 3.474889873987242e-05, - "loss": 2.4165, - "step": 174910 - }, - { - "epoch": 0.31, - "learning_rate": 3.474802679994559e-05, - "loss": 2.4636, - "step": 174920 - }, - { - "epoch": 0.31, - "learning_rate": 3.474715486001877e-05, - "loss": 2.4366, - "step": 174930 - }, - { - "epoch": 0.31, - "learning_rate": 3.474628292009194e-05, - "loss": 2.3586, - "step": 174940 - }, - { - "epoch": 0.31, - "learning_rate": 3.474541098016511e-05, - "loss": 2.4234, - "step": 174950 - }, - { - "epoch": 0.31, - "learning_rate": 3.4744539040238286e-05, - "loss": 2.4701, - "step": 174960 - }, - { - "epoch": 0.31, - "learning_rate": 3.474366710031146e-05, - "loss": 2.458, - "step": 174970 - }, - { - "epoch": 0.31, - "learning_rate": 3.474279516038463e-05, - "loss": 2.4575, - "step": 174980 - }, - { - "epoch": 0.31, - "learning_rate": 3.4741923220457804e-05, - "loss": 2.4922, - "step": 174990 - }, - { - "epoch": 0.31, - "learning_rate": 3.474105128053098e-05, - "loss": 2.5298, - "step": 175000 - }, - { - "epoch": 0.31, - "learning_rate": 3.474017934060415e-05, - "loss": 2.4862, - "step": 175010 - }, - { - "epoch": 0.31, - "learning_rate": 3.473930740067732e-05, - "loss": 2.3974, - "step": 175020 - }, - { - "epoch": 0.31, - "learning_rate": 3.47384354607505e-05, - "loss": 2.5298, - "step": 175030 - }, - { - "epoch": 0.31, - "learning_rate": 3.473756352082367e-05, - "loss": 2.507, - "step": 175040 - }, - { - "epoch": 0.31, - "learning_rate": 3.4736691580896846e-05, - "loss": 2.4723, - "step": 175050 - }, - { - "epoch": 0.31, - "learning_rate": 3.473581964097002e-05, - "loss": 2.3929, - "step": 175060 - }, - { - "epoch": 0.31, - "learning_rate": 3.4734947701043194e-05, - "loss": 2.4837, - "step": 175070 - }, - { - "epoch": 0.31, - "learning_rate": 3.4734075761116364e-05, - "loss": 2.4299, - "step": 175080 - }, - { - "epoch": 0.31, - "learning_rate": 3.4733203821189535e-05, - "loss": 2.3951, - "step": 175090 - }, - { - "epoch": 0.31, - "learning_rate": 3.473233188126271e-05, - "loss": 2.4494, - "step": 175100 - }, - { - "epoch": 0.31, - "learning_rate": 3.473145994133588e-05, - "loss": 2.4101, - "step": 175110 - }, - { - "epoch": 0.31, - "learning_rate": 3.473058800140906e-05, - "loss": 2.3644, - "step": 175120 - }, - { - "epoch": 0.31, - "learning_rate": 3.472971606148223e-05, - "loss": 2.3514, - "step": 175130 - }, - { - "epoch": 0.31, - "learning_rate": 3.472884412155541e-05, - "loss": 2.4023, - "step": 175140 - }, - { - "epoch": 0.31, - "learning_rate": 3.472797218162858e-05, - "loss": 2.4909, - "step": 175150 - }, - { - "epoch": 0.31, - "learning_rate": 3.472710024170175e-05, - "loss": 2.3896, - "step": 175160 - }, - { - "epoch": 0.31, - "learning_rate": 3.472622830177492e-05, - "loss": 2.3426, - "step": 175170 - }, - { - "epoch": 0.31, - "learning_rate": 3.4725356361848095e-05, - "loss": 2.4574, - "step": 175180 - }, - { - "epoch": 0.31, - "learning_rate": 3.472448442192127e-05, - "loss": 2.3787, - "step": 175190 - }, - { - "epoch": 0.31, - "learning_rate": 3.472361248199444e-05, - "loss": 2.5224, - "step": 175200 - }, - { - "epoch": 0.31, - "learning_rate": 3.472274054206762e-05, - "loss": 2.3911, - "step": 175210 - }, - { - "epoch": 0.31, - "learning_rate": 3.472186860214079e-05, - "loss": 2.4904, - "step": 175220 - }, - { - "epoch": 0.31, - "learning_rate": 3.472099666221396e-05, - "loss": 2.391, - "step": 175230 - }, - { - "epoch": 0.31, - "learning_rate": 3.472012472228713e-05, - "loss": 2.4988, - "step": 175240 - }, - { - "epoch": 0.31, - "learning_rate": 3.471925278236031e-05, - "loss": 2.3873, - "step": 175250 - }, - { - "epoch": 0.31, - "learning_rate": 3.471838084243348e-05, - "loss": 2.4731, - "step": 175260 - }, - { - "epoch": 0.31, - "learning_rate": 3.4717508902506656e-05, - "loss": 2.4042, - "step": 175270 - }, - { - "epoch": 0.31, - "learning_rate": 3.4716636962579826e-05, - "loss": 2.4563, - "step": 175280 - }, - { - "epoch": 0.31, - "learning_rate": 3.4715765022653e-05, - "loss": 2.384, - "step": 175290 - }, - { - "epoch": 0.31, - "learning_rate": 3.4714893082726174e-05, - "loss": 2.3981, - "step": 175300 - }, - { - "epoch": 0.31, - "learning_rate": 3.4714021142799344e-05, - "loss": 2.5356, - "step": 175310 - }, - { - "epoch": 0.31, - "learning_rate": 3.471314920287252e-05, - "loss": 2.4311, - "step": 175320 - }, - { - "epoch": 0.31, - "learning_rate": 3.471227726294569e-05, - "loss": 2.515, - "step": 175330 - }, - { - "epoch": 0.31, - "learning_rate": 3.471140532301887e-05, - "loss": 2.5068, - "step": 175340 - }, - { - "epoch": 0.31, - "learning_rate": 3.471053338309204e-05, - "loss": 2.4462, - "step": 175350 - }, - { - "epoch": 0.31, - "learning_rate": 3.4709661443165216e-05, - "loss": 2.5589, - "step": 175360 - }, - { - "epoch": 0.31, - "learning_rate": 3.4708789503238387e-05, - "loss": 2.4457, - "step": 175370 - }, - { - "epoch": 0.31, - "learning_rate": 3.470791756331156e-05, - "loss": 2.4681, - "step": 175380 - }, - { - "epoch": 0.31, - "learning_rate": 3.4707045623384734e-05, - "loss": 2.4073, - "step": 175390 - }, - { - "epoch": 0.31, - "learning_rate": 3.4706173683457905e-05, - "loss": 2.3495, - "step": 175400 - }, - { - "epoch": 0.31, - "learning_rate": 3.4705301743531075e-05, - "loss": 2.296, - "step": 175410 - }, - { - "epoch": 0.31, - "learning_rate": 3.470442980360425e-05, - "loss": 2.4465, - "step": 175420 - }, - { - "epoch": 0.31, - "learning_rate": 3.470355786367743e-05, - "loss": 2.429, - "step": 175430 - }, - { - "epoch": 0.31, - "learning_rate": 3.47026859237506e-05, - "loss": 2.439, - "step": 175440 - }, - { - "epoch": 0.31, - "learning_rate": 3.470181398382377e-05, - "loss": 2.4023, - "step": 175450 - }, - { - "epoch": 0.31, - "learning_rate": 3.470094204389695e-05, - "loss": 2.4124, - "step": 175460 - }, - { - "epoch": 0.31, - "learning_rate": 3.470007010397012e-05, - "loss": 2.4838, - "step": 175470 - }, - { - "epoch": 0.31, - "learning_rate": 3.469919816404329e-05, - "loss": 2.4952, - "step": 175480 - }, - { - "epoch": 0.31, - "learning_rate": 3.4698326224116465e-05, - "loss": 2.4994, - "step": 175490 - }, - { - "epoch": 0.31, - "learning_rate": 3.469745428418964e-05, - "loss": 2.463, - "step": 175500 - }, - { - "epoch": 0.31, - "learning_rate": 3.469658234426281e-05, - "loss": 2.4003, - "step": 175510 - }, - { - "epoch": 0.31, - "learning_rate": 3.469571040433598e-05, - "loss": 2.4021, - "step": 175520 - }, - { - "epoch": 0.31, - "learning_rate": 3.469483846440916e-05, - "loss": 2.479, - "step": 175530 - }, - { - "epoch": 0.31, - "learning_rate": 3.469396652448233e-05, - "loss": 2.4018, - "step": 175540 - }, - { - "epoch": 0.31, - "learning_rate": 3.46930945845555e-05, - "loss": 2.4388, - "step": 175550 - }, - { - "epoch": 0.31, - "learning_rate": 3.469222264462867e-05, - "loss": 2.4173, - "step": 175560 - }, - { - "epoch": 0.31, - "learning_rate": 3.4691350704701855e-05, - "loss": 2.5095, - "step": 175570 - }, - { - "epoch": 0.31, - "learning_rate": 3.4690478764775026e-05, - "loss": 2.4909, - "step": 175580 - }, - { - "epoch": 0.31, - "learning_rate": 3.4689606824848196e-05, - "loss": 2.5051, - "step": 175590 - }, - { - "epoch": 0.31, - "learning_rate": 3.468873488492137e-05, - "loss": 2.4509, - "step": 175600 - }, - { - "epoch": 0.31, - "learning_rate": 3.4687862944994544e-05, - "loss": 2.4873, - "step": 175610 - }, - { - "epoch": 0.31, - "learning_rate": 3.4686991005067714e-05, - "loss": 2.2958, - "step": 175620 - }, - { - "epoch": 0.31, - "learning_rate": 3.4686119065140884e-05, - "loss": 2.3316, - "step": 175630 - }, - { - "epoch": 0.31, - "learning_rate": 3.468524712521407e-05, - "loss": 2.5188, - "step": 175640 - }, - { - "epoch": 0.31, - "learning_rate": 3.468437518528724e-05, - "loss": 2.4654, - "step": 175650 - }, - { - "epoch": 0.31, - "learning_rate": 3.468350324536041e-05, - "loss": 2.4817, - "step": 175660 - }, - { - "epoch": 0.31, - "learning_rate": 3.468263130543358e-05, - "loss": 2.3804, - "step": 175670 - }, - { - "epoch": 0.31, - "learning_rate": 3.4681759365506757e-05, - "loss": 2.4678, - "step": 175680 - }, - { - "epoch": 0.31, - "learning_rate": 3.468088742557993e-05, - "loss": 2.3927, - "step": 175690 - }, - { - "epoch": 0.31, - "learning_rate": 3.46800154856531e-05, - "loss": 2.4953, - "step": 175700 - }, - { - "epoch": 0.31, - "learning_rate": 3.4679143545726274e-05, - "loss": 2.4123, - "step": 175710 - }, - { - "epoch": 0.31, - "learning_rate": 3.467827160579945e-05, - "loss": 2.4909, - "step": 175720 - }, - { - "epoch": 0.31, - "learning_rate": 3.467739966587262e-05, - "loss": 2.3377, - "step": 175730 - }, - { - "epoch": 0.31, - "learning_rate": 3.467652772594579e-05, - "loss": 2.4691, - "step": 175740 - }, - { - "epoch": 0.31, - "learning_rate": 3.467565578601897e-05, - "loss": 2.4052, - "step": 175750 - }, - { - "epoch": 0.31, - "learning_rate": 3.467478384609214e-05, - "loss": 2.4771, - "step": 175760 - }, - { - "epoch": 0.31, - "learning_rate": 3.467391190616531e-05, - "loss": 2.5331, - "step": 175770 - }, - { - "epoch": 0.31, - "learning_rate": 3.467303996623849e-05, - "loss": 2.5493, - "step": 175780 - }, - { - "epoch": 0.31, - "learning_rate": 3.4672168026311665e-05, - "loss": 2.5149, - "step": 175790 - }, - { - "epoch": 0.31, - "learning_rate": 3.4671296086384835e-05, - "loss": 2.416, - "step": 175800 - }, - { - "epoch": 0.31, - "learning_rate": 3.4670424146458005e-05, - "loss": 2.3879, - "step": 175810 - }, - { - "epoch": 0.31, - "learning_rate": 3.466955220653118e-05, - "loss": 2.4943, - "step": 175820 - }, - { - "epoch": 0.31, - "learning_rate": 3.466868026660435e-05, - "loss": 2.5891, - "step": 175830 - }, - { - "epoch": 0.31, - "learning_rate": 3.466780832667752e-05, - "loss": 2.3969, - "step": 175840 - }, - { - "epoch": 0.31, - "learning_rate": 3.46669363867507e-05, - "loss": 2.4807, - "step": 175850 - }, - { - "epoch": 0.31, - "learning_rate": 3.466606444682388e-05, - "loss": 2.3174, - "step": 175860 - }, - { - "epoch": 0.31, - "learning_rate": 3.466519250689705e-05, - "loss": 2.3968, - "step": 175870 - }, - { - "epoch": 0.31, - "learning_rate": 3.466432056697022e-05, - "loss": 2.4663, - "step": 175880 - }, - { - "epoch": 0.31, - "learning_rate": 3.4663448627043396e-05, - "loss": 2.4311, - "step": 175890 - }, - { - "epoch": 0.31, - "learning_rate": 3.4662576687116566e-05, - "loss": 2.5489, - "step": 175900 - }, - { - "epoch": 0.31, - "learning_rate": 3.4661704747189736e-05, - "loss": 2.3934, - "step": 175910 - }, - { - "epoch": 0.31, - "learning_rate": 3.4660832807262913e-05, - "loss": 2.3865, - "step": 175920 - }, - { - "epoch": 0.31, - "learning_rate": 3.4659960867336084e-05, - "loss": 2.2773, - "step": 175930 - }, - { - "epoch": 0.31, - "learning_rate": 3.465908892740926e-05, - "loss": 2.501, - "step": 175940 - }, - { - "epoch": 0.31, - "learning_rate": 3.465821698748243e-05, - "loss": 2.4966, - "step": 175950 - }, - { - "epoch": 0.31, - "learning_rate": 3.465734504755561e-05, - "loss": 2.4709, - "step": 175960 - }, - { - "epoch": 0.31, - "learning_rate": 3.465647310762878e-05, - "loss": 2.4808, - "step": 175970 - }, - { - "epoch": 0.31, - "learning_rate": 3.465560116770195e-05, - "loss": 2.3991, - "step": 175980 - }, - { - "epoch": 0.31, - "learning_rate": 3.4654729227775126e-05, - "loss": 2.3801, - "step": 175990 - }, - { - "epoch": 0.31, - "learning_rate": 3.46538572878483e-05, - "loss": 2.4486, - "step": 176000 - }, - { - "epoch": 0.31, - "learning_rate": 3.4652985347921474e-05, - "loss": 2.5249, - "step": 176010 - }, - { - "epoch": 0.31, - "learning_rate": 3.4652113407994644e-05, - "loss": 2.4286, - "step": 176020 - }, - { - "epoch": 0.31, - "learning_rate": 3.465124146806782e-05, - "loss": 2.4907, - "step": 176030 - }, - { - "epoch": 0.31, - "learning_rate": 3.465036952814099e-05, - "loss": 2.4314, - "step": 176040 - }, - { - "epoch": 0.31, - "learning_rate": 3.464949758821416e-05, - "loss": 2.3974, - "step": 176050 - }, - { - "epoch": 0.31, - "learning_rate": 3.464862564828734e-05, - "loss": 2.4264, - "step": 176060 - }, - { - "epoch": 0.31, - "learning_rate": 3.464775370836051e-05, - "loss": 2.4542, - "step": 176070 - }, - { - "epoch": 0.31, - "learning_rate": 3.464688176843368e-05, - "loss": 2.2812, - "step": 176080 - }, - { - "epoch": 0.31, - "learning_rate": 3.464600982850686e-05, - "loss": 2.5055, - "step": 176090 - }, - { - "epoch": 0.31, - "learning_rate": 3.4645137888580035e-05, - "loss": 2.5393, - "step": 176100 - }, - { - "epoch": 0.31, - "learning_rate": 3.4644265948653205e-05, - "loss": 2.4789, - "step": 176110 - }, - { - "epoch": 0.31, - "learning_rate": 3.4643394008726375e-05, - "loss": 2.4033, - "step": 176120 - }, - { - "epoch": 0.31, - "learning_rate": 3.4642522068799546e-05, - "loss": 2.504, - "step": 176130 - }, - { - "epoch": 0.31, - "learning_rate": 3.464165012887272e-05, - "loss": 2.4328, - "step": 176140 - }, - { - "epoch": 0.31, - "learning_rate": 3.464077818894589e-05, - "loss": 2.4493, - "step": 176150 - }, - { - "epoch": 0.31, - "learning_rate": 3.463990624901907e-05, - "loss": 2.5134, - "step": 176160 - }, - { - "epoch": 0.31, - "learning_rate": 3.463903430909225e-05, - "loss": 2.4889, - "step": 176170 - }, - { - "epoch": 0.31, - "learning_rate": 3.463816236916542e-05, - "loss": 2.4257, - "step": 176180 - }, - { - "epoch": 0.31, - "learning_rate": 3.463729042923859e-05, - "loss": 2.3495, - "step": 176190 - }, - { - "epoch": 0.31, - "learning_rate": 3.463641848931176e-05, - "loss": 2.4787, - "step": 176200 - }, - { - "epoch": 0.31, - "learning_rate": 3.4635546549384936e-05, - "loss": 2.3976, - "step": 176210 - }, - { - "epoch": 0.31, - "learning_rate": 3.4634674609458106e-05, - "loss": 2.3269, - "step": 176220 - }, - { - "epoch": 0.31, - "learning_rate": 3.4633802669531277e-05, - "loss": 2.4284, - "step": 176230 - }, - { - "epoch": 0.31, - "learning_rate": 3.4632930729604454e-05, - "loss": 2.4397, - "step": 176240 - }, - { - "epoch": 0.31, - "learning_rate": 3.463205878967763e-05, - "loss": 2.4515, - "step": 176250 - }, - { - "epoch": 0.31, - "learning_rate": 3.46311868497508e-05, - "loss": 2.3573, - "step": 176260 - }, - { - "epoch": 0.31, - "learning_rate": 3.463031490982397e-05, - "loss": 2.2911, - "step": 176270 - }, - { - "epoch": 0.31, - "learning_rate": 3.462944296989715e-05, - "loss": 2.6332, - "step": 176280 - }, - { - "epoch": 0.31, - "learning_rate": 3.462857102997032e-05, - "loss": 2.3279, - "step": 176290 - }, - { - "epoch": 0.31, - "learning_rate": 3.462769909004349e-05, - "loss": 2.4828, - "step": 176300 - }, - { - "epoch": 0.31, - "learning_rate": 3.462682715011667e-05, - "loss": 2.3914, - "step": 176310 - }, - { - "epoch": 0.31, - "learning_rate": 3.4625955210189844e-05, - "loss": 2.4212, - "step": 176320 - }, - { - "epoch": 0.31, - "learning_rate": 3.4625083270263014e-05, - "loss": 2.3999, - "step": 176330 - }, - { - "epoch": 0.31, - "learning_rate": 3.4624211330336185e-05, - "loss": 2.4394, - "step": 176340 - }, - { - "epoch": 0.31, - "learning_rate": 3.462333939040936e-05, - "loss": 2.4594, - "step": 176350 - }, - { - "epoch": 0.31, - "learning_rate": 3.462246745048253e-05, - "loss": 2.4719, - "step": 176360 - }, - { - "epoch": 0.31, - "learning_rate": 3.46215955105557e-05, - "loss": 2.462, - "step": 176370 - }, - { - "epoch": 0.31, - "learning_rate": 3.462072357062888e-05, - "loss": 2.5107, - "step": 176380 - }, - { - "epoch": 0.31, - "learning_rate": 3.461985163070206e-05, - "loss": 2.3965, - "step": 176390 - }, - { - "epoch": 0.31, - "learning_rate": 3.461897969077523e-05, - "loss": 2.4677, - "step": 176400 - }, - { - "epoch": 0.31, - "learning_rate": 3.46181077508484e-05, - "loss": 2.3647, - "step": 176410 - }, - { - "epoch": 0.31, - "learning_rate": 3.4617235810921575e-05, - "loss": 2.421, - "step": 176420 - }, - { - "epoch": 0.31, - "learning_rate": 3.4616363870994745e-05, - "loss": 2.2811, - "step": 176430 - }, - { - "epoch": 0.31, - "learning_rate": 3.4615491931067916e-05, - "loss": 2.336, - "step": 176440 - }, - { - "epoch": 0.31, - "learning_rate": 3.461461999114109e-05, - "loss": 2.48, - "step": 176450 - }, - { - "epoch": 0.31, - "learning_rate": 3.461374805121427e-05, - "loss": 2.4977, - "step": 176460 - }, - { - "epoch": 0.31, - "learning_rate": 3.461287611128744e-05, - "loss": 2.4027, - "step": 176470 - }, - { - "epoch": 0.31, - "learning_rate": 3.461200417136061e-05, - "loss": 2.3477, - "step": 176480 - }, - { - "epoch": 0.31, - "learning_rate": 3.461113223143379e-05, - "loss": 2.5662, - "step": 176490 - }, - { - "epoch": 0.31, - "learning_rate": 3.461026029150696e-05, - "loss": 2.505, - "step": 176500 - }, - { - "epoch": 0.31, - "learning_rate": 3.460938835158013e-05, - "loss": 2.399, - "step": 176510 - }, - { - "epoch": 0.31, - "learning_rate": 3.46085164116533e-05, - "loss": 2.4818, - "step": 176520 - }, - { - "epoch": 0.31, - "learning_rate": 3.460764447172648e-05, - "loss": 2.386, - "step": 176530 - }, - { - "epoch": 0.31, - "learning_rate": 3.460677253179965e-05, - "loss": 2.4832, - "step": 176540 - }, - { - "epoch": 0.31, - "learning_rate": 3.4605900591872824e-05, - "loss": 2.3386, - "step": 176550 - }, - { - "epoch": 0.31, - "learning_rate": 3.4605028651946e-05, - "loss": 2.5109, - "step": 176560 - }, - { - "epoch": 0.31, - "learning_rate": 3.460415671201917e-05, - "loss": 2.4837, - "step": 176570 - }, - { - "epoch": 0.31, - "learning_rate": 3.460328477209234e-05, - "loss": 2.4303, - "step": 176580 - }, - { - "epoch": 0.31, - "learning_rate": 3.460241283216551e-05, - "loss": 2.4654, - "step": 176590 - }, - { - "epoch": 0.31, - "learning_rate": 3.460154089223869e-05, - "loss": 2.3725, - "step": 176600 - }, - { - "epoch": 0.31, - "learning_rate": 3.4600668952311866e-05, - "loss": 2.4561, - "step": 176610 - }, - { - "epoch": 0.31, - "learning_rate": 3.459979701238504e-05, - "loss": 2.593, - "step": 176620 - }, - { - "epoch": 0.31, - "learning_rate": 3.459892507245821e-05, - "loss": 2.448, - "step": 176630 - }, - { - "epoch": 0.31, - "learning_rate": 3.4598053132531384e-05, - "loss": 2.4317, - "step": 176640 - }, - { - "epoch": 0.31, - "learning_rate": 3.4597181192604555e-05, - "loss": 2.4625, - "step": 176650 - }, - { - "epoch": 0.31, - "learning_rate": 3.4596309252677725e-05, - "loss": 2.5161, - "step": 176660 - }, - { - "epoch": 0.31, - "learning_rate": 3.45954373127509e-05, - "loss": 2.4167, - "step": 176670 - }, - { - "epoch": 0.31, - "learning_rate": 3.459456537282408e-05, - "loss": 2.4126, - "step": 176680 - }, - { - "epoch": 0.31, - "learning_rate": 3.459369343289725e-05, - "loss": 2.4601, - "step": 176690 - }, - { - "epoch": 0.31, - "learning_rate": 3.459282149297042e-05, - "loss": 2.5293, - "step": 176700 - }, - { - "epoch": 0.31, - "learning_rate": 3.45919495530436e-05, - "loss": 2.3067, - "step": 176710 - }, - { - "epoch": 0.31, - "learning_rate": 3.459107761311677e-05, - "loss": 2.5347, - "step": 176720 - }, - { - "epoch": 0.31, - "learning_rate": 3.459020567318994e-05, - "loss": 2.4159, - "step": 176730 - }, - { - "epoch": 0.31, - "learning_rate": 3.4589333733263115e-05, - "loss": 2.3181, - "step": 176740 - }, - { - "epoch": 0.31, - "learning_rate": 3.4588461793336286e-05, - "loss": 2.443, - "step": 176750 - }, - { - "epoch": 0.31, - "learning_rate": 3.458758985340946e-05, - "loss": 2.3403, - "step": 176760 - }, - { - "epoch": 0.31, - "learning_rate": 3.458671791348263e-05, - "loss": 2.4158, - "step": 176770 - }, - { - "epoch": 0.31, - "learning_rate": 3.458584597355581e-05, - "loss": 2.4101, - "step": 176780 - }, - { - "epoch": 0.31, - "learning_rate": 3.458497403362898e-05, - "loss": 2.5524, - "step": 176790 - }, - { - "epoch": 0.31, - "learning_rate": 3.458410209370215e-05, - "loss": 2.4513, - "step": 176800 - }, - { - "epoch": 0.31, - "learning_rate": 3.458323015377533e-05, - "loss": 2.4213, - "step": 176810 - }, - { - "epoch": 0.31, - "learning_rate": 3.45823582138485e-05, - "loss": 2.3921, - "step": 176820 - }, - { - "epoch": 0.31, - "learning_rate": 3.4581486273921676e-05, - "loss": 2.5129, - "step": 176830 - }, - { - "epoch": 0.31, - "learning_rate": 3.4580614333994846e-05, - "loss": 2.3777, - "step": 176840 - }, - { - "epoch": 0.31, - "learning_rate": 3.457974239406802e-05, - "loss": 2.5096, - "step": 176850 - }, - { - "epoch": 0.31, - "learning_rate": 3.4578870454141194e-05, - "loss": 2.4708, - "step": 176860 - }, - { - "epoch": 0.31, - "learning_rate": 3.4577998514214364e-05, - "loss": 2.331, - "step": 176870 - }, - { - "epoch": 0.31, - "learning_rate": 3.457712657428754e-05, - "loss": 2.4943, - "step": 176880 - }, - { - "epoch": 0.31, - "learning_rate": 3.457625463436071e-05, - "loss": 2.4888, - "step": 176890 - }, - { - "epoch": 0.31, - "learning_rate": 3.457538269443388e-05, - "loss": 2.4724, - "step": 176900 - }, - { - "epoch": 0.31, - "learning_rate": 3.457451075450706e-05, - "loss": 2.3371, - "step": 176910 - }, - { - "epoch": 0.31, - "learning_rate": 3.4573638814580236e-05, - "loss": 2.5098, - "step": 176920 - }, - { - "epoch": 0.31, - "learning_rate": 3.457276687465341e-05, - "loss": 2.4303, - "step": 176930 - }, - { - "epoch": 0.31, - "learning_rate": 3.457189493472658e-05, - "loss": 2.5357, - "step": 176940 - }, - { - "epoch": 0.31, - "learning_rate": 3.4571022994799754e-05, - "loss": 2.4667, - "step": 176950 - }, - { - "epoch": 0.31, - "learning_rate": 3.4570151054872925e-05, - "loss": 2.3857, - "step": 176960 - }, - { - "epoch": 0.31, - "learning_rate": 3.4569279114946095e-05, - "loss": 2.5795, - "step": 176970 - }, - { - "epoch": 0.31, - "learning_rate": 3.456840717501927e-05, - "loss": 2.4464, - "step": 176980 - }, - { - "epoch": 0.31, - "learning_rate": 3.456753523509245e-05, - "loss": 2.5866, - "step": 176990 - }, - { - "epoch": 0.31, - "learning_rate": 3.456666329516562e-05, - "loss": 2.4656, - "step": 177000 - }, - { - "epoch": 0.31, - "learning_rate": 3.456579135523879e-05, - "loss": 2.5063, - "step": 177010 - }, - { - "epoch": 0.31, - "learning_rate": 3.456491941531196e-05, - "loss": 2.3609, - "step": 177020 - }, - { - "epoch": 0.31, - "learning_rate": 3.456404747538514e-05, - "loss": 2.4255, - "step": 177030 - }, - { - "epoch": 0.31, - "learning_rate": 3.456317553545831e-05, - "loss": 2.4608, - "step": 177040 - }, - { - "epoch": 0.31, - "learning_rate": 3.4562303595531485e-05, - "loss": 2.2851, - "step": 177050 - }, - { - "epoch": 0.31, - "learning_rate": 3.456143165560466e-05, - "loss": 2.4759, - "step": 177060 - }, - { - "epoch": 0.31, - "learning_rate": 3.456055971567783e-05, - "loss": 2.4174, - "step": 177070 - }, - { - "epoch": 0.31, - "learning_rate": 3.4559687775751e-05, - "loss": 2.5096, - "step": 177080 - }, - { - "epoch": 0.31, - "learning_rate": 3.455881583582417e-05, - "loss": 2.4195, - "step": 177090 - }, - { - "epoch": 0.31, - "learning_rate": 3.455794389589735e-05, - "loss": 2.5528, - "step": 177100 - }, - { - "epoch": 0.31, - "learning_rate": 3.455707195597052e-05, - "loss": 2.4368, - "step": 177110 - }, - { - "epoch": 0.31, - "learning_rate": 3.455620001604369e-05, - "loss": 2.4419, - "step": 177120 - }, - { - "epoch": 0.31, - "learning_rate": 3.455532807611687e-05, - "loss": 2.483, - "step": 177130 - }, - { - "epoch": 0.31, - "learning_rate": 3.4554456136190046e-05, - "loss": 2.5722, - "step": 177140 - }, - { - "epoch": 0.31, - "learning_rate": 3.4553584196263216e-05, - "loss": 2.5083, - "step": 177150 - }, - { - "epoch": 0.31, - "learning_rate": 3.4552712256336386e-05, - "loss": 2.5109, - "step": 177160 - }, - { - "epoch": 0.31, - "learning_rate": 3.4551840316409564e-05, - "loss": 2.4664, - "step": 177170 - }, - { - "epoch": 0.31, - "learning_rate": 3.4550968376482734e-05, - "loss": 2.4735, - "step": 177180 - }, - { - "epoch": 0.31, - "learning_rate": 3.4550096436555904e-05, - "loss": 2.5632, - "step": 177190 - }, - { - "epoch": 0.31, - "learning_rate": 3.454922449662908e-05, - "loss": 2.436, - "step": 177200 - }, - { - "epoch": 0.31, - "learning_rate": 3.454835255670226e-05, - "loss": 2.4984, - "step": 177210 - }, - { - "epoch": 0.31, - "learning_rate": 3.454748061677543e-05, - "loss": 2.4736, - "step": 177220 - }, - { - "epoch": 0.31, - "learning_rate": 3.45466086768486e-05, - "loss": 2.4547, - "step": 177230 - }, - { - "epoch": 0.31, - "learning_rate": 3.4545736736921777e-05, - "loss": 2.4207, - "step": 177240 - }, - { - "epoch": 0.31, - "learning_rate": 3.454486479699495e-05, - "loss": 2.2302, - "step": 177250 - }, - { - "epoch": 0.31, - "learning_rate": 3.454399285706812e-05, - "loss": 2.4443, - "step": 177260 - }, - { - "epoch": 0.31, - "learning_rate": 3.4543120917141294e-05, - "loss": 2.3802, - "step": 177270 - }, - { - "epoch": 0.31, - "learning_rate": 3.454224897721447e-05, - "loss": 2.4855, - "step": 177280 - }, - { - "epoch": 0.31, - "learning_rate": 3.454137703728764e-05, - "loss": 2.4569, - "step": 177290 - }, - { - "epoch": 0.31, - "learning_rate": 3.454050509736081e-05, - "loss": 2.5284, - "step": 177300 - }, - { - "epoch": 0.31, - "learning_rate": 3.453963315743399e-05, - "loss": 2.3929, - "step": 177310 - }, - { - "epoch": 0.31, - "learning_rate": 3.453876121750716e-05, - "loss": 2.5053, - "step": 177320 - }, - { - "epoch": 0.31, - "learning_rate": 3.453788927758033e-05, - "loss": 2.4229, - "step": 177330 - }, - { - "epoch": 0.31, - "learning_rate": 3.453701733765351e-05, - "loss": 2.5473, - "step": 177340 - }, - { - "epoch": 0.31, - "learning_rate": 3.4536145397726685e-05, - "loss": 2.4733, - "step": 177350 - }, - { - "epoch": 0.31, - "learning_rate": 3.4535273457799855e-05, - "loss": 2.379, - "step": 177360 - }, - { - "epoch": 0.31, - "learning_rate": 3.4534401517873025e-05, - "loss": 2.5046, - "step": 177370 - }, - { - "epoch": 0.31, - "learning_rate": 3.45335295779462e-05, - "loss": 2.2803, - "step": 177380 - }, - { - "epoch": 0.31, - "learning_rate": 3.453265763801937e-05, - "loss": 2.5086, - "step": 177390 - }, - { - "epoch": 0.31, - "learning_rate": 3.453178569809254e-05, - "loss": 2.4484, - "step": 177400 - }, - { - "epoch": 0.31, - "learning_rate": 3.453091375816572e-05, - "loss": 2.5267, - "step": 177410 - }, - { - "epoch": 0.31, - "learning_rate": 3.453004181823889e-05, - "loss": 2.4489, - "step": 177420 - }, - { - "epoch": 0.31, - "learning_rate": 3.452916987831207e-05, - "loss": 2.5536, - "step": 177430 - }, - { - "epoch": 0.31, - "learning_rate": 3.452829793838524e-05, - "loss": 2.4722, - "step": 177440 - }, - { - "epoch": 0.31, - "learning_rate": 3.4527425998458416e-05, - "loss": 2.3636, - "step": 177450 - }, - { - "epoch": 0.31, - "learning_rate": 3.4526554058531586e-05, - "loss": 2.4939, - "step": 177460 - }, - { - "epoch": 0.31, - "learning_rate": 3.4525682118604756e-05, - "loss": 2.4014, - "step": 177470 - }, - { - "epoch": 0.31, - "learning_rate": 3.452481017867793e-05, - "loss": 2.4997, - "step": 177480 - }, - { - "epoch": 0.31, - "learning_rate": 3.4523938238751104e-05, - "loss": 2.502, - "step": 177490 - }, - { - "epoch": 0.31, - "learning_rate": 3.452306629882428e-05, - "loss": 2.2767, - "step": 177500 - }, - { - "epoch": 0.31, - "learning_rate": 3.452219435889745e-05, - "loss": 2.3046, - "step": 177510 - }, - { - "epoch": 0.31, - "learning_rate": 3.452132241897063e-05, - "loss": 2.4831, - "step": 177520 - }, - { - "epoch": 0.31, - "learning_rate": 3.45204504790438e-05, - "loss": 2.4384, - "step": 177530 - }, - { - "epoch": 0.31, - "learning_rate": 3.451957853911697e-05, - "loss": 2.348, - "step": 177540 - }, - { - "epoch": 0.31, - "learning_rate": 3.451870659919014e-05, - "loss": 2.4649, - "step": 177550 - }, - { - "epoch": 0.31, - "learning_rate": 3.451783465926332e-05, - "loss": 2.3746, - "step": 177560 - }, - { - "epoch": 0.31, - "learning_rate": 3.451696271933649e-05, - "loss": 2.5051, - "step": 177570 - }, - { - "epoch": 0.31, - "learning_rate": 3.4516090779409664e-05, - "loss": 2.4917, - "step": 177580 - }, - { - "epoch": 0.31, - "learning_rate": 3.4515218839482835e-05, - "loss": 2.4552, - "step": 177590 - }, - { - "epoch": 0.31, - "learning_rate": 3.451434689955601e-05, - "loss": 2.4258, - "step": 177600 - }, - { - "epoch": 0.31, - "learning_rate": 3.451347495962918e-05, - "loss": 2.4257, - "step": 177610 - }, - { - "epoch": 0.31, - "learning_rate": 3.451260301970235e-05, - "loss": 2.3749, - "step": 177620 - }, - { - "epoch": 0.31, - "learning_rate": 3.451173107977553e-05, - "loss": 2.5044, - "step": 177630 - }, - { - "epoch": 0.31, - "learning_rate": 3.45108591398487e-05, - "loss": 2.4904, - "step": 177640 - }, - { - "epoch": 0.31, - "learning_rate": 3.450998719992188e-05, - "loss": 2.3916, - "step": 177650 - }, - { - "epoch": 0.31, - "learning_rate": 3.450911525999505e-05, - "loss": 2.5031, - "step": 177660 - }, - { - "epoch": 0.31, - "learning_rate": 3.4508243320068225e-05, - "loss": 2.3587, - "step": 177670 - }, - { - "epoch": 0.31, - "learning_rate": 3.4507371380141395e-05, - "loss": 2.3501, - "step": 177680 - }, - { - "epoch": 0.31, - "learning_rate": 3.4506499440214566e-05, - "loss": 2.4078, - "step": 177690 - }, - { - "epoch": 0.31, - "learning_rate": 3.450562750028774e-05, - "loss": 2.5198, - "step": 177700 - }, - { - "epoch": 0.31, - "learning_rate": 3.450475556036091e-05, - "loss": 2.4924, - "step": 177710 - }, - { - "epoch": 0.31, - "learning_rate": 3.450388362043409e-05, - "loss": 2.443, - "step": 177720 - }, - { - "epoch": 0.31, - "learning_rate": 3.450301168050726e-05, - "loss": 2.4946, - "step": 177730 - }, - { - "epoch": 0.31, - "learning_rate": 3.450213974058044e-05, - "loss": 2.5387, - "step": 177740 - }, - { - "epoch": 0.31, - "learning_rate": 3.450126780065361e-05, - "loss": 2.422, - "step": 177750 - }, - { - "epoch": 0.31, - "learning_rate": 3.450039586072678e-05, - "loss": 2.552, - "step": 177760 - }, - { - "epoch": 0.31, - "learning_rate": 3.4499523920799956e-05, - "loss": 2.5253, - "step": 177770 - }, - { - "epoch": 0.31, - "learning_rate": 3.4498651980873126e-05, - "loss": 2.4517, - "step": 177780 - }, - { - "epoch": 0.31, - "learning_rate": 3.44977800409463e-05, - "loss": 2.4195, - "step": 177790 - }, - { - "epoch": 0.31, - "learning_rate": 3.4496908101019474e-05, - "loss": 2.4582, - "step": 177800 - }, - { - "epoch": 0.31, - "learning_rate": 3.449603616109265e-05, - "loss": 2.5251, - "step": 177810 - }, - { - "epoch": 0.31, - "learning_rate": 3.449516422116582e-05, - "loss": 2.495, - "step": 177820 - }, - { - "epoch": 0.31, - "learning_rate": 3.449429228123899e-05, - "loss": 2.4383, - "step": 177830 - }, - { - "epoch": 0.31, - "learning_rate": 3.449342034131217e-05, - "loss": 2.4725, - "step": 177840 - }, - { - "epoch": 0.31, - "learning_rate": 3.449254840138534e-05, - "loss": 2.3961, - "step": 177850 - }, - { - "epoch": 0.31, - "learning_rate": 3.449167646145851e-05, - "loss": 2.5526, - "step": 177860 - }, - { - "epoch": 0.31, - "learning_rate": 3.449080452153169e-05, - "loss": 2.482, - "step": 177870 - }, - { - "epoch": 0.31, - "learning_rate": 3.4489932581604864e-05, - "loss": 2.3158, - "step": 177880 - }, - { - "epoch": 0.31, - "learning_rate": 3.4489060641678034e-05, - "loss": 2.4396, - "step": 177890 - }, - { - "epoch": 0.31, - "learning_rate": 3.4488188701751205e-05, - "loss": 2.4649, - "step": 177900 - }, - { - "epoch": 0.31, - "learning_rate": 3.448731676182438e-05, - "loss": 2.5164, - "step": 177910 - }, - { - "epoch": 0.31, - "learning_rate": 3.448644482189755e-05, - "loss": 2.4655, - "step": 177920 - }, - { - "epoch": 0.31, - "learning_rate": 3.448557288197072e-05, - "loss": 2.4916, - "step": 177930 - }, - { - "epoch": 0.31, - "learning_rate": 3.448470094204389e-05, - "loss": 2.3897, - "step": 177940 - }, - { - "epoch": 0.31, - "learning_rate": 3.448382900211708e-05, - "loss": 2.4846, - "step": 177950 - }, - { - "epoch": 0.31, - "learning_rate": 3.448295706219025e-05, - "loss": 2.5546, - "step": 177960 - }, - { - "epoch": 0.31, - "learning_rate": 3.448208512226342e-05, - "loss": 2.427, - "step": 177970 - }, - { - "epoch": 0.31, - "learning_rate": 3.448121318233659e-05, - "loss": 2.4372, - "step": 177980 - }, - { - "epoch": 0.31, - "learning_rate": 3.4480341242409765e-05, - "loss": 2.6407, - "step": 177990 - }, - { - "epoch": 0.31, - "learning_rate": 3.4479469302482936e-05, - "loss": 2.4726, - "step": 178000 - }, - { - "epoch": 0.31, - "learning_rate": 3.4478597362556106e-05, - "loss": 2.5005, - "step": 178010 - }, - { - "epoch": 0.31, - "learning_rate": 3.447772542262929e-05, - "loss": 2.5465, - "step": 178020 - }, - { - "epoch": 0.31, - "learning_rate": 3.447685348270246e-05, - "loss": 2.4928, - "step": 178030 - }, - { - "epoch": 0.31, - "learning_rate": 3.447598154277563e-05, - "loss": 2.4959, - "step": 178040 - }, - { - "epoch": 0.31, - "learning_rate": 3.44751096028488e-05, - "loss": 2.3871, - "step": 178050 - }, - { - "epoch": 0.31, - "learning_rate": 3.447423766292198e-05, - "loss": 2.4779, - "step": 178060 - }, - { - "epoch": 0.31, - "learning_rate": 3.447336572299515e-05, - "loss": 2.5135, - "step": 178070 - }, - { - "epoch": 0.31, - "learning_rate": 3.447249378306832e-05, - "loss": 2.5244, - "step": 178080 - }, - { - "epoch": 0.31, - "learning_rate": 3.4471621843141496e-05, - "loss": 2.512, - "step": 178090 - }, - { - "epoch": 0.31, - "learning_rate": 3.447074990321467e-05, - "loss": 2.4825, - "step": 178100 - }, - { - "epoch": 0.31, - "learning_rate": 3.4469877963287844e-05, - "loss": 2.441, - "step": 178110 - }, - { - "epoch": 0.31, - "learning_rate": 3.4469006023361014e-05, - "loss": 2.3713, - "step": 178120 - }, - { - "epoch": 0.31, - "learning_rate": 3.446813408343419e-05, - "loss": 2.3909, - "step": 178130 - }, - { - "epoch": 0.31, - "learning_rate": 3.446726214350736e-05, - "loss": 2.4093, - "step": 178140 - }, - { - "epoch": 0.31, - "learning_rate": 3.446639020358053e-05, - "loss": 2.5052, - "step": 178150 - }, - { - "epoch": 0.31, - "learning_rate": 3.446551826365371e-05, - "loss": 2.3169, - "step": 178160 - }, - { - "epoch": 0.31, - "learning_rate": 3.4464646323726886e-05, - "loss": 2.463, - "step": 178170 - }, - { - "epoch": 0.31, - "learning_rate": 3.446377438380006e-05, - "loss": 2.5167, - "step": 178180 - }, - { - "epoch": 0.31, - "learning_rate": 3.446290244387323e-05, - "loss": 2.3485, - "step": 178190 - }, - { - "epoch": 0.31, - "learning_rate": 3.4462030503946404e-05, - "loss": 2.3939, - "step": 178200 - }, - { - "epoch": 0.31, - "learning_rate": 3.4461158564019575e-05, - "loss": 2.2944, - "step": 178210 - }, - { - "epoch": 0.31, - "learning_rate": 3.4460286624092745e-05, - "loss": 2.4506, - "step": 178220 - }, - { - "epoch": 0.31, - "learning_rate": 3.445941468416592e-05, - "loss": 2.424, - "step": 178230 - }, - { - "epoch": 0.31, - "learning_rate": 3.445854274423909e-05, - "loss": 2.4659, - "step": 178240 - }, - { - "epoch": 0.31, - "learning_rate": 3.445767080431227e-05, - "loss": 2.4847, - "step": 178250 - }, - { - "epoch": 0.31, - "learning_rate": 3.445679886438544e-05, - "loss": 2.4413, - "step": 178260 - }, - { - "epoch": 0.31, - "learning_rate": 3.445592692445862e-05, - "loss": 2.4261, - "step": 178270 - }, - { - "epoch": 0.31, - "learning_rate": 3.445505498453179e-05, - "loss": 2.4658, - "step": 178280 - }, - { - "epoch": 0.31, - "learning_rate": 3.445418304460496e-05, - "loss": 2.4115, - "step": 178290 - }, - { - "epoch": 0.31, - "learning_rate": 3.4453311104678135e-05, - "loss": 2.3159, - "step": 178300 - }, - { - "epoch": 0.31, - "learning_rate": 3.4452439164751306e-05, - "loss": 2.453, - "step": 178310 - }, - { - "epoch": 0.31, - "learning_rate": 3.445156722482448e-05, - "loss": 2.4535, - "step": 178320 - }, - { - "epoch": 0.31, - "learning_rate": 3.445069528489765e-05, - "loss": 2.4171, - "step": 178330 - }, - { - "epoch": 0.31, - "learning_rate": 3.444982334497083e-05, - "loss": 2.4288, - "step": 178340 - }, - { - "epoch": 0.31, - "learning_rate": 3.4448951405044e-05, - "loss": 2.241, - "step": 178350 - }, - { - "epoch": 0.31, - "learning_rate": 3.444807946511717e-05, - "loss": 2.4042, - "step": 178360 - }, - { - "epoch": 0.31, - "learning_rate": 3.444720752519034e-05, - "loss": 2.5267, - "step": 178370 - }, - { - "epoch": 0.31, - "learning_rate": 3.444633558526352e-05, - "loss": 2.3826, - "step": 178380 - }, - { - "epoch": 0.31, - "learning_rate": 3.4445463645336696e-05, - "loss": 2.4298, - "step": 178390 - }, - { - "epoch": 0.31, - "learning_rate": 3.4444591705409866e-05, - "loss": 2.4341, - "step": 178400 - }, - { - "epoch": 0.31, - "learning_rate": 3.444371976548304e-05, - "loss": 2.4896, - "step": 178410 - }, - { - "epoch": 0.31, - "learning_rate": 3.4442847825556214e-05, - "loss": 2.4538, - "step": 178420 - }, - { - "epoch": 0.31, - "learning_rate": 3.4441975885629384e-05, - "loss": 2.4394, - "step": 178430 - }, - { - "epoch": 0.31, - "learning_rate": 3.4441103945702554e-05, - "loss": 2.4293, - "step": 178440 - }, - { - "epoch": 0.31, - "learning_rate": 3.444023200577573e-05, - "loss": 2.3673, - "step": 178450 - }, - { - "epoch": 0.31, - "learning_rate": 3.44393600658489e-05, - "loss": 2.4195, - "step": 178460 - }, - { - "epoch": 0.31, - "learning_rate": 3.443848812592208e-05, - "loss": 2.3694, - "step": 178470 - }, - { - "epoch": 0.31, - "learning_rate": 3.443761618599525e-05, - "loss": 2.3659, - "step": 178480 - }, - { - "epoch": 0.31, - "learning_rate": 3.443674424606843e-05, - "loss": 2.3667, - "step": 178490 - }, - { - "epoch": 0.31, - "learning_rate": 3.44358723061416e-05, - "loss": 2.2577, - "step": 178500 - }, - { - "epoch": 0.31, - "learning_rate": 3.443500036621477e-05, - "loss": 2.4335, - "step": 178510 - }, - { - "epoch": 0.31, - "learning_rate": 3.4434128426287945e-05, - "loss": 2.4022, - "step": 178520 - }, - { - "epoch": 0.31, - "learning_rate": 3.4433256486361115e-05, - "loss": 2.4139, - "step": 178530 - }, - { - "epoch": 0.31, - "learning_rate": 3.443238454643429e-05, - "loss": 2.4278, - "step": 178540 - }, - { - "epoch": 0.31, - "learning_rate": 3.443151260650746e-05, - "loss": 2.3724, - "step": 178550 - }, - { - "epoch": 0.31, - "learning_rate": 3.443064066658064e-05, - "loss": 2.2945, - "step": 178560 - }, - { - "epoch": 0.31, - "learning_rate": 3.442976872665381e-05, - "loss": 2.454, - "step": 178570 - }, - { - "epoch": 0.31, - "learning_rate": 3.442889678672698e-05, - "loss": 2.5059, - "step": 178580 - }, - { - "epoch": 0.31, - "learning_rate": 3.442802484680016e-05, - "loss": 2.3414, - "step": 178590 - }, - { - "epoch": 0.31, - "learning_rate": 3.442715290687333e-05, - "loss": 2.3703, - "step": 178600 - }, - { - "epoch": 0.31, - "learning_rate": 3.44262809669465e-05, - "loss": 2.4825, - "step": 178610 - }, - { - "epoch": 0.31, - "learning_rate": 3.4425409027019675e-05, - "loss": 2.3662, - "step": 178620 - }, - { - "epoch": 0.31, - "learning_rate": 3.442453708709285e-05, - "loss": 2.4738, - "step": 178630 - }, - { - "epoch": 0.31, - "learning_rate": 3.442366514716602e-05, - "loss": 2.5802, - "step": 178640 - }, - { - "epoch": 0.31, - "learning_rate": 3.4422793207239193e-05, - "loss": 2.4503, - "step": 178650 - }, - { - "epoch": 0.31, - "learning_rate": 3.442192126731237e-05, - "loss": 2.456, - "step": 178660 - }, - { - "epoch": 0.31, - "learning_rate": 3.442104932738554e-05, - "loss": 2.4155, - "step": 178670 - }, - { - "epoch": 0.31, - "learning_rate": 3.442017738745871e-05, - "loss": 2.2935, - "step": 178680 - }, - { - "epoch": 0.31, - "learning_rate": 3.441930544753189e-05, - "loss": 2.6265, - "step": 178690 - }, - { - "epoch": 0.31, - "learning_rate": 3.4418433507605066e-05, - "loss": 2.4024, - "step": 178700 - }, - { - "epoch": 0.31, - "learning_rate": 3.4417561567678236e-05, - "loss": 2.5004, - "step": 178710 - }, - { - "epoch": 0.31, - "learning_rate": 3.4416689627751406e-05, - "loss": 2.4706, - "step": 178720 - }, - { - "epoch": 0.31, - "learning_rate": 3.4415817687824584e-05, - "loss": 2.3923, - "step": 178730 - }, - { - "epoch": 0.31, - "learning_rate": 3.4414945747897754e-05, - "loss": 2.3466, - "step": 178740 - }, - { - "epoch": 0.31, - "learning_rate": 3.4414073807970924e-05, - "loss": 2.4881, - "step": 178750 - }, - { - "epoch": 0.31, - "learning_rate": 3.44132018680441e-05, - "loss": 2.4288, - "step": 178760 - }, - { - "epoch": 0.31, - "learning_rate": 3.441232992811728e-05, - "loss": 2.3944, - "step": 178770 - }, - { - "epoch": 0.31, - "learning_rate": 3.441145798819045e-05, - "loss": 2.4008, - "step": 178780 - }, - { - "epoch": 0.31, - "learning_rate": 3.441058604826362e-05, - "loss": 2.4794, - "step": 178790 - }, - { - "epoch": 0.31, - "learning_rate": 3.4409714108336797e-05, - "loss": 2.4088, - "step": 178800 - }, - { - "epoch": 0.31, - "learning_rate": 3.440884216840997e-05, - "loss": 2.4659, - "step": 178810 - }, - { - "epoch": 0.31, - "learning_rate": 3.440797022848314e-05, - "loss": 2.5015, - "step": 178820 - }, - { - "epoch": 0.31, - "learning_rate": 3.440709828855631e-05, - "loss": 2.5493, - "step": 178830 - }, - { - "epoch": 0.31, - "learning_rate": 3.440622634862949e-05, - "loss": 2.4204, - "step": 178840 - }, - { - "epoch": 0.31, - "learning_rate": 3.440535440870266e-05, - "loss": 2.4063, - "step": 178850 - }, - { - "epoch": 0.31, - "learning_rate": 3.440448246877583e-05, - "loss": 2.4502, - "step": 178860 - }, - { - "epoch": 0.31, - "learning_rate": 3.440361052884901e-05, - "loss": 2.3614, - "step": 178870 - }, - { - "epoch": 0.31, - "learning_rate": 3.440273858892218e-05, - "loss": 2.4522, - "step": 178880 - }, - { - "epoch": 0.31, - "learning_rate": 3.440186664899535e-05, - "loss": 2.3663, - "step": 178890 - }, - { - "epoch": 0.31, - "learning_rate": 3.440099470906852e-05, - "loss": 2.4305, - "step": 178900 - }, - { - "epoch": 0.31, - "learning_rate": 3.4400122769141705e-05, - "loss": 2.4586, - "step": 178910 - }, - { - "epoch": 0.31, - "learning_rate": 3.4399250829214875e-05, - "loss": 2.3135, - "step": 178920 - }, - { - "epoch": 0.31, - "learning_rate": 3.4398378889288045e-05, - "loss": 2.3065, - "step": 178930 - }, - { - "epoch": 0.31, - "learning_rate": 3.4397506949361216e-05, - "loss": 2.4024, - "step": 178940 - }, - { - "epoch": 0.31, - "learning_rate": 3.439663500943439e-05, - "loss": 2.4086, - "step": 178950 - }, - { - "epoch": 0.31, - "learning_rate": 3.439576306950756e-05, - "loss": 2.3734, - "step": 178960 - }, - { - "epoch": 0.31, - "learning_rate": 3.4394891129580734e-05, - "loss": 2.4569, - "step": 178970 - }, - { - "epoch": 0.31, - "learning_rate": 3.439401918965391e-05, - "loss": 2.3995, - "step": 178980 - }, - { - "epoch": 0.31, - "learning_rate": 3.439314724972709e-05, - "loss": 2.4935, - "step": 178990 - }, - { - "epoch": 0.31, - "learning_rate": 3.439227530980026e-05, - "loss": 2.4557, - "step": 179000 - }, - { - "epoch": 0.31, - "learning_rate": 3.439140336987343e-05, - "loss": 2.5347, - "step": 179010 - }, - { - "epoch": 0.31, - "learning_rate": 3.4390531429946606e-05, - "loss": 2.4366, - "step": 179020 - }, - { - "epoch": 0.31, - "learning_rate": 3.4389659490019776e-05, - "loss": 2.4941, - "step": 179030 - }, - { - "epoch": 0.31, - "learning_rate": 3.438878755009295e-05, - "loss": 2.4503, - "step": 179040 - }, - { - "epoch": 0.31, - "learning_rate": 3.4387915610166124e-05, - "loss": 2.4028, - "step": 179050 - }, - { - "epoch": 0.31, - "learning_rate": 3.43870436702393e-05, - "loss": 2.2831, - "step": 179060 - }, - { - "epoch": 0.31, - "learning_rate": 3.438617173031247e-05, - "loss": 2.4475, - "step": 179070 - }, - { - "epoch": 0.31, - "learning_rate": 3.438529979038564e-05, - "loss": 2.5232, - "step": 179080 - }, - { - "epoch": 0.31, - "learning_rate": 3.438442785045882e-05, - "loss": 2.3864, - "step": 179090 - }, - { - "epoch": 0.31, - "learning_rate": 3.438355591053199e-05, - "loss": 2.434, - "step": 179100 - }, - { - "epoch": 0.31, - "learning_rate": 3.438268397060516e-05, - "loss": 2.4928, - "step": 179110 - }, - { - "epoch": 0.31, - "learning_rate": 3.438181203067834e-05, - "loss": 2.3524, - "step": 179120 - }, - { - "epoch": 0.31, - "learning_rate": 3.438094009075151e-05, - "loss": 2.487, - "step": 179130 - }, - { - "epoch": 0.31, - "learning_rate": 3.4380068150824684e-05, - "loss": 2.5601, - "step": 179140 - }, - { - "epoch": 0.31, - "learning_rate": 3.4379196210897855e-05, - "loss": 2.3997, - "step": 179150 - }, - { - "epoch": 0.31, - "learning_rate": 3.437832427097103e-05, - "loss": 2.5378, - "step": 179160 - }, - { - "epoch": 0.31, - "learning_rate": 3.43774523310442e-05, - "loss": 2.4441, - "step": 179170 - }, - { - "epoch": 0.31, - "learning_rate": 3.437658039111737e-05, - "loss": 2.4585, - "step": 179180 - }, - { - "epoch": 0.31, - "learning_rate": 3.437570845119055e-05, - "loss": 2.5612, - "step": 179190 - }, - { - "epoch": 0.31, - "learning_rate": 3.437483651126372e-05, - "loss": 2.299, - "step": 179200 - }, - { - "epoch": 0.31, - "learning_rate": 3.43739645713369e-05, - "loss": 2.5094, - "step": 179210 - }, - { - "epoch": 0.31, - "learning_rate": 3.437309263141007e-05, - "loss": 2.4593, - "step": 179220 - }, - { - "epoch": 0.31, - "learning_rate": 3.4372220691483245e-05, - "loss": 2.4299, - "step": 179230 - }, - { - "epoch": 0.31, - "learning_rate": 3.4371348751556415e-05, - "loss": 2.4129, - "step": 179240 - }, - { - "epoch": 0.31, - "learning_rate": 3.4370476811629586e-05, - "loss": 2.4272, - "step": 179250 - }, - { - "epoch": 0.31, - "learning_rate": 3.436960487170276e-05, - "loss": 2.4304, - "step": 179260 - }, - { - "epoch": 0.31, - "learning_rate": 3.436873293177593e-05, - "loss": 2.2521, - "step": 179270 - }, - { - "epoch": 0.31, - "learning_rate": 3.4367860991849104e-05, - "loss": 2.3523, - "step": 179280 - }, - { - "epoch": 0.31, - "learning_rate": 3.436698905192228e-05, - "loss": 2.4252, - "step": 179290 - }, - { - "epoch": 0.31, - "learning_rate": 3.436611711199546e-05, - "loss": 2.3935, - "step": 179300 - }, - { - "epoch": 0.31, - "learning_rate": 3.436524517206863e-05, - "loss": 2.4435, - "step": 179310 - }, - { - "epoch": 0.31, - "learning_rate": 3.43643732321418e-05, - "loss": 2.4973, - "step": 179320 - }, - { - "epoch": 0.31, - "learning_rate": 3.436350129221497e-05, - "loss": 2.4781, - "step": 179330 - }, - { - "epoch": 0.31, - "learning_rate": 3.4362629352288146e-05, - "loss": 2.4721, - "step": 179340 - }, - { - "epoch": 0.31, - "learning_rate": 3.436175741236132e-05, - "loss": 2.4268, - "step": 179350 - }, - { - "epoch": 0.31, - "learning_rate": 3.4360885472434494e-05, - "loss": 2.4326, - "step": 179360 - }, - { - "epoch": 0.31, - "learning_rate": 3.436001353250767e-05, - "loss": 2.2353, - "step": 179370 - }, - { - "epoch": 0.31, - "learning_rate": 3.435914159258084e-05, - "loss": 2.4181, - "step": 179380 - }, - { - "epoch": 0.31, - "learning_rate": 3.435826965265401e-05, - "loss": 2.5071, - "step": 179390 - }, - { - "epoch": 0.31, - "learning_rate": 3.435739771272718e-05, - "loss": 2.3592, - "step": 179400 - }, - { - "epoch": 0.31, - "learning_rate": 3.435652577280036e-05, - "loss": 2.3133, - "step": 179410 - }, - { - "epoch": 0.31, - "learning_rate": 3.435565383287353e-05, - "loss": 2.4075, - "step": 179420 - }, - { - "epoch": 0.31, - "learning_rate": 3.43547818929467e-05, - "loss": 2.4953, - "step": 179430 - }, - { - "epoch": 0.31, - "learning_rate": 3.435390995301988e-05, - "loss": 2.5216, - "step": 179440 - }, - { - "epoch": 0.31, - "learning_rate": 3.4353038013093054e-05, - "loss": 2.4226, - "step": 179450 - }, - { - "epoch": 0.31, - "learning_rate": 3.4352166073166225e-05, - "loss": 2.2645, - "step": 179460 - }, - { - "epoch": 0.31, - "learning_rate": 3.4351294133239395e-05, - "loss": 2.4233, - "step": 179470 - }, - { - "epoch": 0.31, - "learning_rate": 3.435042219331257e-05, - "loss": 2.4423, - "step": 179480 - }, - { - "epoch": 0.31, - "learning_rate": 3.434955025338574e-05, - "loss": 2.3901, - "step": 179490 - }, - { - "epoch": 0.31, - "learning_rate": 3.434867831345891e-05, - "loss": 2.5459, - "step": 179500 - }, - { - "epoch": 0.31, - "learning_rate": 3.434780637353209e-05, - "loss": 2.3465, - "step": 179510 - }, - { - "epoch": 0.31, - "learning_rate": 3.434693443360527e-05, - "loss": 2.3793, - "step": 179520 - }, - { - "epoch": 0.31, - "learning_rate": 3.434606249367844e-05, - "loss": 2.4672, - "step": 179530 - }, - { - "epoch": 0.31, - "learning_rate": 3.434519055375161e-05, - "loss": 2.3712, - "step": 179540 - }, - { - "epoch": 0.31, - "learning_rate": 3.4344318613824785e-05, - "loss": 2.5043, - "step": 179550 - }, - { - "epoch": 0.31, - "learning_rate": 3.4343446673897956e-05, - "loss": 2.4581, - "step": 179560 - }, - { - "epoch": 0.31, - "learning_rate": 3.4342574733971126e-05, - "loss": 2.5077, - "step": 179570 - }, - { - "epoch": 0.31, - "learning_rate": 3.43417027940443e-05, - "loss": 2.4286, - "step": 179580 - }, - { - "epoch": 0.31, - "learning_rate": 3.434083085411748e-05, - "loss": 2.4663, - "step": 179590 - }, - { - "epoch": 0.31, - "learning_rate": 3.433995891419065e-05, - "loss": 2.4009, - "step": 179600 - }, - { - "epoch": 0.31, - "learning_rate": 3.433908697426382e-05, - "loss": 2.4186, - "step": 179610 - }, - { - "epoch": 0.31, - "learning_rate": 3.4338215034337e-05, - "loss": 2.4538, - "step": 179620 - }, - { - "epoch": 0.31, - "learning_rate": 3.433734309441017e-05, - "loss": 2.4226, - "step": 179630 - }, - { - "epoch": 0.31, - "learning_rate": 3.433647115448334e-05, - "loss": 2.3881, - "step": 179640 - }, - { - "epoch": 0.31, - "learning_rate": 3.4335599214556516e-05, - "loss": 2.4386, - "step": 179650 - }, - { - "epoch": 0.31, - "learning_rate": 3.433472727462969e-05, - "loss": 2.3684, - "step": 179660 - }, - { - "epoch": 0.31, - "learning_rate": 3.4333855334702864e-05, - "loss": 2.4503, - "step": 179670 - }, - { - "epoch": 0.31, - "learning_rate": 3.4332983394776034e-05, - "loss": 2.4649, - "step": 179680 - }, - { - "epoch": 0.31, - "learning_rate": 3.433211145484921e-05, - "loss": 2.2999, - "step": 179690 - }, - { - "epoch": 0.31, - "learning_rate": 3.433123951492238e-05, - "loss": 2.3706, - "step": 179700 - }, - { - "epoch": 0.31, - "learning_rate": 3.433036757499555e-05, - "loss": 2.4586, - "step": 179710 - }, - { - "epoch": 0.31, - "learning_rate": 3.432949563506873e-05, - "loss": 2.4798, - "step": 179720 - }, - { - "epoch": 0.31, - "learning_rate": 3.4328623695141906e-05, - "loss": 2.449, - "step": 179730 - }, - { - "epoch": 0.31, - "learning_rate": 3.432775175521508e-05, - "loss": 2.4438, - "step": 179740 - }, - { - "epoch": 0.31, - "learning_rate": 3.432687981528825e-05, - "loss": 2.4743, - "step": 179750 - }, - { - "epoch": 0.31, - "learning_rate": 3.4326007875361424e-05, - "loss": 2.5212, - "step": 179760 - }, - { - "epoch": 0.31, - "learning_rate": 3.4325135935434595e-05, - "loss": 2.3916, - "step": 179770 - }, - { - "epoch": 0.31, - "learning_rate": 3.4324263995507765e-05, - "loss": 2.4617, - "step": 179780 - }, - { - "epoch": 0.31, - "learning_rate": 3.4323392055580935e-05, - "loss": 2.4928, - "step": 179790 - }, - { - "epoch": 0.31, - "learning_rate": 3.432252011565411e-05, - "loss": 2.4724, - "step": 179800 - }, - { - "epoch": 0.31, - "learning_rate": 3.432164817572729e-05, - "loss": 2.5039, - "step": 179810 - }, - { - "epoch": 0.31, - "learning_rate": 3.432077623580046e-05, - "loss": 2.4206, - "step": 179820 - }, - { - "epoch": 0.31, - "learning_rate": 3.431990429587364e-05, - "loss": 2.4838, - "step": 179830 - }, - { - "epoch": 0.31, - "learning_rate": 3.431903235594681e-05, - "loss": 2.4254, - "step": 179840 - }, - { - "epoch": 0.31, - "learning_rate": 3.431816041601998e-05, - "loss": 2.519, - "step": 179850 - }, - { - "epoch": 0.31, - "learning_rate": 3.431728847609315e-05, - "loss": 2.427, - "step": 179860 - }, - { - "epoch": 0.31, - "learning_rate": 3.4316416536166326e-05, - "loss": 2.5143, - "step": 179870 - }, - { - "epoch": 0.31, - "learning_rate": 3.43155445962395e-05, - "loss": 2.5267, - "step": 179880 - }, - { - "epoch": 0.31, - "learning_rate": 3.431467265631267e-05, - "loss": 2.4347, - "step": 179890 - }, - { - "epoch": 0.31, - "learning_rate": 3.4313800716385843e-05, - "loss": 2.4461, - "step": 179900 - }, - { - "epoch": 0.31, - "learning_rate": 3.431292877645902e-05, - "loss": 2.3454, - "step": 179910 - }, - { - "epoch": 0.31, - "learning_rate": 3.431205683653219e-05, - "loss": 2.4606, - "step": 179920 - }, - { - "epoch": 0.31, - "learning_rate": 3.431118489660536e-05, - "loss": 2.4903, - "step": 179930 - }, - { - "epoch": 0.31, - "learning_rate": 3.431031295667854e-05, - "loss": 2.4503, - "step": 179940 - }, - { - "epoch": 0.31, - "learning_rate": 3.430944101675171e-05, - "loss": 2.4668, - "step": 179950 - }, - { - "epoch": 0.31, - "learning_rate": 3.4308569076824886e-05, - "loss": 2.4788, - "step": 179960 - }, - { - "epoch": 0.31, - "learning_rate": 3.4307697136898056e-05, - "loss": 2.4052, - "step": 179970 - }, - { - "epoch": 0.31, - "learning_rate": 3.4306825196971234e-05, - "loss": 2.356, - "step": 179980 - }, - { - "epoch": 0.31, - "learning_rate": 3.4305953257044404e-05, - "loss": 2.3503, - "step": 179990 - }, - { - "epoch": 0.31, - "learning_rate": 3.4305081317117574e-05, - "loss": 2.4196, - "step": 180000 - }, - { - "epoch": 0.31, - "learning_rate": 3.430420937719075e-05, - "loss": 2.3143, - "step": 180010 - }, - { - "epoch": 0.31, - "learning_rate": 3.430333743726392e-05, - "loss": 2.353, - "step": 180020 - }, - { - "epoch": 0.31, - "learning_rate": 3.43024654973371e-05, - "loss": 2.4456, - "step": 180030 - }, - { - "epoch": 0.31, - "learning_rate": 3.430159355741027e-05, - "loss": 2.4303, - "step": 180040 - }, - { - "epoch": 0.31, - "learning_rate": 3.430072161748345e-05, - "loss": 2.3267, - "step": 180050 - }, - { - "epoch": 0.31, - "learning_rate": 3.429984967755662e-05, - "loss": 2.3519, - "step": 180060 - }, - { - "epoch": 0.31, - "learning_rate": 3.429897773762979e-05, - "loss": 2.4951, - "step": 180070 - }, - { - "epoch": 0.31, - "learning_rate": 3.4298105797702965e-05, - "loss": 2.5871, - "step": 180080 - }, - { - "epoch": 0.31, - "learning_rate": 3.4297233857776135e-05, - "loss": 2.4403, - "step": 180090 - }, - { - "epoch": 0.31, - "learning_rate": 3.4296361917849305e-05, - "loss": 2.4444, - "step": 180100 - }, - { - "epoch": 0.31, - "learning_rate": 3.429548997792248e-05, - "loss": 2.4355, - "step": 180110 - }, - { - "epoch": 0.31, - "learning_rate": 3.429461803799566e-05, - "loss": 2.4301, - "step": 180120 - }, - { - "epoch": 0.31, - "learning_rate": 3.429374609806883e-05, - "loss": 2.4532, - "step": 180130 - }, - { - "epoch": 0.31, - "learning_rate": 3.4292874158142e-05, - "loss": 2.3771, - "step": 180140 - }, - { - "epoch": 0.31, - "learning_rate": 3.429200221821518e-05, - "loss": 2.45, - "step": 180150 - }, - { - "epoch": 0.31, - "learning_rate": 3.429113027828835e-05, - "loss": 2.3684, - "step": 180160 - }, - { - "epoch": 0.31, - "learning_rate": 3.429025833836152e-05, - "loss": 2.4955, - "step": 180170 - }, - { - "epoch": 0.31, - "learning_rate": 3.4289386398434695e-05, - "loss": 2.5002, - "step": 180180 - }, - { - "epoch": 0.31, - "learning_rate": 3.428851445850787e-05, - "loss": 2.4987, - "step": 180190 - }, - { - "epoch": 0.31, - "learning_rate": 3.428764251858104e-05, - "loss": 2.4202, - "step": 180200 - }, - { - "epoch": 0.31, - "learning_rate": 3.4286770578654213e-05, - "loss": 2.3966, - "step": 180210 - }, - { - "epoch": 0.31, - "learning_rate": 3.428589863872739e-05, - "loss": 2.4858, - "step": 180220 - }, - { - "epoch": 0.31, - "learning_rate": 3.428502669880056e-05, - "loss": 2.398, - "step": 180230 - }, - { - "epoch": 0.31, - "learning_rate": 3.428415475887373e-05, - "loss": 2.3928, - "step": 180240 - }, - { - "epoch": 0.31, - "learning_rate": 3.428328281894691e-05, - "loss": 2.3756, - "step": 180250 - }, - { - "epoch": 0.31, - "learning_rate": 3.4282410879020086e-05, - "loss": 2.3851, - "step": 180260 - }, - { - "epoch": 0.31, - "learning_rate": 3.4281538939093256e-05, - "loss": 2.369, - "step": 180270 - }, - { - "epoch": 0.31, - "learning_rate": 3.4280666999166426e-05, - "loss": 2.4055, - "step": 180280 - }, - { - "epoch": 0.31, - "learning_rate": 3.42797950592396e-05, - "loss": 2.4631, - "step": 180290 - }, - { - "epoch": 0.31, - "learning_rate": 3.4278923119312774e-05, - "loss": 2.4653, - "step": 180300 - }, - { - "epoch": 0.31, - "learning_rate": 3.4278051179385944e-05, - "loss": 2.5684, - "step": 180310 - }, - { - "epoch": 0.31, - "learning_rate": 3.4277179239459115e-05, - "loss": 2.3773, - "step": 180320 - }, - { - "epoch": 0.31, - "learning_rate": 3.42763072995323e-05, - "loss": 2.5222, - "step": 180330 - }, - { - "epoch": 0.31, - "learning_rate": 3.427543535960547e-05, - "loss": 2.4235, - "step": 180340 - }, - { - "epoch": 0.31, - "learning_rate": 3.427456341967864e-05, - "loss": 2.4613, - "step": 180350 - }, - { - "epoch": 0.31, - "learning_rate": 3.427369147975181e-05, - "loss": 2.4426, - "step": 180360 - }, - { - "epoch": 0.31, - "learning_rate": 3.427281953982499e-05, - "loss": 2.4763, - "step": 180370 - }, - { - "epoch": 0.31, - "learning_rate": 3.427194759989816e-05, - "loss": 2.3751, - "step": 180380 - }, - { - "epoch": 0.31, - "learning_rate": 3.427107565997133e-05, - "loss": 2.465, - "step": 180390 - }, - { - "epoch": 0.31, - "learning_rate": 3.4270203720044505e-05, - "loss": 2.4713, - "step": 180400 - }, - { - "epoch": 0.31, - "learning_rate": 3.426933178011768e-05, - "loss": 2.4146, - "step": 180410 - }, - { - "epoch": 0.31, - "learning_rate": 3.426845984019085e-05, - "loss": 2.4029, - "step": 180420 - }, - { - "epoch": 0.31, - "learning_rate": 3.426758790026402e-05, - "loss": 2.4912, - "step": 180430 - }, - { - "epoch": 0.31, - "learning_rate": 3.42667159603372e-05, - "loss": 2.4811, - "step": 180440 - }, - { - "epoch": 0.31, - "learning_rate": 3.426584402041037e-05, - "loss": 2.4035, - "step": 180450 - }, - { - "epoch": 0.31, - "learning_rate": 3.426497208048354e-05, - "loss": 2.5189, - "step": 180460 - }, - { - "epoch": 0.31, - "learning_rate": 3.426410014055672e-05, - "loss": 2.4069, - "step": 180470 - }, - { - "epoch": 0.31, - "learning_rate": 3.4263228200629895e-05, - "loss": 2.3242, - "step": 180480 - }, - { - "epoch": 0.31, - "learning_rate": 3.4262356260703065e-05, - "loss": 2.4078, - "step": 180490 - }, - { - "epoch": 0.31, - "learning_rate": 3.4261484320776236e-05, - "loss": 2.3777, - "step": 180500 - }, - { - "epoch": 0.31, - "learning_rate": 3.426061238084941e-05, - "loss": 2.3783, - "step": 180510 - }, - { - "epoch": 0.31, - "learning_rate": 3.425974044092258e-05, - "loss": 2.4492, - "step": 180520 - }, - { - "epoch": 0.31, - "learning_rate": 3.4258868500995754e-05, - "loss": 2.451, - "step": 180530 - }, - { - "epoch": 0.31, - "learning_rate": 3.425799656106893e-05, - "loss": 2.4429, - "step": 180540 - }, - { - "epoch": 0.31, - "learning_rate": 3.425712462114211e-05, - "loss": 2.4083, - "step": 180550 - }, - { - "epoch": 0.31, - "learning_rate": 3.425625268121528e-05, - "loss": 2.501, - "step": 180560 - }, - { - "epoch": 0.31, - "learning_rate": 3.425538074128845e-05, - "loss": 2.4761, - "step": 180570 - }, - { - "epoch": 0.31, - "learning_rate": 3.4254508801361626e-05, - "loss": 2.4314, - "step": 180580 - }, - { - "epoch": 0.31, - "learning_rate": 3.4253636861434796e-05, - "loss": 2.4772, - "step": 180590 - }, - { - "epoch": 0.31, - "learning_rate": 3.425276492150797e-05, - "loss": 2.4462, - "step": 180600 - }, - { - "epoch": 0.31, - "learning_rate": 3.4251892981581144e-05, - "loss": 2.4165, - "step": 180610 - }, - { - "epoch": 0.31, - "learning_rate": 3.4251021041654314e-05, - "loss": 2.4258, - "step": 180620 - }, - { - "epoch": 0.31, - "learning_rate": 3.425014910172749e-05, - "loss": 2.5166, - "step": 180630 - }, - { - "epoch": 0.32, - "learning_rate": 3.424927716180066e-05, - "loss": 2.4217, - "step": 180640 - }, - { - "epoch": 0.32, - "learning_rate": 3.424840522187384e-05, - "loss": 2.4961, - "step": 180650 - }, - { - "epoch": 0.32, - "learning_rate": 3.424753328194701e-05, - "loss": 2.4082, - "step": 180660 - }, - { - "epoch": 0.32, - "learning_rate": 3.424666134202018e-05, - "loss": 2.4226, - "step": 180670 - }, - { - "epoch": 0.32, - "learning_rate": 3.424578940209335e-05, - "loss": 2.4301, - "step": 180680 - }, - { - "epoch": 0.32, - "learning_rate": 3.424491746216653e-05, - "loss": 2.2655, - "step": 180690 - }, - { - "epoch": 0.32, - "learning_rate": 3.4244045522239704e-05, - "loss": 2.4105, - "step": 180700 - }, - { - "epoch": 0.32, - "learning_rate": 3.4243173582312875e-05, - "loss": 2.4332, - "step": 180710 - }, - { - "epoch": 0.32, - "learning_rate": 3.424230164238605e-05, - "loss": 2.3709, - "step": 180720 - }, - { - "epoch": 0.32, - "learning_rate": 3.424142970245922e-05, - "loss": 2.3866, - "step": 180730 - }, - { - "epoch": 0.32, - "learning_rate": 3.424055776253239e-05, - "loss": 2.3909, - "step": 180740 - }, - { - "epoch": 0.32, - "learning_rate": 3.423968582260556e-05, - "loss": 2.4965, - "step": 180750 - }, - { - "epoch": 0.32, - "learning_rate": 3.423881388267874e-05, - "loss": 2.4613, - "step": 180760 - }, - { - "epoch": 0.32, - "learning_rate": 3.423794194275192e-05, - "loss": 2.4647, - "step": 180770 - }, - { - "epoch": 0.32, - "learning_rate": 3.423707000282509e-05, - "loss": 2.3249, - "step": 180780 - }, - { - "epoch": 0.32, - "learning_rate": 3.423619806289826e-05, - "loss": 2.4496, - "step": 180790 - }, - { - "epoch": 0.32, - "learning_rate": 3.4235326122971435e-05, - "loss": 2.372, - "step": 180800 - }, - { - "epoch": 0.32, - "learning_rate": 3.4234454183044606e-05, - "loss": 2.4142, - "step": 180810 - }, - { - "epoch": 0.32, - "learning_rate": 3.4233582243117776e-05, - "loss": 2.39, - "step": 180820 - }, - { - "epoch": 0.32, - "learning_rate": 3.423271030319095e-05, - "loss": 2.4712, - "step": 180830 - }, - { - "epoch": 0.32, - "learning_rate": 3.4231838363264124e-05, - "loss": 2.5297, - "step": 180840 - }, - { - "epoch": 0.32, - "learning_rate": 3.42309664233373e-05, - "loss": 2.4817, - "step": 180850 - }, - { - "epoch": 0.32, - "learning_rate": 3.423009448341047e-05, - "loss": 2.4643, - "step": 180860 - }, - { - "epoch": 0.32, - "learning_rate": 3.422922254348365e-05, - "loss": 2.431, - "step": 180870 - }, - { - "epoch": 0.32, - "learning_rate": 3.422835060355682e-05, - "loss": 2.4053, - "step": 180880 - }, - { - "epoch": 0.32, - "learning_rate": 3.422747866362999e-05, - "loss": 2.3776, - "step": 180890 - }, - { - "epoch": 0.32, - "learning_rate": 3.4226606723703166e-05, - "loss": 2.3682, - "step": 180900 - }, - { - "epoch": 0.32, - "learning_rate": 3.422573478377634e-05, - "loss": 2.4754, - "step": 180910 - }, - { - "epoch": 0.32, - "learning_rate": 3.4224862843849514e-05, - "loss": 2.4852, - "step": 180920 - }, - { - "epoch": 0.32, - "learning_rate": 3.4223990903922684e-05, - "loss": 2.5134, - "step": 180930 - }, - { - "epoch": 0.32, - "learning_rate": 3.422311896399586e-05, - "loss": 2.4635, - "step": 180940 - }, - { - "epoch": 0.32, - "learning_rate": 3.422224702406903e-05, - "loss": 2.4091, - "step": 180950 - }, - { - "epoch": 0.32, - "learning_rate": 3.42213750841422e-05, - "loss": 2.4948, - "step": 180960 - }, - { - "epoch": 0.32, - "learning_rate": 3.422050314421538e-05, - "loss": 2.3231, - "step": 180970 - }, - { - "epoch": 0.32, - "learning_rate": 3.421963120428855e-05, - "loss": 2.3084, - "step": 180980 - }, - { - "epoch": 0.32, - "learning_rate": 3.421875926436172e-05, - "loss": 2.4786, - "step": 180990 - }, - { - "epoch": 0.32, - "learning_rate": 3.42178873244349e-05, - "loss": 2.4062, - "step": 181000 - }, - { - "epoch": 0.32, - "learning_rate": 3.4217015384508074e-05, - "loss": 2.4519, - "step": 181010 - }, - { - "epoch": 0.32, - "learning_rate": 3.4216143444581245e-05, - "loss": 2.5184, - "step": 181020 - }, - { - "epoch": 0.32, - "learning_rate": 3.4215271504654415e-05, - "loss": 2.4035, - "step": 181030 - }, - { - "epoch": 0.32, - "learning_rate": 3.421439956472759e-05, - "loss": 2.4537, - "step": 181040 - }, - { - "epoch": 0.32, - "learning_rate": 3.421352762480076e-05, - "loss": 2.2689, - "step": 181050 - }, - { - "epoch": 0.32, - "learning_rate": 3.421265568487393e-05, - "loss": 2.4714, - "step": 181060 - }, - { - "epoch": 0.32, - "learning_rate": 3.421178374494711e-05, - "loss": 2.3761, - "step": 181070 - }, - { - "epoch": 0.32, - "learning_rate": 3.421091180502029e-05, - "loss": 2.3689, - "step": 181080 - }, - { - "epoch": 0.32, - "learning_rate": 3.421003986509346e-05, - "loss": 2.3878, - "step": 181090 - }, - { - "epoch": 0.32, - "learning_rate": 3.420916792516663e-05, - "loss": 2.4994, - "step": 181100 - }, - { - "epoch": 0.32, - "learning_rate": 3.4208295985239805e-05, - "loss": 2.5007, - "step": 181110 - }, - { - "epoch": 0.32, - "learning_rate": 3.4207424045312976e-05, - "loss": 2.5461, - "step": 181120 - }, - { - "epoch": 0.32, - "learning_rate": 3.4206552105386146e-05, - "loss": 2.3568, - "step": 181130 - }, - { - "epoch": 0.32, - "learning_rate": 3.4205680165459316e-05, - "loss": 2.3864, - "step": 181140 - }, - { - "epoch": 0.32, - "learning_rate": 3.42048082255325e-05, - "loss": 2.4071, - "step": 181150 - }, - { - "epoch": 0.32, - "learning_rate": 3.420393628560567e-05, - "loss": 2.4504, - "step": 181160 - }, - { - "epoch": 0.32, - "learning_rate": 3.420306434567884e-05, - "loss": 2.5011, - "step": 181170 - }, - { - "epoch": 0.32, - "learning_rate": 3.420219240575202e-05, - "loss": 2.4765, - "step": 181180 - }, - { - "epoch": 0.32, - "learning_rate": 3.420132046582519e-05, - "loss": 2.4942, - "step": 181190 - }, - { - "epoch": 0.32, - "learning_rate": 3.420044852589836e-05, - "loss": 2.4376, - "step": 181200 - }, - { - "epoch": 0.32, - "learning_rate": 3.419957658597153e-05, - "loss": 2.5374, - "step": 181210 - }, - { - "epoch": 0.32, - "learning_rate": 3.419870464604471e-05, - "loss": 2.4343, - "step": 181220 - }, - { - "epoch": 0.32, - "learning_rate": 3.4197832706117884e-05, - "loss": 2.4572, - "step": 181230 - }, - { - "epoch": 0.32, - "learning_rate": 3.4196960766191054e-05, - "loss": 2.4438, - "step": 181240 - }, - { - "epoch": 0.32, - "learning_rate": 3.4196088826264224e-05, - "loss": 2.4942, - "step": 181250 - }, - { - "epoch": 0.32, - "learning_rate": 3.41952168863374e-05, - "loss": 2.447, - "step": 181260 - }, - { - "epoch": 0.32, - "learning_rate": 3.419434494641057e-05, - "loss": 2.5612, - "step": 181270 - }, - { - "epoch": 0.32, - "learning_rate": 3.419347300648374e-05, - "loss": 2.3861, - "step": 181280 - }, - { - "epoch": 0.32, - "learning_rate": 3.419260106655692e-05, - "loss": 2.3341, - "step": 181290 - }, - { - "epoch": 0.32, - "learning_rate": 3.41917291266301e-05, - "loss": 2.4521, - "step": 181300 - }, - { - "epoch": 0.32, - "learning_rate": 3.419085718670327e-05, - "loss": 2.4088, - "step": 181310 - }, - { - "epoch": 0.32, - "learning_rate": 3.418998524677644e-05, - "loss": 2.4004, - "step": 181320 - }, - { - "epoch": 0.32, - "learning_rate": 3.4189113306849615e-05, - "loss": 2.542, - "step": 181330 - }, - { - "epoch": 0.32, - "learning_rate": 3.4188241366922785e-05, - "loss": 2.412, - "step": 181340 - }, - { - "epoch": 0.32, - "learning_rate": 3.4187369426995955e-05, - "loss": 2.468, - "step": 181350 - }, - { - "epoch": 0.32, - "learning_rate": 3.418649748706913e-05, - "loss": 2.3443, - "step": 181360 - }, - { - "epoch": 0.32, - "learning_rate": 3.418562554714231e-05, - "loss": 2.4158, - "step": 181370 - }, - { - "epoch": 0.32, - "learning_rate": 3.418475360721548e-05, - "loss": 2.4017, - "step": 181380 - }, - { - "epoch": 0.32, - "learning_rate": 3.418388166728865e-05, - "loss": 2.3, - "step": 181390 - }, - { - "epoch": 0.32, - "learning_rate": 3.418300972736183e-05, - "loss": 2.5037, - "step": 181400 - }, - { - "epoch": 0.32, - "learning_rate": 3.4182137787435e-05, - "loss": 2.5087, - "step": 181410 - }, - { - "epoch": 0.32, - "learning_rate": 3.418126584750817e-05, - "loss": 2.3, - "step": 181420 - }, - { - "epoch": 0.32, - "learning_rate": 3.4180393907581346e-05, - "loss": 2.3831, - "step": 181430 - }, - { - "epoch": 0.32, - "learning_rate": 3.417952196765452e-05, - "loss": 2.3476, - "step": 181440 - }, - { - "epoch": 0.32, - "learning_rate": 3.417865002772769e-05, - "loss": 2.3569, - "step": 181450 - }, - { - "epoch": 0.32, - "learning_rate": 3.4177778087800863e-05, - "loss": 2.452, - "step": 181460 - }, - { - "epoch": 0.32, - "learning_rate": 3.417690614787404e-05, - "loss": 2.4119, - "step": 181470 - }, - { - "epoch": 0.32, - "learning_rate": 3.417603420794721e-05, - "loss": 2.5435, - "step": 181480 - }, - { - "epoch": 0.32, - "learning_rate": 3.417516226802038e-05, - "loss": 2.3641, - "step": 181490 - }, - { - "epoch": 0.32, - "learning_rate": 3.417429032809356e-05, - "loss": 2.4316, - "step": 181500 - }, - { - "epoch": 0.32, - "learning_rate": 3.417341838816673e-05, - "loss": 2.5153, - "step": 181510 - }, - { - "epoch": 0.32, - "learning_rate": 3.4172546448239906e-05, - "loss": 2.4728, - "step": 181520 - }, - { - "epoch": 0.32, - "learning_rate": 3.4171674508313076e-05, - "loss": 2.5123, - "step": 181530 - }, - { - "epoch": 0.32, - "learning_rate": 3.4170802568386254e-05, - "loss": 2.3965, - "step": 181540 - }, - { - "epoch": 0.32, - "learning_rate": 3.4169930628459424e-05, - "loss": 2.4831, - "step": 181550 - }, - { - "epoch": 0.32, - "learning_rate": 3.4169058688532594e-05, - "loss": 2.359, - "step": 181560 - }, - { - "epoch": 0.32, - "learning_rate": 3.416818674860577e-05, - "loss": 2.3825, - "step": 181570 - }, - { - "epoch": 0.32, - "learning_rate": 3.416731480867894e-05, - "loss": 2.4399, - "step": 181580 - }, - { - "epoch": 0.32, - "learning_rate": 3.416644286875212e-05, - "loss": 2.4042, - "step": 181590 - }, - { - "epoch": 0.32, - "learning_rate": 3.416557092882529e-05, - "loss": 2.3958, - "step": 181600 - }, - { - "epoch": 0.32, - "learning_rate": 3.416469898889847e-05, - "loss": 2.4216, - "step": 181610 - }, - { - "epoch": 0.32, - "learning_rate": 3.416382704897164e-05, - "loss": 2.4657, - "step": 181620 - }, - { - "epoch": 0.32, - "learning_rate": 3.416295510904481e-05, - "loss": 2.3353, - "step": 181630 - }, - { - "epoch": 0.32, - "learning_rate": 3.416208316911798e-05, - "loss": 2.4629, - "step": 181640 - }, - { - "epoch": 0.32, - "learning_rate": 3.4161211229191155e-05, - "loss": 2.3279, - "step": 181650 - }, - { - "epoch": 0.32, - "learning_rate": 3.4160339289264325e-05, - "loss": 2.4812, - "step": 181660 - }, - { - "epoch": 0.32, - "learning_rate": 3.41594673493375e-05, - "loss": 2.4956, - "step": 181670 - }, - { - "epoch": 0.32, - "learning_rate": 3.415859540941068e-05, - "loss": 2.4382, - "step": 181680 - }, - { - "epoch": 0.32, - "learning_rate": 3.415772346948385e-05, - "loss": 2.298, - "step": 181690 - }, - { - "epoch": 0.32, - "learning_rate": 3.415685152955702e-05, - "loss": 2.5166, - "step": 181700 - }, - { - "epoch": 0.32, - "learning_rate": 3.415597958963019e-05, - "loss": 2.5194, - "step": 181710 - }, - { - "epoch": 0.32, - "learning_rate": 3.415510764970337e-05, - "loss": 2.581, - "step": 181720 - }, - { - "epoch": 0.32, - "learning_rate": 3.415423570977654e-05, - "loss": 2.3805, - "step": 181730 - }, - { - "epoch": 0.32, - "learning_rate": 3.4153363769849716e-05, - "loss": 2.4392, - "step": 181740 - }, - { - "epoch": 0.32, - "learning_rate": 3.4152491829922886e-05, - "loss": 2.3789, - "step": 181750 - }, - { - "epoch": 0.32, - "learning_rate": 3.415161988999606e-05, - "loss": 2.482, - "step": 181760 - }, - { - "epoch": 0.32, - "learning_rate": 3.4150747950069233e-05, - "loss": 2.4247, - "step": 181770 - }, - { - "epoch": 0.32, - "learning_rate": 3.4149876010142404e-05, - "loss": 2.3953, - "step": 181780 - }, - { - "epoch": 0.32, - "learning_rate": 3.414900407021558e-05, - "loss": 2.4089, - "step": 181790 - }, - { - "epoch": 0.32, - "learning_rate": 3.414813213028875e-05, - "loss": 2.4754, - "step": 181800 - }, - { - "epoch": 0.32, - "learning_rate": 3.414726019036192e-05, - "loss": 2.4614, - "step": 181810 - }, - { - "epoch": 0.32, - "learning_rate": 3.41463882504351e-05, - "loss": 2.459, - "step": 181820 - }, - { - "epoch": 0.32, - "learning_rate": 3.4145516310508276e-05, - "loss": 2.4191, - "step": 181830 - }, - { - "epoch": 0.32, - "learning_rate": 3.4144644370581446e-05, - "loss": 2.4465, - "step": 181840 - }, - { - "epoch": 0.32, - "learning_rate": 3.414377243065462e-05, - "loss": 2.4783, - "step": 181850 - }, - { - "epoch": 0.32, - "learning_rate": 3.4142900490727794e-05, - "loss": 2.486, - "step": 181860 - }, - { - "epoch": 0.32, - "learning_rate": 3.4142028550800964e-05, - "loss": 2.4283, - "step": 181870 - }, - { - "epoch": 0.32, - "learning_rate": 3.4141156610874135e-05, - "loss": 2.4732, - "step": 181880 - }, - { - "epoch": 0.32, - "learning_rate": 3.414028467094731e-05, - "loss": 2.4253, - "step": 181890 - }, - { - "epoch": 0.32, - "learning_rate": 3.413941273102049e-05, - "loss": 2.399, - "step": 181900 - }, - { - "epoch": 0.32, - "learning_rate": 3.413854079109366e-05, - "loss": 2.451, - "step": 181910 - }, - { - "epoch": 0.32, - "learning_rate": 3.413766885116683e-05, - "loss": 2.4329, - "step": 181920 - }, - { - "epoch": 0.32, - "learning_rate": 3.413679691124001e-05, - "loss": 2.4963, - "step": 181930 - }, - { - "epoch": 0.32, - "learning_rate": 3.413592497131318e-05, - "loss": 2.4945, - "step": 181940 - }, - { - "epoch": 0.32, - "learning_rate": 3.413505303138635e-05, - "loss": 2.519, - "step": 181950 - }, - { - "epoch": 0.32, - "learning_rate": 3.4134181091459525e-05, - "loss": 2.4347, - "step": 181960 - }, - { - "epoch": 0.32, - "learning_rate": 3.41333091515327e-05, - "loss": 2.3356, - "step": 181970 - }, - { - "epoch": 0.32, - "learning_rate": 3.413243721160587e-05, - "loss": 2.4907, - "step": 181980 - }, - { - "epoch": 0.32, - "learning_rate": 3.413156527167904e-05, - "loss": 2.4549, - "step": 181990 - }, - { - "epoch": 0.32, - "learning_rate": 3.413069333175222e-05, - "loss": 2.4624, - "step": 182000 - }, - { - "epoch": 0.32, - "learning_rate": 3.412982139182539e-05, - "loss": 2.4196, - "step": 182010 - }, - { - "epoch": 0.32, - "learning_rate": 3.412894945189856e-05, - "loss": 2.4266, - "step": 182020 - }, - { - "epoch": 0.32, - "learning_rate": 3.412807751197173e-05, - "loss": 2.4986, - "step": 182030 - }, - { - "epoch": 0.32, - "learning_rate": 3.4127205572044915e-05, - "loss": 2.3633, - "step": 182040 - }, - { - "epoch": 0.32, - "learning_rate": 3.4126333632118085e-05, - "loss": 2.4452, - "step": 182050 - }, - { - "epoch": 0.32, - "learning_rate": 3.4125461692191256e-05, - "loss": 2.4495, - "step": 182060 - }, - { - "epoch": 0.32, - "learning_rate": 3.412458975226443e-05, - "loss": 2.4336, - "step": 182070 - }, - { - "epoch": 0.32, - "learning_rate": 3.41237178123376e-05, - "loss": 2.4442, - "step": 182080 - }, - { - "epoch": 0.32, - "learning_rate": 3.4122845872410774e-05, - "loss": 2.4023, - "step": 182090 - }, - { - "epoch": 0.32, - "learning_rate": 3.4121973932483944e-05, - "loss": 2.4229, - "step": 182100 - }, - { - "epoch": 0.32, - "learning_rate": 3.412110199255713e-05, - "loss": 2.4753, - "step": 182110 - }, - { - "epoch": 0.32, - "learning_rate": 3.41202300526303e-05, - "loss": 2.4098, - "step": 182120 - }, - { - "epoch": 0.32, - "learning_rate": 3.411935811270347e-05, - "loss": 2.49, - "step": 182130 - }, - { - "epoch": 0.32, - "learning_rate": 3.411848617277664e-05, - "loss": 2.434, - "step": 182140 - }, - { - "epoch": 0.32, - "learning_rate": 3.4117614232849816e-05, - "loss": 2.4354, - "step": 182150 - }, - { - "epoch": 0.32, - "learning_rate": 3.411674229292299e-05, - "loss": 2.4192, - "step": 182160 - }, - { - "epoch": 0.32, - "learning_rate": 3.411587035299616e-05, - "loss": 2.4653, - "step": 182170 - }, - { - "epoch": 0.32, - "learning_rate": 3.4114998413069334e-05, - "loss": 2.3946, - "step": 182180 - }, - { - "epoch": 0.32, - "learning_rate": 3.411412647314251e-05, - "loss": 2.3488, - "step": 182190 - }, - { - "epoch": 0.32, - "learning_rate": 3.411325453321568e-05, - "loss": 2.4951, - "step": 182200 - }, - { - "epoch": 0.32, - "learning_rate": 3.411238259328885e-05, - "loss": 2.4846, - "step": 182210 - }, - { - "epoch": 0.32, - "learning_rate": 3.411151065336203e-05, - "loss": 2.5127, - "step": 182220 - }, - { - "epoch": 0.32, - "learning_rate": 3.41106387134352e-05, - "loss": 2.3252, - "step": 182230 - }, - { - "epoch": 0.32, - "learning_rate": 3.410976677350837e-05, - "loss": 2.49, - "step": 182240 - }, - { - "epoch": 0.32, - "learning_rate": 3.410889483358155e-05, - "loss": 2.5279, - "step": 182250 - }, - { - "epoch": 0.32, - "learning_rate": 3.4108022893654724e-05, - "loss": 2.4182, - "step": 182260 - }, - { - "epoch": 0.32, - "learning_rate": 3.4107150953727895e-05, - "loss": 2.4989, - "step": 182270 - }, - { - "epoch": 0.32, - "learning_rate": 3.4106279013801065e-05, - "loss": 2.416, - "step": 182280 - }, - { - "epoch": 0.32, - "learning_rate": 3.410540707387424e-05, - "loss": 2.4919, - "step": 182290 - }, - { - "epoch": 0.32, - "learning_rate": 3.410453513394741e-05, - "loss": 2.5124, - "step": 182300 - }, - { - "epoch": 0.32, - "learning_rate": 3.410366319402058e-05, - "loss": 2.555, - "step": 182310 - }, - { - "epoch": 0.32, - "learning_rate": 3.410279125409376e-05, - "loss": 2.4974, - "step": 182320 - }, - { - "epoch": 0.32, - "learning_rate": 3.410191931416693e-05, - "loss": 2.3959, - "step": 182330 - }, - { - "epoch": 0.32, - "learning_rate": 3.410104737424011e-05, - "loss": 2.5149, - "step": 182340 - }, - { - "epoch": 0.32, - "learning_rate": 3.410017543431328e-05, - "loss": 2.4596, - "step": 182350 - }, - { - "epoch": 0.32, - "learning_rate": 3.4099303494386455e-05, - "loss": 2.5419, - "step": 182360 - }, - { - "epoch": 0.32, - "learning_rate": 3.4098431554459626e-05, - "loss": 2.4918, - "step": 182370 - }, - { - "epoch": 0.32, - "learning_rate": 3.4097559614532796e-05, - "loss": 2.3558, - "step": 182380 - }, - { - "epoch": 0.32, - "learning_rate": 3.409668767460597e-05, - "loss": 2.5143, - "step": 182390 - }, - { - "epoch": 0.32, - "learning_rate": 3.4095815734679144e-05, - "loss": 2.4736, - "step": 182400 - }, - { - "epoch": 0.32, - "learning_rate": 3.409494379475232e-05, - "loss": 2.3672, - "step": 182410 - }, - { - "epoch": 0.32, - "learning_rate": 3.409407185482549e-05, - "loss": 2.5061, - "step": 182420 - }, - { - "epoch": 0.32, - "learning_rate": 3.409319991489867e-05, - "loss": 2.6046, - "step": 182430 - }, - { - "epoch": 0.32, - "learning_rate": 3.409232797497184e-05, - "loss": 2.4739, - "step": 182440 - }, - { - "epoch": 0.32, - "learning_rate": 3.409145603504501e-05, - "loss": 2.529, - "step": 182450 - }, - { - "epoch": 0.32, - "learning_rate": 3.4090584095118186e-05, - "loss": 2.5273, - "step": 182460 - }, - { - "epoch": 0.32, - "learning_rate": 3.408971215519136e-05, - "loss": 2.4741, - "step": 182470 - }, - { - "epoch": 0.32, - "learning_rate": 3.408884021526453e-05, - "loss": 2.484, - "step": 182480 - }, - { - "epoch": 0.32, - "learning_rate": 3.4087968275337704e-05, - "loss": 2.3741, - "step": 182490 - }, - { - "epoch": 0.32, - "learning_rate": 3.408709633541088e-05, - "loss": 2.3735, - "step": 182500 - }, - { - "epoch": 0.32, - "learning_rate": 3.408622439548405e-05, - "loss": 2.4127, - "step": 182510 - }, - { - "epoch": 0.32, - "learning_rate": 3.408535245555722e-05, - "loss": 2.4996, - "step": 182520 - }, - { - "epoch": 0.32, - "learning_rate": 3.40844805156304e-05, - "loss": 2.4271, - "step": 182530 - }, - { - "epoch": 0.32, - "learning_rate": 3.408360857570357e-05, - "loss": 2.4688, - "step": 182540 - }, - { - "epoch": 0.32, - "learning_rate": 3.408273663577674e-05, - "loss": 2.401, - "step": 182550 - }, - { - "epoch": 0.32, - "learning_rate": 3.408186469584992e-05, - "loss": 2.4069, - "step": 182560 - }, - { - "epoch": 0.32, - "learning_rate": 3.4080992755923094e-05, - "loss": 2.3595, - "step": 182570 - }, - { - "epoch": 0.32, - "learning_rate": 3.4080120815996265e-05, - "loss": 2.4614, - "step": 182580 - }, - { - "epoch": 0.32, - "learning_rate": 3.4079248876069435e-05, - "loss": 2.3549, - "step": 182590 - }, - { - "epoch": 0.32, - "learning_rate": 3.4078376936142606e-05, - "loss": 2.4085, - "step": 182600 - }, - { - "epoch": 0.32, - "learning_rate": 3.407750499621578e-05, - "loss": 2.4808, - "step": 182610 - }, - { - "epoch": 0.32, - "learning_rate": 3.407663305628895e-05, - "loss": 2.507, - "step": 182620 - }, - { - "epoch": 0.32, - "learning_rate": 3.4075761116362123e-05, - "loss": 2.4004, - "step": 182630 - }, - { - "epoch": 0.32, - "learning_rate": 3.407488917643531e-05, - "loss": 2.4158, - "step": 182640 - }, - { - "epoch": 0.32, - "learning_rate": 3.407401723650848e-05, - "loss": 2.4993, - "step": 182650 - }, - { - "epoch": 0.32, - "learning_rate": 3.407314529658165e-05, - "loss": 2.4191, - "step": 182660 - }, - { - "epoch": 0.32, - "learning_rate": 3.407227335665482e-05, - "loss": 2.322, - "step": 182670 - }, - { - "epoch": 0.32, - "learning_rate": 3.4071401416727996e-05, - "loss": 2.399, - "step": 182680 - }, - { - "epoch": 0.32, - "learning_rate": 3.4070529476801166e-05, - "loss": 2.4415, - "step": 182690 - }, - { - "epoch": 0.32, - "learning_rate": 3.4069657536874336e-05, - "loss": 2.2884, - "step": 182700 - }, - { - "epoch": 0.32, - "learning_rate": 3.4068785596947514e-05, - "loss": 2.519, - "step": 182710 - }, - { - "epoch": 0.32, - "learning_rate": 3.406791365702069e-05, - "loss": 2.4375, - "step": 182720 - }, - { - "epoch": 0.32, - "learning_rate": 3.406704171709386e-05, - "loss": 2.5529, - "step": 182730 - }, - { - "epoch": 0.32, - "learning_rate": 3.406616977716703e-05, - "loss": 2.3951, - "step": 182740 - }, - { - "epoch": 0.32, - "learning_rate": 3.406529783724021e-05, - "loss": 2.3971, - "step": 182750 - }, - { - "epoch": 0.32, - "learning_rate": 3.406442589731338e-05, - "loss": 2.389, - "step": 182760 - }, - { - "epoch": 0.32, - "learning_rate": 3.406355395738655e-05, - "loss": 2.4827, - "step": 182770 - }, - { - "epoch": 0.32, - "learning_rate": 3.4062682017459727e-05, - "loss": 2.4722, - "step": 182780 - }, - { - "epoch": 0.32, - "learning_rate": 3.4061810077532904e-05, - "loss": 2.3975, - "step": 182790 - }, - { - "epoch": 0.32, - "learning_rate": 3.4060938137606074e-05, - "loss": 2.4654, - "step": 182800 - }, - { - "epoch": 0.32, - "learning_rate": 3.4060066197679245e-05, - "loss": 2.3762, - "step": 182810 - }, - { - "epoch": 0.32, - "learning_rate": 3.405919425775242e-05, - "loss": 2.3382, - "step": 182820 - }, - { - "epoch": 0.32, - "learning_rate": 3.405832231782559e-05, - "loss": 2.3225, - "step": 182830 - }, - { - "epoch": 0.32, - "learning_rate": 3.405745037789876e-05, - "loss": 2.5992, - "step": 182840 - }, - { - "epoch": 0.32, - "learning_rate": 3.405657843797194e-05, - "loss": 2.3843, - "step": 182850 - }, - { - "epoch": 0.32, - "learning_rate": 3.405570649804512e-05, - "loss": 2.42, - "step": 182860 - }, - { - "epoch": 0.32, - "learning_rate": 3.405483455811829e-05, - "loss": 2.4415, - "step": 182870 - }, - { - "epoch": 0.32, - "learning_rate": 3.405396261819146e-05, - "loss": 2.4178, - "step": 182880 - }, - { - "epoch": 0.32, - "learning_rate": 3.4053090678264635e-05, - "loss": 2.508, - "step": 182890 - }, - { - "epoch": 0.32, - "learning_rate": 3.4052218738337805e-05, - "loss": 2.4363, - "step": 182900 - }, - { - "epoch": 0.32, - "learning_rate": 3.4051346798410975e-05, - "loss": 2.3682, - "step": 182910 - }, - { - "epoch": 0.32, - "learning_rate": 3.405047485848415e-05, - "loss": 2.4251, - "step": 182920 - }, - { - "epoch": 0.32, - "learning_rate": 3.404960291855733e-05, - "loss": 2.5009, - "step": 182930 - }, - { - "epoch": 0.32, - "learning_rate": 3.40487309786305e-05, - "loss": 2.3652, - "step": 182940 - }, - { - "epoch": 0.32, - "learning_rate": 3.404785903870367e-05, - "loss": 2.4005, - "step": 182950 - }, - { - "epoch": 0.32, - "learning_rate": 3.404698709877685e-05, - "loss": 2.4745, - "step": 182960 - }, - { - "epoch": 0.32, - "learning_rate": 3.404611515885002e-05, - "loss": 2.3535, - "step": 182970 - }, - { - "epoch": 0.32, - "learning_rate": 3.404524321892319e-05, - "loss": 2.4048, - "step": 182980 - }, - { - "epoch": 0.32, - "learning_rate": 3.404437127899636e-05, - "loss": 2.5371, - "step": 182990 - }, - { - "epoch": 0.32, - "learning_rate": 3.4043499339069536e-05, - "loss": 2.4242, - "step": 183000 - }, - { - "epoch": 0.32, - "learning_rate": 3.404262739914271e-05, - "loss": 2.3661, - "step": 183010 - }, - { - "epoch": 0.32, - "learning_rate": 3.4041755459215884e-05, - "loss": 2.3614, - "step": 183020 - }, - { - "epoch": 0.32, - "learning_rate": 3.404088351928906e-05, - "loss": 2.3447, - "step": 183030 - }, - { - "epoch": 0.32, - "learning_rate": 3.404001157936223e-05, - "loss": 2.3867, - "step": 183040 - }, - { - "epoch": 0.32, - "learning_rate": 3.40391396394354e-05, - "loss": 2.3345, - "step": 183050 - }, - { - "epoch": 0.32, - "learning_rate": 3.403826769950857e-05, - "loss": 2.4934, - "step": 183060 - }, - { - "epoch": 0.32, - "learning_rate": 3.403739575958175e-05, - "loss": 2.526, - "step": 183070 - }, - { - "epoch": 0.32, - "learning_rate": 3.4036523819654926e-05, - "loss": 2.4967, - "step": 183080 - }, - { - "epoch": 0.32, - "learning_rate": 3.4035651879728097e-05, - "loss": 2.5146, - "step": 183090 - }, - { - "epoch": 0.32, - "learning_rate": 3.403477993980127e-05, - "loss": 2.3262, - "step": 183100 - }, - { - "epoch": 0.32, - "learning_rate": 3.4033907999874444e-05, - "loss": 2.348, - "step": 183110 - }, - { - "epoch": 0.32, - "learning_rate": 3.4033036059947614e-05, - "loss": 2.3284, - "step": 183120 - }, - { - "epoch": 0.32, - "learning_rate": 3.4032164120020785e-05, - "loss": 2.5334, - "step": 183130 - }, - { - "epoch": 0.32, - "learning_rate": 3.403129218009396e-05, - "loss": 2.4353, - "step": 183140 - }, - { - "epoch": 0.32, - "learning_rate": 3.403042024016713e-05, - "loss": 2.3758, - "step": 183150 - }, - { - "epoch": 0.32, - "learning_rate": 3.402954830024031e-05, - "loss": 2.4222, - "step": 183160 - }, - { - "epoch": 0.32, - "learning_rate": 3.402867636031348e-05, - "loss": 2.4197, - "step": 183170 - }, - { - "epoch": 0.32, - "learning_rate": 3.402780442038666e-05, - "loss": 2.3955, - "step": 183180 - }, - { - "epoch": 0.32, - "learning_rate": 3.402693248045983e-05, - "loss": 2.4446, - "step": 183190 - }, - { - "epoch": 0.32, - "learning_rate": 3.4026060540533e-05, - "loss": 2.4697, - "step": 183200 - }, - { - "epoch": 0.32, - "learning_rate": 3.4025188600606175e-05, - "loss": 2.4134, - "step": 183210 - }, - { - "epoch": 0.32, - "learning_rate": 3.4024316660679345e-05, - "loss": 2.4341, - "step": 183220 - }, - { - "epoch": 0.32, - "learning_rate": 3.402344472075252e-05, - "loss": 2.3573, - "step": 183230 - }, - { - "epoch": 0.32, - "learning_rate": 3.402257278082569e-05, - "loss": 2.4588, - "step": 183240 - }, - { - "epoch": 0.32, - "learning_rate": 3.402170084089887e-05, - "loss": 2.5339, - "step": 183250 - }, - { - "epoch": 0.32, - "learning_rate": 3.402082890097204e-05, - "loss": 2.4213, - "step": 183260 - }, - { - "epoch": 0.32, - "learning_rate": 3.401995696104521e-05, - "loss": 2.5089, - "step": 183270 - }, - { - "epoch": 0.32, - "learning_rate": 3.401908502111839e-05, - "loss": 2.3452, - "step": 183280 - }, - { - "epoch": 0.32, - "learning_rate": 3.401821308119156e-05, - "loss": 2.465, - "step": 183290 - }, - { - "epoch": 0.32, - "learning_rate": 3.4017341141264736e-05, - "loss": 2.4622, - "step": 183300 - }, - { - "epoch": 0.32, - "learning_rate": 3.4016469201337906e-05, - "loss": 2.4518, - "step": 183310 - }, - { - "epoch": 0.32, - "learning_rate": 3.401559726141108e-05, - "loss": 2.3686, - "step": 183320 - }, - { - "epoch": 0.32, - "learning_rate": 3.4014725321484253e-05, - "loss": 2.4838, - "step": 183330 - }, - { - "epoch": 0.32, - "learning_rate": 3.4013853381557424e-05, - "loss": 2.2734, - "step": 183340 - }, - { - "epoch": 0.32, - "learning_rate": 3.40129814416306e-05, - "loss": 2.405, - "step": 183350 - }, - { - "epoch": 0.32, - "learning_rate": 3.401210950170377e-05, - "loss": 2.4095, - "step": 183360 - }, - { - "epoch": 0.32, - "learning_rate": 3.401123756177694e-05, - "loss": 2.4979, - "step": 183370 - }, - { - "epoch": 0.32, - "learning_rate": 3.401036562185012e-05, - "loss": 2.525, - "step": 183380 - }, - { - "epoch": 0.32, - "learning_rate": 3.4009493681923296e-05, - "loss": 2.3983, - "step": 183390 - }, - { - "epoch": 0.32, - "learning_rate": 3.4008621741996466e-05, - "loss": 2.3764, - "step": 183400 - }, - { - "epoch": 0.32, - "learning_rate": 3.400774980206964e-05, - "loss": 2.4705, - "step": 183410 - }, - { - "epoch": 0.32, - "learning_rate": 3.4006877862142814e-05, - "loss": 2.4844, - "step": 183420 - }, - { - "epoch": 0.32, - "learning_rate": 3.4006005922215984e-05, - "loss": 2.4824, - "step": 183430 - }, - { - "epoch": 0.32, - "learning_rate": 3.4005133982289155e-05, - "loss": 2.3806, - "step": 183440 - }, - { - "epoch": 0.32, - "learning_rate": 3.400426204236233e-05, - "loss": 2.485, - "step": 183450 - }, - { - "epoch": 0.32, - "learning_rate": 3.400339010243551e-05, - "loss": 2.4623, - "step": 183460 - }, - { - "epoch": 0.32, - "learning_rate": 3.400251816250868e-05, - "loss": 2.4229, - "step": 183470 - }, - { - "epoch": 0.32, - "learning_rate": 3.400164622258185e-05, - "loss": 2.5375, - "step": 183480 - }, - { - "epoch": 0.32, - "learning_rate": 3.400077428265502e-05, - "loss": 2.2974, - "step": 183490 - }, - { - "epoch": 0.32, - "learning_rate": 3.39999023427282e-05, - "loss": 2.5437, - "step": 183500 - }, - { - "epoch": 0.32, - "learning_rate": 3.399903040280137e-05, - "loss": 2.3359, - "step": 183510 - }, - { - "epoch": 0.32, - "learning_rate": 3.399815846287454e-05, - "loss": 2.489, - "step": 183520 - }, - { - "epoch": 0.32, - "learning_rate": 3.399728652294772e-05, - "loss": 2.285, - "step": 183530 - }, - { - "epoch": 0.32, - "learning_rate": 3.399641458302089e-05, - "loss": 2.4511, - "step": 183540 - }, - { - "epoch": 0.32, - "learning_rate": 3.399554264309406e-05, - "loss": 2.4074, - "step": 183550 - }, - { - "epoch": 0.32, - "learning_rate": 3.399467070316723e-05, - "loss": 2.3316, - "step": 183560 - }, - { - "epoch": 0.32, - "learning_rate": 3.399379876324041e-05, - "loss": 2.4362, - "step": 183570 - }, - { - "epoch": 0.32, - "learning_rate": 3.399292682331358e-05, - "loss": 2.4166, - "step": 183580 - }, - { - "epoch": 0.32, - "learning_rate": 3.399205488338675e-05, - "loss": 2.5126, - "step": 183590 - }, - { - "epoch": 0.32, - "learning_rate": 3.399118294345993e-05, - "loss": 2.5088, - "step": 183600 - }, - { - "epoch": 0.32, - "learning_rate": 3.3990311003533105e-05, - "loss": 2.4248, - "step": 183610 - }, - { - "epoch": 0.32, - "learning_rate": 3.3989439063606276e-05, - "loss": 2.3561, - "step": 183620 - }, - { - "epoch": 0.32, - "learning_rate": 3.3988567123679446e-05, - "loss": 2.475, - "step": 183630 - }, - { - "epoch": 0.32, - "learning_rate": 3.398769518375262e-05, - "loss": 2.494, - "step": 183640 - }, - { - "epoch": 0.32, - "learning_rate": 3.3986823243825794e-05, - "loss": 2.46, - "step": 183650 - }, - { - "epoch": 0.32, - "learning_rate": 3.3985951303898964e-05, - "loss": 2.4539, - "step": 183660 - }, - { - "epoch": 0.32, - "learning_rate": 3.398507936397214e-05, - "loss": 2.4798, - "step": 183670 - }, - { - "epoch": 0.32, - "learning_rate": 3.398420742404532e-05, - "loss": 2.368, - "step": 183680 - }, - { - "epoch": 0.32, - "learning_rate": 3.398333548411849e-05, - "loss": 2.291, - "step": 183690 - }, - { - "epoch": 0.32, - "learning_rate": 3.398246354419166e-05, - "loss": 2.5213, - "step": 183700 - }, - { - "epoch": 0.32, - "learning_rate": 3.3981591604264836e-05, - "loss": 2.4236, - "step": 183710 - }, - { - "epoch": 0.32, - "learning_rate": 3.398071966433801e-05, - "loss": 2.488, - "step": 183720 - }, - { - "epoch": 0.32, - "learning_rate": 3.397984772441118e-05, - "loss": 2.4463, - "step": 183730 - }, - { - "epoch": 0.32, - "learning_rate": 3.3978975784484354e-05, - "loss": 2.4366, - "step": 183740 - }, - { - "epoch": 0.32, - "learning_rate": 3.397810384455753e-05, - "loss": 2.3856, - "step": 183750 - }, - { - "epoch": 0.32, - "learning_rate": 3.39772319046307e-05, - "loss": 2.5343, - "step": 183760 - }, - { - "epoch": 0.32, - "learning_rate": 3.397635996470387e-05, - "loss": 2.4048, - "step": 183770 - }, - { - "epoch": 0.32, - "learning_rate": 3.397548802477705e-05, - "loss": 2.5708, - "step": 183780 - }, - { - "epoch": 0.32, - "learning_rate": 3.397461608485022e-05, - "loss": 2.5129, - "step": 183790 - }, - { - "epoch": 0.32, - "learning_rate": 3.397374414492339e-05, - "loss": 2.4056, - "step": 183800 - }, - { - "epoch": 0.32, - "learning_rate": 3.397287220499657e-05, - "loss": 2.4454, - "step": 183810 - }, - { - "epoch": 0.32, - "learning_rate": 3.397200026506974e-05, - "loss": 2.4262, - "step": 183820 - }, - { - "epoch": 0.32, - "learning_rate": 3.3971128325142915e-05, - "loss": 2.4484, - "step": 183830 - }, - { - "epoch": 0.32, - "learning_rate": 3.3970256385216085e-05, - "loss": 2.5566, - "step": 183840 - }, - { - "epoch": 0.32, - "learning_rate": 3.396938444528926e-05, - "loss": 2.4267, - "step": 183850 - }, - { - "epoch": 0.32, - "learning_rate": 3.396851250536243e-05, - "loss": 2.3885, - "step": 183860 - }, - { - "epoch": 0.32, - "learning_rate": 3.39676405654356e-05, - "loss": 2.4194, - "step": 183870 - }, - { - "epoch": 0.32, - "learning_rate": 3.396676862550878e-05, - "loss": 2.3334, - "step": 183880 - }, - { - "epoch": 0.32, - "learning_rate": 3.396589668558195e-05, - "loss": 2.3684, - "step": 183890 - }, - { - "epoch": 0.32, - "learning_rate": 3.396502474565513e-05, - "loss": 2.4161, - "step": 183900 - }, - { - "epoch": 0.32, - "learning_rate": 3.39641528057283e-05, - "loss": 2.4981, - "step": 183910 - }, - { - "epoch": 0.32, - "learning_rate": 3.3963280865801475e-05, - "loss": 2.5065, - "step": 183920 - }, - { - "epoch": 0.32, - "learning_rate": 3.3962408925874646e-05, - "loss": 2.4388, - "step": 183930 - }, - { - "epoch": 0.32, - "learning_rate": 3.3961536985947816e-05, - "loss": 2.4363, - "step": 183940 - }, - { - "epoch": 0.32, - "learning_rate": 3.3960665046020987e-05, - "loss": 2.3862, - "step": 183950 - }, - { - "epoch": 0.32, - "learning_rate": 3.3959793106094164e-05, - "loss": 2.3493, - "step": 183960 - }, - { - "epoch": 0.32, - "learning_rate": 3.395892116616734e-05, - "loss": 2.4066, - "step": 183970 - }, - { - "epoch": 0.32, - "learning_rate": 3.395804922624051e-05, - "loss": 2.4777, - "step": 183980 - }, - { - "epoch": 0.32, - "learning_rate": 3.395717728631369e-05, - "loss": 2.503, - "step": 183990 - }, - { - "epoch": 0.32, - "learning_rate": 3.395630534638686e-05, - "loss": 2.2871, - "step": 184000 - }, - { - "epoch": 0.32, - "learning_rate": 3.395543340646003e-05, - "loss": 2.4798, - "step": 184010 - }, - { - "epoch": 0.32, - "learning_rate": 3.39545614665332e-05, - "loss": 2.4758, - "step": 184020 - }, - { - "epoch": 0.32, - "learning_rate": 3.395368952660638e-05, - "loss": 2.3666, - "step": 184030 - }, - { - "epoch": 0.32, - "learning_rate": 3.395281758667955e-05, - "loss": 2.4513, - "step": 184040 - }, - { - "epoch": 0.32, - "learning_rate": 3.3951945646752724e-05, - "loss": 2.3143, - "step": 184050 - }, - { - "epoch": 0.32, - "learning_rate": 3.3951073706825895e-05, - "loss": 2.4392, - "step": 184060 - }, - { - "epoch": 0.32, - "learning_rate": 3.395020176689907e-05, - "loss": 2.4229, - "step": 184070 - }, - { - "epoch": 0.32, - "learning_rate": 3.394932982697224e-05, - "loss": 2.4357, - "step": 184080 - }, - { - "epoch": 0.32, - "learning_rate": 3.394845788704541e-05, - "loss": 2.4561, - "step": 184090 - }, - { - "epoch": 0.32, - "learning_rate": 3.394758594711859e-05, - "loss": 2.4301, - "step": 184100 - }, - { - "epoch": 0.32, - "learning_rate": 3.394671400719176e-05, - "loss": 2.5076, - "step": 184110 - }, - { - "epoch": 0.32, - "learning_rate": 3.394584206726494e-05, - "loss": 2.4351, - "step": 184120 - }, - { - "epoch": 0.32, - "learning_rate": 3.394497012733811e-05, - "loss": 2.4456, - "step": 184130 - }, - { - "epoch": 0.32, - "learning_rate": 3.3944098187411285e-05, - "loss": 2.5202, - "step": 184140 - }, - { - "epoch": 0.32, - "learning_rate": 3.3943226247484455e-05, - "loss": 2.5656, - "step": 184150 - }, - { - "epoch": 0.32, - "learning_rate": 3.3942354307557626e-05, - "loss": 2.4449, - "step": 184160 - }, - { - "epoch": 0.32, - "learning_rate": 3.39414823676308e-05, - "loss": 2.4795, - "step": 184170 - }, - { - "epoch": 0.32, - "learning_rate": 3.394061042770397e-05, - "loss": 2.4575, - "step": 184180 - }, - { - "epoch": 0.32, - "learning_rate": 3.3939738487777143e-05, - "loss": 2.5442, - "step": 184190 - }, - { - "epoch": 0.32, - "learning_rate": 3.393886654785032e-05, - "loss": 2.3655, - "step": 184200 - }, - { - "epoch": 0.32, - "learning_rate": 3.39379946079235e-05, - "loss": 2.4254, - "step": 184210 - }, - { - "epoch": 0.32, - "learning_rate": 3.393712266799667e-05, - "loss": 2.4849, - "step": 184220 - }, - { - "epoch": 0.32, - "learning_rate": 3.393625072806984e-05, - "loss": 2.4098, - "step": 184230 - }, - { - "epoch": 0.32, - "learning_rate": 3.3935378788143016e-05, - "loss": 2.353, - "step": 184240 - }, - { - "epoch": 0.32, - "learning_rate": 3.3934506848216186e-05, - "loss": 2.3732, - "step": 184250 - }, - { - "epoch": 0.32, - "learning_rate": 3.3933634908289356e-05, - "loss": 2.4198, - "step": 184260 - }, - { - "epoch": 0.32, - "learning_rate": 3.3932762968362534e-05, - "loss": 2.3151, - "step": 184270 - }, - { - "epoch": 0.32, - "learning_rate": 3.393189102843571e-05, - "loss": 2.405, - "step": 184280 - }, - { - "epoch": 0.32, - "learning_rate": 3.393101908850888e-05, - "loss": 2.4132, - "step": 184290 - }, - { - "epoch": 0.32, - "learning_rate": 3.393014714858205e-05, - "loss": 2.3474, - "step": 184300 - }, - { - "epoch": 0.32, - "learning_rate": 3.392927520865523e-05, - "loss": 2.5441, - "step": 184310 - }, - { - "epoch": 0.32, - "learning_rate": 3.39284032687284e-05, - "loss": 2.3145, - "step": 184320 - }, - { - "epoch": 0.32, - "learning_rate": 3.392753132880157e-05, - "loss": 2.4745, - "step": 184330 - }, - { - "epoch": 0.32, - "learning_rate": 3.392665938887474e-05, - "loss": 2.3436, - "step": 184340 - }, - { - "epoch": 0.32, - "learning_rate": 3.3925787448947924e-05, - "loss": 2.4452, - "step": 184350 - }, - { - "epoch": 0.32, - "learning_rate": 3.3924915509021094e-05, - "loss": 2.6217, - "step": 184360 - }, - { - "epoch": 0.32, - "learning_rate": 3.3924043569094265e-05, - "loss": 2.3715, - "step": 184370 - }, - { - "epoch": 0.32, - "learning_rate": 3.392317162916744e-05, - "loss": 2.4146, - "step": 184380 - }, - { - "epoch": 0.32, - "learning_rate": 3.392229968924061e-05, - "loss": 2.3575, - "step": 184390 - }, - { - "epoch": 0.32, - "learning_rate": 3.392142774931378e-05, - "loss": 2.4469, - "step": 184400 - }, - { - "epoch": 0.32, - "learning_rate": 3.392055580938695e-05, - "loss": 2.4877, - "step": 184410 - }, - { - "epoch": 0.32, - "learning_rate": 3.391968386946014e-05, - "loss": 2.3601, - "step": 184420 - }, - { - "epoch": 0.32, - "learning_rate": 3.391881192953331e-05, - "loss": 2.3658, - "step": 184430 - }, - { - "epoch": 0.32, - "learning_rate": 3.391793998960648e-05, - "loss": 2.4057, - "step": 184440 - }, - { - "epoch": 0.32, - "learning_rate": 3.391706804967965e-05, - "loss": 2.3706, - "step": 184450 - }, - { - "epoch": 0.32, - "learning_rate": 3.3916196109752825e-05, - "loss": 2.4588, - "step": 184460 - }, - { - "epoch": 0.32, - "learning_rate": 3.3915324169825995e-05, - "loss": 2.5113, - "step": 184470 - }, - { - "epoch": 0.32, - "learning_rate": 3.3914452229899166e-05, - "loss": 2.5097, - "step": 184480 - }, - { - "epoch": 0.32, - "learning_rate": 3.391358028997234e-05, - "loss": 2.458, - "step": 184490 - }, - { - "epoch": 0.32, - "learning_rate": 3.391270835004552e-05, - "loss": 2.4859, - "step": 184500 - }, - { - "epoch": 0.32, - "learning_rate": 3.391183641011869e-05, - "loss": 2.4128, - "step": 184510 - }, - { - "epoch": 0.32, - "learning_rate": 3.391096447019186e-05, - "loss": 2.5628, - "step": 184520 - }, - { - "epoch": 0.32, - "learning_rate": 3.391009253026504e-05, - "loss": 2.4401, - "step": 184530 - }, - { - "epoch": 0.32, - "learning_rate": 3.390922059033821e-05, - "loss": 2.435, - "step": 184540 - }, - { - "epoch": 0.32, - "learning_rate": 3.390834865041138e-05, - "loss": 2.4897, - "step": 184550 - }, - { - "epoch": 0.32, - "learning_rate": 3.3907476710484556e-05, - "loss": 2.388, - "step": 184560 - }, - { - "epoch": 0.32, - "learning_rate": 3.390660477055773e-05, - "loss": 2.4067, - "step": 184570 - }, - { - "epoch": 0.32, - "learning_rate": 3.3905732830630904e-05, - "loss": 2.4715, - "step": 184580 - }, - { - "epoch": 0.32, - "learning_rate": 3.3904860890704074e-05, - "loss": 2.3972, - "step": 184590 - }, - { - "epoch": 0.32, - "learning_rate": 3.390398895077725e-05, - "loss": 2.4441, - "step": 184600 - }, - { - "epoch": 0.32, - "learning_rate": 3.390311701085042e-05, - "loss": 2.425, - "step": 184610 - }, - { - "epoch": 0.32, - "learning_rate": 3.390224507092359e-05, - "loss": 2.5168, - "step": 184620 - }, - { - "epoch": 0.32, - "learning_rate": 3.390137313099677e-05, - "loss": 2.4173, - "step": 184630 - }, - { - "epoch": 0.32, - "learning_rate": 3.3900501191069946e-05, - "loss": 2.6083, - "step": 184640 - }, - { - "epoch": 0.32, - "learning_rate": 3.3899629251143117e-05, - "loss": 2.5281, - "step": 184650 - }, - { - "epoch": 0.32, - "learning_rate": 3.389875731121629e-05, - "loss": 2.3556, - "step": 184660 - }, - { - "epoch": 0.32, - "learning_rate": 3.3897885371289464e-05, - "loss": 2.5294, - "step": 184670 - }, - { - "epoch": 0.32, - "learning_rate": 3.3897013431362634e-05, - "loss": 2.3611, - "step": 184680 - }, - { - "epoch": 0.32, - "learning_rate": 3.3896141491435805e-05, - "loss": 2.469, - "step": 184690 - }, - { - "epoch": 0.32, - "learning_rate": 3.389526955150898e-05, - "loss": 2.3267, - "step": 184700 - }, - { - "epoch": 0.32, - "learning_rate": 3.389439761158215e-05, - "loss": 2.4025, - "step": 184710 - }, - { - "epoch": 0.32, - "learning_rate": 3.389352567165533e-05, - "loss": 2.3811, - "step": 184720 - }, - { - "epoch": 0.32, - "learning_rate": 3.38926537317285e-05, - "loss": 2.4953, - "step": 184730 - }, - { - "epoch": 0.32, - "learning_rate": 3.389178179180168e-05, - "loss": 2.3731, - "step": 184740 - }, - { - "epoch": 0.32, - "learning_rate": 3.389090985187485e-05, - "loss": 2.3287, - "step": 184750 - }, - { - "epoch": 0.32, - "learning_rate": 3.389003791194802e-05, - "loss": 2.4795, - "step": 184760 - }, - { - "epoch": 0.32, - "learning_rate": 3.3889165972021195e-05, - "loss": 2.4997, - "step": 184770 - }, - { - "epoch": 0.32, - "learning_rate": 3.3888294032094365e-05, - "loss": 2.4453, - "step": 184780 - }, - { - "epoch": 0.32, - "learning_rate": 3.388742209216754e-05, - "loss": 2.4558, - "step": 184790 - }, - { - "epoch": 0.32, - "learning_rate": 3.388655015224071e-05, - "loss": 2.4239, - "step": 184800 - }, - { - "epoch": 0.32, - "learning_rate": 3.388567821231389e-05, - "loss": 2.3631, - "step": 184810 - }, - { - "epoch": 0.32, - "learning_rate": 3.388480627238706e-05, - "loss": 2.4131, - "step": 184820 - }, - { - "epoch": 0.32, - "learning_rate": 3.388393433246023e-05, - "loss": 2.3918, - "step": 184830 - }, - { - "epoch": 0.32, - "learning_rate": 3.38830623925334e-05, - "loss": 2.427, - "step": 184840 - }, - { - "epoch": 0.32, - "learning_rate": 3.388219045260658e-05, - "loss": 2.4944, - "step": 184850 - }, - { - "epoch": 0.32, - "learning_rate": 3.388131851267975e-05, - "loss": 2.4298, - "step": 184860 - }, - { - "epoch": 0.32, - "learning_rate": 3.3880446572752926e-05, - "loss": 2.4965, - "step": 184870 - }, - { - "epoch": 0.32, - "learning_rate": 3.38795746328261e-05, - "loss": 2.4051, - "step": 184880 - }, - { - "epoch": 0.32, - "learning_rate": 3.3878702692899273e-05, - "loss": 2.3611, - "step": 184890 - }, - { - "epoch": 0.32, - "learning_rate": 3.3877830752972444e-05, - "loss": 2.4047, - "step": 184900 - }, - { - "epoch": 0.32, - "learning_rate": 3.3876958813045614e-05, - "loss": 2.3576, - "step": 184910 - }, - { - "epoch": 0.32, - "learning_rate": 3.387608687311879e-05, - "loss": 2.3989, - "step": 184920 - }, - { - "epoch": 0.32, - "learning_rate": 3.387521493319196e-05, - "loss": 2.309, - "step": 184930 - }, - { - "epoch": 0.32, - "learning_rate": 3.387434299326514e-05, - "loss": 2.343, - "step": 184940 - }, - { - "epoch": 0.32, - "learning_rate": 3.387347105333831e-05, - "loss": 2.387, - "step": 184950 - }, - { - "epoch": 0.32, - "learning_rate": 3.3872599113411486e-05, - "loss": 2.4012, - "step": 184960 - }, - { - "epoch": 0.32, - "learning_rate": 3.387172717348466e-05, - "loss": 2.467, - "step": 184970 - }, - { - "epoch": 0.32, - "learning_rate": 3.387085523355783e-05, - "loss": 2.4205, - "step": 184980 - }, - { - "epoch": 0.32, - "learning_rate": 3.3869983293631004e-05, - "loss": 2.4574, - "step": 184990 - }, - { - "epoch": 0.32, - "learning_rate": 3.3869111353704175e-05, - "loss": 2.4167, - "step": 185000 - }, - { - "epoch": 0.32, - "learning_rate": 3.3868239413777345e-05, - "loss": 2.4929, - "step": 185010 - }, - { - "epoch": 0.32, - "learning_rate": 3.386736747385052e-05, - "loss": 2.4262, - "step": 185020 - }, - { - "epoch": 0.32, - "learning_rate": 3.38664955339237e-05, - "loss": 2.3831, - "step": 185030 - }, - { - "epoch": 0.32, - "learning_rate": 3.386562359399687e-05, - "loss": 2.3498, - "step": 185040 - }, - { - "epoch": 0.32, - "learning_rate": 3.386475165407004e-05, - "loss": 2.3643, - "step": 185050 - }, - { - "epoch": 0.32, - "learning_rate": 3.386387971414322e-05, - "loss": 2.2579, - "step": 185060 - }, - { - "epoch": 0.32, - "learning_rate": 3.386300777421639e-05, - "loss": 2.4827, - "step": 185070 - }, - { - "epoch": 0.32, - "learning_rate": 3.386213583428956e-05, - "loss": 2.4079, - "step": 185080 - }, - { - "epoch": 0.32, - "learning_rate": 3.3861263894362735e-05, - "loss": 2.4876, - "step": 185090 - }, - { - "epoch": 0.32, - "learning_rate": 3.386039195443591e-05, - "loss": 2.5349, - "step": 185100 - }, - { - "epoch": 0.32, - "learning_rate": 3.385952001450908e-05, - "loss": 2.4277, - "step": 185110 - }, - { - "epoch": 0.32, - "learning_rate": 3.385864807458225e-05, - "loss": 2.433, - "step": 185120 - }, - { - "epoch": 0.32, - "learning_rate": 3.385777613465543e-05, - "loss": 2.5276, - "step": 185130 - }, - { - "epoch": 0.32, - "learning_rate": 3.38569041947286e-05, - "loss": 2.5316, - "step": 185140 - }, - { - "epoch": 0.32, - "learning_rate": 3.385603225480177e-05, - "loss": 2.522, - "step": 185150 - }, - { - "epoch": 0.32, - "learning_rate": 3.385516031487495e-05, - "loss": 2.5053, - "step": 185160 - }, - { - "epoch": 0.32, - "learning_rate": 3.3854288374948125e-05, - "loss": 2.2844, - "step": 185170 - }, - { - "epoch": 0.32, - "learning_rate": 3.3853416435021296e-05, - "loss": 2.4017, - "step": 185180 - }, - { - "epoch": 0.32, - "learning_rate": 3.3852544495094466e-05, - "loss": 2.4466, - "step": 185190 - }, - { - "epoch": 0.32, - "learning_rate": 3.385167255516764e-05, - "loss": 2.433, - "step": 185200 - }, - { - "epoch": 0.32, - "learning_rate": 3.3850800615240814e-05, - "loss": 2.5239, - "step": 185210 - }, - { - "epoch": 0.32, - "learning_rate": 3.3849928675313984e-05, - "loss": 2.4652, - "step": 185220 - }, - { - "epoch": 0.32, - "learning_rate": 3.384905673538716e-05, - "loss": 2.4177, - "step": 185230 - }, - { - "epoch": 0.32, - "learning_rate": 3.384818479546034e-05, - "loss": 2.4688, - "step": 185240 - }, - { - "epoch": 0.32, - "learning_rate": 3.384731285553351e-05, - "loss": 2.3758, - "step": 185250 - }, - { - "epoch": 0.32, - "learning_rate": 3.384644091560668e-05, - "loss": 2.4823, - "step": 185260 - }, - { - "epoch": 0.32, - "learning_rate": 3.3845568975679856e-05, - "loss": 2.5183, - "step": 185270 - }, - { - "epoch": 0.32, - "learning_rate": 3.384469703575303e-05, - "loss": 2.4251, - "step": 185280 - }, - { - "epoch": 0.32, - "learning_rate": 3.38438250958262e-05, - "loss": 2.4279, - "step": 185290 - }, - { - "epoch": 0.32, - "learning_rate": 3.384295315589937e-05, - "loss": 2.4908, - "step": 185300 - }, - { - "epoch": 0.32, - "learning_rate": 3.384208121597255e-05, - "loss": 2.3444, - "step": 185310 - }, - { - "epoch": 0.32, - "learning_rate": 3.384120927604572e-05, - "loss": 2.3846, - "step": 185320 - }, - { - "epoch": 0.32, - "learning_rate": 3.384033733611889e-05, - "loss": 2.4735, - "step": 185330 - }, - { - "epoch": 0.32, - "learning_rate": 3.383946539619207e-05, - "loss": 2.4167, - "step": 185340 - }, - { - "epoch": 0.32, - "learning_rate": 3.383859345626524e-05, - "loss": 2.5344, - "step": 185350 - }, - { - "epoch": 0.32, - "learning_rate": 3.383772151633841e-05, - "loss": 2.3708, - "step": 185360 - }, - { - "epoch": 0.32, - "learning_rate": 3.383684957641158e-05, - "loss": 2.4144, - "step": 185370 - }, - { - "epoch": 0.32, - "learning_rate": 3.383597763648476e-05, - "loss": 2.3832, - "step": 185380 - }, - { - "epoch": 0.32, - "learning_rate": 3.3835105696557935e-05, - "loss": 2.4784, - "step": 185390 - }, - { - "epoch": 0.32, - "learning_rate": 3.3834233756631105e-05, - "loss": 2.2918, - "step": 185400 - }, - { - "epoch": 0.32, - "learning_rate": 3.3833361816704276e-05, - "loss": 2.5397, - "step": 185410 - }, - { - "epoch": 0.32, - "learning_rate": 3.383248987677745e-05, - "loss": 2.3688, - "step": 185420 - }, - { - "epoch": 0.32, - "learning_rate": 3.383161793685062e-05, - "loss": 2.3587, - "step": 185430 - }, - { - "epoch": 0.32, - "learning_rate": 3.3830745996923794e-05, - "loss": 2.4156, - "step": 185440 - }, - { - "epoch": 0.32, - "learning_rate": 3.382987405699697e-05, - "loss": 2.4676, - "step": 185450 - }, - { - "epoch": 0.32, - "learning_rate": 3.382900211707015e-05, - "loss": 2.4115, - "step": 185460 - }, - { - "epoch": 0.32, - "learning_rate": 3.382813017714332e-05, - "loss": 2.4778, - "step": 185470 - }, - { - "epoch": 0.32, - "learning_rate": 3.382725823721649e-05, - "loss": 2.3937, - "step": 185480 - }, - { - "epoch": 0.32, - "learning_rate": 3.3826386297289666e-05, - "loss": 2.6008, - "step": 185490 - }, - { - "epoch": 0.32, - "learning_rate": 3.3825514357362836e-05, - "loss": 2.3789, - "step": 185500 - }, - { - "epoch": 0.32, - "learning_rate": 3.3824642417436007e-05, - "loss": 2.5184, - "step": 185510 - }, - { - "epoch": 0.32, - "learning_rate": 3.3823770477509184e-05, - "loss": 2.4604, - "step": 185520 - }, - { - "epoch": 0.32, - "learning_rate": 3.3822898537582354e-05, - "loss": 2.4658, - "step": 185530 - }, - { - "epoch": 0.32, - "learning_rate": 3.382202659765553e-05, - "loss": 2.3234, - "step": 185540 - }, - { - "epoch": 0.32, - "learning_rate": 3.38211546577287e-05, - "loss": 2.4373, - "step": 185550 - }, - { - "epoch": 0.32, - "learning_rate": 3.382028271780188e-05, - "loss": 2.4099, - "step": 185560 - }, - { - "epoch": 0.32, - "learning_rate": 3.381941077787505e-05, - "loss": 2.4382, - "step": 185570 - }, - { - "epoch": 0.32, - "learning_rate": 3.381853883794822e-05, - "loss": 2.5034, - "step": 185580 - }, - { - "epoch": 0.32, - "learning_rate": 3.38176668980214e-05, - "loss": 2.3126, - "step": 185590 - }, - { - "epoch": 0.32, - "learning_rate": 3.381679495809457e-05, - "loss": 2.5828, - "step": 185600 - }, - { - "epoch": 0.32, - "learning_rate": 3.3815923018167744e-05, - "loss": 2.3845, - "step": 185610 - }, - { - "epoch": 0.32, - "learning_rate": 3.3815051078240915e-05, - "loss": 2.335, - "step": 185620 - }, - { - "epoch": 0.32, - "learning_rate": 3.381417913831409e-05, - "loss": 2.4537, - "step": 185630 - }, - { - "epoch": 0.32, - "learning_rate": 3.381330719838726e-05, - "loss": 2.4975, - "step": 185640 - }, - { - "epoch": 0.32, - "learning_rate": 3.381243525846043e-05, - "loss": 2.4886, - "step": 185650 - }, - { - "epoch": 0.32, - "learning_rate": 3.381156331853361e-05, - "loss": 2.4998, - "step": 185660 - }, - { - "epoch": 0.32, - "learning_rate": 3.381069137860678e-05, - "loss": 2.4556, - "step": 185670 - }, - { - "epoch": 0.32, - "learning_rate": 3.380981943867995e-05, - "loss": 2.4317, - "step": 185680 - }, - { - "epoch": 0.32, - "learning_rate": 3.380894749875313e-05, - "loss": 2.4039, - "step": 185690 - }, - { - "epoch": 0.32, - "learning_rate": 3.3808075558826305e-05, - "loss": 2.3627, - "step": 185700 - }, - { - "epoch": 0.32, - "learning_rate": 3.3807203618899475e-05, - "loss": 2.5082, - "step": 185710 - }, - { - "epoch": 0.32, - "learning_rate": 3.3806331678972646e-05, - "loss": 2.4431, - "step": 185720 - }, - { - "epoch": 0.32, - "learning_rate": 3.380545973904582e-05, - "loss": 2.3924, - "step": 185730 - }, - { - "epoch": 0.32, - "learning_rate": 3.380458779911899e-05, - "loss": 2.4992, - "step": 185740 - }, - { - "epoch": 0.32, - "learning_rate": 3.3803715859192163e-05, - "loss": 2.3573, - "step": 185750 - }, - { - "epoch": 0.32, - "learning_rate": 3.380284391926534e-05, - "loss": 2.3494, - "step": 185760 - }, - { - "epoch": 0.32, - "learning_rate": 3.380197197933852e-05, - "loss": 2.4166, - "step": 185770 - }, - { - "epoch": 0.32, - "learning_rate": 3.380110003941169e-05, - "loss": 2.395, - "step": 185780 - }, - { - "epoch": 0.32, - "learning_rate": 3.380022809948486e-05, - "loss": 2.4249, - "step": 185790 - }, - { - "epoch": 0.32, - "learning_rate": 3.379935615955803e-05, - "loss": 2.4474, - "step": 185800 - }, - { - "epoch": 0.32, - "learning_rate": 3.3798484219631206e-05, - "loss": 2.3559, - "step": 185810 - }, - { - "epoch": 0.32, - "learning_rate": 3.3797612279704376e-05, - "loss": 2.6205, - "step": 185820 - }, - { - "epoch": 0.32, - "learning_rate": 3.3796740339777554e-05, - "loss": 2.4012, - "step": 185830 - }, - { - "epoch": 0.32, - "learning_rate": 3.379586839985073e-05, - "loss": 2.364, - "step": 185840 - }, - { - "epoch": 0.32, - "learning_rate": 3.37949964599239e-05, - "loss": 2.2339, - "step": 185850 - }, - { - "epoch": 0.32, - "learning_rate": 3.379412451999707e-05, - "loss": 2.5014, - "step": 185860 - }, - { - "epoch": 0.32, - "learning_rate": 3.379325258007024e-05, - "loss": 2.5375, - "step": 185870 - }, - { - "epoch": 0.32, - "learning_rate": 3.379238064014342e-05, - "loss": 2.4665, - "step": 185880 - }, - { - "epoch": 0.32, - "learning_rate": 3.379150870021659e-05, - "loss": 2.3536, - "step": 185890 - }, - { - "epoch": 0.32, - "learning_rate": 3.379063676028976e-05, - "loss": 2.4277, - "step": 185900 - }, - { - "epoch": 0.32, - "learning_rate": 3.378976482036294e-05, - "loss": 2.4033, - "step": 185910 - }, - { - "epoch": 0.32, - "learning_rate": 3.3788892880436114e-05, - "loss": 2.4116, - "step": 185920 - }, - { - "epoch": 0.32, - "learning_rate": 3.3788020940509285e-05, - "loss": 2.4886, - "step": 185930 - }, - { - "epoch": 0.32, - "learning_rate": 3.3787149000582455e-05, - "loss": 2.4315, - "step": 185940 - }, - { - "epoch": 0.32, - "learning_rate": 3.378627706065563e-05, - "loss": 2.3811, - "step": 185950 - }, - { - "epoch": 0.32, - "learning_rate": 3.37854051207288e-05, - "loss": 2.4186, - "step": 185960 - }, - { - "epoch": 0.32, - "learning_rate": 3.378453318080197e-05, - "loss": 2.3642, - "step": 185970 - }, - { - "epoch": 0.32, - "learning_rate": 3.378366124087515e-05, - "loss": 2.4252, - "step": 185980 - }, - { - "epoch": 0.32, - "learning_rate": 3.378278930094833e-05, - "loss": 2.4103, - "step": 185990 - }, - { - "epoch": 0.32, - "learning_rate": 3.37819173610215e-05, - "loss": 2.4297, - "step": 186000 - }, - { - "epoch": 0.32, - "learning_rate": 3.378104542109467e-05, - "loss": 2.3413, - "step": 186010 - }, - { - "epoch": 0.32, - "learning_rate": 3.3780173481167845e-05, - "loss": 2.3871, - "step": 186020 - }, - { - "epoch": 0.32, - "learning_rate": 3.3779301541241015e-05, - "loss": 2.4028, - "step": 186030 - }, - { - "epoch": 0.32, - "learning_rate": 3.3778429601314186e-05, - "loss": 2.4323, - "step": 186040 - }, - { - "epoch": 0.32, - "learning_rate": 3.377755766138736e-05, - "loss": 2.421, - "step": 186050 - }, - { - "epoch": 0.32, - "learning_rate": 3.377668572146054e-05, - "loss": 2.4696, - "step": 186060 - }, - { - "epoch": 0.32, - "learning_rate": 3.377581378153371e-05, - "loss": 2.3663, - "step": 186070 - }, - { - "epoch": 0.32, - "learning_rate": 3.377494184160688e-05, - "loss": 2.3972, - "step": 186080 - }, - { - "epoch": 0.32, - "learning_rate": 3.377406990168006e-05, - "loss": 2.4624, - "step": 186090 - }, - { - "epoch": 0.32, - "learning_rate": 3.377319796175323e-05, - "loss": 2.3885, - "step": 186100 - }, - { - "epoch": 0.32, - "learning_rate": 3.37723260218264e-05, - "loss": 2.4572, - "step": 186110 - }, - { - "epoch": 0.32, - "learning_rate": 3.3771454081899576e-05, - "loss": 2.4589, - "step": 186120 - }, - { - "epoch": 0.32, - "learning_rate": 3.377058214197275e-05, - "loss": 2.6446, - "step": 186130 - }, - { - "epoch": 0.32, - "learning_rate": 3.3769710202045924e-05, - "loss": 2.2499, - "step": 186140 - }, - { - "epoch": 0.32, - "learning_rate": 3.3768838262119094e-05, - "loss": 2.4642, - "step": 186150 - }, - { - "epoch": 0.32, - "learning_rate": 3.376796632219227e-05, - "loss": 2.4271, - "step": 186160 - }, - { - "epoch": 0.32, - "learning_rate": 3.376709438226544e-05, - "loss": 2.3983, - "step": 186170 - }, - { - "epoch": 0.32, - "learning_rate": 3.376622244233861e-05, - "loss": 2.4427, - "step": 186180 - }, - { - "epoch": 0.32, - "learning_rate": 3.376535050241178e-05, - "loss": 2.4767, - "step": 186190 - }, - { - "epoch": 0.32, - "learning_rate": 3.376447856248496e-05, - "loss": 2.4248, - "step": 186200 - }, - { - "epoch": 0.32, - "learning_rate": 3.3763606622558137e-05, - "loss": 2.3521, - "step": 186210 - }, - { - "epoch": 0.32, - "learning_rate": 3.376273468263131e-05, - "loss": 2.3493, - "step": 186220 - }, - { - "epoch": 0.32, - "learning_rate": 3.3761862742704484e-05, - "loss": 2.375, - "step": 186230 - }, - { - "epoch": 0.32, - "learning_rate": 3.3760990802777654e-05, - "loss": 2.4347, - "step": 186240 - }, - { - "epoch": 0.32, - "learning_rate": 3.3760118862850825e-05, - "loss": 2.4967, - "step": 186250 - }, - { - "epoch": 0.32, - "learning_rate": 3.3759246922923995e-05, - "loss": 2.5443, - "step": 186260 - }, - { - "epoch": 0.32, - "learning_rate": 3.375837498299717e-05, - "loss": 2.3057, - "step": 186270 - }, - { - "epoch": 0.32, - "learning_rate": 3.375750304307035e-05, - "loss": 2.5084, - "step": 186280 - }, - { - "epoch": 0.32, - "learning_rate": 3.375663110314352e-05, - "loss": 2.5466, - "step": 186290 - }, - { - "epoch": 0.32, - "learning_rate": 3.375575916321669e-05, - "loss": 2.4103, - "step": 186300 - }, - { - "epoch": 0.32, - "learning_rate": 3.375488722328987e-05, - "loss": 2.3543, - "step": 186310 - }, - { - "epoch": 0.32, - "learning_rate": 3.375401528336304e-05, - "loss": 2.4083, - "step": 186320 - }, - { - "epoch": 0.32, - "learning_rate": 3.375314334343621e-05, - "loss": 2.427, - "step": 186330 - }, - { - "epoch": 0.32, - "learning_rate": 3.3752271403509385e-05, - "loss": 2.4894, - "step": 186340 - }, - { - "epoch": 0.32, - "learning_rate": 3.3751399463582556e-05, - "loss": 2.5105, - "step": 186350 - }, - { - "epoch": 0.32, - "learning_rate": 3.375052752365573e-05, - "loss": 2.4023, - "step": 186360 - }, - { - "epoch": 0.33, - "learning_rate": 3.37496555837289e-05, - "loss": 2.3667, - "step": 186370 - }, - { - "epoch": 0.33, - "learning_rate": 3.374878364380208e-05, - "loss": 2.4208, - "step": 186380 - }, - { - "epoch": 0.33, - "learning_rate": 3.374791170387525e-05, - "loss": 2.5263, - "step": 186390 - }, - { - "epoch": 0.33, - "learning_rate": 3.374703976394842e-05, - "loss": 2.4588, - "step": 186400 - }, - { - "epoch": 0.33, - "learning_rate": 3.37461678240216e-05, - "loss": 2.4637, - "step": 186410 - }, - { - "epoch": 0.33, - "learning_rate": 3.374529588409477e-05, - "loss": 2.3748, - "step": 186420 - }, - { - "epoch": 0.33, - "learning_rate": 3.3744423944167946e-05, - "loss": 2.435, - "step": 186430 - }, - { - "epoch": 0.33, - "learning_rate": 3.3743552004241116e-05, - "loss": 2.4452, - "step": 186440 - }, - { - "epoch": 0.33, - "learning_rate": 3.3742680064314293e-05, - "loss": 2.409, - "step": 186450 - }, - { - "epoch": 0.33, - "learning_rate": 3.3741808124387464e-05, - "loss": 2.3132, - "step": 186460 - }, - { - "epoch": 0.33, - "learning_rate": 3.3740936184460634e-05, - "loss": 2.4378, - "step": 186470 - }, - { - "epoch": 0.33, - "learning_rate": 3.374006424453381e-05, - "loss": 2.367, - "step": 186480 - }, - { - "epoch": 0.33, - "learning_rate": 3.373919230460698e-05, - "loss": 2.4874, - "step": 186490 - }, - { - "epoch": 0.33, - "learning_rate": 3.373832036468016e-05, - "loss": 2.575, - "step": 186500 - }, - { - "epoch": 0.33, - "learning_rate": 3.373744842475333e-05, - "loss": 2.5241, - "step": 186510 - }, - { - "epoch": 0.33, - "learning_rate": 3.3736576484826506e-05, - "loss": 2.3321, - "step": 186520 - }, - { - "epoch": 0.33, - "learning_rate": 3.373570454489968e-05, - "loss": 2.4275, - "step": 186530 - }, - { - "epoch": 0.33, - "learning_rate": 3.373483260497285e-05, - "loss": 2.461, - "step": 186540 - }, - { - "epoch": 0.33, - "learning_rate": 3.3733960665046024e-05, - "loss": 2.4467, - "step": 186550 - }, - { - "epoch": 0.33, - "learning_rate": 3.3733088725119195e-05, - "loss": 2.4204, - "step": 186560 - }, - { - "epoch": 0.33, - "learning_rate": 3.3732216785192365e-05, - "loss": 2.4826, - "step": 186570 - }, - { - "epoch": 0.33, - "learning_rate": 3.373134484526554e-05, - "loss": 2.42, - "step": 186580 - }, - { - "epoch": 0.33, - "learning_rate": 3.373047290533872e-05, - "loss": 2.4091, - "step": 186590 - }, - { - "epoch": 0.33, - "learning_rate": 3.372960096541189e-05, - "loss": 2.5413, - "step": 186600 - }, - { - "epoch": 0.33, - "learning_rate": 3.372872902548506e-05, - "loss": 2.4294, - "step": 186610 - }, - { - "epoch": 0.33, - "learning_rate": 3.372785708555824e-05, - "loss": 2.5432, - "step": 186620 - }, - { - "epoch": 0.33, - "learning_rate": 3.372698514563141e-05, - "loss": 2.4697, - "step": 186630 - }, - { - "epoch": 0.33, - "learning_rate": 3.372611320570458e-05, - "loss": 2.5437, - "step": 186640 - }, - { - "epoch": 0.33, - "learning_rate": 3.3725241265777755e-05, - "loss": 2.4964, - "step": 186650 - }, - { - "epoch": 0.33, - "learning_rate": 3.372436932585093e-05, - "loss": 2.4463, - "step": 186660 - }, - { - "epoch": 0.33, - "learning_rate": 3.37234973859241e-05, - "loss": 2.5834, - "step": 186670 - }, - { - "epoch": 0.33, - "learning_rate": 3.372262544599727e-05, - "loss": 2.4709, - "step": 186680 - }, - { - "epoch": 0.33, - "learning_rate": 3.372175350607045e-05, - "loss": 2.4337, - "step": 186690 - }, - { - "epoch": 0.33, - "learning_rate": 3.372088156614362e-05, - "loss": 2.4135, - "step": 186700 - }, - { - "epoch": 0.33, - "learning_rate": 3.372000962621679e-05, - "loss": 2.3792, - "step": 186710 - }, - { - "epoch": 0.33, - "learning_rate": 3.371913768628996e-05, - "loss": 2.4102, - "step": 186720 - }, - { - "epoch": 0.33, - "learning_rate": 3.3718265746363145e-05, - "loss": 2.3583, - "step": 186730 - }, - { - "epoch": 0.33, - "learning_rate": 3.3717393806436316e-05, - "loss": 2.2898, - "step": 186740 - }, - { - "epoch": 0.33, - "learning_rate": 3.3716521866509486e-05, - "loss": 2.386, - "step": 186750 - }, - { - "epoch": 0.33, - "learning_rate": 3.371564992658266e-05, - "loss": 2.3832, - "step": 186760 - }, - { - "epoch": 0.33, - "learning_rate": 3.3714777986655834e-05, - "loss": 2.4145, - "step": 186770 - }, - { - "epoch": 0.33, - "learning_rate": 3.3713906046729004e-05, - "loss": 2.3867, - "step": 186780 - }, - { - "epoch": 0.33, - "learning_rate": 3.3713034106802175e-05, - "loss": 2.391, - "step": 186790 - }, - { - "epoch": 0.33, - "learning_rate": 3.371216216687536e-05, - "loss": 2.3987, - "step": 186800 - }, - { - "epoch": 0.33, - "learning_rate": 3.371129022694853e-05, - "loss": 2.3901, - "step": 186810 - }, - { - "epoch": 0.33, - "learning_rate": 3.37104182870217e-05, - "loss": 2.3973, - "step": 186820 - }, - { - "epoch": 0.33, - "learning_rate": 3.370954634709487e-05, - "loss": 2.3991, - "step": 186830 - }, - { - "epoch": 0.33, - "learning_rate": 3.370867440716805e-05, - "loss": 2.4347, - "step": 186840 - }, - { - "epoch": 0.33, - "learning_rate": 3.370780246724122e-05, - "loss": 2.3038, - "step": 186850 - }, - { - "epoch": 0.33, - "learning_rate": 3.370693052731439e-05, - "loss": 2.4704, - "step": 186860 - }, - { - "epoch": 0.33, - "learning_rate": 3.3706058587387565e-05, - "loss": 2.4831, - "step": 186870 - }, - { - "epoch": 0.33, - "learning_rate": 3.370518664746074e-05, - "loss": 2.4123, - "step": 186880 - }, - { - "epoch": 0.33, - "learning_rate": 3.370431470753391e-05, - "loss": 2.5022, - "step": 186890 - }, - { - "epoch": 0.33, - "learning_rate": 3.370344276760708e-05, - "loss": 2.438, - "step": 186900 - }, - { - "epoch": 0.33, - "learning_rate": 3.370257082768026e-05, - "loss": 2.3635, - "step": 186910 - }, - { - "epoch": 0.33, - "learning_rate": 3.370169888775343e-05, - "loss": 2.3533, - "step": 186920 - }, - { - "epoch": 0.33, - "learning_rate": 3.37008269478266e-05, - "loss": 2.4397, - "step": 186930 - }, - { - "epoch": 0.33, - "learning_rate": 3.369995500789978e-05, - "loss": 2.3947, - "step": 186940 - }, - { - "epoch": 0.33, - "learning_rate": 3.3699083067972955e-05, - "loss": 2.4716, - "step": 186950 - }, - { - "epoch": 0.33, - "learning_rate": 3.3698211128046125e-05, - "loss": 2.3458, - "step": 186960 - }, - { - "epoch": 0.33, - "learning_rate": 3.3697339188119296e-05, - "loss": 2.4197, - "step": 186970 - }, - { - "epoch": 0.33, - "learning_rate": 3.369646724819247e-05, - "loss": 2.4035, - "step": 186980 - }, - { - "epoch": 0.33, - "learning_rate": 3.369559530826564e-05, - "loss": 2.4253, - "step": 186990 - }, - { - "epoch": 0.33, - "learning_rate": 3.3694723368338814e-05, - "loss": 2.4414, - "step": 187000 - }, - { - "epoch": 0.33, - "learning_rate": 3.369385142841199e-05, - "loss": 2.3991, - "step": 187010 - }, - { - "epoch": 0.33, - "learning_rate": 3.369297948848516e-05, - "loss": 2.5385, - "step": 187020 - }, - { - "epoch": 0.33, - "learning_rate": 3.369210754855834e-05, - "loss": 2.4992, - "step": 187030 - }, - { - "epoch": 0.33, - "learning_rate": 3.369123560863151e-05, - "loss": 2.4274, - "step": 187040 - }, - { - "epoch": 0.33, - "learning_rate": 3.3690363668704686e-05, - "loss": 2.3283, - "step": 187050 - }, - { - "epoch": 0.33, - "learning_rate": 3.3689491728777856e-05, - "loss": 2.4782, - "step": 187060 - }, - { - "epoch": 0.33, - "learning_rate": 3.3688619788851027e-05, - "loss": 2.5264, - "step": 187070 - }, - { - "epoch": 0.33, - "learning_rate": 3.3687747848924204e-05, - "loss": 2.3358, - "step": 187080 - }, - { - "epoch": 0.33, - "learning_rate": 3.3686875908997374e-05, - "loss": 2.4943, - "step": 187090 - }, - { - "epoch": 0.33, - "learning_rate": 3.368600396907055e-05, - "loss": 2.468, - "step": 187100 - }, - { - "epoch": 0.33, - "learning_rate": 3.368513202914372e-05, - "loss": 2.4046, - "step": 187110 - }, - { - "epoch": 0.33, - "learning_rate": 3.36842600892169e-05, - "loss": 2.4882, - "step": 187120 - }, - { - "epoch": 0.33, - "learning_rate": 3.368338814929007e-05, - "loss": 2.3885, - "step": 187130 - }, - { - "epoch": 0.33, - "learning_rate": 3.368251620936324e-05, - "loss": 2.2899, - "step": 187140 - }, - { - "epoch": 0.33, - "learning_rate": 3.368164426943641e-05, - "loss": 2.3922, - "step": 187150 - }, - { - "epoch": 0.33, - "learning_rate": 3.368077232950959e-05, - "loss": 2.4451, - "step": 187160 - }, - { - "epoch": 0.33, - "learning_rate": 3.3679900389582764e-05, - "loss": 2.4985, - "step": 187170 - }, - { - "epoch": 0.33, - "learning_rate": 3.3679028449655935e-05, - "loss": 2.4307, - "step": 187180 - }, - { - "epoch": 0.33, - "learning_rate": 3.367815650972911e-05, - "loss": 2.3884, - "step": 187190 - }, - { - "epoch": 0.33, - "learning_rate": 3.367728456980228e-05, - "loss": 2.4542, - "step": 187200 - }, - { - "epoch": 0.33, - "learning_rate": 3.367641262987545e-05, - "loss": 2.3913, - "step": 187210 - }, - { - "epoch": 0.33, - "learning_rate": 3.367554068994862e-05, - "loss": 2.5733, - "step": 187220 - }, - { - "epoch": 0.33, - "learning_rate": 3.36746687500218e-05, - "loss": 2.4684, - "step": 187230 - }, - { - "epoch": 0.33, - "learning_rate": 3.367379681009497e-05, - "loss": 2.3966, - "step": 187240 - }, - { - "epoch": 0.33, - "learning_rate": 3.367292487016815e-05, - "loss": 2.4411, - "step": 187250 - }, - { - "epoch": 0.33, - "learning_rate": 3.367205293024132e-05, - "loss": 2.4423, - "step": 187260 - }, - { - "epoch": 0.33, - "learning_rate": 3.3671180990314495e-05, - "loss": 2.3319, - "step": 187270 - }, - { - "epoch": 0.33, - "learning_rate": 3.3670309050387666e-05, - "loss": 2.5238, - "step": 187280 - }, - { - "epoch": 0.33, - "learning_rate": 3.3669437110460836e-05, - "loss": 2.3715, - "step": 187290 - }, - { - "epoch": 0.33, - "learning_rate": 3.366856517053401e-05, - "loss": 2.3798, - "step": 187300 - }, - { - "epoch": 0.33, - "learning_rate": 3.3667693230607183e-05, - "loss": 2.422, - "step": 187310 - }, - { - "epoch": 0.33, - "learning_rate": 3.366682129068036e-05, - "loss": 2.4433, - "step": 187320 - }, - { - "epoch": 0.33, - "learning_rate": 3.366594935075353e-05, - "loss": 2.4842, - "step": 187330 - }, - { - "epoch": 0.33, - "learning_rate": 3.366507741082671e-05, - "loss": 2.4917, - "step": 187340 - }, - { - "epoch": 0.33, - "learning_rate": 3.366420547089988e-05, - "loss": 2.4431, - "step": 187350 - }, - { - "epoch": 0.33, - "learning_rate": 3.366333353097305e-05, - "loss": 2.321, - "step": 187360 - }, - { - "epoch": 0.33, - "learning_rate": 3.3662461591046226e-05, - "loss": 2.4105, - "step": 187370 - }, - { - "epoch": 0.33, - "learning_rate": 3.3661589651119396e-05, - "loss": 2.3863, - "step": 187380 - }, - { - "epoch": 0.33, - "learning_rate": 3.366071771119257e-05, - "loss": 2.5224, - "step": 187390 - }, - { - "epoch": 0.33, - "learning_rate": 3.3659845771265744e-05, - "loss": 2.3934, - "step": 187400 - }, - { - "epoch": 0.33, - "learning_rate": 3.365897383133892e-05, - "loss": 2.3863, - "step": 187410 - }, - { - "epoch": 0.33, - "learning_rate": 3.365810189141209e-05, - "loss": 2.4614, - "step": 187420 - }, - { - "epoch": 0.33, - "learning_rate": 3.365722995148526e-05, - "loss": 2.4524, - "step": 187430 - }, - { - "epoch": 0.33, - "learning_rate": 3.365635801155844e-05, - "loss": 2.3551, - "step": 187440 - }, - { - "epoch": 0.33, - "learning_rate": 3.365548607163161e-05, - "loss": 2.4502, - "step": 187450 - }, - { - "epoch": 0.33, - "learning_rate": 3.365461413170478e-05, - "loss": 2.464, - "step": 187460 - }, - { - "epoch": 0.33, - "learning_rate": 3.365374219177796e-05, - "loss": 2.4404, - "step": 187470 - }, - { - "epoch": 0.33, - "learning_rate": 3.3652870251851134e-05, - "loss": 2.5784, - "step": 187480 - }, - { - "epoch": 0.33, - "learning_rate": 3.3651998311924305e-05, - "loss": 2.2893, - "step": 187490 - }, - { - "epoch": 0.33, - "learning_rate": 3.3651126371997475e-05, - "loss": 2.3041, - "step": 187500 - }, - { - "epoch": 0.33, - "learning_rate": 3.365025443207065e-05, - "loss": 2.4584, - "step": 187510 - }, - { - "epoch": 0.33, - "learning_rate": 3.364938249214382e-05, - "loss": 2.4467, - "step": 187520 - }, - { - "epoch": 0.33, - "learning_rate": 3.364851055221699e-05, - "loss": 2.4889, - "step": 187530 - }, - { - "epoch": 0.33, - "learning_rate": 3.364763861229016e-05, - "loss": 2.3827, - "step": 187540 - }, - { - "epoch": 0.33, - "learning_rate": 3.364676667236335e-05, - "loss": 2.3975, - "step": 187550 - }, - { - "epoch": 0.33, - "learning_rate": 3.364589473243652e-05, - "loss": 2.4316, - "step": 187560 - }, - { - "epoch": 0.33, - "learning_rate": 3.364502279250969e-05, - "loss": 2.4471, - "step": 187570 - }, - { - "epoch": 0.33, - "learning_rate": 3.3644150852582865e-05, - "loss": 2.4387, - "step": 187580 - }, - { - "epoch": 0.33, - "learning_rate": 3.3643278912656035e-05, - "loss": 2.4339, - "step": 187590 - }, - { - "epoch": 0.33, - "learning_rate": 3.3642406972729206e-05, - "loss": 2.479, - "step": 187600 - }, - { - "epoch": 0.33, - "learning_rate": 3.3641535032802376e-05, - "loss": 2.5941, - "step": 187610 - }, - { - "epoch": 0.33, - "learning_rate": 3.364066309287556e-05, - "loss": 2.5235, - "step": 187620 - }, - { - "epoch": 0.33, - "learning_rate": 3.363979115294873e-05, - "loss": 2.3967, - "step": 187630 - }, - { - "epoch": 0.33, - "learning_rate": 3.36389192130219e-05, - "loss": 2.4778, - "step": 187640 - }, - { - "epoch": 0.33, - "learning_rate": 3.363804727309507e-05, - "loss": 2.4797, - "step": 187650 - }, - { - "epoch": 0.33, - "learning_rate": 3.363717533316825e-05, - "loss": 2.2695, - "step": 187660 - }, - { - "epoch": 0.33, - "learning_rate": 3.363630339324142e-05, - "loss": 2.3642, - "step": 187670 - }, - { - "epoch": 0.33, - "learning_rate": 3.363543145331459e-05, - "loss": 2.4431, - "step": 187680 - }, - { - "epoch": 0.33, - "learning_rate": 3.363455951338777e-05, - "loss": 2.4717, - "step": 187690 - }, - { - "epoch": 0.33, - "learning_rate": 3.3633687573460944e-05, - "loss": 2.54, - "step": 187700 - }, - { - "epoch": 0.33, - "learning_rate": 3.3632815633534114e-05, - "loss": 2.3796, - "step": 187710 - }, - { - "epoch": 0.33, - "learning_rate": 3.3631943693607284e-05, - "loss": 2.5043, - "step": 187720 - }, - { - "epoch": 0.33, - "learning_rate": 3.363107175368046e-05, - "loss": 2.4027, - "step": 187730 - }, - { - "epoch": 0.33, - "learning_rate": 3.363019981375363e-05, - "loss": 2.4352, - "step": 187740 - }, - { - "epoch": 0.33, - "learning_rate": 3.36293278738268e-05, - "loss": 2.3622, - "step": 187750 - }, - { - "epoch": 0.33, - "learning_rate": 3.362845593389998e-05, - "loss": 2.4902, - "step": 187760 - }, - { - "epoch": 0.33, - "learning_rate": 3.3627583993973157e-05, - "loss": 2.5447, - "step": 187770 - }, - { - "epoch": 0.33, - "learning_rate": 3.362671205404633e-05, - "loss": 2.4536, - "step": 187780 - }, - { - "epoch": 0.33, - "learning_rate": 3.36258401141195e-05, - "loss": 2.4395, - "step": 187790 - }, - { - "epoch": 0.33, - "learning_rate": 3.3624968174192674e-05, - "loss": 2.3794, - "step": 187800 - }, - { - "epoch": 0.33, - "learning_rate": 3.3624096234265845e-05, - "loss": 2.426, - "step": 187810 - }, - { - "epoch": 0.33, - "learning_rate": 3.3623224294339015e-05, - "loss": 2.4444, - "step": 187820 - }, - { - "epoch": 0.33, - "learning_rate": 3.362235235441219e-05, - "loss": 2.4609, - "step": 187830 - }, - { - "epoch": 0.33, - "learning_rate": 3.362148041448537e-05, - "loss": 2.5456, - "step": 187840 - }, - { - "epoch": 0.33, - "learning_rate": 3.362060847455854e-05, - "loss": 2.4735, - "step": 187850 - }, - { - "epoch": 0.33, - "learning_rate": 3.361973653463171e-05, - "loss": 2.4007, - "step": 187860 - }, - { - "epoch": 0.33, - "learning_rate": 3.361886459470489e-05, - "loss": 2.4055, - "step": 187870 - }, - { - "epoch": 0.33, - "learning_rate": 3.361799265477806e-05, - "loss": 2.4245, - "step": 187880 - }, - { - "epoch": 0.33, - "learning_rate": 3.361712071485123e-05, - "loss": 2.4822, - "step": 187890 - }, - { - "epoch": 0.33, - "learning_rate": 3.3616248774924405e-05, - "loss": 2.5009, - "step": 187900 - }, - { - "epoch": 0.33, - "learning_rate": 3.3615376834997576e-05, - "loss": 2.3937, - "step": 187910 - }, - { - "epoch": 0.33, - "learning_rate": 3.361450489507075e-05, - "loss": 2.3937, - "step": 187920 - }, - { - "epoch": 0.33, - "learning_rate": 3.361363295514392e-05, - "loss": 2.3209, - "step": 187930 - }, - { - "epoch": 0.33, - "learning_rate": 3.36127610152171e-05, - "loss": 2.4492, - "step": 187940 - }, - { - "epoch": 0.33, - "learning_rate": 3.361188907529027e-05, - "loss": 2.4285, - "step": 187950 - }, - { - "epoch": 0.33, - "learning_rate": 3.361101713536344e-05, - "loss": 2.4578, - "step": 187960 - }, - { - "epoch": 0.33, - "learning_rate": 3.361014519543662e-05, - "loss": 2.4346, - "step": 187970 - }, - { - "epoch": 0.33, - "learning_rate": 3.360927325550979e-05, - "loss": 2.3956, - "step": 187980 - }, - { - "epoch": 0.33, - "learning_rate": 3.3608401315582966e-05, - "loss": 2.5002, - "step": 187990 - }, - { - "epoch": 0.33, - "learning_rate": 3.3607529375656136e-05, - "loss": 2.3356, - "step": 188000 - }, - { - "epoch": 0.33, - "learning_rate": 3.3606657435729313e-05, - "loss": 2.4225, - "step": 188010 - }, - { - "epoch": 0.33, - "learning_rate": 3.3605785495802484e-05, - "loss": 2.4621, - "step": 188020 - }, - { - "epoch": 0.33, - "learning_rate": 3.3604913555875654e-05, - "loss": 2.3798, - "step": 188030 - }, - { - "epoch": 0.33, - "learning_rate": 3.360404161594883e-05, - "loss": 2.3195, - "step": 188040 - }, - { - "epoch": 0.33, - "learning_rate": 3.3603169676022e-05, - "loss": 2.4567, - "step": 188050 - }, - { - "epoch": 0.33, - "learning_rate": 3.360229773609517e-05, - "loss": 2.5278, - "step": 188060 - }, - { - "epoch": 0.33, - "learning_rate": 3.360142579616835e-05, - "loss": 2.4522, - "step": 188070 - }, - { - "epoch": 0.33, - "learning_rate": 3.3600553856241526e-05, - "loss": 2.361, - "step": 188080 - }, - { - "epoch": 0.33, - "learning_rate": 3.35996819163147e-05, - "loss": 2.4513, - "step": 188090 - }, - { - "epoch": 0.33, - "learning_rate": 3.359880997638787e-05, - "loss": 2.5194, - "step": 188100 - }, - { - "epoch": 0.33, - "learning_rate": 3.359793803646104e-05, - "loss": 2.4706, - "step": 188110 - }, - { - "epoch": 0.33, - "learning_rate": 3.3597066096534215e-05, - "loss": 2.2757, - "step": 188120 - }, - { - "epoch": 0.33, - "learning_rate": 3.3596194156607385e-05, - "loss": 2.4817, - "step": 188130 - }, - { - "epoch": 0.33, - "learning_rate": 3.359532221668056e-05, - "loss": 2.4637, - "step": 188140 - }, - { - "epoch": 0.33, - "learning_rate": 3.359445027675374e-05, - "loss": 2.5056, - "step": 188150 - }, - { - "epoch": 0.33, - "learning_rate": 3.359357833682691e-05, - "loss": 2.4133, - "step": 188160 - }, - { - "epoch": 0.33, - "learning_rate": 3.359270639690008e-05, - "loss": 2.4447, - "step": 188170 - }, - { - "epoch": 0.33, - "learning_rate": 3.359183445697325e-05, - "loss": 2.4338, - "step": 188180 - }, - { - "epoch": 0.33, - "learning_rate": 3.359096251704643e-05, - "loss": 2.3172, - "step": 188190 - }, - { - "epoch": 0.33, - "learning_rate": 3.35900905771196e-05, - "loss": 2.3234, - "step": 188200 - }, - { - "epoch": 0.33, - "learning_rate": 3.358921863719277e-05, - "loss": 2.3524, - "step": 188210 - }, - { - "epoch": 0.33, - "learning_rate": 3.3588346697265946e-05, - "loss": 2.4676, - "step": 188220 - }, - { - "epoch": 0.33, - "learning_rate": 3.358747475733912e-05, - "loss": 2.4722, - "step": 188230 - }, - { - "epoch": 0.33, - "learning_rate": 3.358660281741229e-05, - "loss": 2.422, - "step": 188240 - }, - { - "epoch": 0.33, - "learning_rate": 3.3585730877485464e-05, - "loss": 2.5847, - "step": 188250 - }, - { - "epoch": 0.33, - "learning_rate": 3.358485893755864e-05, - "loss": 2.4144, - "step": 188260 - }, - { - "epoch": 0.33, - "learning_rate": 3.358398699763181e-05, - "loss": 2.428, - "step": 188270 - }, - { - "epoch": 0.33, - "learning_rate": 3.358311505770498e-05, - "loss": 2.4266, - "step": 188280 - }, - { - "epoch": 0.33, - "learning_rate": 3.358224311777816e-05, - "loss": 2.4684, - "step": 188290 - }, - { - "epoch": 0.33, - "learning_rate": 3.3581371177851336e-05, - "loss": 2.3116, - "step": 188300 - }, - { - "epoch": 0.33, - "learning_rate": 3.3580499237924506e-05, - "loss": 2.4097, - "step": 188310 - }, - { - "epoch": 0.33, - "learning_rate": 3.357962729799768e-05, - "loss": 2.435, - "step": 188320 - }, - { - "epoch": 0.33, - "learning_rate": 3.3578755358070854e-05, - "loss": 2.3724, - "step": 188330 - }, - { - "epoch": 0.33, - "learning_rate": 3.3577883418144024e-05, - "loss": 2.3298, - "step": 188340 - }, - { - "epoch": 0.33, - "learning_rate": 3.3577011478217195e-05, - "loss": 2.4695, - "step": 188350 - }, - { - "epoch": 0.33, - "learning_rate": 3.357613953829037e-05, - "loss": 2.5158, - "step": 188360 - }, - { - "epoch": 0.33, - "learning_rate": 3.357526759836355e-05, - "loss": 2.4352, - "step": 188370 - }, - { - "epoch": 0.33, - "learning_rate": 3.357439565843672e-05, - "loss": 2.4552, - "step": 188380 - }, - { - "epoch": 0.33, - "learning_rate": 3.357352371850989e-05, - "loss": 2.4107, - "step": 188390 - }, - { - "epoch": 0.33, - "learning_rate": 3.357265177858307e-05, - "loss": 2.498, - "step": 188400 - }, - { - "epoch": 0.33, - "learning_rate": 3.357177983865624e-05, - "loss": 2.459, - "step": 188410 - }, - { - "epoch": 0.33, - "learning_rate": 3.357090789872941e-05, - "loss": 2.37, - "step": 188420 - }, - { - "epoch": 0.33, - "learning_rate": 3.3570035958802585e-05, - "loss": 2.4365, - "step": 188430 - }, - { - "epoch": 0.33, - "learning_rate": 3.356916401887576e-05, - "loss": 2.631, - "step": 188440 - }, - { - "epoch": 0.33, - "learning_rate": 3.356829207894893e-05, - "loss": 2.5303, - "step": 188450 - }, - { - "epoch": 0.33, - "learning_rate": 3.35674201390221e-05, - "loss": 2.4006, - "step": 188460 - }, - { - "epoch": 0.33, - "learning_rate": 3.356654819909528e-05, - "loss": 2.4611, - "step": 188470 - }, - { - "epoch": 0.33, - "learning_rate": 3.356567625916845e-05, - "loss": 2.4934, - "step": 188480 - }, - { - "epoch": 0.33, - "learning_rate": 3.356480431924162e-05, - "loss": 2.465, - "step": 188490 - }, - { - "epoch": 0.33, - "learning_rate": 3.356393237931479e-05, - "loss": 2.4593, - "step": 188500 - }, - { - "epoch": 0.33, - "learning_rate": 3.3563060439387975e-05, - "loss": 2.4563, - "step": 188510 - }, - { - "epoch": 0.33, - "learning_rate": 3.3562188499461145e-05, - "loss": 2.3968, - "step": 188520 - }, - { - "epoch": 0.33, - "learning_rate": 3.3561316559534316e-05, - "loss": 2.5582, - "step": 188530 - }, - { - "epoch": 0.33, - "learning_rate": 3.356044461960749e-05, - "loss": 2.4697, - "step": 188540 - }, - { - "epoch": 0.33, - "learning_rate": 3.355957267968066e-05, - "loss": 2.3266, - "step": 188550 - }, - { - "epoch": 0.33, - "learning_rate": 3.3558700739753834e-05, - "loss": 2.5055, - "step": 188560 - }, - { - "epoch": 0.33, - "learning_rate": 3.3557828799827004e-05, - "loss": 2.5233, - "step": 188570 - }, - { - "epoch": 0.33, - "learning_rate": 3.355695685990018e-05, - "loss": 2.5394, - "step": 188580 - }, - { - "epoch": 0.33, - "learning_rate": 3.355608491997336e-05, - "loss": 2.4772, - "step": 188590 - }, - { - "epoch": 0.33, - "learning_rate": 3.355521298004653e-05, - "loss": 2.5527, - "step": 188600 - }, - { - "epoch": 0.33, - "learning_rate": 3.35543410401197e-05, - "loss": 2.4514, - "step": 188610 - }, - { - "epoch": 0.33, - "learning_rate": 3.3553469100192876e-05, - "loss": 2.3815, - "step": 188620 - }, - { - "epoch": 0.33, - "learning_rate": 3.3552597160266047e-05, - "loss": 2.4575, - "step": 188630 - }, - { - "epoch": 0.33, - "learning_rate": 3.355172522033922e-05, - "loss": 2.4541, - "step": 188640 - }, - { - "epoch": 0.33, - "learning_rate": 3.3550853280412394e-05, - "loss": 2.4547, - "step": 188650 - }, - { - "epoch": 0.33, - "learning_rate": 3.354998134048557e-05, - "loss": 2.5815, - "step": 188660 - }, - { - "epoch": 0.33, - "learning_rate": 3.354910940055874e-05, - "loss": 2.4729, - "step": 188670 - }, - { - "epoch": 0.33, - "learning_rate": 3.354823746063191e-05, - "loss": 2.4883, - "step": 188680 - }, - { - "epoch": 0.33, - "learning_rate": 3.354736552070509e-05, - "loss": 2.4641, - "step": 188690 - }, - { - "epoch": 0.33, - "learning_rate": 3.354649358077826e-05, - "loss": 2.4387, - "step": 188700 - }, - { - "epoch": 0.33, - "learning_rate": 3.354562164085143e-05, - "loss": 2.4269, - "step": 188710 - }, - { - "epoch": 0.33, - "learning_rate": 3.354474970092461e-05, - "loss": 2.3209, - "step": 188720 - }, - { - "epoch": 0.33, - "learning_rate": 3.354387776099778e-05, - "loss": 2.5372, - "step": 188730 - }, - { - "epoch": 0.33, - "learning_rate": 3.3543005821070955e-05, - "loss": 2.4825, - "step": 188740 - }, - { - "epoch": 0.33, - "learning_rate": 3.3542133881144125e-05, - "loss": 2.4641, - "step": 188750 - }, - { - "epoch": 0.33, - "learning_rate": 3.35412619412173e-05, - "loss": 2.4351, - "step": 188760 - }, - { - "epoch": 0.33, - "learning_rate": 3.354039000129047e-05, - "loss": 2.4893, - "step": 188770 - }, - { - "epoch": 0.33, - "learning_rate": 3.353951806136364e-05, - "loss": 2.456, - "step": 188780 - }, - { - "epoch": 0.33, - "learning_rate": 3.353864612143682e-05, - "loss": 2.4659, - "step": 188790 - }, - { - "epoch": 0.33, - "learning_rate": 3.353777418150999e-05, - "loss": 2.4726, - "step": 188800 - }, - { - "epoch": 0.33, - "learning_rate": 3.353690224158317e-05, - "loss": 2.3798, - "step": 188810 - }, - { - "epoch": 0.33, - "learning_rate": 3.353603030165634e-05, - "loss": 2.4226, - "step": 188820 - }, - { - "epoch": 0.33, - "learning_rate": 3.3535158361729515e-05, - "loss": 2.3944, - "step": 188830 - }, - { - "epoch": 0.33, - "learning_rate": 3.3534286421802686e-05, - "loss": 2.4519, - "step": 188840 - }, - { - "epoch": 0.33, - "learning_rate": 3.3533414481875856e-05, - "loss": 2.5094, - "step": 188850 - }, - { - "epoch": 0.33, - "learning_rate": 3.353254254194903e-05, - "loss": 2.4752, - "step": 188860 - }, - { - "epoch": 0.33, - "learning_rate": 3.3531670602022203e-05, - "loss": 2.4526, - "step": 188870 - }, - { - "epoch": 0.33, - "learning_rate": 3.3530798662095374e-05, - "loss": 2.3856, - "step": 188880 - }, - { - "epoch": 0.33, - "learning_rate": 3.352992672216855e-05, - "loss": 2.5045, - "step": 188890 - }, - { - "epoch": 0.33, - "learning_rate": 3.352905478224173e-05, - "loss": 2.5707, - "step": 188900 - }, - { - "epoch": 0.33, - "learning_rate": 3.35281828423149e-05, - "loss": 2.4387, - "step": 188910 - }, - { - "epoch": 0.33, - "learning_rate": 3.352731090238807e-05, - "loss": 2.3362, - "step": 188920 - }, - { - "epoch": 0.33, - "learning_rate": 3.3526438962461246e-05, - "loss": 2.3654, - "step": 188930 - }, - { - "epoch": 0.33, - "learning_rate": 3.3525567022534416e-05, - "loss": 2.4981, - "step": 188940 - }, - { - "epoch": 0.33, - "learning_rate": 3.352469508260759e-05, - "loss": 2.395, - "step": 188950 - }, - { - "epoch": 0.33, - "learning_rate": 3.3523823142680764e-05, - "loss": 2.4528, - "step": 188960 - }, - { - "epoch": 0.33, - "learning_rate": 3.352295120275394e-05, - "loss": 2.4737, - "step": 188970 - }, - { - "epoch": 0.33, - "learning_rate": 3.352207926282711e-05, - "loss": 2.3364, - "step": 188980 - }, - { - "epoch": 0.33, - "learning_rate": 3.352120732290028e-05, - "loss": 2.5527, - "step": 188990 - }, - { - "epoch": 0.33, - "learning_rate": 3.352033538297345e-05, - "loss": 2.3962, - "step": 189000 - }, - { - "epoch": 0.33, - "learning_rate": 3.351946344304663e-05, - "loss": 2.4004, - "step": 189010 - }, - { - "epoch": 0.33, - "learning_rate": 3.35185915031198e-05, - "loss": 2.4486, - "step": 189020 - }, - { - "epoch": 0.33, - "learning_rate": 3.351771956319298e-05, - "loss": 2.4786, - "step": 189030 - }, - { - "epoch": 0.33, - "learning_rate": 3.3516847623266154e-05, - "loss": 2.5427, - "step": 189040 - }, - { - "epoch": 0.33, - "learning_rate": 3.3515975683339325e-05, - "loss": 2.4162, - "step": 189050 - }, - { - "epoch": 0.33, - "learning_rate": 3.3515103743412495e-05, - "loss": 2.3391, - "step": 189060 - }, - { - "epoch": 0.33, - "learning_rate": 3.3514231803485665e-05, - "loss": 2.4635, - "step": 189070 - }, - { - "epoch": 0.33, - "learning_rate": 3.351335986355884e-05, - "loss": 2.417, - "step": 189080 - }, - { - "epoch": 0.33, - "learning_rate": 3.351248792363201e-05, - "loss": 2.3962, - "step": 189090 - }, - { - "epoch": 0.33, - "learning_rate": 3.351161598370518e-05, - "loss": 2.6302, - "step": 189100 - }, - { - "epoch": 0.33, - "learning_rate": 3.351074404377836e-05, - "loss": 2.4463, - "step": 189110 - }, - { - "epoch": 0.33, - "learning_rate": 3.350987210385154e-05, - "loss": 2.4588, - "step": 189120 - }, - { - "epoch": 0.33, - "learning_rate": 3.350900016392471e-05, - "loss": 2.3591, - "step": 189130 - }, - { - "epoch": 0.33, - "learning_rate": 3.350812822399788e-05, - "loss": 2.4357, - "step": 189140 - }, - { - "epoch": 0.33, - "learning_rate": 3.3507256284071055e-05, - "loss": 2.4485, - "step": 189150 - }, - { - "epoch": 0.33, - "learning_rate": 3.3506384344144226e-05, - "loss": 2.4804, - "step": 189160 - }, - { - "epoch": 0.33, - "learning_rate": 3.3505512404217396e-05, - "loss": 2.4532, - "step": 189170 - }, - { - "epoch": 0.33, - "learning_rate": 3.3504640464290573e-05, - "loss": 2.3312, - "step": 189180 - }, - { - "epoch": 0.33, - "learning_rate": 3.350376852436375e-05, - "loss": 2.4259, - "step": 189190 - }, - { - "epoch": 0.33, - "learning_rate": 3.350289658443692e-05, - "loss": 2.4539, - "step": 189200 - }, - { - "epoch": 0.33, - "learning_rate": 3.350202464451009e-05, - "loss": 2.545, - "step": 189210 - }, - { - "epoch": 0.33, - "learning_rate": 3.350115270458327e-05, - "loss": 2.4594, - "step": 189220 - }, - { - "epoch": 0.33, - "learning_rate": 3.350028076465644e-05, - "loss": 2.3898, - "step": 189230 - }, - { - "epoch": 0.33, - "learning_rate": 3.349940882472961e-05, - "loss": 2.5334, - "step": 189240 - }, - { - "epoch": 0.33, - "learning_rate": 3.3498536884802786e-05, - "loss": 2.3728, - "step": 189250 - }, - { - "epoch": 0.33, - "learning_rate": 3.3497664944875964e-05, - "loss": 2.3776, - "step": 189260 - }, - { - "epoch": 0.33, - "learning_rate": 3.3496793004949134e-05, - "loss": 2.4419, - "step": 189270 - }, - { - "epoch": 0.33, - "learning_rate": 3.3495921065022304e-05, - "loss": 2.4705, - "step": 189280 - }, - { - "epoch": 0.33, - "learning_rate": 3.349504912509548e-05, - "loss": 2.4252, - "step": 189290 - }, - { - "epoch": 0.33, - "learning_rate": 3.349417718516865e-05, - "loss": 2.415, - "step": 189300 - }, - { - "epoch": 0.33, - "learning_rate": 3.349330524524182e-05, - "loss": 2.3208, - "step": 189310 - }, - { - "epoch": 0.33, - "learning_rate": 3.3492433305315e-05, - "loss": 2.5459, - "step": 189320 - }, - { - "epoch": 0.33, - "learning_rate": 3.3491561365388177e-05, - "loss": 2.4719, - "step": 189330 - }, - { - "epoch": 0.33, - "learning_rate": 3.349068942546135e-05, - "loss": 2.3204, - "step": 189340 - }, - { - "epoch": 0.33, - "learning_rate": 3.348981748553452e-05, - "loss": 2.4498, - "step": 189350 - }, - { - "epoch": 0.33, - "learning_rate": 3.3488945545607694e-05, - "loss": 2.4479, - "step": 189360 - }, - { - "epoch": 0.33, - "learning_rate": 3.3488073605680865e-05, - "loss": 2.5143, - "step": 189370 - }, - { - "epoch": 0.33, - "learning_rate": 3.3487201665754035e-05, - "loss": 2.3713, - "step": 189380 - }, - { - "epoch": 0.33, - "learning_rate": 3.348632972582721e-05, - "loss": 2.3719, - "step": 189390 - }, - { - "epoch": 0.33, - "learning_rate": 3.348545778590038e-05, - "loss": 2.4116, - "step": 189400 - }, - { - "epoch": 0.33, - "learning_rate": 3.348458584597356e-05, - "loss": 2.4287, - "step": 189410 - }, - { - "epoch": 0.33, - "learning_rate": 3.348371390604673e-05, - "loss": 2.4713, - "step": 189420 - }, - { - "epoch": 0.33, - "learning_rate": 3.348284196611991e-05, - "loss": 2.4337, - "step": 189430 - }, - { - "epoch": 0.33, - "learning_rate": 3.348197002619308e-05, - "loss": 2.4378, - "step": 189440 - }, - { - "epoch": 0.33, - "learning_rate": 3.348109808626625e-05, - "loss": 2.375, - "step": 189450 - }, - { - "epoch": 0.33, - "learning_rate": 3.348022614633942e-05, - "loss": 2.4759, - "step": 189460 - }, - { - "epoch": 0.33, - "learning_rate": 3.3479354206412596e-05, - "loss": 2.5032, - "step": 189470 - }, - { - "epoch": 0.33, - "learning_rate": 3.347848226648577e-05, - "loss": 2.377, - "step": 189480 - }, - { - "epoch": 0.33, - "learning_rate": 3.347761032655894e-05, - "loss": 2.3652, - "step": 189490 - }, - { - "epoch": 0.33, - "learning_rate": 3.347673838663212e-05, - "loss": 2.517, - "step": 189500 - }, - { - "epoch": 0.33, - "learning_rate": 3.347586644670529e-05, - "loss": 2.5485, - "step": 189510 - }, - { - "epoch": 0.33, - "learning_rate": 3.347499450677846e-05, - "loss": 2.5048, - "step": 189520 - }, - { - "epoch": 0.33, - "learning_rate": 3.347412256685163e-05, - "loss": 2.5847, - "step": 189530 - }, - { - "epoch": 0.33, - "learning_rate": 3.347325062692481e-05, - "loss": 2.4297, - "step": 189540 - }, - { - "epoch": 0.33, - "learning_rate": 3.3472378686997986e-05, - "loss": 2.4619, - "step": 189550 - }, - { - "epoch": 0.33, - "learning_rate": 3.3471506747071156e-05, - "loss": 2.4174, - "step": 189560 - }, - { - "epoch": 0.33, - "learning_rate": 3.347063480714433e-05, - "loss": 2.5105, - "step": 189570 - }, - { - "epoch": 0.33, - "learning_rate": 3.3469762867217504e-05, - "loss": 2.4842, - "step": 189580 - }, - { - "epoch": 0.33, - "learning_rate": 3.3468890927290674e-05, - "loss": 2.4943, - "step": 189590 - }, - { - "epoch": 0.33, - "learning_rate": 3.3468018987363845e-05, - "loss": 2.3686, - "step": 189600 - }, - { - "epoch": 0.33, - "learning_rate": 3.346714704743702e-05, - "loss": 2.4572, - "step": 189610 - }, - { - "epoch": 0.33, - "learning_rate": 3.346627510751019e-05, - "loss": 2.3874, - "step": 189620 - }, - { - "epoch": 0.33, - "learning_rate": 3.346540316758337e-05, - "loss": 2.4242, - "step": 189630 - }, - { - "epoch": 0.33, - "learning_rate": 3.346453122765654e-05, - "loss": 2.2941, - "step": 189640 - }, - { - "epoch": 0.33, - "learning_rate": 3.346365928772972e-05, - "loss": 2.4447, - "step": 189650 - }, - { - "epoch": 0.33, - "learning_rate": 3.346278734780289e-05, - "loss": 2.4004, - "step": 189660 - }, - { - "epoch": 0.33, - "learning_rate": 3.346191540787606e-05, - "loss": 2.3907, - "step": 189670 - }, - { - "epoch": 0.33, - "learning_rate": 3.3461043467949235e-05, - "loss": 2.4707, - "step": 189680 - }, - { - "epoch": 0.33, - "learning_rate": 3.3460171528022405e-05, - "loss": 2.4773, - "step": 189690 - }, - { - "epoch": 0.33, - "learning_rate": 3.345929958809558e-05, - "loss": 2.4986, - "step": 189700 - }, - { - "epoch": 0.33, - "learning_rate": 3.345842764816875e-05, - "loss": 2.4874, - "step": 189710 - }, - { - "epoch": 0.33, - "learning_rate": 3.345755570824193e-05, - "loss": 2.5817, - "step": 189720 - }, - { - "epoch": 0.33, - "learning_rate": 3.34566837683151e-05, - "loss": 2.3001, - "step": 189730 - }, - { - "epoch": 0.33, - "learning_rate": 3.345581182838827e-05, - "loss": 2.5117, - "step": 189740 - }, - { - "epoch": 0.33, - "learning_rate": 3.345493988846145e-05, - "loss": 2.4254, - "step": 189750 - }, - { - "epoch": 0.33, - "learning_rate": 3.345406794853462e-05, - "loss": 2.4289, - "step": 189760 - }, - { - "epoch": 0.33, - "learning_rate": 3.345319600860779e-05, - "loss": 2.4878, - "step": 189770 - }, - { - "epoch": 0.33, - "learning_rate": 3.3452324068680966e-05, - "loss": 2.4707, - "step": 189780 - }, - { - "epoch": 0.33, - "learning_rate": 3.345145212875414e-05, - "loss": 2.4896, - "step": 189790 - }, - { - "epoch": 0.33, - "learning_rate": 3.345058018882731e-05, - "loss": 2.4485, - "step": 189800 - }, - { - "epoch": 0.33, - "learning_rate": 3.3449708248900484e-05, - "loss": 2.405, - "step": 189810 - }, - { - "epoch": 0.33, - "learning_rate": 3.344883630897366e-05, - "loss": 2.3866, - "step": 189820 - }, - { - "epoch": 0.33, - "learning_rate": 3.344796436904683e-05, - "loss": 2.4105, - "step": 189830 - }, - { - "epoch": 0.33, - "learning_rate": 3.344709242912e-05, - "loss": 2.4214, - "step": 189840 - }, - { - "epoch": 0.33, - "learning_rate": 3.344622048919318e-05, - "loss": 2.4637, - "step": 189850 - }, - { - "epoch": 0.33, - "learning_rate": 3.3445348549266356e-05, - "loss": 2.3966, - "step": 189860 - }, - { - "epoch": 0.33, - "learning_rate": 3.3444476609339526e-05, - "loss": 2.3942, - "step": 189870 - }, - { - "epoch": 0.33, - "learning_rate": 3.34436046694127e-05, - "loss": 2.3534, - "step": 189880 - }, - { - "epoch": 0.33, - "learning_rate": 3.3442732729485874e-05, - "loss": 2.4966, - "step": 189890 - }, - { - "epoch": 0.33, - "learning_rate": 3.3441860789559044e-05, - "loss": 2.4865, - "step": 189900 - }, - { - "epoch": 0.33, - "learning_rate": 3.3440988849632215e-05, - "loss": 2.5208, - "step": 189910 - }, - { - "epoch": 0.33, - "learning_rate": 3.3440116909705385e-05, - "loss": 2.5085, - "step": 189920 - }, - { - "epoch": 0.33, - "learning_rate": 3.343924496977857e-05, - "loss": 2.4809, - "step": 189930 - }, - { - "epoch": 0.33, - "learning_rate": 3.343837302985174e-05, - "loss": 2.4838, - "step": 189940 - }, - { - "epoch": 0.33, - "learning_rate": 3.343750108992491e-05, - "loss": 2.5057, - "step": 189950 - }, - { - "epoch": 0.33, - "learning_rate": 3.343662914999808e-05, - "loss": 2.4082, - "step": 189960 - }, - { - "epoch": 0.33, - "learning_rate": 3.343575721007126e-05, - "loss": 2.5087, - "step": 189970 - }, - { - "epoch": 0.33, - "learning_rate": 3.343488527014443e-05, - "loss": 2.3558, - "step": 189980 - }, - { - "epoch": 0.33, - "learning_rate": 3.34340133302176e-05, - "loss": 2.4274, - "step": 189990 - }, - { - "epoch": 0.33, - "learning_rate": 3.343314139029078e-05, - "loss": 2.3603, - "step": 190000 - }, - { - "epoch": 0.33, - "learning_rate": 3.343226945036395e-05, - "loss": 2.3927, - "step": 190010 - }, - { - "epoch": 0.33, - "learning_rate": 3.343139751043712e-05, - "loss": 2.4216, - "step": 190020 - }, - { - "epoch": 0.33, - "learning_rate": 3.343052557051029e-05, - "loss": 2.492, - "step": 190030 - }, - { - "epoch": 0.33, - "learning_rate": 3.342965363058347e-05, - "loss": 2.4217, - "step": 190040 - }, - { - "epoch": 0.33, - "learning_rate": 3.342878169065664e-05, - "loss": 2.4628, - "step": 190050 - }, - { - "epoch": 0.33, - "learning_rate": 3.342790975072981e-05, - "loss": 2.5597, - "step": 190060 - }, - { - "epoch": 0.33, - "learning_rate": 3.342703781080299e-05, - "loss": 2.4214, - "step": 190070 - }, - { - "epoch": 0.33, - "learning_rate": 3.3426165870876165e-05, - "loss": 2.4455, - "step": 190080 - }, - { - "epoch": 0.33, - "learning_rate": 3.3425293930949336e-05, - "loss": 2.3705, - "step": 190090 - }, - { - "epoch": 0.33, - "learning_rate": 3.3424421991022506e-05, - "loss": 2.4675, - "step": 190100 - }, - { - "epoch": 0.33, - "learning_rate": 3.342355005109568e-05, - "loss": 2.3701, - "step": 190110 - }, - { - "epoch": 0.33, - "learning_rate": 3.3422678111168854e-05, - "loss": 2.3746, - "step": 190120 - }, - { - "epoch": 0.33, - "learning_rate": 3.3421806171242024e-05, - "loss": 2.3206, - "step": 190130 - }, - { - "epoch": 0.33, - "learning_rate": 3.34209342313152e-05, - "loss": 2.4819, - "step": 190140 - }, - { - "epoch": 0.33, - "learning_rate": 3.342006229138838e-05, - "loss": 2.3426, - "step": 190150 - }, - { - "epoch": 0.33, - "learning_rate": 3.341919035146155e-05, - "loss": 2.2801, - "step": 190160 - }, - { - "epoch": 0.33, - "learning_rate": 3.341831841153472e-05, - "loss": 2.4322, - "step": 190170 - }, - { - "epoch": 0.33, - "learning_rate": 3.3417446471607896e-05, - "loss": 2.5053, - "step": 190180 - }, - { - "epoch": 0.33, - "learning_rate": 3.3416574531681067e-05, - "loss": 2.4894, - "step": 190190 - }, - { - "epoch": 0.33, - "learning_rate": 3.341570259175424e-05, - "loss": 2.2786, - "step": 190200 - }, - { - "epoch": 0.33, - "learning_rate": 3.3414830651827414e-05, - "loss": 2.4732, - "step": 190210 - }, - { - "epoch": 0.33, - "learning_rate": 3.341395871190059e-05, - "loss": 2.5745, - "step": 190220 - }, - { - "epoch": 0.33, - "learning_rate": 3.341308677197376e-05, - "loss": 2.4764, - "step": 190230 - }, - { - "epoch": 0.33, - "learning_rate": 3.341221483204693e-05, - "loss": 2.426, - "step": 190240 - }, - { - "epoch": 0.33, - "learning_rate": 3.341134289212011e-05, - "loss": 2.299, - "step": 190250 - }, - { - "epoch": 0.33, - "learning_rate": 3.341047095219328e-05, - "loss": 2.4376, - "step": 190260 - }, - { - "epoch": 0.33, - "learning_rate": 3.340959901226645e-05, - "loss": 2.357, - "step": 190270 - }, - { - "epoch": 0.33, - "learning_rate": 3.340872707233963e-05, - "loss": 2.3893, - "step": 190280 - }, - { - "epoch": 0.33, - "learning_rate": 3.34078551324128e-05, - "loss": 2.4699, - "step": 190290 - }, - { - "epoch": 0.33, - "learning_rate": 3.3406983192485975e-05, - "loss": 2.4328, - "step": 190300 - }, - { - "epoch": 0.33, - "learning_rate": 3.3406111252559145e-05, - "loss": 2.3998, - "step": 190310 - }, - { - "epoch": 0.33, - "learning_rate": 3.340523931263232e-05, - "loss": 2.4372, - "step": 190320 - }, - { - "epoch": 0.33, - "learning_rate": 3.340436737270549e-05, - "loss": 2.4449, - "step": 190330 - }, - { - "epoch": 0.33, - "learning_rate": 3.340349543277866e-05, - "loss": 2.4499, - "step": 190340 - }, - { - "epoch": 0.33, - "learning_rate": 3.340262349285183e-05, - "loss": 2.3565, - "step": 190350 - }, - { - "epoch": 0.33, - "learning_rate": 3.340175155292501e-05, - "loss": 2.4982, - "step": 190360 - }, - { - "epoch": 0.33, - "learning_rate": 3.340087961299819e-05, - "loss": 2.5079, - "step": 190370 - }, - { - "epoch": 0.33, - "learning_rate": 3.340000767307136e-05, - "loss": 2.5706, - "step": 190380 - }, - { - "epoch": 0.33, - "learning_rate": 3.3399135733144535e-05, - "loss": 2.2872, - "step": 190390 - }, - { - "epoch": 0.33, - "learning_rate": 3.3398263793217706e-05, - "loss": 2.3859, - "step": 190400 - }, - { - "epoch": 0.33, - "learning_rate": 3.3397391853290876e-05, - "loss": 2.3716, - "step": 190410 - }, - { - "epoch": 0.33, - "learning_rate": 3.3396519913364046e-05, - "loss": 2.2884, - "step": 190420 - }, - { - "epoch": 0.33, - "learning_rate": 3.3395647973437223e-05, - "loss": 2.5887, - "step": 190430 - }, - { - "epoch": 0.33, - "learning_rate": 3.3394776033510394e-05, - "loss": 2.4318, - "step": 190440 - }, - { - "epoch": 0.33, - "learning_rate": 3.339390409358357e-05, - "loss": 2.448, - "step": 190450 - }, - { - "epoch": 0.33, - "learning_rate": 3.339303215365674e-05, - "loss": 2.459, - "step": 190460 - }, - { - "epoch": 0.33, - "learning_rate": 3.339216021372992e-05, - "loss": 2.4976, - "step": 190470 - }, - { - "epoch": 0.33, - "learning_rate": 3.339128827380309e-05, - "loss": 2.3874, - "step": 190480 - }, - { - "epoch": 0.33, - "learning_rate": 3.339041633387626e-05, - "loss": 2.3926, - "step": 190490 - }, - { - "epoch": 0.33, - "learning_rate": 3.3389544393949436e-05, - "loss": 2.3924, - "step": 190500 - }, - { - "epoch": 0.33, - "learning_rate": 3.338867245402261e-05, - "loss": 2.5253, - "step": 190510 - }, - { - "epoch": 0.33, - "learning_rate": 3.3387800514095784e-05, - "loss": 2.4164, - "step": 190520 - }, - { - "epoch": 0.33, - "learning_rate": 3.3386928574168954e-05, - "loss": 2.409, - "step": 190530 - }, - { - "epoch": 0.33, - "learning_rate": 3.338605663424213e-05, - "loss": 2.4724, - "step": 190540 - }, - { - "epoch": 0.33, - "learning_rate": 3.33851846943153e-05, - "loss": 2.4732, - "step": 190550 - }, - { - "epoch": 0.33, - "learning_rate": 3.338431275438847e-05, - "loss": 2.5336, - "step": 190560 - }, - { - "epoch": 0.33, - "learning_rate": 3.338344081446165e-05, - "loss": 2.4003, - "step": 190570 - }, - { - "epoch": 0.33, - "learning_rate": 3.338256887453482e-05, - "loss": 2.4209, - "step": 190580 - }, - { - "epoch": 0.33, - "learning_rate": 3.338169693460799e-05, - "loss": 2.4703, - "step": 190590 - }, - { - "epoch": 0.33, - "learning_rate": 3.338082499468117e-05, - "loss": 2.3704, - "step": 190600 - }, - { - "epoch": 0.33, - "learning_rate": 3.3379953054754345e-05, - "loss": 2.2732, - "step": 190610 - }, - { - "epoch": 0.33, - "learning_rate": 3.3379081114827515e-05, - "loss": 2.3875, - "step": 190620 - }, - { - "epoch": 0.33, - "learning_rate": 3.3378209174900685e-05, - "loss": 2.3805, - "step": 190630 - }, - { - "epoch": 0.33, - "learning_rate": 3.337733723497386e-05, - "loss": 2.4338, - "step": 190640 - }, - { - "epoch": 0.33, - "learning_rate": 3.337646529504703e-05, - "loss": 2.4178, - "step": 190650 - }, - { - "epoch": 0.33, - "learning_rate": 3.33755933551202e-05, - "loss": 2.5433, - "step": 190660 - }, - { - "epoch": 0.33, - "learning_rate": 3.337472141519338e-05, - "loss": 2.404, - "step": 190670 - }, - { - "epoch": 0.33, - "learning_rate": 3.337384947526656e-05, - "loss": 2.4139, - "step": 190680 - }, - { - "epoch": 0.33, - "learning_rate": 3.337297753533973e-05, - "loss": 2.3875, - "step": 190690 - }, - { - "epoch": 0.33, - "learning_rate": 3.33721055954129e-05, - "loss": 2.4912, - "step": 190700 - }, - { - "epoch": 0.33, - "learning_rate": 3.3371233655486076e-05, - "loss": 2.434, - "step": 190710 - }, - { - "epoch": 0.33, - "learning_rate": 3.3370361715559246e-05, - "loss": 2.4334, - "step": 190720 - }, - { - "epoch": 0.33, - "learning_rate": 3.3369489775632416e-05, - "loss": 2.54, - "step": 190730 - }, - { - "epoch": 0.33, - "learning_rate": 3.3368617835705593e-05, - "loss": 2.4742, - "step": 190740 - }, - { - "epoch": 0.33, - "learning_rate": 3.336774589577877e-05, - "loss": 2.478, - "step": 190750 - }, - { - "epoch": 0.33, - "learning_rate": 3.336687395585194e-05, - "loss": 2.4799, - "step": 190760 - }, - { - "epoch": 0.33, - "learning_rate": 3.336600201592511e-05, - "loss": 2.3174, - "step": 190770 - }, - { - "epoch": 0.33, - "learning_rate": 3.336513007599829e-05, - "loss": 2.5017, - "step": 190780 - }, - { - "epoch": 0.33, - "learning_rate": 3.336425813607146e-05, - "loss": 2.3806, - "step": 190790 - }, - { - "epoch": 0.33, - "learning_rate": 3.336338619614463e-05, - "loss": 2.4903, - "step": 190800 - }, - { - "epoch": 0.33, - "learning_rate": 3.33625142562178e-05, - "loss": 2.4707, - "step": 190810 - }, - { - "epoch": 0.33, - "learning_rate": 3.3361642316290984e-05, - "loss": 2.4336, - "step": 190820 - }, - { - "epoch": 0.33, - "learning_rate": 3.3360770376364154e-05, - "loss": 2.4717, - "step": 190830 - }, - { - "epoch": 0.33, - "learning_rate": 3.3359898436437324e-05, - "loss": 2.4101, - "step": 190840 - }, - { - "epoch": 0.33, - "learning_rate": 3.33590264965105e-05, - "loss": 2.4818, - "step": 190850 - }, - { - "epoch": 0.33, - "learning_rate": 3.335815455658367e-05, - "loss": 2.4568, - "step": 190860 - }, - { - "epoch": 0.33, - "learning_rate": 3.335728261665684e-05, - "loss": 2.5177, - "step": 190870 - }, - { - "epoch": 0.33, - "learning_rate": 3.335641067673001e-05, - "loss": 2.3422, - "step": 190880 - }, - { - "epoch": 0.33, - "learning_rate": 3.3355538736803197e-05, - "loss": 2.4604, - "step": 190890 - }, - { - "epoch": 0.33, - "learning_rate": 3.335466679687637e-05, - "loss": 2.4187, - "step": 190900 - }, - { - "epoch": 0.33, - "learning_rate": 3.335379485694954e-05, - "loss": 2.4026, - "step": 190910 - }, - { - "epoch": 0.33, - "learning_rate": 3.335292291702271e-05, - "loss": 2.3168, - "step": 190920 - }, - { - "epoch": 0.33, - "learning_rate": 3.3352050977095885e-05, - "loss": 2.5947, - "step": 190930 - }, - { - "epoch": 0.33, - "learning_rate": 3.3351179037169055e-05, - "loss": 2.4356, - "step": 190940 - }, - { - "epoch": 0.33, - "learning_rate": 3.3350307097242226e-05, - "loss": 2.4428, - "step": 190950 - }, - { - "epoch": 0.33, - "learning_rate": 3.33494351573154e-05, - "loss": 2.3631, - "step": 190960 - }, - { - "epoch": 0.33, - "learning_rate": 3.334856321738858e-05, - "loss": 2.6188, - "step": 190970 - }, - { - "epoch": 0.33, - "learning_rate": 3.334769127746175e-05, - "loss": 2.4927, - "step": 190980 - }, - { - "epoch": 0.33, - "learning_rate": 3.334681933753492e-05, - "loss": 2.5502, - "step": 190990 - }, - { - "epoch": 0.33, - "learning_rate": 3.33459473976081e-05, - "loss": 2.5034, - "step": 191000 - }, - { - "epoch": 0.33, - "learning_rate": 3.334507545768127e-05, - "loss": 2.4449, - "step": 191010 - }, - { - "epoch": 0.33, - "learning_rate": 3.334420351775444e-05, - "loss": 2.4811, - "step": 191020 - }, - { - "epoch": 0.33, - "learning_rate": 3.3343331577827616e-05, - "loss": 2.5197, - "step": 191030 - }, - { - "epoch": 0.33, - "learning_rate": 3.334245963790079e-05, - "loss": 2.5593, - "step": 191040 - }, - { - "epoch": 0.33, - "learning_rate": 3.334158769797396e-05, - "loss": 2.424, - "step": 191050 - }, - { - "epoch": 0.33, - "learning_rate": 3.3340715758047134e-05, - "loss": 2.3978, - "step": 191060 - }, - { - "epoch": 0.33, - "learning_rate": 3.333984381812031e-05, - "loss": 2.4826, - "step": 191070 - }, - { - "epoch": 0.33, - "learning_rate": 3.333897187819348e-05, - "loss": 2.541, - "step": 191080 - }, - { - "epoch": 0.33, - "learning_rate": 3.333809993826665e-05, - "loss": 2.3744, - "step": 191090 - }, - { - "epoch": 0.33, - "learning_rate": 3.333722799833983e-05, - "loss": 2.4154, - "step": 191100 - }, - { - "epoch": 0.33, - "learning_rate": 3.3336356058413e-05, - "loss": 2.2399, - "step": 191110 - }, - { - "epoch": 0.33, - "learning_rate": 3.3335484118486176e-05, - "loss": 2.4484, - "step": 191120 - }, - { - "epoch": 0.33, - "learning_rate": 3.333461217855935e-05, - "loss": 2.2706, - "step": 191130 - }, - { - "epoch": 0.33, - "learning_rate": 3.3333740238632524e-05, - "loss": 2.4782, - "step": 191140 - }, - { - "epoch": 0.33, - "learning_rate": 3.3332868298705694e-05, - "loss": 2.4446, - "step": 191150 - }, - { - "epoch": 0.33, - "learning_rate": 3.3331996358778865e-05, - "loss": 2.5012, - "step": 191160 - }, - { - "epoch": 0.33, - "learning_rate": 3.333112441885204e-05, - "loss": 2.4386, - "step": 191170 - }, - { - "epoch": 0.33, - "learning_rate": 3.333025247892521e-05, - "loss": 2.3215, - "step": 191180 - }, - { - "epoch": 0.33, - "learning_rate": 3.332938053899839e-05, - "loss": 2.519, - "step": 191190 - }, - { - "epoch": 0.33, - "learning_rate": 3.332850859907156e-05, - "loss": 2.5019, - "step": 191200 - }, - { - "epoch": 0.33, - "learning_rate": 3.332763665914474e-05, - "loss": 2.4418, - "step": 191210 - }, - { - "epoch": 0.33, - "learning_rate": 3.332676471921791e-05, - "loss": 2.3303, - "step": 191220 - }, - { - "epoch": 0.33, - "learning_rate": 3.332589277929108e-05, - "loss": 2.472, - "step": 191230 - }, - { - "epoch": 0.33, - "learning_rate": 3.3325020839364255e-05, - "loss": 2.4854, - "step": 191240 - }, - { - "epoch": 0.33, - "learning_rate": 3.3324148899437425e-05, - "loss": 2.3412, - "step": 191250 - }, - { - "epoch": 0.33, - "learning_rate": 3.3323276959510596e-05, - "loss": 2.4379, - "step": 191260 - }, - { - "epoch": 0.33, - "learning_rate": 3.332240501958377e-05, - "loss": 2.372, - "step": 191270 - }, - { - "epoch": 0.33, - "learning_rate": 3.332153307965695e-05, - "loss": 2.5306, - "step": 191280 - }, - { - "epoch": 0.33, - "learning_rate": 3.332066113973012e-05, - "loss": 2.5011, - "step": 191290 - }, - { - "epoch": 0.33, - "learning_rate": 3.331978919980329e-05, - "loss": 2.4494, - "step": 191300 - }, - { - "epoch": 0.33, - "learning_rate": 3.331891725987646e-05, - "loss": 2.2895, - "step": 191310 - }, - { - "epoch": 0.33, - "learning_rate": 3.331804531994964e-05, - "loss": 2.3783, - "step": 191320 - }, - { - "epoch": 0.33, - "learning_rate": 3.331717338002281e-05, - "loss": 2.4078, - "step": 191330 - }, - { - "epoch": 0.33, - "learning_rate": 3.3316301440095986e-05, - "loss": 2.4505, - "step": 191340 - }, - { - "epoch": 0.33, - "learning_rate": 3.331542950016916e-05, - "loss": 2.4461, - "step": 191350 - }, - { - "epoch": 0.33, - "learning_rate": 3.331455756024233e-05, - "loss": 2.4529, - "step": 191360 - }, - { - "epoch": 0.33, - "learning_rate": 3.3313685620315504e-05, - "loss": 2.4609, - "step": 191370 - }, - { - "epoch": 0.33, - "learning_rate": 3.3312813680388674e-05, - "loss": 2.5884, - "step": 191380 - }, - { - "epoch": 0.33, - "learning_rate": 3.331194174046185e-05, - "loss": 2.3083, - "step": 191390 - }, - { - "epoch": 0.33, - "learning_rate": 3.331106980053502e-05, - "loss": 2.3947, - "step": 191400 - }, - { - "epoch": 0.33, - "learning_rate": 3.331019786060819e-05, - "loss": 2.5387, - "step": 191410 - }, - { - "epoch": 0.33, - "learning_rate": 3.330932592068137e-05, - "loss": 2.3948, - "step": 191420 - }, - { - "epoch": 0.33, - "learning_rate": 3.3308453980754546e-05, - "loss": 2.4072, - "step": 191430 - }, - { - "epoch": 0.33, - "learning_rate": 3.330758204082772e-05, - "loss": 2.3705, - "step": 191440 - }, - { - "epoch": 0.33, - "learning_rate": 3.330671010090089e-05, - "loss": 2.4317, - "step": 191450 - }, - { - "epoch": 0.33, - "learning_rate": 3.3305838160974064e-05, - "loss": 2.3718, - "step": 191460 - }, - { - "epoch": 0.33, - "learning_rate": 3.3304966221047235e-05, - "loss": 2.3715, - "step": 191470 - }, - { - "epoch": 0.33, - "learning_rate": 3.3304094281120405e-05, - "loss": 2.409, - "step": 191480 - }, - { - "epoch": 0.33, - "learning_rate": 3.330322234119358e-05, - "loss": 2.4777, - "step": 191490 - }, - { - "epoch": 0.33, - "learning_rate": 3.330235040126676e-05, - "loss": 2.4054, - "step": 191500 - }, - { - "epoch": 0.33, - "learning_rate": 3.330147846133993e-05, - "loss": 2.4156, - "step": 191510 - }, - { - "epoch": 0.33, - "learning_rate": 3.33006065214131e-05, - "loss": 2.39, - "step": 191520 - }, - { - "epoch": 0.33, - "learning_rate": 3.329973458148628e-05, - "loss": 2.4797, - "step": 191530 - }, - { - "epoch": 0.33, - "learning_rate": 3.329886264155945e-05, - "loss": 2.4143, - "step": 191540 - }, - { - "epoch": 0.33, - "learning_rate": 3.329799070163262e-05, - "loss": 2.2633, - "step": 191550 - }, - { - "epoch": 0.33, - "learning_rate": 3.3297118761705795e-05, - "loss": 2.3777, - "step": 191560 - }, - { - "epoch": 0.33, - "learning_rate": 3.329624682177897e-05, - "loss": 2.445, - "step": 191570 - }, - { - "epoch": 0.33, - "learning_rate": 3.329537488185214e-05, - "loss": 2.4504, - "step": 191580 - }, - { - "epoch": 0.33, - "learning_rate": 3.329450294192531e-05, - "loss": 2.47, - "step": 191590 - }, - { - "epoch": 0.33, - "learning_rate": 3.329363100199849e-05, - "loss": 2.294, - "step": 191600 - }, - { - "epoch": 0.33, - "learning_rate": 3.329275906207166e-05, - "loss": 2.39, - "step": 191610 - }, - { - "epoch": 0.33, - "learning_rate": 3.329188712214483e-05, - "loss": 2.5158, - "step": 191620 - }, - { - "epoch": 0.33, - "learning_rate": 3.329101518221801e-05, - "loss": 2.4104, - "step": 191630 - }, - { - "epoch": 0.33, - "learning_rate": 3.3290143242291185e-05, - "loss": 2.4792, - "step": 191640 - }, - { - "epoch": 0.33, - "learning_rate": 3.3289271302364356e-05, - "loss": 2.4448, - "step": 191650 - }, - { - "epoch": 0.33, - "learning_rate": 3.3288399362437526e-05, - "loss": 2.3836, - "step": 191660 - }, - { - "epoch": 0.33, - "learning_rate": 3.32875274225107e-05, - "loss": 2.6129, - "step": 191670 - }, - { - "epoch": 0.33, - "learning_rate": 3.3286655482583874e-05, - "loss": 2.3731, - "step": 191680 - }, - { - "epoch": 0.33, - "learning_rate": 3.3285783542657044e-05, - "loss": 2.3332, - "step": 191690 - }, - { - "epoch": 0.33, - "learning_rate": 3.3284911602730214e-05, - "loss": 2.5014, - "step": 191700 - }, - { - "epoch": 0.33, - "learning_rate": 3.32840396628034e-05, - "loss": 2.4134, - "step": 191710 - }, - { - "epoch": 0.33, - "learning_rate": 3.328316772287657e-05, - "loss": 2.4786, - "step": 191720 - }, - { - "epoch": 0.33, - "learning_rate": 3.328229578294974e-05, - "loss": 2.469, - "step": 191730 - }, - { - "epoch": 0.33, - "learning_rate": 3.3281423843022916e-05, - "loss": 2.4182, - "step": 191740 - }, - { - "epoch": 0.33, - "learning_rate": 3.3280551903096087e-05, - "loss": 2.4667, - "step": 191750 - }, - { - "epoch": 0.33, - "learning_rate": 3.327967996316926e-05, - "loss": 2.3379, - "step": 191760 - }, - { - "epoch": 0.33, - "learning_rate": 3.327880802324243e-05, - "loss": 2.291, - "step": 191770 - }, - { - "epoch": 0.33, - "learning_rate": 3.3277936083315605e-05, - "loss": 2.4346, - "step": 191780 - }, - { - "epoch": 0.33, - "learning_rate": 3.327706414338878e-05, - "loss": 2.3154, - "step": 191790 - }, - { - "epoch": 0.33, - "learning_rate": 3.327619220346195e-05, - "loss": 2.3453, - "step": 191800 - }, - { - "epoch": 0.33, - "learning_rate": 3.327532026353512e-05, - "loss": 2.4225, - "step": 191810 - }, - { - "epoch": 0.33, - "learning_rate": 3.32744483236083e-05, - "loss": 2.4165, - "step": 191820 - }, - { - "epoch": 0.33, - "learning_rate": 3.327357638368147e-05, - "loss": 2.2875, - "step": 191830 - }, - { - "epoch": 0.33, - "learning_rate": 3.327270444375464e-05, - "loss": 2.4933, - "step": 191840 - }, - { - "epoch": 0.33, - "learning_rate": 3.327183250382782e-05, - "loss": 2.3382, - "step": 191850 - }, - { - "epoch": 0.33, - "learning_rate": 3.3270960563900995e-05, - "loss": 2.5299, - "step": 191860 - }, - { - "epoch": 0.33, - "learning_rate": 3.3270088623974165e-05, - "loss": 2.4061, - "step": 191870 - }, - { - "epoch": 0.33, - "learning_rate": 3.3269216684047335e-05, - "loss": 2.3445, - "step": 191880 - }, - { - "epoch": 0.33, - "learning_rate": 3.326834474412051e-05, - "loss": 2.3511, - "step": 191890 - }, - { - "epoch": 0.33, - "learning_rate": 3.326747280419368e-05, - "loss": 2.5167, - "step": 191900 - }, - { - "epoch": 0.33, - "learning_rate": 3.326660086426685e-05, - "loss": 2.4076, - "step": 191910 - }, - { - "epoch": 0.33, - "learning_rate": 3.326572892434003e-05, - "loss": 2.4197, - "step": 191920 - }, - { - "epoch": 0.33, - "learning_rate": 3.32648569844132e-05, - "loss": 2.3165, - "step": 191930 - }, - { - "epoch": 0.33, - "learning_rate": 3.326398504448638e-05, - "loss": 2.5103, - "step": 191940 - }, - { - "epoch": 0.33, - "learning_rate": 3.326311310455955e-05, - "loss": 2.3432, - "step": 191950 - }, - { - "epoch": 0.33, - "learning_rate": 3.3262241164632726e-05, - "loss": 2.3434, - "step": 191960 - }, - { - "epoch": 0.33, - "learning_rate": 3.3261369224705896e-05, - "loss": 2.2802, - "step": 191970 - }, - { - "epoch": 0.33, - "learning_rate": 3.3260497284779066e-05, - "loss": 2.4481, - "step": 191980 - }, - { - "epoch": 0.33, - "learning_rate": 3.3259625344852244e-05, - "loss": 2.4515, - "step": 191990 - }, - { - "epoch": 0.33, - "learning_rate": 3.3258753404925414e-05, - "loss": 2.3934, - "step": 192000 - }, - { - "epoch": 0.33, - "learning_rate": 3.325788146499859e-05, - "loss": 2.4725, - "step": 192010 - }, - { - "epoch": 0.33, - "learning_rate": 3.325700952507176e-05, - "loss": 2.4504, - "step": 192020 - }, - { - "epoch": 0.33, - "learning_rate": 3.325613758514494e-05, - "loss": 2.4248, - "step": 192030 - }, - { - "epoch": 0.33, - "learning_rate": 3.325526564521811e-05, - "loss": 2.4741, - "step": 192040 - }, - { - "epoch": 0.33, - "learning_rate": 3.325439370529128e-05, - "loss": 2.3226, - "step": 192050 - }, - { - "epoch": 0.33, - "learning_rate": 3.3253521765364457e-05, - "loss": 2.538, - "step": 192060 - }, - { - "epoch": 0.33, - "learning_rate": 3.325264982543763e-05, - "loss": 2.3361, - "step": 192070 - }, - { - "epoch": 0.33, - "learning_rate": 3.3251777885510804e-05, - "loss": 2.454, - "step": 192080 - }, - { - "epoch": 0.33, - "learning_rate": 3.3250905945583974e-05, - "loss": 2.5529, - "step": 192090 - }, - { - "epoch": 0.33, - "learning_rate": 3.325003400565715e-05, - "loss": 2.5235, - "step": 192100 - }, - { - "epoch": 0.34, - "learning_rate": 3.324916206573032e-05, - "loss": 2.4516, - "step": 192110 - }, - { - "epoch": 0.34, - "learning_rate": 3.324829012580349e-05, - "loss": 2.4504, - "step": 192120 - }, - { - "epoch": 0.34, - "learning_rate": 3.324741818587667e-05, - "loss": 2.4027, - "step": 192130 - }, - { - "epoch": 0.34, - "learning_rate": 3.324654624594984e-05, - "loss": 2.3929, - "step": 192140 - }, - { - "epoch": 0.34, - "learning_rate": 3.324567430602301e-05, - "loss": 2.3891, - "step": 192150 - }, - { - "epoch": 0.34, - "learning_rate": 3.324480236609619e-05, - "loss": 2.4718, - "step": 192160 - }, - { - "epoch": 0.34, - "learning_rate": 3.3243930426169365e-05, - "loss": 2.4602, - "step": 192170 - }, - { - "epoch": 0.34, - "learning_rate": 3.3243058486242535e-05, - "loss": 2.4821, - "step": 192180 - }, - { - "epoch": 0.34, - "learning_rate": 3.3242186546315705e-05, - "loss": 2.4666, - "step": 192190 - }, - { - "epoch": 0.34, - "learning_rate": 3.324131460638888e-05, - "loss": 2.4397, - "step": 192200 - }, - { - "epoch": 0.34, - "learning_rate": 3.324044266646205e-05, - "loss": 2.3757, - "step": 192210 - }, - { - "epoch": 0.34, - "learning_rate": 3.323957072653522e-05, - "loss": 2.6443, - "step": 192220 - }, - { - "epoch": 0.34, - "learning_rate": 3.32386987866084e-05, - "loss": 2.377, - "step": 192230 - }, - { - "epoch": 0.34, - "learning_rate": 3.323782684668158e-05, - "loss": 2.4891, - "step": 192240 - }, - { - "epoch": 0.34, - "learning_rate": 3.323695490675475e-05, - "loss": 2.4077, - "step": 192250 - }, - { - "epoch": 0.34, - "learning_rate": 3.323608296682792e-05, - "loss": 2.3957, - "step": 192260 - }, - { - "epoch": 0.34, - "learning_rate": 3.323521102690109e-05, - "loss": 2.4682, - "step": 192270 - }, - { - "epoch": 0.34, - "learning_rate": 3.3234339086974266e-05, - "loss": 2.3475, - "step": 192280 - }, - { - "epoch": 0.34, - "learning_rate": 3.3233467147047436e-05, - "loss": 2.4577, - "step": 192290 - }, - { - "epoch": 0.34, - "learning_rate": 3.323259520712061e-05, - "loss": 2.4962, - "step": 192300 - }, - { - "epoch": 0.34, - "learning_rate": 3.323172326719379e-05, - "loss": 2.4228, - "step": 192310 - }, - { - "epoch": 0.34, - "learning_rate": 3.323085132726696e-05, - "loss": 2.4265, - "step": 192320 - }, - { - "epoch": 0.34, - "learning_rate": 3.322997938734013e-05, - "loss": 2.3484, - "step": 192330 - }, - { - "epoch": 0.34, - "learning_rate": 3.32291074474133e-05, - "loss": 2.4704, - "step": 192340 - }, - { - "epoch": 0.34, - "learning_rate": 3.322823550748648e-05, - "loss": 2.5081, - "step": 192350 - }, - { - "epoch": 0.34, - "learning_rate": 3.322736356755965e-05, - "loss": 2.3777, - "step": 192360 - }, - { - "epoch": 0.34, - "learning_rate": 3.322649162763282e-05, - "loss": 2.5145, - "step": 192370 - }, - { - "epoch": 0.34, - "learning_rate": 3.3225619687706e-05, - "loss": 2.3224, - "step": 192380 - }, - { - "epoch": 0.34, - "learning_rate": 3.3224747747779174e-05, - "loss": 2.5004, - "step": 192390 - }, - { - "epoch": 0.34, - "learning_rate": 3.3223875807852344e-05, - "loss": 2.4774, - "step": 192400 - }, - { - "epoch": 0.34, - "learning_rate": 3.3223003867925515e-05, - "loss": 2.5468, - "step": 192410 - }, - { - "epoch": 0.34, - "learning_rate": 3.322213192799869e-05, - "loss": 2.3892, - "step": 192420 - }, - { - "epoch": 0.34, - "learning_rate": 3.322125998807186e-05, - "loss": 2.3257, - "step": 192430 - }, - { - "epoch": 0.34, - "learning_rate": 3.322038804814503e-05, - "loss": 2.3381, - "step": 192440 - }, - { - "epoch": 0.34, - "learning_rate": 3.321951610821821e-05, - "loss": 2.42, - "step": 192450 - }, - { - "epoch": 0.34, - "learning_rate": 3.321864416829139e-05, - "loss": 2.322, - "step": 192460 - }, - { - "epoch": 0.34, - "learning_rate": 3.321777222836456e-05, - "loss": 2.3762, - "step": 192470 - }, - { - "epoch": 0.34, - "learning_rate": 3.321690028843773e-05, - "loss": 2.4978, - "step": 192480 - }, - { - "epoch": 0.34, - "learning_rate": 3.3216028348510905e-05, - "loss": 2.5228, - "step": 192490 - }, - { - "epoch": 0.34, - "learning_rate": 3.3215156408584075e-05, - "loss": 2.3638, - "step": 192500 - }, - { - "epoch": 0.34, - "learning_rate": 3.3214284468657246e-05, - "loss": 2.2971, - "step": 192510 - }, - { - "epoch": 0.34, - "learning_rate": 3.321341252873042e-05, - "loss": 2.4831, - "step": 192520 - }, - { - "epoch": 0.34, - "learning_rate": 3.32125405888036e-05, - "loss": 2.3396, - "step": 192530 - }, - { - "epoch": 0.34, - "learning_rate": 3.321166864887677e-05, - "loss": 2.3068, - "step": 192540 - }, - { - "epoch": 0.34, - "learning_rate": 3.321079670894994e-05, - "loss": 2.5457, - "step": 192550 - }, - { - "epoch": 0.34, - "learning_rate": 3.320992476902312e-05, - "loss": 2.411, - "step": 192560 - }, - { - "epoch": 0.34, - "learning_rate": 3.320905282909629e-05, - "loss": 2.486, - "step": 192570 - }, - { - "epoch": 0.34, - "learning_rate": 3.320818088916946e-05, - "loss": 2.4924, - "step": 192580 - }, - { - "epoch": 0.34, - "learning_rate": 3.3207308949242636e-05, - "loss": 2.4024, - "step": 192590 - }, - { - "epoch": 0.34, - "learning_rate": 3.3206437009315806e-05, - "loss": 2.5566, - "step": 192600 - }, - { - "epoch": 0.34, - "learning_rate": 3.320556506938898e-05, - "loss": 2.5425, - "step": 192610 - }, - { - "epoch": 0.34, - "learning_rate": 3.3204693129462154e-05, - "loss": 2.3568, - "step": 192620 - }, - { - "epoch": 0.34, - "learning_rate": 3.320382118953533e-05, - "loss": 2.4847, - "step": 192630 - }, - { - "epoch": 0.34, - "learning_rate": 3.32029492496085e-05, - "loss": 2.3947, - "step": 192640 - }, - { - "epoch": 0.34, - "learning_rate": 3.320207730968167e-05, - "loss": 2.3653, - "step": 192650 - }, - { - "epoch": 0.34, - "learning_rate": 3.320120536975484e-05, - "loss": 2.4084, - "step": 192660 - }, - { - "epoch": 0.34, - "learning_rate": 3.320033342982802e-05, - "loss": 2.2821, - "step": 192670 - }, - { - "epoch": 0.34, - "learning_rate": 3.3199461489901196e-05, - "loss": 2.394, - "step": 192680 - }, - { - "epoch": 0.34, - "learning_rate": 3.319858954997437e-05, - "loss": 2.3042, - "step": 192690 - }, - { - "epoch": 0.34, - "learning_rate": 3.3197717610047544e-05, - "loss": 2.3762, - "step": 192700 - }, - { - "epoch": 0.34, - "learning_rate": 3.3196845670120714e-05, - "loss": 2.5112, - "step": 192710 - }, - { - "epoch": 0.34, - "learning_rate": 3.3195973730193885e-05, - "loss": 2.4113, - "step": 192720 - }, - { - "epoch": 0.34, - "learning_rate": 3.3195101790267055e-05, - "loss": 2.4546, - "step": 192730 - }, - { - "epoch": 0.34, - "learning_rate": 3.319422985034023e-05, - "loss": 2.3143, - "step": 192740 - }, - { - "epoch": 0.34, - "learning_rate": 3.319335791041341e-05, - "loss": 2.5473, - "step": 192750 - }, - { - "epoch": 0.34, - "learning_rate": 3.319248597048658e-05, - "loss": 2.3107, - "step": 192760 - }, - { - "epoch": 0.34, - "learning_rate": 3.319161403055975e-05, - "loss": 2.3703, - "step": 192770 - }, - { - "epoch": 0.34, - "learning_rate": 3.319074209063293e-05, - "loss": 2.5208, - "step": 192780 - }, - { - "epoch": 0.34, - "learning_rate": 3.31898701507061e-05, - "loss": 2.4401, - "step": 192790 - }, - { - "epoch": 0.34, - "learning_rate": 3.318899821077927e-05, - "loss": 2.3506, - "step": 192800 - }, - { - "epoch": 0.34, - "learning_rate": 3.3188126270852445e-05, - "loss": 2.3429, - "step": 192810 - }, - { - "epoch": 0.34, - "learning_rate": 3.3187254330925616e-05, - "loss": 2.455, - "step": 192820 - }, - { - "epoch": 0.34, - "learning_rate": 3.318638239099879e-05, - "loss": 2.3035, - "step": 192830 - }, - { - "epoch": 0.34, - "learning_rate": 3.318551045107196e-05, - "loss": 2.4524, - "step": 192840 - }, - { - "epoch": 0.34, - "learning_rate": 3.318463851114514e-05, - "loss": 2.4177, - "step": 192850 - }, - { - "epoch": 0.34, - "learning_rate": 3.318376657121831e-05, - "loss": 2.4365, - "step": 192860 - }, - { - "epoch": 0.34, - "learning_rate": 3.318289463129148e-05, - "loss": 2.3642, - "step": 192870 - }, - { - "epoch": 0.34, - "learning_rate": 3.318202269136466e-05, - "loss": 2.5531, - "step": 192880 - }, - { - "epoch": 0.34, - "learning_rate": 3.318115075143783e-05, - "loss": 2.5109, - "step": 192890 - }, - { - "epoch": 0.34, - "learning_rate": 3.3180278811511006e-05, - "loss": 2.4013, - "step": 192900 - }, - { - "epoch": 0.34, - "learning_rate": 3.3179406871584176e-05, - "loss": 2.3285, - "step": 192910 - }, - { - "epoch": 0.34, - "learning_rate": 3.317853493165735e-05, - "loss": 2.3825, - "step": 192920 - }, - { - "epoch": 0.34, - "learning_rate": 3.3177662991730524e-05, - "loss": 2.3802, - "step": 192930 - }, - { - "epoch": 0.34, - "learning_rate": 3.3176791051803694e-05, - "loss": 2.4713, - "step": 192940 - }, - { - "epoch": 0.34, - "learning_rate": 3.317591911187687e-05, - "loss": 2.4325, - "step": 192950 - }, - { - "epoch": 0.34, - "learning_rate": 3.317504717195004e-05, - "loss": 2.4037, - "step": 192960 - }, - { - "epoch": 0.34, - "learning_rate": 3.317417523202321e-05, - "loss": 2.4993, - "step": 192970 - }, - { - "epoch": 0.34, - "learning_rate": 3.317330329209639e-05, - "loss": 2.3834, - "step": 192980 - }, - { - "epoch": 0.34, - "learning_rate": 3.3172431352169566e-05, - "loss": 2.5672, - "step": 192990 - }, - { - "epoch": 0.34, - "learning_rate": 3.317155941224274e-05, - "loss": 2.4699, - "step": 193000 - }, - { - "epoch": 0.34, - "learning_rate": 3.317068747231591e-05, - "loss": 2.4578, - "step": 193010 - }, - { - "epoch": 0.34, - "learning_rate": 3.3169815532389084e-05, - "loss": 2.4521, - "step": 193020 - }, - { - "epoch": 0.34, - "learning_rate": 3.3168943592462255e-05, - "loss": 2.4899, - "step": 193030 - }, - { - "epoch": 0.34, - "learning_rate": 3.3168071652535425e-05, - "loss": 2.393, - "step": 193040 - }, - { - "epoch": 0.34, - "learning_rate": 3.31671997126086e-05, - "loss": 2.4331, - "step": 193050 - }, - { - "epoch": 0.34, - "learning_rate": 3.316632777268178e-05, - "loss": 2.4286, - "step": 193060 - }, - { - "epoch": 0.34, - "learning_rate": 3.316545583275495e-05, - "loss": 2.4385, - "step": 193070 - }, - { - "epoch": 0.34, - "learning_rate": 3.316458389282812e-05, - "loss": 2.4328, - "step": 193080 - }, - { - "epoch": 0.34, - "learning_rate": 3.31637119529013e-05, - "loss": 2.5086, - "step": 193090 - }, - { - "epoch": 0.34, - "learning_rate": 3.316284001297447e-05, - "loss": 2.4362, - "step": 193100 - }, - { - "epoch": 0.34, - "learning_rate": 3.316196807304764e-05, - "loss": 2.4469, - "step": 193110 - }, - { - "epoch": 0.34, - "learning_rate": 3.316109613312081e-05, - "loss": 2.4381, - "step": 193120 - }, - { - "epoch": 0.34, - "learning_rate": 3.316022419319399e-05, - "loss": 2.3801, - "step": 193130 - }, - { - "epoch": 0.34, - "learning_rate": 3.315935225326716e-05, - "loss": 2.4589, - "step": 193140 - }, - { - "epoch": 0.34, - "learning_rate": 3.315848031334033e-05, - "loss": 2.4109, - "step": 193150 - }, - { - "epoch": 0.34, - "learning_rate": 3.3157608373413503e-05, - "loss": 2.325, - "step": 193160 - }, - { - "epoch": 0.34, - "learning_rate": 3.315673643348668e-05, - "loss": 2.3225, - "step": 193170 - }, - { - "epoch": 0.34, - "learning_rate": 3.315586449355985e-05, - "loss": 2.4517, - "step": 193180 - }, - { - "epoch": 0.34, - "learning_rate": 3.315499255363302e-05, - "loss": 2.51, - "step": 193190 - }, - { - "epoch": 0.34, - "learning_rate": 3.3154120613706205e-05, - "loss": 2.457, - "step": 193200 - }, - { - "epoch": 0.34, - "learning_rate": 3.3153248673779376e-05, - "loss": 2.3673, - "step": 193210 - }, - { - "epoch": 0.34, - "learning_rate": 3.3152376733852546e-05, - "loss": 2.4826, - "step": 193220 - }, - { - "epoch": 0.34, - "learning_rate": 3.3151504793925716e-05, - "loss": 2.4564, - "step": 193230 - }, - { - "epoch": 0.34, - "learning_rate": 3.3150632853998894e-05, - "loss": 2.4204, - "step": 193240 - }, - { - "epoch": 0.34, - "learning_rate": 3.3149760914072064e-05, - "loss": 2.3578, - "step": 193250 - }, - { - "epoch": 0.34, - "learning_rate": 3.3148888974145234e-05, - "loss": 2.4918, - "step": 193260 - }, - { - "epoch": 0.34, - "learning_rate": 3.314801703421841e-05, - "loss": 2.4652, - "step": 193270 - }, - { - "epoch": 0.34, - "learning_rate": 3.314714509429159e-05, - "loss": 2.446, - "step": 193280 - }, - { - "epoch": 0.34, - "learning_rate": 3.314627315436476e-05, - "loss": 2.4129, - "step": 193290 - }, - { - "epoch": 0.34, - "learning_rate": 3.314540121443793e-05, - "loss": 2.2954, - "step": 193300 - }, - { - "epoch": 0.34, - "learning_rate": 3.3144529274511107e-05, - "loss": 2.4354, - "step": 193310 - }, - { - "epoch": 0.34, - "learning_rate": 3.314365733458428e-05, - "loss": 2.3995, - "step": 193320 - }, - { - "epoch": 0.34, - "learning_rate": 3.314278539465745e-05, - "loss": 2.5063, - "step": 193330 - }, - { - "epoch": 0.34, - "learning_rate": 3.3141913454730625e-05, - "loss": 2.4427, - "step": 193340 - }, - { - "epoch": 0.34, - "learning_rate": 3.31410415148038e-05, - "loss": 2.4377, - "step": 193350 - }, - { - "epoch": 0.34, - "learning_rate": 3.314016957487697e-05, - "loss": 2.4731, - "step": 193360 - }, - { - "epoch": 0.34, - "learning_rate": 3.313929763495014e-05, - "loss": 2.4404, - "step": 193370 - }, - { - "epoch": 0.34, - "learning_rate": 3.313842569502332e-05, - "loss": 2.4158, - "step": 193380 - }, - { - "epoch": 0.34, - "learning_rate": 3.313755375509649e-05, - "loss": 2.3362, - "step": 193390 - }, - { - "epoch": 0.34, - "learning_rate": 3.313668181516966e-05, - "loss": 2.4743, - "step": 193400 - }, - { - "epoch": 0.34, - "learning_rate": 3.313580987524284e-05, - "loss": 2.4323, - "step": 193410 - }, - { - "epoch": 0.34, - "learning_rate": 3.3134937935316015e-05, - "loss": 2.2747, - "step": 193420 - }, - { - "epoch": 0.34, - "learning_rate": 3.3134065995389185e-05, - "loss": 2.4482, - "step": 193430 - }, - { - "epoch": 0.34, - "learning_rate": 3.3133194055462355e-05, - "loss": 2.4293, - "step": 193440 - }, - { - "epoch": 0.34, - "learning_rate": 3.313232211553553e-05, - "loss": 2.3803, - "step": 193450 - }, - { - "epoch": 0.34, - "learning_rate": 3.31314501756087e-05, - "loss": 2.4494, - "step": 193460 - }, - { - "epoch": 0.34, - "learning_rate": 3.313057823568187e-05, - "loss": 2.4583, - "step": 193470 - }, - { - "epoch": 0.34, - "learning_rate": 3.312970629575505e-05, - "loss": 2.5495, - "step": 193480 - }, - { - "epoch": 0.34, - "learning_rate": 3.312883435582822e-05, - "loss": 2.4301, - "step": 193490 - }, - { - "epoch": 0.34, - "learning_rate": 3.31279624159014e-05, - "loss": 2.3632, - "step": 193500 - }, - { - "epoch": 0.34, - "learning_rate": 3.312709047597457e-05, - "loss": 2.455, - "step": 193510 - }, - { - "epoch": 0.34, - "learning_rate": 3.3126218536047746e-05, - "loss": 2.4514, - "step": 193520 - }, - { - "epoch": 0.34, - "learning_rate": 3.3125346596120916e-05, - "loss": 2.3447, - "step": 193530 - }, - { - "epoch": 0.34, - "learning_rate": 3.3124474656194086e-05, - "loss": 2.4309, - "step": 193540 - }, - { - "epoch": 0.34, - "learning_rate": 3.3123602716267264e-05, - "loss": 2.5727, - "step": 193550 - }, - { - "epoch": 0.34, - "learning_rate": 3.3122730776340434e-05, - "loss": 2.3626, - "step": 193560 - }, - { - "epoch": 0.34, - "learning_rate": 3.312185883641361e-05, - "loss": 2.3082, - "step": 193570 - }, - { - "epoch": 0.34, - "learning_rate": 3.312098689648678e-05, - "loss": 2.4508, - "step": 193580 - }, - { - "epoch": 0.34, - "learning_rate": 3.312011495655996e-05, - "loss": 2.45, - "step": 193590 - }, - { - "epoch": 0.34, - "learning_rate": 3.311924301663313e-05, - "loss": 2.4831, - "step": 193600 - }, - { - "epoch": 0.34, - "learning_rate": 3.31183710767063e-05, - "loss": 2.4057, - "step": 193610 - }, - { - "epoch": 0.34, - "learning_rate": 3.311749913677947e-05, - "loss": 2.4203, - "step": 193620 - }, - { - "epoch": 0.34, - "learning_rate": 3.311662719685265e-05, - "loss": 2.4026, - "step": 193630 - }, - { - "epoch": 0.34, - "learning_rate": 3.311575525692582e-05, - "loss": 2.4461, - "step": 193640 - }, - { - "epoch": 0.34, - "learning_rate": 3.3114883316998994e-05, - "loss": 2.5093, - "step": 193650 - }, - { - "epoch": 0.34, - "learning_rate": 3.311401137707217e-05, - "loss": 2.4198, - "step": 193660 - }, - { - "epoch": 0.34, - "learning_rate": 3.311313943714534e-05, - "loss": 2.4377, - "step": 193670 - }, - { - "epoch": 0.34, - "learning_rate": 3.311226749721851e-05, - "loss": 2.3823, - "step": 193680 - }, - { - "epoch": 0.34, - "learning_rate": 3.311139555729168e-05, - "loss": 2.4657, - "step": 193690 - }, - { - "epoch": 0.34, - "learning_rate": 3.311052361736486e-05, - "loss": 2.4662, - "step": 193700 - }, - { - "epoch": 0.34, - "learning_rate": 3.310965167743803e-05, - "loss": 2.4642, - "step": 193710 - }, - { - "epoch": 0.34, - "learning_rate": 3.310877973751121e-05, - "loss": 2.4697, - "step": 193720 - }, - { - "epoch": 0.34, - "learning_rate": 3.310790779758438e-05, - "loss": 2.3557, - "step": 193730 - }, - { - "epoch": 0.34, - "learning_rate": 3.3107035857657555e-05, - "loss": 2.4406, - "step": 193740 - }, - { - "epoch": 0.34, - "learning_rate": 3.3106163917730725e-05, - "loss": 2.4376, - "step": 193750 - }, - { - "epoch": 0.34, - "learning_rate": 3.3105291977803896e-05, - "loss": 2.328, - "step": 193760 - }, - { - "epoch": 0.34, - "learning_rate": 3.310442003787707e-05, - "loss": 2.4054, - "step": 193770 - }, - { - "epoch": 0.34, - "learning_rate": 3.310354809795024e-05, - "loss": 2.2929, - "step": 193780 - }, - { - "epoch": 0.34, - "learning_rate": 3.3102676158023414e-05, - "loss": 2.5431, - "step": 193790 - }, - { - "epoch": 0.34, - "learning_rate": 3.310180421809659e-05, - "loss": 2.3436, - "step": 193800 - }, - { - "epoch": 0.34, - "learning_rate": 3.310093227816977e-05, - "loss": 2.4661, - "step": 193810 - }, - { - "epoch": 0.34, - "learning_rate": 3.310006033824294e-05, - "loss": 2.4452, - "step": 193820 - }, - { - "epoch": 0.34, - "learning_rate": 3.309918839831611e-05, - "loss": 2.4171, - "step": 193830 - }, - { - "epoch": 0.34, - "learning_rate": 3.3098316458389286e-05, - "loss": 2.4338, - "step": 193840 - }, - { - "epoch": 0.34, - "learning_rate": 3.3097444518462456e-05, - "loss": 2.3268, - "step": 193850 - }, - { - "epoch": 0.34, - "learning_rate": 3.309657257853563e-05, - "loss": 2.4305, - "step": 193860 - }, - { - "epoch": 0.34, - "learning_rate": 3.3095700638608804e-05, - "loss": 2.3772, - "step": 193870 - }, - { - "epoch": 0.34, - "learning_rate": 3.309482869868198e-05, - "loss": 2.4303, - "step": 193880 - }, - { - "epoch": 0.34, - "learning_rate": 3.309395675875515e-05, - "loss": 2.3843, - "step": 193890 - }, - { - "epoch": 0.34, - "learning_rate": 3.309308481882832e-05, - "loss": 2.3819, - "step": 193900 - }, - { - "epoch": 0.34, - "learning_rate": 3.30922128789015e-05, - "loss": 2.4441, - "step": 193910 - }, - { - "epoch": 0.34, - "learning_rate": 3.309134093897467e-05, - "loss": 2.4818, - "step": 193920 - }, - { - "epoch": 0.34, - "learning_rate": 3.309046899904784e-05, - "loss": 2.4069, - "step": 193930 - }, - { - "epoch": 0.34, - "learning_rate": 3.308959705912102e-05, - "loss": 2.4206, - "step": 193940 - }, - { - "epoch": 0.34, - "learning_rate": 3.3088725119194194e-05, - "loss": 2.3917, - "step": 193950 - }, - { - "epoch": 0.34, - "learning_rate": 3.3087853179267364e-05, - "loss": 2.4352, - "step": 193960 - }, - { - "epoch": 0.34, - "learning_rate": 3.3086981239340535e-05, - "loss": 2.3454, - "step": 193970 - }, - { - "epoch": 0.34, - "learning_rate": 3.308610929941371e-05, - "loss": 2.5658, - "step": 193980 - }, - { - "epoch": 0.34, - "learning_rate": 3.308523735948688e-05, - "loss": 2.4465, - "step": 193990 - }, - { - "epoch": 0.34, - "learning_rate": 3.308436541956005e-05, - "loss": 2.3165, - "step": 194000 - }, - { - "epoch": 0.34, - "learning_rate": 3.308349347963322e-05, - "loss": 2.3528, - "step": 194010 - }, - { - "epoch": 0.34, - "learning_rate": 3.308262153970641e-05, - "loss": 2.3399, - "step": 194020 - }, - { - "epoch": 0.34, - "learning_rate": 3.308174959977958e-05, - "loss": 2.5062, - "step": 194030 - }, - { - "epoch": 0.34, - "learning_rate": 3.308087765985275e-05, - "loss": 2.4537, - "step": 194040 - }, - { - "epoch": 0.34, - "learning_rate": 3.3080005719925925e-05, - "loss": 2.4072, - "step": 194050 - }, - { - "epoch": 0.34, - "learning_rate": 3.3079133779999095e-05, - "loss": 2.4253, - "step": 194060 - }, - { - "epoch": 0.34, - "learning_rate": 3.3078261840072266e-05, - "loss": 2.3759, - "step": 194070 - }, - { - "epoch": 0.34, - "learning_rate": 3.3077389900145436e-05, - "loss": 2.3782, - "step": 194080 - }, - { - "epoch": 0.34, - "learning_rate": 3.307651796021862e-05, - "loss": 2.3931, - "step": 194090 - }, - { - "epoch": 0.34, - "learning_rate": 3.307564602029179e-05, - "loss": 2.3278, - "step": 194100 - }, - { - "epoch": 0.34, - "learning_rate": 3.307477408036496e-05, - "loss": 2.3083, - "step": 194110 - }, - { - "epoch": 0.34, - "learning_rate": 3.307390214043813e-05, - "loss": 2.4369, - "step": 194120 - }, - { - "epoch": 0.34, - "learning_rate": 3.307303020051131e-05, - "loss": 2.4228, - "step": 194130 - }, - { - "epoch": 0.34, - "learning_rate": 3.307215826058448e-05, - "loss": 2.353, - "step": 194140 - }, - { - "epoch": 0.34, - "learning_rate": 3.307128632065765e-05, - "loss": 2.3752, - "step": 194150 - }, - { - "epoch": 0.34, - "learning_rate": 3.3070414380730826e-05, - "loss": 2.4835, - "step": 194160 - }, - { - "epoch": 0.34, - "learning_rate": 3.3069542440804e-05, - "loss": 2.3901, - "step": 194170 - }, - { - "epoch": 0.34, - "learning_rate": 3.3068670500877174e-05, - "loss": 2.3488, - "step": 194180 - }, - { - "epoch": 0.34, - "learning_rate": 3.3067798560950344e-05, - "loss": 2.3111, - "step": 194190 - }, - { - "epoch": 0.34, - "learning_rate": 3.306692662102352e-05, - "loss": 2.4337, - "step": 194200 - }, - { - "epoch": 0.34, - "learning_rate": 3.306605468109669e-05, - "loss": 2.4515, - "step": 194210 - }, - { - "epoch": 0.34, - "learning_rate": 3.306518274116986e-05, - "loss": 2.4374, - "step": 194220 - }, - { - "epoch": 0.34, - "learning_rate": 3.306431080124304e-05, - "loss": 2.5623, - "step": 194230 - }, - { - "epoch": 0.34, - "learning_rate": 3.3063438861316216e-05, - "loss": 2.4458, - "step": 194240 - }, - { - "epoch": 0.34, - "learning_rate": 3.306256692138939e-05, - "loss": 2.4435, - "step": 194250 - }, - { - "epoch": 0.34, - "learning_rate": 3.306169498146256e-05, - "loss": 2.5066, - "step": 194260 - }, - { - "epoch": 0.34, - "learning_rate": 3.3060823041535734e-05, - "loss": 2.4488, - "step": 194270 - }, - { - "epoch": 0.34, - "learning_rate": 3.3059951101608905e-05, - "loss": 2.4348, - "step": 194280 - }, - { - "epoch": 0.34, - "learning_rate": 3.3059079161682075e-05, - "loss": 2.374, - "step": 194290 - }, - { - "epoch": 0.34, - "learning_rate": 3.305820722175525e-05, - "loss": 2.341, - "step": 194300 - }, - { - "epoch": 0.34, - "learning_rate": 3.305733528182842e-05, - "loss": 2.4225, - "step": 194310 - }, - { - "epoch": 0.34, - "learning_rate": 3.30564633419016e-05, - "loss": 2.4747, - "step": 194320 - }, - { - "epoch": 0.34, - "learning_rate": 3.305559140197477e-05, - "loss": 2.4524, - "step": 194330 - }, - { - "epoch": 0.34, - "learning_rate": 3.305471946204795e-05, - "loss": 2.4515, - "step": 194340 - }, - { - "epoch": 0.34, - "learning_rate": 3.305384752212112e-05, - "loss": 2.4063, - "step": 194350 - }, - { - "epoch": 0.34, - "learning_rate": 3.305297558219429e-05, - "loss": 2.5356, - "step": 194360 - }, - { - "epoch": 0.34, - "learning_rate": 3.3052103642267465e-05, - "loss": 2.4062, - "step": 194370 - }, - { - "epoch": 0.34, - "learning_rate": 3.3051231702340636e-05, - "loss": 2.4851, - "step": 194380 - }, - { - "epoch": 0.34, - "learning_rate": 3.305035976241381e-05, - "loss": 2.4727, - "step": 194390 - }, - { - "epoch": 0.34, - "learning_rate": 3.304948782248698e-05, - "loss": 2.4758, - "step": 194400 - }, - { - "epoch": 0.34, - "learning_rate": 3.304861588256016e-05, - "loss": 2.4609, - "step": 194410 - }, - { - "epoch": 0.34, - "learning_rate": 3.304774394263333e-05, - "loss": 2.4537, - "step": 194420 - }, - { - "epoch": 0.34, - "learning_rate": 3.30468720027065e-05, - "loss": 2.4332, - "step": 194430 - }, - { - "epoch": 0.34, - "learning_rate": 3.304600006277968e-05, - "loss": 2.3538, - "step": 194440 - }, - { - "epoch": 0.34, - "learning_rate": 3.304512812285285e-05, - "loss": 2.4692, - "step": 194450 - }, - { - "epoch": 0.34, - "learning_rate": 3.304425618292602e-05, - "loss": 2.4031, - "step": 194460 - }, - { - "epoch": 0.34, - "learning_rate": 3.3043384242999196e-05, - "loss": 2.433, - "step": 194470 - }, - { - "epoch": 0.34, - "learning_rate": 3.304251230307237e-05, - "loss": 2.419, - "step": 194480 - }, - { - "epoch": 0.34, - "learning_rate": 3.3041640363145544e-05, - "loss": 2.4645, - "step": 194490 - }, - { - "epoch": 0.34, - "learning_rate": 3.3040768423218714e-05, - "loss": 2.4822, - "step": 194500 - }, - { - "epoch": 0.34, - "learning_rate": 3.3039896483291884e-05, - "loss": 2.4139, - "step": 194510 - }, - { - "epoch": 0.34, - "learning_rate": 3.303902454336506e-05, - "loss": 2.3682, - "step": 194520 - }, - { - "epoch": 0.34, - "learning_rate": 3.303815260343823e-05, - "loss": 2.3006, - "step": 194530 - }, - { - "epoch": 0.34, - "learning_rate": 3.303728066351141e-05, - "loss": 2.3557, - "step": 194540 - }, - { - "epoch": 0.34, - "learning_rate": 3.3036408723584586e-05, - "loss": 2.437, - "step": 194550 - }, - { - "epoch": 0.34, - "learning_rate": 3.303553678365776e-05, - "loss": 2.3903, - "step": 194560 - }, - { - "epoch": 0.34, - "learning_rate": 3.303466484373093e-05, - "loss": 2.5014, - "step": 194570 - }, - { - "epoch": 0.34, - "learning_rate": 3.30337929038041e-05, - "loss": 2.5314, - "step": 194580 - }, - { - "epoch": 0.34, - "learning_rate": 3.3032920963877275e-05, - "loss": 2.3841, - "step": 194590 - }, - { - "epoch": 0.34, - "learning_rate": 3.3032049023950445e-05, - "loss": 2.3789, - "step": 194600 - }, - { - "epoch": 0.34, - "learning_rate": 3.303117708402362e-05, - "loss": 2.3565, - "step": 194610 - }, - { - "epoch": 0.34, - "learning_rate": 3.303030514409679e-05, - "loss": 2.4982, - "step": 194620 - }, - { - "epoch": 0.34, - "learning_rate": 3.302943320416997e-05, - "loss": 2.199, - "step": 194630 - }, - { - "epoch": 0.34, - "learning_rate": 3.302856126424314e-05, - "loss": 2.4505, - "step": 194640 - }, - { - "epoch": 0.34, - "learning_rate": 3.302768932431631e-05, - "loss": 2.4036, - "step": 194650 - }, - { - "epoch": 0.34, - "learning_rate": 3.302681738438949e-05, - "loss": 2.3676, - "step": 194660 - }, - { - "epoch": 0.34, - "learning_rate": 3.302594544446266e-05, - "loss": 2.5948, - "step": 194670 - }, - { - "epoch": 0.34, - "learning_rate": 3.302507350453583e-05, - "loss": 2.404, - "step": 194680 - }, - { - "epoch": 0.34, - "learning_rate": 3.3024201564609006e-05, - "loss": 2.4483, - "step": 194690 - }, - { - "epoch": 0.34, - "learning_rate": 3.302332962468218e-05, - "loss": 2.3434, - "step": 194700 - }, - { - "epoch": 0.34, - "learning_rate": 3.302245768475535e-05, - "loss": 2.577, - "step": 194710 - }, - { - "epoch": 0.34, - "learning_rate": 3.3021585744828523e-05, - "loss": 2.5122, - "step": 194720 - }, - { - "epoch": 0.34, - "learning_rate": 3.30207138049017e-05, - "loss": 2.3342, - "step": 194730 - }, - { - "epoch": 0.34, - "learning_rate": 3.301984186497487e-05, - "loss": 2.4233, - "step": 194740 - }, - { - "epoch": 0.34, - "learning_rate": 3.301896992504804e-05, - "loss": 2.4828, - "step": 194750 - }, - { - "epoch": 0.34, - "learning_rate": 3.301809798512122e-05, - "loss": 2.4428, - "step": 194760 - }, - { - "epoch": 0.34, - "learning_rate": 3.3017226045194396e-05, - "loss": 2.518, - "step": 194770 - }, - { - "epoch": 0.34, - "learning_rate": 3.3016354105267566e-05, - "loss": 2.4626, - "step": 194780 - }, - { - "epoch": 0.34, - "learning_rate": 3.3015482165340736e-05, - "loss": 2.3645, - "step": 194790 - }, - { - "epoch": 0.34, - "learning_rate": 3.3014610225413914e-05, - "loss": 2.4595, - "step": 194800 - }, - { - "epoch": 0.34, - "learning_rate": 3.3013738285487084e-05, - "loss": 2.5236, - "step": 194810 - }, - { - "epoch": 0.34, - "learning_rate": 3.3012866345560254e-05, - "loss": 2.5007, - "step": 194820 - }, - { - "epoch": 0.34, - "learning_rate": 3.301199440563343e-05, - "loss": 2.2951, - "step": 194830 - }, - { - "epoch": 0.34, - "learning_rate": 3.301112246570661e-05, - "loss": 2.4262, - "step": 194840 - }, - { - "epoch": 0.34, - "learning_rate": 3.301025052577978e-05, - "loss": 2.4841, - "step": 194850 - }, - { - "epoch": 0.34, - "learning_rate": 3.300937858585295e-05, - "loss": 2.421, - "step": 194860 - }, - { - "epoch": 0.34, - "learning_rate": 3.300850664592613e-05, - "loss": 2.4949, - "step": 194870 - }, - { - "epoch": 0.34, - "learning_rate": 3.30076347059993e-05, - "loss": 2.4524, - "step": 194880 - }, - { - "epoch": 0.34, - "learning_rate": 3.300676276607247e-05, - "loss": 2.3849, - "step": 194890 - }, - { - "epoch": 0.34, - "learning_rate": 3.3005890826145645e-05, - "loss": 2.2879, - "step": 194900 - }, - { - "epoch": 0.34, - "learning_rate": 3.300501888621882e-05, - "loss": 2.4527, - "step": 194910 - }, - { - "epoch": 0.34, - "learning_rate": 3.300414694629199e-05, - "loss": 2.3848, - "step": 194920 - }, - { - "epoch": 0.34, - "learning_rate": 3.300327500636516e-05, - "loss": 2.4362, - "step": 194930 - }, - { - "epoch": 0.34, - "learning_rate": 3.300240306643834e-05, - "loss": 2.4454, - "step": 194940 - }, - { - "epoch": 0.34, - "learning_rate": 3.300153112651151e-05, - "loss": 2.4034, - "step": 194950 - }, - { - "epoch": 0.34, - "learning_rate": 3.300065918658468e-05, - "loss": 2.5513, - "step": 194960 - }, - { - "epoch": 0.34, - "learning_rate": 3.299978724665785e-05, - "loss": 2.4858, - "step": 194970 - }, - { - "epoch": 0.34, - "learning_rate": 3.299891530673103e-05, - "loss": 2.452, - "step": 194980 - }, - { - "epoch": 0.34, - "learning_rate": 3.2998043366804205e-05, - "loss": 2.5097, - "step": 194990 - }, - { - "epoch": 0.34, - "learning_rate": 3.2997171426877375e-05, - "loss": 2.3902, - "step": 195000 - }, - { - "epoch": 0.34, - "learning_rate": 3.299629948695055e-05, - "loss": 2.4648, - "step": 195010 - }, - { - "epoch": 0.34, - "learning_rate": 3.299542754702372e-05, - "loss": 2.365, - "step": 195020 - }, - { - "epoch": 0.34, - "learning_rate": 3.299455560709689e-05, - "loss": 2.4414, - "step": 195030 - }, - { - "epoch": 0.34, - "learning_rate": 3.2993683667170064e-05, - "loss": 2.4892, - "step": 195040 - }, - { - "epoch": 0.34, - "learning_rate": 3.299281172724324e-05, - "loss": 2.4146, - "step": 195050 - }, - { - "epoch": 0.34, - "learning_rate": 3.299193978731642e-05, - "loss": 2.4699, - "step": 195060 - }, - { - "epoch": 0.34, - "learning_rate": 3.299106784738959e-05, - "loss": 2.4364, - "step": 195070 - }, - { - "epoch": 0.34, - "learning_rate": 3.299019590746276e-05, - "loss": 2.4444, - "step": 195080 - }, - { - "epoch": 0.34, - "learning_rate": 3.2989323967535936e-05, - "loss": 2.3237, - "step": 195090 - }, - { - "epoch": 0.34, - "learning_rate": 3.2988452027609106e-05, - "loss": 2.4424, - "step": 195100 - }, - { - "epoch": 0.34, - "learning_rate": 3.298758008768228e-05, - "loss": 2.3058, - "step": 195110 - }, - { - "epoch": 0.34, - "learning_rate": 3.2986708147755454e-05, - "loss": 2.3586, - "step": 195120 - }, - { - "epoch": 0.34, - "learning_rate": 3.2985836207828624e-05, - "loss": 2.3803, - "step": 195130 - }, - { - "epoch": 0.34, - "learning_rate": 3.29849642679018e-05, - "loss": 2.5268, - "step": 195140 - }, - { - "epoch": 0.34, - "learning_rate": 3.298409232797497e-05, - "loss": 2.4222, - "step": 195150 - }, - { - "epoch": 0.34, - "learning_rate": 3.298322038804815e-05, - "loss": 2.4853, - "step": 195160 - }, - { - "epoch": 0.34, - "learning_rate": 3.298234844812132e-05, - "loss": 2.5044, - "step": 195170 - }, - { - "epoch": 0.34, - "learning_rate": 3.298147650819449e-05, - "loss": 2.551, - "step": 195180 - }, - { - "epoch": 0.34, - "learning_rate": 3.298060456826767e-05, - "loss": 2.4921, - "step": 195190 - }, - { - "epoch": 0.34, - "learning_rate": 3.297973262834084e-05, - "loss": 2.5335, - "step": 195200 - }, - { - "epoch": 0.34, - "learning_rate": 3.2978860688414014e-05, - "loss": 2.3852, - "step": 195210 - }, - { - "epoch": 0.34, - "learning_rate": 3.2977988748487185e-05, - "loss": 2.5035, - "step": 195220 - }, - { - "epoch": 0.34, - "learning_rate": 3.297711680856036e-05, - "loss": 2.5327, - "step": 195230 - }, - { - "epoch": 0.34, - "learning_rate": 3.297624486863353e-05, - "loss": 2.5531, - "step": 195240 - }, - { - "epoch": 0.34, - "learning_rate": 3.29753729287067e-05, - "loss": 2.5099, - "step": 195250 - }, - { - "epoch": 0.34, - "learning_rate": 3.297450098877988e-05, - "loss": 2.3819, - "step": 195260 - }, - { - "epoch": 0.34, - "learning_rate": 3.297362904885305e-05, - "loss": 2.431, - "step": 195270 - }, - { - "epoch": 0.34, - "learning_rate": 3.297275710892623e-05, - "loss": 2.3013, - "step": 195280 - }, - { - "epoch": 0.34, - "learning_rate": 3.29718851689994e-05, - "loss": 2.4968, - "step": 195290 - }, - { - "epoch": 0.34, - "learning_rate": 3.2971013229072575e-05, - "loss": 2.4667, - "step": 195300 - }, - { - "epoch": 0.34, - "learning_rate": 3.2970141289145745e-05, - "loss": 2.3711, - "step": 195310 - }, - { - "epoch": 0.34, - "learning_rate": 3.2969269349218916e-05, - "loss": 2.431, - "step": 195320 - }, - { - "epoch": 0.34, - "learning_rate": 3.296839740929209e-05, - "loss": 2.3606, - "step": 195330 - }, - { - "epoch": 0.34, - "learning_rate": 3.296752546936526e-05, - "loss": 2.336, - "step": 195340 - }, - { - "epoch": 0.34, - "learning_rate": 3.2966653529438434e-05, - "loss": 2.4474, - "step": 195350 - }, - { - "epoch": 0.34, - "learning_rate": 3.296578158951161e-05, - "loss": 2.4252, - "step": 195360 - }, - { - "epoch": 0.34, - "learning_rate": 3.296490964958479e-05, - "loss": 2.5484, - "step": 195370 - }, - { - "epoch": 0.34, - "learning_rate": 3.296403770965796e-05, - "loss": 2.3289, - "step": 195380 - }, - { - "epoch": 0.34, - "learning_rate": 3.296316576973113e-05, - "loss": 2.392, - "step": 195390 - }, - { - "epoch": 0.34, - "learning_rate": 3.2962293829804306e-05, - "loss": 2.5111, - "step": 195400 - }, - { - "epoch": 0.34, - "learning_rate": 3.2961421889877476e-05, - "loss": 2.3768, - "step": 195410 - }, - { - "epoch": 0.34, - "learning_rate": 3.296054994995065e-05, - "loss": 2.4207, - "step": 195420 - }, - { - "epoch": 0.34, - "learning_rate": 3.2959678010023824e-05, - "loss": 2.4897, - "step": 195430 - }, - { - "epoch": 0.34, - "learning_rate": 3.2958806070097e-05, - "loss": 2.2932, - "step": 195440 - }, - { - "epoch": 0.34, - "learning_rate": 3.295793413017017e-05, - "loss": 2.4267, - "step": 195450 - }, - { - "epoch": 0.34, - "learning_rate": 3.295706219024334e-05, - "loss": 2.3956, - "step": 195460 - }, - { - "epoch": 0.34, - "learning_rate": 3.295619025031651e-05, - "loss": 2.4517, - "step": 195470 - }, - { - "epoch": 0.34, - "learning_rate": 3.295531831038969e-05, - "loss": 2.3154, - "step": 195480 - }, - { - "epoch": 0.34, - "learning_rate": 3.295444637046286e-05, - "loss": 2.4418, - "step": 195490 - }, - { - "epoch": 0.34, - "learning_rate": 3.295357443053603e-05, - "loss": 2.3954, - "step": 195500 - }, - { - "epoch": 0.34, - "learning_rate": 3.2952702490609214e-05, - "loss": 2.383, - "step": 195510 - }, - { - "epoch": 0.34, - "learning_rate": 3.2951830550682384e-05, - "loss": 2.3856, - "step": 195520 - }, - { - "epoch": 0.34, - "learning_rate": 3.2950958610755555e-05, - "loss": 2.4079, - "step": 195530 - }, - { - "epoch": 0.34, - "learning_rate": 3.2950086670828725e-05, - "loss": 2.3877, - "step": 195540 - }, - { - "epoch": 0.34, - "learning_rate": 3.29492147309019e-05, - "loss": 2.3346, - "step": 195550 - }, - { - "epoch": 0.34, - "learning_rate": 3.294834279097507e-05, - "loss": 2.3229, - "step": 195560 - }, - { - "epoch": 0.34, - "learning_rate": 3.294747085104824e-05, - "loss": 2.4965, - "step": 195570 - }, - { - "epoch": 0.34, - "learning_rate": 3.294659891112142e-05, - "loss": 2.3875, - "step": 195580 - }, - { - "epoch": 0.34, - "learning_rate": 3.29457269711946e-05, - "loss": 2.5118, - "step": 195590 - }, - { - "epoch": 0.34, - "learning_rate": 3.294485503126777e-05, - "loss": 2.4796, - "step": 195600 - }, - { - "epoch": 0.34, - "learning_rate": 3.294398309134094e-05, - "loss": 2.3503, - "step": 195610 - }, - { - "epoch": 0.34, - "learning_rate": 3.2943111151414115e-05, - "loss": 2.4926, - "step": 195620 - }, - { - "epoch": 0.34, - "learning_rate": 3.2942239211487286e-05, - "loss": 2.4564, - "step": 195630 - }, - { - "epoch": 0.34, - "learning_rate": 3.2941367271560456e-05, - "loss": 2.3809, - "step": 195640 - }, - { - "epoch": 0.34, - "learning_rate": 3.294049533163363e-05, - "loss": 2.3878, - "step": 195650 - }, - { - "epoch": 0.34, - "learning_rate": 3.293962339170681e-05, - "loss": 2.3591, - "step": 195660 - }, - { - "epoch": 0.34, - "learning_rate": 3.293875145177998e-05, - "loss": 2.5826, - "step": 195670 - }, - { - "epoch": 0.34, - "learning_rate": 3.293787951185315e-05, - "loss": 2.4256, - "step": 195680 - }, - { - "epoch": 0.34, - "learning_rate": 3.293700757192633e-05, - "loss": 2.4177, - "step": 195690 - }, - { - "epoch": 0.34, - "learning_rate": 3.29361356319995e-05, - "loss": 2.2731, - "step": 195700 - }, - { - "epoch": 0.34, - "learning_rate": 3.293526369207267e-05, - "loss": 2.4207, - "step": 195710 - }, - { - "epoch": 0.34, - "learning_rate": 3.2934391752145846e-05, - "loss": 2.479, - "step": 195720 - }, - { - "epoch": 0.34, - "learning_rate": 3.2933519812219023e-05, - "loss": 2.3537, - "step": 195730 - }, - { - "epoch": 0.34, - "learning_rate": 3.2932647872292194e-05, - "loss": 2.433, - "step": 195740 - }, - { - "epoch": 0.34, - "learning_rate": 3.2931775932365364e-05, - "loss": 2.4844, - "step": 195750 - }, - { - "epoch": 0.34, - "learning_rate": 3.293090399243854e-05, - "loss": 2.4362, - "step": 195760 - }, - { - "epoch": 0.34, - "learning_rate": 3.293003205251171e-05, - "loss": 2.5045, - "step": 195770 - }, - { - "epoch": 0.34, - "learning_rate": 3.292916011258488e-05, - "loss": 2.5006, - "step": 195780 - }, - { - "epoch": 0.34, - "learning_rate": 3.292828817265806e-05, - "loss": 2.3688, - "step": 195790 - }, - { - "epoch": 0.34, - "learning_rate": 3.292741623273123e-05, - "loss": 2.3847, - "step": 195800 - }, - { - "epoch": 0.34, - "learning_rate": 3.292654429280441e-05, - "loss": 2.349, - "step": 195810 - }, - { - "epoch": 0.34, - "learning_rate": 3.292567235287758e-05, - "loss": 2.4771, - "step": 195820 - }, - { - "epoch": 0.34, - "learning_rate": 3.2924800412950754e-05, - "loss": 2.395, - "step": 195830 - }, - { - "epoch": 0.34, - "learning_rate": 3.2923928473023925e-05, - "loss": 2.4429, - "step": 195840 - }, - { - "epoch": 0.34, - "learning_rate": 3.2923056533097095e-05, - "loss": 2.3885, - "step": 195850 - }, - { - "epoch": 0.34, - "learning_rate": 3.2922184593170265e-05, - "loss": 2.3345, - "step": 195860 - }, - { - "epoch": 0.34, - "learning_rate": 3.292131265324344e-05, - "loss": 2.4395, - "step": 195870 - }, - { - "epoch": 0.34, - "learning_rate": 3.292044071331662e-05, - "loss": 2.4213, - "step": 195880 - }, - { - "epoch": 0.34, - "learning_rate": 3.291956877338979e-05, - "loss": 2.4485, - "step": 195890 - }, - { - "epoch": 0.34, - "learning_rate": 3.291869683346297e-05, - "loss": 2.5571, - "step": 195900 - }, - { - "epoch": 0.34, - "learning_rate": 3.291782489353614e-05, - "loss": 2.4477, - "step": 195910 - }, - { - "epoch": 0.34, - "learning_rate": 3.291695295360931e-05, - "loss": 2.4242, - "step": 195920 - }, - { - "epoch": 0.34, - "learning_rate": 3.291608101368248e-05, - "loss": 2.4496, - "step": 195930 - }, - { - "epoch": 0.34, - "learning_rate": 3.2915209073755656e-05, - "loss": 2.4595, - "step": 195940 - }, - { - "epoch": 0.34, - "learning_rate": 3.291433713382883e-05, - "loss": 2.4314, - "step": 195950 - }, - { - "epoch": 0.34, - "learning_rate": 3.2913465193902e-05, - "loss": 2.4445, - "step": 195960 - }, - { - "epoch": 0.34, - "learning_rate": 3.2912593253975174e-05, - "loss": 2.5034, - "step": 195970 - }, - { - "epoch": 0.34, - "learning_rate": 3.291172131404835e-05, - "loss": 2.4866, - "step": 195980 - }, - { - "epoch": 0.34, - "learning_rate": 3.291084937412152e-05, - "loss": 2.3646, - "step": 195990 - }, - { - "epoch": 0.34, - "learning_rate": 3.290997743419469e-05, - "loss": 2.3915, - "step": 196000 - }, - { - "epoch": 0.34, - "learning_rate": 3.290910549426787e-05, - "loss": 2.4029, - "step": 196010 - }, - { - "epoch": 0.34, - "learning_rate": 3.290823355434104e-05, - "loss": 2.3731, - "step": 196020 - }, - { - "epoch": 0.34, - "learning_rate": 3.2907361614414216e-05, - "loss": 2.2222, - "step": 196030 - }, - { - "epoch": 0.34, - "learning_rate": 3.2906489674487387e-05, - "loss": 2.3923, - "step": 196040 - }, - { - "epoch": 0.34, - "learning_rate": 3.2905617734560564e-05, - "loss": 2.336, - "step": 196050 - }, - { - "epoch": 0.34, - "learning_rate": 3.2904745794633734e-05, - "loss": 2.3057, - "step": 196060 - }, - { - "epoch": 0.34, - "learning_rate": 3.2903873854706904e-05, - "loss": 2.525, - "step": 196070 - }, - { - "epoch": 0.34, - "learning_rate": 3.290300191478008e-05, - "loss": 2.4401, - "step": 196080 - }, - { - "epoch": 0.34, - "learning_rate": 3.290212997485325e-05, - "loss": 2.4996, - "step": 196090 - }, - { - "epoch": 0.34, - "learning_rate": 3.290125803492643e-05, - "loss": 2.4439, - "step": 196100 - }, - { - "epoch": 0.34, - "learning_rate": 3.29003860949996e-05, - "loss": 2.4193, - "step": 196110 - }, - { - "epoch": 0.34, - "learning_rate": 3.289951415507278e-05, - "loss": 2.3983, - "step": 196120 - }, - { - "epoch": 0.34, - "learning_rate": 3.289864221514595e-05, - "loss": 2.4759, - "step": 196130 - }, - { - "epoch": 0.34, - "learning_rate": 3.289777027521912e-05, - "loss": 2.5924, - "step": 196140 - }, - { - "epoch": 0.34, - "learning_rate": 3.2896898335292295e-05, - "loss": 2.419, - "step": 196150 - }, - { - "epoch": 0.34, - "learning_rate": 3.2896026395365465e-05, - "loss": 2.4186, - "step": 196160 - }, - { - "epoch": 0.34, - "learning_rate": 3.2895154455438635e-05, - "loss": 2.3971, - "step": 196170 - }, - { - "epoch": 0.34, - "learning_rate": 3.289428251551181e-05, - "loss": 2.5124, - "step": 196180 - }, - { - "epoch": 0.34, - "learning_rate": 3.289341057558499e-05, - "loss": 2.4813, - "step": 196190 - }, - { - "epoch": 0.34, - "learning_rate": 3.289253863565816e-05, - "loss": 2.3771, - "step": 196200 - }, - { - "epoch": 0.34, - "learning_rate": 3.289166669573133e-05, - "loss": 2.4428, - "step": 196210 - }, - { - "epoch": 0.34, - "learning_rate": 3.289079475580451e-05, - "loss": 2.5916, - "step": 196220 - }, - { - "epoch": 0.34, - "learning_rate": 3.288992281587768e-05, - "loss": 2.4995, - "step": 196230 - }, - { - "epoch": 0.34, - "learning_rate": 3.288905087595085e-05, - "loss": 2.4555, - "step": 196240 - }, - { - "epoch": 0.34, - "learning_rate": 3.2888178936024026e-05, - "loss": 2.4908, - "step": 196250 - }, - { - "epoch": 0.34, - "learning_rate": 3.28873069960972e-05, - "loss": 2.4987, - "step": 196260 - }, - { - "epoch": 0.34, - "learning_rate": 3.288643505617037e-05, - "loss": 2.3531, - "step": 196270 - }, - { - "epoch": 0.34, - "learning_rate": 3.2885563116243543e-05, - "loss": 2.4454, - "step": 196280 - }, - { - "epoch": 0.34, - "learning_rate": 3.288469117631672e-05, - "loss": 2.5531, - "step": 196290 - }, - { - "epoch": 0.34, - "learning_rate": 3.288381923638989e-05, - "loss": 2.4689, - "step": 196300 - }, - { - "epoch": 0.34, - "learning_rate": 3.288294729646306e-05, - "loss": 2.5183, - "step": 196310 - }, - { - "epoch": 0.34, - "learning_rate": 3.288207535653623e-05, - "loss": 2.3593, - "step": 196320 - }, - { - "epoch": 0.34, - "learning_rate": 3.2881203416609416e-05, - "loss": 2.4692, - "step": 196330 - }, - { - "epoch": 0.34, - "learning_rate": 3.2880331476682586e-05, - "loss": 2.4414, - "step": 196340 - }, - { - "epoch": 0.34, - "learning_rate": 3.2879459536755756e-05, - "loss": 2.4312, - "step": 196350 - }, - { - "epoch": 0.34, - "learning_rate": 3.2878587596828934e-05, - "loss": 2.3258, - "step": 196360 - }, - { - "epoch": 0.34, - "learning_rate": 3.2877715656902104e-05, - "loss": 2.547, - "step": 196370 - }, - { - "epoch": 0.34, - "learning_rate": 3.2876843716975274e-05, - "loss": 2.463, - "step": 196380 - }, - { - "epoch": 0.34, - "learning_rate": 3.2875971777048445e-05, - "loss": 2.3565, - "step": 196390 - }, - { - "epoch": 0.34, - "learning_rate": 3.287509983712163e-05, - "loss": 2.3105, - "step": 196400 - }, - { - "epoch": 0.34, - "learning_rate": 3.28742278971948e-05, - "loss": 2.4097, - "step": 196410 - }, - { - "epoch": 0.34, - "learning_rate": 3.287335595726797e-05, - "loss": 2.4992, - "step": 196420 - }, - { - "epoch": 0.34, - "learning_rate": 3.287248401734114e-05, - "loss": 2.4154, - "step": 196430 - }, - { - "epoch": 0.34, - "learning_rate": 3.287161207741432e-05, - "loss": 2.4619, - "step": 196440 - }, - { - "epoch": 0.34, - "learning_rate": 3.287074013748749e-05, - "loss": 2.4778, - "step": 196450 - }, - { - "epoch": 0.34, - "learning_rate": 3.286986819756066e-05, - "loss": 2.4179, - "step": 196460 - }, - { - "epoch": 0.34, - "learning_rate": 3.286899625763384e-05, - "loss": 2.4269, - "step": 196470 - }, - { - "epoch": 0.34, - "learning_rate": 3.286812431770701e-05, - "loss": 2.5742, - "step": 196480 - }, - { - "epoch": 0.34, - "learning_rate": 3.286725237778018e-05, - "loss": 2.3355, - "step": 196490 - }, - { - "epoch": 0.34, - "learning_rate": 3.286638043785335e-05, - "loss": 2.5561, - "step": 196500 - }, - { - "epoch": 0.34, - "learning_rate": 3.286550849792653e-05, - "loss": 2.4422, - "step": 196510 - }, - { - "epoch": 0.34, - "learning_rate": 3.28646365579997e-05, - "loss": 2.3579, - "step": 196520 - }, - { - "epoch": 0.34, - "learning_rate": 3.286376461807287e-05, - "loss": 2.3806, - "step": 196530 - }, - { - "epoch": 0.34, - "learning_rate": 3.286289267814605e-05, - "loss": 2.4357, - "step": 196540 - }, - { - "epoch": 0.34, - "learning_rate": 3.2862020738219225e-05, - "loss": 2.4337, - "step": 196550 - }, - { - "epoch": 0.34, - "learning_rate": 3.2861148798292395e-05, - "loss": 2.5019, - "step": 196560 - }, - { - "epoch": 0.34, - "learning_rate": 3.2860276858365566e-05, - "loss": 2.3138, - "step": 196570 - }, - { - "epoch": 0.34, - "learning_rate": 3.285940491843874e-05, - "loss": 2.4566, - "step": 196580 - }, - { - "epoch": 0.34, - "learning_rate": 3.2858532978511913e-05, - "loss": 2.4665, - "step": 196590 - }, - { - "epoch": 0.34, - "learning_rate": 3.2857661038585084e-05, - "loss": 2.3649, - "step": 196600 - }, - { - "epoch": 0.34, - "learning_rate": 3.285678909865826e-05, - "loss": 2.3847, - "step": 196610 - }, - { - "epoch": 0.34, - "learning_rate": 3.285591715873144e-05, - "loss": 2.4399, - "step": 196620 - }, - { - "epoch": 0.34, - "learning_rate": 3.285504521880461e-05, - "loss": 2.3267, - "step": 196630 - }, - { - "epoch": 0.34, - "learning_rate": 3.285417327887778e-05, - "loss": 2.414, - "step": 196640 - }, - { - "epoch": 0.34, - "learning_rate": 3.2853301338950956e-05, - "loss": 2.4315, - "step": 196650 - }, - { - "epoch": 0.34, - "learning_rate": 3.2852429399024126e-05, - "loss": 2.3586, - "step": 196660 - }, - { - "epoch": 0.34, - "learning_rate": 3.28515574590973e-05, - "loss": 2.4564, - "step": 196670 - }, - { - "epoch": 0.34, - "learning_rate": 3.2850685519170474e-05, - "loss": 2.4476, - "step": 196680 - }, - { - "epoch": 0.34, - "learning_rate": 3.2849813579243644e-05, - "loss": 2.3552, - "step": 196690 - }, - { - "epoch": 0.34, - "learning_rate": 3.284894163931682e-05, - "loss": 2.4156, - "step": 196700 - }, - { - "epoch": 0.34, - "learning_rate": 3.284806969938999e-05, - "loss": 2.398, - "step": 196710 - }, - { - "epoch": 0.34, - "learning_rate": 3.284719775946317e-05, - "loss": 2.365, - "step": 196720 - }, - { - "epoch": 0.34, - "learning_rate": 3.284632581953634e-05, - "loss": 2.4704, - "step": 196730 - }, - { - "epoch": 0.34, - "learning_rate": 3.284545387960951e-05, - "loss": 2.5401, - "step": 196740 - }, - { - "epoch": 0.34, - "learning_rate": 3.284458193968269e-05, - "loss": 2.3435, - "step": 196750 - }, - { - "epoch": 0.34, - "learning_rate": 3.284370999975586e-05, - "loss": 2.4099, - "step": 196760 - }, - { - "epoch": 0.34, - "learning_rate": 3.2842838059829034e-05, - "loss": 2.3921, - "step": 196770 - }, - { - "epoch": 0.34, - "learning_rate": 3.2841966119902205e-05, - "loss": 2.385, - "step": 196780 - }, - { - "epoch": 0.34, - "learning_rate": 3.284109417997538e-05, - "loss": 2.5766, - "step": 196790 - }, - { - "epoch": 0.34, - "learning_rate": 3.284022224004855e-05, - "loss": 2.3179, - "step": 196800 - }, - { - "epoch": 0.34, - "learning_rate": 3.283935030012172e-05, - "loss": 2.501, - "step": 196810 - }, - { - "epoch": 0.34, - "learning_rate": 3.283847836019489e-05, - "loss": 2.434, - "step": 196820 - }, - { - "epoch": 0.34, - "learning_rate": 3.283760642026807e-05, - "loss": 2.3942, - "step": 196830 - }, - { - "epoch": 0.34, - "learning_rate": 3.283673448034124e-05, - "loss": 2.4678, - "step": 196840 - }, - { - "epoch": 0.34, - "learning_rate": 3.283586254041442e-05, - "loss": 2.3404, - "step": 196850 - }, - { - "epoch": 0.34, - "learning_rate": 3.2834990600487595e-05, - "loss": 2.4059, - "step": 196860 - }, - { - "epoch": 0.34, - "learning_rate": 3.2834118660560765e-05, - "loss": 2.3999, - "step": 196870 - }, - { - "epoch": 0.34, - "learning_rate": 3.2833246720633936e-05, - "loss": 2.4223, - "step": 196880 - }, - { - "epoch": 0.34, - "learning_rate": 3.2832374780707106e-05, - "loss": 2.4292, - "step": 196890 - }, - { - "epoch": 0.34, - "learning_rate": 3.283150284078028e-05, - "loss": 2.5726, - "step": 196900 - }, - { - "epoch": 0.34, - "learning_rate": 3.2830630900853454e-05, - "loss": 2.4264, - "step": 196910 - }, - { - "epoch": 0.34, - "learning_rate": 3.282975896092663e-05, - "loss": 2.5193, - "step": 196920 - }, - { - "epoch": 0.34, - "learning_rate": 3.28288870209998e-05, - "loss": 2.4353, - "step": 196930 - }, - { - "epoch": 0.34, - "learning_rate": 3.282801508107298e-05, - "loss": 2.329, - "step": 196940 - }, - { - "epoch": 0.34, - "learning_rate": 3.282714314114615e-05, - "loss": 2.3524, - "step": 196950 - }, - { - "epoch": 0.34, - "learning_rate": 3.282627120121932e-05, - "loss": 2.3616, - "step": 196960 - }, - { - "epoch": 0.34, - "learning_rate": 3.2825399261292496e-05, - "loss": 2.4817, - "step": 196970 - }, - { - "epoch": 0.34, - "learning_rate": 3.282452732136567e-05, - "loss": 2.4201, - "step": 196980 - }, - { - "epoch": 0.34, - "learning_rate": 3.282365538143884e-05, - "loss": 2.4115, - "step": 196990 - }, - { - "epoch": 0.34, - "learning_rate": 3.2822783441512014e-05, - "loss": 2.4124, - "step": 197000 - }, - { - "epoch": 0.34, - "learning_rate": 3.282191150158519e-05, - "loss": 2.3631, - "step": 197010 - }, - { - "epoch": 0.34, - "learning_rate": 3.282103956165836e-05, - "loss": 2.414, - "step": 197020 - }, - { - "epoch": 0.34, - "learning_rate": 3.282016762173153e-05, - "loss": 2.4704, - "step": 197030 - }, - { - "epoch": 0.34, - "learning_rate": 3.281929568180471e-05, - "loss": 2.5027, - "step": 197040 - }, - { - "epoch": 0.34, - "learning_rate": 3.281842374187788e-05, - "loss": 2.3949, - "step": 197050 - }, - { - "epoch": 0.34, - "learning_rate": 3.281755180195105e-05, - "loss": 2.3845, - "step": 197060 - }, - { - "epoch": 0.34, - "learning_rate": 3.281667986202423e-05, - "loss": 2.3689, - "step": 197070 - }, - { - "epoch": 0.34, - "learning_rate": 3.2815807922097404e-05, - "loss": 2.3801, - "step": 197080 - }, - { - "epoch": 0.34, - "learning_rate": 3.2814935982170575e-05, - "loss": 2.4366, - "step": 197090 - }, - { - "epoch": 0.34, - "learning_rate": 3.2814064042243745e-05, - "loss": 2.2625, - "step": 197100 - }, - { - "epoch": 0.34, - "learning_rate": 3.281319210231692e-05, - "loss": 2.4049, - "step": 197110 - }, - { - "epoch": 0.34, - "learning_rate": 3.281232016239009e-05, - "loss": 2.4485, - "step": 197120 - }, - { - "epoch": 0.34, - "learning_rate": 3.281144822246326e-05, - "loss": 2.455, - "step": 197130 - }, - { - "epoch": 0.34, - "learning_rate": 3.281057628253644e-05, - "loss": 2.3916, - "step": 197140 - }, - { - "epoch": 0.34, - "learning_rate": 3.280970434260962e-05, - "loss": 2.4447, - "step": 197150 - }, - { - "epoch": 0.34, - "learning_rate": 3.280883240268279e-05, - "loss": 2.3374, - "step": 197160 - }, - { - "epoch": 0.34, - "learning_rate": 3.280796046275596e-05, - "loss": 2.4143, - "step": 197170 - }, - { - "epoch": 0.34, - "learning_rate": 3.2807088522829135e-05, - "loss": 2.3823, - "step": 197180 - }, - { - "epoch": 0.34, - "learning_rate": 3.2806216582902306e-05, - "loss": 2.5207, - "step": 197190 - }, - { - "epoch": 0.34, - "learning_rate": 3.2805344642975476e-05, - "loss": 2.3257, - "step": 197200 - }, - { - "epoch": 0.34, - "learning_rate": 3.2804472703048646e-05, - "loss": 2.4762, - "step": 197210 - }, - { - "epoch": 0.34, - "learning_rate": 3.280360076312183e-05, - "loss": 2.3175, - "step": 197220 - }, - { - "epoch": 0.34, - "learning_rate": 3.2802728823195e-05, - "loss": 2.3376, - "step": 197230 - }, - { - "epoch": 0.34, - "learning_rate": 3.280185688326817e-05, - "loss": 2.5033, - "step": 197240 - }, - { - "epoch": 0.34, - "learning_rate": 3.280098494334135e-05, - "loss": 2.3689, - "step": 197250 - }, - { - "epoch": 0.34, - "learning_rate": 3.280011300341452e-05, - "loss": 2.3967, - "step": 197260 - }, - { - "epoch": 0.34, - "learning_rate": 3.279924106348769e-05, - "loss": 2.4953, - "step": 197270 - }, - { - "epoch": 0.34, - "learning_rate": 3.279836912356086e-05, - "loss": 2.478, - "step": 197280 - }, - { - "epoch": 0.34, - "learning_rate": 3.2797497183634043e-05, - "loss": 2.3888, - "step": 197290 - }, - { - "epoch": 0.34, - "learning_rate": 3.2796625243707214e-05, - "loss": 2.4684, - "step": 197300 - }, - { - "epoch": 0.34, - "learning_rate": 3.2795753303780384e-05, - "loss": 2.2935, - "step": 197310 - }, - { - "epoch": 0.34, - "learning_rate": 3.2794881363853555e-05, - "loss": 2.43, - "step": 197320 - }, - { - "epoch": 0.34, - "learning_rate": 3.279400942392673e-05, - "loss": 2.3893, - "step": 197330 - }, - { - "epoch": 0.34, - "learning_rate": 3.27931374839999e-05, - "loss": 2.3266, - "step": 197340 - }, - { - "epoch": 0.34, - "learning_rate": 3.279226554407307e-05, - "loss": 2.287, - "step": 197350 - }, - { - "epoch": 0.34, - "learning_rate": 3.279139360414625e-05, - "loss": 2.4158, - "step": 197360 - }, - { - "epoch": 0.34, - "learning_rate": 3.279052166421943e-05, - "loss": 2.4059, - "step": 197370 - }, - { - "epoch": 0.34, - "learning_rate": 3.27896497242926e-05, - "loss": 2.3842, - "step": 197380 - }, - { - "epoch": 0.34, - "learning_rate": 3.278877778436577e-05, - "loss": 2.3955, - "step": 197390 - }, - { - "epoch": 0.34, - "learning_rate": 3.2787905844438945e-05, - "loss": 2.3588, - "step": 197400 - }, - { - "epoch": 0.34, - "learning_rate": 3.2787033904512115e-05, - "loss": 2.2616, - "step": 197410 - }, - { - "epoch": 0.34, - "learning_rate": 3.2786161964585285e-05, - "loss": 2.4946, - "step": 197420 - }, - { - "epoch": 0.34, - "learning_rate": 3.278529002465846e-05, - "loss": 2.3678, - "step": 197430 - }, - { - "epoch": 0.34, - "learning_rate": 3.278441808473164e-05, - "loss": 2.4445, - "step": 197440 - }, - { - "epoch": 0.34, - "learning_rate": 3.278354614480481e-05, - "loss": 2.4463, - "step": 197450 - }, - { - "epoch": 0.34, - "learning_rate": 3.278267420487798e-05, - "loss": 2.5301, - "step": 197460 - }, - { - "epoch": 0.34, - "learning_rate": 3.278180226495116e-05, - "loss": 2.42, - "step": 197470 - }, - { - "epoch": 0.34, - "learning_rate": 3.278093032502433e-05, - "loss": 2.4671, - "step": 197480 - }, - { - "epoch": 0.34, - "learning_rate": 3.27800583850975e-05, - "loss": 2.4242, - "step": 197490 - }, - { - "epoch": 0.34, - "learning_rate": 3.2779186445170676e-05, - "loss": 2.338, - "step": 197500 - }, - { - "epoch": 0.34, - "learning_rate": 3.2778314505243846e-05, - "loss": 2.3659, - "step": 197510 - }, - { - "epoch": 0.34, - "learning_rate": 3.277744256531702e-05, - "loss": 2.4196, - "step": 197520 - }, - { - "epoch": 0.34, - "learning_rate": 3.2776570625390194e-05, - "loss": 2.5184, - "step": 197530 - }, - { - "epoch": 0.34, - "learning_rate": 3.277569868546337e-05, - "loss": 2.3613, - "step": 197540 - }, - { - "epoch": 0.34, - "learning_rate": 3.277482674553654e-05, - "loss": 2.4309, - "step": 197550 - }, - { - "epoch": 0.34, - "learning_rate": 3.277395480560971e-05, - "loss": 2.4146, - "step": 197560 - }, - { - "epoch": 0.34, - "learning_rate": 3.277308286568289e-05, - "loss": 2.4372, - "step": 197570 - }, - { - "epoch": 0.34, - "learning_rate": 3.277221092575606e-05, - "loss": 2.2628, - "step": 197580 - }, - { - "epoch": 0.34, - "learning_rate": 3.2771338985829236e-05, - "loss": 2.5031, - "step": 197590 - }, - { - "epoch": 0.34, - "learning_rate": 3.2770467045902407e-05, - "loss": 2.3892, - "step": 197600 - }, - { - "epoch": 0.34, - "learning_rate": 3.2769595105975584e-05, - "loss": 2.4125, - "step": 197610 - }, - { - "epoch": 0.34, - "learning_rate": 3.2768723166048754e-05, - "loss": 2.4465, - "step": 197620 - }, - { - "epoch": 0.34, - "learning_rate": 3.2767851226121924e-05, - "loss": 2.4173, - "step": 197630 - }, - { - "epoch": 0.34, - "learning_rate": 3.27669792861951e-05, - "loss": 2.5536, - "step": 197640 - }, - { - "epoch": 0.34, - "learning_rate": 3.276610734626827e-05, - "loss": 2.3995, - "step": 197650 - }, - { - "epoch": 0.34, - "learning_rate": 3.276523540634144e-05, - "loss": 2.3616, - "step": 197660 - }, - { - "epoch": 0.34, - "learning_rate": 3.276436346641462e-05, - "loss": 2.3817, - "step": 197670 - }, - { - "epoch": 0.34, - "learning_rate": 3.27634915264878e-05, - "loss": 2.3813, - "step": 197680 - }, - { - "epoch": 0.34, - "learning_rate": 3.276261958656097e-05, - "loss": 2.4029, - "step": 197690 - }, - { - "epoch": 0.34, - "learning_rate": 3.276174764663414e-05, - "loss": 2.3832, - "step": 197700 - }, - { - "epoch": 0.34, - "learning_rate": 3.2760875706707315e-05, - "loss": 2.4866, - "step": 197710 - }, - { - "epoch": 0.34, - "learning_rate": 3.2760003766780485e-05, - "loss": 2.3855, - "step": 197720 - }, - { - "epoch": 0.34, - "learning_rate": 3.2759131826853655e-05, - "loss": 2.5165, - "step": 197730 - }, - { - "epoch": 0.34, - "learning_rate": 3.275825988692683e-05, - "loss": 2.489, - "step": 197740 - }, - { - "epoch": 0.34, - "learning_rate": 3.275738794700001e-05, - "loss": 2.4633, - "step": 197750 - }, - { - "epoch": 0.34, - "learning_rate": 3.275651600707318e-05, - "loss": 2.4175, - "step": 197760 - }, - { - "epoch": 0.34, - "learning_rate": 3.275564406714635e-05, - "loss": 2.3845, - "step": 197770 - }, - { - "epoch": 0.34, - "learning_rate": 3.275477212721952e-05, - "loss": 2.4227, - "step": 197780 - }, - { - "epoch": 0.34, - "learning_rate": 3.27539001872927e-05, - "loss": 2.3905, - "step": 197790 - }, - { - "epoch": 0.34, - "learning_rate": 3.275302824736587e-05, - "loss": 2.3225, - "step": 197800 - }, - { - "epoch": 0.34, - "learning_rate": 3.2752156307439046e-05, - "loss": 2.4173, - "step": 197810 - }, - { - "epoch": 0.34, - "learning_rate": 3.275128436751222e-05, - "loss": 2.3955, - "step": 197820 - }, - { - "epoch": 0.34, - "learning_rate": 3.275041242758539e-05, - "loss": 2.3891, - "step": 197830 - }, - { - "epoch": 0.35, - "learning_rate": 3.2749540487658563e-05, - "loss": 2.3459, - "step": 197840 - }, - { - "epoch": 0.35, - "learning_rate": 3.2748668547731734e-05, - "loss": 2.3574, - "step": 197850 - }, - { - "epoch": 0.35, - "learning_rate": 3.274779660780491e-05, - "loss": 2.3638, - "step": 197860 - }, - { - "epoch": 0.35, - "learning_rate": 3.274692466787808e-05, - "loss": 2.4282, - "step": 197870 - }, - { - "epoch": 0.35, - "learning_rate": 3.274605272795125e-05, - "loss": 2.4323, - "step": 197880 - }, - { - "epoch": 0.35, - "learning_rate": 3.274518078802443e-05, - "loss": 2.3476, - "step": 197890 - }, - { - "epoch": 0.35, - "learning_rate": 3.2744308848097606e-05, - "loss": 2.4799, - "step": 197900 - }, - { - "epoch": 0.35, - "learning_rate": 3.2743436908170776e-05, - "loss": 2.4199, - "step": 197910 - }, - { - "epoch": 0.35, - "learning_rate": 3.274256496824395e-05, - "loss": 2.4037, - "step": 197920 - }, - { - "epoch": 0.35, - "learning_rate": 3.2741693028317124e-05, - "loss": 2.4509, - "step": 197930 - }, - { - "epoch": 0.35, - "learning_rate": 3.2740821088390294e-05, - "loss": 2.448, - "step": 197940 - }, - { - "epoch": 0.35, - "learning_rate": 3.2739949148463465e-05, - "loss": 2.4416, - "step": 197950 - }, - { - "epoch": 0.35, - "learning_rate": 3.273907720853664e-05, - "loss": 2.4769, - "step": 197960 - }, - { - "epoch": 0.35, - "learning_rate": 3.273820526860982e-05, - "loss": 2.4829, - "step": 197970 - }, - { - "epoch": 0.35, - "learning_rate": 3.273733332868299e-05, - "loss": 2.4326, - "step": 197980 - }, - { - "epoch": 0.35, - "learning_rate": 3.273646138875616e-05, - "loss": 2.4176, - "step": 197990 - }, - { - "epoch": 0.35, - "learning_rate": 3.273558944882934e-05, - "loss": 2.5475, - "step": 198000 - }, - { - "epoch": 0.35, - "learning_rate": 3.273471750890251e-05, - "loss": 2.312, - "step": 198010 - }, - { - "epoch": 0.35, - "learning_rate": 3.273384556897568e-05, - "loss": 2.4056, - "step": 198020 - }, - { - "epoch": 0.35, - "learning_rate": 3.2732973629048855e-05, - "loss": 2.3903, - "step": 198030 - }, - { - "epoch": 0.35, - "learning_rate": 3.273210168912203e-05, - "loss": 2.4798, - "step": 198040 - }, - { - "epoch": 0.35, - "learning_rate": 3.27312297491952e-05, - "loss": 2.3929, - "step": 198050 - }, - { - "epoch": 0.35, - "learning_rate": 3.273035780926837e-05, - "loss": 2.4085, - "step": 198060 - }, - { - "epoch": 0.35, - "learning_rate": 3.272948586934155e-05, - "loss": 2.4689, - "step": 198070 - }, - { - "epoch": 0.35, - "learning_rate": 3.272861392941472e-05, - "loss": 2.5175, - "step": 198080 - }, - { - "epoch": 0.35, - "learning_rate": 3.272774198948789e-05, - "loss": 2.3855, - "step": 198090 - }, - { - "epoch": 0.35, - "learning_rate": 3.272687004956107e-05, - "loss": 2.2596, - "step": 198100 - }, - { - "epoch": 0.35, - "learning_rate": 3.2725998109634245e-05, - "loss": 2.3381, - "step": 198110 - }, - { - "epoch": 0.35, - "learning_rate": 3.2725126169707415e-05, - "loss": 2.5421, - "step": 198120 - }, - { - "epoch": 0.35, - "learning_rate": 3.2724254229780586e-05, - "loss": 2.4908, - "step": 198130 - }, - { - "epoch": 0.35, - "learning_rate": 3.272338228985376e-05, - "loss": 2.3996, - "step": 198140 - }, - { - "epoch": 0.35, - "learning_rate": 3.2722510349926933e-05, - "loss": 2.4501, - "step": 198150 - }, - { - "epoch": 0.35, - "learning_rate": 3.2721638410000104e-05, - "loss": 2.4486, - "step": 198160 - }, - { - "epoch": 0.35, - "learning_rate": 3.2720766470073274e-05, - "loss": 2.3831, - "step": 198170 - }, - { - "epoch": 0.35, - "learning_rate": 3.271989453014645e-05, - "loss": 2.4209, - "step": 198180 - }, - { - "epoch": 0.35, - "learning_rate": 3.271902259021963e-05, - "loss": 2.3984, - "step": 198190 - }, - { - "epoch": 0.35, - "learning_rate": 3.27181506502928e-05, - "loss": 2.4279, - "step": 198200 - }, - { - "epoch": 0.35, - "learning_rate": 3.2717278710365976e-05, - "loss": 2.524, - "step": 198210 - }, - { - "epoch": 0.35, - "learning_rate": 3.2716406770439146e-05, - "loss": 2.5045, - "step": 198220 - }, - { - "epoch": 0.35, - "learning_rate": 3.271553483051232e-05, - "loss": 2.5091, - "step": 198230 - }, - { - "epoch": 0.35, - "learning_rate": 3.271466289058549e-05, - "loss": 2.4571, - "step": 198240 - }, - { - "epoch": 0.35, - "learning_rate": 3.2713790950658664e-05, - "loss": 2.3588, - "step": 198250 - }, - { - "epoch": 0.35, - "learning_rate": 3.271291901073184e-05, - "loss": 2.4771, - "step": 198260 - }, - { - "epoch": 0.35, - "learning_rate": 3.271204707080501e-05, - "loss": 2.4653, - "step": 198270 - }, - { - "epoch": 0.35, - "learning_rate": 3.271117513087818e-05, - "loss": 2.369, - "step": 198280 - }, - { - "epoch": 0.35, - "learning_rate": 3.271030319095136e-05, - "loss": 2.3752, - "step": 198290 - }, - { - "epoch": 0.35, - "learning_rate": 3.270943125102453e-05, - "loss": 2.3578, - "step": 198300 - }, - { - "epoch": 0.35, - "learning_rate": 3.27085593110977e-05, - "loss": 2.3974, - "step": 198310 - }, - { - "epoch": 0.35, - "learning_rate": 3.270768737117088e-05, - "loss": 2.487, - "step": 198320 - }, - { - "epoch": 0.35, - "learning_rate": 3.2706815431244054e-05, - "loss": 2.5572, - "step": 198330 - }, - { - "epoch": 0.35, - "learning_rate": 3.2705943491317225e-05, - "loss": 2.3625, - "step": 198340 - }, - { - "epoch": 0.35, - "learning_rate": 3.2705071551390395e-05, - "loss": 2.4762, - "step": 198350 - }, - { - "epoch": 0.35, - "learning_rate": 3.270419961146357e-05, - "loss": 2.4687, - "step": 198360 - }, - { - "epoch": 0.35, - "learning_rate": 3.270332767153674e-05, - "loss": 2.5188, - "step": 198370 - }, - { - "epoch": 0.35, - "learning_rate": 3.270245573160991e-05, - "loss": 2.3417, - "step": 198380 - }, - { - "epoch": 0.35, - "learning_rate": 3.270158379168309e-05, - "loss": 2.3281, - "step": 198390 - }, - { - "epoch": 0.35, - "learning_rate": 3.270071185175626e-05, - "loss": 2.4652, - "step": 198400 - }, - { - "epoch": 0.35, - "learning_rate": 3.269983991182944e-05, - "loss": 2.5224, - "step": 198410 - }, - { - "epoch": 0.35, - "learning_rate": 3.269896797190261e-05, - "loss": 2.4124, - "step": 198420 - }, - { - "epoch": 0.35, - "learning_rate": 3.2698096031975785e-05, - "loss": 2.4789, - "step": 198430 - }, - { - "epoch": 0.35, - "learning_rate": 3.2697224092048956e-05, - "loss": 2.4617, - "step": 198440 - }, - { - "epoch": 0.35, - "learning_rate": 3.2696352152122126e-05, - "loss": 2.4195, - "step": 198450 - }, - { - "epoch": 0.35, - "learning_rate": 3.26954802121953e-05, - "loss": 2.4181, - "step": 198460 - }, - { - "epoch": 0.35, - "learning_rate": 3.2694608272268474e-05, - "loss": 2.3752, - "step": 198470 - }, - { - "epoch": 0.35, - "learning_rate": 3.269373633234165e-05, - "loss": 2.4485, - "step": 198480 - }, - { - "epoch": 0.35, - "learning_rate": 3.269286439241482e-05, - "loss": 2.5333, - "step": 198490 - }, - { - "epoch": 0.35, - "learning_rate": 3.2691992452488e-05, - "loss": 2.5055, - "step": 198500 - }, - { - "epoch": 0.35, - "learning_rate": 3.269112051256117e-05, - "loss": 2.4167, - "step": 198510 - }, - { - "epoch": 0.35, - "learning_rate": 3.269024857263434e-05, - "loss": 2.325, - "step": 198520 - }, - { - "epoch": 0.35, - "learning_rate": 3.2689376632707516e-05, - "loss": 2.4221, - "step": 198530 - }, - { - "epoch": 0.35, - "learning_rate": 3.268850469278069e-05, - "loss": 2.3227, - "step": 198540 - }, - { - "epoch": 0.35, - "learning_rate": 3.268763275285386e-05, - "loss": 2.4009, - "step": 198550 - }, - { - "epoch": 0.35, - "learning_rate": 3.2686760812927034e-05, - "loss": 2.4924, - "step": 198560 - }, - { - "epoch": 0.35, - "learning_rate": 3.268588887300021e-05, - "loss": 2.4998, - "step": 198570 - }, - { - "epoch": 0.35, - "learning_rate": 3.268501693307338e-05, - "loss": 2.5625, - "step": 198580 - }, - { - "epoch": 0.35, - "learning_rate": 3.268414499314655e-05, - "loss": 2.5713, - "step": 198590 - }, - { - "epoch": 0.35, - "learning_rate": 3.268327305321973e-05, - "loss": 2.3628, - "step": 198600 - }, - { - "epoch": 0.35, - "learning_rate": 3.26824011132929e-05, - "loss": 2.5879, - "step": 198610 - }, - { - "epoch": 0.35, - "learning_rate": 3.268152917336607e-05, - "loss": 2.3452, - "step": 198620 - }, - { - "epoch": 0.35, - "learning_rate": 3.268065723343925e-05, - "loss": 2.4237, - "step": 198630 - }, - { - "epoch": 0.35, - "learning_rate": 3.2679785293512424e-05, - "loss": 2.4769, - "step": 198640 - }, - { - "epoch": 0.35, - "learning_rate": 3.2678913353585595e-05, - "loss": 2.462, - "step": 198650 - }, - { - "epoch": 0.35, - "learning_rate": 3.2678041413658765e-05, - "loss": 2.4017, - "step": 198660 - }, - { - "epoch": 0.35, - "learning_rate": 3.2677169473731936e-05, - "loss": 2.3617, - "step": 198670 - }, - { - "epoch": 0.35, - "learning_rate": 3.267629753380511e-05, - "loss": 2.5034, - "step": 198680 - }, - { - "epoch": 0.35, - "learning_rate": 3.267542559387828e-05, - "loss": 2.5002, - "step": 198690 - }, - { - "epoch": 0.35, - "learning_rate": 3.2674553653951453e-05, - "loss": 2.4398, - "step": 198700 - }, - { - "epoch": 0.35, - "learning_rate": 3.267368171402464e-05, - "loss": 2.5269, - "step": 198710 - }, - { - "epoch": 0.35, - "learning_rate": 3.267280977409781e-05, - "loss": 2.4625, - "step": 198720 - }, - { - "epoch": 0.35, - "learning_rate": 3.267193783417098e-05, - "loss": 2.4227, - "step": 198730 - }, - { - "epoch": 0.35, - "learning_rate": 3.267106589424415e-05, - "loss": 2.4081, - "step": 198740 - }, - { - "epoch": 0.35, - "learning_rate": 3.2670193954317326e-05, - "loss": 2.4563, - "step": 198750 - }, - { - "epoch": 0.35, - "learning_rate": 3.2669322014390496e-05, - "loss": 2.3753, - "step": 198760 - }, - { - "epoch": 0.35, - "learning_rate": 3.2668450074463666e-05, - "loss": 2.4041, - "step": 198770 - }, - { - "epoch": 0.35, - "learning_rate": 3.2667578134536844e-05, - "loss": 2.5012, - "step": 198780 - }, - { - "epoch": 0.35, - "learning_rate": 3.266670619461002e-05, - "loss": 2.4334, - "step": 198790 - }, - { - "epoch": 0.35, - "learning_rate": 3.266583425468319e-05, - "loss": 2.3591, - "step": 198800 - }, - { - "epoch": 0.35, - "learning_rate": 3.266496231475636e-05, - "loss": 2.4966, - "step": 198810 - }, - { - "epoch": 0.35, - "learning_rate": 3.266409037482954e-05, - "loss": 2.374, - "step": 198820 - }, - { - "epoch": 0.35, - "learning_rate": 3.266321843490271e-05, - "loss": 2.5311, - "step": 198830 - }, - { - "epoch": 0.35, - "learning_rate": 3.266234649497588e-05, - "loss": 2.4285, - "step": 198840 - }, - { - "epoch": 0.35, - "learning_rate": 3.266147455504906e-05, - "loss": 2.4086, - "step": 198850 - }, - { - "epoch": 0.35, - "learning_rate": 3.2660602615122234e-05, - "loss": 2.4313, - "step": 198860 - }, - { - "epoch": 0.35, - "learning_rate": 3.2659730675195404e-05, - "loss": 2.5595, - "step": 198870 - }, - { - "epoch": 0.35, - "learning_rate": 3.2658858735268575e-05, - "loss": 2.4121, - "step": 198880 - }, - { - "epoch": 0.35, - "learning_rate": 3.265798679534175e-05, - "loss": 2.4785, - "step": 198890 - }, - { - "epoch": 0.35, - "learning_rate": 3.265711485541492e-05, - "loss": 2.4694, - "step": 198900 - }, - { - "epoch": 0.35, - "learning_rate": 3.265624291548809e-05, - "loss": 2.5109, - "step": 198910 - }, - { - "epoch": 0.35, - "learning_rate": 3.265537097556127e-05, - "loss": 2.3871, - "step": 198920 - }, - { - "epoch": 0.35, - "learning_rate": 3.265449903563445e-05, - "loss": 2.4365, - "step": 198930 - }, - { - "epoch": 0.35, - "learning_rate": 3.265362709570762e-05, - "loss": 2.3069, - "step": 198940 - }, - { - "epoch": 0.35, - "learning_rate": 3.265275515578079e-05, - "loss": 2.4487, - "step": 198950 - }, - { - "epoch": 0.35, - "learning_rate": 3.2651883215853965e-05, - "loss": 2.4408, - "step": 198960 - }, - { - "epoch": 0.35, - "learning_rate": 3.2651011275927135e-05, - "loss": 2.4553, - "step": 198970 - }, - { - "epoch": 0.35, - "learning_rate": 3.2650139336000305e-05, - "loss": 2.4517, - "step": 198980 - }, - { - "epoch": 0.35, - "learning_rate": 3.264926739607348e-05, - "loss": 2.4025, - "step": 198990 - }, - { - "epoch": 0.35, - "learning_rate": 3.264839545614666e-05, - "loss": 2.5362, - "step": 199000 - }, - { - "epoch": 0.35, - "learning_rate": 3.264752351621983e-05, - "loss": 2.3784, - "step": 199010 - }, - { - "epoch": 0.35, - "learning_rate": 3.2646651576293e-05, - "loss": 2.4592, - "step": 199020 - }, - { - "epoch": 0.35, - "learning_rate": 3.264577963636618e-05, - "loss": 2.3538, - "step": 199030 - }, - { - "epoch": 0.35, - "learning_rate": 3.264490769643935e-05, - "loss": 2.3656, - "step": 199040 - }, - { - "epoch": 0.35, - "learning_rate": 3.264403575651252e-05, - "loss": 2.3562, - "step": 199050 - }, - { - "epoch": 0.35, - "learning_rate": 3.2643163816585696e-05, - "loss": 2.4429, - "step": 199060 - }, - { - "epoch": 0.35, - "learning_rate": 3.2642291876658866e-05, - "loss": 2.4409, - "step": 199070 - }, - { - "epoch": 0.35, - "learning_rate": 3.264141993673204e-05, - "loss": 2.3889, - "step": 199080 - }, - { - "epoch": 0.35, - "learning_rate": 3.2640547996805214e-05, - "loss": 2.4449, - "step": 199090 - }, - { - "epoch": 0.35, - "learning_rate": 3.263967605687839e-05, - "loss": 2.3462, - "step": 199100 - }, - { - "epoch": 0.35, - "learning_rate": 3.263880411695156e-05, - "loss": 2.3999, - "step": 199110 - }, - { - "epoch": 0.35, - "learning_rate": 3.263793217702473e-05, - "loss": 2.4371, - "step": 199120 - }, - { - "epoch": 0.35, - "learning_rate": 3.26370602370979e-05, - "loss": 2.3326, - "step": 199130 - }, - { - "epoch": 0.35, - "learning_rate": 3.263618829717108e-05, - "loss": 2.299, - "step": 199140 - }, - { - "epoch": 0.35, - "learning_rate": 3.2635316357244256e-05, - "loss": 2.2778, - "step": 199150 - }, - { - "epoch": 0.35, - "learning_rate": 3.2634444417317427e-05, - "loss": 2.4341, - "step": 199160 - }, - { - "epoch": 0.35, - "learning_rate": 3.2633572477390604e-05, - "loss": 2.3902, - "step": 199170 - }, - { - "epoch": 0.35, - "learning_rate": 3.2632700537463774e-05, - "loss": 2.4315, - "step": 199180 - }, - { - "epoch": 0.35, - "learning_rate": 3.2631828597536944e-05, - "loss": 2.5137, - "step": 199190 - }, - { - "epoch": 0.35, - "learning_rate": 3.2630956657610115e-05, - "loss": 2.4676, - "step": 199200 - }, - { - "epoch": 0.35, - "learning_rate": 3.263008471768329e-05, - "loss": 2.4558, - "step": 199210 - }, - { - "epoch": 0.35, - "learning_rate": 3.262921277775646e-05, - "loss": 2.5041, - "step": 199220 - }, - { - "epoch": 0.35, - "learning_rate": 3.262834083782964e-05, - "loss": 2.5027, - "step": 199230 - }, - { - "epoch": 0.35, - "learning_rate": 3.262746889790281e-05, - "loss": 2.4124, - "step": 199240 - }, - { - "epoch": 0.35, - "learning_rate": 3.262659695797599e-05, - "loss": 2.37, - "step": 199250 - }, - { - "epoch": 0.35, - "learning_rate": 3.262572501804916e-05, - "loss": 2.3537, - "step": 199260 - }, - { - "epoch": 0.35, - "learning_rate": 3.262485307812233e-05, - "loss": 2.2568, - "step": 199270 - }, - { - "epoch": 0.35, - "learning_rate": 3.2623981138195505e-05, - "loss": 2.4383, - "step": 199280 - }, - { - "epoch": 0.35, - "learning_rate": 3.2623109198268675e-05, - "loss": 2.416, - "step": 199290 - }, - { - "epoch": 0.35, - "learning_rate": 3.262223725834185e-05, - "loss": 2.4458, - "step": 199300 - }, - { - "epoch": 0.35, - "learning_rate": 3.262136531841502e-05, - "loss": 2.4909, - "step": 199310 - }, - { - "epoch": 0.35, - "learning_rate": 3.26204933784882e-05, - "loss": 2.3691, - "step": 199320 - }, - { - "epoch": 0.35, - "learning_rate": 3.261962143856137e-05, - "loss": 2.4178, - "step": 199330 - }, - { - "epoch": 0.35, - "learning_rate": 3.261874949863454e-05, - "loss": 2.4862, - "step": 199340 - }, - { - "epoch": 0.35, - "learning_rate": 3.261787755870772e-05, - "loss": 2.3762, - "step": 199350 - }, - { - "epoch": 0.35, - "learning_rate": 3.261700561878089e-05, - "loss": 2.4365, - "step": 199360 - }, - { - "epoch": 0.35, - "learning_rate": 3.261613367885406e-05, - "loss": 2.4009, - "step": 199370 - }, - { - "epoch": 0.35, - "learning_rate": 3.2615261738927236e-05, - "loss": 2.4796, - "step": 199380 - }, - { - "epoch": 0.35, - "learning_rate": 3.261438979900041e-05, - "loss": 2.3846, - "step": 199390 - }, - { - "epoch": 0.35, - "learning_rate": 3.2613517859073584e-05, - "loss": 2.3258, - "step": 199400 - }, - { - "epoch": 0.35, - "learning_rate": 3.2612645919146754e-05, - "loss": 2.376, - "step": 199410 - }, - { - "epoch": 0.35, - "learning_rate": 3.261177397921993e-05, - "loss": 2.4126, - "step": 199420 - }, - { - "epoch": 0.35, - "learning_rate": 3.26109020392931e-05, - "loss": 2.4482, - "step": 199430 - }, - { - "epoch": 0.35, - "learning_rate": 3.261003009936627e-05, - "loss": 2.3738, - "step": 199440 - }, - { - "epoch": 0.35, - "learning_rate": 3.260915815943945e-05, - "loss": 2.443, - "step": 199450 - }, - { - "epoch": 0.35, - "learning_rate": 3.2608286219512626e-05, - "loss": 2.402, - "step": 199460 - }, - { - "epoch": 0.35, - "learning_rate": 3.2607414279585797e-05, - "loss": 2.3742, - "step": 199470 - }, - { - "epoch": 0.35, - "learning_rate": 3.260654233965897e-05, - "loss": 2.4329, - "step": 199480 - }, - { - "epoch": 0.35, - "learning_rate": 3.2605670399732144e-05, - "loss": 2.3985, - "step": 199490 - }, - { - "epoch": 0.35, - "learning_rate": 3.2604798459805314e-05, - "loss": 2.4421, - "step": 199500 - }, - { - "epoch": 0.35, - "learning_rate": 3.2603926519878485e-05, - "loss": 2.5025, - "step": 199510 - }, - { - "epoch": 0.35, - "learning_rate": 3.2603054579951655e-05, - "loss": 2.2736, - "step": 199520 - }, - { - "epoch": 0.35, - "learning_rate": 3.260218264002484e-05, - "loss": 2.408, - "step": 199530 - }, - { - "epoch": 0.35, - "learning_rate": 3.260131070009801e-05, - "loss": 2.4409, - "step": 199540 - }, - { - "epoch": 0.35, - "learning_rate": 3.260043876017118e-05, - "loss": 2.3861, - "step": 199550 - }, - { - "epoch": 0.35, - "learning_rate": 3.259956682024436e-05, - "loss": 2.2761, - "step": 199560 - }, - { - "epoch": 0.35, - "learning_rate": 3.259869488031753e-05, - "loss": 2.3794, - "step": 199570 - }, - { - "epoch": 0.35, - "learning_rate": 3.25978229403907e-05, - "loss": 2.4682, - "step": 199580 - }, - { - "epoch": 0.35, - "learning_rate": 3.259695100046387e-05, - "loss": 2.4653, - "step": 199590 - }, - { - "epoch": 0.35, - "learning_rate": 3.259607906053705e-05, - "loss": 2.3939, - "step": 199600 - }, - { - "epoch": 0.35, - "learning_rate": 3.259520712061022e-05, - "loss": 2.4258, - "step": 199610 - }, - { - "epoch": 0.35, - "learning_rate": 3.259433518068339e-05, - "loss": 2.4438, - "step": 199620 - }, - { - "epoch": 0.35, - "learning_rate": 3.259346324075656e-05, - "loss": 2.3699, - "step": 199630 - }, - { - "epoch": 0.35, - "learning_rate": 3.259259130082974e-05, - "loss": 2.5553, - "step": 199640 - }, - { - "epoch": 0.35, - "learning_rate": 3.259171936090291e-05, - "loss": 2.4395, - "step": 199650 - }, - { - "epoch": 0.35, - "learning_rate": 3.259084742097608e-05, - "loss": 2.413, - "step": 199660 - }, - { - "epoch": 0.35, - "learning_rate": 3.2589975481049265e-05, - "loss": 2.3086, - "step": 199670 - }, - { - "epoch": 0.35, - "learning_rate": 3.2589103541122436e-05, - "loss": 2.4864, - "step": 199680 - }, - { - "epoch": 0.35, - "learning_rate": 3.2588231601195606e-05, - "loss": 2.4191, - "step": 199690 - }, - { - "epoch": 0.35, - "learning_rate": 3.2587359661268776e-05, - "loss": 2.3275, - "step": 199700 - }, - { - "epoch": 0.35, - "learning_rate": 3.2586487721341953e-05, - "loss": 2.4964, - "step": 199710 - }, - { - "epoch": 0.35, - "learning_rate": 3.2585615781415124e-05, - "loss": 2.4897, - "step": 199720 - }, - { - "epoch": 0.35, - "learning_rate": 3.2584743841488294e-05, - "loss": 2.4301, - "step": 199730 - }, - { - "epoch": 0.35, - "learning_rate": 3.258387190156147e-05, - "loss": 2.4251, - "step": 199740 - }, - { - "epoch": 0.35, - "learning_rate": 3.258299996163465e-05, - "loss": 2.3386, - "step": 199750 - }, - { - "epoch": 0.35, - "learning_rate": 3.258212802170782e-05, - "loss": 2.471, - "step": 199760 - }, - { - "epoch": 0.35, - "learning_rate": 3.258125608178099e-05, - "loss": 2.2313, - "step": 199770 - }, - { - "epoch": 0.35, - "learning_rate": 3.2580384141854166e-05, - "loss": 2.3081, - "step": 199780 - }, - { - "epoch": 0.35, - "learning_rate": 3.257951220192734e-05, - "loss": 2.4874, - "step": 199790 - }, - { - "epoch": 0.35, - "learning_rate": 3.257864026200051e-05, - "loss": 2.3451, - "step": 199800 - }, - { - "epoch": 0.35, - "learning_rate": 3.2577768322073684e-05, - "loss": 2.4659, - "step": 199810 - }, - { - "epoch": 0.35, - "learning_rate": 3.257689638214686e-05, - "loss": 2.3594, - "step": 199820 - }, - { - "epoch": 0.35, - "learning_rate": 3.257602444222003e-05, - "loss": 2.3494, - "step": 199830 - }, - { - "epoch": 0.35, - "learning_rate": 3.25751525022932e-05, - "loss": 2.2746, - "step": 199840 - }, - { - "epoch": 0.35, - "learning_rate": 3.257428056236638e-05, - "loss": 2.4961, - "step": 199850 - }, - { - "epoch": 0.35, - "learning_rate": 3.257340862243955e-05, - "loss": 2.3841, - "step": 199860 - }, - { - "epoch": 0.35, - "learning_rate": 3.257253668251272e-05, - "loss": 2.4391, - "step": 199870 - }, - { - "epoch": 0.35, - "learning_rate": 3.25716647425859e-05, - "loss": 2.3875, - "step": 199880 - }, - { - "epoch": 0.35, - "learning_rate": 3.257079280265907e-05, - "loss": 2.5286, - "step": 199890 - }, - { - "epoch": 0.35, - "learning_rate": 3.2569920862732245e-05, - "loss": 2.294, - "step": 199900 - }, - { - "epoch": 0.35, - "learning_rate": 3.2569048922805415e-05, - "loss": 2.4811, - "step": 199910 - }, - { - "epoch": 0.35, - "learning_rate": 3.256817698287859e-05, - "loss": 2.5192, - "step": 199920 - }, - { - "epoch": 0.35, - "learning_rate": 3.256730504295176e-05, - "loss": 2.353, - "step": 199930 - }, - { - "epoch": 0.35, - "learning_rate": 3.256643310302493e-05, - "loss": 2.3902, - "step": 199940 - }, - { - "epoch": 0.35, - "learning_rate": 3.256556116309811e-05, - "loss": 2.4699, - "step": 199950 - }, - { - "epoch": 0.35, - "learning_rate": 3.256468922317128e-05, - "loss": 2.4408, - "step": 199960 - }, - { - "epoch": 0.35, - "learning_rate": 3.256381728324446e-05, - "loss": 2.4956, - "step": 199970 - }, - { - "epoch": 0.35, - "learning_rate": 3.256294534331763e-05, - "loss": 2.4474, - "step": 199980 - }, - { - "epoch": 0.35, - "learning_rate": 3.2562073403390805e-05, - "loss": 2.4985, - "step": 199990 - }, - { - "epoch": 0.35, - "learning_rate": 3.2561201463463976e-05, - "loss": 2.3258, - "step": 200000 - }, - { - "epoch": 0.35, - "learning_rate": 3.2560329523537146e-05, - "loss": 2.375, - "step": 200010 - }, - { - "epoch": 0.35, - "learning_rate": 3.2559457583610317e-05, - "loss": 2.4304, - "step": 200020 - }, - { - "epoch": 0.35, - "learning_rate": 3.2558585643683494e-05, - "loss": 2.5263, - "step": 200030 - }, - { - "epoch": 0.35, - "learning_rate": 3.2557713703756664e-05, - "loss": 2.4025, - "step": 200040 - }, - { - "epoch": 0.35, - "learning_rate": 3.255684176382984e-05, - "loss": 2.4592, - "step": 200050 - }, - { - "epoch": 0.35, - "learning_rate": 3.255596982390302e-05, - "loss": 2.4198, - "step": 200060 - }, - { - "epoch": 0.35, - "learning_rate": 3.255509788397619e-05, - "loss": 2.4058, - "step": 200070 - }, - { - "epoch": 0.35, - "learning_rate": 3.255422594404936e-05, - "loss": 2.3121, - "step": 200080 - }, - { - "epoch": 0.35, - "learning_rate": 3.255335400412253e-05, - "loss": 2.4499, - "step": 200090 - }, - { - "epoch": 0.35, - "learning_rate": 3.255248206419571e-05, - "loss": 2.3441, - "step": 200100 - }, - { - "epoch": 0.35, - "learning_rate": 3.255161012426888e-05, - "loss": 2.3203, - "step": 200110 - }, - { - "epoch": 0.35, - "learning_rate": 3.2550738184342054e-05, - "loss": 2.3759, - "step": 200120 - }, - { - "epoch": 0.35, - "learning_rate": 3.2549866244415225e-05, - "loss": 2.3744, - "step": 200130 - }, - { - "epoch": 0.35, - "learning_rate": 3.25489943044884e-05, - "loss": 2.3382, - "step": 200140 - }, - { - "epoch": 0.35, - "learning_rate": 3.254812236456157e-05, - "loss": 2.4322, - "step": 200150 - }, - { - "epoch": 0.35, - "learning_rate": 3.254725042463474e-05, - "loss": 2.4109, - "step": 200160 - }, - { - "epoch": 0.35, - "learning_rate": 3.254637848470792e-05, - "loss": 2.3789, - "step": 200170 - }, - { - "epoch": 0.35, - "learning_rate": 3.254550654478109e-05, - "loss": 2.424, - "step": 200180 - }, - { - "epoch": 0.35, - "learning_rate": 3.254463460485427e-05, - "loss": 2.3609, - "step": 200190 - }, - { - "epoch": 0.35, - "learning_rate": 3.254376266492744e-05, - "loss": 2.4249, - "step": 200200 - }, - { - "epoch": 0.35, - "learning_rate": 3.2542890725000615e-05, - "loss": 2.3976, - "step": 200210 - }, - { - "epoch": 0.35, - "learning_rate": 3.2542018785073785e-05, - "loss": 2.4664, - "step": 200220 - }, - { - "epoch": 0.35, - "learning_rate": 3.2541146845146956e-05, - "loss": 2.5167, - "step": 200230 - }, - { - "epoch": 0.35, - "learning_rate": 3.254027490522013e-05, - "loss": 2.4559, - "step": 200240 - }, - { - "epoch": 0.35, - "learning_rate": 3.25394029652933e-05, - "loss": 2.4562, - "step": 200250 - }, - { - "epoch": 0.35, - "learning_rate": 3.2538531025366474e-05, - "loss": 2.4423, - "step": 200260 - }, - { - "epoch": 0.35, - "learning_rate": 3.253765908543965e-05, - "loss": 2.3411, - "step": 200270 - }, - { - "epoch": 0.35, - "learning_rate": 3.253678714551283e-05, - "loss": 2.4759, - "step": 200280 - }, - { - "epoch": 0.35, - "learning_rate": 3.2535915205586e-05, - "loss": 2.4588, - "step": 200290 - }, - { - "epoch": 0.35, - "learning_rate": 3.253504326565917e-05, - "loss": 2.4729, - "step": 200300 - }, - { - "epoch": 0.35, - "learning_rate": 3.2534171325732346e-05, - "loss": 2.5079, - "step": 200310 - }, - { - "epoch": 0.35, - "learning_rate": 3.2533299385805516e-05, - "loss": 2.3768, - "step": 200320 - }, - { - "epoch": 0.35, - "learning_rate": 3.2532427445878687e-05, - "loss": 2.4536, - "step": 200330 - }, - { - "epoch": 0.35, - "learning_rate": 3.2531555505951864e-05, - "loss": 2.4222, - "step": 200340 - }, - { - "epoch": 0.35, - "learning_rate": 3.253068356602504e-05, - "loss": 2.4645, - "step": 200350 - }, - { - "epoch": 0.35, - "learning_rate": 3.252981162609821e-05, - "loss": 2.4242, - "step": 200360 - }, - { - "epoch": 0.35, - "learning_rate": 3.252893968617138e-05, - "loss": 2.3308, - "step": 200370 - }, - { - "epoch": 0.35, - "learning_rate": 3.252806774624456e-05, - "loss": 2.5865, - "step": 200380 - }, - { - "epoch": 0.35, - "learning_rate": 3.252719580631773e-05, - "loss": 2.4242, - "step": 200390 - }, - { - "epoch": 0.35, - "learning_rate": 3.25263238663909e-05, - "loss": 2.4043, - "step": 200400 - }, - { - "epoch": 0.35, - "learning_rate": 3.252545192646408e-05, - "loss": 2.3827, - "step": 200410 - }, - { - "epoch": 0.35, - "learning_rate": 3.2524579986537254e-05, - "loss": 2.492, - "step": 200420 - }, - { - "epoch": 0.35, - "learning_rate": 3.2523708046610424e-05, - "loss": 2.4153, - "step": 200430 - }, - { - "epoch": 0.35, - "learning_rate": 3.2522836106683595e-05, - "loss": 2.4152, - "step": 200440 - }, - { - "epoch": 0.35, - "learning_rate": 3.252196416675677e-05, - "loss": 2.4897, - "step": 200450 - }, - { - "epoch": 0.35, - "learning_rate": 3.252109222682994e-05, - "loss": 2.4158, - "step": 200460 - }, - { - "epoch": 0.35, - "learning_rate": 3.252022028690311e-05, - "loss": 2.3367, - "step": 200470 - }, - { - "epoch": 0.35, - "learning_rate": 3.251934834697628e-05, - "loss": 2.4927, - "step": 200480 - }, - { - "epoch": 0.35, - "learning_rate": 3.251847640704947e-05, - "loss": 2.3526, - "step": 200490 - }, - { - "epoch": 0.35, - "learning_rate": 3.251760446712264e-05, - "loss": 2.4911, - "step": 200500 - }, - { - "epoch": 0.35, - "learning_rate": 3.251673252719581e-05, - "loss": 2.387, - "step": 200510 - }, - { - "epoch": 0.35, - "learning_rate": 3.2515860587268985e-05, - "loss": 2.579, - "step": 200520 - }, - { - "epoch": 0.35, - "learning_rate": 3.2514988647342155e-05, - "loss": 2.3701, - "step": 200530 - }, - { - "epoch": 0.35, - "learning_rate": 3.2514116707415326e-05, - "loss": 2.4414, - "step": 200540 - }, - { - "epoch": 0.35, - "learning_rate": 3.2513244767488496e-05, - "loss": 2.4518, - "step": 200550 - }, - { - "epoch": 0.35, - "learning_rate": 3.251237282756167e-05, - "loss": 2.3626, - "step": 200560 - }, - { - "epoch": 0.35, - "learning_rate": 3.251150088763485e-05, - "loss": 2.4489, - "step": 200570 - }, - { - "epoch": 0.35, - "learning_rate": 3.251062894770802e-05, - "loss": 2.4973, - "step": 200580 - }, - { - "epoch": 0.35, - "learning_rate": 3.250975700778119e-05, - "loss": 2.3838, - "step": 200590 - }, - { - "epoch": 0.35, - "learning_rate": 3.250888506785437e-05, - "loss": 2.4427, - "step": 200600 - }, - { - "epoch": 0.35, - "learning_rate": 3.250801312792754e-05, - "loss": 2.5204, - "step": 200610 - }, - { - "epoch": 0.35, - "learning_rate": 3.250714118800071e-05, - "loss": 2.3146, - "step": 200620 - }, - { - "epoch": 0.35, - "learning_rate": 3.2506269248073886e-05, - "loss": 2.4796, - "step": 200630 - }, - { - "epoch": 0.35, - "learning_rate": 3.250539730814706e-05, - "loss": 2.4298, - "step": 200640 - }, - { - "epoch": 0.35, - "learning_rate": 3.2504525368220234e-05, - "loss": 2.3469, - "step": 200650 - }, - { - "epoch": 0.35, - "learning_rate": 3.2503653428293404e-05, - "loss": 2.4688, - "step": 200660 - }, - { - "epoch": 0.35, - "learning_rate": 3.250278148836658e-05, - "loss": 2.4075, - "step": 200670 - }, - { - "epoch": 0.35, - "learning_rate": 3.250190954843975e-05, - "loss": 2.4646, - "step": 200680 - }, - { - "epoch": 0.35, - "learning_rate": 3.250103760851292e-05, - "loss": 2.4594, - "step": 200690 - }, - { - "epoch": 0.35, - "learning_rate": 3.25001656685861e-05, - "loss": 2.4527, - "step": 200700 - }, - { - "epoch": 0.35, - "learning_rate": 3.249929372865927e-05, - "loss": 2.3821, - "step": 200710 - }, - { - "epoch": 0.35, - "learning_rate": 3.2498421788732447e-05, - "loss": 2.4244, - "step": 200720 - }, - { - "epoch": 0.35, - "learning_rate": 3.249754984880562e-05, - "loss": 2.4261, - "step": 200730 - }, - { - "epoch": 0.35, - "learning_rate": 3.2496677908878794e-05, - "loss": 2.3534, - "step": 200740 - }, - { - "epoch": 0.35, - "learning_rate": 3.2495805968951965e-05, - "loss": 2.5238, - "step": 200750 - }, - { - "epoch": 0.35, - "learning_rate": 3.2494934029025135e-05, - "loss": 2.4096, - "step": 200760 - }, - { - "epoch": 0.35, - "learning_rate": 3.249406208909831e-05, - "loss": 2.4505, - "step": 200770 - }, - { - "epoch": 0.35, - "learning_rate": 3.249319014917148e-05, - "loss": 2.5289, - "step": 200780 - }, - { - "epoch": 0.35, - "learning_rate": 3.249231820924466e-05, - "loss": 2.3185, - "step": 200790 - }, - { - "epoch": 0.35, - "learning_rate": 3.249144626931783e-05, - "loss": 2.4866, - "step": 200800 - }, - { - "epoch": 0.35, - "learning_rate": 3.249057432939101e-05, - "loss": 2.483, - "step": 200810 - }, - { - "epoch": 0.35, - "learning_rate": 3.248970238946418e-05, - "loss": 2.4259, - "step": 200820 - }, - { - "epoch": 0.35, - "learning_rate": 3.248883044953735e-05, - "loss": 2.5148, - "step": 200830 - }, - { - "epoch": 0.35, - "learning_rate": 3.2487958509610525e-05, - "loss": 2.4259, - "step": 200840 - }, - { - "epoch": 0.35, - "learning_rate": 3.2487086569683695e-05, - "loss": 2.3345, - "step": 200850 - }, - { - "epoch": 0.35, - "learning_rate": 3.248621462975687e-05, - "loss": 2.3989, - "step": 200860 - }, - { - "epoch": 0.35, - "learning_rate": 3.248534268983004e-05, - "loss": 2.4234, - "step": 200870 - }, - { - "epoch": 0.35, - "learning_rate": 3.248447074990322e-05, - "loss": 2.3935, - "step": 200880 - }, - { - "epoch": 0.35, - "learning_rate": 3.248359880997639e-05, - "loss": 2.3581, - "step": 200890 - }, - { - "epoch": 0.35, - "learning_rate": 3.248272687004956e-05, - "loss": 2.3465, - "step": 200900 - }, - { - "epoch": 0.35, - "learning_rate": 3.248185493012274e-05, - "loss": 2.4603, - "step": 200910 - }, - { - "epoch": 0.35, - "learning_rate": 3.248098299019591e-05, - "loss": 2.3332, - "step": 200920 - }, - { - "epoch": 0.35, - "learning_rate": 3.248011105026908e-05, - "loss": 2.3961, - "step": 200930 - }, - { - "epoch": 0.35, - "learning_rate": 3.2479239110342256e-05, - "loss": 2.3703, - "step": 200940 - }, - { - "epoch": 0.35, - "learning_rate": 3.247836717041543e-05, - "loss": 2.4118, - "step": 200950 - }, - { - "epoch": 0.35, - "learning_rate": 3.2477495230488604e-05, - "loss": 2.49, - "step": 200960 - }, - { - "epoch": 0.35, - "learning_rate": 3.2476623290561774e-05, - "loss": 2.4424, - "step": 200970 - }, - { - "epoch": 0.35, - "learning_rate": 3.2475751350634944e-05, - "loss": 2.3982, - "step": 200980 - }, - { - "epoch": 0.35, - "learning_rate": 3.247487941070812e-05, - "loss": 2.3806, - "step": 200990 - }, - { - "epoch": 0.35, - "learning_rate": 3.247400747078129e-05, - "loss": 2.3538, - "step": 201000 - }, - { - "epoch": 0.35, - "learning_rate": 3.247313553085447e-05, - "loss": 2.4384, - "step": 201010 - }, - { - "epoch": 0.35, - "learning_rate": 3.2472263590927646e-05, - "loss": 2.4275, - "step": 201020 - }, - { - "epoch": 0.35, - "learning_rate": 3.2471391651000817e-05, - "loss": 2.4233, - "step": 201030 - }, - { - "epoch": 0.35, - "learning_rate": 3.247051971107399e-05, - "loss": 2.4223, - "step": 201040 - }, - { - "epoch": 0.35, - "learning_rate": 3.246964777114716e-05, - "loss": 2.3752, - "step": 201050 - }, - { - "epoch": 0.35, - "learning_rate": 3.2468775831220334e-05, - "loss": 2.3823, - "step": 201060 - }, - { - "epoch": 0.35, - "learning_rate": 3.2467903891293505e-05, - "loss": 2.4281, - "step": 201070 - }, - { - "epoch": 0.35, - "learning_rate": 3.2467031951366675e-05, - "loss": 2.4507, - "step": 201080 - }, - { - "epoch": 0.35, - "learning_rate": 3.246616001143985e-05, - "loss": 2.4033, - "step": 201090 - }, - { - "epoch": 0.35, - "learning_rate": 3.246528807151303e-05, - "loss": 2.4424, - "step": 201100 - }, - { - "epoch": 0.35, - "learning_rate": 3.24644161315862e-05, - "loss": 2.4155, - "step": 201110 - }, - { - "epoch": 0.35, - "learning_rate": 3.246354419165937e-05, - "loss": 2.4169, - "step": 201120 - }, - { - "epoch": 0.35, - "learning_rate": 3.246267225173255e-05, - "loss": 2.3678, - "step": 201130 - }, - { - "epoch": 0.35, - "learning_rate": 3.246180031180572e-05, - "loss": 2.3108, - "step": 201140 - }, - { - "epoch": 0.35, - "learning_rate": 3.246092837187889e-05, - "loss": 2.5288, - "step": 201150 - }, - { - "epoch": 0.35, - "learning_rate": 3.2460056431952065e-05, - "loss": 2.3546, - "step": 201160 - }, - { - "epoch": 0.35, - "learning_rate": 3.245918449202524e-05, - "loss": 2.3813, - "step": 201170 - }, - { - "epoch": 0.35, - "learning_rate": 3.245831255209841e-05, - "loss": 2.3928, - "step": 201180 - }, - { - "epoch": 0.35, - "learning_rate": 3.245744061217158e-05, - "loss": 2.3716, - "step": 201190 - }, - { - "epoch": 0.35, - "learning_rate": 3.245656867224476e-05, - "loss": 2.4358, - "step": 201200 - }, - { - "epoch": 0.35, - "learning_rate": 3.245569673231793e-05, - "loss": 2.3645, - "step": 201210 - }, - { - "epoch": 0.35, - "learning_rate": 3.24548247923911e-05, - "loss": 2.4729, - "step": 201220 - }, - { - "epoch": 0.35, - "learning_rate": 3.245395285246428e-05, - "loss": 2.3615, - "step": 201230 - }, - { - "epoch": 0.35, - "learning_rate": 3.2453080912537456e-05, - "loss": 2.4312, - "step": 201240 - }, - { - "epoch": 0.35, - "learning_rate": 3.2452208972610626e-05, - "loss": 2.3032, - "step": 201250 - }, - { - "epoch": 0.35, - "learning_rate": 3.2451337032683796e-05, - "loss": 2.4882, - "step": 201260 - }, - { - "epoch": 0.35, - "learning_rate": 3.2450465092756973e-05, - "loss": 2.513, - "step": 201270 - }, - { - "epoch": 0.35, - "learning_rate": 3.2449593152830144e-05, - "loss": 2.4526, - "step": 201280 - }, - { - "epoch": 0.35, - "learning_rate": 3.2448721212903314e-05, - "loss": 2.4917, - "step": 201290 - }, - { - "epoch": 0.35, - "learning_rate": 3.244784927297649e-05, - "loss": 2.3853, - "step": 201300 - }, - { - "epoch": 0.35, - "learning_rate": 3.244697733304967e-05, - "loss": 2.3954, - "step": 201310 - }, - { - "epoch": 0.35, - "learning_rate": 3.244610539312284e-05, - "loss": 2.4784, - "step": 201320 - }, - { - "epoch": 0.35, - "learning_rate": 3.244523345319601e-05, - "loss": 2.4022, - "step": 201330 - }, - { - "epoch": 0.35, - "learning_rate": 3.2444361513269186e-05, - "loss": 2.3918, - "step": 201340 - }, - { - "epoch": 0.35, - "learning_rate": 3.244348957334236e-05, - "loss": 2.4944, - "step": 201350 - }, - { - "epoch": 0.35, - "learning_rate": 3.244261763341553e-05, - "loss": 2.6049, - "step": 201360 - }, - { - "epoch": 0.35, - "learning_rate": 3.24417456934887e-05, - "loss": 2.5186, - "step": 201370 - }, - { - "epoch": 0.35, - "learning_rate": 3.2440873753561875e-05, - "loss": 2.4607, - "step": 201380 - }, - { - "epoch": 0.35, - "learning_rate": 3.244000181363505e-05, - "loss": 2.3236, - "step": 201390 - }, - { - "epoch": 0.35, - "learning_rate": 3.243912987370822e-05, - "loss": 2.3682, - "step": 201400 - }, - { - "epoch": 0.35, - "learning_rate": 3.24382579337814e-05, - "loss": 2.5258, - "step": 201410 - }, - { - "epoch": 0.35, - "learning_rate": 3.243738599385457e-05, - "loss": 2.3778, - "step": 201420 - }, - { - "epoch": 0.35, - "learning_rate": 3.243651405392774e-05, - "loss": 2.3834, - "step": 201430 - }, - { - "epoch": 0.35, - "learning_rate": 3.243564211400091e-05, - "loss": 2.4949, - "step": 201440 - }, - { - "epoch": 0.35, - "learning_rate": 3.243477017407409e-05, - "loss": 2.4027, - "step": 201450 - }, - { - "epoch": 0.35, - "learning_rate": 3.2433898234147265e-05, - "loss": 2.4303, - "step": 201460 - }, - { - "epoch": 0.35, - "learning_rate": 3.2433026294220435e-05, - "loss": 2.4754, - "step": 201470 - }, - { - "epoch": 0.35, - "learning_rate": 3.2432154354293606e-05, - "loss": 2.281, - "step": 201480 - }, - { - "epoch": 0.35, - "learning_rate": 3.243128241436678e-05, - "loss": 2.4382, - "step": 201490 - }, - { - "epoch": 0.35, - "learning_rate": 3.243041047443995e-05, - "loss": 2.2203, - "step": 201500 - }, - { - "epoch": 0.35, - "learning_rate": 3.2429538534513124e-05, - "loss": 2.4512, - "step": 201510 - }, - { - "epoch": 0.35, - "learning_rate": 3.24286665945863e-05, - "loss": 2.3811, - "step": 201520 - }, - { - "epoch": 0.35, - "learning_rate": 3.242779465465948e-05, - "loss": 2.3694, - "step": 201530 - }, - { - "epoch": 0.35, - "learning_rate": 3.242692271473265e-05, - "loss": 2.5255, - "step": 201540 - }, - { - "epoch": 0.35, - "learning_rate": 3.242605077480582e-05, - "loss": 2.4703, - "step": 201550 - }, - { - "epoch": 0.35, - "learning_rate": 3.2425178834878996e-05, - "loss": 2.5133, - "step": 201560 - }, - { - "epoch": 0.35, - "learning_rate": 3.2424306894952166e-05, - "loss": 2.3681, - "step": 201570 - }, - { - "epoch": 0.35, - "learning_rate": 3.2423434955025337e-05, - "loss": 2.3794, - "step": 201580 - }, - { - "epoch": 0.35, - "learning_rate": 3.2422563015098514e-05, - "loss": 2.4627, - "step": 201590 - }, - { - "epoch": 0.35, - "learning_rate": 3.2421691075171684e-05, - "loss": 2.4418, - "step": 201600 - }, - { - "epoch": 0.35, - "learning_rate": 3.242081913524486e-05, - "loss": 2.38, - "step": 201610 - }, - { - "epoch": 0.35, - "learning_rate": 3.241994719531803e-05, - "loss": 2.3085, - "step": 201620 - }, - { - "epoch": 0.35, - "learning_rate": 3.241907525539121e-05, - "loss": 2.4332, - "step": 201630 - }, - { - "epoch": 0.35, - "learning_rate": 3.241820331546438e-05, - "loss": 2.489, - "step": 201640 - }, - { - "epoch": 0.35, - "learning_rate": 3.241733137553755e-05, - "loss": 2.4621, - "step": 201650 - }, - { - "epoch": 0.35, - "learning_rate": 3.241645943561073e-05, - "loss": 2.3413, - "step": 201660 - }, - { - "epoch": 0.35, - "learning_rate": 3.24155874956839e-05, - "loss": 2.2316, - "step": 201670 - }, - { - "epoch": 0.35, - "learning_rate": 3.2414715555757074e-05, - "loss": 2.3554, - "step": 201680 - }, - { - "epoch": 0.35, - "learning_rate": 3.2413843615830245e-05, - "loss": 2.5251, - "step": 201690 - }, - { - "epoch": 0.35, - "learning_rate": 3.241297167590342e-05, - "loss": 2.3847, - "step": 201700 - }, - { - "epoch": 0.35, - "learning_rate": 3.241209973597659e-05, - "loss": 2.4042, - "step": 201710 - }, - { - "epoch": 0.35, - "learning_rate": 3.241122779604976e-05, - "loss": 2.3598, - "step": 201720 - }, - { - "epoch": 0.35, - "learning_rate": 3.241035585612294e-05, - "loss": 2.4446, - "step": 201730 - }, - { - "epoch": 0.35, - "learning_rate": 3.240948391619611e-05, - "loss": 2.3335, - "step": 201740 - }, - { - "epoch": 0.35, - "learning_rate": 3.240861197626928e-05, - "loss": 2.4473, - "step": 201750 - }, - { - "epoch": 0.35, - "learning_rate": 3.240774003634246e-05, - "loss": 2.3514, - "step": 201760 - }, - { - "epoch": 0.35, - "learning_rate": 3.2406868096415635e-05, - "loss": 2.4963, - "step": 201770 - }, - { - "epoch": 0.35, - "learning_rate": 3.2405996156488805e-05, - "loss": 2.4546, - "step": 201780 - }, - { - "epoch": 0.35, - "learning_rate": 3.2405124216561976e-05, - "loss": 2.4747, - "step": 201790 - }, - { - "epoch": 0.35, - "learning_rate": 3.240425227663515e-05, - "loss": 2.4181, - "step": 201800 - }, - { - "epoch": 0.35, - "learning_rate": 3.240338033670832e-05, - "loss": 2.4214, - "step": 201810 - }, - { - "epoch": 0.35, - "learning_rate": 3.2402508396781494e-05, - "loss": 2.4848, - "step": 201820 - }, - { - "epoch": 0.35, - "learning_rate": 3.240163645685467e-05, - "loss": 2.4386, - "step": 201830 - }, - { - "epoch": 0.35, - "learning_rate": 3.240076451692785e-05, - "loss": 2.3804, - "step": 201840 - }, - { - "epoch": 0.35, - "learning_rate": 3.239989257700102e-05, - "loss": 2.3736, - "step": 201850 - }, - { - "epoch": 0.35, - "learning_rate": 3.239902063707419e-05, - "loss": 2.4183, - "step": 201860 - }, - { - "epoch": 0.35, - "learning_rate": 3.2398148697147366e-05, - "loss": 2.4921, - "step": 201870 - }, - { - "epoch": 0.35, - "learning_rate": 3.2397276757220536e-05, - "loss": 2.4321, - "step": 201880 - }, - { - "epoch": 0.35, - "learning_rate": 3.2396404817293707e-05, - "loss": 2.4125, - "step": 201890 - }, - { - "epoch": 0.35, - "learning_rate": 3.239553287736688e-05, - "loss": 2.386, - "step": 201900 - }, - { - "epoch": 0.35, - "learning_rate": 3.239466093744006e-05, - "loss": 2.3718, - "step": 201910 - }, - { - "epoch": 0.35, - "learning_rate": 3.239378899751323e-05, - "loss": 2.4983, - "step": 201920 - }, - { - "epoch": 0.35, - "learning_rate": 3.23929170575864e-05, - "loss": 2.4627, - "step": 201930 - }, - { - "epoch": 0.35, - "learning_rate": 3.239204511765957e-05, - "loss": 2.4486, - "step": 201940 - }, - { - "epoch": 0.35, - "learning_rate": 3.239117317773275e-05, - "loss": 2.34, - "step": 201950 - }, - { - "epoch": 0.35, - "learning_rate": 3.239030123780592e-05, - "loss": 2.4307, - "step": 201960 - }, - { - "epoch": 0.35, - "learning_rate": 3.238942929787909e-05, - "loss": 2.3929, - "step": 201970 - }, - { - "epoch": 0.35, - "learning_rate": 3.2388557357952274e-05, - "loss": 2.4342, - "step": 201980 - }, - { - "epoch": 0.35, - "learning_rate": 3.2387685418025444e-05, - "loss": 2.2701, - "step": 201990 - }, - { - "epoch": 0.35, - "learning_rate": 3.2386813478098615e-05, - "loss": 2.3773, - "step": 202000 - }, - { - "epoch": 0.35, - "learning_rate": 3.2385941538171785e-05, - "loss": 2.2789, - "step": 202010 - }, - { - "epoch": 0.35, - "learning_rate": 3.238506959824496e-05, - "loss": 2.338, - "step": 202020 - }, - { - "epoch": 0.35, - "learning_rate": 3.238419765831813e-05, - "loss": 2.4533, - "step": 202030 - }, - { - "epoch": 0.35, - "learning_rate": 3.23833257183913e-05, - "loss": 2.4273, - "step": 202040 - }, - { - "epoch": 0.35, - "learning_rate": 3.238245377846448e-05, - "loss": 2.3155, - "step": 202050 - }, - { - "epoch": 0.35, - "learning_rate": 3.238158183853766e-05, - "loss": 2.3899, - "step": 202060 - }, - { - "epoch": 0.35, - "learning_rate": 3.238070989861083e-05, - "loss": 2.4386, - "step": 202070 - }, - { - "epoch": 0.35, - "learning_rate": 3.2379837958684e-05, - "loss": 2.4283, - "step": 202080 - }, - { - "epoch": 0.35, - "learning_rate": 3.2378966018757175e-05, - "loss": 2.4419, - "step": 202090 - }, - { - "epoch": 0.35, - "learning_rate": 3.2378094078830346e-05, - "loss": 2.4818, - "step": 202100 - }, - { - "epoch": 0.35, - "learning_rate": 3.2377222138903516e-05, - "loss": 2.418, - "step": 202110 - }, - { - "epoch": 0.35, - "learning_rate": 3.237635019897669e-05, - "loss": 2.4851, - "step": 202120 - }, - { - "epoch": 0.35, - "learning_rate": 3.237547825904987e-05, - "loss": 2.4878, - "step": 202130 - }, - { - "epoch": 0.35, - "learning_rate": 3.237460631912304e-05, - "loss": 2.3674, - "step": 202140 - }, - { - "epoch": 0.35, - "learning_rate": 3.237373437919621e-05, - "loss": 2.314, - "step": 202150 - }, - { - "epoch": 0.35, - "learning_rate": 3.237286243926939e-05, - "loss": 2.4007, - "step": 202160 - }, - { - "epoch": 0.35, - "learning_rate": 3.237199049934256e-05, - "loss": 2.4175, - "step": 202170 - }, - { - "epoch": 0.35, - "learning_rate": 3.237111855941573e-05, - "loss": 2.4046, - "step": 202180 - }, - { - "epoch": 0.35, - "learning_rate": 3.2370246619488906e-05, - "loss": 2.3138, - "step": 202190 - }, - { - "epoch": 0.35, - "learning_rate": 3.236937467956208e-05, - "loss": 2.4456, - "step": 202200 - }, - { - "epoch": 0.35, - "learning_rate": 3.2368502739635254e-05, - "loss": 2.4531, - "step": 202210 - }, - { - "epoch": 0.35, - "learning_rate": 3.2367630799708424e-05, - "loss": 2.4124, - "step": 202220 - }, - { - "epoch": 0.35, - "learning_rate": 3.23667588597816e-05, - "loss": 2.3967, - "step": 202230 - }, - { - "epoch": 0.35, - "learning_rate": 3.236588691985477e-05, - "loss": 2.4926, - "step": 202240 - }, - { - "epoch": 0.35, - "learning_rate": 3.236501497992794e-05, - "loss": 2.3153, - "step": 202250 - }, - { - "epoch": 0.35, - "learning_rate": 3.236414304000112e-05, - "loss": 2.4156, - "step": 202260 - }, - { - "epoch": 0.35, - "learning_rate": 3.236327110007429e-05, - "loss": 2.4385, - "step": 202270 - }, - { - "epoch": 0.35, - "learning_rate": 3.2362399160147467e-05, - "loss": 2.3051, - "step": 202280 - }, - { - "epoch": 0.35, - "learning_rate": 3.236152722022064e-05, - "loss": 2.4096, - "step": 202290 - }, - { - "epoch": 0.35, - "learning_rate": 3.2360655280293814e-05, - "loss": 2.3712, - "step": 202300 - }, - { - "epoch": 0.35, - "learning_rate": 3.2359783340366985e-05, - "loss": 2.5039, - "step": 202310 - }, - { - "epoch": 0.35, - "learning_rate": 3.2358911400440155e-05, - "loss": 2.3538, - "step": 202320 - }, - { - "epoch": 0.35, - "learning_rate": 3.2358039460513325e-05, - "loss": 2.3654, - "step": 202330 - }, - { - "epoch": 0.35, - "learning_rate": 3.23571675205865e-05, - "loss": 2.4158, - "step": 202340 - }, - { - "epoch": 0.35, - "learning_rate": 3.235629558065968e-05, - "loss": 2.295, - "step": 202350 - }, - { - "epoch": 0.35, - "learning_rate": 3.235542364073285e-05, - "loss": 2.37, - "step": 202360 - }, - { - "epoch": 0.35, - "learning_rate": 3.235455170080603e-05, - "loss": 2.4822, - "step": 202370 - }, - { - "epoch": 0.35, - "learning_rate": 3.23536797608792e-05, - "loss": 2.366, - "step": 202380 - }, - { - "epoch": 0.35, - "learning_rate": 3.235280782095237e-05, - "loss": 2.359, - "step": 202390 - }, - { - "epoch": 0.35, - "learning_rate": 3.235193588102554e-05, - "loss": 2.4812, - "step": 202400 - }, - { - "epoch": 0.35, - "learning_rate": 3.2351063941098715e-05, - "loss": 2.4373, - "step": 202410 - }, - { - "epoch": 0.35, - "learning_rate": 3.2350192001171886e-05, - "loss": 2.3575, - "step": 202420 - }, - { - "epoch": 0.35, - "learning_rate": 3.234932006124506e-05, - "loss": 2.3987, - "step": 202430 - }, - { - "epoch": 0.35, - "learning_rate": 3.234844812131823e-05, - "loss": 2.553, - "step": 202440 - }, - { - "epoch": 0.35, - "learning_rate": 3.234757618139141e-05, - "loss": 2.3915, - "step": 202450 - }, - { - "epoch": 0.35, - "learning_rate": 3.234670424146458e-05, - "loss": 2.4228, - "step": 202460 - }, - { - "epoch": 0.35, - "learning_rate": 3.234583230153775e-05, - "loss": 2.4015, - "step": 202470 - }, - { - "epoch": 0.35, - "learning_rate": 3.234496036161093e-05, - "loss": 2.4981, - "step": 202480 - }, - { - "epoch": 0.35, - "learning_rate": 3.23440884216841e-05, - "loss": 2.3373, - "step": 202490 - }, - { - "epoch": 0.35, - "learning_rate": 3.2343216481757276e-05, - "loss": 2.3354, - "step": 202500 - }, - { - "epoch": 0.35, - "learning_rate": 3.2342344541830446e-05, - "loss": 2.4393, - "step": 202510 - }, - { - "epoch": 0.35, - "learning_rate": 3.2341472601903624e-05, - "loss": 2.4996, - "step": 202520 - }, - { - "epoch": 0.35, - "learning_rate": 3.2340600661976794e-05, - "loss": 2.3782, - "step": 202530 - }, - { - "epoch": 0.35, - "learning_rate": 3.2339728722049964e-05, - "loss": 2.4083, - "step": 202540 - }, - { - "epoch": 0.35, - "learning_rate": 3.233885678212314e-05, - "loss": 2.459, - "step": 202550 - }, - { - "epoch": 0.35, - "learning_rate": 3.233798484219631e-05, - "loss": 2.4184, - "step": 202560 - }, - { - "epoch": 0.35, - "learning_rate": 3.233711290226948e-05, - "loss": 2.3561, - "step": 202570 - }, - { - "epoch": 0.35, - "learning_rate": 3.233624096234266e-05, - "loss": 2.4403, - "step": 202580 - }, - { - "epoch": 0.35, - "learning_rate": 3.2335369022415837e-05, - "loss": 2.4345, - "step": 202590 - }, - { - "epoch": 0.35, - "learning_rate": 3.233449708248901e-05, - "loss": 2.3534, - "step": 202600 - }, - { - "epoch": 0.35, - "learning_rate": 3.233362514256218e-05, - "loss": 2.3854, - "step": 202610 - }, - { - "epoch": 0.35, - "learning_rate": 3.2332753202635354e-05, - "loss": 2.4893, - "step": 202620 - }, - { - "epoch": 0.35, - "learning_rate": 3.2331881262708525e-05, - "loss": 2.5185, - "step": 202630 - }, - { - "epoch": 0.35, - "learning_rate": 3.2331009322781695e-05, - "loss": 2.554, - "step": 202640 - }, - { - "epoch": 0.35, - "learning_rate": 3.233013738285487e-05, - "loss": 2.3962, - "step": 202650 - }, - { - "epoch": 0.35, - "learning_rate": 3.232926544292805e-05, - "loss": 2.4047, - "step": 202660 - }, - { - "epoch": 0.35, - "learning_rate": 3.232839350300122e-05, - "loss": 2.4358, - "step": 202670 - }, - { - "epoch": 0.35, - "learning_rate": 3.232752156307439e-05, - "loss": 2.4621, - "step": 202680 - }, - { - "epoch": 0.35, - "learning_rate": 3.232664962314757e-05, - "loss": 2.4004, - "step": 202690 - }, - { - "epoch": 0.35, - "learning_rate": 3.232577768322074e-05, - "loss": 2.3807, - "step": 202700 - }, - { - "epoch": 0.35, - "learning_rate": 3.232490574329391e-05, - "loss": 2.4454, - "step": 202710 - }, - { - "epoch": 0.35, - "learning_rate": 3.2324033803367085e-05, - "loss": 2.3777, - "step": 202720 - }, - { - "epoch": 0.35, - "learning_rate": 3.232316186344026e-05, - "loss": 2.4031, - "step": 202730 - }, - { - "epoch": 0.35, - "learning_rate": 3.232228992351343e-05, - "loss": 2.4452, - "step": 202740 - }, - { - "epoch": 0.35, - "learning_rate": 3.23214179835866e-05, - "loss": 2.4067, - "step": 202750 - }, - { - "epoch": 0.35, - "learning_rate": 3.232054604365978e-05, - "loss": 2.3668, - "step": 202760 - }, - { - "epoch": 0.35, - "learning_rate": 3.231967410373295e-05, - "loss": 2.4116, - "step": 202770 - }, - { - "epoch": 0.35, - "learning_rate": 3.231880216380612e-05, - "loss": 2.3657, - "step": 202780 - }, - { - "epoch": 0.35, - "learning_rate": 3.231793022387929e-05, - "loss": 2.3823, - "step": 202790 - }, - { - "epoch": 0.35, - "learning_rate": 3.2317058283952476e-05, - "loss": 2.5166, - "step": 202800 - }, - { - "epoch": 0.35, - "learning_rate": 3.2316186344025646e-05, - "loss": 2.4353, - "step": 202810 - }, - { - "epoch": 0.35, - "learning_rate": 3.2315314404098816e-05, - "loss": 2.4749, - "step": 202820 - }, - { - "epoch": 0.35, - "learning_rate": 3.231444246417199e-05, - "loss": 2.4003, - "step": 202830 - }, - { - "epoch": 0.35, - "learning_rate": 3.2313570524245164e-05, - "loss": 2.3324, - "step": 202840 - }, - { - "epoch": 0.35, - "learning_rate": 3.2312698584318334e-05, - "loss": 2.448, - "step": 202850 - }, - { - "epoch": 0.35, - "learning_rate": 3.2311826644391505e-05, - "loss": 2.3531, - "step": 202860 - }, - { - "epoch": 0.35, - "learning_rate": 3.231095470446469e-05, - "loss": 2.3562, - "step": 202870 - }, - { - "epoch": 0.35, - "learning_rate": 3.231008276453786e-05, - "loss": 2.429, - "step": 202880 - }, - { - "epoch": 0.35, - "learning_rate": 3.230921082461103e-05, - "loss": 2.4637, - "step": 202890 - }, - { - "epoch": 0.35, - "learning_rate": 3.23083388846842e-05, - "loss": 2.4482, - "step": 202900 - }, - { - "epoch": 0.35, - "learning_rate": 3.230746694475738e-05, - "loss": 2.2619, - "step": 202910 - }, - { - "epoch": 0.35, - "learning_rate": 3.230659500483055e-05, - "loss": 2.3817, - "step": 202920 - }, - { - "epoch": 0.35, - "learning_rate": 3.230572306490372e-05, - "loss": 2.4484, - "step": 202930 - }, - { - "epoch": 0.35, - "learning_rate": 3.2304851124976895e-05, - "loss": 2.4728, - "step": 202940 - }, - { - "epoch": 0.35, - "learning_rate": 3.230397918505007e-05, - "loss": 2.3688, - "step": 202950 - }, - { - "epoch": 0.35, - "learning_rate": 3.230310724512324e-05, - "loss": 2.2871, - "step": 202960 - }, - { - "epoch": 0.35, - "learning_rate": 3.230223530519641e-05, - "loss": 2.4209, - "step": 202970 - }, - { - "epoch": 0.35, - "learning_rate": 3.230136336526959e-05, - "loss": 2.3582, - "step": 202980 - }, - { - "epoch": 0.35, - "learning_rate": 3.230049142534276e-05, - "loss": 2.4804, - "step": 202990 - }, - { - "epoch": 0.35, - "learning_rate": 3.229961948541593e-05, - "loss": 2.4255, - "step": 203000 - }, - { - "epoch": 0.35, - "learning_rate": 3.229874754548911e-05, - "loss": 2.3366, - "step": 203010 - }, - { - "epoch": 0.35, - "learning_rate": 3.2297875605562285e-05, - "loss": 2.3974, - "step": 203020 - }, - { - "epoch": 0.35, - "learning_rate": 3.2297003665635455e-05, - "loss": 2.3461, - "step": 203030 - }, - { - "epoch": 0.35, - "learning_rate": 3.2296131725708626e-05, - "loss": 2.4049, - "step": 203040 - }, - { - "epoch": 0.35, - "learning_rate": 3.22952597857818e-05, - "loss": 2.4426, - "step": 203050 - }, - { - "epoch": 0.35, - "learning_rate": 3.229438784585497e-05, - "loss": 2.6098, - "step": 203060 - }, - { - "epoch": 0.35, - "learning_rate": 3.2293515905928144e-05, - "loss": 2.3895, - "step": 203070 - }, - { - "epoch": 0.35, - "learning_rate": 3.229264396600132e-05, - "loss": 2.4299, - "step": 203080 - }, - { - "epoch": 0.35, - "learning_rate": 3.229177202607449e-05, - "loss": 2.5059, - "step": 203090 - }, - { - "epoch": 0.35, - "learning_rate": 3.229090008614767e-05, - "loss": 2.4061, - "step": 203100 - }, - { - "epoch": 0.35, - "learning_rate": 3.229002814622084e-05, - "loss": 2.4935, - "step": 203110 - }, - { - "epoch": 0.35, - "learning_rate": 3.2289156206294016e-05, - "loss": 2.2173, - "step": 203120 - }, - { - "epoch": 0.35, - "learning_rate": 3.2288284266367186e-05, - "loss": 2.3327, - "step": 203130 - }, - { - "epoch": 0.35, - "learning_rate": 3.2287412326440357e-05, - "loss": 2.4351, - "step": 203140 - }, - { - "epoch": 0.35, - "learning_rate": 3.2286540386513534e-05, - "loss": 2.4924, - "step": 203150 - }, - { - "epoch": 0.35, - "learning_rate": 3.2285668446586704e-05, - "loss": 2.3331, - "step": 203160 - }, - { - "epoch": 0.35, - "learning_rate": 3.228479650665988e-05, - "loss": 2.4122, - "step": 203170 - }, - { - "epoch": 0.35, - "learning_rate": 3.228392456673305e-05, - "loss": 2.423, - "step": 203180 - }, - { - "epoch": 0.35, - "learning_rate": 3.228305262680623e-05, - "loss": 2.5257, - "step": 203190 - }, - { - "epoch": 0.35, - "learning_rate": 3.22821806868794e-05, - "loss": 2.4978, - "step": 203200 - }, - { - "epoch": 0.35, - "learning_rate": 3.228130874695257e-05, - "loss": 2.4109, - "step": 203210 - }, - { - "epoch": 0.35, - "learning_rate": 3.228043680702575e-05, - "loss": 2.3598, - "step": 203220 - }, - { - "epoch": 0.35, - "learning_rate": 3.227956486709892e-05, - "loss": 2.5092, - "step": 203230 - }, - { - "epoch": 0.35, - "learning_rate": 3.227869292717209e-05, - "loss": 2.3613, - "step": 203240 - }, - { - "epoch": 0.35, - "learning_rate": 3.2277820987245265e-05, - "loss": 2.3746, - "step": 203250 - }, - { - "epoch": 0.35, - "learning_rate": 3.227694904731844e-05, - "loss": 2.3131, - "step": 203260 - }, - { - "epoch": 0.35, - "learning_rate": 3.227607710739161e-05, - "loss": 2.5153, - "step": 203270 - }, - { - "epoch": 0.35, - "learning_rate": 3.227520516746478e-05, - "loss": 2.4182, - "step": 203280 - }, - { - "epoch": 0.35, - "learning_rate": 3.227433322753795e-05, - "loss": 2.4106, - "step": 203290 - }, - { - "epoch": 0.35, - "learning_rate": 3.227346128761113e-05, - "loss": 2.3502, - "step": 203300 - }, - { - "epoch": 0.35, - "learning_rate": 3.22725893476843e-05, - "loss": 2.401, - "step": 203310 - }, - { - "epoch": 0.35, - "learning_rate": 3.227171740775748e-05, - "loss": 2.418, - "step": 203320 - }, - { - "epoch": 0.35, - "learning_rate": 3.2270845467830655e-05, - "loss": 2.2494, - "step": 203330 - }, - { - "epoch": 0.35, - "learning_rate": 3.2269973527903825e-05, - "loss": 2.3566, - "step": 203340 - }, - { - "epoch": 0.35, - "learning_rate": 3.2269101587976996e-05, - "loss": 2.4247, - "step": 203350 - }, - { - "epoch": 0.35, - "learning_rate": 3.2268229648050166e-05, - "loss": 2.4335, - "step": 203360 - }, - { - "epoch": 0.35, - "learning_rate": 3.226735770812334e-05, - "loss": 2.3699, - "step": 203370 - }, - { - "epoch": 0.35, - "learning_rate": 3.2266485768196514e-05, - "loss": 2.4133, - "step": 203380 - }, - { - "epoch": 0.35, - "learning_rate": 3.226561382826969e-05, - "loss": 2.4559, - "step": 203390 - }, - { - "epoch": 0.35, - "learning_rate": 3.226474188834286e-05, - "loss": 2.3513, - "step": 203400 - }, - { - "epoch": 0.35, - "learning_rate": 3.226386994841604e-05, - "loss": 2.4937, - "step": 203410 - }, - { - "epoch": 0.35, - "learning_rate": 3.226299800848921e-05, - "loss": 2.4737, - "step": 203420 - }, - { - "epoch": 0.35, - "learning_rate": 3.226212606856238e-05, - "loss": 2.4162, - "step": 203430 - }, - { - "epoch": 0.35, - "learning_rate": 3.2261254128635556e-05, - "loss": 2.3584, - "step": 203440 - }, - { - "epoch": 0.35, - "learning_rate": 3.2260382188708727e-05, - "loss": 2.339, - "step": 203450 - }, - { - "epoch": 0.35, - "learning_rate": 3.22595102487819e-05, - "loss": 2.351, - "step": 203460 - }, - { - "epoch": 0.35, - "learning_rate": 3.2258638308855074e-05, - "loss": 2.372, - "step": 203470 - }, - { - "epoch": 0.35, - "learning_rate": 3.225776636892825e-05, - "loss": 2.3025, - "step": 203480 - }, - { - "epoch": 0.35, - "learning_rate": 3.225689442900142e-05, - "loss": 2.3287, - "step": 203490 - }, - { - "epoch": 0.35, - "learning_rate": 3.225602248907459e-05, - "loss": 2.42, - "step": 203500 - }, - { - "epoch": 0.35, - "learning_rate": 3.225515054914777e-05, - "loss": 2.4611, - "step": 203510 - }, - { - "epoch": 0.35, - "learning_rate": 3.225427860922094e-05, - "loss": 2.4427, - "step": 203520 - }, - { - "epoch": 0.35, - "learning_rate": 3.225340666929411e-05, - "loss": 2.3682, - "step": 203530 - }, - { - "epoch": 0.35, - "learning_rate": 3.225253472936729e-05, - "loss": 2.3323, - "step": 203540 - }, - { - "epoch": 0.35, - "learning_rate": 3.2251662789440464e-05, - "loss": 2.3887, - "step": 203550 - }, - { - "epoch": 0.35, - "learning_rate": 3.2250790849513635e-05, - "loss": 2.5595, - "step": 203560 - }, - { - "epoch": 0.36, - "learning_rate": 3.2249918909586805e-05, - "loss": 2.4039, - "step": 203570 - }, - { - "epoch": 0.36, - "learning_rate": 3.224904696965998e-05, - "loss": 2.4151, - "step": 203580 - }, - { - "epoch": 0.36, - "learning_rate": 3.224817502973315e-05, - "loss": 2.3732, - "step": 203590 - }, - { - "epoch": 0.36, - "learning_rate": 3.224730308980632e-05, - "loss": 2.3595, - "step": 203600 - }, - { - "epoch": 0.36, - "learning_rate": 3.22464311498795e-05, - "loss": 2.5053, - "step": 203610 - }, - { - "epoch": 0.36, - "learning_rate": 3.224555920995268e-05, - "loss": 2.434, - "step": 203620 - }, - { - "epoch": 0.36, - "learning_rate": 3.224468727002585e-05, - "loss": 2.3947, - "step": 203630 - }, - { - "epoch": 0.36, - "learning_rate": 3.224381533009902e-05, - "loss": 2.466, - "step": 203640 - }, - { - "epoch": 0.36, - "learning_rate": 3.2242943390172195e-05, - "loss": 2.2854, - "step": 203650 - }, - { - "epoch": 0.36, - "learning_rate": 3.2242071450245366e-05, - "loss": 2.4452, - "step": 203660 - }, - { - "epoch": 0.36, - "learning_rate": 3.2241199510318536e-05, - "loss": 2.4592, - "step": 203670 - }, - { - "epoch": 0.36, - "learning_rate": 3.2240327570391706e-05, - "loss": 2.388, - "step": 203680 - }, - { - "epoch": 0.36, - "learning_rate": 3.223945563046489e-05, - "loss": 2.3522, - "step": 203690 - }, - { - "epoch": 0.36, - "learning_rate": 3.223858369053806e-05, - "loss": 2.4029, - "step": 203700 - }, - { - "epoch": 0.36, - "learning_rate": 3.223771175061123e-05, - "loss": 2.4648, - "step": 203710 - }, - { - "epoch": 0.36, - "learning_rate": 3.223683981068441e-05, - "loss": 2.52, - "step": 203720 - }, - { - "epoch": 0.36, - "learning_rate": 3.223596787075758e-05, - "loss": 2.2897, - "step": 203730 - }, - { - "epoch": 0.36, - "learning_rate": 3.223509593083075e-05, - "loss": 2.4578, - "step": 203740 - }, - { - "epoch": 0.36, - "learning_rate": 3.223422399090392e-05, - "loss": 2.4215, - "step": 203750 - }, - { - "epoch": 0.36, - "learning_rate": 3.2233352050977096e-05, - "loss": 2.3833, - "step": 203760 - }, - { - "epoch": 0.36, - "learning_rate": 3.2232480111050274e-05, - "loss": 2.4098, - "step": 203770 - }, - { - "epoch": 0.36, - "learning_rate": 3.2231608171123444e-05, - "loss": 2.3018, - "step": 203780 - }, - { - "epoch": 0.36, - "learning_rate": 3.2230736231196614e-05, - "loss": 2.3939, - "step": 203790 - }, - { - "epoch": 0.36, - "learning_rate": 3.222986429126979e-05, - "loss": 2.3346, - "step": 203800 - }, - { - "epoch": 0.36, - "learning_rate": 3.222899235134296e-05, - "loss": 2.4914, - "step": 203810 - }, - { - "epoch": 0.36, - "learning_rate": 3.222812041141613e-05, - "loss": 2.4602, - "step": 203820 - }, - { - "epoch": 0.36, - "learning_rate": 3.222724847148931e-05, - "loss": 2.4321, - "step": 203830 - }, - { - "epoch": 0.36, - "learning_rate": 3.222637653156249e-05, - "loss": 2.4817, - "step": 203840 - }, - { - "epoch": 0.36, - "learning_rate": 3.222550459163566e-05, - "loss": 2.374, - "step": 203850 - }, - { - "epoch": 0.36, - "learning_rate": 3.222463265170883e-05, - "loss": 2.3671, - "step": 203860 - }, - { - "epoch": 0.36, - "learning_rate": 3.2223760711782005e-05, - "loss": 2.3589, - "step": 203870 - }, - { - "epoch": 0.36, - "learning_rate": 3.2222888771855175e-05, - "loss": 2.426, - "step": 203880 - }, - { - "epoch": 0.36, - "learning_rate": 3.2222016831928345e-05, - "loss": 2.4198, - "step": 203890 - }, - { - "epoch": 0.36, - "learning_rate": 3.222114489200152e-05, - "loss": 2.4484, - "step": 203900 - }, - { - "epoch": 0.36, - "learning_rate": 3.222027295207469e-05, - "loss": 2.4851, - "step": 203910 - }, - { - "epoch": 0.36, - "learning_rate": 3.221940101214787e-05, - "loss": 2.3949, - "step": 203920 - }, - { - "epoch": 0.36, - "learning_rate": 3.221852907222104e-05, - "loss": 2.5058, - "step": 203930 - }, - { - "epoch": 0.36, - "learning_rate": 3.221765713229422e-05, - "loss": 2.3946, - "step": 203940 - }, - { - "epoch": 0.36, - "learning_rate": 3.221678519236739e-05, - "loss": 2.3741, - "step": 203950 - }, - { - "epoch": 0.36, - "learning_rate": 3.221591325244056e-05, - "loss": 2.4569, - "step": 203960 - }, - { - "epoch": 0.36, - "learning_rate": 3.2215041312513735e-05, - "loss": 2.3288, - "step": 203970 - }, - { - "epoch": 0.36, - "learning_rate": 3.2214169372586906e-05, - "loss": 2.4244, - "step": 203980 - }, - { - "epoch": 0.36, - "learning_rate": 3.221329743266008e-05, - "loss": 2.4652, - "step": 203990 - }, - { - "epoch": 0.36, - "learning_rate": 3.221242549273325e-05, - "loss": 2.4508, - "step": 204000 - }, - { - "epoch": 0.36, - "learning_rate": 3.221155355280643e-05, - "loss": 2.3453, - "step": 204010 - }, - { - "epoch": 0.36, - "learning_rate": 3.22106816128796e-05, - "loss": 2.3967, - "step": 204020 - }, - { - "epoch": 0.36, - "learning_rate": 3.220980967295277e-05, - "loss": 2.4297, - "step": 204030 - }, - { - "epoch": 0.36, - "learning_rate": 3.220893773302595e-05, - "loss": 2.3522, - "step": 204040 - }, - { - "epoch": 0.36, - "learning_rate": 3.220806579309912e-05, - "loss": 2.3487, - "step": 204050 - }, - { - "epoch": 0.36, - "learning_rate": 3.2207193853172296e-05, - "loss": 2.3988, - "step": 204060 - }, - { - "epoch": 0.36, - "learning_rate": 3.2206321913245466e-05, - "loss": 2.22, - "step": 204070 - }, - { - "epoch": 0.36, - "learning_rate": 3.2205449973318644e-05, - "loss": 2.3798, - "step": 204080 - }, - { - "epoch": 0.36, - "learning_rate": 3.2204578033391814e-05, - "loss": 2.3909, - "step": 204090 - }, - { - "epoch": 0.36, - "learning_rate": 3.2203706093464984e-05, - "loss": 2.4061, - "step": 204100 - }, - { - "epoch": 0.36, - "learning_rate": 3.220283415353816e-05, - "loss": 2.3703, - "step": 204110 - }, - { - "epoch": 0.36, - "learning_rate": 3.220196221361133e-05, - "loss": 2.4229, - "step": 204120 - }, - { - "epoch": 0.36, - "learning_rate": 3.22010902736845e-05, - "loss": 2.4107, - "step": 204130 - }, - { - "epoch": 0.36, - "learning_rate": 3.220021833375768e-05, - "loss": 2.2285, - "step": 204140 - }, - { - "epoch": 0.36, - "learning_rate": 3.2199346393830857e-05, - "loss": 2.4774, - "step": 204150 - }, - { - "epoch": 0.36, - "learning_rate": 3.219847445390403e-05, - "loss": 2.5074, - "step": 204160 - }, - { - "epoch": 0.36, - "learning_rate": 3.21976025139772e-05, - "loss": 2.4143, - "step": 204170 - }, - { - "epoch": 0.36, - "learning_rate": 3.219673057405037e-05, - "loss": 2.4419, - "step": 204180 - }, - { - "epoch": 0.36, - "learning_rate": 3.2195858634123545e-05, - "loss": 2.4282, - "step": 204190 - }, - { - "epoch": 0.36, - "learning_rate": 3.2194986694196715e-05, - "loss": 2.512, - "step": 204200 - }, - { - "epoch": 0.36, - "learning_rate": 3.219411475426989e-05, - "loss": 2.3237, - "step": 204210 - }, - { - "epoch": 0.36, - "learning_rate": 3.219324281434307e-05, - "loss": 2.4317, - "step": 204220 - }, - { - "epoch": 0.36, - "learning_rate": 3.219237087441624e-05, - "loss": 2.4371, - "step": 204230 - }, - { - "epoch": 0.36, - "learning_rate": 3.219149893448941e-05, - "loss": 2.3861, - "step": 204240 - }, - { - "epoch": 0.36, - "learning_rate": 3.219062699456258e-05, - "loss": 2.4251, - "step": 204250 - }, - { - "epoch": 0.36, - "learning_rate": 3.218975505463576e-05, - "loss": 2.3981, - "step": 204260 - }, - { - "epoch": 0.36, - "learning_rate": 3.218888311470893e-05, - "loss": 2.3849, - "step": 204270 - }, - { - "epoch": 0.36, - "learning_rate": 3.21880111747821e-05, - "loss": 2.4491, - "step": 204280 - }, - { - "epoch": 0.36, - "learning_rate": 3.2187139234855276e-05, - "loss": 2.4571, - "step": 204290 - }, - { - "epoch": 0.36, - "learning_rate": 3.218626729492845e-05, - "loss": 2.4905, - "step": 204300 - }, - { - "epoch": 0.36, - "learning_rate": 3.218539535500162e-05, - "loss": 2.4894, - "step": 204310 - }, - { - "epoch": 0.36, - "learning_rate": 3.2184523415074794e-05, - "loss": 2.4818, - "step": 204320 - }, - { - "epoch": 0.36, - "learning_rate": 3.218365147514797e-05, - "loss": 2.4772, - "step": 204330 - }, - { - "epoch": 0.36, - "learning_rate": 3.218277953522114e-05, - "loss": 2.504, - "step": 204340 - }, - { - "epoch": 0.36, - "learning_rate": 3.218190759529431e-05, - "loss": 2.4284, - "step": 204350 - }, - { - "epoch": 0.36, - "learning_rate": 3.218103565536749e-05, - "loss": 2.4503, - "step": 204360 - }, - { - "epoch": 0.36, - "learning_rate": 3.2180163715440666e-05, - "loss": 2.3631, - "step": 204370 - }, - { - "epoch": 0.36, - "learning_rate": 3.2179291775513836e-05, - "loss": 2.3825, - "step": 204380 - }, - { - "epoch": 0.36, - "learning_rate": 3.217841983558701e-05, - "loss": 2.4239, - "step": 204390 - }, - { - "epoch": 0.36, - "learning_rate": 3.2177547895660184e-05, - "loss": 2.3963, - "step": 204400 - }, - { - "epoch": 0.36, - "learning_rate": 3.2176675955733354e-05, - "loss": 2.425, - "step": 204410 - }, - { - "epoch": 0.36, - "learning_rate": 3.2175804015806525e-05, - "loss": 2.3052, - "step": 204420 - }, - { - "epoch": 0.36, - "learning_rate": 3.21749320758797e-05, - "loss": 2.4638, - "step": 204430 - }, - { - "epoch": 0.36, - "learning_rate": 3.217406013595288e-05, - "loss": 2.4068, - "step": 204440 - }, - { - "epoch": 0.36, - "learning_rate": 3.217318819602605e-05, - "loss": 2.5206, - "step": 204450 - }, - { - "epoch": 0.36, - "learning_rate": 3.217231625609922e-05, - "loss": 2.4477, - "step": 204460 - }, - { - "epoch": 0.36, - "learning_rate": 3.21714443161724e-05, - "loss": 2.4418, - "step": 204470 - }, - { - "epoch": 0.36, - "learning_rate": 3.217057237624557e-05, - "loss": 2.6085, - "step": 204480 - }, - { - "epoch": 0.36, - "learning_rate": 3.216970043631874e-05, - "loss": 2.4092, - "step": 204490 - }, - { - "epoch": 0.36, - "learning_rate": 3.2168828496391915e-05, - "loss": 2.3916, - "step": 204500 - }, - { - "epoch": 0.36, - "learning_rate": 3.216795655646509e-05, - "loss": 2.4623, - "step": 204510 - }, - { - "epoch": 0.36, - "learning_rate": 3.216708461653826e-05, - "loss": 2.5044, - "step": 204520 - }, - { - "epoch": 0.36, - "learning_rate": 3.216621267661143e-05, - "loss": 2.3471, - "step": 204530 - }, - { - "epoch": 0.36, - "learning_rate": 3.216534073668461e-05, - "loss": 2.3176, - "step": 204540 - }, - { - "epoch": 0.36, - "learning_rate": 3.216446879675778e-05, - "loss": 2.4662, - "step": 204550 - }, - { - "epoch": 0.36, - "learning_rate": 3.216359685683095e-05, - "loss": 2.4473, - "step": 204560 - }, - { - "epoch": 0.36, - "learning_rate": 3.216272491690413e-05, - "loss": 2.4612, - "step": 204570 - }, - { - "epoch": 0.36, - "learning_rate": 3.2161852976977305e-05, - "loss": 2.4454, - "step": 204580 - }, - { - "epoch": 0.36, - "learning_rate": 3.2160981037050475e-05, - "loss": 2.5055, - "step": 204590 - }, - { - "epoch": 0.36, - "learning_rate": 3.2160109097123646e-05, - "loss": 2.6031, - "step": 204600 - }, - { - "epoch": 0.36, - "learning_rate": 3.215923715719682e-05, - "loss": 2.4223, - "step": 204610 - }, - { - "epoch": 0.36, - "learning_rate": 3.215836521726999e-05, - "loss": 2.5363, - "step": 204620 - }, - { - "epoch": 0.36, - "learning_rate": 3.2157493277343164e-05, - "loss": 2.3929, - "step": 204630 - }, - { - "epoch": 0.36, - "learning_rate": 3.2156621337416334e-05, - "loss": 2.4773, - "step": 204640 - }, - { - "epoch": 0.36, - "learning_rate": 3.215574939748951e-05, - "loss": 2.5391, - "step": 204650 - }, - { - "epoch": 0.36, - "learning_rate": 3.215487745756269e-05, - "loss": 2.4727, - "step": 204660 - }, - { - "epoch": 0.36, - "learning_rate": 3.215400551763586e-05, - "loss": 2.3687, - "step": 204670 - }, - { - "epoch": 0.36, - "learning_rate": 3.2153133577709036e-05, - "loss": 2.2996, - "step": 204680 - }, - { - "epoch": 0.36, - "learning_rate": 3.2152261637782206e-05, - "loss": 2.3644, - "step": 204690 - }, - { - "epoch": 0.36, - "learning_rate": 3.215138969785538e-05, - "loss": 2.34, - "step": 204700 - }, - { - "epoch": 0.36, - "learning_rate": 3.215051775792855e-05, - "loss": 2.2241, - "step": 204710 - }, - { - "epoch": 0.36, - "learning_rate": 3.2149645818001724e-05, - "loss": 2.4408, - "step": 204720 - }, - { - "epoch": 0.36, - "learning_rate": 3.21487738780749e-05, - "loss": 2.4375, - "step": 204730 - }, - { - "epoch": 0.36, - "learning_rate": 3.214790193814807e-05, - "loss": 2.4367, - "step": 204740 - }, - { - "epoch": 0.36, - "learning_rate": 3.214702999822124e-05, - "loss": 2.3915, - "step": 204750 - }, - { - "epoch": 0.36, - "learning_rate": 3.214615805829442e-05, - "loss": 2.4747, - "step": 204760 - }, - { - "epoch": 0.36, - "learning_rate": 3.214528611836759e-05, - "loss": 2.4452, - "step": 204770 - }, - { - "epoch": 0.36, - "learning_rate": 3.214441417844076e-05, - "loss": 2.5077, - "step": 204780 - }, - { - "epoch": 0.36, - "learning_rate": 3.214354223851394e-05, - "loss": 2.3176, - "step": 204790 - }, - { - "epoch": 0.36, - "learning_rate": 3.214267029858711e-05, - "loss": 2.3676, - "step": 204800 - }, - { - "epoch": 0.36, - "learning_rate": 3.2141798358660285e-05, - "loss": 2.3398, - "step": 204810 - }, - { - "epoch": 0.36, - "learning_rate": 3.2140926418733455e-05, - "loss": 2.3739, - "step": 204820 - }, - { - "epoch": 0.36, - "learning_rate": 3.214005447880663e-05, - "loss": 2.4678, - "step": 204830 - }, - { - "epoch": 0.36, - "learning_rate": 3.21391825388798e-05, - "loss": 2.4204, - "step": 204840 - }, - { - "epoch": 0.36, - "learning_rate": 3.213831059895297e-05, - "loss": 2.3983, - "step": 204850 - }, - { - "epoch": 0.36, - "learning_rate": 3.213743865902615e-05, - "loss": 2.4578, - "step": 204860 - }, - { - "epoch": 0.36, - "learning_rate": 3.213656671909932e-05, - "loss": 2.4549, - "step": 204870 - }, - { - "epoch": 0.36, - "learning_rate": 3.21356947791725e-05, - "loss": 2.308, - "step": 204880 - }, - { - "epoch": 0.36, - "learning_rate": 3.213482283924567e-05, - "loss": 2.4147, - "step": 204890 - }, - { - "epoch": 0.36, - "learning_rate": 3.2133950899318845e-05, - "loss": 2.3012, - "step": 204900 - }, - { - "epoch": 0.36, - "learning_rate": 3.2133078959392016e-05, - "loss": 2.4941, - "step": 204910 - }, - { - "epoch": 0.36, - "learning_rate": 3.2132207019465186e-05, - "loss": 2.464, - "step": 204920 - }, - { - "epoch": 0.36, - "learning_rate": 3.213133507953836e-05, - "loss": 2.4847, - "step": 204930 - }, - { - "epoch": 0.36, - "learning_rate": 3.2130463139611534e-05, - "loss": 2.356, - "step": 204940 - }, - { - "epoch": 0.36, - "learning_rate": 3.2129591199684704e-05, - "loss": 2.4926, - "step": 204950 - }, - { - "epoch": 0.36, - "learning_rate": 3.212871925975788e-05, - "loss": 2.416, - "step": 204960 - }, - { - "epoch": 0.36, - "learning_rate": 3.212784731983106e-05, - "loss": 2.4901, - "step": 204970 - }, - { - "epoch": 0.36, - "learning_rate": 3.212697537990423e-05, - "loss": 2.386, - "step": 204980 - }, - { - "epoch": 0.36, - "learning_rate": 3.21261034399774e-05, - "loss": 2.411, - "step": 204990 - }, - { - "epoch": 0.36, - "learning_rate": 3.2125231500050576e-05, - "loss": 2.4975, - "step": 205000 - }, - { - "epoch": 0.36, - "learning_rate": 3.2124359560123747e-05, - "loss": 2.4597, - "step": 205010 - }, - { - "epoch": 0.36, - "learning_rate": 3.212348762019692e-05, - "loss": 2.3781, - "step": 205020 - }, - { - "epoch": 0.36, - "learning_rate": 3.2122615680270094e-05, - "loss": 2.344, - "step": 205030 - }, - { - "epoch": 0.36, - "learning_rate": 3.212174374034327e-05, - "loss": 2.4791, - "step": 205040 - }, - { - "epoch": 0.36, - "learning_rate": 3.212087180041644e-05, - "loss": 2.4369, - "step": 205050 - }, - { - "epoch": 0.36, - "learning_rate": 3.211999986048961e-05, - "loss": 2.4544, - "step": 205060 - }, - { - "epoch": 0.36, - "learning_rate": 3.211912792056279e-05, - "loss": 2.4523, - "step": 205070 - }, - { - "epoch": 0.36, - "learning_rate": 3.211825598063596e-05, - "loss": 2.3102, - "step": 205080 - }, - { - "epoch": 0.36, - "learning_rate": 3.211738404070913e-05, - "loss": 2.3949, - "step": 205090 - }, - { - "epoch": 0.36, - "learning_rate": 3.21165121007823e-05, - "loss": 2.3915, - "step": 205100 - }, - { - "epoch": 0.36, - "learning_rate": 3.2115640160855484e-05, - "loss": 2.4835, - "step": 205110 - }, - { - "epoch": 0.36, - "learning_rate": 3.2114768220928655e-05, - "loss": 2.4571, - "step": 205120 - }, - { - "epoch": 0.36, - "learning_rate": 3.2113896281001825e-05, - "loss": 2.4145, - "step": 205130 - }, - { - "epoch": 0.36, - "learning_rate": 3.2113024341074995e-05, - "loss": 2.4523, - "step": 205140 - }, - { - "epoch": 0.36, - "learning_rate": 3.211215240114817e-05, - "loss": 2.4613, - "step": 205150 - }, - { - "epoch": 0.36, - "learning_rate": 3.211128046122134e-05, - "loss": 2.4811, - "step": 205160 - }, - { - "epoch": 0.36, - "learning_rate": 3.211040852129451e-05, - "loss": 2.5162, - "step": 205170 - }, - { - "epoch": 0.36, - "learning_rate": 3.21095365813677e-05, - "loss": 2.3821, - "step": 205180 - }, - { - "epoch": 0.36, - "learning_rate": 3.210866464144087e-05, - "loss": 2.4468, - "step": 205190 - }, - { - "epoch": 0.36, - "learning_rate": 3.210779270151404e-05, - "loss": 2.3566, - "step": 205200 - }, - { - "epoch": 0.36, - "learning_rate": 3.210692076158721e-05, - "loss": 2.4032, - "step": 205210 - }, - { - "epoch": 0.36, - "learning_rate": 3.2106048821660386e-05, - "loss": 2.436, - "step": 205220 - }, - { - "epoch": 0.36, - "learning_rate": 3.2105176881733556e-05, - "loss": 2.4623, - "step": 205230 - }, - { - "epoch": 0.36, - "learning_rate": 3.2104304941806726e-05, - "loss": 2.5085, - "step": 205240 - }, - { - "epoch": 0.36, - "learning_rate": 3.2103433001879903e-05, - "loss": 2.5545, - "step": 205250 - }, - { - "epoch": 0.36, - "learning_rate": 3.210256106195308e-05, - "loss": 2.5158, - "step": 205260 - }, - { - "epoch": 0.36, - "learning_rate": 3.210168912202625e-05, - "loss": 2.3772, - "step": 205270 - }, - { - "epoch": 0.36, - "learning_rate": 3.210081718209942e-05, - "loss": 2.3742, - "step": 205280 - }, - { - "epoch": 0.36, - "learning_rate": 3.20999452421726e-05, - "loss": 2.3735, - "step": 205290 - }, - { - "epoch": 0.36, - "learning_rate": 3.209907330224577e-05, - "loss": 2.4435, - "step": 205300 - }, - { - "epoch": 0.36, - "learning_rate": 3.209820136231894e-05, - "loss": 2.5038, - "step": 205310 - }, - { - "epoch": 0.36, - "learning_rate": 3.2097329422392116e-05, - "loss": 2.4329, - "step": 205320 - }, - { - "epoch": 0.36, - "learning_rate": 3.2096457482465294e-05, - "loss": 2.3991, - "step": 205330 - }, - { - "epoch": 0.36, - "learning_rate": 3.2095585542538464e-05, - "loss": 2.4746, - "step": 205340 - }, - { - "epoch": 0.36, - "learning_rate": 3.2094713602611634e-05, - "loss": 2.4944, - "step": 205350 - }, - { - "epoch": 0.36, - "learning_rate": 3.209384166268481e-05, - "loss": 2.5041, - "step": 205360 - }, - { - "epoch": 0.36, - "learning_rate": 3.209296972275798e-05, - "loss": 2.4942, - "step": 205370 - }, - { - "epoch": 0.36, - "learning_rate": 3.209209778283115e-05, - "loss": 2.3403, - "step": 205380 - }, - { - "epoch": 0.36, - "learning_rate": 3.209122584290433e-05, - "loss": 2.3407, - "step": 205390 - }, - { - "epoch": 0.36, - "learning_rate": 3.209035390297751e-05, - "loss": 2.4883, - "step": 205400 - }, - { - "epoch": 0.36, - "learning_rate": 3.208948196305068e-05, - "loss": 2.363, - "step": 205410 - }, - { - "epoch": 0.36, - "learning_rate": 3.208861002312385e-05, - "loss": 2.4351, - "step": 205420 - }, - { - "epoch": 0.36, - "learning_rate": 3.2087738083197025e-05, - "loss": 2.344, - "step": 205430 - }, - { - "epoch": 0.36, - "learning_rate": 3.2086866143270195e-05, - "loss": 2.3733, - "step": 205440 - }, - { - "epoch": 0.36, - "learning_rate": 3.2085994203343365e-05, - "loss": 2.4213, - "step": 205450 - }, - { - "epoch": 0.36, - "learning_rate": 3.208512226341654e-05, - "loss": 2.3833, - "step": 205460 - }, - { - "epoch": 0.36, - "learning_rate": 3.208425032348971e-05, - "loss": 2.4326, - "step": 205470 - }, - { - "epoch": 0.36, - "learning_rate": 3.208337838356289e-05, - "loss": 2.4012, - "step": 205480 - }, - { - "epoch": 0.36, - "learning_rate": 3.208250644363606e-05, - "loss": 2.332, - "step": 205490 - }, - { - "epoch": 0.36, - "learning_rate": 3.208163450370924e-05, - "loss": 2.3448, - "step": 205500 - }, - { - "epoch": 0.36, - "learning_rate": 3.208076256378241e-05, - "loss": 2.553, - "step": 205510 - }, - { - "epoch": 0.36, - "learning_rate": 3.207989062385558e-05, - "loss": 2.3735, - "step": 205520 - }, - { - "epoch": 0.36, - "learning_rate": 3.2079018683928755e-05, - "loss": 2.4431, - "step": 205530 - }, - { - "epoch": 0.36, - "learning_rate": 3.2078146744001926e-05, - "loss": 2.3169, - "step": 205540 - }, - { - "epoch": 0.36, - "learning_rate": 3.20772748040751e-05, - "loss": 2.4381, - "step": 205550 - }, - { - "epoch": 0.36, - "learning_rate": 3.2076402864148273e-05, - "loss": 2.396, - "step": 205560 - }, - { - "epoch": 0.36, - "learning_rate": 3.207553092422145e-05, - "loss": 2.3588, - "step": 205570 - }, - { - "epoch": 0.36, - "learning_rate": 3.207465898429462e-05, - "loss": 2.4418, - "step": 205580 - }, - { - "epoch": 0.36, - "learning_rate": 3.207378704436779e-05, - "loss": 2.3774, - "step": 205590 - }, - { - "epoch": 0.36, - "learning_rate": 3.207291510444096e-05, - "loss": 2.4011, - "step": 205600 - }, - { - "epoch": 0.36, - "learning_rate": 3.207204316451414e-05, - "loss": 2.3516, - "step": 205610 - }, - { - "epoch": 0.36, - "learning_rate": 3.207117122458731e-05, - "loss": 2.5026, - "step": 205620 - }, - { - "epoch": 0.36, - "learning_rate": 3.2070299284660486e-05, - "loss": 2.3792, - "step": 205630 - }, - { - "epoch": 0.36, - "learning_rate": 3.2069427344733664e-05, - "loss": 2.4209, - "step": 205640 - }, - { - "epoch": 0.36, - "learning_rate": 3.2068555404806834e-05, - "loss": 2.4254, - "step": 205650 - }, - { - "epoch": 0.36, - "learning_rate": 3.2067683464880004e-05, - "loss": 2.4302, - "step": 205660 - }, - { - "epoch": 0.36, - "learning_rate": 3.2066811524953175e-05, - "loss": 2.3218, - "step": 205670 - }, - { - "epoch": 0.36, - "learning_rate": 3.206593958502635e-05, - "loss": 2.4864, - "step": 205680 - }, - { - "epoch": 0.36, - "learning_rate": 3.206506764509952e-05, - "loss": 2.478, - "step": 205690 - }, - { - "epoch": 0.36, - "learning_rate": 3.20641957051727e-05, - "loss": 2.2895, - "step": 205700 - }, - { - "epoch": 0.36, - "learning_rate": 3.206332376524587e-05, - "loss": 2.5352, - "step": 205710 - }, - { - "epoch": 0.36, - "learning_rate": 3.206245182531905e-05, - "loss": 2.3424, - "step": 205720 - }, - { - "epoch": 0.36, - "learning_rate": 3.206157988539222e-05, - "loss": 2.3866, - "step": 205730 - }, - { - "epoch": 0.36, - "learning_rate": 3.206070794546539e-05, - "loss": 2.3592, - "step": 205740 - }, - { - "epoch": 0.36, - "learning_rate": 3.2059836005538565e-05, - "loss": 2.5298, - "step": 205750 - }, - { - "epoch": 0.36, - "learning_rate": 3.2058964065611735e-05, - "loss": 2.4929, - "step": 205760 - }, - { - "epoch": 0.36, - "learning_rate": 3.2058092125684906e-05, - "loss": 2.4346, - "step": 205770 - }, - { - "epoch": 0.36, - "learning_rate": 3.205722018575808e-05, - "loss": 2.3927, - "step": 205780 - }, - { - "epoch": 0.36, - "learning_rate": 3.205634824583126e-05, - "loss": 2.4053, - "step": 205790 - }, - { - "epoch": 0.36, - "learning_rate": 3.205547630590443e-05, - "loss": 2.3, - "step": 205800 - }, - { - "epoch": 0.36, - "learning_rate": 3.20546043659776e-05, - "loss": 2.4661, - "step": 205810 - }, - { - "epoch": 0.36, - "learning_rate": 3.205373242605078e-05, - "loss": 2.4696, - "step": 205820 - }, - { - "epoch": 0.36, - "learning_rate": 3.205286048612395e-05, - "loss": 2.4056, - "step": 205830 - }, - { - "epoch": 0.36, - "learning_rate": 3.205198854619712e-05, - "loss": 2.4186, - "step": 205840 - }, - { - "epoch": 0.36, - "learning_rate": 3.2051116606270296e-05, - "loss": 2.4548, - "step": 205850 - }, - { - "epoch": 0.36, - "learning_rate": 3.205024466634347e-05, - "loss": 2.4633, - "step": 205860 - }, - { - "epoch": 0.36, - "learning_rate": 3.204937272641664e-05, - "loss": 2.5082, - "step": 205870 - }, - { - "epoch": 0.36, - "learning_rate": 3.2048500786489814e-05, - "loss": 2.4491, - "step": 205880 - }, - { - "epoch": 0.36, - "learning_rate": 3.204762884656299e-05, - "loss": 2.4017, - "step": 205890 - }, - { - "epoch": 0.36, - "learning_rate": 3.204675690663616e-05, - "loss": 2.2991, - "step": 205900 - }, - { - "epoch": 0.36, - "learning_rate": 3.204588496670933e-05, - "loss": 2.2784, - "step": 205910 - }, - { - "epoch": 0.36, - "learning_rate": 3.204501302678251e-05, - "loss": 2.4183, - "step": 205920 - }, - { - "epoch": 0.36, - "learning_rate": 3.2044141086855686e-05, - "loss": 2.3781, - "step": 205930 - }, - { - "epoch": 0.36, - "learning_rate": 3.2043269146928856e-05, - "loss": 2.3872, - "step": 205940 - }, - { - "epoch": 0.36, - "learning_rate": 3.204239720700203e-05, - "loss": 2.483, - "step": 205950 - }, - { - "epoch": 0.36, - "learning_rate": 3.2041525267075204e-05, - "loss": 2.4383, - "step": 205960 - }, - { - "epoch": 0.36, - "learning_rate": 3.2040653327148374e-05, - "loss": 2.3506, - "step": 205970 - }, - { - "epoch": 0.36, - "learning_rate": 3.2039781387221545e-05, - "loss": 2.4038, - "step": 205980 - }, - { - "epoch": 0.36, - "learning_rate": 3.2038909447294715e-05, - "loss": 2.3971, - "step": 205990 - }, - { - "epoch": 0.36, - "learning_rate": 3.20380375073679e-05, - "loss": 2.3146, - "step": 206000 - }, - { - "epoch": 0.36, - "learning_rate": 3.203716556744107e-05, - "loss": 2.4633, - "step": 206010 - }, - { - "epoch": 0.36, - "learning_rate": 3.203629362751424e-05, - "loss": 2.3234, - "step": 206020 - }, - { - "epoch": 0.36, - "learning_rate": 3.203542168758742e-05, - "loss": 2.3612, - "step": 206030 - }, - { - "epoch": 0.36, - "learning_rate": 3.203454974766059e-05, - "loss": 2.4307, - "step": 206040 - }, - { - "epoch": 0.36, - "learning_rate": 3.203367780773376e-05, - "loss": 2.4082, - "step": 206050 - }, - { - "epoch": 0.36, - "learning_rate": 3.203280586780693e-05, - "loss": 2.4394, - "step": 206060 - }, - { - "epoch": 0.36, - "learning_rate": 3.203193392788011e-05, - "loss": 2.3177, - "step": 206070 - }, - { - "epoch": 0.36, - "learning_rate": 3.203106198795328e-05, - "loss": 2.5199, - "step": 206080 - }, - { - "epoch": 0.36, - "learning_rate": 3.203019004802645e-05, - "loss": 2.2875, - "step": 206090 - }, - { - "epoch": 0.36, - "learning_rate": 3.202931810809962e-05, - "loss": 2.4504, - "step": 206100 - }, - { - "epoch": 0.36, - "learning_rate": 3.20284461681728e-05, - "loss": 2.4676, - "step": 206110 - }, - { - "epoch": 0.36, - "learning_rate": 3.202757422824597e-05, - "loss": 2.5626, - "step": 206120 - }, - { - "epoch": 0.36, - "learning_rate": 3.202670228831914e-05, - "loss": 2.3572, - "step": 206130 - }, - { - "epoch": 0.36, - "learning_rate": 3.202583034839232e-05, - "loss": 2.3653, - "step": 206140 - }, - { - "epoch": 0.36, - "learning_rate": 3.2024958408465495e-05, - "loss": 2.5401, - "step": 206150 - }, - { - "epoch": 0.36, - "learning_rate": 3.2024086468538666e-05, - "loss": 2.4316, - "step": 206160 - }, - { - "epoch": 0.36, - "learning_rate": 3.2023214528611836e-05, - "loss": 2.4854, - "step": 206170 - }, - { - "epoch": 0.36, - "learning_rate": 3.202234258868501e-05, - "loss": 2.572, - "step": 206180 - }, - { - "epoch": 0.36, - "learning_rate": 3.2021470648758184e-05, - "loss": 2.5298, - "step": 206190 - }, - { - "epoch": 0.36, - "learning_rate": 3.2020598708831354e-05, - "loss": 2.4161, - "step": 206200 - }, - { - "epoch": 0.36, - "learning_rate": 3.201972676890453e-05, - "loss": 2.4386, - "step": 206210 - }, - { - "epoch": 0.36, - "learning_rate": 3.201885482897771e-05, - "loss": 2.5539, - "step": 206220 - }, - { - "epoch": 0.36, - "learning_rate": 3.201798288905088e-05, - "loss": 2.4, - "step": 206230 - }, - { - "epoch": 0.36, - "learning_rate": 3.201711094912405e-05, - "loss": 2.2398, - "step": 206240 - }, - { - "epoch": 0.36, - "learning_rate": 3.2016239009197226e-05, - "loss": 2.3641, - "step": 206250 - }, - { - "epoch": 0.36, - "learning_rate": 3.20153670692704e-05, - "loss": 2.5389, - "step": 206260 - }, - { - "epoch": 0.36, - "learning_rate": 3.201449512934357e-05, - "loss": 2.3465, - "step": 206270 - }, - { - "epoch": 0.36, - "learning_rate": 3.2013623189416744e-05, - "loss": 2.4226, - "step": 206280 - }, - { - "epoch": 0.36, - "learning_rate": 3.2012751249489915e-05, - "loss": 2.3347, - "step": 206290 - }, - { - "epoch": 0.36, - "learning_rate": 3.201187930956309e-05, - "loss": 2.4195, - "step": 206300 - }, - { - "epoch": 0.36, - "learning_rate": 3.201100736963626e-05, - "loss": 2.4098, - "step": 206310 - }, - { - "epoch": 0.36, - "learning_rate": 3.201013542970944e-05, - "loss": 2.3531, - "step": 206320 - }, - { - "epoch": 0.36, - "learning_rate": 3.200926348978261e-05, - "loss": 2.3788, - "step": 206330 - }, - { - "epoch": 0.36, - "learning_rate": 3.200839154985578e-05, - "loss": 2.465, - "step": 206340 - }, - { - "epoch": 0.36, - "learning_rate": 3.200751960992896e-05, - "loss": 2.3533, - "step": 206350 - }, - { - "epoch": 0.36, - "learning_rate": 3.200664767000213e-05, - "loss": 2.2632, - "step": 206360 - }, - { - "epoch": 0.36, - "learning_rate": 3.2005775730075305e-05, - "loss": 2.447, - "step": 206370 - }, - { - "epoch": 0.36, - "learning_rate": 3.2004903790148475e-05, - "loss": 2.399, - "step": 206380 - }, - { - "epoch": 0.36, - "learning_rate": 3.200403185022165e-05, - "loss": 2.5187, - "step": 206390 - }, - { - "epoch": 0.36, - "learning_rate": 3.200315991029482e-05, - "loss": 2.4086, - "step": 206400 - }, - { - "epoch": 0.36, - "learning_rate": 3.200228797036799e-05, - "loss": 2.5178, - "step": 206410 - }, - { - "epoch": 0.36, - "learning_rate": 3.200141603044117e-05, - "loss": 2.4429, - "step": 206420 - }, - { - "epoch": 0.36, - "learning_rate": 3.200054409051434e-05, - "loss": 2.4299, - "step": 206430 - }, - { - "epoch": 0.36, - "learning_rate": 3.199967215058751e-05, - "loss": 2.4583, - "step": 206440 - }, - { - "epoch": 0.36, - "learning_rate": 3.199880021066069e-05, - "loss": 2.4348, - "step": 206450 - }, - { - "epoch": 0.36, - "learning_rate": 3.1997928270733865e-05, - "loss": 2.3486, - "step": 206460 - }, - { - "epoch": 0.36, - "learning_rate": 3.1997056330807036e-05, - "loss": 2.3471, - "step": 206470 - }, - { - "epoch": 0.36, - "learning_rate": 3.1996184390880206e-05, - "loss": 2.3922, - "step": 206480 - }, - { - "epoch": 0.36, - "learning_rate": 3.1995312450953376e-05, - "loss": 2.3836, - "step": 206490 - }, - { - "epoch": 0.36, - "learning_rate": 3.1994440511026554e-05, - "loss": 2.4037, - "step": 206500 - }, - { - "epoch": 0.36, - "learning_rate": 3.1993568571099724e-05, - "loss": 2.4566, - "step": 206510 - }, - { - "epoch": 0.36, - "learning_rate": 3.19926966311729e-05, - "loss": 2.4493, - "step": 206520 - }, - { - "epoch": 0.36, - "learning_rate": 3.199182469124608e-05, - "loss": 2.4554, - "step": 206530 - }, - { - "epoch": 0.36, - "learning_rate": 3.199095275131925e-05, - "loss": 2.3917, - "step": 206540 - }, - { - "epoch": 0.36, - "learning_rate": 3.199008081139242e-05, - "loss": 2.4728, - "step": 206550 - }, - { - "epoch": 0.36, - "learning_rate": 3.198920887146559e-05, - "loss": 2.4733, - "step": 206560 - }, - { - "epoch": 0.36, - "learning_rate": 3.1988336931538767e-05, - "loss": 2.3515, - "step": 206570 - }, - { - "epoch": 0.36, - "learning_rate": 3.198746499161194e-05, - "loss": 2.424, - "step": 206580 - }, - { - "epoch": 0.36, - "learning_rate": 3.1986593051685114e-05, - "loss": 2.3485, - "step": 206590 - }, - { - "epoch": 0.36, - "learning_rate": 3.1985721111758284e-05, - "loss": 2.4471, - "step": 206600 - }, - { - "epoch": 0.36, - "learning_rate": 3.198484917183146e-05, - "loss": 2.3241, - "step": 206610 - }, - { - "epoch": 0.36, - "learning_rate": 3.198397723190463e-05, - "loss": 2.447, - "step": 206620 - }, - { - "epoch": 0.36, - "learning_rate": 3.19831052919778e-05, - "loss": 2.3131, - "step": 206630 - }, - { - "epoch": 0.36, - "learning_rate": 3.198223335205098e-05, - "loss": 2.2678, - "step": 206640 - }, - { - "epoch": 0.36, - "learning_rate": 3.198136141212415e-05, - "loss": 2.467, - "step": 206650 - }, - { - "epoch": 0.36, - "learning_rate": 3.198048947219732e-05, - "loss": 2.4695, - "step": 206660 - }, - { - "epoch": 0.36, - "learning_rate": 3.19796175322705e-05, - "loss": 2.3462, - "step": 206670 - }, - { - "epoch": 0.36, - "learning_rate": 3.1978745592343675e-05, - "loss": 2.4485, - "step": 206680 - }, - { - "epoch": 0.36, - "learning_rate": 3.1977873652416845e-05, - "loss": 2.5422, - "step": 206690 - }, - { - "epoch": 0.36, - "learning_rate": 3.1977001712490015e-05, - "loss": 2.3385, - "step": 206700 - }, - { - "epoch": 0.36, - "learning_rate": 3.197612977256319e-05, - "loss": 2.3732, - "step": 206710 - }, - { - "epoch": 0.36, - "learning_rate": 3.197525783263636e-05, - "loss": 2.431, - "step": 206720 - }, - { - "epoch": 0.36, - "learning_rate": 3.197438589270953e-05, - "loss": 2.4376, - "step": 206730 - }, - { - "epoch": 0.36, - "learning_rate": 3.197351395278271e-05, - "loss": 2.3579, - "step": 206740 - }, - { - "epoch": 0.36, - "learning_rate": 3.197264201285589e-05, - "loss": 2.4233, - "step": 206750 - }, - { - "epoch": 0.36, - "learning_rate": 3.197177007292906e-05, - "loss": 2.4765, - "step": 206760 - }, - { - "epoch": 0.36, - "learning_rate": 3.197089813300223e-05, - "loss": 2.2997, - "step": 206770 - }, - { - "epoch": 0.36, - "learning_rate": 3.1970026193075406e-05, - "loss": 2.4318, - "step": 206780 - }, - { - "epoch": 0.36, - "learning_rate": 3.1969154253148576e-05, - "loss": 2.3837, - "step": 206790 - }, - { - "epoch": 0.36, - "learning_rate": 3.1968282313221746e-05, - "loss": 2.4966, - "step": 206800 - }, - { - "epoch": 0.36, - "learning_rate": 3.1967410373294923e-05, - "loss": 2.3675, - "step": 206810 - }, - { - "epoch": 0.36, - "learning_rate": 3.19665384333681e-05, - "loss": 2.2523, - "step": 206820 - }, - { - "epoch": 0.36, - "learning_rate": 3.196566649344127e-05, - "loss": 2.5456, - "step": 206830 - }, - { - "epoch": 0.36, - "learning_rate": 3.196479455351444e-05, - "loss": 2.2706, - "step": 206840 - }, - { - "epoch": 0.36, - "learning_rate": 3.196392261358762e-05, - "loss": 2.2939, - "step": 206850 - }, - { - "epoch": 0.36, - "learning_rate": 3.196305067366079e-05, - "loss": 2.5291, - "step": 206860 - }, - { - "epoch": 0.36, - "learning_rate": 3.196217873373396e-05, - "loss": 2.3676, - "step": 206870 - }, - { - "epoch": 0.36, - "learning_rate": 3.1961306793807136e-05, - "loss": 2.4266, - "step": 206880 - }, - { - "epoch": 0.36, - "learning_rate": 3.1960434853880314e-05, - "loss": 2.5004, - "step": 206890 - }, - { - "epoch": 0.36, - "learning_rate": 3.1959562913953484e-05, - "loss": 2.3749, - "step": 206900 - }, - { - "epoch": 0.36, - "learning_rate": 3.1958690974026654e-05, - "loss": 2.3072, - "step": 206910 - }, - { - "epoch": 0.36, - "learning_rate": 3.195781903409983e-05, - "loss": 2.4957, - "step": 206920 - }, - { - "epoch": 0.36, - "learning_rate": 3.1956947094173e-05, - "loss": 2.547, - "step": 206930 - }, - { - "epoch": 0.36, - "learning_rate": 3.195607515424617e-05, - "loss": 2.4674, - "step": 206940 - }, - { - "epoch": 0.36, - "learning_rate": 3.195520321431934e-05, - "loss": 2.453, - "step": 206950 - }, - { - "epoch": 0.36, - "learning_rate": 3.195433127439252e-05, - "loss": 2.3531, - "step": 206960 - }, - { - "epoch": 0.36, - "learning_rate": 3.19534593344657e-05, - "loss": 2.4749, - "step": 206970 - }, - { - "epoch": 0.36, - "learning_rate": 3.195258739453887e-05, - "loss": 2.5248, - "step": 206980 - }, - { - "epoch": 0.36, - "learning_rate": 3.1951715454612045e-05, - "loss": 2.3522, - "step": 206990 - }, - { - "epoch": 0.36, - "learning_rate": 3.1950843514685215e-05, - "loss": 2.4521, - "step": 207000 - }, - { - "epoch": 0.36, - "learning_rate": 3.1949971574758385e-05, - "loss": 2.3771, - "step": 207010 - }, - { - "epoch": 0.36, - "learning_rate": 3.1949099634831556e-05, - "loss": 2.3731, - "step": 207020 - }, - { - "epoch": 0.36, - "learning_rate": 3.194822769490473e-05, - "loss": 2.4715, - "step": 207030 - }, - { - "epoch": 0.36, - "learning_rate": 3.194735575497791e-05, - "loss": 2.4104, - "step": 207040 - }, - { - "epoch": 0.36, - "learning_rate": 3.194648381505108e-05, - "loss": 2.4022, - "step": 207050 - }, - { - "epoch": 0.36, - "learning_rate": 3.194561187512425e-05, - "loss": 2.3295, - "step": 207060 - }, - { - "epoch": 0.36, - "learning_rate": 3.194473993519743e-05, - "loss": 2.2718, - "step": 207070 - }, - { - "epoch": 0.36, - "learning_rate": 3.19438679952706e-05, - "loss": 2.4076, - "step": 207080 - }, - { - "epoch": 0.36, - "learning_rate": 3.194299605534377e-05, - "loss": 2.526, - "step": 207090 - }, - { - "epoch": 0.36, - "learning_rate": 3.1942124115416946e-05, - "loss": 2.4078, - "step": 207100 - }, - { - "epoch": 0.36, - "learning_rate": 3.194125217549012e-05, - "loss": 2.2204, - "step": 207110 - }, - { - "epoch": 0.36, - "learning_rate": 3.1940380235563293e-05, - "loss": 2.5293, - "step": 207120 - }, - { - "epoch": 0.36, - "learning_rate": 3.1939508295636464e-05, - "loss": 2.5344, - "step": 207130 - }, - { - "epoch": 0.36, - "learning_rate": 3.193863635570964e-05, - "loss": 2.429, - "step": 207140 - }, - { - "epoch": 0.36, - "learning_rate": 3.193776441578281e-05, - "loss": 2.4581, - "step": 207150 - }, - { - "epoch": 0.36, - "learning_rate": 3.193689247585598e-05, - "loss": 2.4176, - "step": 207160 - }, - { - "epoch": 0.36, - "learning_rate": 3.193602053592916e-05, - "loss": 2.4113, - "step": 207170 - }, - { - "epoch": 0.36, - "learning_rate": 3.193514859600233e-05, - "loss": 2.4627, - "step": 207180 - }, - { - "epoch": 0.36, - "learning_rate": 3.1934276656075506e-05, - "loss": 2.3895, - "step": 207190 - }, - { - "epoch": 0.36, - "learning_rate": 3.193340471614868e-05, - "loss": 2.3824, - "step": 207200 - }, - { - "epoch": 0.36, - "learning_rate": 3.1932532776221854e-05, - "loss": 2.4154, - "step": 207210 - }, - { - "epoch": 0.36, - "learning_rate": 3.1931660836295024e-05, - "loss": 2.3355, - "step": 207220 - }, - { - "epoch": 0.36, - "learning_rate": 3.1930788896368195e-05, - "loss": 2.4038, - "step": 207230 - }, - { - "epoch": 0.36, - "learning_rate": 3.192991695644137e-05, - "loss": 2.4415, - "step": 207240 - }, - { - "epoch": 0.36, - "learning_rate": 3.192904501651454e-05, - "loss": 2.4575, - "step": 207250 - }, - { - "epoch": 0.36, - "learning_rate": 3.192817307658772e-05, - "loss": 2.4085, - "step": 207260 - }, - { - "epoch": 0.36, - "learning_rate": 3.192730113666089e-05, - "loss": 2.4097, - "step": 207270 - }, - { - "epoch": 0.36, - "learning_rate": 3.192642919673407e-05, - "loss": 2.4289, - "step": 207280 - }, - { - "epoch": 0.36, - "learning_rate": 3.192555725680724e-05, - "loss": 2.3699, - "step": 207290 - }, - { - "epoch": 0.36, - "learning_rate": 3.192468531688041e-05, - "loss": 2.4076, - "step": 207300 - }, - { - "epoch": 0.36, - "learning_rate": 3.1923813376953585e-05, - "loss": 2.4169, - "step": 207310 - }, - { - "epoch": 0.36, - "learning_rate": 3.1922941437026755e-05, - "loss": 2.4195, - "step": 207320 - }, - { - "epoch": 0.36, - "learning_rate": 3.1922069497099926e-05, - "loss": 2.4144, - "step": 207330 - }, - { - "epoch": 0.36, - "learning_rate": 3.19211975571731e-05, - "loss": 2.3487, - "step": 207340 - }, - { - "epoch": 0.36, - "learning_rate": 3.192032561724628e-05, - "loss": 2.3558, - "step": 207350 - }, - { - "epoch": 0.36, - "learning_rate": 3.191945367731945e-05, - "loss": 2.4179, - "step": 207360 - }, - { - "epoch": 0.36, - "learning_rate": 3.191858173739262e-05, - "loss": 2.3572, - "step": 207370 - }, - { - "epoch": 0.36, - "learning_rate": 3.19177097974658e-05, - "loss": 2.3826, - "step": 207380 - }, - { - "epoch": 0.36, - "learning_rate": 3.191683785753897e-05, - "loss": 2.5028, - "step": 207390 - }, - { - "epoch": 0.36, - "learning_rate": 3.191596591761214e-05, - "loss": 2.4195, - "step": 207400 - }, - { - "epoch": 0.36, - "learning_rate": 3.1915093977685316e-05, - "loss": 2.4371, - "step": 207410 - }, - { - "epoch": 0.36, - "learning_rate": 3.191422203775849e-05, - "loss": 2.4014, - "step": 207420 - }, - { - "epoch": 0.36, - "learning_rate": 3.191335009783166e-05, - "loss": 2.4286, - "step": 207430 - }, - { - "epoch": 0.36, - "learning_rate": 3.1912478157904834e-05, - "loss": 2.3791, - "step": 207440 - }, - { - "epoch": 0.36, - "learning_rate": 3.1911606217978004e-05, - "loss": 2.2904, - "step": 207450 - }, - { - "epoch": 0.36, - "learning_rate": 3.191073427805118e-05, - "loss": 2.4537, - "step": 207460 - }, - { - "epoch": 0.36, - "learning_rate": 3.190986233812435e-05, - "loss": 2.3853, - "step": 207470 - }, - { - "epoch": 0.36, - "learning_rate": 3.190899039819752e-05, - "loss": 2.4731, - "step": 207480 - }, - { - "epoch": 0.36, - "learning_rate": 3.1908118458270706e-05, - "loss": 2.4904, - "step": 207490 - }, - { - "epoch": 0.36, - "learning_rate": 3.1907246518343876e-05, - "loss": 2.3755, - "step": 207500 - }, - { - "epoch": 0.36, - "learning_rate": 3.190637457841705e-05, - "loss": 2.3009, - "step": 207510 - }, - { - "epoch": 0.36, - "learning_rate": 3.190550263849022e-05, - "loss": 2.3059, - "step": 207520 - }, - { - "epoch": 0.36, - "learning_rate": 3.1904630698563394e-05, - "loss": 2.3447, - "step": 207530 - }, - { - "epoch": 0.36, - "learning_rate": 3.1903758758636565e-05, - "loss": 2.3895, - "step": 207540 - }, - { - "epoch": 0.36, - "learning_rate": 3.1902886818709735e-05, - "loss": 2.43, - "step": 207550 - }, - { - "epoch": 0.36, - "learning_rate": 3.190201487878291e-05, - "loss": 2.426, - "step": 207560 - }, - { - "epoch": 0.36, - "learning_rate": 3.190114293885609e-05, - "loss": 2.4636, - "step": 207570 - }, - { - "epoch": 0.36, - "learning_rate": 3.190027099892926e-05, - "loss": 2.4327, - "step": 207580 - }, - { - "epoch": 0.36, - "learning_rate": 3.189939905900243e-05, - "loss": 2.4612, - "step": 207590 - }, - { - "epoch": 0.36, - "learning_rate": 3.189852711907561e-05, - "loss": 2.3482, - "step": 207600 - }, - { - "epoch": 0.36, - "learning_rate": 3.189765517914878e-05, - "loss": 2.4998, - "step": 207610 - }, - { - "epoch": 0.36, - "learning_rate": 3.189678323922195e-05, - "loss": 2.3713, - "step": 207620 - }, - { - "epoch": 0.36, - "learning_rate": 3.1895911299295125e-05, - "loss": 2.4666, - "step": 207630 - }, - { - "epoch": 0.36, - "learning_rate": 3.18950393593683e-05, - "loss": 2.3717, - "step": 207640 - }, - { - "epoch": 0.36, - "learning_rate": 3.189416741944147e-05, - "loss": 2.3665, - "step": 207650 - }, - { - "epoch": 0.36, - "learning_rate": 3.189329547951464e-05, - "loss": 2.4269, - "step": 207660 - }, - { - "epoch": 0.36, - "learning_rate": 3.189242353958782e-05, - "loss": 2.3747, - "step": 207670 - }, - { - "epoch": 0.36, - "learning_rate": 3.189155159966099e-05, - "loss": 2.4152, - "step": 207680 - }, - { - "epoch": 0.36, - "learning_rate": 3.189067965973416e-05, - "loss": 2.4594, - "step": 207690 - }, - { - "epoch": 0.36, - "learning_rate": 3.188980771980734e-05, - "loss": 2.4218, - "step": 207700 - }, - { - "epoch": 0.36, - "learning_rate": 3.1888935779880515e-05, - "loss": 2.5022, - "step": 207710 - }, - { - "epoch": 0.36, - "learning_rate": 3.1888063839953686e-05, - "loss": 2.417, - "step": 207720 - }, - { - "epoch": 0.36, - "learning_rate": 3.1887191900026856e-05, - "loss": 2.3903, - "step": 207730 - }, - { - "epoch": 0.36, - "learning_rate": 3.188631996010003e-05, - "loss": 2.3784, - "step": 207740 - }, - { - "epoch": 0.36, - "learning_rate": 3.1885448020173204e-05, - "loss": 2.3511, - "step": 207750 - }, - { - "epoch": 0.36, - "learning_rate": 3.1884576080246374e-05, - "loss": 2.4279, - "step": 207760 - }, - { - "epoch": 0.36, - "learning_rate": 3.188370414031955e-05, - "loss": 2.4383, - "step": 207770 - }, - { - "epoch": 0.36, - "learning_rate": 3.188283220039273e-05, - "loss": 2.3437, - "step": 207780 - }, - { - "epoch": 0.36, - "learning_rate": 3.18819602604659e-05, - "loss": 2.3554, - "step": 207790 - }, - { - "epoch": 0.36, - "learning_rate": 3.188108832053907e-05, - "loss": 2.3576, - "step": 207800 - }, - { - "epoch": 0.36, - "learning_rate": 3.1880216380612246e-05, - "loss": 2.3858, - "step": 207810 - }, - { - "epoch": 0.36, - "learning_rate": 3.187934444068542e-05, - "loss": 2.4186, - "step": 207820 - }, - { - "epoch": 0.36, - "learning_rate": 3.187847250075859e-05, - "loss": 2.3685, - "step": 207830 - }, - { - "epoch": 0.36, - "learning_rate": 3.187760056083176e-05, - "loss": 2.324, - "step": 207840 - }, - { - "epoch": 0.36, - "learning_rate": 3.1876728620904935e-05, - "loss": 2.4002, - "step": 207850 - }, - { - "epoch": 0.36, - "learning_rate": 3.187585668097811e-05, - "loss": 2.3171, - "step": 207860 - }, - { - "epoch": 0.36, - "learning_rate": 3.187498474105128e-05, - "loss": 2.4421, - "step": 207870 - }, - { - "epoch": 0.36, - "learning_rate": 3.187411280112446e-05, - "loss": 2.3965, - "step": 207880 - }, - { - "epoch": 0.36, - "learning_rate": 3.187324086119763e-05, - "loss": 2.4362, - "step": 207890 - }, - { - "epoch": 0.36, - "learning_rate": 3.18723689212708e-05, - "loss": 2.4392, - "step": 207900 - }, - { - "epoch": 0.36, - "learning_rate": 3.187149698134397e-05, - "loss": 2.4564, - "step": 207910 - }, - { - "epoch": 0.36, - "learning_rate": 3.187062504141715e-05, - "loss": 2.4082, - "step": 207920 - }, - { - "epoch": 0.36, - "learning_rate": 3.1869753101490325e-05, - "loss": 2.2948, - "step": 207930 - }, - { - "epoch": 0.36, - "learning_rate": 3.1868881161563495e-05, - "loss": 2.349, - "step": 207940 - }, - { - "epoch": 0.36, - "learning_rate": 3.1868009221636665e-05, - "loss": 2.4873, - "step": 207950 - }, - { - "epoch": 0.36, - "learning_rate": 3.186713728170984e-05, - "loss": 2.4297, - "step": 207960 - }, - { - "epoch": 0.36, - "learning_rate": 3.186626534178301e-05, - "loss": 2.4357, - "step": 207970 - }, - { - "epoch": 0.36, - "learning_rate": 3.1865393401856183e-05, - "loss": 2.3501, - "step": 207980 - }, - { - "epoch": 0.36, - "learning_rate": 3.186452146192936e-05, - "loss": 2.4188, - "step": 207990 - }, - { - "epoch": 0.36, - "learning_rate": 3.186364952200253e-05, - "loss": 2.4635, - "step": 208000 - }, - { - "epoch": 0.36, - "learning_rate": 3.186277758207571e-05, - "loss": 2.3461, - "step": 208010 - }, - { - "epoch": 0.36, - "learning_rate": 3.186190564214888e-05, - "loss": 2.3222, - "step": 208020 - }, - { - "epoch": 0.36, - "learning_rate": 3.1861033702222056e-05, - "loss": 2.4247, - "step": 208030 - }, - { - "epoch": 0.36, - "learning_rate": 3.1860161762295226e-05, - "loss": 2.4515, - "step": 208040 - }, - { - "epoch": 0.36, - "learning_rate": 3.1859289822368396e-05, - "loss": 2.4169, - "step": 208050 - }, - { - "epoch": 0.36, - "learning_rate": 3.1858417882441574e-05, - "loss": 2.4565, - "step": 208060 - }, - { - "epoch": 0.36, - "learning_rate": 3.1857545942514744e-05, - "loss": 2.352, - "step": 208070 - }, - { - "epoch": 0.36, - "learning_rate": 3.185667400258792e-05, - "loss": 2.2751, - "step": 208080 - }, - { - "epoch": 0.36, - "learning_rate": 3.185580206266109e-05, - "loss": 2.4217, - "step": 208090 - }, - { - "epoch": 0.36, - "learning_rate": 3.185493012273427e-05, - "loss": 2.2913, - "step": 208100 - }, - { - "epoch": 0.36, - "learning_rate": 3.185405818280744e-05, - "loss": 2.4145, - "step": 208110 - }, - { - "epoch": 0.36, - "learning_rate": 3.185318624288061e-05, - "loss": 2.5038, - "step": 208120 - }, - { - "epoch": 0.36, - "learning_rate": 3.1852314302953787e-05, - "loss": 2.4875, - "step": 208130 - }, - { - "epoch": 0.36, - "learning_rate": 3.185144236302696e-05, - "loss": 2.3713, - "step": 208140 - }, - { - "epoch": 0.36, - "learning_rate": 3.185057042310013e-05, - "loss": 2.3854, - "step": 208150 - }, - { - "epoch": 0.36, - "learning_rate": 3.1849698483173304e-05, - "loss": 2.4602, - "step": 208160 - }, - { - "epoch": 0.36, - "learning_rate": 3.184882654324648e-05, - "loss": 2.3618, - "step": 208170 - }, - { - "epoch": 0.36, - "learning_rate": 3.184795460331965e-05, - "loss": 2.4308, - "step": 208180 - }, - { - "epoch": 0.36, - "learning_rate": 3.184708266339282e-05, - "loss": 2.4332, - "step": 208190 - }, - { - "epoch": 0.36, - "learning_rate": 3.1846210723466e-05, - "loss": 2.3763, - "step": 208200 - }, - { - "epoch": 0.36, - "learning_rate": 3.184533878353917e-05, - "loss": 2.4227, - "step": 208210 - }, - { - "epoch": 0.36, - "learning_rate": 3.184446684361234e-05, - "loss": 2.4029, - "step": 208220 - }, - { - "epoch": 0.36, - "learning_rate": 3.184359490368552e-05, - "loss": 2.4692, - "step": 208230 - }, - { - "epoch": 0.36, - "learning_rate": 3.1842722963758695e-05, - "loss": 2.4417, - "step": 208240 - }, - { - "epoch": 0.36, - "learning_rate": 3.1841851023831865e-05, - "loss": 2.5285, - "step": 208250 - }, - { - "epoch": 0.36, - "learning_rate": 3.1840979083905035e-05, - "loss": 2.4722, - "step": 208260 - }, - { - "epoch": 0.36, - "learning_rate": 3.184010714397821e-05, - "loss": 2.4754, - "step": 208270 - }, - { - "epoch": 0.36, - "learning_rate": 3.183923520405138e-05, - "loss": 2.2927, - "step": 208280 - }, - { - "epoch": 0.36, - "learning_rate": 3.183836326412455e-05, - "loss": 2.3897, - "step": 208290 - }, - { - "epoch": 0.36, - "learning_rate": 3.1837491324197724e-05, - "loss": 2.356, - "step": 208300 - }, - { - "epoch": 0.36, - "learning_rate": 3.183661938427091e-05, - "loss": 2.5083, - "step": 208310 - }, - { - "epoch": 0.36, - "learning_rate": 3.183574744434408e-05, - "loss": 2.4535, - "step": 208320 - }, - { - "epoch": 0.36, - "learning_rate": 3.183487550441725e-05, - "loss": 2.4361, - "step": 208330 - }, - { - "epoch": 0.36, - "learning_rate": 3.1834003564490426e-05, - "loss": 2.3735, - "step": 208340 - }, - { - "epoch": 0.36, - "learning_rate": 3.1833131624563596e-05, - "loss": 2.3053, - "step": 208350 - }, - { - "epoch": 0.36, - "learning_rate": 3.1832259684636766e-05, - "loss": 2.456, - "step": 208360 - }, - { - "epoch": 0.36, - "learning_rate": 3.183138774470994e-05, - "loss": 2.3746, - "step": 208370 - }, - { - "epoch": 0.36, - "learning_rate": 3.183051580478312e-05, - "loss": 2.5363, - "step": 208380 - }, - { - "epoch": 0.36, - "learning_rate": 3.182964386485629e-05, - "loss": 2.3822, - "step": 208390 - }, - { - "epoch": 0.36, - "learning_rate": 3.182877192492946e-05, - "loss": 2.3467, - "step": 208400 - }, - { - "epoch": 0.36, - "learning_rate": 3.182789998500263e-05, - "loss": 2.3276, - "step": 208410 - }, - { - "epoch": 0.36, - "learning_rate": 3.182702804507581e-05, - "loss": 2.3952, - "step": 208420 - }, - { - "epoch": 0.36, - "learning_rate": 3.182615610514898e-05, - "loss": 2.6023, - "step": 208430 - }, - { - "epoch": 0.36, - "learning_rate": 3.182528416522215e-05, - "loss": 2.4998, - "step": 208440 - }, - { - "epoch": 0.36, - "learning_rate": 3.1824412225295334e-05, - "loss": 2.3387, - "step": 208450 - }, - { - "epoch": 0.36, - "learning_rate": 3.1823540285368504e-05, - "loss": 2.4572, - "step": 208460 - }, - { - "epoch": 0.36, - "learning_rate": 3.1822668345441674e-05, - "loss": 2.5158, - "step": 208470 - }, - { - "epoch": 0.36, - "learning_rate": 3.1821796405514845e-05, - "loss": 2.5044, - "step": 208480 - }, - { - "epoch": 0.36, - "learning_rate": 3.182092446558802e-05, - "loss": 2.369, - "step": 208490 - }, - { - "epoch": 0.36, - "learning_rate": 3.182005252566119e-05, - "loss": 2.3162, - "step": 208500 - }, - { - "epoch": 0.36, - "learning_rate": 3.181918058573436e-05, - "loss": 2.4519, - "step": 208510 - }, - { - "epoch": 0.36, - "learning_rate": 3.181830864580754e-05, - "loss": 2.3627, - "step": 208520 - }, - { - "epoch": 0.36, - "learning_rate": 3.181743670588072e-05, - "loss": 2.4583, - "step": 208530 - }, - { - "epoch": 0.36, - "learning_rate": 3.181656476595389e-05, - "loss": 2.4502, - "step": 208540 - }, - { - "epoch": 0.36, - "learning_rate": 3.181569282602706e-05, - "loss": 2.3167, - "step": 208550 - }, - { - "epoch": 0.36, - "learning_rate": 3.1814820886100235e-05, - "loss": 2.3756, - "step": 208560 - }, - { - "epoch": 0.36, - "learning_rate": 3.1813948946173405e-05, - "loss": 2.3252, - "step": 208570 - }, - { - "epoch": 0.36, - "learning_rate": 3.1813077006246576e-05, - "loss": 2.3703, - "step": 208580 - }, - { - "epoch": 0.36, - "learning_rate": 3.181220506631975e-05, - "loss": 2.405, - "step": 208590 - }, - { - "epoch": 0.36, - "learning_rate": 3.181133312639293e-05, - "loss": 2.4488, - "step": 208600 - }, - { - "epoch": 0.36, - "learning_rate": 3.18104611864661e-05, - "loss": 2.4048, - "step": 208610 - }, - { - "epoch": 0.36, - "learning_rate": 3.180958924653927e-05, - "loss": 2.4943, - "step": 208620 - }, - { - "epoch": 0.36, - "learning_rate": 3.180871730661245e-05, - "loss": 2.3906, - "step": 208630 - }, - { - "epoch": 0.36, - "learning_rate": 3.180784536668562e-05, - "loss": 2.5032, - "step": 208640 - }, - { - "epoch": 0.36, - "learning_rate": 3.180697342675879e-05, - "loss": 2.4431, - "step": 208650 - }, - { - "epoch": 0.36, - "learning_rate": 3.1806101486831966e-05, - "loss": 2.4193, - "step": 208660 - }, - { - "epoch": 0.36, - "learning_rate": 3.1805229546905136e-05, - "loss": 2.3768, - "step": 208670 - }, - { - "epoch": 0.36, - "learning_rate": 3.1804357606978313e-05, - "loss": 2.4155, - "step": 208680 - }, - { - "epoch": 0.36, - "learning_rate": 3.1803485667051484e-05, - "loss": 2.4219, - "step": 208690 - }, - { - "epoch": 0.36, - "learning_rate": 3.180261372712466e-05, - "loss": 2.36, - "step": 208700 - }, - { - "epoch": 0.36, - "learning_rate": 3.180174178719783e-05, - "loss": 2.5088, - "step": 208710 - }, - { - "epoch": 0.36, - "learning_rate": 3.1800869847271e-05, - "loss": 2.3339, - "step": 208720 - }, - { - "epoch": 0.36, - "learning_rate": 3.179999790734418e-05, - "loss": 2.4089, - "step": 208730 - }, - { - "epoch": 0.36, - "learning_rate": 3.179912596741735e-05, - "loss": 2.3727, - "step": 208740 - }, - { - "epoch": 0.36, - "learning_rate": 3.1798254027490526e-05, - "loss": 2.3506, - "step": 208750 - }, - { - "epoch": 0.36, - "learning_rate": 3.17973820875637e-05, - "loss": 2.5363, - "step": 208760 - }, - { - "epoch": 0.36, - "learning_rate": 3.1796510147636874e-05, - "loss": 2.493, - "step": 208770 - }, - { - "epoch": 0.36, - "learning_rate": 3.1795638207710044e-05, - "loss": 2.3839, - "step": 208780 - }, - { - "epoch": 0.36, - "learning_rate": 3.1794766267783215e-05, - "loss": 2.435, - "step": 208790 - }, - { - "epoch": 0.36, - "learning_rate": 3.1793894327856385e-05, - "loss": 2.5456, - "step": 208800 - }, - { - "epoch": 0.36, - "learning_rate": 3.179302238792956e-05, - "loss": 2.4977, - "step": 208810 - }, - { - "epoch": 0.36, - "learning_rate": 3.179215044800273e-05, - "loss": 2.3438, - "step": 208820 - }, - { - "epoch": 0.36, - "learning_rate": 3.179127850807591e-05, - "loss": 2.4502, - "step": 208830 - }, - { - "epoch": 0.36, - "learning_rate": 3.179040656814909e-05, - "loss": 2.4388, - "step": 208840 - }, - { - "epoch": 0.36, - "learning_rate": 3.178953462822226e-05, - "loss": 2.4067, - "step": 208850 - }, - { - "epoch": 0.36, - "learning_rate": 3.178866268829543e-05, - "loss": 2.4531, - "step": 208860 - }, - { - "epoch": 0.36, - "learning_rate": 3.17877907483686e-05, - "loss": 2.4063, - "step": 208870 - }, - { - "epoch": 0.36, - "learning_rate": 3.1786918808441775e-05, - "loss": 2.5662, - "step": 208880 - }, - { - "epoch": 0.36, - "learning_rate": 3.1786046868514946e-05, - "loss": 2.4172, - "step": 208890 - }, - { - "epoch": 0.36, - "learning_rate": 3.178517492858812e-05, - "loss": 2.5452, - "step": 208900 - }, - { - "epoch": 0.36, - "learning_rate": 3.178430298866129e-05, - "loss": 2.4926, - "step": 208910 - }, - { - "epoch": 0.36, - "learning_rate": 3.178343104873447e-05, - "loss": 2.359, - "step": 208920 - }, - { - "epoch": 0.36, - "learning_rate": 3.178255910880764e-05, - "loss": 2.4385, - "step": 208930 - }, - { - "epoch": 0.36, - "learning_rate": 3.178168716888081e-05, - "loss": 2.4903, - "step": 208940 - }, - { - "epoch": 0.36, - "learning_rate": 3.178081522895399e-05, - "loss": 2.4118, - "step": 208950 - }, - { - "epoch": 0.36, - "learning_rate": 3.177994328902716e-05, - "loss": 2.3087, - "step": 208960 - }, - { - "epoch": 0.36, - "learning_rate": 3.1779071349100336e-05, - "loss": 2.4239, - "step": 208970 - }, - { - "epoch": 0.36, - "learning_rate": 3.1778199409173506e-05, - "loss": 2.4106, - "step": 208980 - }, - { - "epoch": 0.36, - "learning_rate": 3.177732746924668e-05, - "loss": 2.3433, - "step": 208990 - }, - { - "epoch": 0.36, - "learning_rate": 3.1776455529319854e-05, - "loss": 2.4176, - "step": 209000 - }, - { - "epoch": 0.36, - "learning_rate": 3.1775583589393024e-05, - "loss": 2.3983, - "step": 209010 - }, - { - "epoch": 0.36, - "learning_rate": 3.17747116494662e-05, - "loss": 2.3356, - "step": 209020 - }, - { - "epoch": 0.36, - "learning_rate": 3.177383970953937e-05, - "loss": 2.3982, - "step": 209030 - }, - { - "epoch": 0.36, - "learning_rate": 3.177296776961254e-05, - "loss": 2.4517, - "step": 209040 - }, - { - "epoch": 0.36, - "learning_rate": 3.177209582968572e-05, - "loss": 2.3662, - "step": 209050 - }, - { - "epoch": 0.36, - "learning_rate": 3.1771223889758896e-05, - "loss": 2.4179, - "step": 209060 - }, - { - "epoch": 0.36, - "learning_rate": 3.177035194983207e-05, - "loss": 2.479, - "step": 209070 - }, - { - "epoch": 0.36, - "learning_rate": 3.176948000990524e-05, - "loss": 2.4826, - "step": 209080 - }, - { - "epoch": 0.36, - "learning_rate": 3.1768608069978414e-05, - "loss": 2.4218, - "step": 209090 - }, - { - "epoch": 0.36, - "learning_rate": 3.1767736130051585e-05, - "loss": 2.3221, - "step": 209100 - }, - { - "epoch": 0.36, - "learning_rate": 3.1766864190124755e-05, - "loss": 2.4119, - "step": 209110 - }, - { - "epoch": 0.36, - "learning_rate": 3.176599225019793e-05, - "loss": 2.3331, - "step": 209120 - }, - { - "epoch": 0.36, - "learning_rate": 3.176512031027111e-05, - "loss": 2.3336, - "step": 209130 - }, - { - "epoch": 0.36, - "learning_rate": 3.176424837034428e-05, - "loss": 2.3611, - "step": 209140 - }, - { - "epoch": 0.36, - "learning_rate": 3.176337643041745e-05, - "loss": 2.4464, - "step": 209150 - }, - { - "epoch": 0.36, - "learning_rate": 3.176250449049063e-05, - "loss": 2.4598, - "step": 209160 - }, - { - "epoch": 0.36, - "learning_rate": 3.17616325505638e-05, - "loss": 2.3108, - "step": 209170 - }, - { - "epoch": 0.36, - "learning_rate": 3.176076061063697e-05, - "loss": 2.3687, - "step": 209180 - }, - { - "epoch": 0.36, - "learning_rate": 3.175988867071014e-05, - "loss": 2.356, - "step": 209190 - }, - { - "epoch": 0.36, - "learning_rate": 3.175901673078332e-05, - "loss": 2.4639, - "step": 209200 - }, - { - "epoch": 0.36, - "learning_rate": 3.175814479085649e-05, - "loss": 2.4506, - "step": 209210 - }, - { - "epoch": 0.36, - "learning_rate": 3.175727285092966e-05, - "loss": 2.4858, - "step": 209220 - }, - { - "epoch": 0.36, - "learning_rate": 3.175640091100284e-05, - "loss": 2.4125, - "step": 209230 - }, - { - "epoch": 0.36, - "learning_rate": 3.175552897107601e-05, - "loss": 2.2683, - "step": 209240 - }, - { - "epoch": 0.36, - "learning_rate": 3.175465703114918e-05, - "loss": 2.2369, - "step": 209250 - }, - { - "epoch": 0.36, - "learning_rate": 3.175378509122235e-05, - "loss": 2.3279, - "step": 209260 - }, - { - "epoch": 0.36, - "learning_rate": 3.1752913151295535e-05, - "loss": 2.3288, - "step": 209270 - }, - { - "epoch": 0.36, - "learning_rate": 3.1752041211368706e-05, - "loss": 2.4517, - "step": 209280 - }, - { - "epoch": 0.36, - "learning_rate": 3.1751169271441876e-05, - "loss": 2.3714, - "step": 209290 - }, - { - "epoch": 0.36, - "learning_rate": 3.1750297331515047e-05, - "loss": 2.5762, - "step": 209300 - }, - { - "epoch": 0.37, - "learning_rate": 3.1749425391588224e-05, - "loss": 2.4919, - "step": 209310 - }, - { - "epoch": 0.37, - "learning_rate": 3.1748553451661394e-05, - "loss": 2.4199, - "step": 209320 - }, - { - "epoch": 0.37, - "learning_rate": 3.1747681511734564e-05, - "loss": 2.4534, - "step": 209330 - }, - { - "epoch": 0.37, - "learning_rate": 3.174680957180774e-05, - "loss": 2.4759, - "step": 209340 - }, - { - "epoch": 0.37, - "learning_rate": 3.174593763188092e-05, - "loss": 2.3253, - "step": 209350 - }, - { - "epoch": 0.37, - "learning_rate": 3.174506569195409e-05, - "loss": 2.4087, - "step": 209360 - }, - { - "epoch": 0.37, - "learning_rate": 3.174419375202726e-05, - "loss": 2.3769, - "step": 209370 - }, - { - "epoch": 0.37, - "learning_rate": 3.174332181210044e-05, - "loss": 2.3713, - "step": 209380 - }, - { - "epoch": 0.37, - "learning_rate": 3.174244987217361e-05, - "loss": 2.3829, - "step": 209390 - }, - { - "epoch": 0.37, - "learning_rate": 3.174157793224678e-05, - "loss": 2.4045, - "step": 209400 - }, - { - "epoch": 0.37, - "learning_rate": 3.1740705992319955e-05, - "loss": 2.3756, - "step": 209410 - }, - { - "epoch": 0.37, - "learning_rate": 3.173983405239313e-05, - "loss": 2.3966, - "step": 209420 - }, - { - "epoch": 0.37, - "learning_rate": 3.17389621124663e-05, - "loss": 2.3064, - "step": 209430 - }, - { - "epoch": 0.37, - "learning_rate": 3.173809017253947e-05, - "loss": 2.4577, - "step": 209440 - }, - { - "epoch": 0.37, - "learning_rate": 3.173721823261265e-05, - "loss": 2.4971, - "step": 209450 - }, - { - "epoch": 0.37, - "learning_rate": 3.173634629268582e-05, - "loss": 2.5004, - "step": 209460 - }, - { - "epoch": 0.37, - "learning_rate": 3.173547435275899e-05, - "loss": 2.4046, - "step": 209470 - }, - { - "epoch": 0.37, - "learning_rate": 3.173460241283217e-05, - "loss": 2.4611, - "step": 209480 - }, - { - "epoch": 0.37, - "learning_rate": 3.173373047290534e-05, - "loss": 2.4755, - "step": 209490 - }, - { - "epoch": 0.37, - "learning_rate": 3.1732858532978515e-05, - "loss": 2.3244, - "step": 209500 - }, - { - "epoch": 0.37, - "learning_rate": 3.1731986593051686e-05, - "loss": 2.5185, - "step": 209510 - }, - { - "epoch": 0.37, - "learning_rate": 3.173111465312486e-05, - "loss": 2.3749, - "step": 209520 - }, - { - "epoch": 0.37, - "learning_rate": 3.173024271319803e-05, - "loss": 2.5028, - "step": 209530 - }, - { - "epoch": 0.37, - "learning_rate": 3.1729370773271203e-05, - "loss": 2.4214, - "step": 209540 - }, - { - "epoch": 0.37, - "learning_rate": 3.172849883334438e-05, - "loss": 2.4758, - "step": 209550 - }, - { - "epoch": 0.37, - "learning_rate": 3.172762689341755e-05, - "loss": 2.3752, - "step": 209560 - }, - { - "epoch": 0.37, - "learning_rate": 3.172675495349073e-05, - "loss": 2.5271, - "step": 209570 - }, - { - "epoch": 0.37, - "learning_rate": 3.17258830135639e-05, - "loss": 2.3663, - "step": 209580 - }, - { - "epoch": 0.37, - "learning_rate": 3.1725011073637076e-05, - "loss": 2.3205, - "step": 209590 - }, - { - "epoch": 0.37, - "learning_rate": 3.1724139133710246e-05, - "loss": 2.3869, - "step": 209600 - }, - { - "epoch": 0.37, - "learning_rate": 3.1723267193783416e-05, - "loss": 2.4078, - "step": 209610 - }, - { - "epoch": 0.37, - "learning_rate": 3.1722395253856594e-05, - "loss": 2.4796, - "step": 209620 - }, - { - "epoch": 0.37, - "learning_rate": 3.1721523313929764e-05, - "loss": 2.412, - "step": 209630 - }, - { - "epoch": 0.37, - "learning_rate": 3.172065137400294e-05, - "loss": 2.331, - "step": 209640 - }, - { - "epoch": 0.37, - "learning_rate": 3.171977943407611e-05, - "loss": 2.492, - "step": 209650 - }, - { - "epoch": 0.37, - "learning_rate": 3.171890749414929e-05, - "loss": 2.3668, - "step": 209660 - }, - { - "epoch": 0.37, - "learning_rate": 3.171803555422246e-05, - "loss": 2.4698, - "step": 209670 - }, - { - "epoch": 0.37, - "learning_rate": 3.171716361429563e-05, - "loss": 2.4714, - "step": 209680 - }, - { - "epoch": 0.37, - "learning_rate": 3.1716291674368807e-05, - "loss": 2.2913, - "step": 209690 - }, - { - "epoch": 0.37, - "learning_rate": 3.171541973444198e-05, - "loss": 2.381, - "step": 209700 - }, - { - "epoch": 0.37, - "learning_rate": 3.171454779451515e-05, - "loss": 2.3433, - "step": 209710 - }, - { - "epoch": 0.37, - "learning_rate": 3.1713675854588325e-05, - "loss": 2.4431, - "step": 209720 - }, - { - "epoch": 0.37, - "learning_rate": 3.17128039146615e-05, - "loss": 2.3564, - "step": 209730 - }, - { - "epoch": 0.37, - "learning_rate": 3.171193197473467e-05, - "loss": 2.4877, - "step": 209740 - }, - { - "epoch": 0.37, - "learning_rate": 3.171106003480784e-05, - "loss": 2.5378, - "step": 209750 - }, - { - "epoch": 0.37, - "learning_rate": 3.171018809488101e-05, - "loss": 2.4146, - "step": 209760 - }, - { - "epoch": 0.37, - "learning_rate": 3.170931615495419e-05, - "loss": 2.4483, - "step": 209770 - }, - { - "epoch": 0.37, - "learning_rate": 3.170844421502736e-05, - "loss": 2.331, - "step": 209780 - }, - { - "epoch": 0.37, - "learning_rate": 3.170757227510054e-05, - "loss": 2.3795, - "step": 209790 - }, - { - "epoch": 0.37, - "learning_rate": 3.1706700335173715e-05, - "loss": 2.4093, - "step": 209800 - }, - { - "epoch": 0.37, - "learning_rate": 3.1705828395246885e-05, - "loss": 2.331, - "step": 209810 - }, - { - "epoch": 0.37, - "learning_rate": 3.1704956455320055e-05, - "loss": 2.3769, - "step": 209820 - }, - { - "epoch": 0.37, - "learning_rate": 3.1704084515393226e-05, - "loss": 2.4692, - "step": 209830 - }, - { - "epoch": 0.37, - "learning_rate": 3.17032125754664e-05, - "loss": 2.4154, - "step": 209840 - }, - { - "epoch": 0.37, - "learning_rate": 3.170234063553957e-05, - "loss": 2.4244, - "step": 209850 - }, - { - "epoch": 0.37, - "learning_rate": 3.1701468695612744e-05, - "loss": 2.431, - "step": 209860 - }, - { - "epoch": 0.37, - "learning_rate": 3.170059675568592e-05, - "loss": 2.5301, - "step": 209870 - }, - { - "epoch": 0.37, - "learning_rate": 3.16997248157591e-05, - "loss": 2.5213, - "step": 209880 - }, - { - "epoch": 0.37, - "learning_rate": 3.169885287583227e-05, - "loss": 2.3757, - "step": 209890 - }, - { - "epoch": 0.37, - "learning_rate": 3.169798093590544e-05, - "loss": 2.2731, - "step": 209900 - }, - { - "epoch": 0.37, - "learning_rate": 3.1697108995978616e-05, - "loss": 2.3664, - "step": 209910 - }, - { - "epoch": 0.37, - "learning_rate": 3.1696237056051786e-05, - "loss": 2.4555, - "step": 209920 - }, - { - "epoch": 0.37, - "learning_rate": 3.169536511612496e-05, - "loss": 2.3027, - "step": 209930 - }, - { - "epoch": 0.37, - "learning_rate": 3.1694493176198134e-05, - "loss": 2.3742, - "step": 209940 - }, - { - "epoch": 0.37, - "learning_rate": 3.169362123627131e-05, - "loss": 2.377, - "step": 209950 - }, - { - "epoch": 0.37, - "learning_rate": 3.169274929634448e-05, - "loss": 2.3923, - "step": 209960 - }, - { - "epoch": 0.37, - "learning_rate": 3.169187735641765e-05, - "loss": 2.3354, - "step": 209970 - }, - { - "epoch": 0.37, - "learning_rate": 3.169100541649083e-05, - "loss": 2.391, - "step": 209980 - }, - { - "epoch": 0.37, - "learning_rate": 3.1690133476564e-05, - "loss": 2.5144, - "step": 209990 - }, - { - "epoch": 0.37, - "learning_rate": 3.168926153663717e-05, - "loss": 2.3314, - "step": 210000 - }, - { - "epoch": 0.37, - "learning_rate": 3.168838959671035e-05, - "loss": 2.4694, - "step": 210010 - }, - { - "epoch": 0.37, - "learning_rate": 3.1687517656783524e-05, - "loss": 2.423, - "step": 210020 - }, - { - "epoch": 0.37, - "learning_rate": 3.1686645716856694e-05, - "loss": 2.5076, - "step": 210030 - }, - { - "epoch": 0.37, - "learning_rate": 3.1685773776929865e-05, - "loss": 2.4191, - "step": 210040 - }, - { - "epoch": 0.37, - "learning_rate": 3.168490183700304e-05, - "loss": 2.3309, - "step": 210050 - }, - { - "epoch": 0.37, - "learning_rate": 3.168402989707621e-05, - "loss": 2.5923, - "step": 210060 - }, - { - "epoch": 0.37, - "learning_rate": 3.168315795714938e-05, - "loss": 2.3605, - "step": 210070 - }, - { - "epoch": 0.37, - "learning_rate": 3.168228601722256e-05, - "loss": 2.3292, - "step": 210080 - }, - { - "epoch": 0.37, - "learning_rate": 3.168141407729574e-05, - "loss": 2.4949, - "step": 210090 - }, - { - "epoch": 0.37, - "learning_rate": 3.168054213736891e-05, - "loss": 2.4377, - "step": 210100 - }, - { - "epoch": 0.37, - "learning_rate": 3.167967019744208e-05, - "loss": 2.4585, - "step": 210110 - }, - { - "epoch": 0.37, - "learning_rate": 3.1678798257515255e-05, - "loss": 2.3974, - "step": 210120 - }, - { - "epoch": 0.37, - "learning_rate": 3.1677926317588425e-05, - "loss": 2.4007, - "step": 210130 - }, - { - "epoch": 0.37, - "learning_rate": 3.1677054377661596e-05, - "loss": 2.3877, - "step": 210140 - }, - { - "epoch": 0.37, - "learning_rate": 3.1676182437734766e-05, - "loss": 2.4468, - "step": 210150 - }, - { - "epoch": 0.37, - "learning_rate": 3.167531049780794e-05, - "loss": 2.4419, - "step": 210160 - }, - { - "epoch": 0.37, - "learning_rate": 3.167443855788112e-05, - "loss": 2.5096, - "step": 210170 - }, - { - "epoch": 0.37, - "learning_rate": 3.167356661795429e-05, - "loss": 2.4113, - "step": 210180 - }, - { - "epoch": 0.37, - "learning_rate": 3.167269467802747e-05, - "loss": 2.3679, - "step": 210190 - }, - { - "epoch": 0.37, - "learning_rate": 3.167182273810064e-05, - "loss": 2.2662, - "step": 210200 - }, - { - "epoch": 0.37, - "learning_rate": 3.167095079817381e-05, - "loss": 2.3866, - "step": 210210 - }, - { - "epoch": 0.37, - "learning_rate": 3.167007885824698e-05, - "loss": 2.415, - "step": 210220 - }, - { - "epoch": 0.37, - "learning_rate": 3.1669206918320156e-05, - "loss": 2.522, - "step": 210230 - }, - { - "epoch": 0.37, - "learning_rate": 3.1668334978393333e-05, - "loss": 2.4889, - "step": 210240 - }, - { - "epoch": 0.37, - "learning_rate": 3.1667463038466504e-05, - "loss": 2.4518, - "step": 210250 - }, - { - "epoch": 0.37, - "learning_rate": 3.1666591098539674e-05, - "loss": 2.5101, - "step": 210260 - }, - { - "epoch": 0.37, - "learning_rate": 3.166571915861285e-05, - "loss": 2.3304, - "step": 210270 - }, - { - "epoch": 0.37, - "learning_rate": 3.166484721868602e-05, - "loss": 2.4084, - "step": 210280 - }, - { - "epoch": 0.37, - "learning_rate": 3.166397527875919e-05, - "loss": 2.4133, - "step": 210290 - }, - { - "epoch": 0.37, - "learning_rate": 3.166310333883237e-05, - "loss": 2.3198, - "step": 210300 - }, - { - "epoch": 0.37, - "learning_rate": 3.1662231398905546e-05, - "loss": 2.3881, - "step": 210310 - }, - { - "epoch": 0.37, - "learning_rate": 3.166135945897872e-05, - "loss": 2.4682, - "step": 210320 - }, - { - "epoch": 0.37, - "learning_rate": 3.166048751905189e-05, - "loss": 2.3575, - "step": 210330 - }, - { - "epoch": 0.37, - "learning_rate": 3.1659615579125064e-05, - "loss": 2.2665, - "step": 210340 - }, - { - "epoch": 0.37, - "learning_rate": 3.1658743639198235e-05, - "loss": 2.3873, - "step": 210350 - }, - { - "epoch": 0.37, - "learning_rate": 3.1657871699271405e-05, - "loss": 2.3866, - "step": 210360 - }, - { - "epoch": 0.37, - "learning_rate": 3.165699975934458e-05, - "loss": 2.49, - "step": 210370 - }, - { - "epoch": 0.37, - "learning_rate": 3.165612781941775e-05, - "loss": 2.389, - "step": 210380 - }, - { - "epoch": 0.37, - "learning_rate": 3.165525587949093e-05, - "loss": 2.5185, - "step": 210390 - }, - { - "epoch": 0.37, - "learning_rate": 3.16543839395641e-05, - "loss": 2.4239, - "step": 210400 - }, - { - "epoch": 0.37, - "learning_rate": 3.165351199963728e-05, - "loss": 2.3982, - "step": 210410 - }, - { - "epoch": 0.37, - "learning_rate": 3.165264005971045e-05, - "loss": 2.4586, - "step": 210420 - }, - { - "epoch": 0.37, - "learning_rate": 3.165176811978362e-05, - "loss": 2.5157, - "step": 210430 - }, - { - "epoch": 0.37, - "learning_rate": 3.1650896179856795e-05, - "loss": 2.4134, - "step": 210440 - }, - { - "epoch": 0.37, - "learning_rate": 3.1650024239929966e-05, - "loss": 2.475, - "step": 210450 - }, - { - "epoch": 0.37, - "learning_rate": 3.164915230000314e-05, - "loss": 2.4684, - "step": 210460 - }, - { - "epoch": 0.37, - "learning_rate": 3.164828036007631e-05, - "loss": 2.5609, - "step": 210470 - }, - { - "epoch": 0.37, - "learning_rate": 3.164740842014949e-05, - "loss": 2.3646, - "step": 210480 - }, - { - "epoch": 0.37, - "learning_rate": 3.164653648022266e-05, - "loss": 2.513, - "step": 210490 - }, - { - "epoch": 0.37, - "learning_rate": 3.164566454029583e-05, - "loss": 2.4102, - "step": 210500 - }, - { - "epoch": 0.37, - "learning_rate": 3.164479260036901e-05, - "loss": 2.4664, - "step": 210510 - }, - { - "epoch": 0.37, - "learning_rate": 3.164392066044218e-05, - "loss": 2.4097, - "step": 210520 - }, - { - "epoch": 0.37, - "learning_rate": 3.164304872051535e-05, - "loss": 2.3823, - "step": 210530 - }, - { - "epoch": 0.37, - "learning_rate": 3.1642176780588526e-05, - "loss": 2.3175, - "step": 210540 - }, - { - "epoch": 0.37, - "learning_rate": 3.16413048406617e-05, - "loss": 2.4211, - "step": 210550 - }, - { - "epoch": 0.37, - "learning_rate": 3.1640432900734874e-05, - "loss": 2.3822, - "step": 210560 - }, - { - "epoch": 0.37, - "learning_rate": 3.1639560960808044e-05, - "loss": 2.3114, - "step": 210570 - }, - { - "epoch": 0.37, - "learning_rate": 3.163868902088122e-05, - "loss": 2.4123, - "step": 210580 - }, - { - "epoch": 0.37, - "learning_rate": 3.163781708095439e-05, - "loss": 2.4888, - "step": 210590 - }, - { - "epoch": 0.37, - "learning_rate": 3.163694514102756e-05, - "loss": 2.4468, - "step": 210600 - }, - { - "epoch": 0.37, - "learning_rate": 3.163607320110074e-05, - "loss": 2.42, - "step": 210610 - }, - { - "epoch": 0.37, - "learning_rate": 3.1635201261173916e-05, - "loss": 2.4802, - "step": 210620 - }, - { - "epoch": 0.37, - "learning_rate": 3.163432932124709e-05, - "loss": 2.4069, - "step": 210630 - }, - { - "epoch": 0.37, - "learning_rate": 3.163345738132026e-05, - "loss": 2.4512, - "step": 210640 - }, - { - "epoch": 0.37, - "learning_rate": 3.163258544139343e-05, - "loss": 2.4557, - "step": 210650 - }, - { - "epoch": 0.37, - "learning_rate": 3.1631713501466605e-05, - "loss": 2.248, - "step": 210660 - }, - { - "epoch": 0.37, - "learning_rate": 3.1630841561539775e-05, - "loss": 2.4948, - "step": 210670 - }, - { - "epoch": 0.37, - "learning_rate": 3.1629969621612945e-05, - "loss": 2.283, - "step": 210680 - }, - { - "epoch": 0.37, - "learning_rate": 3.162909768168613e-05, - "loss": 2.4146, - "step": 210690 - }, - { - "epoch": 0.37, - "learning_rate": 3.16282257417593e-05, - "loss": 2.5003, - "step": 210700 - }, - { - "epoch": 0.37, - "learning_rate": 3.162735380183247e-05, - "loss": 2.3931, - "step": 210710 - }, - { - "epoch": 0.37, - "learning_rate": 3.162648186190564e-05, - "loss": 2.352, - "step": 210720 - }, - { - "epoch": 0.37, - "learning_rate": 3.162560992197882e-05, - "loss": 2.3794, - "step": 210730 - }, - { - "epoch": 0.37, - "learning_rate": 3.162473798205199e-05, - "loss": 2.3687, - "step": 210740 - }, - { - "epoch": 0.37, - "learning_rate": 3.162386604212516e-05, - "loss": 2.4427, - "step": 210750 - }, - { - "epoch": 0.37, - "learning_rate": 3.1622994102198336e-05, - "loss": 2.4689, - "step": 210760 - }, - { - "epoch": 0.37, - "learning_rate": 3.162212216227151e-05, - "loss": 2.3997, - "step": 210770 - }, - { - "epoch": 0.37, - "learning_rate": 3.162125022234468e-05, - "loss": 2.408, - "step": 210780 - }, - { - "epoch": 0.37, - "learning_rate": 3.1620378282417854e-05, - "loss": 2.4727, - "step": 210790 - }, - { - "epoch": 0.37, - "learning_rate": 3.161950634249103e-05, - "loss": 2.3476, - "step": 210800 - }, - { - "epoch": 0.37, - "learning_rate": 3.16186344025642e-05, - "loss": 2.5546, - "step": 210810 - }, - { - "epoch": 0.37, - "learning_rate": 3.161776246263737e-05, - "loss": 2.4558, - "step": 210820 - }, - { - "epoch": 0.37, - "learning_rate": 3.161689052271055e-05, - "loss": 2.2174, - "step": 210830 - }, - { - "epoch": 0.37, - "learning_rate": 3.1616018582783726e-05, - "loss": 2.4562, - "step": 210840 - }, - { - "epoch": 0.37, - "learning_rate": 3.1615146642856896e-05, - "loss": 2.3438, - "step": 210850 - }, - { - "epoch": 0.37, - "learning_rate": 3.1614274702930067e-05, - "loss": 2.4528, - "step": 210860 - }, - { - "epoch": 0.37, - "learning_rate": 3.1613402763003244e-05, - "loss": 2.3562, - "step": 210870 - }, - { - "epoch": 0.37, - "learning_rate": 3.1612530823076414e-05, - "loss": 2.3051, - "step": 210880 - }, - { - "epoch": 0.37, - "learning_rate": 3.1611658883149584e-05, - "loss": 2.3295, - "step": 210890 - }, - { - "epoch": 0.37, - "learning_rate": 3.161078694322276e-05, - "loss": 2.4211, - "step": 210900 - }, - { - "epoch": 0.37, - "learning_rate": 3.160991500329594e-05, - "loss": 2.4998, - "step": 210910 - }, - { - "epoch": 0.37, - "learning_rate": 3.160904306336911e-05, - "loss": 2.3776, - "step": 210920 - }, - { - "epoch": 0.37, - "learning_rate": 3.160817112344228e-05, - "loss": 2.3729, - "step": 210930 - }, - { - "epoch": 0.37, - "learning_rate": 3.160729918351546e-05, - "loss": 2.3473, - "step": 210940 - }, - { - "epoch": 0.37, - "learning_rate": 3.160642724358863e-05, - "loss": 2.4563, - "step": 210950 - }, - { - "epoch": 0.37, - "learning_rate": 3.16055553036618e-05, - "loss": 2.4091, - "step": 210960 - }, - { - "epoch": 0.37, - "learning_rate": 3.1604683363734975e-05, - "loss": 2.4401, - "step": 210970 - }, - { - "epoch": 0.37, - "learning_rate": 3.160381142380815e-05, - "loss": 2.3963, - "step": 210980 - }, - { - "epoch": 0.37, - "learning_rate": 3.160293948388132e-05, - "loss": 2.4289, - "step": 210990 - }, - { - "epoch": 0.37, - "learning_rate": 3.160206754395449e-05, - "loss": 2.4774, - "step": 211000 - }, - { - "epoch": 0.37, - "learning_rate": 3.160119560402767e-05, - "loss": 2.3187, - "step": 211010 - }, - { - "epoch": 0.37, - "learning_rate": 3.160032366410084e-05, - "loss": 2.453, - "step": 211020 - }, - { - "epoch": 0.37, - "learning_rate": 3.159945172417401e-05, - "loss": 2.3286, - "step": 211030 - }, - { - "epoch": 0.37, - "learning_rate": 3.159857978424719e-05, - "loss": 2.4094, - "step": 211040 - }, - { - "epoch": 0.37, - "learning_rate": 3.159770784432036e-05, - "loss": 2.3485, - "step": 211050 - }, - { - "epoch": 0.37, - "learning_rate": 3.1596835904393535e-05, - "loss": 2.3804, - "step": 211060 - }, - { - "epoch": 0.37, - "learning_rate": 3.1595963964466706e-05, - "loss": 2.5039, - "step": 211070 - }, - { - "epoch": 0.37, - "learning_rate": 3.159509202453988e-05, - "loss": 2.4522, - "step": 211080 - }, - { - "epoch": 0.37, - "learning_rate": 3.159422008461305e-05, - "loss": 2.4529, - "step": 211090 - }, - { - "epoch": 0.37, - "learning_rate": 3.1593348144686223e-05, - "loss": 2.5001, - "step": 211100 - }, - { - "epoch": 0.37, - "learning_rate": 3.1592476204759394e-05, - "loss": 2.3556, - "step": 211110 - }, - { - "epoch": 0.37, - "learning_rate": 3.159160426483257e-05, - "loss": 2.4933, - "step": 211120 - }, - { - "epoch": 0.37, - "learning_rate": 3.159073232490575e-05, - "loss": 2.3778, - "step": 211130 - }, - { - "epoch": 0.37, - "learning_rate": 3.158986038497892e-05, - "loss": 2.5327, - "step": 211140 - }, - { - "epoch": 0.37, - "learning_rate": 3.1588988445052096e-05, - "loss": 2.3995, - "step": 211150 - }, - { - "epoch": 0.37, - "learning_rate": 3.1588116505125266e-05, - "loss": 2.4711, - "step": 211160 - }, - { - "epoch": 0.37, - "learning_rate": 3.1587244565198436e-05, - "loss": 2.4397, - "step": 211170 - }, - { - "epoch": 0.37, - "learning_rate": 3.158637262527161e-05, - "loss": 2.4429, - "step": 211180 - }, - { - "epoch": 0.37, - "learning_rate": 3.1585500685344784e-05, - "loss": 2.3577, - "step": 211190 - }, - { - "epoch": 0.37, - "learning_rate": 3.1584628745417954e-05, - "loss": 2.4634, - "step": 211200 - }, - { - "epoch": 0.37, - "learning_rate": 3.158375680549113e-05, - "loss": 2.4046, - "step": 211210 - }, - { - "epoch": 0.37, - "learning_rate": 3.15828848655643e-05, - "loss": 2.3966, - "step": 211220 - }, - { - "epoch": 0.37, - "learning_rate": 3.158201292563748e-05, - "loss": 2.4445, - "step": 211230 - }, - { - "epoch": 0.37, - "learning_rate": 3.158114098571065e-05, - "loss": 2.3401, - "step": 211240 - }, - { - "epoch": 0.37, - "learning_rate": 3.158026904578382e-05, - "loss": 2.4866, - "step": 211250 - }, - { - "epoch": 0.37, - "learning_rate": 3.1579397105857e-05, - "loss": 2.415, - "step": 211260 - }, - { - "epoch": 0.37, - "learning_rate": 3.157852516593017e-05, - "loss": 2.2678, - "step": 211270 - }, - { - "epoch": 0.37, - "learning_rate": 3.1577653226003345e-05, - "loss": 2.4289, - "step": 211280 - }, - { - "epoch": 0.37, - "learning_rate": 3.1576781286076515e-05, - "loss": 2.3775, - "step": 211290 - }, - { - "epoch": 0.37, - "learning_rate": 3.157590934614969e-05, - "loss": 2.3748, - "step": 211300 - }, - { - "epoch": 0.37, - "learning_rate": 3.157503740622286e-05, - "loss": 2.3847, - "step": 211310 - }, - { - "epoch": 0.37, - "learning_rate": 3.157416546629603e-05, - "loss": 2.3587, - "step": 211320 - }, - { - "epoch": 0.37, - "learning_rate": 3.157329352636921e-05, - "loss": 2.4281, - "step": 211330 - }, - { - "epoch": 0.37, - "learning_rate": 3.157242158644238e-05, - "loss": 2.4313, - "step": 211340 - }, - { - "epoch": 0.37, - "learning_rate": 3.157154964651555e-05, - "loss": 2.4482, - "step": 211350 - }, - { - "epoch": 0.37, - "learning_rate": 3.157067770658873e-05, - "loss": 2.2841, - "step": 211360 - }, - { - "epoch": 0.37, - "learning_rate": 3.1569805766661905e-05, - "loss": 2.578, - "step": 211370 - }, - { - "epoch": 0.37, - "learning_rate": 3.1568933826735075e-05, - "loss": 2.3901, - "step": 211380 - }, - { - "epoch": 0.37, - "learning_rate": 3.1568061886808246e-05, - "loss": 2.4288, - "step": 211390 - }, - { - "epoch": 0.37, - "learning_rate": 3.156718994688142e-05, - "loss": 2.2802, - "step": 211400 - }, - { - "epoch": 0.37, - "learning_rate": 3.156631800695459e-05, - "loss": 2.4544, - "step": 211410 - }, - { - "epoch": 0.37, - "learning_rate": 3.1565446067027764e-05, - "loss": 2.312, - "step": 211420 - }, - { - "epoch": 0.37, - "learning_rate": 3.156457412710094e-05, - "loss": 2.395, - "step": 211430 - }, - { - "epoch": 0.37, - "learning_rate": 3.156370218717412e-05, - "loss": 2.479, - "step": 211440 - }, - { - "epoch": 0.37, - "learning_rate": 3.156283024724729e-05, - "loss": 2.5405, - "step": 211450 - }, - { - "epoch": 0.37, - "learning_rate": 3.156195830732046e-05, - "loss": 2.3803, - "step": 211460 - }, - { - "epoch": 0.37, - "learning_rate": 3.1561086367393636e-05, - "loss": 2.4159, - "step": 211470 - }, - { - "epoch": 0.37, - "learning_rate": 3.1560214427466806e-05, - "loss": 2.4502, - "step": 211480 - }, - { - "epoch": 0.37, - "learning_rate": 3.155934248753998e-05, - "loss": 2.4452, - "step": 211490 - }, - { - "epoch": 0.37, - "learning_rate": 3.1558470547613154e-05, - "loss": 2.349, - "step": 211500 - }, - { - "epoch": 0.37, - "learning_rate": 3.155759860768633e-05, - "loss": 2.4145, - "step": 211510 - }, - { - "epoch": 0.37, - "learning_rate": 3.15567266677595e-05, - "loss": 2.2856, - "step": 211520 - }, - { - "epoch": 0.37, - "learning_rate": 3.155585472783267e-05, - "loss": 2.3872, - "step": 211530 - }, - { - "epoch": 0.37, - "learning_rate": 3.155498278790585e-05, - "loss": 2.409, - "step": 211540 - }, - { - "epoch": 0.37, - "learning_rate": 3.155411084797902e-05, - "loss": 2.4892, - "step": 211550 - }, - { - "epoch": 0.37, - "learning_rate": 3.155323890805219e-05, - "loss": 2.3375, - "step": 211560 - }, - { - "epoch": 0.37, - "learning_rate": 3.155236696812536e-05, - "loss": 2.3064, - "step": 211570 - }, - { - "epoch": 0.37, - "learning_rate": 3.1551495028198544e-05, - "loss": 2.3752, - "step": 211580 - }, - { - "epoch": 0.37, - "learning_rate": 3.1550623088271714e-05, - "loss": 2.444, - "step": 211590 - }, - { - "epoch": 0.37, - "learning_rate": 3.1549751148344885e-05, - "loss": 2.3603, - "step": 211600 - }, - { - "epoch": 0.37, - "learning_rate": 3.1548879208418055e-05, - "loss": 2.368, - "step": 211610 - }, - { - "epoch": 0.37, - "learning_rate": 3.154800726849123e-05, - "loss": 2.4911, - "step": 211620 - }, - { - "epoch": 0.37, - "learning_rate": 3.15471353285644e-05, - "loss": 2.4093, - "step": 211630 - }, - { - "epoch": 0.37, - "learning_rate": 3.154626338863757e-05, - "loss": 2.4095, - "step": 211640 - }, - { - "epoch": 0.37, - "learning_rate": 3.154539144871076e-05, - "loss": 2.2348, - "step": 211650 - }, - { - "epoch": 0.37, - "learning_rate": 3.154451950878393e-05, - "loss": 2.422, - "step": 211660 - }, - { - "epoch": 0.37, - "learning_rate": 3.15436475688571e-05, - "loss": 2.4846, - "step": 211670 - }, - { - "epoch": 0.37, - "learning_rate": 3.154277562893027e-05, - "loss": 2.4548, - "step": 211680 - }, - { - "epoch": 0.37, - "learning_rate": 3.1541903689003445e-05, - "loss": 2.4273, - "step": 211690 - }, - { - "epoch": 0.37, - "learning_rate": 3.1541031749076616e-05, - "loss": 2.5392, - "step": 211700 - }, - { - "epoch": 0.37, - "learning_rate": 3.1540159809149786e-05, - "loss": 2.3986, - "step": 211710 - }, - { - "epoch": 0.37, - "learning_rate": 3.153928786922296e-05, - "loss": 2.5153, - "step": 211720 - }, - { - "epoch": 0.37, - "learning_rate": 3.153841592929614e-05, - "loss": 2.3819, - "step": 211730 - }, - { - "epoch": 0.37, - "learning_rate": 3.153754398936931e-05, - "loss": 2.4925, - "step": 211740 - }, - { - "epoch": 0.37, - "learning_rate": 3.153667204944248e-05, - "loss": 2.5186, - "step": 211750 - }, - { - "epoch": 0.37, - "learning_rate": 3.153580010951566e-05, - "loss": 2.3608, - "step": 211760 - }, - { - "epoch": 0.37, - "learning_rate": 3.153492816958883e-05, - "loss": 2.3266, - "step": 211770 - }, - { - "epoch": 0.37, - "learning_rate": 3.1534056229662e-05, - "loss": 2.3794, - "step": 211780 - }, - { - "epoch": 0.37, - "learning_rate": 3.1533184289735176e-05, - "loss": 2.4694, - "step": 211790 - }, - { - "epoch": 0.37, - "learning_rate": 3.1532312349808353e-05, - "loss": 2.3865, - "step": 211800 - }, - { - "epoch": 0.37, - "learning_rate": 3.1531440409881524e-05, - "loss": 2.349, - "step": 211810 - }, - { - "epoch": 0.37, - "learning_rate": 3.1530568469954694e-05, - "loss": 2.4814, - "step": 211820 - }, - { - "epoch": 0.37, - "learning_rate": 3.152969653002787e-05, - "loss": 2.3826, - "step": 211830 - }, - { - "epoch": 0.37, - "learning_rate": 3.152882459010104e-05, - "loss": 2.3809, - "step": 211840 - }, - { - "epoch": 0.37, - "learning_rate": 3.152795265017421e-05, - "loss": 2.3144, - "step": 211850 - }, - { - "epoch": 0.37, - "learning_rate": 3.152708071024739e-05, - "loss": 2.3981, - "step": 211860 - }, - { - "epoch": 0.37, - "learning_rate": 3.152620877032056e-05, - "loss": 2.4496, - "step": 211870 - }, - { - "epoch": 0.37, - "learning_rate": 3.152533683039374e-05, - "loss": 2.4168, - "step": 211880 - }, - { - "epoch": 0.37, - "learning_rate": 3.152446489046691e-05, - "loss": 2.3311, - "step": 211890 - }, - { - "epoch": 0.37, - "learning_rate": 3.1523592950540084e-05, - "loss": 2.302, - "step": 211900 - }, - { - "epoch": 0.37, - "learning_rate": 3.1522721010613255e-05, - "loss": 2.3416, - "step": 211910 - }, - { - "epoch": 0.37, - "learning_rate": 3.1521849070686425e-05, - "loss": 2.3936, - "step": 211920 - }, - { - "epoch": 0.37, - "learning_rate": 3.15209771307596e-05, - "loss": 2.4449, - "step": 211930 - }, - { - "epoch": 0.37, - "learning_rate": 3.152010519083277e-05, - "loss": 2.4575, - "step": 211940 - }, - { - "epoch": 0.37, - "learning_rate": 3.151923325090595e-05, - "loss": 2.3706, - "step": 211950 - }, - { - "epoch": 0.37, - "learning_rate": 3.151836131097912e-05, - "loss": 2.4281, - "step": 211960 - }, - { - "epoch": 0.37, - "learning_rate": 3.15174893710523e-05, - "loss": 2.3249, - "step": 211970 - }, - { - "epoch": 0.37, - "learning_rate": 3.151661743112547e-05, - "loss": 2.2819, - "step": 211980 - }, - { - "epoch": 0.37, - "learning_rate": 3.151574549119864e-05, - "loss": 2.5215, - "step": 211990 - }, - { - "epoch": 0.37, - "learning_rate": 3.151487355127181e-05, - "loss": 2.4359, - "step": 212000 - }, - { - "epoch": 0.37, - "learning_rate": 3.1514001611344986e-05, - "loss": 2.527, - "step": 212010 - }, - { - "epoch": 0.37, - "learning_rate": 3.1513129671418156e-05, - "loss": 2.3518, - "step": 212020 - }, - { - "epoch": 0.37, - "learning_rate": 3.151225773149133e-05, - "loss": 2.321, - "step": 212030 - }, - { - "epoch": 0.37, - "learning_rate": 3.151138579156451e-05, - "loss": 2.3774, - "step": 212040 - }, - { - "epoch": 0.37, - "learning_rate": 3.151051385163768e-05, - "loss": 2.5002, - "step": 212050 - }, - { - "epoch": 0.37, - "learning_rate": 3.150964191171085e-05, - "loss": 2.2998, - "step": 212060 - }, - { - "epoch": 0.37, - "learning_rate": 3.150876997178402e-05, - "loss": 2.3234, - "step": 212070 - }, - { - "epoch": 0.37, - "learning_rate": 3.15078980318572e-05, - "loss": 2.4301, - "step": 212080 - }, - { - "epoch": 0.37, - "learning_rate": 3.150702609193037e-05, - "loss": 2.3836, - "step": 212090 - }, - { - "epoch": 0.37, - "learning_rate": 3.1506154152003546e-05, - "loss": 2.2711, - "step": 212100 - }, - { - "epoch": 0.37, - "learning_rate": 3.1505282212076717e-05, - "loss": 2.3964, - "step": 212110 - }, - { - "epoch": 0.37, - "learning_rate": 3.1504410272149894e-05, - "loss": 2.5385, - "step": 212120 - }, - { - "epoch": 0.37, - "learning_rate": 3.1503538332223064e-05, - "loss": 2.4481, - "step": 212130 - }, - { - "epoch": 0.37, - "learning_rate": 3.1502666392296235e-05, - "loss": 2.4381, - "step": 212140 - }, - { - "epoch": 0.37, - "learning_rate": 3.150179445236941e-05, - "loss": 2.3555, - "step": 212150 - }, - { - "epoch": 0.37, - "learning_rate": 3.150092251244258e-05, - "loss": 2.4613, - "step": 212160 - }, - { - "epoch": 0.37, - "learning_rate": 3.150005057251576e-05, - "loss": 2.3274, - "step": 212170 - }, - { - "epoch": 0.37, - "learning_rate": 3.149917863258893e-05, - "loss": 2.5112, - "step": 212180 - }, - { - "epoch": 0.37, - "learning_rate": 3.149830669266211e-05, - "loss": 2.4744, - "step": 212190 - }, - { - "epoch": 0.37, - "learning_rate": 3.149743475273528e-05, - "loss": 2.4683, - "step": 212200 - }, - { - "epoch": 0.37, - "learning_rate": 3.149656281280845e-05, - "loss": 2.3427, - "step": 212210 - }, - { - "epoch": 0.37, - "learning_rate": 3.1495690872881625e-05, - "loss": 2.2921, - "step": 212220 - }, - { - "epoch": 0.37, - "learning_rate": 3.1494818932954795e-05, - "loss": 2.3814, - "step": 212230 - }, - { - "epoch": 0.37, - "learning_rate": 3.1493946993027965e-05, - "loss": 2.3593, - "step": 212240 - }, - { - "epoch": 0.37, - "learning_rate": 3.149307505310114e-05, - "loss": 2.3163, - "step": 212250 - }, - { - "epoch": 0.37, - "learning_rate": 3.149220311317432e-05, - "loss": 2.4756, - "step": 212260 - }, - { - "epoch": 0.37, - "learning_rate": 3.149133117324749e-05, - "loss": 2.4133, - "step": 212270 - }, - { - "epoch": 0.37, - "learning_rate": 3.149045923332066e-05, - "loss": 2.4069, - "step": 212280 - }, - { - "epoch": 0.37, - "learning_rate": 3.148958729339384e-05, - "loss": 2.4374, - "step": 212290 - }, - { - "epoch": 0.37, - "learning_rate": 3.148871535346701e-05, - "loss": 2.4058, - "step": 212300 - }, - { - "epoch": 0.37, - "learning_rate": 3.148784341354018e-05, - "loss": 2.4451, - "step": 212310 - }, - { - "epoch": 0.37, - "learning_rate": 3.1486971473613356e-05, - "loss": 2.4724, - "step": 212320 - }, - { - "epoch": 0.37, - "learning_rate": 3.148609953368653e-05, - "loss": 2.4148, - "step": 212330 - }, - { - "epoch": 0.37, - "learning_rate": 3.14852275937597e-05, - "loss": 2.3622, - "step": 212340 - }, - { - "epoch": 0.37, - "learning_rate": 3.1484355653832874e-05, - "loss": 2.2931, - "step": 212350 - }, - { - "epoch": 0.37, - "learning_rate": 3.148348371390605e-05, - "loss": 2.505, - "step": 212360 - }, - { - "epoch": 0.37, - "learning_rate": 3.148261177397922e-05, - "loss": 2.4683, - "step": 212370 - }, - { - "epoch": 0.37, - "learning_rate": 3.148173983405239e-05, - "loss": 2.3398, - "step": 212380 - }, - { - "epoch": 0.37, - "learning_rate": 3.148086789412557e-05, - "loss": 2.4735, - "step": 212390 - }, - { - "epoch": 0.37, - "learning_rate": 3.1479995954198746e-05, - "loss": 2.4378, - "step": 212400 - }, - { - "epoch": 0.37, - "learning_rate": 3.1479124014271916e-05, - "loss": 2.402, - "step": 212410 - }, - { - "epoch": 0.37, - "learning_rate": 3.1478252074345087e-05, - "loss": 2.4017, - "step": 212420 - }, - { - "epoch": 0.37, - "learning_rate": 3.1477380134418264e-05, - "loss": 2.4058, - "step": 212430 - }, - { - "epoch": 0.37, - "learning_rate": 3.1476508194491434e-05, - "loss": 2.3798, - "step": 212440 - }, - { - "epoch": 0.37, - "learning_rate": 3.1475636254564604e-05, - "loss": 2.4111, - "step": 212450 - }, - { - "epoch": 0.37, - "learning_rate": 3.1474764314637775e-05, - "loss": 2.2709, - "step": 212460 - }, - { - "epoch": 0.37, - "learning_rate": 3.147389237471096e-05, - "loss": 2.3721, - "step": 212470 - }, - { - "epoch": 0.37, - "learning_rate": 3.147302043478413e-05, - "loss": 2.3424, - "step": 212480 - }, - { - "epoch": 0.37, - "learning_rate": 3.14721484948573e-05, - "loss": 2.4382, - "step": 212490 - }, - { - "epoch": 0.37, - "learning_rate": 3.147127655493048e-05, - "loss": 2.3654, - "step": 212500 - }, - { - "epoch": 0.37, - "learning_rate": 3.147040461500365e-05, - "loss": 2.3275, - "step": 212510 - }, - { - "epoch": 0.37, - "learning_rate": 3.146953267507682e-05, - "loss": 2.3819, - "step": 212520 - }, - { - "epoch": 0.37, - "learning_rate": 3.146866073514999e-05, - "loss": 2.2925, - "step": 212530 - }, - { - "epoch": 0.37, - "learning_rate": 3.1467788795223165e-05, - "loss": 2.4558, - "step": 212540 - }, - { - "epoch": 0.37, - "learning_rate": 3.146691685529634e-05, - "loss": 2.4475, - "step": 212550 - }, - { - "epoch": 0.37, - "learning_rate": 3.146604491536951e-05, - "loss": 2.4064, - "step": 212560 - }, - { - "epoch": 0.37, - "learning_rate": 3.146517297544268e-05, - "loss": 2.4832, - "step": 212570 - }, - { - "epoch": 0.37, - "learning_rate": 3.146430103551586e-05, - "loss": 2.443, - "step": 212580 - }, - { - "epoch": 0.37, - "learning_rate": 3.146342909558903e-05, - "loss": 2.3341, - "step": 212590 - }, - { - "epoch": 0.37, - "learning_rate": 3.14625571556622e-05, - "loss": 2.4504, - "step": 212600 - }, - { - "epoch": 0.37, - "learning_rate": 3.146168521573538e-05, - "loss": 2.4142, - "step": 212610 - }, - { - "epoch": 0.37, - "learning_rate": 3.1460813275808555e-05, - "loss": 2.27, - "step": 212620 - }, - { - "epoch": 0.37, - "learning_rate": 3.1459941335881726e-05, - "loss": 2.3274, - "step": 212630 - }, - { - "epoch": 0.37, - "learning_rate": 3.1459069395954896e-05, - "loss": 2.4544, - "step": 212640 - }, - { - "epoch": 0.37, - "learning_rate": 3.145819745602807e-05, - "loss": 2.4255, - "step": 212650 - }, - { - "epoch": 0.37, - "learning_rate": 3.1457325516101243e-05, - "loss": 2.5695, - "step": 212660 - }, - { - "epoch": 0.37, - "learning_rate": 3.1456453576174414e-05, - "loss": 2.4812, - "step": 212670 - }, - { - "epoch": 0.37, - "learning_rate": 3.145558163624759e-05, - "loss": 2.3774, - "step": 212680 - }, - { - "epoch": 0.37, - "learning_rate": 3.145470969632076e-05, - "loss": 2.3345, - "step": 212690 - }, - { - "epoch": 0.37, - "learning_rate": 3.145383775639394e-05, - "loss": 2.4578, - "step": 212700 - }, - { - "epoch": 0.37, - "learning_rate": 3.145296581646711e-05, - "loss": 2.3458, - "step": 212710 - }, - { - "epoch": 0.37, - "learning_rate": 3.1452093876540286e-05, - "loss": 2.3343, - "step": 212720 - }, - { - "epoch": 0.37, - "learning_rate": 3.1451221936613456e-05, - "loss": 2.4175, - "step": 212730 - }, - { - "epoch": 0.37, - "learning_rate": 3.145034999668663e-05, - "loss": 2.3696, - "step": 212740 - }, - { - "epoch": 0.37, - "learning_rate": 3.1449478056759804e-05, - "loss": 2.3931, - "step": 212750 - }, - { - "epoch": 0.37, - "learning_rate": 3.1448606116832974e-05, - "loss": 2.4196, - "step": 212760 - }, - { - "epoch": 0.37, - "learning_rate": 3.144773417690615e-05, - "loss": 2.4131, - "step": 212770 - }, - { - "epoch": 0.37, - "learning_rate": 3.144686223697932e-05, - "loss": 2.4026, - "step": 212780 - }, - { - "epoch": 0.37, - "learning_rate": 3.14459902970525e-05, - "loss": 2.4308, - "step": 212790 - }, - { - "epoch": 0.37, - "learning_rate": 3.144511835712567e-05, - "loss": 2.302, - "step": 212800 - }, - { - "epoch": 0.37, - "learning_rate": 3.144424641719884e-05, - "loss": 2.4553, - "step": 212810 - }, - { - "epoch": 0.37, - "learning_rate": 3.144337447727202e-05, - "loss": 2.3261, - "step": 212820 - }, - { - "epoch": 0.37, - "learning_rate": 3.144250253734519e-05, - "loss": 2.33, - "step": 212830 - }, - { - "epoch": 0.37, - "learning_rate": 3.1441630597418365e-05, - "loss": 2.5527, - "step": 212840 - }, - { - "epoch": 0.37, - "learning_rate": 3.1440758657491535e-05, - "loss": 2.4329, - "step": 212850 - }, - { - "epoch": 0.37, - "learning_rate": 3.143988671756471e-05, - "loss": 2.3848, - "step": 212860 - }, - { - "epoch": 0.37, - "learning_rate": 3.143901477763788e-05, - "loss": 2.4381, - "step": 212870 - }, - { - "epoch": 0.37, - "learning_rate": 3.143814283771105e-05, - "loss": 2.3694, - "step": 212880 - }, - { - "epoch": 0.37, - "learning_rate": 3.143727089778423e-05, - "loss": 2.4212, - "step": 212890 - }, - { - "epoch": 0.37, - "learning_rate": 3.14363989578574e-05, - "loss": 2.3569, - "step": 212900 - }, - { - "epoch": 0.37, - "learning_rate": 3.143552701793057e-05, - "loss": 2.4401, - "step": 212910 - }, - { - "epoch": 0.37, - "learning_rate": 3.143465507800375e-05, - "loss": 2.3959, - "step": 212920 - }, - { - "epoch": 0.37, - "learning_rate": 3.1433783138076925e-05, - "loss": 2.4186, - "step": 212930 - }, - { - "epoch": 0.37, - "learning_rate": 3.1432911198150095e-05, - "loss": 2.3407, - "step": 212940 - }, - { - "epoch": 0.37, - "learning_rate": 3.1432039258223266e-05, - "loss": 2.3765, - "step": 212950 - }, - { - "epoch": 0.37, - "learning_rate": 3.1431167318296436e-05, - "loss": 2.3623, - "step": 212960 - }, - { - "epoch": 0.37, - "learning_rate": 3.143029537836961e-05, - "loss": 2.4542, - "step": 212970 - }, - { - "epoch": 0.37, - "learning_rate": 3.1429423438442784e-05, - "loss": 2.3206, - "step": 212980 - }, - { - "epoch": 0.37, - "learning_rate": 3.142855149851596e-05, - "loss": 2.3542, - "step": 212990 - }, - { - "epoch": 0.37, - "learning_rate": 3.142767955858914e-05, - "loss": 2.3635, - "step": 213000 - }, - { - "epoch": 0.37, - "learning_rate": 3.142680761866231e-05, - "loss": 2.3971, - "step": 213010 - }, - { - "epoch": 0.37, - "learning_rate": 3.142593567873548e-05, - "loss": 2.3809, - "step": 213020 - }, - { - "epoch": 0.37, - "learning_rate": 3.142506373880865e-05, - "loss": 2.4077, - "step": 213030 - }, - { - "epoch": 0.37, - "learning_rate": 3.1424191798881826e-05, - "loss": 2.5393, - "step": 213040 - }, - { - "epoch": 0.37, - "learning_rate": 3.1423319858955e-05, - "loss": 2.4087, - "step": 213050 - }, - { - "epoch": 0.37, - "learning_rate": 3.142244791902817e-05, - "loss": 2.3138, - "step": 213060 - }, - { - "epoch": 0.37, - "learning_rate": 3.1421575979101344e-05, - "loss": 2.4273, - "step": 213070 - }, - { - "epoch": 0.37, - "learning_rate": 3.142070403917452e-05, - "loss": 2.4709, - "step": 213080 - }, - { - "epoch": 0.37, - "learning_rate": 3.141983209924769e-05, - "loss": 2.4504, - "step": 213090 - }, - { - "epoch": 0.37, - "learning_rate": 3.141896015932086e-05, - "loss": 2.3567, - "step": 213100 - }, - { - "epoch": 0.37, - "learning_rate": 3.141808821939404e-05, - "loss": 2.4647, - "step": 213110 - }, - { - "epoch": 0.37, - "learning_rate": 3.141721627946721e-05, - "loss": 2.3743, - "step": 213120 - }, - { - "epoch": 0.37, - "learning_rate": 3.141634433954038e-05, - "loss": 2.2484, - "step": 213130 - }, - { - "epoch": 0.37, - "learning_rate": 3.141547239961356e-05, - "loss": 2.3748, - "step": 213140 - }, - { - "epoch": 0.37, - "learning_rate": 3.1414600459686734e-05, - "loss": 2.3609, - "step": 213150 - }, - { - "epoch": 0.37, - "learning_rate": 3.1413728519759905e-05, - "loss": 2.427, - "step": 213160 - }, - { - "epoch": 0.37, - "learning_rate": 3.1412856579833075e-05, - "loss": 2.392, - "step": 213170 - }, - { - "epoch": 0.37, - "learning_rate": 3.141198463990625e-05, - "loss": 2.4125, - "step": 213180 - }, - { - "epoch": 0.37, - "learning_rate": 3.141111269997942e-05, - "loss": 2.3819, - "step": 213190 - }, - { - "epoch": 0.37, - "learning_rate": 3.141024076005259e-05, - "loss": 2.3893, - "step": 213200 - }, - { - "epoch": 0.37, - "learning_rate": 3.140936882012577e-05, - "loss": 2.3597, - "step": 213210 - }, - { - "epoch": 0.37, - "learning_rate": 3.140849688019895e-05, - "loss": 2.4757, - "step": 213220 - }, - { - "epoch": 0.37, - "learning_rate": 3.140762494027212e-05, - "loss": 2.4017, - "step": 213230 - }, - { - "epoch": 0.37, - "learning_rate": 3.140675300034529e-05, - "loss": 2.28, - "step": 213240 - }, - { - "epoch": 0.37, - "learning_rate": 3.1405881060418465e-05, - "loss": 2.3962, - "step": 213250 - }, - { - "epoch": 0.37, - "learning_rate": 3.1405009120491636e-05, - "loss": 2.4795, - "step": 213260 - }, - { - "epoch": 0.37, - "learning_rate": 3.1404137180564806e-05, - "loss": 2.2566, - "step": 213270 - }, - { - "epoch": 0.37, - "learning_rate": 3.140326524063798e-05, - "loss": 2.4645, - "step": 213280 - }, - { - "epoch": 0.37, - "learning_rate": 3.140239330071116e-05, - "loss": 2.3896, - "step": 213290 - }, - { - "epoch": 0.37, - "learning_rate": 3.140152136078433e-05, - "loss": 2.4572, - "step": 213300 - }, - { - "epoch": 0.37, - "learning_rate": 3.14006494208575e-05, - "loss": 2.4409, - "step": 213310 - }, - { - "epoch": 0.37, - "learning_rate": 3.139977748093068e-05, - "loss": 2.4071, - "step": 213320 - }, - { - "epoch": 0.37, - "learning_rate": 3.139890554100385e-05, - "loss": 2.4938, - "step": 213330 - }, - { - "epoch": 0.37, - "learning_rate": 3.139803360107702e-05, - "loss": 2.4387, - "step": 213340 - }, - { - "epoch": 0.37, - "learning_rate": 3.139716166115019e-05, - "loss": 2.3161, - "step": 213350 - }, - { - "epoch": 0.37, - "learning_rate": 3.1396289721223373e-05, - "loss": 2.4333, - "step": 213360 - }, - { - "epoch": 0.37, - "learning_rate": 3.1395417781296544e-05, - "loss": 2.4882, - "step": 213370 - }, - { - "epoch": 0.37, - "learning_rate": 3.1394545841369714e-05, - "loss": 2.4633, - "step": 213380 - }, - { - "epoch": 0.37, - "learning_rate": 3.139367390144289e-05, - "loss": 2.3256, - "step": 213390 - }, - { - "epoch": 0.37, - "learning_rate": 3.139280196151606e-05, - "loss": 2.446, - "step": 213400 - }, - { - "epoch": 0.37, - "learning_rate": 3.139193002158923e-05, - "loss": 2.3834, - "step": 213410 - }, - { - "epoch": 0.37, - "learning_rate": 3.13910580816624e-05, - "loss": 2.3445, - "step": 213420 - }, - { - "epoch": 0.37, - "learning_rate": 3.139018614173558e-05, - "loss": 2.4379, - "step": 213430 - }, - { - "epoch": 0.37, - "learning_rate": 3.138931420180876e-05, - "loss": 2.4476, - "step": 213440 - }, - { - "epoch": 0.37, - "learning_rate": 3.138844226188193e-05, - "loss": 2.4777, - "step": 213450 - }, - { - "epoch": 0.37, - "learning_rate": 3.13875703219551e-05, - "loss": 2.44, - "step": 213460 - }, - { - "epoch": 0.37, - "learning_rate": 3.1386698382028275e-05, - "loss": 2.3754, - "step": 213470 - }, - { - "epoch": 0.37, - "learning_rate": 3.1385826442101445e-05, - "loss": 2.3381, - "step": 213480 - }, - { - "epoch": 0.37, - "learning_rate": 3.1384954502174616e-05, - "loss": 2.4609, - "step": 213490 - }, - { - "epoch": 0.37, - "learning_rate": 3.138408256224779e-05, - "loss": 2.4353, - "step": 213500 - }, - { - "epoch": 0.37, - "learning_rate": 3.138321062232097e-05, - "loss": 2.5419, - "step": 213510 - }, - { - "epoch": 0.37, - "learning_rate": 3.138233868239414e-05, - "loss": 2.3311, - "step": 213520 - }, - { - "epoch": 0.37, - "learning_rate": 3.138146674246731e-05, - "loss": 2.3732, - "step": 213530 - }, - { - "epoch": 0.37, - "learning_rate": 3.138059480254049e-05, - "loss": 2.5169, - "step": 213540 - }, - { - "epoch": 0.37, - "learning_rate": 3.137972286261366e-05, - "loss": 2.437, - "step": 213550 - }, - { - "epoch": 0.37, - "learning_rate": 3.137885092268683e-05, - "loss": 2.5028, - "step": 213560 - }, - { - "epoch": 0.37, - "learning_rate": 3.1377978982760006e-05, - "loss": 2.327, - "step": 213570 - }, - { - "epoch": 0.37, - "learning_rate": 3.1377107042833176e-05, - "loss": 2.3398, - "step": 213580 - }, - { - "epoch": 0.37, - "learning_rate": 3.137623510290635e-05, - "loss": 2.3347, - "step": 213590 - }, - { - "epoch": 0.37, - "learning_rate": 3.1375363162979524e-05, - "loss": 2.3499, - "step": 213600 - }, - { - "epoch": 0.37, - "learning_rate": 3.13744912230527e-05, - "loss": 2.5159, - "step": 213610 - }, - { - "epoch": 0.37, - "learning_rate": 3.137361928312587e-05, - "loss": 2.4316, - "step": 213620 - }, - { - "epoch": 0.37, - "learning_rate": 3.137274734319904e-05, - "loss": 2.4361, - "step": 213630 - }, - { - "epoch": 0.37, - "learning_rate": 3.137187540327222e-05, - "loss": 2.4269, - "step": 213640 - }, - { - "epoch": 0.37, - "learning_rate": 3.137100346334539e-05, - "loss": 2.4281, - "step": 213650 - }, - { - "epoch": 0.37, - "learning_rate": 3.1370131523418566e-05, - "loss": 2.3702, - "step": 213660 - }, - { - "epoch": 0.37, - "learning_rate": 3.136925958349174e-05, - "loss": 2.4515, - "step": 213670 - }, - { - "epoch": 0.37, - "learning_rate": 3.1368387643564914e-05, - "loss": 2.4485, - "step": 213680 - }, - { - "epoch": 0.37, - "learning_rate": 3.1367515703638084e-05, - "loss": 2.5595, - "step": 213690 - }, - { - "epoch": 0.37, - "learning_rate": 3.1366643763711255e-05, - "loss": 2.3175, - "step": 213700 - }, - { - "epoch": 0.37, - "learning_rate": 3.136577182378443e-05, - "loss": 2.3911, - "step": 213710 - }, - { - "epoch": 0.37, - "learning_rate": 3.13648998838576e-05, - "loss": 2.3999, - "step": 213720 - }, - { - "epoch": 0.37, - "learning_rate": 3.136402794393077e-05, - "loss": 2.5085, - "step": 213730 - }, - { - "epoch": 0.37, - "learning_rate": 3.136315600400395e-05, - "loss": 2.3191, - "step": 213740 - }, - { - "epoch": 0.37, - "learning_rate": 3.136228406407713e-05, - "loss": 2.3294, - "step": 213750 - }, - { - "epoch": 0.37, - "learning_rate": 3.13614121241503e-05, - "loss": 2.5127, - "step": 213760 - }, - { - "epoch": 0.37, - "learning_rate": 3.136054018422347e-05, - "loss": 2.5273, - "step": 213770 - }, - { - "epoch": 0.37, - "learning_rate": 3.1359668244296645e-05, - "loss": 2.5399, - "step": 213780 - }, - { - "epoch": 0.37, - "learning_rate": 3.1358796304369815e-05, - "loss": 2.4126, - "step": 213790 - }, - { - "epoch": 0.37, - "learning_rate": 3.1357924364442985e-05, - "loss": 2.3255, - "step": 213800 - }, - { - "epoch": 0.37, - "learning_rate": 3.135705242451616e-05, - "loss": 2.5157, - "step": 213810 - }, - { - "epoch": 0.37, - "learning_rate": 3.135618048458934e-05, - "loss": 2.3808, - "step": 213820 - }, - { - "epoch": 0.37, - "learning_rate": 3.135530854466251e-05, - "loss": 2.4184, - "step": 213830 - }, - { - "epoch": 0.37, - "learning_rate": 3.135443660473568e-05, - "loss": 2.403, - "step": 213840 - }, - { - "epoch": 0.37, - "learning_rate": 3.135356466480886e-05, - "loss": 2.4243, - "step": 213850 - }, - { - "epoch": 0.37, - "learning_rate": 3.135269272488203e-05, - "loss": 2.3642, - "step": 213860 - }, - { - "epoch": 0.37, - "learning_rate": 3.13518207849552e-05, - "loss": 2.2911, - "step": 213870 - }, - { - "epoch": 0.37, - "learning_rate": 3.135094884502837e-05, - "loss": 2.333, - "step": 213880 - }, - { - "epoch": 0.37, - "learning_rate": 3.135007690510155e-05, - "loss": 2.502, - "step": 213890 - }, - { - "epoch": 0.37, - "learning_rate": 3.134920496517472e-05, - "loss": 2.5684, - "step": 213900 - }, - { - "epoch": 0.37, - "learning_rate": 3.1348333025247894e-05, - "loss": 2.5132, - "step": 213910 - }, - { - "epoch": 0.37, - "learning_rate": 3.1347461085321064e-05, - "loss": 2.4373, - "step": 213920 - }, - { - "epoch": 0.37, - "learning_rate": 3.134658914539424e-05, - "loss": 2.4267, - "step": 213930 - }, - { - "epoch": 0.37, - "learning_rate": 3.134571720546741e-05, - "loss": 2.3269, - "step": 213940 - }, - { - "epoch": 0.37, - "learning_rate": 3.134484526554058e-05, - "loss": 2.3149, - "step": 213950 - }, - { - "epoch": 0.37, - "learning_rate": 3.1343973325613766e-05, - "loss": 2.3856, - "step": 213960 - }, - { - "epoch": 0.37, - "learning_rate": 3.1343101385686936e-05, - "loss": 2.3729, - "step": 213970 - }, - { - "epoch": 0.37, - "learning_rate": 3.1342229445760107e-05, - "loss": 2.4083, - "step": 213980 - }, - { - "epoch": 0.37, - "learning_rate": 3.134135750583328e-05, - "loss": 2.3155, - "step": 213990 - }, - { - "epoch": 0.37, - "learning_rate": 3.1340485565906454e-05, - "loss": 2.3079, - "step": 214000 - }, - { - "epoch": 0.37, - "learning_rate": 3.1339613625979624e-05, - "loss": 2.4054, - "step": 214010 - }, - { - "epoch": 0.37, - "learning_rate": 3.1338741686052795e-05, - "loss": 2.493, - "step": 214020 - }, - { - "epoch": 0.37, - "learning_rate": 3.133786974612597e-05, - "loss": 2.5583, - "step": 214030 - }, - { - "epoch": 0.37, - "learning_rate": 3.133699780619915e-05, - "loss": 2.4178, - "step": 214040 - }, - { - "epoch": 0.37, - "learning_rate": 3.133612586627232e-05, - "loss": 2.3391, - "step": 214050 - }, - { - "epoch": 0.37, - "learning_rate": 3.133525392634549e-05, - "loss": 2.3832, - "step": 214060 - }, - { - "epoch": 0.37, - "learning_rate": 3.133438198641867e-05, - "loss": 2.53, - "step": 214070 - }, - { - "epoch": 0.37, - "learning_rate": 3.133351004649184e-05, - "loss": 2.413, - "step": 214080 - }, - { - "epoch": 0.37, - "learning_rate": 3.133263810656501e-05, - "loss": 2.3981, - "step": 214090 - }, - { - "epoch": 0.37, - "learning_rate": 3.1331766166638185e-05, - "loss": 2.3788, - "step": 214100 - }, - { - "epoch": 0.37, - "learning_rate": 3.133089422671136e-05, - "loss": 2.332, - "step": 214110 - }, - { - "epoch": 0.37, - "learning_rate": 3.133002228678453e-05, - "loss": 2.3837, - "step": 214120 - }, - { - "epoch": 0.37, - "learning_rate": 3.13291503468577e-05, - "loss": 2.4725, - "step": 214130 - }, - { - "epoch": 0.37, - "learning_rate": 3.132827840693088e-05, - "loss": 2.431, - "step": 214140 - }, - { - "epoch": 0.37, - "learning_rate": 3.132740646700405e-05, - "loss": 2.4872, - "step": 214150 - }, - { - "epoch": 0.37, - "learning_rate": 3.132653452707722e-05, - "loss": 2.4132, - "step": 214160 - }, - { - "epoch": 0.37, - "learning_rate": 3.13256625871504e-05, - "loss": 2.2885, - "step": 214170 - }, - { - "epoch": 0.37, - "learning_rate": 3.1324790647223575e-05, - "loss": 2.4386, - "step": 214180 - }, - { - "epoch": 0.37, - "learning_rate": 3.1323918707296746e-05, - "loss": 2.4563, - "step": 214190 - }, - { - "epoch": 0.37, - "learning_rate": 3.1323046767369916e-05, - "loss": 2.4155, - "step": 214200 - }, - { - "epoch": 0.37, - "learning_rate": 3.132217482744309e-05, - "loss": 2.3435, - "step": 214210 - }, - { - "epoch": 0.37, - "learning_rate": 3.1321302887516263e-05, - "loss": 2.4012, - "step": 214220 - }, - { - "epoch": 0.37, - "learning_rate": 3.1320430947589434e-05, - "loss": 2.5851, - "step": 214230 - }, - { - "epoch": 0.37, - "learning_rate": 3.131955900766261e-05, - "loss": 2.4625, - "step": 214240 - }, - { - "epoch": 0.37, - "learning_rate": 3.131868706773578e-05, - "loss": 2.4214, - "step": 214250 - }, - { - "epoch": 0.37, - "learning_rate": 3.131781512780896e-05, - "loss": 2.407, - "step": 214260 - }, - { - "epoch": 0.37, - "learning_rate": 3.131694318788213e-05, - "loss": 2.3884, - "step": 214270 - }, - { - "epoch": 0.37, - "learning_rate": 3.1316071247955306e-05, - "loss": 2.3834, - "step": 214280 - }, - { - "epoch": 0.37, - "learning_rate": 3.1315199308028476e-05, - "loss": 2.4081, - "step": 214290 - }, - { - "epoch": 0.37, - "learning_rate": 3.131432736810165e-05, - "loss": 2.4592, - "step": 214300 - }, - { - "epoch": 0.37, - "learning_rate": 3.131345542817482e-05, - "loss": 2.3026, - "step": 214310 - }, - { - "epoch": 0.37, - "learning_rate": 3.1312583488247994e-05, - "loss": 2.4638, - "step": 214320 - }, - { - "epoch": 0.37, - "learning_rate": 3.131171154832117e-05, - "loss": 2.3872, - "step": 214330 - }, - { - "epoch": 0.37, - "learning_rate": 3.131083960839434e-05, - "loss": 2.3322, - "step": 214340 - }, - { - "epoch": 0.37, - "learning_rate": 3.130996766846752e-05, - "loss": 2.2955, - "step": 214350 - }, - { - "epoch": 0.37, - "learning_rate": 3.130909572854069e-05, - "loss": 2.3531, - "step": 214360 - }, - { - "epoch": 0.37, - "learning_rate": 3.130822378861386e-05, - "loss": 2.3942, - "step": 214370 - }, - { - "epoch": 0.37, - "learning_rate": 3.130735184868703e-05, - "loss": 2.4654, - "step": 214380 - }, - { - "epoch": 0.37, - "learning_rate": 3.130647990876021e-05, - "loss": 2.276, - "step": 214390 - }, - { - "epoch": 0.37, - "learning_rate": 3.130560796883338e-05, - "loss": 2.3064, - "step": 214400 - }, - { - "epoch": 0.37, - "learning_rate": 3.1304736028906555e-05, - "loss": 2.4528, - "step": 214410 - }, - { - "epoch": 0.37, - "learning_rate": 3.1303864088979725e-05, - "loss": 2.4159, - "step": 214420 - }, - { - "epoch": 0.37, - "learning_rate": 3.13029921490529e-05, - "loss": 2.4886, - "step": 214430 - }, - { - "epoch": 0.37, - "learning_rate": 3.130212020912607e-05, - "loss": 2.4027, - "step": 214440 - }, - { - "epoch": 0.37, - "learning_rate": 3.130124826919924e-05, - "loss": 2.429, - "step": 214450 - }, - { - "epoch": 0.37, - "learning_rate": 3.130037632927242e-05, - "loss": 2.4051, - "step": 214460 - }, - { - "epoch": 0.37, - "learning_rate": 3.129950438934559e-05, - "loss": 2.2903, - "step": 214470 - }, - { - "epoch": 0.37, - "learning_rate": 3.129863244941877e-05, - "loss": 2.4429, - "step": 214480 - }, - { - "epoch": 0.37, - "learning_rate": 3.129776050949194e-05, - "loss": 2.5451, - "step": 214490 - }, - { - "epoch": 0.37, - "learning_rate": 3.1296888569565115e-05, - "loss": 2.4018, - "step": 214500 - }, - { - "epoch": 0.37, - "learning_rate": 3.1296016629638286e-05, - "loss": 2.3892, - "step": 214510 - }, - { - "epoch": 0.37, - "learning_rate": 3.1295144689711456e-05, - "loss": 2.45, - "step": 214520 - }, - { - "epoch": 0.37, - "learning_rate": 3.1294272749784633e-05, - "loss": 2.3945, - "step": 214530 - }, - { - "epoch": 0.37, - "learning_rate": 3.1293400809857804e-05, - "loss": 2.3462, - "step": 214540 - }, - { - "epoch": 0.37, - "learning_rate": 3.1292528869930974e-05, - "loss": 2.483, - "step": 214550 - }, - { - "epoch": 0.37, - "learning_rate": 3.129165693000415e-05, - "loss": 2.291, - "step": 214560 - }, - { - "epoch": 0.37, - "learning_rate": 3.129078499007733e-05, - "loss": 2.3414, - "step": 214570 - }, - { - "epoch": 0.37, - "learning_rate": 3.12899130501505e-05, - "loss": 2.313, - "step": 214580 - }, - { - "epoch": 0.37, - "learning_rate": 3.128904111022367e-05, - "loss": 2.3287, - "step": 214590 - }, - { - "epoch": 0.37, - "learning_rate": 3.1288169170296846e-05, - "loss": 2.518, - "step": 214600 - }, - { - "epoch": 0.37, - "learning_rate": 3.128729723037002e-05, - "loss": 2.5323, - "step": 214610 - }, - { - "epoch": 0.37, - "learning_rate": 3.128642529044319e-05, - "loss": 2.3581, - "step": 214620 - }, - { - "epoch": 0.37, - "learning_rate": 3.1285553350516364e-05, - "loss": 2.3179, - "step": 214630 - }, - { - "epoch": 0.37, - "learning_rate": 3.128468141058954e-05, - "loss": 2.4189, - "step": 214640 - }, - { - "epoch": 0.37, - "learning_rate": 3.128380947066271e-05, - "loss": 2.3542, - "step": 214650 - }, - { - "epoch": 0.37, - "learning_rate": 3.128293753073588e-05, - "loss": 2.5305, - "step": 214660 - }, - { - "epoch": 0.37, - "learning_rate": 3.128206559080906e-05, - "loss": 2.4392, - "step": 214670 - }, - { - "epoch": 0.37, - "learning_rate": 3.128119365088223e-05, - "loss": 2.3743, - "step": 214680 - }, - { - "epoch": 0.37, - "learning_rate": 3.12803217109554e-05, - "loss": 2.4344, - "step": 214690 - }, - { - "epoch": 0.37, - "learning_rate": 3.127944977102858e-05, - "loss": 2.4871, - "step": 214700 - }, - { - "epoch": 0.37, - "learning_rate": 3.1278577831101754e-05, - "loss": 2.4962, - "step": 214710 - }, - { - "epoch": 0.37, - "learning_rate": 3.1277705891174925e-05, - "loss": 2.354, - "step": 214720 - }, - { - "epoch": 0.37, - "learning_rate": 3.1276833951248095e-05, - "loss": 2.3799, - "step": 214730 - }, - { - "epoch": 0.37, - "learning_rate": 3.127596201132127e-05, - "loss": 2.4295, - "step": 214740 - }, - { - "epoch": 0.37, - "learning_rate": 3.127509007139444e-05, - "loss": 2.343, - "step": 214750 - }, - { - "epoch": 0.37, - "learning_rate": 3.127421813146761e-05, - "loss": 2.4167, - "step": 214760 - }, - { - "epoch": 0.37, - "learning_rate": 3.1273346191540784e-05, - "loss": 2.4698, - "step": 214770 - }, - { - "epoch": 0.37, - "learning_rate": 3.127247425161397e-05, - "loss": 2.3635, - "step": 214780 - }, - { - "epoch": 0.37, - "learning_rate": 3.127160231168714e-05, - "loss": 2.3302, - "step": 214790 - }, - { - "epoch": 0.37, - "learning_rate": 3.127073037176031e-05, - "loss": 2.5925, - "step": 214800 - }, - { - "epoch": 0.37, - "learning_rate": 3.126985843183348e-05, - "loss": 2.4329, - "step": 214810 - }, - { - "epoch": 0.37, - "learning_rate": 3.1268986491906656e-05, - "loss": 2.4233, - "step": 214820 - }, - { - "epoch": 0.37, - "learning_rate": 3.1268114551979826e-05, - "loss": 2.4971, - "step": 214830 - }, - { - "epoch": 0.37, - "learning_rate": 3.1267242612052997e-05, - "loss": 2.5679, - "step": 214840 - }, - { - "epoch": 0.37, - "learning_rate": 3.126637067212618e-05, - "loss": 2.3375, - "step": 214850 - }, - { - "epoch": 0.37, - "learning_rate": 3.126549873219935e-05, - "loss": 2.4669, - "step": 214860 - }, - { - "epoch": 0.37, - "learning_rate": 3.126462679227252e-05, - "loss": 2.3784, - "step": 214870 - }, - { - "epoch": 0.37, - "learning_rate": 3.126375485234569e-05, - "loss": 2.358, - "step": 214880 - }, - { - "epoch": 0.37, - "learning_rate": 3.126288291241887e-05, - "loss": 2.4008, - "step": 214890 - }, - { - "epoch": 0.37, - "learning_rate": 3.126201097249204e-05, - "loss": 2.3271, - "step": 214900 - }, - { - "epoch": 0.37, - "learning_rate": 3.126113903256521e-05, - "loss": 2.4632, - "step": 214910 - }, - { - "epoch": 0.37, - "learning_rate": 3.126026709263839e-05, - "loss": 2.3424, - "step": 214920 - }, - { - "epoch": 0.37, - "learning_rate": 3.1259395152711564e-05, - "loss": 2.3587, - "step": 214930 - }, - { - "epoch": 0.37, - "learning_rate": 3.1258523212784734e-05, - "loss": 2.4364, - "step": 214940 - }, - { - "epoch": 0.37, - "learning_rate": 3.1257651272857905e-05, - "loss": 2.5711, - "step": 214950 - }, - { - "epoch": 0.37, - "learning_rate": 3.125677933293108e-05, - "loss": 2.3449, - "step": 214960 - }, - { - "epoch": 0.37, - "learning_rate": 3.125590739300425e-05, - "loss": 2.3755, - "step": 214970 - }, - { - "epoch": 0.37, - "learning_rate": 3.125503545307742e-05, - "loss": 2.3156, - "step": 214980 - }, - { - "epoch": 0.37, - "learning_rate": 3.12541635131506e-05, - "loss": 2.3618, - "step": 214990 - }, - { - "epoch": 0.37, - "learning_rate": 3.125329157322378e-05, - "loss": 2.4386, - "step": 215000 - }, - { - "epoch": 0.37, - "learning_rate": 3.125241963329695e-05, - "loss": 2.4719, - "step": 215010 - }, - { - "epoch": 0.37, - "learning_rate": 3.125154769337012e-05, - "loss": 2.3835, - "step": 215020 - }, - { - "epoch": 0.37, - "learning_rate": 3.1250675753443295e-05, - "loss": 2.3427, - "step": 215030 - }, - { - "epoch": 0.38, - "learning_rate": 3.1249803813516465e-05, - "loss": 2.3775, - "step": 215040 - }, - { - "epoch": 0.38, - "learning_rate": 3.1248931873589636e-05, - "loss": 2.316, - "step": 215050 - }, - { - "epoch": 0.38, - "learning_rate": 3.124805993366281e-05, - "loss": 2.4302, - "step": 215060 - }, - { - "epoch": 0.38, - "learning_rate": 3.124718799373598e-05, - "loss": 2.4244, - "step": 215070 - }, - { - "epoch": 0.38, - "learning_rate": 3.124631605380916e-05, - "loss": 2.4498, - "step": 215080 - }, - { - "epoch": 0.38, - "learning_rate": 3.124544411388233e-05, - "loss": 2.4043, - "step": 215090 - }, - { - "epoch": 0.38, - "learning_rate": 3.124457217395551e-05, - "loss": 2.4023, - "step": 215100 - }, - { - "epoch": 0.38, - "learning_rate": 3.124370023402868e-05, - "loss": 2.3627, - "step": 215110 - }, - { - "epoch": 0.38, - "learning_rate": 3.124282829410185e-05, - "loss": 2.4099, - "step": 215120 - }, - { - "epoch": 0.38, - "learning_rate": 3.1241956354175026e-05, - "loss": 2.5333, - "step": 215130 - }, - { - "epoch": 0.38, - "learning_rate": 3.1241084414248196e-05, - "loss": 2.4619, - "step": 215140 - }, - { - "epoch": 0.38, - "learning_rate": 3.124021247432137e-05, - "loss": 2.3779, - "step": 215150 - }, - { - "epoch": 0.38, - "learning_rate": 3.1239340534394544e-05, - "loss": 2.3594, - "step": 215160 - }, - { - "epoch": 0.38, - "learning_rate": 3.123846859446772e-05, - "loss": 2.374, - "step": 215170 - }, - { - "epoch": 0.38, - "learning_rate": 3.123759665454089e-05, - "loss": 2.4544, - "step": 215180 - }, - { - "epoch": 0.38, - "learning_rate": 3.123672471461406e-05, - "loss": 2.4983, - "step": 215190 - }, - { - "epoch": 0.38, - "learning_rate": 3.123585277468724e-05, - "loss": 2.4042, - "step": 215200 - }, - { - "epoch": 0.38, - "learning_rate": 3.123498083476041e-05, - "loss": 2.4611, - "step": 215210 - }, - { - "epoch": 0.38, - "learning_rate": 3.123410889483358e-05, - "loss": 2.3174, - "step": 215220 - }, - { - "epoch": 0.38, - "learning_rate": 3.123323695490676e-05, - "loss": 2.424, - "step": 215230 - }, - { - "epoch": 0.38, - "learning_rate": 3.1232365014979934e-05, - "loss": 2.3757, - "step": 215240 - }, - { - "epoch": 0.38, - "learning_rate": 3.1231493075053104e-05, - "loss": 2.4944, - "step": 215250 - }, - { - "epoch": 0.38, - "learning_rate": 3.1230621135126275e-05, - "loss": 2.3329, - "step": 215260 - }, - { - "epoch": 0.38, - "learning_rate": 3.1229749195199445e-05, - "loss": 2.3904, - "step": 215270 - }, - { - "epoch": 0.38, - "learning_rate": 3.122887725527262e-05, - "loss": 2.4236, - "step": 215280 - }, - { - "epoch": 0.38, - "learning_rate": 3.122800531534579e-05, - "loss": 2.4042, - "step": 215290 - }, - { - "epoch": 0.38, - "learning_rate": 3.122713337541897e-05, - "loss": 2.4433, - "step": 215300 - }, - { - "epoch": 0.38, - "learning_rate": 3.122626143549215e-05, - "loss": 2.4457, - "step": 215310 - }, - { - "epoch": 0.38, - "learning_rate": 3.122538949556532e-05, - "loss": 2.4846, - "step": 215320 - }, - { - "epoch": 0.38, - "learning_rate": 3.122451755563849e-05, - "loss": 2.3441, - "step": 215330 - }, - { - "epoch": 0.38, - "learning_rate": 3.122364561571166e-05, - "loss": 2.35, - "step": 215340 - }, - { - "epoch": 0.38, - "learning_rate": 3.1222773675784835e-05, - "loss": 2.4669, - "step": 215350 - }, - { - "epoch": 0.38, - "learning_rate": 3.1221901735858005e-05, - "loss": 2.3679, - "step": 215360 - }, - { - "epoch": 0.38, - "learning_rate": 3.122102979593118e-05, - "loss": 2.4731, - "step": 215370 - }, - { - "epoch": 0.38, - "learning_rate": 3.122015785600435e-05, - "loss": 2.4014, - "step": 215380 - }, - { - "epoch": 0.38, - "learning_rate": 3.121928591607753e-05, - "loss": 2.2666, - "step": 215390 - }, - { - "epoch": 0.38, - "learning_rate": 3.12184139761507e-05, - "loss": 2.4621, - "step": 215400 - }, - { - "epoch": 0.38, - "learning_rate": 3.121754203622387e-05, - "loss": 2.4507, - "step": 215410 - }, - { - "epoch": 0.38, - "learning_rate": 3.121667009629705e-05, - "loss": 2.3302, - "step": 215420 - }, - { - "epoch": 0.38, - "learning_rate": 3.121579815637022e-05, - "loss": 2.439, - "step": 215430 - }, - { - "epoch": 0.38, - "learning_rate": 3.121492621644339e-05, - "loss": 2.4014, - "step": 215440 - }, - { - "epoch": 0.38, - "learning_rate": 3.1214054276516566e-05, - "loss": 2.5048, - "step": 215450 - }, - { - "epoch": 0.38, - "learning_rate": 3.121318233658974e-05, - "loss": 2.4362, - "step": 215460 - }, - { - "epoch": 0.38, - "learning_rate": 3.1212310396662914e-05, - "loss": 2.3518, - "step": 215470 - }, - { - "epoch": 0.38, - "learning_rate": 3.1211438456736084e-05, - "loss": 2.3881, - "step": 215480 - }, - { - "epoch": 0.38, - "learning_rate": 3.121056651680926e-05, - "loss": 2.4311, - "step": 215490 - }, - { - "epoch": 0.38, - "learning_rate": 3.120969457688243e-05, - "loss": 2.291, - "step": 215500 - }, - { - "epoch": 0.38, - "learning_rate": 3.12088226369556e-05, - "loss": 2.4807, - "step": 215510 - }, - { - "epoch": 0.38, - "learning_rate": 3.120795069702878e-05, - "loss": 2.4961, - "step": 215520 - }, - { - "epoch": 0.38, - "learning_rate": 3.1207078757101956e-05, - "loss": 2.4082, - "step": 215530 - }, - { - "epoch": 0.38, - "learning_rate": 3.1206206817175127e-05, - "loss": 2.4398, - "step": 215540 - }, - { - "epoch": 0.38, - "learning_rate": 3.12053348772483e-05, - "loss": 2.47, - "step": 215550 - }, - { - "epoch": 0.38, - "learning_rate": 3.1204462937321474e-05, - "loss": 2.4343, - "step": 215560 - }, - { - "epoch": 0.38, - "learning_rate": 3.1203590997394644e-05, - "loss": 2.349, - "step": 215570 - }, - { - "epoch": 0.38, - "learning_rate": 3.1202719057467815e-05, - "loss": 2.4006, - "step": 215580 - }, - { - "epoch": 0.38, - "learning_rate": 3.120184711754099e-05, - "loss": 2.4976, - "step": 215590 - }, - { - "epoch": 0.38, - "learning_rate": 3.120097517761417e-05, - "loss": 2.4, - "step": 215600 - }, - { - "epoch": 0.38, - "learning_rate": 3.120010323768734e-05, - "loss": 2.4108, - "step": 215610 - }, - { - "epoch": 0.38, - "learning_rate": 3.119923129776051e-05, - "loss": 2.4274, - "step": 215620 - }, - { - "epoch": 0.38, - "learning_rate": 3.119835935783369e-05, - "loss": 2.3461, - "step": 215630 - }, - { - "epoch": 0.38, - "learning_rate": 3.119748741790686e-05, - "loss": 2.3509, - "step": 215640 - }, - { - "epoch": 0.38, - "learning_rate": 3.119661547798003e-05, - "loss": 2.4348, - "step": 215650 - }, - { - "epoch": 0.38, - "learning_rate": 3.11957435380532e-05, - "loss": 2.4481, - "step": 215660 - }, - { - "epoch": 0.38, - "learning_rate": 3.119487159812638e-05, - "loss": 2.3454, - "step": 215670 - }, - { - "epoch": 0.38, - "learning_rate": 3.119399965819955e-05, - "loss": 2.3864, - "step": 215680 - }, - { - "epoch": 0.38, - "learning_rate": 3.119312771827272e-05, - "loss": 2.4999, - "step": 215690 - }, - { - "epoch": 0.38, - "learning_rate": 3.11922557783459e-05, - "loss": 2.3677, - "step": 215700 - }, - { - "epoch": 0.38, - "learning_rate": 3.119138383841907e-05, - "loss": 2.3196, - "step": 215710 - }, - { - "epoch": 0.38, - "learning_rate": 3.119051189849224e-05, - "loss": 2.4891, - "step": 215720 - }, - { - "epoch": 0.38, - "learning_rate": 3.118963995856541e-05, - "loss": 2.3378, - "step": 215730 - }, - { - "epoch": 0.38, - "learning_rate": 3.118876801863859e-05, - "loss": 2.5048, - "step": 215740 - }, - { - "epoch": 0.38, - "learning_rate": 3.1187896078711766e-05, - "loss": 2.4292, - "step": 215750 - }, - { - "epoch": 0.38, - "learning_rate": 3.1187024138784936e-05, - "loss": 2.5197, - "step": 215760 - }, - { - "epoch": 0.38, - "learning_rate": 3.1186152198858106e-05, - "loss": 2.4289, - "step": 215770 - }, - { - "epoch": 0.38, - "learning_rate": 3.1185280258931283e-05, - "loss": 2.5006, - "step": 215780 - }, - { - "epoch": 0.38, - "learning_rate": 3.1184408319004454e-05, - "loss": 2.4706, - "step": 215790 - }, - { - "epoch": 0.38, - "learning_rate": 3.1183536379077624e-05, - "loss": 2.5069, - "step": 215800 - }, - { - "epoch": 0.38, - "learning_rate": 3.11826644391508e-05, - "loss": 2.5063, - "step": 215810 - }, - { - "epoch": 0.38, - "learning_rate": 3.118179249922398e-05, - "loss": 2.3477, - "step": 215820 - }, - { - "epoch": 0.38, - "learning_rate": 3.118092055929715e-05, - "loss": 2.3363, - "step": 215830 - }, - { - "epoch": 0.38, - "learning_rate": 3.118004861937032e-05, - "loss": 2.3411, - "step": 215840 - }, - { - "epoch": 0.38, - "learning_rate": 3.1179176679443496e-05, - "loss": 2.3353, - "step": 215850 - }, - { - "epoch": 0.38, - "learning_rate": 3.117830473951667e-05, - "loss": 2.3617, - "step": 215860 - }, - { - "epoch": 0.38, - "learning_rate": 3.117743279958984e-05, - "loss": 2.4911, - "step": 215870 - }, - { - "epoch": 0.38, - "learning_rate": 3.1176560859663014e-05, - "loss": 2.3644, - "step": 215880 - }, - { - "epoch": 0.38, - "learning_rate": 3.117568891973619e-05, - "loss": 2.3499, - "step": 215890 - }, - { - "epoch": 0.38, - "learning_rate": 3.117481697980936e-05, - "loss": 2.5339, - "step": 215900 - }, - { - "epoch": 0.38, - "learning_rate": 3.117394503988253e-05, - "loss": 2.4872, - "step": 215910 - }, - { - "epoch": 0.38, - "learning_rate": 3.117307309995571e-05, - "loss": 2.4229, - "step": 215920 - }, - { - "epoch": 0.38, - "learning_rate": 3.117220116002888e-05, - "loss": 2.4732, - "step": 215930 - }, - { - "epoch": 0.38, - "learning_rate": 3.117132922010205e-05, - "loss": 2.4304, - "step": 215940 - }, - { - "epoch": 0.38, - "learning_rate": 3.117045728017523e-05, - "loss": 2.4873, - "step": 215950 - }, - { - "epoch": 0.38, - "learning_rate": 3.11695853402484e-05, - "loss": 2.4018, - "step": 215960 - }, - { - "epoch": 0.38, - "learning_rate": 3.1168713400321575e-05, - "loss": 2.3694, - "step": 215970 - }, - { - "epoch": 0.38, - "learning_rate": 3.1167841460394745e-05, - "loss": 2.5476, - "step": 215980 - }, - { - "epoch": 0.38, - "learning_rate": 3.116696952046792e-05, - "loss": 2.3618, - "step": 215990 - }, - { - "epoch": 0.38, - "learning_rate": 3.116609758054109e-05, - "loss": 2.2318, - "step": 216000 - }, - { - "epoch": 0.38, - "learning_rate": 3.116522564061426e-05, - "loss": 2.3668, - "step": 216010 - }, - { - "epoch": 0.38, - "learning_rate": 3.116435370068744e-05, - "loss": 2.388, - "step": 216020 - }, - { - "epoch": 0.38, - "learning_rate": 3.116348176076061e-05, - "loss": 2.4514, - "step": 216030 - }, - { - "epoch": 0.38, - "learning_rate": 3.116260982083379e-05, - "loss": 2.4116, - "step": 216040 - }, - { - "epoch": 0.38, - "learning_rate": 3.116173788090696e-05, - "loss": 2.4661, - "step": 216050 - }, - { - "epoch": 0.38, - "learning_rate": 3.1160865940980135e-05, - "loss": 2.5069, - "step": 216060 - }, - { - "epoch": 0.38, - "learning_rate": 3.1159994001053306e-05, - "loss": 2.4099, - "step": 216070 - }, - { - "epoch": 0.38, - "learning_rate": 3.1159122061126476e-05, - "loss": 2.4728, - "step": 216080 - }, - { - "epoch": 0.38, - "learning_rate": 3.1158250121199653e-05, - "loss": 2.3536, - "step": 216090 - }, - { - "epoch": 0.38, - "learning_rate": 3.1157378181272824e-05, - "loss": 2.3889, - "step": 216100 - }, - { - "epoch": 0.38, - "learning_rate": 3.1156506241345994e-05, - "loss": 2.4425, - "step": 216110 - }, - { - "epoch": 0.38, - "learning_rate": 3.115563430141917e-05, - "loss": 2.4376, - "step": 216120 - }, - { - "epoch": 0.38, - "learning_rate": 3.115476236149235e-05, - "loss": 2.4018, - "step": 216130 - }, - { - "epoch": 0.38, - "learning_rate": 3.115389042156552e-05, - "loss": 2.4918, - "step": 216140 - }, - { - "epoch": 0.38, - "learning_rate": 3.115301848163869e-05, - "loss": 2.394, - "step": 216150 - }, - { - "epoch": 0.38, - "learning_rate": 3.115214654171186e-05, - "loss": 2.3295, - "step": 216160 - }, - { - "epoch": 0.38, - "learning_rate": 3.115127460178504e-05, - "loss": 2.3768, - "step": 216170 - }, - { - "epoch": 0.38, - "learning_rate": 3.115040266185821e-05, - "loss": 2.3463, - "step": 216180 - }, - { - "epoch": 0.38, - "learning_rate": 3.1149530721931384e-05, - "loss": 2.3317, - "step": 216190 - }, - { - "epoch": 0.38, - "learning_rate": 3.114865878200456e-05, - "loss": 2.434, - "step": 216200 - }, - { - "epoch": 0.38, - "learning_rate": 3.114778684207773e-05, - "loss": 2.3071, - "step": 216210 - }, - { - "epoch": 0.38, - "learning_rate": 3.11469149021509e-05, - "loss": 2.4335, - "step": 216220 - }, - { - "epoch": 0.38, - "learning_rate": 3.114604296222407e-05, - "loss": 2.3321, - "step": 216230 - }, - { - "epoch": 0.38, - "learning_rate": 3.114517102229725e-05, - "loss": 2.5368, - "step": 216240 - }, - { - "epoch": 0.38, - "learning_rate": 3.114429908237042e-05, - "loss": 2.4526, - "step": 216250 - }, - { - "epoch": 0.38, - "learning_rate": 3.114342714244359e-05, - "loss": 2.3993, - "step": 216260 - }, - { - "epoch": 0.38, - "learning_rate": 3.114255520251677e-05, - "loss": 2.3927, - "step": 216270 - }, - { - "epoch": 0.38, - "learning_rate": 3.1141683262589945e-05, - "loss": 2.384, - "step": 216280 - }, - { - "epoch": 0.38, - "learning_rate": 3.1140811322663115e-05, - "loss": 2.4451, - "step": 216290 - }, - { - "epoch": 0.38, - "learning_rate": 3.1139939382736286e-05, - "loss": 2.4862, - "step": 216300 - }, - { - "epoch": 0.38, - "learning_rate": 3.113906744280946e-05, - "loss": 2.4058, - "step": 216310 - }, - { - "epoch": 0.38, - "learning_rate": 3.113819550288263e-05, - "loss": 2.3641, - "step": 216320 - }, - { - "epoch": 0.38, - "learning_rate": 3.1137323562955804e-05, - "loss": 2.3651, - "step": 216330 - }, - { - "epoch": 0.38, - "learning_rate": 3.113645162302898e-05, - "loss": 2.4574, - "step": 216340 - }, - { - "epoch": 0.38, - "learning_rate": 3.113557968310216e-05, - "loss": 2.395, - "step": 216350 - }, - { - "epoch": 0.38, - "learning_rate": 3.113470774317533e-05, - "loss": 2.3537, - "step": 216360 - }, - { - "epoch": 0.38, - "learning_rate": 3.11338358032485e-05, - "loss": 2.3351, - "step": 216370 - }, - { - "epoch": 0.38, - "learning_rate": 3.1132963863321676e-05, - "loss": 2.3451, - "step": 216380 - }, - { - "epoch": 0.38, - "learning_rate": 3.1132091923394846e-05, - "loss": 2.3632, - "step": 216390 - }, - { - "epoch": 0.38, - "learning_rate": 3.1131219983468017e-05, - "loss": 2.1991, - "step": 216400 - }, - { - "epoch": 0.38, - "learning_rate": 3.1130348043541194e-05, - "loss": 2.4533, - "step": 216410 - }, - { - "epoch": 0.38, - "learning_rate": 3.112947610361437e-05, - "loss": 2.4754, - "step": 216420 - }, - { - "epoch": 0.38, - "learning_rate": 3.112860416368754e-05, - "loss": 2.4361, - "step": 216430 - }, - { - "epoch": 0.38, - "learning_rate": 3.112773222376071e-05, - "loss": 2.38, - "step": 216440 - }, - { - "epoch": 0.38, - "learning_rate": 3.112686028383389e-05, - "loss": 2.3772, - "step": 216450 - }, - { - "epoch": 0.38, - "learning_rate": 3.112598834390706e-05, - "loss": 2.4133, - "step": 216460 - }, - { - "epoch": 0.38, - "learning_rate": 3.112511640398023e-05, - "loss": 2.3722, - "step": 216470 - }, - { - "epoch": 0.38, - "learning_rate": 3.112424446405341e-05, - "loss": 2.3517, - "step": 216480 - }, - { - "epoch": 0.38, - "learning_rate": 3.1123372524126584e-05, - "loss": 2.5136, - "step": 216490 - }, - { - "epoch": 0.38, - "learning_rate": 3.1122500584199754e-05, - "loss": 2.3758, - "step": 216500 - }, - { - "epoch": 0.38, - "learning_rate": 3.1121628644272925e-05, - "loss": 2.4138, - "step": 216510 - }, - { - "epoch": 0.38, - "learning_rate": 3.11207567043461e-05, - "loss": 2.4294, - "step": 216520 - }, - { - "epoch": 0.38, - "learning_rate": 3.111988476441927e-05, - "loss": 2.3976, - "step": 216530 - }, - { - "epoch": 0.38, - "learning_rate": 3.111901282449244e-05, - "loss": 2.4371, - "step": 216540 - }, - { - "epoch": 0.38, - "learning_rate": 3.111814088456562e-05, - "loss": 2.3392, - "step": 216550 - }, - { - "epoch": 0.38, - "learning_rate": 3.11172689446388e-05, - "loss": 2.4953, - "step": 216560 - }, - { - "epoch": 0.38, - "learning_rate": 3.111639700471197e-05, - "loss": 2.4379, - "step": 216570 - }, - { - "epoch": 0.38, - "learning_rate": 3.111552506478514e-05, - "loss": 2.4635, - "step": 216580 - }, - { - "epoch": 0.38, - "learning_rate": 3.1114653124858315e-05, - "loss": 2.4241, - "step": 216590 - }, - { - "epoch": 0.38, - "learning_rate": 3.1113781184931485e-05, - "loss": 2.492, - "step": 216600 - }, - { - "epoch": 0.38, - "learning_rate": 3.1112909245004656e-05, - "loss": 2.5106, - "step": 216610 - }, - { - "epoch": 0.38, - "learning_rate": 3.1112037305077826e-05, - "loss": 2.3478, - "step": 216620 - }, - { - "epoch": 0.38, - "learning_rate": 3.1111165365151e-05, - "loss": 2.4034, - "step": 216630 - }, - { - "epoch": 0.38, - "learning_rate": 3.111029342522418e-05, - "loss": 2.5187, - "step": 216640 - }, - { - "epoch": 0.38, - "learning_rate": 3.110942148529735e-05, - "loss": 2.412, - "step": 216650 - }, - { - "epoch": 0.38, - "learning_rate": 3.110854954537053e-05, - "loss": 2.4121, - "step": 216660 - }, - { - "epoch": 0.38, - "learning_rate": 3.11076776054437e-05, - "loss": 2.4467, - "step": 216670 - }, - { - "epoch": 0.38, - "learning_rate": 3.110680566551687e-05, - "loss": 2.3941, - "step": 216680 - }, - { - "epoch": 0.38, - "learning_rate": 3.110593372559004e-05, - "loss": 2.331, - "step": 216690 - }, - { - "epoch": 0.38, - "learning_rate": 3.1105061785663216e-05, - "loss": 2.3921, - "step": 216700 - }, - { - "epoch": 0.38, - "learning_rate": 3.110418984573639e-05, - "loss": 2.3964, - "step": 216710 - }, - { - "epoch": 0.38, - "learning_rate": 3.1103317905809564e-05, - "loss": 2.4358, - "step": 216720 - }, - { - "epoch": 0.38, - "learning_rate": 3.1102445965882734e-05, - "loss": 2.4416, - "step": 216730 - }, - { - "epoch": 0.38, - "learning_rate": 3.110157402595591e-05, - "loss": 2.5258, - "step": 216740 - }, - { - "epoch": 0.38, - "learning_rate": 3.110070208602908e-05, - "loss": 2.428, - "step": 216750 - }, - { - "epoch": 0.38, - "learning_rate": 3.109983014610225e-05, - "loss": 2.3372, - "step": 216760 - }, - { - "epoch": 0.38, - "learning_rate": 3.109895820617543e-05, - "loss": 2.4613, - "step": 216770 - }, - { - "epoch": 0.38, - "learning_rate": 3.10980862662486e-05, - "loss": 2.2863, - "step": 216780 - }, - { - "epoch": 0.38, - "learning_rate": 3.109721432632178e-05, - "loss": 2.3782, - "step": 216790 - }, - { - "epoch": 0.38, - "learning_rate": 3.109634238639495e-05, - "loss": 2.4668, - "step": 216800 - }, - { - "epoch": 0.38, - "learning_rate": 3.1095470446468124e-05, - "loss": 2.3855, - "step": 216810 - }, - { - "epoch": 0.38, - "learning_rate": 3.1094598506541295e-05, - "loss": 2.3144, - "step": 216820 - }, - { - "epoch": 0.38, - "learning_rate": 3.1093726566614465e-05, - "loss": 2.3664, - "step": 216830 - }, - { - "epoch": 0.38, - "learning_rate": 3.109285462668764e-05, - "loss": 2.4716, - "step": 216840 - }, - { - "epoch": 0.38, - "learning_rate": 3.109198268676081e-05, - "loss": 2.3957, - "step": 216850 - }, - { - "epoch": 0.38, - "learning_rate": 3.109111074683399e-05, - "loss": 2.4055, - "step": 216860 - }, - { - "epoch": 0.38, - "learning_rate": 3.109023880690716e-05, - "loss": 2.3497, - "step": 216870 - }, - { - "epoch": 0.38, - "learning_rate": 3.108936686698034e-05, - "loss": 2.4047, - "step": 216880 - }, - { - "epoch": 0.38, - "learning_rate": 3.108849492705351e-05, - "loss": 2.3191, - "step": 216890 - }, - { - "epoch": 0.38, - "learning_rate": 3.108762298712668e-05, - "loss": 2.4543, - "step": 216900 - }, - { - "epoch": 0.38, - "learning_rate": 3.1086751047199855e-05, - "loss": 2.3936, - "step": 216910 - }, - { - "epoch": 0.38, - "learning_rate": 3.1085879107273025e-05, - "loss": 2.4307, - "step": 216920 - }, - { - "epoch": 0.38, - "learning_rate": 3.1085007167346196e-05, - "loss": 2.4574, - "step": 216930 - }, - { - "epoch": 0.38, - "learning_rate": 3.108413522741937e-05, - "loss": 2.4951, - "step": 216940 - }, - { - "epoch": 0.38, - "learning_rate": 3.108326328749255e-05, - "loss": 2.2821, - "step": 216950 - }, - { - "epoch": 0.38, - "learning_rate": 3.108239134756572e-05, - "loss": 2.3458, - "step": 216960 - }, - { - "epoch": 0.38, - "learning_rate": 3.108151940763889e-05, - "loss": 2.3554, - "step": 216970 - }, - { - "epoch": 0.38, - "learning_rate": 3.108064746771207e-05, - "loss": 2.4126, - "step": 216980 - }, - { - "epoch": 0.38, - "learning_rate": 3.107977552778524e-05, - "loss": 2.3972, - "step": 216990 - }, - { - "epoch": 0.38, - "learning_rate": 3.107890358785841e-05, - "loss": 2.2766, - "step": 217000 - }, - { - "epoch": 0.38, - "learning_rate": 3.1078031647931586e-05, - "loss": 2.3331, - "step": 217010 - }, - { - "epoch": 0.38, - "learning_rate": 3.107715970800476e-05, - "loss": 2.2942, - "step": 217020 - }, - { - "epoch": 0.38, - "learning_rate": 3.1076287768077934e-05, - "loss": 2.4591, - "step": 217030 - }, - { - "epoch": 0.38, - "learning_rate": 3.1075415828151104e-05, - "loss": 2.499, - "step": 217040 - }, - { - "epoch": 0.38, - "learning_rate": 3.107454388822428e-05, - "loss": 2.4917, - "step": 217050 - }, - { - "epoch": 0.38, - "learning_rate": 3.107367194829745e-05, - "loss": 2.5051, - "step": 217060 - }, - { - "epoch": 0.38, - "learning_rate": 3.107280000837062e-05, - "loss": 2.4013, - "step": 217070 - }, - { - "epoch": 0.38, - "learning_rate": 3.107192806844379e-05, - "loss": 2.3216, - "step": 217080 - }, - { - "epoch": 0.38, - "learning_rate": 3.1071056128516976e-05, - "loss": 2.4064, - "step": 217090 - }, - { - "epoch": 0.38, - "learning_rate": 3.1070184188590147e-05, - "loss": 2.3283, - "step": 217100 - }, - { - "epoch": 0.38, - "learning_rate": 3.106931224866332e-05, - "loss": 2.4629, - "step": 217110 - }, - { - "epoch": 0.38, - "learning_rate": 3.106844030873649e-05, - "loss": 2.4501, - "step": 217120 - }, - { - "epoch": 0.38, - "learning_rate": 3.1067568368809664e-05, - "loss": 2.4642, - "step": 217130 - }, - { - "epoch": 0.38, - "learning_rate": 3.1066696428882835e-05, - "loss": 2.4116, - "step": 217140 - }, - { - "epoch": 0.38, - "learning_rate": 3.1065824488956005e-05, - "loss": 2.4402, - "step": 217150 - }, - { - "epoch": 0.38, - "learning_rate": 3.106495254902919e-05, - "loss": 2.3406, - "step": 217160 - }, - { - "epoch": 0.38, - "learning_rate": 3.106408060910236e-05, - "loss": 2.3767, - "step": 217170 - }, - { - "epoch": 0.38, - "learning_rate": 3.106320866917553e-05, - "loss": 2.4677, - "step": 217180 - }, - { - "epoch": 0.38, - "learning_rate": 3.10623367292487e-05, - "loss": 2.3082, - "step": 217190 - }, - { - "epoch": 0.38, - "learning_rate": 3.106146478932188e-05, - "loss": 2.3765, - "step": 217200 - }, - { - "epoch": 0.38, - "learning_rate": 3.106059284939505e-05, - "loss": 2.4774, - "step": 217210 - }, - { - "epoch": 0.38, - "learning_rate": 3.105972090946822e-05, - "loss": 2.4483, - "step": 217220 - }, - { - "epoch": 0.38, - "learning_rate": 3.1058848969541395e-05, - "loss": 2.3856, - "step": 217230 - }, - { - "epoch": 0.38, - "learning_rate": 3.105797702961457e-05, - "loss": 2.3673, - "step": 217240 - }, - { - "epoch": 0.38, - "learning_rate": 3.105710508968774e-05, - "loss": 2.3923, - "step": 217250 - }, - { - "epoch": 0.38, - "learning_rate": 3.105623314976091e-05, - "loss": 2.5076, - "step": 217260 - }, - { - "epoch": 0.38, - "learning_rate": 3.105536120983409e-05, - "loss": 2.4024, - "step": 217270 - }, - { - "epoch": 0.38, - "learning_rate": 3.105448926990726e-05, - "loss": 2.2455, - "step": 217280 - }, - { - "epoch": 0.38, - "learning_rate": 3.105361732998043e-05, - "loss": 2.308, - "step": 217290 - }, - { - "epoch": 0.38, - "learning_rate": 3.105274539005361e-05, - "loss": 2.4372, - "step": 217300 - }, - { - "epoch": 0.38, - "learning_rate": 3.1051873450126786e-05, - "loss": 2.5045, - "step": 217310 - }, - { - "epoch": 0.38, - "learning_rate": 3.1051001510199956e-05, - "loss": 2.5027, - "step": 217320 - }, - { - "epoch": 0.38, - "learning_rate": 3.1050129570273126e-05, - "loss": 2.4675, - "step": 217330 - }, - { - "epoch": 0.38, - "learning_rate": 3.1049257630346304e-05, - "loss": 2.4286, - "step": 217340 - }, - { - "epoch": 0.38, - "learning_rate": 3.1048385690419474e-05, - "loss": 2.2834, - "step": 217350 - }, - { - "epoch": 0.38, - "learning_rate": 3.1047513750492644e-05, - "loss": 2.462, - "step": 217360 - }, - { - "epoch": 0.38, - "learning_rate": 3.104664181056582e-05, - "loss": 2.4126, - "step": 217370 - }, - { - "epoch": 0.38, - "learning_rate": 3.1045769870639e-05, - "loss": 2.4038, - "step": 217380 - }, - { - "epoch": 0.38, - "learning_rate": 3.104489793071217e-05, - "loss": 2.2262, - "step": 217390 - }, - { - "epoch": 0.38, - "learning_rate": 3.104402599078534e-05, - "loss": 2.3882, - "step": 217400 - }, - { - "epoch": 0.38, - "learning_rate": 3.1043154050858517e-05, - "loss": 2.4242, - "step": 217410 - }, - { - "epoch": 0.38, - "learning_rate": 3.104228211093169e-05, - "loss": 2.4444, - "step": 217420 - }, - { - "epoch": 0.38, - "learning_rate": 3.104141017100486e-05, - "loss": 2.4527, - "step": 217430 - }, - { - "epoch": 0.38, - "learning_rate": 3.1040538231078034e-05, - "loss": 2.415, - "step": 217440 - }, - { - "epoch": 0.38, - "learning_rate": 3.1039666291151205e-05, - "loss": 2.3243, - "step": 217450 - }, - { - "epoch": 0.38, - "learning_rate": 3.103879435122438e-05, - "loss": 2.4649, - "step": 217460 - }, - { - "epoch": 0.38, - "learning_rate": 3.103792241129755e-05, - "loss": 2.3634, - "step": 217470 - }, - { - "epoch": 0.38, - "learning_rate": 3.103705047137073e-05, - "loss": 2.4255, - "step": 217480 - }, - { - "epoch": 0.38, - "learning_rate": 3.10361785314439e-05, - "loss": 2.4614, - "step": 217490 - }, - { - "epoch": 0.38, - "learning_rate": 3.103530659151707e-05, - "loss": 2.3921, - "step": 217500 - }, - { - "epoch": 0.38, - "learning_rate": 3.103443465159024e-05, - "loss": 2.3534, - "step": 217510 - }, - { - "epoch": 0.38, - "learning_rate": 3.103356271166342e-05, - "loss": 2.3606, - "step": 217520 - }, - { - "epoch": 0.38, - "learning_rate": 3.1032690771736595e-05, - "loss": 2.4702, - "step": 217530 - }, - { - "epoch": 0.38, - "learning_rate": 3.1031818831809765e-05, - "loss": 2.425, - "step": 217540 - }, - { - "epoch": 0.38, - "learning_rate": 3.103094689188294e-05, - "loss": 2.343, - "step": 217550 - }, - { - "epoch": 0.38, - "learning_rate": 3.103007495195611e-05, - "loss": 2.3816, - "step": 217560 - }, - { - "epoch": 0.38, - "learning_rate": 3.102920301202928e-05, - "loss": 2.4141, - "step": 217570 - }, - { - "epoch": 0.38, - "learning_rate": 3.1028331072102454e-05, - "loss": 2.5183, - "step": 217580 - }, - { - "epoch": 0.38, - "learning_rate": 3.102745913217563e-05, - "loss": 2.4164, - "step": 217590 - }, - { - "epoch": 0.38, - "learning_rate": 3.10265871922488e-05, - "loss": 2.4842, - "step": 217600 - }, - { - "epoch": 0.38, - "learning_rate": 3.102571525232198e-05, - "loss": 2.4135, - "step": 217610 - }, - { - "epoch": 0.38, - "learning_rate": 3.102484331239515e-05, - "loss": 2.3785, - "step": 217620 - }, - { - "epoch": 0.38, - "learning_rate": 3.1023971372468326e-05, - "loss": 2.4552, - "step": 217630 - }, - { - "epoch": 0.38, - "learning_rate": 3.1023099432541496e-05, - "loss": 2.3639, - "step": 217640 - }, - { - "epoch": 0.38, - "learning_rate": 3.102222749261467e-05, - "loss": 2.3514, - "step": 217650 - }, - { - "epoch": 0.38, - "learning_rate": 3.1021355552687844e-05, - "loss": 2.4046, - "step": 217660 - }, - { - "epoch": 0.38, - "learning_rate": 3.1020483612761014e-05, - "loss": 2.3926, - "step": 217670 - }, - { - "epoch": 0.38, - "learning_rate": 3.101961167283419e-05, - "loss": 2.4305, - "step": 217680 - }, - { - "epoch": 0.38, - "learning_rate": 3.101873973290736e-05, - "loss": 2.4456, - "step": 217690 - }, - { - "epoch": 0.38, - "learning_rate": 3.101786779298054e-05, - "loss": 2.2949, - "step": 217700 - }, - { - "epoch": 0.38, - "learning_rate": 3.101699585305371e-05, - "loss": 2.4623, - "step": 217710 - }, - { - "epoch": 0.38, - "learning_rate": 3.101612391312688e-05, - "loss": 2.4671, - "step": 217720 - }, - { - "epoch": 0.38, - "learning_rate": 3.101525197320006e-05, - "loss": 2.3806, - "step": 217730 - }, - { - "epoch": 0.38, - "learning_rate": 3.101438003327323e-05, - "loss": 2.3919, - "step": 217740 - }, - { - "epoch": 0.38, - "learning_rate": 3.1013508093346404e-05, - "loss": 2.4277, - "step": 217750 - }, - { - "epoch": 0.38, - "learning_rate": 3.1012636153419575e-05, - "loss": 2.3928, - "step": 217760 - }, - { - "epoch": 0.38, - "learning_rate": 3.101176421349275e-05, - "loss": 2.418, - "step": 217770 - }, - { - "epoch": 0.38, - "learning_rate": 3.101089227356592e-05, - "loss": 2.4941, - "step": 217780 - }, - { - "epoch": 0.38, - "learning_rate": 3.101002033363909e-05, - "loss": 2.4664, - "step": 217790 - }, - { - "epoch": 0.38, - "learning_rate": 3.100914839371227e-05, - "loss": 2.3574, - "step": 217800 - }, - { - "epoch": 0.38, - "learning_rate": 3.100827645378544e-05, - "loss": 2.3739, - "step": 217810 - }, - { - "epoch": 0.38, - "learning_rate": 3.100740451385861e-05, - "loss": 2.485, - "step": 217820 - }, - { - "epoch": 0.38, - "learning_rate": 3.100653257393179e-05, - "loss": 2.4637, - "step": 217830 - }, - { - "epoch": 0.38, - "learning_rate": 3.1005660634004965e-05, - "loss": 2.417, - "step": 217840 - }, - { - "epoch": 0.38, - "learning_rate": 3.1004788694078135e-05, - "loss": 2.3139, - "step": 217850 - }, - { - "epoch": 0.38, - "learning_rate": 3.1003916754151306e-05, - "loss": 2.4225, - "step": 217860 - }, - { - "epoch": 0.38, - "learning_rate": 3.100304481422448e-05, - "loss": 2.3242, - "step": 217870 - }, - { - "epoch": 0.38, - "learning_rate": 3.100217287429765e-05, - "loss": 2.4239, - "step": 217880 - }, - { - "epoch": 0.38, - "learning_rate": 3.1001300934370824e-05, - "loss": 2.4307, - "step": 217890 - }, - { - "epoch": 0.38, - "learning_rate": 3.1000428994444e-05, - "loss": 2.3686, - "step": 217900 - }, - { - "epoch": 0.38, - "learning_rate": 3.099955705451718e-05, - "loss": 2.4157, - "step": 217910 - }, - { - "epoch": 0.38, - "learning_rate": 3.099868511459035e-05, - "loss": 2.4049, - "step": 217920 - }, - { - "epoch": 0.38, - "learning_rate": 3.099781317466352e-05, - "loss": 2.4367, - "step": 217930 - }, - { - "epoch": 0.38, - "learning_rate": 3.0996941234736696e-05, - "loss": 2.4497, - "step": 217940 - }, - { - "epoch": 0.38, - "learning_rate": 3.0996069294809866e-05, - "loss": 2.3944, - "step": 217950 - }, - { - "epoch": 0.38, - "learning_rate": 3.0995197354883037e-05, - "loss": 2.4804, - "step": 217960 - }, - { - "epoch": 0.38, - "learning_rate": 3.099432541495621e-05, - "loss": 2.4756, - "step": 217970 - }, - { - "epoch": 0.38, - "learning_rate": 3.099345347502939e-05, - "loss": 2.5773, - "step": 217980 - }, - { - "epoch": 0.38, - "learning_rate": 3.099258153510256e-05, - "loss": 2.3881, - "step": 217990 - }, - { - "epoch": 0.38, - "learning_rate": 3.099170959517573e-05, - "loss": 2.4306, - "step": 218000 - }, - { - "epoch": 0.38, - "learning_rate": 3.099083765524891e-05, - "loss": 2.4765, - "step": 218010 - }, - { - "epoch": 0.38, - "learning_rate": 3.098996571532208e-05, - "loss": 2.4428, - "step": 218020 - }, - { - "epoch": 0.38, - "learning_rate": 3.098909377539525e-05, - "loss": 2.4398, - "step": 218030 - }, - { - "epoch": 0.38, - "learning_rate": 3.098822183546842e-05, - "loss": 2.469, - "step": 218040 - }, - { - "epoch": 0.38, - "learning_rate": 3.0987349895541604e-05, - "loss": 2.4706, - "step": 218050 - }, - { - "epoch": 0.38, - "learning_rate": 3.0986477955614774e-05, - "loss": 2.3556, - "step": 218060 - }, - { - "epoch": 0.38, - "learning_rate": 3.0985606015687945e-05, - "loss": 2.3839, - "step": 218070 - }, - { - "epoch": 0.38, - "learning_rate": 3.0984734075761115e-05, - "loss": 2.4811, - "step": 218080 - }, - { - "epoch": 0.38, - "learning_rate": 3.098386213583429e-05, - "loss": 2.4567, - "step": 218090 - }, - { - "epoch": 0.38, - "learning_rate": 3.098299019590746e-05, - "loss": 2.3146, - "step": 218100 - }, - { - "epoch": 0.38, - "learning_rate": 3.098211825598063e-05, - "loss": 2.4289, - "step": 218110 - }, - { - "epoch": 0.38, - "learning_rate": 3.098124631605381e-05, - "loss": 2.3726, - "step": 218120 - }, - { - "epoch": 0.38, - "learning_rate": 3.098037437612699e-05, - "loss": 2.4561, - "step": 218130 - }, - { - "epoch": 0.38, - "learning_rate": 3.097950243620016e-05, - "loss": 2.3417, - "step": 218140 - }, - { - "epoch": 0.38, - "learning_rate": 3.097863049627333e-05, - "loss": 2.3546, - "step": 218150 - }, - { - "epoch": 0.38, - "learning_rate": 3.0977758556346505e-05, - "loss": 2.3691, - "step": 218160 - }, - { - "epoch": 0.38, - "learning_rate": 3.0976886616419676e-05, - "loss": 2.4856, - "step": 218170 - }, - { - "epoch": 0.38, - "learning_rate": 3.0976014676492846e-05, - "loss": 2.5545, - "step": 218180 - }, - { - "epoch": 0.38, - "learning_rate": 3.097514273656602e-05, - "loss": 2.4226, - "step": 218190 - }, - { - "epoch": 0.38, - "learning_rate": 3.09742707966392e-05, - "loss": 2.4539, - "step": 218200 - }, - { - "epoch": 0.38, - "learning_rate": 3.097339885671237e-05, - "loss": 2.4321, - "step": 218210 - }, - { - "epoch": 0.38, - "learning_rate": 3.097252691678554e-05, - "loss": 2.303, - "step": 218220 - }, - { - "epoch": 0.38, - "learning_rate": 3.097165497685872e-05, - "loss": 2.4495, - "step": 218230 - }, - { - "epoch": 0.38, - "learning_rate": 3.097078303693189e-05, - "loss": 2.518, - "step": 218240 - }, - { - "epoch": 0.38, - "learning_rate": 3.096991109700506e-05, - "loss": 2.45, - "step": 218250 - }, - { - "epoch": 0.38, - "learning_rate": 3.0969039157078236e-05, - "loss": 2.4445, - "step": 218260 - }, - { - "epoch": 0.38, - "learning_rate": 3.0968167217151407e-05, - "loss": 2.3831, - "step": 218270 - }, - { - "epoch": 0.38, - "learning_rate": 3.0967295277224584e-05, - "loss": 2.3795, - "step": 218280 - }, - { - "epoch": 0.38, - "learning_rate": 3.0966423337297754e-05, - "loss": 2.3446, - "step": 218290 - }, - { - "epoch": 0.38, - "learning_rate": 3.096555139737093e-05, - "loss": 2.3345, - "step": 218300 - }, - { - "epoch": 0.38, - "learning_rate": 3.09646794574441e-05, - "loss": 2.3919, - "step": 218310 - }, - { - "epoch": 0.38, - "learning_rate": 3.096380751751727e-05, - "loss": 2.397, - "step": 218320 - }, - { - "epoch": 0.38, - "learning_rate": 3.096293557759045e-05, - "loss": 2.4504, - "step": 218330 - }, - { - "epoch": 0.38, - "learning_rate": 3.096206363766362e-05, - "loss": 2.3957, - "step": 218340 - }, - { - "epoch": 0.38, - "learning_rate": 3.09611916977368e-05, - "loss": 2.4119, - "step": 218350 - }, - { - "epoch": 0.38, - "learning_rate": 3.096031975780997e-05, - "loss": 2.4082, - "step": 218360 - }, - { - "epoch": 0.38, - "learning_rate": 3.0959447817883144e-05, - "loss": 2.4047, - "step": 218370 - }, - { - "epoch": 0.38, - "learning_rate": 3.0958575877956315e-05, - "loss": 2.3311, - "step": 218380 - }, - { - "epoch": 0.38, - "learning_rate": 3.0957703938029485e-05, - "loss": 2.3955, - "step": 218390 - }, - { - "epoch": 0.38, - "learning_rate": 3.095683199810266e-05, - "loss": 2.3495, - "step": 218400 - }, - { - "epoch": 0.38, - "learning_rate": 3.095596005817583e-05, - "loss": 2.4512, - "step": 218410 - }, - { - "epoch": 0.38, - "learning_rate": 3.095508811824901e-05, - "loss": 2.4399, - "step": 218420 - }, - { - "epoch": 0.38, - "learning_rate": 3.095421617832218e-05, - "loss": 2.3573, - "step": 218430 - }, - { - "epoch": 0.38, - "learning_rate": 3.095334423839536e-05, - "loss": 2.3385, - "step": 218440 - }, - { - "epoch": 0.38, - "learning_rate": 3.095247229846853e-05, - "loss": 2.4026, - "step": 218450 - }, - { - "epoch": 0.38, - "learning_rate": 3.09516003585417e-05, - "loss": 2.4856, - "step": 218460 - }, - { - "epoch": 0.38, - "learning_rate": 3.095072841861487e-05, - "loss": 2.3993, - "step": 218470 - }, - { - "epoch": 0.38, - "learning_rate": 3.0949856478688046e-05, - "loss": 2.439, - "step": 218480 - }, - { - "epoch": 0.38, - "learning_rate": 3.0948984538761216e-05, - "loss": 2.4042, - "step": 218490 - }, - { - "epoch": 0.38, - "learning_rate": 3.094811259883439e-05, - "loss": 2.4398, - "step": 218500 - }, - { - "epoch": 0.38, - "learning_rate": 3.094724065890757e-05, - "loss": 2.4334, - "step": 218510 - }, - { - "epoch": 0.38, - "learning_rate": 3.094636871898074e-05, - "loss": 2.4154, - "step": 218520 - }, - { - "epoch": 0.38, - "learning_rate": 3.094549677905391e-05, - "loss": 2.4137, - "step": 218530 - }, - { - "epoch": 0.38, - "learning_rate": 3.094462483912708e-05, - "loss": 2.4037, - "step": 218540 - }, - { - "epoch": 0.38, - "learning_rate": 3.094375289920026e-05, - "loss": 2.3949, - "step": 218550 - }, - { - "epoch": 0.38, - "learning_rate": 3.094288095927343e-05, - "loss": 2.4996, - "step": 218560 - }, - { - "epoch": 0.38, - "learning_rate": 3.0942009019346606e-05, - "loss": 2.4877, - "step": 218570 - }, - { - "epoch": 0.38, - "learning_rate": 3.0941137079419776e-05, - "loss": 2.4115, - "step": 218580 - }, - { - "epoch": 0.38, - "learning_rate": 3.0940265139492954e-05, - "loss": 2.3796, - "step": 218590 - }, - { - "epoch": 0.38, - "learning_rate": 3.0939393199566124e-05, - "loss": 2.5107, - "step": 218600 - }, - { - "epoch": 0.38, - "learning_rate": 3.0938521259639294e-05, - "loss": 2.3803, - "step": 218610 - }, - { - "epoch": 0.38, - "learning_rate": 3.093764931971247e-05, - "loss": 2.2734, - "step": 218620 - }, - { - "epoch": 0.38, - "learning_rate": 3.093677737978564e-05, - "loss": 2.4496, - "step": 218630 - }, - { - "epoch": 0.38, - "learning_rate": 3.093590543985881e-05, - "loss": 2.4128, - "step": 218640 - }, - { - "epoch": 0.38, - "learning_rate": 3.093503349993199e-05, - "loss": 2.3573, - "step": 218650 - }, - { - "epoch": 0.38, - "learning_rate": 3.0934161560005167e-05, - "loss": 2.4494, - "step": 218660 - }, - { - "epoch": 0.38, - "learning_rate": 3.093328962007834e-05, - "loss": 2.4519, - "step": 218670 - }, - { - "epoch": 0.38, - "learning_rate": 3.093241768015151e-05, - "loss": 2.5883, - "step": 218680 - }, - { - "epoch": 0.38, - "learning_rate": 3.0931545740224685e-05, - "loss": 2.4336, - "step": 218690 - }, - { - "epoch": 0.38, - "learning_rate": 3.0930673800297855e-05, - "loss": 2.2765, - "step": 218700 - }, - { - "epoch": 0.38, - "learning_rate": 3.0929801860371025e-05, - "loss": 2.4942, - "step": 218710 - }, - { - "epoch": 0.38, - "learning_rate": 3.09289299204442e-05, - "loss": 2.3079, - "step": 218720 - }, - { - "epoch": 0.38, - "learning_rate": 3.092805798051738e-05, - "loss": 2.3511, - "step": 218730 - }, - { - "epoch": 0.38, - "learning_rate": 3.092718604059055e-05, - "loss": 2.5402, - "step": 218740 - }, - { - "epoch": 0.38, - "learning_rate": 3.092631410066372e-05, - "loss": 2.3192, - "step": 218750 - }, - { - "epoch": 0.38, - "learning_rate": 3.09254421607369e-05, - "loss": 2.3571, - "step": 218760 - }, - { - "epoch": 0.38, - "learning_rate": 3.092457022081007e-05, - "loss": 2.3554, - "step": 218770 - }, - { - "epoch": 0.38, - "learning_rate": 3.092369828088324e-05, - "loss": 2.2394, - "step": 218780 - }, - { - "epoch": 0.38, - "learning_rate": 3.0922826340956415e-05, - "loss": 2.4372, - "step": 218790 - }, - { - "epoch": 0.38, - "learning_rate": 3.092195440102959e-05, - "loss": 2.3665, - "step": 218800 - }, - { - "epoch": 0.38, - "learning_rate": 3.092108246110276e-05, - "loss": 2.4756, - "step": 218810 - }, - { - "epoch": 0.38, - "learning_rate": 3.092021052117593e-05, - "loss": 2.3534, - "step": 218820 - }, - { - "epoch": 0.38, - "learning_rate": 3.091933858124911e-05, - "loss": 2.4686, - "step": 218830 - }, - { - "epoch": 0.38, - "learning_rate": 3.091846664132228e-05, - "loss": 2.4002, - "step": 218840 - }, - { - "epoch": 0.38, - "learning_rate": 3.091759470139545e-05, - "loss": 2.3567, - "step": 218850 - }, - { - "epoch": 0.38, - "learning_rate": 3.091672276146862e-05, - "loss": 2.3728, - "step": 218860 - }, - { - "epoch": 0.38, - "learning_rate": 3.0915850821541806e-05, - "loss": 2.3398, - "step": 218870 - }, - { - "epoch": 0.38, - "learning_rate": 3.0914978881614976e-05, - "loss": 2.339, - "step": 218880 - }, - { - "epoch": 0.38, - "learning_rate": 3.0914106941688146e-05, - "loss": 2.4888, - "step": 218890 - }, - { - "epoch": 0.38, - "learning_rate": 3.0913235001761324e-05, - "loss": 2.4843, - "step": 218900 - }, - { - "epoch": 0.38, - "learning_rate": 3.0912363061834494e-05, - "loss": 2.542, - "step": 218910 - }, - { - "epoch": 0.38, - "learning_rate": 3.0911491121907664e-05, - "loss": 2.4153, - "step": 218920 - }, - { - "epoch": 0.38, - "learning_rate": 3.0910619181980835e-05, - "loss": 2.3253, - "step": 218930 - }, - { - "epoch": 0.38, - "learning_rate": 3.090974724205401e-05, - "loss": 2.4235, - "step": 218940 - }, - { - "epoch": 0.38, - "learning_rate": 3.090887530212719e-05, - "loss": 2.4738, - "step": 218950 - }, - { - "epoch": 0.38, - "learning_rate": 3.090800336220036e-05, - "loss": 2.4123, - "step": 218960 - }, - { - "epoch": 0.38, - "learning_rate": 3.090713142227353e-05, - "loss": 2.3408, - "step": 218970 - }, - { - "epoch": 0.38, - "learning_rate": 3.090625948234671e-05, - "loss": 2.3451, - "step": 218980 - }, - { - "epoch": 0.38, - "learning_rate": 3.090538754241988e-05, - "loss": 2.2698, - "step": 218990 - }, - { - "epoch": 0.38, - "learning_rate": 3.090451560249305e-05, - "loss": 2.4378, - "step": 219000 - }, - { - "epoch": 0.38, - "learning_rate": 3.0903643662566225e-05, - "loss": 2.4308, - "step": 219010 - }, - { - "epoch": 0.38, - "learning_rate": 3.09027717226394e-05, - "loss": 2.2904, - "step": 219020 - }, - { - "epoch": 0.38, - "learning_rate": 3.090189978271257e-05, - "loss": 2.4327, - "step": 219030 - }, - { - "epoch": 0.38, - "learning_rate": 3.090102784278574e-05, - "loss": 2.2951, - "step": 219040 - }, - { - "epoch": 0.38, - "learning_rate": 3.090015590285892e-05, - "loss": 2.3841, - "step": 219050 - }, - { - "epoch": 0.38, - "learning_rate": 3.089928396293209e-05, - "loss": 2.2962, - "step": 219060 - }, - { - "epoch": 0.38, - "learning_rate": 3.089841202300526e-05, - "loss": 2.4271, - "step": 219070 - }, - { - "epoch": 0.38, - "learning_rate": 3.089754008307844e-05, - "loss": 2.3686, - "step": 219080 - }, - { - "epoch": 0.38, - "learning_rate": 3.0896668143151615e-05, - "loss": 2.4467, - "step": 219090 - }, - { - "epoch": 0.38, - "learning_rate": 3.0895796203224785e-05, - "loss": 2.3321, - "step": 219100 - }, - { - "epoch": 0.38, - "learning_rate": 3.0894924263297956e-05, - "loss": 2.449, - "step": 219110 - }, - { - "epoch": 0.38, - "learning_rate": 3.089405232337113e-05, - "loss": 2.3713, - "step": 219120 - }, - { - "epoch": 0.38, - "learning_rate": 3.08931803834443e-05, - "loss": 2.4259, - "step": 219130 - }, - { - "epoch": 0.38, - "learning_rate": 3.0892308443517474e-05, - "loss": 2.4179, - "step": 219140 - }, - { - "epoch": 0.38, - "learning_rate": 3.089143650359065e-05, - "loss": 2.4932, - "step": 219150 - }, - { - "epoch": 0.38, - "learning_rate": 3.089056456366382e-05, - "loss": 2.3979, - "step": 219160 - }, - { - "epoch": 0.38, - "learning_rate": 3.0889692623737e-05, - "loss": 2.3317, - "step": 219170 - }, - { - "epoch": 0.38, - "learning_rate": 3.088882068381017e-05, - "loss": 2.4597, - "step": 219180 - }, - { - "epoch": 0.38, - "learning_rate": 3.0887948743883346e-05, - "loss": 2.304, - "step": 219190 - }, - { - "epoch": 0.38, - "learning_rate": 3.0887076803956516e-05, - "loss": 2.388, - "step": 219200 - }, - { - "epoch": 0.38, - "learning_rate": 3.088620486402969e-05, - "loss": 2.3984, - "step": 219210 - }, - { - "epoch": 0.38, - "learning_rate": 3.0885332924102864e-05, - "loss": 2.4573, - "step": 219220 - }, - { - "epoch": 0.38, - "learning_rate": 3.0884460984176034e-05, - "loss": 2.3247, - "step": 219230 - }, - { - "epoch": 0.38, - "learning_rate": 3.088358904424921e-05, - "loss": 2.451, - "step": 219240 - }, - { - "epoch": 0.38, - "learning_rate": 3.088271710432238e-05, - "loss": 2.4613, - "step": 219250 - }, - { - "epoch": 0.38, - "learning_rate": 3.088184516439556e-05, - "loss": 2.5041, - "step": 219260 - }, - { - "epoch": 0.38, - "learning_rate": 3.088097322446873e-05, - "loss": 2.3757, - "step": 219270 - }, - { - "epoch": 0.38, - "learning_rate": 3.08801012845419e-05, - "loss": 2.3702, - "step": 219280 - }, - { - "epoch": 0.38, - "learning_rate": 3.087922934461508e-05, - "loss": 2.3216, - "step": 219290 - }, - { - "epoch": 0.38, - "learning_rate": 3.087835740468825e-05, - "loss": 2.3721, - "step": 219300 - }, - { - "epoch": 0.38, - "learning_rate": 3.087748546476142e-05, - "loss": 2.3188, - "step": 219310 - }, - { - "epoch": 0.38, - "learning_rate": 3.0876613524834595e-05, - "loss": 2.4671, - "step": 219320 - }, - { - "epoch": 0.38, - "learning_rate": 3.087574158490777e-05, - "loss": 2.4944, - "step": 219330 - }, - { - "epoch": 0.38, - "learning_rate": 3.087486964498094e-05, - "loss": 2.5027, - "step": 219340 - }, - { - "epoch": 0.38, - "learning_rate": 3.087399770505411e-05, - "loss": 2.3971, - "step": 219350 - }, - { - "epoch": 0.38, - "learning_rate": 3.087312576512729e-05, - "loss": 2.3181, - "step": 219360 - }, - { - "epoch": 0.38, - "learning_rate": 3.087225382520046e-05, - "loss": 2.401, - "step": 219370 - }, - { - "epoch": 0.38, - "learning_rate": 3.087138188527363e-05, - "loss": 2.3652, - "step": 219380 - }, - { - "epoch": 0.38, - "learning_rate": 3.087050994534681e-05, - "loss": 2.4736, - "step": 219390 - }, - { - "epoch": 0.38, - "learning_rate": 3.0869638005419985e-05, - "loss": 2.3452, - "step": 219400 - }, - { - "epoch": 0.38, - "learning_rate": 3.0868766065493155e-05, - "loss": 2.4165, - "step": 219410 - }, - { - "epoch": 0.38, - "learning_rate": 3.0867894125566326e-05, - "loss": 2.416, - "step": 219420 - }, - { - "epoch": 0.38, - "learning_rate": 3.0867022185639496e-05, - "loss": 2.3319, - "step": 219430 - }, - { - "epoch": 0.38, - "learning_rate": 3.086615024571267e-05, - "loss": 2.3446, - "step": 219440 - }, - { - "epoch": 0.38, - "learning_rate": 3.0865278305785844e-05, - "loss": 2.3673, - "step": 219450 - }, - { - "epoch": 0.38, - "learning_rate": 3.0864406365859014e-05, - "loss": 2.3972, - "step": 219460 - }, - { - "epoch": 0.38, - "learning_rate": 3.08635344259322e-05, - "loss": 2.3483, - "step": 219470 - }, - { - "epoch": 0.38, - "learning_rate": 3.086266248600537e-05, - "loss": 2.3019, - "step": 219480 - }, - { - "epoch": 0.38, - "learning_rate": 3.086179054607854e-05, - "loss": 2.4144, - "step": 219490 - }, - { - "epoch": 0.38, - "learning_rate": 3.086091860615171e-05, - "loss": 2.3565, - "step": 219500 - }, - { - "epoch": 0.38, - "learning_rate": 3.0860046666224886e-05, - "loss": 2.2501, - "step": 219510 - }, - { - "epoch": 0.38, - "learning_rate": 3.0859174726298057e-05, - "loss": 2.3973, - "step": 219520 - }, - { - "epoch": 0.38, - "learning_rate": 3.085830278637123e-05, - "loss": 2.4944, - "step": 219530 - }, - { - "epoch": 0.38, - "learning_rate": 3.0857430846444404e-05, - "loss": 2.4709, - "step": 219540 - }, - { - "epoch": 0.38, - "learning_rate": 3.085655890651758e-05, - "loss": 2.4557, - "step": 219550 - }, - { - "epoch": 0.38, - "learning_rate": 3.085568696659075e-05, - "loss": 2.4846, - "step": 219560 - }, - { - "epoch": 0.38, - "learning_rate": 3.085481502666392e-05, - "loss": 2.4258, - "step": 219570 - }, - { - "epoch": 0.38, - "learning_rate": 3.08539430867371e-05, - "loss": 2.4485, - "step": 219580 - }, - { - "epoch": 0.38, - "learning_rate": 3.085307114681027e-05, - "loss": 2.4369, - "step": 219590 - }, - { - "epoch": 0.38, - "learning_rate": 3.085219920688344e-05, - "loss": 2.4114, - "step": 219600 - }, - { - "epoch": 0.38, - "learning_rate": 3.085132726695662e-05, - "loss": 2.3056, - "step": 219610 - }, - { - "epoch": 0.38, - "learning_rate": 3.0850455327029794e-05, - "loss": 2.3453, - "step": 219620 - }, - { - "epoch": 0.38, - "learning_rate": 3.0849583387102965e-05, - "loss": 2.507, - "step": 219630 - }, - { - "epoch": 0.38, - "learning_rate": 3.0848711447176135e-05, - "loss": 2.453, - "step": 219640 - }, - { - "epoch": 0.38, - "learning_rate": 3.084783950724931e-05, - "loss": 2.3168, - "step": 219650 - }, - { - "epoch": 0.38, - "learning_rate": 3.084696756732248e-05, - "loss": 2.3585, - "step": 219660 - }, - { - "epoch": 0.38, - "learning_rate": 3.084609562739565e-05, - "loss": 2.4609, - "step": 219670 - }, - { - "epoch": 0.38, - "learning_rate": 3.084522368746883e-05, - "loss": 2.4161, - "step": 219680 - }, - { - "epoch": 0.38, - "learning_rate": 3.084435174754201e-05, - "loss": 2.3752, - "step": 219690 - }, - { - "epoch": 0.38, - "learning_rate": 3.084347980761518e-05, - "loss": 2.4033, - "step": 219700 - }, - { - "epoch": 0.38, - "learning_rate": 3.084260786768835e-05, - "loss": 2.4724, - "step": 219710 - }, - { - "epoch": 0.38, - "learning_rate": 3.0841735927761525e-05, - "loss": 2.4783, - "step": 219720 - }, - { - "epoch": 0.38, - "learning_rate": 3.0840863987834696e-05, - "loss": 2.5021, - "step": 219730 - }, - { - "epoch": 0.38, - "learning_rate": 3.0839992047907866e-05, - "loss": 2.4954, - "step": 219740 - }, - { - "epoch": 0.38, - "learning_rate": 3.083912010798104e-05, - "loss": 2.3791, - "step": 219750 - }, - { - "epoch": 0.38, - "learning_rate": 3.083824816805422e-05, - "loss": 2.3617, - "step": 219760 - }, - { - "epoch": 0.38, - "learning_rate": 3.083737622812739e-05, - "loss": 2.4164, - "step": 219770 - }, - { - "epoch": 0.38, - "learning_rate": 3.083650428820056e-05, - "loss": 2.3965, - "step": 219780 - }, - { - "epoch": 0.38, - "learning_rate": 3.083563234827374e-05, - "loss": 2.4316, - "step": 219790 - }, - { - "epoch": 0.38, - "learning_rate": 3.083476040834691e-05, - "loss": 2.3516, - "step": 219800 - }, - { - "epoch": 0.38, - "learning_rate": 3.083388846842008e-05, - "loss": 2.4541, - "step": 219810 - }, - { - "epoch": 0.38, - "learning_rate": 3.083301652849325e-05, - "loss": 2.4653, - "step": 219820 - }, - { - "epoch": 0.38, - "learning_rate": 3.0832144588566427e-05, - "loss": 2.3306, - "step": 219830 - }, - { - "epoch": 0.38, - "learning_rate": 3.0831272648639604e-05, - "loss": 2.4571, - "step": 219840 - }, - { - "epoch": 0.38, - "learning_rate": 3.0830400708712774e-05, - "loss": 2.3896, - "step": 219850 - }, - { - "epoch": 0.38, - "learning_rate": 3.082952876878595e-05, - "loss": 2.4494, - "step": 219860 - }, - { - "epoch": 0.38, - "learning_rate": 3.082865682885912e-05, - "loss": 2.3522, - "step": 219870 - }, - { - "epoch": 0.38, - "learning_rate": 3.082778488893229e-05, - "loss": 2.4299, - "step": 219880 - }, - { - "epoch": 0.38, - "learning_rate": 3.082691294900546e-05, - "loss": 2.3781, - "step": 219890 - }, - { - "epoch": 0.38, - "learning_rate": 3.082604100907864e-05, - "loss": 2.422, - "step": 219900 - }, - { - "epoch": 0.38, - "learning_rate": 3.082516906915182e-05, - "loss": 2.4191, - "step": 219910 - }, - { - "epoch": 0.38, - "learning_rate": 3.082429712922499e-05, - "loss": 2.3743, - "step": 219920 - }, - { - "epoch": 0.38, - "learning_rate": 3.082342518929816e-05, - "loss": 2.3307, - "step": 219930 - }, - { - "epoch": 0.38, - "learning_rate": 3.0822553249371335e-05, - "loss": 2.3893, - "step": 219940 - }, - { - "epoch": 0.38, - "learning_rate": 3.0821681309444505e-05, - "loss": 2.4206, - "step": 219950 - }, - { - "epoch": 0.38, - "learning_rate": 3.0820809369517675e-05, - "loss": 2.3648, - "step": 219960 - }, - { - "epoch": 0.38, - "learning_rate": 3.081993742959085e-05, - "loss": 2.3318, - "step": 219970 - }, - { - "epoch": 0.38, - "learning_rate": 3.081906548966402e-05, - "loss": 2.3309, - "step": 219980 - }, - { - "epoch": 0.38, - "learning_rate": 3.08181935497372e-05, - "loss": 2.3593, - "step": 219990 - }, - { - "epoch": 0.38, - "learning_rate": 3.081732160981037e-05, - "loss": 2.4683, - "step": 220000 - }, - { - "epoch": 0.38, - "learning_rate": 3.081644966988355e-05, - "loss": 2.3946, - "step": 220010 - }, - { - "epoch": 0.38, - "learning_rate": 3.081557772995672e-05, - "loss": 2.3775, - "step": 220020 - }, - { - "epoch": 0.38, - "learning_rate": 3.081470579002989e-05, - "loss": 2.434, - "step": 220030 - }, - { - "epoch": 0.38, - "learning_rate": 3.0813833850103066e-05, - "loss": 2.3122, - "step": 220040 - }, - { - "epoch": 0.38, - "learning_rate": 3.0812961910176236e-05, - "loss": 2.4275, - "step": 220050 - }, - { - "epoch": 0.38, - "learning_rate": 3.081208997024941e-05, - "loss": 2.4542, - "step": 220060 - }, - { - "epoch": 0.38, - "learning_rate": 3.0811218030322583e-05, - "loss": 2.4001, - "step": 220070 - }, - { - "epoch": 0.38, - "learning_rate": 3.081034609039576e-05, - "loss": 2.4276, - "step": 220080 - }, - { - "epoch": 0.38, - "learning_rate": 3.080947415046893e-05, - "loss": 2.4589, - "step": 220090 - }, - { - "epoch": 0.38, - "learning_rate": 3.08086022105421e-05, - "loss": 2.4639, - "step": 220100 - }, - { - "epoch": 0.38, - "learning_rate": 3.080773027061528e-05, - "loss": 2.4465, - "step": 220110 - }, - { - "epoch": 0.38, - "learning_rate": 3.080685833068845e-05, - "loss": 2.3854, - "step": 220120 - }, - { - "epoch": 0.38, - "learning_rate": 3.080598639076162e-05, - "loss": 2.3576, - "step": 220130 - }, - { - "epoch": 0.38, - "learning_rate": 3.0805114450834796e-05, - "loss": 2.4477, - "step": 220140 - }, - { - "epoch": 0.38, - "learning_rate": 3.0804242510907974e-05, - "loss": 2.3764, - "step": 220150 - }, - { - "epoch": 0.38, - "learning_rate": 3.0803370570981144e-05, - "loss": 2.4282, - "step": 220160 - }, - { - "epoch": 0.38, - "learning_rate": 3.0802498631054314e-05, - "loss": 2.4217, - "step": 220170 - }, - { - "epoch": 0.38, - "learning_rate": 3.080162669112749e-05, - "loss": 2.4261, - "step": 220180 - }, - { - "epoch": 0.38, - "learning_rate": 3.080075475120066e-05, - "loss": 2.4379, - "step": 220190 - }, - { - "epoch": 0.38, - "learning_rate": 3.079988281127383e-05, - "loss": 2.5129, - "step": 220200 - }, - { - "epoch": 0.38, - "learning_rate": 3.079901087134701e-05, - "loss": 2.4443, - "step": 220210 - }, - { - "epoch": 0.38, - "learning_rate": 3.0798138931420187e-05, - "loss": 2.3999, - "step": 220220 - }, - { - "epoch": 0.38, - "learning_rate": 3.079726699149336e-05, - "loss": 2.4491, - "step": 220230 - }, - { - "epoch": 0.38, - "learning_rate": 3.079639505156653e-05, - "loss": 2.4375, - "step": 220240 - }, - { - "epoch": 0.38, - "learning_rate": 3.0795523111639705e-05, - "loss": 2.2736, - "step": 220250 - }, - { - "epoch": 0.38, - "learning_rate": 3.0794651171712875e-05, - "loss": 2.482, - "step": 220260 - }, - { - "epoch": 0.38, - "learning_rate": 3.0793779231786045e-05, - "loss": 2.5344, - "step": 220270 - }, - { - "epoch": 0.38, - "learning_rate": 3.079290729185922e-05, - "loss": 2.3401, - "step": 220280 - }, - { - "epoch": 0.38, - "learning_rate": 3.07920353519324e-05, - "loss": 2.6185, - "step": 220290 - }, - { - "epoch": 0.38, - "learning_rate": 3.079116341200557e-05, - "loss": 2.4605, - "step": 220300 - }, - { - "epoch": 0.38, - "learning_rate": 3.079029147207874e-05, - "loss": 2.3403, - "step": 220310 - }, - { - "epoch": 0.38, - "learning_rate": 3.078941953215191e-05, - "loss": 2.5613, - "step": 220320 - }, - { - "epoch": 0.38, - "learning_rate": 3.078854759222509e-05, - "loss": 2.4331, - "step": 220330 - }, - { - "epoch": 0.38, - "learning_rate": 3.078767565229826e-05, - "loss": 2.3263, - "step": 220340 - }, - { - "epoch": 0.38, - "learning_rate": 3.078680371237143e-05, - "loss": 2.3976, - "step": 220350 - }, - { - "epoch": 0.38, - "learning_rate": 3.078593177244461e-05, - "loss": 2.3361, - "step": 220360 - }, - { - "epoch": 0.38, - "learning_rate": 3.078505983251778e-05, - "loss": 2.5645, - "step": 220370 - }, - { - "epoch": 0.38, - "learning_rate": 3.078418789259095e-05, - "loss": 2.265, - "step": 220380 - }, - { - "epoch": 0.38, - "learning_rate": 3.0783315952664124e-05, - "loss": 2.3827, - "step": 220390 - }, - { - "epoch": 0.38, - "learning_rate": 3.07824440127373e-05, - "loss": 2.4246, - "step": 220400 - }, - { - "epoch": 0.38, - "learning_rate": 3.078157207281047e-05, - "loss": 2.3858, - "step": 220410 - }, - { - "epoch": 0.38, - "learning_rate": 3.078070013288364e-05, - "loss": 2.4091, - "step": 220420 - }, - { - "epoch": 0.38, - "learning_rate": 3.077982819295682e-05, - "loss": 2.2833, - "step": 220430 - }, - { - "epoch": 0.38, - "learning_rate": 3.0778956253029996e-05, - "loss": 2.4121, - "step": 220440 - }, - { - "epoch": 0.38, - "learning_rate": 3.0778084313103166e-05, - "loss": 2.3893, - "step": 220450 - }, - { - "epoch": 0.38, - "learning_rate": 3.077721237317634e-05, - "loss": 2.3872, - "step": 220460 - }, - { - "epoch": 0.38, - "learning_rate": 3.0776340433249514e-05, - "loss": 2.3849, - "step": 220470 - }, - { - "epoch": 0.38, - "learning_rate": 3.0775468493322684e-05, - "loss": 2.3256, - "step": 220480 - }, - { - "epoch": 0.38, - "learning_rate": 3.0774596553395855e-05, - "loss": 2.4281, - "step": 220490 - }, - { - "epoch": 0.38, - "learning_rate": 3.077372461346903e-05, - "loss": 2.3624, - "step": 220500 - }, - { - "epoch": 0.38, - "learning_rate": 3.077285267354221e-05, - "loss": 2.4482, - "step": 220510 - }, - { - "epoch": 0.38, - "learning_rate": 3.077198073361538e-05, - "loss": 2.4134, - "step": 220520 - }, - { - "epoch": 0.38, - "learning_rate": 3.077110879368855e-05, - "loss": 2.4123, - "step": 220530 - }, - { - "epoch": 0.38, - "learning_rate": 3.077023685376173e-05, - "loss": 2.4431, - "step": 220540 - }, - { - "epoch": 0.38, - "learning_rate": 3.07693649138349e-05, - "loss": 2.4778, - "step": 220550 - }, - { - "epoch": 0.38, - "learning_rate": 3.076849297390807e-05, - "loss": 2.4132, - "step": 220560 - }, - { - "epoch": 0.38, - "learning_rate": 3.0767621033981245e-05, - "loss": 2.4273, - "step": 220570 - }, - { - "epoch": 0.38, - "learning_rate": 3.076674909405442e-05, - "loss": 2.4297, - "step": 220580 - }, - { - "epoch": 0.38, - "learning_rate": 3.076587715412759e-05, - "loss": 2.405, - "step": 220590 - }, - { - "epoch": 0.38, - "learning_rate": 3.076500521420076e-05, - "loss": 2.4745, - "step": 220600 - }, - { - "epoch": 0.38, - "learning_rate": 3.076413327427394e-05, - "loss": 2.3984, - "step": 220610 - }, - { - "epoch": 0.38, - "learning_rate": 3.076326133434711e-05, - "loss": 2.4243, - "step": 220620 - }, - { - "epoch": 0.38, - "learning_rate": 3.076238939442028e-05, - "loss": 2.3327, - "step": 220630 - }, - { - "epoch": 0.38, - "learning_rate": 3.076151745449346e-05, - "loss": 2.4472, - "step": 220640 - }, - { - "epoch": 0.38, - "learning_rate": 3.076064551456663e-05, - "loss": 2.4225, - "step": 220650 - }, - { - "epoch": 0.38, - "learning_rate": 3.0759773574639805e-05, - "loss": 2.3931, - "step": 220660 - }, - { - "epoch": 0.38, - "learning_rate": 3.0758901634712976e-05, - "loss": 2.4382, - "step": 220670 - }, - { - "epoch": 0.38, - "learning_rate": 3.075802969478615e-05, - "loss": 2.4582, - "step": 220680 - }, - { - "epoch": 0.38, - "learning_rate": 3.075715775485932e-05, - "loss": 2.4426, - "step": 220690 - }, - { - "epoch": 0.38, - "learning_rate": 3.0756285814932494e-05, - "loss": 2.2736, - "step": 220700 - }, - { - "epoch": 0.38, - "learning_rate": 3.075541387500567e-05, - "loss": 2.4874, - "step": 220710 - }, - { - "epoch": 0.38, - "learning_rate": 3.075454193507884e-05, - "loss": 2.5076, - "step": 220720 - }, - { - "epoch": 0.38, - "learning_rate": 3.075366999515202e-05, - "loss": 2.5026, - "step": 220730 - }, - { - "epoch": 0.38, - "learning_rate": 3.075279805522519e-05, - "loss": 2.5884, - "step": 220740 - }, - { - "epoch": 0.38, - "learning_rate": 3.0751926115298366e-05, - "loss": 2.2963, - "step": 220750 - }, - { - "epoch": 0.38, - "learning_rate": 3.0751054175371536e-05, - "loss": 2.4193, - "step": 220760 - }, - { - "epoch": 0.38, - "learning_rate": 3.075018223544471e-05, - "loss": 2.2332, - "step": 220770 - }, - { - "epoch": 0.39, - "learning_rate": 3.074931029551788e-05, - "loss": 2.4148, - "step": 220780 - }, - { - "epoch": 0.39, - "learning_rate": 3.0748438355591054e-05, - "loss": 2.5514, - "step": 220790 - }, - { - "epoch": 0.39, - "learning_rate": 3.0747566415664225e-05, - "loss": 2.2729, - "step": 220800 - }, - { - "epoch": 0.39, - "learning_rate": 3.07466944757374e-05, - "loss": 2.4196, - "step": 220810 - }, - { - "epoch": 0.39, - "learning_rate": 3.074582253581058e-05, - "loss": 2.3122, - "step": 220820 - }, - { - "epoch": 0.39, - "learning_rate": 3.074495059588375e-05, - "loss": 2.3815, - "step": 220830 - }, - { - "epoch": 0.39, - "learning_rate": 3.074407865595692e-05, - "loss": 2.4283, - "step": 220840 - }, - { - "epoch": 0.39, - "learning_rate": 3.074320671603009e-05, - "loss": 2.4718, - "step": 220850 - }, - { - "epoch": 0.39, - "learning_rate": 3.074233477610327e-05, - "loss": 2.4984, - "step": 220860 - }, - { - "epoch": 0.39, - "learning_rate": 3.074146283617644e-05, - "loss": 2.3594, - "step": 220870 - }, - { - "epoch": 0.39, - "learning_rate": 3.0740590896249615e-05, - "loss": 2.4588, - "step": 220880 - }, - { - "epoch": 0.39, - "learning_rate": 3.0739718956322785e-05, - "loss": 2.3204, - "step": 220890 - }, - { - "epoch": 0.39, - "learning_rate": 3.073884701639596e-05, - "loss": 2.3925, - "step": 220900 - }, - { - "epoch": 0.39, - "learning_rate": 3.073797507646913e-05, - "loss": 2.3953, - "step": 220910 - }, - { - "epoch": 0.39, - "learning_rate": 3.07371031365423e-05, - "loss": 2.3742, - "step": 220920 - }, - { - "epoch": 0.39, - "learning_rate": 3.073623119661548e-05, - "loss": 2.5209, - "step": 220930 - }, - { - "epoch": 0.39, - "learning_rate": 3.073535925668865e-05, - "loss": 2.4091, - "step": 220940 - }, - { - "epoch": 0.39, - "learning_rate": 3.073448731676183e-05, - "loss": 2.4941, - "step": 220950 - }, - { - "epoch": 0.39, - "learning_rate": 3.0733615376835e-05, - "loss": 2.3396, - "step": 220960 - }, - { - "epoch": 0.39, - "learning_rate": 3.0732743436908175e-05, - "loss": 2.4468, - "step": 220970 - }, - { - "epoch": 0.39, - "learning_rate": 3.0731871496981346e-05, - "loss": 2.306, - "step": 220980 - }, - { - "epoch": 0.39, - "learning_rate": 3.0730999557054516e-05, - "loss": 2.4959, - "step": 220990 - }, - { - "epoch": 0.39, - "learning_rate": 3.073012761712769e-05, - "loss": 2.3464, - "step": 221000 - }, - { - "epoch": 0.39, - "learning_rate": 3.0729255677200864e-05, - "loss": 2.3416, - "step": 221010 - }, - { - "epoch": 0.39, - "learning_rate": 3.0728383737274034e-05, - "loss": 2.2784, - "step": 221020 - }, - { - "epoch": 0.39, - "learning_rate": 3.072751179734721e-05, - "loss": 2.329, - "step": 221030 - }, - { - "epoch": 0.39, - "learning_rate": 3.072663985742039e-05, - "loss": 2.4687, - "step": 221040 - }, - { - "epoch": 0.39, - "learning_rate": 3.072576791749356e-05, - "loss": 2.4926, - "step": 221050 - }, - { - "epoch": 0.39, - "learning_rate": 3.072489597756673e-05, - "loss": 2.287, - "step": 221060 - }, - { - "epoch": 0.39, - "learning_rate": 3.0724024037639906e-05, - "loss": 2.4409, - "step": 221070 - }, - { - "epoch": 0.39, - "learning_rate": 3.0723152097713077e-05, - "loss": 2.4169, - "step": 221080 - }, - { - "epoch": 0.39, - "learning_rate": 3.072228015778625e-05, - "loss": 2.33, - "step": 221090 - }, - { - "epoch": 0.39, - "learning_rate": 3.0721408217859424e-05, - "loss": 2.4557, - "step": 221100 - }, - { - "epoch": 0.39, - "learning_rate": 3.07205362779326e-05, - "loss": 2.4461, - "step": 221110 - }, - { - "epoch": 0.39, - "learning_rate": 3.071966433800577e-05, - "loss": 2.4407, - "step": 221120 - }, - { - "epoch": 0.39, - "learning_rate": 3.071879239807894e-05, - "loss": 2.343, - "step": 221130 - }, - { - "epoch": 0.39, - "learning_rate": 3.071792045815212e-05, - "loss": 2.4102, - "step": 221140 - }, - { - "epoch": 0.39, - "learning_rate": 3.071704851822529e-05, - "loss": 2.4164, - "step": 221150 - }, - { - "epoch": 0.39, - "learning_rate": 3.071617657829846e-05, - "loss": 2.4123, - "step": 221160 - }, - { - "epoch": 0.39, - "learning_rate": 3.071530463837163e-05, - "loss": 2.5312, - "step": 221170 - }, - { - "epoch": 0.39, - "learning_rate": 3.0714432698444814e-05, - "loss": 2.5306, - "step": 221180 - }, - { - "epoch": 0.39, - "learning_rate": 3.0713560758517985e-05, - "loss": 2.405, - "step": 221190 - }, - { - "epoch": 0.39, - "learning_rate": 3.0712688818591155e-05, - "loss": 2.2547, - "step": 221200 - }, - { - "epoch": 0.39, - "learning_rate": 3.071181687866433e-05, - "loss": 2.4021, - "step": 221210 - }, - { - "epoch": 0.39, - "learning_rate": 3.07109449387375e-05, - "loss": 2.4599, - "step": 221220 - }, - { - "epoch": 0.39, - "learning_rate": 3.071007299881067e-05, - "loss": 2.3919, - "step": 221230 - }, - { - "epoch": 0.39, - "learning_rate": 3.070920105888384e-05, - "loss": 2.5551, - "step": 221240 - }, - { - "epoch": 0.39, - "learning_rate": 3.070832911895703e-05, - "loss": 2.4523, - "step": 221250 - }, - { - "epoch": 0.39, - "learning_rate": 3.07074571790302e-05, - "loss": 2.3258, - "step": 221260 - }, - { - "epoch": 0.39, - "learning_rate": 3.070658523910337e-05, - "loss": 2.2031, - "step": 221270 - }, - { - "epoch": 0.39, - "learning_rate": 3.070571329917654e-05, - "loss": 2.4316, - "step": 221280 - }, - { - "epoch": 0.39, - "learning_rate": 3.0704841359249716e-05, - "loss": 2.5034, - "step": 221290 - }, - { - "epoch": 0.39, - "learning_rate": 3.0703969419322886e-05, - "loss": 2.3911, - "step": 221300 - }, - { - "epoch": 0.39, - "learning_rate": 3.0703097479396056e-05, - "loss": 2.3742, - "step": 221310 - }, - { - "epoch": 0.39, - "learning_rate": 3.0702225539469234e-05, - "loss": 2.3617, - "step": 221320 - }, - { - "epoch": 0.39, - "learning_rate": 3.070135359954241e-05, - "loss": 2.4834, - "step": 221330 - }, - { - "epoch": 0.39, - "learning_rate": 3.070048165961558e-05, - "loss": 2.3477, - "step": 221340 - }, - { - "epoch": 0.39, - "learning_rate": 3.069960971968875e-05, - "loss": 2.386, - "step": 221350 - }, - { - "epoch": 0.39, - "learning_rate": 3.069873777976193e-05, - "loss": 2.4411, - "step": 221360 - }, - { - "epoch": 0.39, - "learning_rate": 3.06978658398351e-05, - "loss": 2.3036, - "step": 221370 - }, - { - "epoch": 0.39, - "learning_rate": 3.069699389990827e-05, - "loss": 2.4537, - "step": 221380 - }, - { - "epoch": 0.39, - "learning_rate": 3.0696121959981447e-05, - "loss": 2.4622, - "step": 221390 - }, - { - "epoch": 0.39, - "learning_rate": 3.0695250020054624e-05, - "loss": 2.3244, - "step": 221400 - }, - { - "epoch": 0.39, - "learning_rate": 3.0694378080127794e-05, - "loss": 2.3704, - "step": 221410 - }, - { - "epoch": 0.39, - "learning_rate": 3.0693506140200964e-05, - "loss": 2.4831, - "step": 221420 - }, - { - "epoch": 0.39, - "learning_rate": 3.069263420027414e-05, - "loss": 2.4986, - "step": 221430 - }, - { - "epoch": 0.39, - "learning_rate": 3.069176226034731e-05, - "loss": 2.4865, - "step": 221440 - }, - { - "epoch": 0.39, - "learning_rate": 3.069089032042048e-05, - "loss": 2.2011, - "step": 221450 - }, - { - "epoch": 0.39, - "learning_rate": 3.069001838049366e-05, - "loss": 2.448, - "step": 221460 - }, - { - "epoch": 0.39, - "learning_rate": 3.068914644056683e-05, - "loss": 2.5187, - "step": 221470 - }, - { - "epoch": 0.39, - "learning_rate": 3.068827450064001e-05, - "loss": 2.4738, - "step": 221480 - }, - { - "epoch": 0.39, - "learning_rate": 3.068740256071318e-05, - "loss": 2.3584, - "step": 221490 - }, - { - "epoch": 0.39, - "learning_rate": 3.0686530620786355e-05, - "loss": 2.2956, - "step": 221500 - }, - { - "epoch": 0.39, - "learning_rate": 3.0685658680859525e-05, - "loss": 2.4209, - "step": 221510 - }, - { - "epoch": 0.39, - "learning_rate": 3.0684786740932695e-05, - "loss": 2.3908, - "step": 221520 - }, - { - "epoch": 0.39, - "learning_rate": 3.068391480100587e-05, - "loss": 2.4011, - "step": 221530 - }, - { - "epoch": 0.39, - "learning_rate": 3.068304286107904e-05, - "loss": 2.5407, - "step": 221540 - }, - { - "epoch": 0.39, - "learning_rate": 3.068217092115222e-05, - "loss": 2.419, - "step": 221550 - }, - { - "epoch": 0.39, - "learning_rate": 3.068129898122539e-05, - "loss": 2.389, - "step": 221560 - }, - { - "epoch": 0.39, - "learning_rate": 3.068042704129857e-05, - "loss": 2.2761, - "step": 221570 - }, - { - "epoch": 0.39, - "learning_rate": 3.067955510137174e-05, - "loss": 2.3897, - "step": 221580 - }, - { - "epoch": 0.39, - "learning_rate": 3.067868316144491e-05, - "loss": 2.4084, - "step": 221590 - }, - { - "epoch": 0.39, - "learning_rate": 3.0677811221518086e-05, - "loss": 2.4065, - "step": 221600 - }, - { - "epoch": 0.39, - "learning_rate": 3.0676939281591256e-05, - "loss": 2.4565, - "step": 221610 - }, - { - "epoch": 0.39, - "learning_rate": 3.067606734166443e-05, - "loss": 2.4221, - "step": 221620 - }, - { - "epoch": 0.39, - "learning_rate": 3.0675195401737603e-05, - "loss": 2.4128, - "step": 221630 - }, - { - "epoch": 0.39, - "learning_rate": 3.067432346181078e-05, - "loss": 2.4099, - "step": 221640 - }, - { - "epoch": 0.39, - "learning_rate": 3.067345152188395e-05, - "loss": 2.3207, - "step": 221650 - }, - { - "epoch": 0.39, - "learning_rate": 3.067257958195712e-05, - "loss": 2.3479, - "step": 221660 - }, - { - "epoch": 0.39, - "learning_rate": 3.067170764203029e-05, - "loss": 2.3407, - "step": 221670 - }, - { - "epoch": 0.39, - "learning_rate": 3.067083570210347e-05, - "loss": 2.4024, - "step": 221680 - }, - { - "epoch": 0.39, - "learning_rate": 3.066996376217664e-05, - "loss": 2.3508, - "step": 221690 - }, - { - "epoch": 0.39, - "learning_rate": 3.0669091822249816e-05, - "loss": 2.3865, - "step": 221700 - }, - { - "epoch": 0.39, - "learning_rate": 3.0668219882322994e-05, - "loss": 2.3508, - "step": 221710 - }, - { - "epoch": 0.39, - "learning_rate": 3.0667347942396164e-05, - "loss": 2.3831, - "step": 221720 - }, - { - "epoch": 0.39, - "learning_rate": 3.0666476002469334e-05, - "loss": 2.4501, - "step": 221730 - }, - { - "epoch": 0.39, - "learning_rate": 3.0665604062542505e-05, - "loss": 2.4623, - "step": 221740 - }, - { - "epoch": 0.39, - "learning_rate": 3.066473212261568e-05, - "loss": 2.4777, - "step": 221750 - }, - { - "epoch": 0.39, - "learning_rate": 3.066386018268885e-05, - "loss": 2.3716, - "step": 221760 - }, - { - "epoch": 0.39, - "learning_rate": 3.066298824276203e-05, - "loss": 2.4841, - "step": 221770 - }, - { - "epoch": 0.39, - "learning_rate": 3.06621163028352e-05, - "loss": 2.4094, - "step": 221780 - }, - { - "epoch": 0.39, - "learning_rate": 3.066124436290838e-05, - "loss": 2.3743, - "step": 221790 - }, - { - "epoch": 0.39, - "learning_rate": 3.066037242298155e-05, - "loss": 2.4228, - "step": 221800 - }, - { - "epoch": 0.39, - "learning_rate": 3.065950048305472e-05, - "loss": 2.3512, - "step": 221810 - }, - { - "epoch": 0.39, - "learning_rate": 3.0658628543127895e-05, - "loss": 2.4001, - "step": 221820 - }, - { - "epoch": 0.39, - "learning_rate": 3.0657756603201065e-05, - "loss": 2.4233, - "step": 221830 - }, - { - "epoch": 0.39, - "learning_rate": 3.0656884663274236e-05, - "loss": 2.4672, - "step": 221840 - }, - { - "epoch": 0.39, - "learning_rate": 3.065601272334741e-05, - "loss": 2.5508, - "step": 221850 - }, - { - "epoch": 0.39, - "learning_rate": 3.065514078342059e-05, - "loss": 2.4285, - "step": 221860 - }, - { - "epoch": 0.39, - "learning_rate": 3.065426884349376e-05, - "loss": 2.3135, - "step": 221870 - }, - { - "epoch": 0.39, - "learning_rate": 3.065339690356693e-05, - "loss": 2.4251, - "step": 221880 - }, - { - "epoch": 0.39, - "learning_rate": 3.065252496364011e-05, - "loss": 2.4781, - "step": 221890 - }, - { - "epoch": 0.39, - "learning_rate": 3.065165302371328e-05, - "loss": 2.4958, - "step": 221900 - }, - { - "epoch": 0.39, - "learning_rate": 3.065078108378645e-05, - "loss": 2.3911, - "step": 221910 - }, - { - "epoch": 0.39, - "learning_rate": 3.0649909143859626e-05, - "loss": 2.3769, - "step": 221920 - }, - { - "epoch": 0.39, - "learning_rate": 3.06490372039328e-05, - "loss": 2.379, - "step": 221930 - }, - { - "epoch": 0.39, - "learning_rate": 3.064816526400597e-05, - "loss": 2.3222, - "step": 221940 - }, - { - "epoch": 0.39, - "learning_rate": 3.0647293324079144e-05, - "loss": 2.3922, - "step": 221950 - }, - { - "epoch": 0.39, - "learning_rate": 3.064642138415232e-05, - "loss": 2.4247, - "step": 221960 - }, - { - "epoch": 0.39, - "learning_rate": 3.064554944422549e-05, - "loss": 2.4008, - "step": 221970 - }, - { - "epoch": 0.39, - "learning_rate": 3.064467750429866e-05, - "loss": 2.3837, - "step": 221980 - }, - { - "epoch": 0.39, - "learning_rate": 3.064380556437184e-05, - "loss": 2.392, - "step": 221990 - }, - { - "epoch": 0.39, - "learning_rate": 3.0642933624445016e-05, - "loss": 2.4082, - "step": 222000 - }, - { - "epoch": 0.39, - "learning_rate": 3.0642061684518186e-05, - "loss": 2.4928, - "step": 222010 - }, - { - "epoch": 0.39, - "learning_rate": 3.064118974459136e-05, - "loss": 2.3022, - "step": 222020 - }, - { - "epoch": 0.39, - "learning_rate": 3.0640317804664534e-05, - "loss": 2.3594, - "step": 222030 - }, - { - "epoch": 0.39, - "learning_rate": 3.0639445864737704e-05, - "loss": 2.4334, - "step": 222040 - }, - { - "epoch": 0.39, - "learning_rate": 3.0638573924810875e-05, - "loss": 2.3963, - "step": 222050 - }, - { - "epoch": 0.39, - "learning_rate": 3.063770198488405e-05, - "loss": 2.4585, - "step": 222060 - }, - { - "epoch": 0.39, - "learning_rate": 3.063683004495723e-05, - "loss": 2.3863, - "step": 222070 - }, - { - "epoch": 0.39, - "learning_rate": 3.06359581050304e-05, - "loss": 2.4689, - "step": 222080 - }, - { - "epoch": 0.39, - "learning_rate": 3.063508616510357e-05, - "loss": 2.3479, - "step": 222090 - }, - { - "epoch": 0.39, - "learning_rate": 3.063421422517675e-05, - "loss": 2.338, - "step": 222100 - }, - { - "epoch": 0.39, - "learning_rate": 3.063334228524992e-05, - "loss": 2.4688, - "step": 222110 - }, - { - "epoch": 0.39, - "learning_rate": 3.063247034532309e-05, - "loss": 2.3733, - "step": 222120 - }, - { - "epoch": 0.39, - "learning_rate": 3.063159840539626e-05, - "loss": 2.4046, - "step": 222130 - }, - { - "epoch": 0.39, - "learning_rate": 3.063072646546944e-05, - "loss": 2.2712, - "step": 222140 - }, - { - "epoch": 0.39, - "learning_rate": 3.062985452554261e-05, - "loss": 2.4299, - "step": 222150 - }, - { - "epoch": 0.39, - "learning_rate": 3.062898258561578e-05, - "loss": 2.4678, - "step": 222160 - }, - { - "epoch": 0.39, - "learning_rate": 3.062811064568896e-05, - "loss": 2.4169, - "step": 222170 - }, - { - "epoch": 0.39, - "learning_rate": 3.062723870576213e-05, - "loss": 2.3934, - "step": 222180 - }, - { - "epoch": 0.39, - "learning_rate": 3.06263667658353e-05, - "loss": 2.2935, - "step": 222190 - }, - { - "epoch": 0.39, - "learning_rate": 3.062549482590847e-05, - "loss": 2.3706, - "step": 222200 - }, - { - "epoch": 0.39, - "learning_rate": 3.062462288598165e-05, - "loss": 2.4223, - "step": 222210 - }, - { - "epoch": 0.39, - "learning_rate": 3.0623750946054825e-05, - "loss": 2.4367, - "step": 222220 - }, - { - "epoch": 0.39, - "learning_rate": 3.0622879006127996e-05, - "loss": 2.4341, - "step": 222230 - }, - { - "epoch": 0.39, - "learning_rate": 3.0622007066201166e-05, - "loss": 2.4594, - "step": 222240 - }, - { - "epoch": 0.39, - "learning_rate": 3.062113512627434e-05, - "loss": 2.2921, - "step": 222250 - }, - { - "epoch": 0.39, - "learning_rate": 3.0620263186347514e-05, - "loss": 2.3994, - "step": 222260 - }, - { - "epoch": 0.39, - "learning_rate": 3.0619391246420684e-05, - "loss": 2.3272, - "step": 222270 - }, - { - "epoch": 0.39, - "learning_rate": 3.061851930649386e-05, - "loss": 2.4161, - "step": 222280 - }, - { - "epoch": 0.39, - "learning_rate": 3.061764736656704e-05, - "loss": 2.3757, - "step": 222290 - }, - { - "epoch": 0.39, - "learning_rate": 3.061677542664021e-05, - "loss": 2.4055, - "step": 222300 - }, - { - "epoch": 0.39, - "learning_rate": 3.061590348671338e-05, - "loss": 2.3691, - "step": 222310 - }, - { - "epoch": 0.39, - "learning_rate": 3.0615031546786556e-05, - "loss": 2.3895, - "step": 222320 - }, - { - "epoch": 0.39, - "learning_rate": 3.061415960685973e-05, - "loss": 2.4458, - "step": 222330 - }, - { - "epoch": 0.39, - "learning_rate": 3.06132876669329e-05, - "loss": 2.2778, - "step": 222340 - }, - { - "epoch": 0.39, - "learning_rate": 3.0612415727006074e-05, - "loss": 2.3017, - "step": 222350 - }, - { - "epoch": 0.39, - "learning_rate": 3.0611543787079245e-05, - "loss": 2.3786, - "step": 222360 - }, - { - "epoch": 0.39, - "learning_rate": 3.061067184715242e-05, - "loss": 2.3347, - "step": 222370 - }, - { - "epoch": 0.39, - "learning_rate": 3.060979990722559e-05, - "loss": 2.5736, - "step": 222380 - }, - { - "epoch": 0.39, - "learning_rate": 3.060892796729877e-05, - "loss": 2.3233, - "step": 222390 - }, - { - "epoch": 0.39, - "learning_rate": 3.060805602737194e-05, - "loss": 2.3949, - "step": 222400 - }, - { - "epoch": 0.39, - "learning_rate": 3.060718408744511e-05, - "loss": 2.4063, - "step": 222410 - }, - { - "epoch": 0.39, - "learning_rate": 3.060631214751829e-05, - "loss": 2.3705, - "step": 222420 - }, - { - "epoch": 0.39, - "learning_rate": 3.060544020759146e-05, - "loss": 2.408, - "step": 222430 - }, - { - "epoch": 0.39, - "learning_rate": 3.0604568267664635e-05, - "loss": 2.3447, - "step": 222440 - }, - { - "epoch": 0.39, - "learning_rate": 3.0603696327737805e-05, - "loss": 2.4829, - "step": 222450 - }, - { - "epoch": 0.39, - "learning_rate": 3.060282438781098e-05, - "loss": 2.3946, - "step": 222460 - }, - { - "epoch": 0.39, - "learning_rate": 3.060195244788415e-05, - "loss": 2.3973, - "step": 222470 - }, - { - "epoch": 0.39, - "learning_rate": 3.060108050795732e-05, - "loss": 2.4347, - "step": 222480 - }, - { - "epoch": 0.39, - "learning_rate": 3.06002085680305e-05, - "loss": 2.3386, - "step": 222490 - }, - { - "epoch": 0.39, - "learning_rate": 3.059933662810367e-05, - "loss": 2.4312, - "step": 222500 - }, - { - "epoch": 0.39, - "learning_rate": 3.059846468817684e-05, - "loss": 2.4465, - "step": 222510 - }, - { - "epoch": 0.39, - "learning_rate": 3.059759274825002e-05, - "loss": 2.3666, - "step": 222520 - }, - { - "epoch": 0.39, - "learning_rate": 3.0596720808323195e-05, - "loss": 2.3695, - "step": 222530 - }, - { - "epoch": 0.39, - "learning_rate": 3.0595848868396366e-05, - "loss": 2.3584, - "step": 222540 - }, - { - "epoch": 0.39, - "learning_rate": 3.0594976928469536e-05, - "loss": 2.4464, - "step": 222550 - }, - { - "epoch": 0.39, - "learning_rate": 3.059410498854271e-05, - "loss": 2.4993, - "step": 222560 - }, - { - "epoch": 0.39, - "learning_rate": 3.0593233048615884e-05, - "loss": 2.419, - "step": 222570 - }, - { - "epoch": 0.39, - "learning_rate": 3.0592361108689054e-05, - "loss": 2.3024, - "step": 222580 - }, - { - "epoch": 0.39, - "learning_rate": 3.059148916876223e-05, - "loss": 2.4065, - "step": 222590 - }, - { - "epoch": 0.39, - "learning_rate": 3.059061722883541e-05, - "loss": 2.4622, - "step": 222600 - }, - { - "epoch": 0.39, - "learning_rate": 3.058974528890858e-05, - "loss": 2.4306, - "step": 222610 - }, - { - "epoch": 0.39, - "learning_rate": 3.058887334898175e-05, - "loss": 2.4311, - "step": 222620 - }, - { - "epoch": 0.39, - "learning_rate": 3.058800140905492e-05, - "loss": 2.4826, - "step": 222630 - }, - { - "epoch": 0.39, - "learning_rate": 3.05871294691281e-05, - "loss": 2.5891, - "step": 222640 - }, - { - "epoch": 0.39, - "learning_rate": 3.058625752920127e-05, - "loss": 2.5458, - "step": 222650 - }, - { - "epoch": 0.39, - "learning_rate": 3.058538558927444e-05, - "loss": 2.4952, - "step": 222660 - }, - { - "epoch": 0.39, - "learning_rate": 3.058451364934762e-05, - "loss": 2.3108, - "step": 222670 - }, - { - "epoch": 0.39, - "learning_rate": 3.058364170942079e-05, - "loss": 2.4945, - "step": 222680 - }, - { - "epoch": 0.39, - "learning_rate": 3.058276976949396e-05, - "loss": 2.3559, - "step": 222690 - }, - { - "epoch": 0.39, - "learning_rate": 3.058189782956713e-05, - "loss": 2.4597, - "step": 222700 - }, - { - "epoch": 0.39, - "learning_rate": 3.058102588964031e-05, - "loss": 2.2791, - "step": 222710 - }, - { - "epoch": 0.39, - "learning_rate": 3.058015394971348e-05, - "loss": 2.3924, - "step": 222720 - }, - { - "epoch": 0.39, - "learning_rate": 3.057928200978665e-05, - "loss": 2.366, - "step": 222730 - }, - { - "epoch": 0.39, - "learning_rate": 3.057841006985983e-05, - "loss": 2.3724, - "step": 222740 - }, - { - "epoch": 0.39, - "learning_rate": 3.0577538129933005e-05, - "loss": 2.3295, - "step": 222750 - }, - { - "epoch": 0.39, - "learning_rate": 3.0576666190006175e-05, - "loss": 2.366, - "step": 222760 - }, - { - "epoch": 0.39, - "learning_rate": 3.0575794250079345e-05, - "loss": 2.4688, - "step": 222770 - }, - { - "epoch": 0.39, - "learning_rate": 3.057492231015252e-05, - "loss": 2.3258, - "step": 222780 - }, - { - "epoch": 0.39, - "learning_rate": 3.057405037022569e-05, - "loss": 2.4736, - "step": 222790 - }, - { - "epoch": 0.39, - "learning_rate": 3.0573178430298863e-05, - "loss": 2.3895, - "step": 222800 - }, - { - "epoch": 0.39, - "learning_rate": 3.057230649037204e-05, - "loss": 2.5169, - "step": 222810 - }, - { - "epoch": 0.39, - "learning_rate": 3.057143455044522e-05, - "loss": 2.5234, - "step": 222820 - }, - { - "epoch": 0.39, - "learning_rate": 3.057056261051839e-05, - "loss": 2.5532, - "step": 222830 - }, - { - "epoch": 0.39, - "learning_rate": 3.056969067059156e-05, - "loss": 2.4576, - "step": 222840 - }, - { - "epoch": 0.39, - "learning_rate": 3.0568818730664736e-05, - "loss": 2.5279, - "step": 222850 - }, - { - "epoch": 0.39, - "learning_rate": 3.0567946790737906e-05, - "loss": 2.4529, - "step": 222860 - }, - { - "epoch": 0.39, - "learning_rate": 3.0567074850811076e-05, - "loss": 2.4246, - "step": 222870 - }, - { - "epoch": 0.39, - "learning_rate": 3.0566202910884254e-05, - "loss": 2.4192, - "step": 222880 - }, - { - "epoch": 0.39, - "learning_rate": 3.056533097095743e-05, - "loss": 2.4604, - "step": 222890 - }, - { - "epoch": 0.39, - "learning_rate": 3.05644590310306e-05, - "loss": 2.4744, - "step": 222900 - }, - { - "epoch": 0.39, - "learning_rate": 3.056358709110377e-05, - "loss": 2.3649, - "step": 222910 - }, - { - "epoch": 0.39, - "learning_rate": 3.056271515117695e-05, - "loss": 2.3258, - "step": 222920 - }, - { - "epoch": 0.39, - "learning_rate": 3.056184321125012e-05, - "loss": 2.4366, - "step": 222930 - }, - { - "epoch": 0.39, - "learning_rate": 3.056097127132329e-05, - "loss": 2.3586, - "step": 222940 - }, - { - "epoch": 0.39, - "learning_rate": 3.0560099331396467e-05, - "loss": 2.2794, - "step": 222950 - }, - { - "epoch": 0.39, - "learning_rate": 3.0559227391469644e-05, - "loss": 2.5327, - "step": 222960 - }, - { - "epoch": 0.39, - "learning_rate": 3.0558355451542814e-05, - "loss": 2.4295, - "step": 222970 - }, - { - "epoch": 0.39, - "learning_rate": 3.0557483511615984e-05, - "loss": 2.4375, - "step": 222980 - }, - { - "epoch": 0.39, - "learning_rate": 3.055661157168916e-05, - "loss": 2.4149, - "step": 222990 - }, - { - "epoch": 0.39, - "learning_rate": 3.055573963176233e-05, - "loss": 2.4145, - "step": 223000 - }, - { - "epoch": 0.39, - "learning_rate": 3.05548676918355e-05, - "loss": 2.4226, - "step": 223010 - }, - { - "epoch": 0.39, - "learning_rate": 3.055399575190867e-05, - "loss": 2.2988, - "step": 223020 - }, - { - "epoch": 0.39, - "learning_rate": 3.055312381198185e-05, - "loss": 2.3995, - "step": 223030 - }, - { - "epoch": 0.39, - "learning_rate": 3.055225187205503e-05, - "loss": 2.4747, - "step": 223040 - }, - { - "epoch": 0.39, - "learning_rate": 3.05513799321282e-05, - "loss": 2.3891, - "step": 223050 - }, - { - "epoch": 0.39, - "learning_rate": 3.0550507992201375e-05, - "loss": 2.4762, - "step": 223060 - }, - { - "epoch": 0.39, - "learning_rate": 3.0549636052274545e-05, - "loss": 2.4388, - "step": 223070 - }, - { - "epoch": 0.39, - "learning_rate": 3.0548764112347715e-05, - "loss": 2.4034, - "step": 223080 - }, - { - "epoch": 0.39, - "learning_rate": 3.0547892172420886e-05, - "loss": 2.478, - "step": 223090 - }, - { - "epoch": 0.39, - "learning_rate": 3.054702023249406e-05, - "loss": 2.4125, - "step": 223100 - }, - { - "epoch": 0.39, - "learning_rate": 3.054614829256724e-05, - "loss": 2.4514, - "step": 223110 - }, - { - "epoch": 0.39, - "learning_rate": 3.054527635264041e-05, - "loss": 2.4435, - "step": 223120 - }, - { - "epoch": 0.39, - "learning_rate": 3.054440441271358e-05, - "loss": 2.4117, - "step": 223130 - }, - { - "epoch": 0.39, - "learning_rate": 3.054353247278676e-05, - "loss": 2.3401, - "step": 223140 - }, - { - "epoch": 0.39, - "learning_rate": 3.054266053285993e-05, - "loss": 2.3627, - "step": 223150 - }, - { - "epoch": 0.39, - "learning_rate": 3.05417885929331e-05, - "loss": 2.3614, - "step": 223160 - }, - { - "epoch": 0.39, - "learning_rate": 3.0540916653006276e-05, - "loss": 2.4348, - "step": 223170 - }, - { - "epoch": 0.39, - "learning_rate": 3.0540044713079446e-05, - "loss": 2.3159, - "step": 223180 - }, - { - "epoch": 0.39, - "learning_rate": 3.0539172773152623e-05, - "loss": 2.418, - "step": 223190 - }, - { - "epoch": 0.39, - "learning_rate": 3.0538300833225794e-05, - "loss": 2.312, - "step": 223200 - }, - { - "epoch": 0.39, - "learning_rate": 3.053742889329897e-05, - "loss": 2.3073, - "step": 223210 - }, - { - "epoch": 0.39, - "learning_rate": 3.053655695337214e-05, - "loss": 2.3813, - "step": 223220 - }, - { - "epoch": 0.39, - "learning_rate": 3.053568501344531e-05, - "loss": 2.5441, - "step": 223230 - }, - { - "epoch": 0.39, - "learning_rate": 3.053481307351849e-05, - "loss": 2.3519, - "step": 223240 - }, - { - "epoch": 0.39, - "learning_rate": 3.053394113359166e-05, - "loss": 2.4459, - "step": 223250 - }, - { - "epoch": 0.39, - "learning_rate": 3.0533069193664836e-05, - "loss": 2.4116, - "step": 223260 - }, - { - "epoch": 0.39, - "learning_rate": 3.053219725373801e-05, - "loss": 2.3573, - "step": 223270 - }, - { - "epoch": 0.39, - "learning_rate": 3.0531325313811184e-05, - "loss": 2.3721, - "step": 223280 - }, - { - "epoch": 0.39, - "learning_rate": 3.0530453373884354e-05, - "loss": 2.4026, - "step": 223290 - }, - { - "epoch": 0.39, - "learning_rate": 3.0529581433957525e-05, - "loss": 2.4285, - "step": 223300 - }, - { - "epoch": 0.39, - "learning_rate": 3.05287094940307e-05, - "loss": 2.4622, - "step": 223310 - }, - { - "epoch": 0.39, - "learning_rate": 3.052783755410387e-05, - "loss": 2.296, - "step": 223320 - }, - { - "epoch": 0.39, - "learning_rate": 3.052696561417704e-05, - "loss": 2.4715, - "step": 223330 - }, - { - "epoch": 0.39, - "learning_rate": 3.052609367425022e-05, - "loss": 2.3671, - "step": 223340 - }, - { - "epoch": 0.39, - "learning_rate": 3.05252217343234e-05, - "loss": 2.4405, - "step": 223350 - }, - { - "epoch": 0.39, - "learning_rate": 3.052434979439657e-05, - "loss": 2.4298, - "step": 223360 - }, - { - "epoch": 0.39, - "learning_rate": 3.052347785446974e-05, - "loss": 2.3613, - "step": 223370 - }, - { - "epoch": 0.39, - "learning_rate": 3.0522605914542915e-05, - "loss": 2.3121, - "step": 223380 - }, - { - "epoch": 0.39, - "learning_rate": 3.0521733974616085e-05, - "loss": 2.507, - "step": 223390 - }, - { - "epoch": 0.39, - "learning_rate": 3.0520862034689256e-05, - "loss": 2.4568, - "step": 223400 - }, - { - "epoch": 0.39, - "learning_rate": 3.051999009476243e-05, - "loss": 2.4652, - "step": 223410 - }, - { - "epoch": 0.39, - "learning_rate": 3.051911815483561e-05, - "loss": 2.457, - "step": 223420 - }, - { - "epoch": 0.39, - "learning_rate": 3.051824621490878e-05, - "loss": 2.4217, - "step": 223430 - }, - { - "epoch": 0.39, - "learning_rate": 3.051737427498195e-05, - "loss": 2.4825, - "step": 223440 - }, - { - "epoch": 0.39, - "learning_rate": 3.0516502335055125e-05, - "loss": 2.4418, - "step": 223450 - }, - { - "epoch": 0.39, - "learning_rate": 3.05156303951283e-05, - "loss": 2.4847, - "step": 223460 - }, - { - "epoch": 0.39, - "learning_rate": 3.051475845520147e-05, - "loss": 2.451, - "step": 223470 - }, - { - "epoch": 0.39, - "learning_rate": 3.051388651527465e-05, - "loss": 2.4539, - "step": 223480 - }, - { - "epoch": 0.39, - "learning_rate": 3.051301457534782e-05, - "loss": 2.4833, - "step": 223490 - }, - { - "epoch": 0.39, - "learning_rate": 3.0512142635420993e-05, - "loss": 2.4762, - "step": 223500 - }, - { - "epoch": 0.39, - "learning_rate": 3.0511270695494164e-05, - "loss": 2.5384, - "step": 223510 - }, - { - "epoch": 0.39, - "learning_rate": 3.0510398755567338e-05, - "loss": 2.3898, - "step": 223520 - }, - { - "epoch": 0.39, - "learning_rate": 3.050952681564051e-05, - "loss": 2.3615, - "step": 223530 - }, - { - "epoch": 0.39, - "learning_rate": 3.0508654875713682e-05, - "loss": 2.5305, - "step": 223540 - }, - { - "epoch": 0.39, - "learning_rate": 3.0507782935786855e-05, - "loss": 2.3582, - "step": 223550 - }, - { - "epoch": 0.39, - "learning_rate": 3.0506910995860033e-05, - "loss": 2.4266, - "step": 223560 - }, - { - "epoch": 0.39, - "learning_rate": 3.0506039055933206e-05, - "loss": 2.4302, - "step": 223570 - }, - { - "epoch": 0.39, - "learning_rate": 3.0505167116006377e-05, - "loss": 2.4313, - "step": 223580 - }, - { - "epoch": 0.39, - "learning_rate": 3.050429517607955e-05, - "loss": 2.3129, - "step": 223590 - }, - { - "epoch": 0.39, - "learning_rate": 3.0503423236152724e-05, - "loss": 2.3591, - "step": 223600 - }, - { - "epoch": 0.39, - "learning_rate": 3.0502551296225895e-05, - "loss": 2.3533, - "step": 223610 - }, - { - "epoch": 0.39, - "learning_rate": 3.050167935629907e-05, - "loss": 2.469, - "step": 223620 - }, - { - "epoch": 0.39, - "learning_rate": 3.0500807416372246e-05, - "loss": 2.4861, - "step": 223630 - }, - { - "epoch": 0.39, - "learning_rate": 3.049993547644542e-05, - "loss": 2.5584, - "step": 223640 - }, - { - "epoch": 0.39, - "learning_rate": 3.049906353651859e-05, - "loss": 2.328, - "step": 223650 - }, - { - "epoch": 0.39, - "learning_rate": 3.0498191596591764e-05, - "loss": 2.3163, - "step": 223660 - }, - { - "epoch": 0.39, - "learning_rate": 3.0497319656664934e-05, - "loss": 2.538, - "step": 223670 - }, - { - "epoch": 0.39, - "learning_rate": 3.0496447716738108e-05, - "loss": 2.4525, - "step": 223680 - }, - { - "epoch": 0.39, - "learning_rate": 3.049557577681128e-05, - "loss": 2.4103, - "step": 223690 - }, - { - "epoch": 0.39, - "learning_rate": 3.0494703836884452e-05, - "loss": 2.3033, - "step": 223700 - }, - { - "epoch": 0.39, - "learning_rate": 3.0493831896957632e-05, - "loss": 2.4561, - "step": 223710 - }, - { - "epoch": 0.39, - "learning_rate": 3.0492959957030803e-05, - "loss": 2.4589, - "step": 223720 - }, - { - "epoch": 0.39, - "learning_rate": 3.0492088017103977e-05, - "loss": 2.3911, - "step": 223730 - }, - { - "epoch": 0.39, - "learning_rate": 3.0491216077177147e-05, - "loss": 2.333, - "step": 223740 - }, - { - "epoch": 0.39, - "learning_rate": 3.049034413725032e-05, - "loss": 2.3813, - "step": 223750 - }, - { - "epoch": 0.39, - "learning_rate": 3.0489472197323494e-05, - "loss": 2.4733, - "step": 223760 - }, - { - "epoch": 0.39, - "learning_rate": 3.0488600257396665e-05, - "loss": 2.3541, - "step": 223770 - }, - { - "epoch": 0.39, - "learning_rate": 3.0487728317469842e-05, - "loss": 2.3023, - "step": 223780 - }, - { - "epoch": 0.39, - "learning_rate": 3.0486856377543016e-05, - "loss": 2.4737, - "step": 223790 - }, - { - "epoch": 0.39, - "learning_rate": 3.048598443761619e-05, - "loss": 2.3829, - "step": 223800 - }, - { - "epoch": 0.39, - "learning_rate": 3.048511249768936e-05, - "loss": 2.373, - "step": 223810 - }, - { - "epoch": 0.39, - "learning_rate": 3.0484240557762534e-05, - "loss": 2.3517, - "step": 223820 - }, - { - "epoch": 0.39, - "learning_rate": 3.0483368617835707e-05, - "loss": 2.3613, - "step": 223830 - }, - { - "epoch": 0.39, - "learning_rate": 3.0482496677908878e-05, - "loss": 2.3077, - "step": 223840 - }, - { - "epoch": 0.39, - "learning_rate": 3.048162473798205e-05, - "loss": 2.3338, - "step": 223850 - }, - { - "epoch": 0.39, - "learning_rate": 3.048075279805523e-05, - "loss": 2.4736, - "step": 223860 - }, - { - "epoch": 0.39, - "learning_rate": 3.0479880858128403e-05, - "loss": 2.3867, - "step": 223870 - }, - { - "epoch": 0.39, - "learning_rate": 3.0479008918201573e-05, - "loss": 2.2507, - "step": 223880 - }, - { - "epoch": 0.39, - "learning_rate": 3.0478136978274747e-05, - "loss": 2.4674, - "step": 223890 - }, - { - "epoch": 0.39, - "learning_rate": 3.0477265038347917e-05, - "loss": 2.4195, - "step": 223900 - }, - { - "epoch": 0.39, - "learning_rate": 3.047639309842109e-05, - "loss": 2.4562, - "step": 223910 - }, - { - "epoch": 0.39, - "learning_rate": 3.0475521158494265e-05, - "loss": 2.456, - "step": 223920 - }, - { - "epoch": 0.39, - "learning_rate": 3.0474649218567442e-05, - "loss": 2.4344, - "step": 223930 - }, - { - "epoch": 0.39, - "learning_rate": 3.0473777278640616e-05, - "loss": 2.2654, - "step": 223940 - }, - { - "epoch": 0.39, - "learning_rate": 3.0472905338713786e-05, - "loss": 2.4089, - "step": 223950 - }, - { - "epoch": 0.39, - "learning_rate": 3.047203339878696e-05, - "loss": 2.4577, - "step": 223960 - }, - { - "epoch": 0.39, - "learning_rate": 3.047116145886013e-05, - "loss": 2.4172, - "step": 223970 - }, - { - "epoch": 0.39, - "learning_rate": 3.0470289518933304e-05, - "loss": 2.3651, - "step": 223980 - }, - { - "epoch": 0.39, - "learning_rate": 3.0469417579006478e-05, - "loss": 2.416, - "step": 223990 - }, - { - "epoch": 0.39, - "learning_rate": 3.0468545639079655e-05, - "loss": 2.3133, - "step": 224000 - }, - { - "epoch": 0.39, - "learning_rate": 3.0467673699152825e-05, - "loss": 2.4263, - "step": 224010 - }, - { - "epoch": 0.39, - "learning_rate": 3.0466801759226e-05, - "loss": 2.3929, - "step": 224020 - }, - { - "epoch": 0.39, - "learning_rate": 3.0465929819299173e-05, - "loss": 2.4045, - "step": 224030 - }, - { - "epoch": 0.39, - "learning_rate": 3.0465057879372343e-05, - "loss": 2.5087, - "step": 224040 - }, - { - "epoch": 0.39, - "learning_rate": 3.0464185939445517e-05, - "loss": 2.4582, - "step": 224050 - }, - { - "epoch": 0.39, - "learning_rate": 3.0463313999518687e-05, - "loss": 2.4727, - "step": 224060 - }, - { - "epoch": 0.39, - "learning_rate": 3.046244205959186e-05, - "loss": 2.3833, - "step": 224070 - }, - { - "epoch": 0.39, - "learning_rate": 3.0461570119665038e-05, - "loss": 2.3472, - "step": 224080 - }, - { - "epoch": 0.39, - "learning_rate": 3.0460698179738212e-05, - "loss": 2.3551, - "step": 224090 - }, - { - "epoch": 0.39, - "learning_rate": 3.0459826239811386e-05, - "loss": 2.4509, - "step": 224100 - }, - { - "epoch": 0.39, - "learning_rate": 3.0458954299884556e-05, - "loss": 2.5285, - "step": 224110 - }, - { - "epoch": 0.39, - "learning_rate": 3.045808235995773e-05, - "loss": 2.4375, - "step": 224120 - }, - { - "epoch": 0.39, - "learning_rate": 3.04572104200309e-05, - "loss": 2.4441, - "step": 224130 - }, - { - "epoch": 0.39, - "learning_rate": 3.0456338480104074e-05, - "loss": 2.457, - "step": 224140 - }, - { - "epoch": 0.39, - "learning_rate": 3.045546654017725e-05, - "loss": 2.331, - "step": 224150 - }, - { - "epoch": 0.39, - "learning_rate": 3.0454594600250425e-05, - "loss": 2.3595, - "step": 224160 - }, - { - "epoch": 0.39, - "learning_rate": 3.0453722660323595e-05, - "loss": 2.3277, - "step": 224170 - }, - { - "epoch": 0.39, - "learning_rate": 3.045285072039677e-05, - "loss": 2.5035, - "step": 224180 - }, - { - "epoch": 0.39, - "learning_rate": 3.0451978780469943e-05, - "loss": 2.3812, - "step": 224190 - }, - { - "epoch": 0.39, - "learning_rate": 3.0451106840543113e-05, - "loss": 2.4589, - "step": 224200 - }, - { - "epoch": 0.39, - "learning_rate": 3.0450234900616287e-05, - "loss": 2.3239, - "step": 224210 - }, - { - "epoch": 0.39, - "learning_rate": 3.044936296068946e-05, - "loss": 2.3871, - "step": 224220 - }, - { - "epoch": 0.39, - "learning_rate": 3.0448491020762638e-05, - "loss": 2.4165, - "step": 224230 - }, - { - "epoch": 0.39, - "learning_rate": 3.044761908083581e-05, - "loss": 2.4241, - "step": 224240 - }, - { - "epoch": 0.39, - "learning_rate": 3.0446747140908982e-05, - "loss": 2.4613, - "step": 224250 - }, - { - "epoch": 0.39, - "learning_rate": 3.0445875200982156e-05, - "loss": 2.5357, - "step": 224260 - }, - { - "epoch": 0.39, - "learning_rate": 3.0445003261055326e-05, - "loss": 2.4357, - "step": 224270 - }, - { - "epoch": 0.39, - "learning_rate": 3.04441313211285e-05, - "loss": 2.3581, - "step": 224280 - }, - { - "epoch": 0.39, - "learning_rate": 3.044325938120167e-05, - "loss": 2.3635, - "step": 224290 - }, - { - "epoch": 0.39, - "learning_rate": 3.044238744127485e-05, - "loss": 2.4138, - "step": 224300 - }, - { - "epoch": 0.39, - "learning_rate": 3.044151550134802e-05, - "loss": 2.4075, - "step": 224310 - }, - { - "epoch": 0.39, - "learning_rate": 3.0440643561421195e-05, - "loss": 2.3921, - "step": 224320 - }, - { - "epoch": 0.39, - "learning_rate": 3.043977162149437e-05, - "loss": 2.4025, - "step": 224330 - }, - { - "epoch": 0.39, - "learning_rate": 3.043889968156754e-05, - "loss": 2.3086, - "step": 224340 - }, - { - "epoch": 0.39, - "learning_rate": 3.0438027741640713e-05, - "loss": 2.4293, - "step": 224350 - }, - { - "epoch": 0.39, - "learning_rate": 3.0437155801713883e-05, - "loss": 2.3729, - "step": 224360 - }, - { - "epoch": 0.39, - "learning_rate": 3.0436283861787057e-05, - "loss": 2.4959, - "step": 224370 - }, - { - "epoch": 0.39, - "learning_rate": 3.0435411921860234e-05, - "loss": 2.4225, - "step": 224380 - }, - { - "epoch": 0.39, - "learning_rate": 3.0434539981933408e-05, - "loss": 2.4875, - "step": 224390 - }, - { - "epoch": 0.39, - "learning_rate": 3.043366804200658e-05, - "loss": 2.3085, - "step": 224400 - }, - { - "epoch": 0.39, - "learning_rate": 3.0432796102079752e-05, - "loss": 2.4603, - "step": 224410 - }, - { - "epoch": 0.39, - "learning_rate": 3.0431924162152926e-05, - "loss": 2.3421, - "step": 224420 - }, - { - "epoch": 0.39, - "learning_rate": 3.0431052222226096e-05, - "loss": 2.338, - "step": 224430 - }, - { - "epoch": 0.39, - "learning_rate": 3.043018028229927e-05, - "loss": 2.3099, - "step": 224440 - }, - { - "epoch": 0.39, - "learning_rate": 3.0429308342372447e-05, - "loss": 2.3849, - "step": 224450 - }, - { - "epoch": 0.39, - "learning_rate": 3.042843640244562e-05, - "loss": 2.4955, - "step": 224460 - }, - { - "epoch": 0.39, - "learning_rate": 3.042756446251879e-05, - "loss": 2.4066, - "step": 224470 - }, - { - "epoch": 0.39, - "learning_rate": 3.0426692522591965e-05, - "loss": 2.3765, - "step": 224480 - }, - { - "epoch": 0.39, - "learning_rate": 3.042582058266514e-05, - "loss": 2.4109, - "step": 224490 - }, - { - "epoch": 0.39, - "learning_rate": 3.042494864273831e-05, - "loss": 2.3649, - "step": 224500 - }, - { - "epoch": 0.39, - "learning_rate": 3.0424076702811483e-05, - "loss": 2.3534, - "step": 224510 - }, - { - "epoch": 0.39, - "learning_rate": 3.0423204762884654e-05, - "loss": 2.2608, - "step": 224520 - }, - { - "epoch": 0.39, - "learning_rate": 3.0422332822957834e-05, - "loss": 2.3556, - "step": 224530 - }, - { - "epoch": 0.39, - "learning_rate": 3.0421460883031004e-05, - "loss": 2.4663, - "step": 224540 - }, - { - "epoch": 0.39, - "learning_rate": 3.0420588943104178e-05, - "loss": 2.4336, - "step": 224550 - }, - { - "epoch": 0.39, - "learning_rate": 3.0419717003177352e-05, - "loss": 2.3585, - "step": 224560 - }, - { - "epoch": 0.39, - "learning_rate": 3.0418845063250522e-05, - "loss": 2.3702, - "step": 224570 - }, - { - "epoch": 0.39, - "learning_rate": 3.0417973123323696e-05, - "loss": 2.433, - "step": 224580 - }, - { - "epoch": 0.39, - "learning_rate": 3.0417101183396867e-05, - "loss": 2.4577, - "step": 224590 - }, - { - "epoch": 0.39, - "learning_rate": 3.0416229243470047e-05, - "loss": 2.5034, - "step": 224600 - }, - { - "epoch": 0.39, - "learning_rate": 3.0415357303543217e-05, - "loss": 2.3944, - "step": 224610 - }, - { - "epoch": 0.39, - "learning_rate": 3.041448536361639e-05, - "loss": 2.4049, - "step": 224620 - }, - { - "epoch": 0.39, - "learning_rate": 3.041361342368956e-05, - "loss": 2.4554, - "step": 224630 - }, - { - "epoch": 0.39, - "learning_rate": 3.0412741483762735e-05, - "loss": 2.4048, - "step": 224640 - }, - { - "epoch": 0.39, - "learning_rate": 3.041186954383591e-05, - "loss": 2.4401, - "step": 224650 - }, - { - "epoch": 0.39, - "learning_rate": 3.041099760390908e-05, - "loss": 2.466, - "step": 224660 - }, - { - "epoch": 0.39, - "learning_rate": 3.041012566398226e-05, - "loss": 2.4611, - "step": 224670 - }, - { - "epoch": 0.39, - "learning_rate": 3.040925372405543e-05, - "loss": 2.3315, - "step": 224680 - }, - { - "epoch": 0.39, - "learning_rate": 3.0408381784128604e-05, - "loss": 2.4321, - "step": 224690 - }, - { - "epoch": 0.39, - "learning_rate": 3.0407509844201775e-05, - "loss": 2.3306, - "step": 224700 - }, - { - "epoch": 0.39, - "learning_rate": 3.040663790427495e-05, - "loss": 2.4858, - "step": 224710 - }, - { - "epoch": 0.39, - "learning_rate": 3.0405765964348122e-05, - "loss": 2.4007, - "step": 224720 - }, - { - "epoch": 0.39, - "learning_rate": 3.0404894024421293e-05, - "loss": 2.4416, - "step": 224730 - }, - { - "epoch": 0.39, - "learning_rate": 3.0404022084494466e-05, - "loss": 2.2938, - "step": 224740 - }, - { - "epoch": 0.39, - "learning_rate": 3.0403150144567643e-05, - "loss": 2.4451, - "step": 224750 - }, - { - "epoch": 0.39, - "learning_rate": 3.0402278204640817e-05, - "loss": 2.39, - "step": 224760 - }, - { - "epoch": 0.39, - "learning_rate": 3.0401406264713988e-05, - "loss": 2.4063, - "step": 224770 - }, - { - "epoch": 0.39, - "learning_rate": 3.040053432478716e-05, - "loss": 2.3804, - "step": 224780 - }, - { - "epoch": 0.39, - "learning_rate": 3.0399662384860332e-05, - "loss": 2.4216, - "step": 224790 - }, - { - "epoch": 0.39, - "learning_rate": 3.0398790444933506e-05, - "loss": 2.4603, - "step": 224800 - }, - { - "epoch": 0.39, - "learning_rate": 3.039791850500668e-05, - "loss": 2.2757, - "step": 224810 - }, - { - "epoch": 0.39, - "learning_rate": 3.0397046565079856e-05, - "loss": 2.3136, - "step": 224820 - }, - { - "epoch": 0.39, - "learning_rate": 3.039617462515303e-05, - "loss": 2.2087, - "step": 224830 - }, - { - "epoch": 0.39, - "learning_rate": 3.03953026852262e-05, - "loss": 2.4292, - "step": 224840 - }, - { - "epoch": 0.39, - "learning_rate": 3.0394430745299374e-05, - "loss": 2.3943, - "step": 224850 - }, - { - "epoch": 0.39, - "learning_rate": 3.0393558805372545e-05, - "loss": 2.4521, - "step": 224860 - }, - { - "epoch": 0.39, - "learning_rate": 3.039268686544572e-05, - "loss": 2.3748, - "step": 224870 - }, - { - "epoch": 0.39, - "learning_rate": 3.0391814925518892e-05, - "loss": 2.4587, - "step": 224880 - }, - { - "epoch": 0.39, - "learning_rate": 3.0390942985592063e-05, - "loss": 2.4099, - "step": 224890 - }, - { - "epoch": 0.39, - "learning_rate": 3.039007104566524e-05, - "loss": 2.331, - "step": 224900 - }, - { - "epoch": 0.39, - "learning_rate": 3.0389199105738414e-05, - "loss": 2.4216, - "step": 224910 - }, - { - "epoch": 0.39, - "learning_rate": 3.0388327165811587e-05, - "loss": 2.3948, - "step": 224920 - }, - { - "epoch": 0.39, - "learning_rate": 3.0387455225884758e-05, - "loss": 2.4289, - "step": 224930 - }, - { - "epoch": 0.39, - "learning_rate": 3.038658328595793e-05, - "loss": 2.4261, - "step": 224940 - }, - { - "epoch": 0.39, - "learning_rate": 3.0385711346031105e-05, - "loss": 2.4071, - "step": 224950 - }, - { - "epoch": 0.39, - "learning_rate": 3.0384839406104276e-05, - "loss": 2.4271, - "step": 224960 - }, - { - "epoch": 0.39, - "learning_rate": 3.0383967466177453e-05, - "loss": 2.385, - "step": 224970 - }, - { - "epoch": 0.39, - "learning_rate": 3.0383095526250627e-05, - "loss": 2.3996, - "step": 224980 - }, - { - "epoch": 0.39, - "learning_rate": 3.03822235863238e-05, - "loss": 2.3187, - "step": 224990 - }, - { - "epoch": 0.39, - "learning_rate": 3.038135164639697e-05, - "loss": 2.439, - "step": 225000 - }, - { - "epoch": 0.39, - "learning_rate": 3.0380479706470145e-05, - "loss": 2.407, - "step": 225010 - }, - { - "epoch": 0.39, - "learning_rate": 3.0379607766543315e-05, - "loss": 2.3839, - "step": 225020 - }, - { - "epoch": 0.39, - "learning_rate": 3.037873582661649e-05, - "loss": 2.3971, - "step": 225030 - }, - { - "epoch": 0.39, - "learning_rate": 3.0377863886689662e-05, - "loss": 2.4273, - "step": 225040 - }, - { - "epoch": 0.39, - "learning_rate": 3.037699194676284e-05, - "loss": 2.4419, - "step": 225050 - }, - { - "epoch": 0.39, - "learning_rate": 3.0376120006836013e-05, - "loss": 2.3896, - "step": 225060 - }, - { - "epoch": 0.39, - "learning_rate": 3.0375248066909184e-05, - "loss": 2.396, - "step": 225070 - }, - { - "epoch": 0.39, - "learning_rate": 3.0374376126982358e-05, - "loss": 2.3742, - "step": 225080 - }, - { - "epoch": 0.39, - "learning_rate": 3.0373504187055528e-05, - "loss": 2.3891, - "step": 225090 - }, - { - "epoch": 0.39, - "learning_rate": 3.0372632247128702e-05, - "loss": 2.4581, - "step": 225100 - }, - { - "epoch": 0.39, - "learning_rate": 3.0371760307201875e-05, - "loss": 2.3533, - "step": 225110 - }, - { - "epoch": 0.39, - "learning_rate": 3.0370888367275053e-05, - "loss": 2.3648, - "step": 225120 - }, - { - "epoch": 0.39, - "learning_rate": 3.0370016427348223e-05, - "loss": 2.4385, - "step": 225130 - }, - { - "epoch": 0.39, - "learning_rate": 3.0369144487421397e-05, - "loss": 2.4161, - "step": 225140 - }, - { - "epoch": 0.39, - "learning_rate": 3.036827254749457e-05, - "loss": 2.3423, - "step": 225150 - }, - { - "epoch": 0.39, - "learning_rate": 3.036740060756774e-05, - "loss": 2.4703, - "step": 225160 - }, - { - "epoch": 0.39, - "learning_rate": 3.0366528667640915e-05, - "loss": 2.434, - "step": 225170 - }, - { - "epoch": 0.39, - "learning_rate": 3.036565672771409e-05, - "loss": 2.335, - "step": 225180 - }, - { - "epoch": 0.39, - "learning_rate": 3.036478478778726e-05, - "loss": 2.5369, - "step": 225190 - }, - { - "epoch": 0.39, - "learning_rate": 3.0363912847860436e-05, - "loss": 2.3544, - "step": 225200 - }, - { - "epoch": 0.39, - "learning_rate": 3.036304090793361e-05, - "loss": 2.3824, - "step": 225210 - }, - { - "epoch": 0.39, - "learning_rate": 3.0362168968006784e-05, - "loss": 2.4065, - "step": 225220 - }, - { - "epoch": 0.39, - "learning_rate": 3.0361297028079954e-05, - "loss": 2.4106, - "step": 225230 - }, - { - "epoch": 0.39, - "learning_rate": 3.0360425088153128e-05, - "loss": 2.3614, - "step": 225240 - }, - { - "epoch": 0.39, - "learning_rate": 3.0359553148226298e-05, - "loss": 2.3389, - "step": 225250 - }, - { - "epoch": 0.39, - "learning_rate": 3.0358681208299472e-05, - "loss": 2.3719, - "step": 225260 - }, - { - "epoch": 0.39, - "learning_rate": 3.035780926837265e-05, - "loss": 2.4818, - "step": 225270 - }, - { - "epoch": 0.39, - "learning_rate": 3.0356937328445823e-05, - "loss": 2.3403, - "step": 225280 - }, - { - "epoch": 0.39, - "learning_rate": 3.0356065388518997e-05, - "loss": 2.3899, - "step": 225290 - }, - { - "epoch": 0.39, - "learning_rate": 3.0355193448592167e-05, - "loss": 2.3989, - "step": 225300 - }, - { - "epoch": 0.39, - "learning_rate": 3.035432150866534e-05, - "loss": 2.3347, - "step": 225310 - }, - { - "epoch": 0.39, - "learning_rate": 3.035344956873851e-05, - "loss": 2.3262, - "step": 225320 - }, - { - "epoch": 0.39, - "learning_rate": 3.0352577628811685e-05, - "loss": 2.3127, - "step": 225330 - }, - { - "epoch": 0.39, - "learning_rate": 3.0351705688884862e-05, - "loss": 2.2784, - "step": 225340 - }, - { - "epoch": 0.39, - "learning_rate": 3.0350833748958036e-05, - "loss": 2.6192, - "step": 225350 - }, - { - "epoch": 0.39, - "learning_rate": 3.0349961809031206e-05, - "loss": 2.4833, - "step": 225360 - }, - { - "epoch": 0.39, - "learning_rate": 3.034908986910438e-05, - "loss": 2.4617, - "step": 225370 - }, - { - "epoch": 0.39, - "learning_rate": 3.0348217929177554e-05, - "loss": 2.4573, - "step": 225380 - }, - { - "epoch": 0.39, - "learning_rate": 3.0347345989250724e-05, - "loss": 2.4162, - "step": 225390 - }, - { - "epoch": 0.39, - "learning_rate": 3.0346474049323898e-05, - "loss": 2.4023, - "step": 225400 - }, - { - "epoch": 0.39, - "learning_rate": 3.0345602109397068e-05, - "loss": 2.3175, - "step": 225410 - }, - { - "epoch": 0.39, - "learning_rate": 3.034473016947025e-05, - "loss": 2.2769, - "step": 225420 - }, - { - "epoch": 0.39, - "learning_rate": 3.034385822954342e-05, - "loss": 2.4227, - "step": 225430 - }, - { - "epoch": 0.39, - "learning_rate": 3.0342986289616593e-05, - "loss": 2.3806, - "step": 225440 - }, - { - "epoch": 0.39, - "learning_rate": 3.0342114349689767e-05, - "loss": 2.4387, - "step": 225450 - }, - { - "epoch": 0.39, - "learning_rate": 3.0341242409762937e-05, - "loss": 2.4675, - "step": 225460 - }, - { - "epoch": 0.39, - "learning_rate": 3.034037046983611e-05, - "loss": 2.5192, - "step": 225470 - }, - { - "epoch": 0.39, - "learning_rate": 3.033949852990928e-05, - "loss": 2.3135, - "step": 225480 - }, - { - "epoch": 0.39, - "learning_rate": 3.0338626589982462e-05, - "loss": 2.5263, - "step": 225490 - }, - { - "epoch": 0.39, - "learning_rate": 3.0337754650055632e-05, - "loss": 2.3496, - "step": 225500 - }, - { - "epoch": 0.39, - "learning_rate": 3.0336882710128806e-05, - "loss": 2.3435, - "step": 225510 - }, - { - "epoch": 0.39, - "learning_rate": 3.0336010770201976e-05, - "loss": 2.535, - "step": 225520 - }, - { - "epoch": 0.39, - "learning_rate": 3.033513883027515e-05, - "loss": 2.3788, - "step": 225530 - }, - { - "epoch": 0.39, - "learning_rate": 3.0334266890348324e-05, - "loss": 2.3515, - "step": 225540 - }, - { - "epoch": 0.39, - "learning_rate": 3.0333394950421494e-05, - "loss": 2.436, - "step": 225550 - }, - { - "epoch": 0.39, - "learning_rate": 3.0332523010494668e-05, - "loss": 2.409, - "step": 225560 - }, - { - "epoch": 0.39, - "learning_rate": 3.0331651070567845e-05, - "loss": 2.3702, - "step": 225570 - }, - { - "epoch": 0.39, - "learning_rate": 3.033077913064102e-05, - "loss": 2.4116, - "step": 225580 - }, - { - "epoch": 0.39, - "learning_rate": 3.032990719071419e-05, - "loss": 2.4258, - "step": 225590 - }, - { - "epoch": 0.39, - "learning_rate": 3.0329035250787363e-05, - "loss": 2.2385, - "step": 225600 - }, - { - "epoch": 0.39, - "learning_rate": 3.0328163310860537e-05, - "loss": 2.373, - "step": 225610 - }, - { - "epoch": 0.39, - "learning_rate": 3.0327291370933707e-05, - "loss": 2.4491, - "step": 225620 - }, - { - "epoch": 0.39, - "learning_rate": 3.032641943100688e-05, - "loss": 2.4426, - "step": 225630 - }, - { - "epoch": 0.39, - "learning_rate": 3.0325547491080058e-05, - "loss": 2.4065, - "step": 225640 - }, - { - "epoch": 0.39, - "learning_rate": 3.0324675551153232e-05, - "loss": 2.4683, - "step": 225650 - }, - { - "epoch": 0.39, - "learning_rate": 3.0323803611226402e-05, - "loss": 2.4709, - "step": 225660 - }, - { - "epoch": 0.39, - "learning_rate": 3.0322931671299576e-05, - "loss": 2.4263, - "step": 225670 - }, - { - "epoch": 0.39, - "learning_rate": 3.032205973137275e-05, - "loss": 2.349, - "step": 225680 - }, - { - "epoch": 0.39, - "learning_rate": 3.032118779144592e-05, - "loss": 2.3099, - "step": 225690 - }, - { - "epoch": 0.39, - "learning_rate": 3.0320315851519094e-05, - "loss": 2.4268, - "step": 225700 - }, - { - "epoch": 0.39, - "learning_rate": 3.0319443911592264e-05, - "loss": 2.322, - "step": 225710 - }, - { - "epoch": 0.39, - "learning_rate": 3.0318571971665445e-05, - "loss": 2.4065, - "step": 225720 - }, - { - "epoch": 0.39, - "learning_rate": 3.0317700031738615e-05, - "loss": 2.4813, - "step": 225730 - }, - { - "epoch": 0.39, - "learning_rate": 3.031682809181179e-05, - "loss": 2.4266, - "step": 225740 - }, - { - "epoch": 0.39, - "learning_rate": 3.031595615188496e-05, - "loss": 2.412, - "step": 225750 - }, - { - "epoch": 0.39, - "learning_rate": 3.0315084211958133e-05, - "loss": 2.3982, - "step": 225760 - }, - { - "epoch": 0.39, - "learning_rate": 3.0314212272031307e-05, - "loss": 2.3671, - "step": 225770 - }, - { - "epoch": 0.39, - "learning_rate": 3.0313340332104477e-05, - "loss": 2.4319, - "step": 225780 - }, - { - "epoch": 0.39, - "learning_rate": 3.0312468392177658e-05, - "loss": 2.4439, - "step": 225790 - }, - { - "epoch": 0.39, - "learning_rate": 3.031159645225083e-05, - "loss": 2.4768, - "step": 225800 - }, - { - "epoch": 0.39, - "learning_rate": 3.0310724512324002e-05, - "loss": 2.4285, - "step": 225810 - }, - { - "epoch": 0.39, - "learning_rate": 3.0309852572397172e-05, - "loss": 2.4034, - "step": 225820 - }, - { - "epoch": 0.39, - "learning_rate": 3.0308980632470346e-05, - "loss": 2.4057, - "step": 225830 - }, - { - "epoch": 0.39, - "learning_rate": 3.030810869254352e-05, - "loss": 2.3801, - "step": 225840 - }, - { - "epoch": 0.39, - "learning_rate": 3.030723675261669e-05, - "loss": 2.3933, - "step": 225850 - }, - { - "epoch": 0.39, - "learning_rate": 3.0306364812689864e-05, - "loss": 2.5, - "step": 225860 - }, - { - "epoch": 0.39, - "learning_rate": 3.030549287276304e-05, - "loss": 2.3594, - "step": 225870 - }, - { - "epoch": 0.39, - "learning_rate": 3.0304620932836215e-05, - "loss": 2.3141, - "step": 225880 - }, - { - "epoch": 0.39, - "learning_rate": 3.0303748992909385e-05, - "loss": 2.3865, - "step": 225890 - }, - { - "epoch": 0.39, - "learning_rate": 3.030287705298256e-05, - "loss": 2.4548, - "step": 225900 - }, - { - "epoch": 0.39, - "learning_rate": 3.0302005113055733e-05, - "loss": 2.3357, - "step": 225910 - }, - { - "epoch": 0.39, - "learning_rate": 3.0301133173128903e-05, - "loss": 2.3785, - "step": 225920 - }, - { - "epoch": 0.39, - "learning_rate": 3.0300261233202077e-05, - "loss": 2.4292, - "step": 225930 - }, - { - "epoch": 0.39, - "learning_rate": 3.0299389293275254e-05, - "loss": 2.3921, - "step": 225940 - }, - { - "epoch": 0.39, - "learning_rate": 3.0298517353348428e-05, - "loss": 2.4895, - "step": 225950 - }, - { - "epoch": 0.39, - "learning_rate": 3.02976454134216e-05, - "loss": 2.3358, - "step": 225960 - }, - { - "epoch": 0.39, - "learning_rate": 3.0296773473494772e-05, - "loss": 2.4065, - "step": 225970 - }, - { - "epoch": 0.39, - "learning_rate": 3.0295901533567943e-05, - "loss": 2.5033, - "step": 225980 - }, - { - "epoch": 0.39, - "learning_rate": 3.0295029593641116e-05, - "loss": 2.3803, - "step": 225990 - }, - { - "epoch": 0.39, - "learning_rate": 3.029415765371429e-05, - "loss": 2.3797, - "step": 226000 - }, - { - "epoch": 0.39, - "learning_rate": 3.0293285713787467e-05, - "loss": 2.3428, - "step": 226010 - }, - { - "epoch": 0.39, - "learning_rate": 3.029241377386064e-05, - "loss": 2.467, - "step": 226020 - }, - { - "epoch": 0.39, - "learning_rate": 3.029154183393381e-05, - "loss": 2.4685, - "step": 226030 - }, - { - "epoch": 0.39, - "learning_rate": 3.0290669894006985e-05, - "loss": 2.3942, - "step": 226040 - }, - { - "epoch": 0.39, - "learning_rate": 3.0289797954080156e-05, - "loss": 2.3762, - "step": 226050 - }, - { - "epoch": 0.39, - "learning_rate": 3.028892601415333e-05, - "loss": 2.4003, - "step": 226060 - }, - { - "epoch": 0.39, - "learning_rate": 3.0288054074226503e-05, - "loss": 2.43, - "step": 226070 - }, - { - "epoch": 0.39, - "learning_rate": 3.0287182134299674e-05, - "loss": 2.3512, - "step": 226080 - }, - { - "epoch": 0.39, - "learning_rate": 3.028631019437285e-05, - "loss": 2.4463, - "step": 226090 - }, - { - "epoch": 0.39, - "learning_rate": 3.0285438254446025e-05, - "loss": 2.4047, - "step": 226100 - }, - { - "epoch": 0.39, - "learning_rate": 3.0284566314519198e-05, - "loss": 2.4535, - "step": 226110 - }, - { - "epoch": 0.39, - "learning_rate": 3.028369437459237e-05, - "loss": 2.5024, - "step": 226120 - }, - { - "epoch": 0.39, - "learning_rate": 3.0282822434665542e-05, - "loss": 2.4391, - "step": 226130 - }, - { - "epoch": 0.39, - "learning_rate": 3.0281950494738713e-05, - "loss": 2.3483, - "step": 226140 - }, - { - "epoch": 0.39, - "learning_rate": 3.0281078554811887e-05, - "loss": 2.3273, - "step": 226150 - }, - { - "epoch": 0.39, - "learning_rate": 3.0280206614885064e-05, - "loss": 2.3908, - "step": 226160 - }, - { - "epoch": 0.39, - "learning_rate": 3.0279334674958238e-05, - "loss": 2.3576, - "step": 226170 - }, - { - "epoch": 0.39, - "learning_rate": 3.027846273503141e-05, - "loss": 2.4335, - "step": 226180 - }, - { - "epoch": 0.39, - "learning_rate": 3.027759079510458e-05, - "loss": 2.3814, - "step": 226190 - }, - { - "epoch": 0.39, - "learning_rate": 3.0276718855177755e-05, - "loss": 2.3871, - "step": 226200 - }, - { - "epoch": 0.39, - "learning_rate": 3.0275846915250926e-05, - "loss": 2.4505, - "step": 226210 - }, - { - "epoch": 0.39, - "learning_rate": 3.02749749753241e-05, - "loss": 2.4326, - "step": 226220 - }, - { - "epoch": 0.39, - "learning_rate": 3.0274103035397273e-05, - "loss": 2.4177, - "step": 226230 - }, - { - "epoch": 0.39, - "learning_rate": 3.027323109547045e-05, - "loss": 2.2896, - "step": 226240 - }, - { - "epoch": 0.39, - "learning_rate": 3.027235915554362e-05, - "loss": 2.432, - "step": 226250 - }, - { - "epoch": 0.39, - "learning_rate": 3.0271487215616795e-05, - "loss": 2.3497, - "step": 226260 - }, - { - "epoch": 0.39, - "learning_rate": 3.027061527568997e-05, - "loss": 2.3282, - "step": 226270 - }, - { - "epoch": 0.39, - "learning_rate": 3.026974333576314e-05, - "loss": 2.3653, - "step": 226280 - }, - { - "epoch": 0.39, - "learning_rate": 3.0268871395836313e-05, - "loss": 2.4103, - "step": 226290 - }, - { - "epoch": 0.39, - "learning_rate": 3.0267999455909486e-05, - "loss": 2.3864, - "step": 226300 - }, - { - "epoch": 0.39, - "learning_rate": 3.0267127515982664e-05, - "loss": 2.3398, - "step": 226310 - }, - { - "epoch": 0.39, - "learning_rate": 3.0266255576055834e-05, - "loss": 2.4603, - "step": 226320 - }, - { - "epoch": 0.39, - "learning_rate": 3.0265383636129008e-05, - "loss": 2.3761, - "step": 226330 - }, - { - "epoch": 0.39, - "learning_rate": 3.026451169620218e-05, - "loss": 2.3793, - "step": 226340 - }, - { - "epoch": 0.39, - "learning_rate": 3.0263639756275352e-05, - "loss": 2.3495, - "step": 226350 - }, - { - "epoch": 0.39, - "learning_rate": 3.0262767816348526e-05, - "loss": 2.4354, - "step": 226360 - }, - { - "epoch": 0.39, - "learning_rate": 3.0261895876421696e-05, - "loss": 2.3685, - "step": 226370 - }, - { - "epoch": 0.39, - "learning_rate": 3.026102393649487e-05, - "loss": 2.3611, - "step": 226380 - }, - { - "epoch": 0.39, - "learning_rate": 3.0260151996568047e-05, - "loss": 2.3234, - "step": 226390 - }, - { - "epoch": 0.39, - "learning_rate": 3.025928005664122e-05, - "loss": 2.3781, - "step": 226400 - }, - { - "epoch": 0.39, - "learning_rate": 3.0258408116714394e-05, - "loss": 2.3883, - "step": 226410 - }, - { - "epoch": 0.39, - "learning_rate": 3.0257536176787565e-05, - "loss": 2.2465, - "step": 226420 - }, - { - "epoch": 0.39, - "learning_rate": 3.025666423686074e-05, - "loss": 2.399, - "step": 226430 - }, - { - "epoch": 0.39, - "learning_rate": 3.025579229693391e-05, - "loss": 2.3755, - "step": 226440 - }, - { - "epoch": 0.39, - "learning_rate": 3.0254920357007083e-05, - "loss": 2.3924, - "step": 226450 - }, - { - "epoch": 0.39, - "learning_rate": 3.025404841708026e-05, - "loss": 2.4485, - "step": 226460 - }, - { - "epoch": 0.39, - "learning_rate": 3.0253176477153434e-05, - "loss": 2.3306, - "step": 226470 - }, - { - "epoch": 0.39, - "learning_rate": 3.0252304537226604e-05, - "loss": 2.4167, - "step": 226480 - }, - { - "epoch": 0.39, - "learning_rate": 3.0251432597299778e-05, - "loss": 2.3332, - "step": 226490 - }, - { - "epoch": 0.39, - "learning_rate": 3.025056065737295e-05, - "loss": 2.4247, - "step": 226500 - }, - { - "epoch": 0.4, - "learning_rate": 3.0249688717446122e-05, - "loss": 2.4381, - "step": 226510 - }, - { - "epoch": 0.4, - "learning_rate": 3.0248816777519296e-05, - "loss": 2.4718, - "step": 226520 - }, - { - "epoch": 0.4, - "learning_rate": 3.0247944837592473e-05, - "loss": 2.3527, - "step": 226530 - }, - { - "epoch": 0.4, - "learning_rate": 3.0247072897665647e-05, - "loss": 2.4868, - "step": 226540 - }, - { - "epoch": 0.4, - "learning_rate": 3.0246200957738817e-05, - "loss": 2.3517, - "step": 226550 - }, - { - "epoch": 0.4, - "learning_rate": 3.024532901781199e-05, - "loss": 2.3166, - "step": 226560 - }, - { - "epoch": 0.4, - "learning_rate": 3.0244457077885165e-05, - "loss": 2.4129, - "step": 226570 - }, - { - "epoch": 0.4, - "learning_rate": 3.0243585137958335e-05, - "loss": 2.4178, - "step": 226580 - }, - { - "epoch": 0.4, - "learning_rate": 3.024271319803151e-05, - "loss": 2.3208, - "step": 226590 - }, - { - "epoch": 0.4, - "learning_rate": 3.024184125810468e-05, - "loss": 2.3817, - "step": 226600 - }, - { - "epoch": 0.4, - "learning_rate": 3.024096931817786e-05, - "loss": 2.3739, - "step": 226610 - }, - { - "epoch": 0.4, - "learning_rate": 3.024009737825103e-05, - "loss": 2.5773, - "step": 226620 - }, - { - "epoch": 0.4, - "learning_rate": 3.0239225438324204e-05, - "loss": 2.323, - "step": 226630 - }, - { - "epoch": 0.4, - "learning_rate": 3.0238353498397378e-05, - "loss": 2.3837, - "step": 226640 - }, - { - "epoch": 0.4, - "learning_rate": 3.0237481558470548e-05, - "loss": 2.3738, - "step": 226650 - }, - { - "epoch": 0.4, - "learning_rate": 3.0236609618543722e-05, - "loss": 2.3874, - "step": 226660 - }, - { - "epoch": 0.4, - "learning_rate": 3.0235737678616892e-05, - "loss": 2.4332, - "step": 226670 - }, - { - "epoch": 0.4, - "learning_rate": 3.0234865738690073e-05, - "loss": 2.4773, - "step": 226680 - }, - { - "epoch": 0.4, - "learning_rate": 3.0233993798763243e-05, - "loss": 2.3665, - "step": 226690 - }, - { - "epoch": 0.4, - "learning_rate": 3.0233121858836417e-05, - "loss": 2.4199, - "step": 226700 - }, - { - "epoch": 0.4, - "learning_rate": 3.0232249918909587e-05, - "loss": 2.3063, - "step": 226710 - }, - { - "epoch": 0.4, - "learning_rate": 3.023137797898276e-05, - "loss": 2.4337, - "step": 226720 - }, - { - "epoch": 0.4, - "learning_rate": 3.0230506039055935e-05, - "loss": 2.3752, - "step": 226730 - }, - { - "epoch": 0.4, - "learning_rate": 3.0229634099129105e-05, - "loss": 2.3728, - "step": 226740 - }, - { - "epoch": 0.4, - "learning_rate": 3.022876215920228e-05, - "loss": 2.3931, - "step": 226750 - }, - { - "epoch": 0.4, - "learning_rate": 3.0227890219275456e-05, - "loss": 2.3843, - "step": 226760 - }, - { - "epoch": 0.4, - "learning_rate": 3.022701827934863e-05, - "loss": 2.4598, - "step": 226770 - }, - { - "epoch": 0.4, - "learning_rate": 3.02261463394218e-05, - "loss": 2.3631, - "step": 226780 - }, - { - "epoch": 0.4, - "learning_rate": 3.0225274399494974e-05, - "loss": 2.4687, - "step": 226790 - }, - { - "epoch": 0.4, - "learning_rate": 3.0224402459568148e-05, - "loss": 2.4595, - "step": 226800 - }, - { - "epoch": 0.4, - "learning_rate": 3.0223530519641318e-05, - "loss": 2.2797, - "step": 226810 - }, - { - "epoch": 0.4, - "learning_rate": 3.0222658579714492e-05, - "loss": 2.3264, - "step": 226820 - }, - { - "epoch": 0.4, - "learning_rate": 3.022178663978767e-05, - "loss": 2.4372, - "step": 226830 - }, - { - "epoch": 0.4, - "learning_rate": 3.0220914699860843e-05, - "loss": 2.366, - "step": 226840 - }, - { - "epoch": 0.4, - "learning_rate": 3.0220042759934013e-05, - "loss": 2.5229, - "step": 226850 - }, - { - "epoch": 0.4, - "learning_rate": 3.0219170820007187e-05, - "loss": 2.4639, - "step": 226860 - }, - { - "epoch": 0.4, - "learning_rate": 3.0218298880080357e-05, - "loss": 2.5099, - "step": 226870 - }, - { - "epoch": 0.4, - "learning_rate": 3.021742694015353e-05, - "loss": 2.3158, - "step": 226880 - }, - { - "epoch": 0.4, - "learning_rate": 3.0216555000226705e-05, - "loss": 2.5115, - "step": 226890 - }, - { - "epoch": 0.4, - "learning_rate": 3.0215683060299875e-05, - "loss": 2.2579, - "step": 226900 - }, - { - "epoch": 0.4, - "learning_rate": 3.0214811120373056e-05, - "loss": 2.4728, - "step": 226910 - }, - { - "epoch": 0.4, - "learning_rate": 3.0213939180446226e-05, - "loss": 2.414, - "step": 226920 - }, - { - "epoch": 0.4, - "learning_rate": 3.02130672405194e-05, - "loss": 2.2534, - "step": 226930 - }, - { - "epoch": 0.4, - "learning_rate": 3.021219530059257e-05, - "loss": 2.4101, - "step": 226940 - }, - { - "epoch": 0.4, - "learning_rate": 3.0211323360665744e-05, - "loss": 2.3455, - "step": 226950 - }, - { - "epoch": 0.4, - "learning_rate": 3.0210451420738918e-05, - "loss": 2.3973, - "step": 226960 - }, - { - "epoch": 0.4, - "learning_rate": 3.0209579480812088e-05, - "loss": 2.3894, - "step": 226970 - }, - { - "epoch": 0.4, - "learning_rate": 3.0208707540885265e-05, - "loss": 2.3961, - "step": 226980 - }, - { - "epoch": 0.4, - "learning_rate": 3.020783560095844e-05, - "loss": 2.318, - "step": 226990 - }, - { - "epoch": 0.4, - "learning_rate": 3.0206963661031613e-05, - "loss": 2.3494, - "step": 227000 - }, - { - "epoch": 0.4, - "learning_rate": 3.0206091721104783e-05, - "loss": 2.3643, - "step": 227010 - }, - { - "epoch": 0.4, - "learning_rate": 3.0205219781177957e-05, - "loss": 2.4532, - "step": 227020 - }, - { - "epoch": 0.4, - "learning_rate": 3.020434784125113e-05, - "loss": 2.3542, - "step": 227030 - }, - { - "epoch": 0.4, - "learning_rate": 3.02034759013243e-05, - "loss": 2.4696, - "step": 227040 - }, - { - "epoch": 0.4, - "learning_rate": 3.0202603961397475e-05, - "loss": 2.3853, - "step": 227050 - }, - { - "epoch": 0.4, - "learning_rate": 3.0201732021470652e-05, - "loss": 2.3982, - "step": 227060 - }, - { - "epoch": 0.4, - "learning_rate": 3.0200860081543826e-05, - "loss": 2.3299, - "step": 227070 - }, - { - "epoch": 0.4, - "learning_rate": 3.0199988141616996e-05, - "loss": 2.2973, - "step": 227080 - }, - { - "epoch": 0.4, - "learning_rate": 3.019911620169017e-05, - "loss": 2.2964, - "step": 227090 - }, - { - "epoch": 0.4, - "learning_rate": 3.019824426176334e-05, - "loss": 2.4338, - "step": 227100 - }, - { - "epoch": 0.4, - "learning_rate": 3.0197372321836514e-05, - "loss": 2.4077, - "step": 227110 - }, - { - "epoch": 0.4, - "learning_rate": 3.0196500381909688e-05, - "loss": 2.4755, - "step": 227120 - }, - { - "epoch": 0.4, - "learning_rate": 3.0195628441982865e-05, - "loss": 2.3625, - "step": 227130 - }, - { - "epoch": 0.4, - "learning_rate": 3.019475650205604e-05, - "loss": 2.3995, - "step": 227140 - }, - { - "epoch": 0.4, - "learning_rate": 3.019388456212921e-05, - "loss": 2.3064, - "step": 227150 - }, - { - "epoch": 0.4, - "learning_rate": 3.0193012622202383e-05, - "loss": 2.514, - "step": 227160 - }, - { - "epoch": 0.4, - "learning_rate": 3.0192140682275554e-05, - "loss": 2.4118, - "step": 227170 - }, - { - "epoch": 0.4, - "learning_rate": 3.0191268742348727e-05, - "loss": 2.4492, - "step": 227180 - }, - { - "epoch": 0.4, - "learning_rate": 3.01903968024219e-05, - "loss": 2.3609, - "step": 227190 - }, - { - "epoch": 0.4, - "learning_rate": 3.0189524862495078e-05, - "loss": 2.3885, - "step": 227200 - }, - { - "epoch": 0.4, - "learning_rate": 3.018865292256825e-05, - "loss": 2.299, - "step": 227210 - }, - { - "epoch": 0.4, - "learning_rate": 3.0187780982641422e-05, - "loss": 2.4592, - "step": 227220 - }, - { - "epoch": 0.4, - "learning_rate": 3.0186909042714596e-05, - "loss": 2.4248, - "step": 227230 - }, - { - "epoch": 0.4, - "learning_rate": 3.0186037102787767e-05, - "loss": 2.4355, - "step": 227240 - }, - { - "epoch": 0.4, - "learning_rate": 3.018516516286094e-05, - "loss": 2.3305, - "step": 227250 - }, - { - "epoch": 0.4, - "learning_rate": 3.0184293222934114e-05, - "loss": 2.2941, - "step": 227260 - }, - { - "epoch": 0.4, - "learning_rate": 3.0183421283007284e-05, - "loss": 2.3142, - "step": 227270 - }, - { - "epoch": 0.4, - "learning_rate": 3.018254934308046e-05, - "loss": 2.3326, - "step": 227280 - }, - { - "epoch": 0.4, - "learning_rate": 3.0181677403153635e-05, - "loss": 2.3414, - "step": 227290 - }, - { - "epoch": 0.4, - "learning_rate": 3.018080546322681e-05, - "loss": 2.432, - "step": 227300 - }, - { - "epoch": 0.4, - "learning_rate": 3.017993352329998e-05, - "loss": 2.4447, - "step": 227310 - }, - { - "epoch": 0.4, - "learning_rate": 3.0179061583373153e-05, - "loss": 2.4573, - "step": 227320 - }, - { - "epoch": 0.4, - "learning_rate": 3.0178189643446324e-05, - "loss": 2.3553, - "step": 227330 - }, - { - "epoch": 0.4, - "learning_rate": 3.0177317703519497e-05, - "loss": 2.3828, - "step": 227340 - }, - { - "epoch": 0.4, - "learning_rate": 3.0176445763592675e-05, - "loss": 2.3889, - "step": 227350 - }, - { - "epoch": 0.4, - "learning_rate": 3.017557382366585e-05, - "loss": 2.365, - "step": 227360 - }, - { - "epoch": 0.4, - "learning_rate": 3.0174701883739022e-05, - "loss": 2.3453, - "step": 227370 - }, - { - "epoch": 0.4, - "learning_rate": 3.0173829943812193e-05, - "loss": 2.4413, - "step": 227380 - }, - { - "epoch": 0.4, - "learning_rate": 3.0172958003885366e-05, - "loss": 2.2904, - "step": 227390 - }, - { - "epoch": 0.4, - "learning_rate": 3.0172086063958537e-05, - "loss": 2.444, - "step": 227400 - }, - { - "epoch": 0.4, - "learning_rate": 3.017121412403171e-05, - "loss": 2.4488, - "step": 227410 - }, - { - "epoch": 0.4, - "learning_rate": 3.0170342184104884e-05, - "loss": 2.3999, - "step": 227420 - }, - { - "epoch": 0.4, - "learning_rate": 3.016947024417806e-05, - "loss": 2.481, - "step": 227430 - }, - { - "epoch": 0.4, - "learning_rate": 3.0168598304251232e-05, - "loss": 2.4047, - "step": 227440 - }, - { - "epoch": 0.4, - "learning_rate": 3.0167726364324406e-05, - "loss": 2.4211, - "step": 227450 - }, - { - "epoch": 0.4, - "learning_rate": 3.016685442439758e-05, - "loss": 2.4031, - "step": 227460 - }, - { - "epoch": 0.4, - "learning_rate": 3.016598248447075e-05, - "loss": 2.4026, - "step": 227470 - }, - { - "epoch": 0.4, - "learning_rate": 3.0165110544543923e-05, - "loss": 2.3315, - "step": 227480 - }, - { - "epoch": 0.4, - "learning_rate": 3.0164238604617094e-05, - "loss": 2.6336, - "step": 227490 - }, - { - "epoch": 0.4, - "learning_rate": 3.0163366664690274e-05, - "loss": 2.3936, - "step": 227500 - }, - { - "epoch": 0.4, - "learning_rate": 3.0162494724763445e-05, - "loss": 2.4873, - "step": 227510 - }, - { - "epoch": 0.4, - "learning_rate": 3.016162278483662e-05, - "loss": 2.4723, - "step": 227520 - }, - { - "epoch": 0.4, - "learning_rate": 3.0160750844909792e-05, - "loss": 2.2936, - "step": 227530 - }, - { - "epoch": 0.4, - "learning_rate": 3.0159878904982963e-05, - "loss": 2.4943, - "step": 227540 - }, - { - "epoch": 0.4, - "learning_rate": 3.0159006965056136e-05, - "loss": 2.436, - "step": 227550 - }, - { - "epoch": 0.4, - "learning_rate": 3.0158135025129307e-05, - "loss": 2.3665, - "step": 227560 - }, - { - "epoch": 0.4, - "learning_rate": 3.015726308520248e-05, - "loss": 2.4892, - "step": 227570 - }, - { - "epoch": 0.4, - "learning_rate": 3.0156391145275658e-05, - "loss": 2.3677, - "step": 227580 - }, - { - "epoch": 0.4, - "learning_rate": 3.015551920534883e-05, - "loss": 2.3982, - "step": 227590 - }, - { - "epoch": 0.4, - "learning_rate": 3.0154647265422002e-05, - "loss": 2.3381, - "step": 227600 - }, - { - "epoch": 0.4, - "learning_rate": 3.0153775325495176e-05, - "loss": 2.3726, - "step": 227610 - }, - { - "epoch": 0.4, - "learning_rate": 3.015290338556835e-05, - "loss": 2.4701, - "step": 227620 - }, - { - "epoch": 0.4, - "learning_rate": 3.015203144564152e-05, - "loss": 2.3526, - "step": 227630 - }, - { - "epoch": 0.4, - "learning_rate": 3.0151159505714694e-05, - "loss": 2.3782, - "step": 227640 - }, - { - "epoch": 0.4, - "learning_rate": 3.015028756578787e-05, - "loss": 2.3786, - "step": 227650 - }, - { - "epoch": 0.4, - "learning_rate": 3.0149415625861045e-05, - "loss": 2.3287, - "step": 227660 - }, - { - "epoch": 0.4, - "learning_rate": 3.0148543685934215e-05, - "loss": 2.5151, - "step": 227670 - }, - { - "epoch": 0.4, - "learning_rate": 3.014767174600739e-05, - "loss": 2.4618, - "step": 227680 - }, - { - "epoch": 0.4, - "learning_rate": 3.0146799806080562e-05, - "loss": 2.4114, - "step": 227690 - }, - { - "epoch": 0.4, - "learning_rate": 3.0145927866153733e-05, - "loss": 2.4437, - "step": 227700 - }, - { - "epoch": 0.4, - "learning_rate": 3.0145055926226907e-05, - "loss": 2.3955, - "step": 227710 - }, - { - "epoch": 0.4, - "learning_rate": 3.0144183986300077e-05, - "loss": 2.3003, - "step": 227720 - }, - { - "epoch": 0.4, - "learning_rate": 3.0143312046373258e-05, - "loss": 2.4035, - "step": 227730 - }, - { - "epoch": 0.4, - "learning_rate": 3.0142440106446428e-05, - "loss": 2.4513, - "step": 227740 - }, - { - "epoch": 0.4, - "learning_rate": 3.01415681665196e-05, - "loss": 2.5157, - "step": 227750 - }, - { - "epoch": 0.4, - "learning_rate": 3.0140696226592775e-05, - "loss": 2.4375, - "step": 227760 - }, - { - "epoch": 0.4, - "learning_rate": 3.0139824286665946e-05, - "loss": 2.4091, - "step": 227770 - }, - { - "epoch": 0.4, - "learning_rate": 3.013895234673912e-05, - "loss": 2.3912, - "step": 227780 - }, - { - "epoch": 0.4, - "learning_rate": 3.013808040681229e-05, - "loss": 2.3237, - "step": 227790 - }, - { - "epoch": 0.4, - "learning_rate": 3.013720846688547e-05, - "loss": 2.4231, - "step": 227800 - }, - { - "epoch": 0.4, - "learning_rate": 3.013633652695864e-05, - "loss": 2.4252, - "step": 227810 - }, - { - "epoch": 0.4, - "learning_rate": 3.0135464587031815e-05, - "loss": 2.4417, - "step": 227820 - }, - { - "epoch": 0.4, - "learning_rate": 3.0134592647104985e-05, - "loss": 2.2845, - "step": 227830 - }, - { - "epoch": 0.4, - "learning_rate": 3.013372070717816e-05, - "loss": 2.3971, - "step": 227840 - }, - { - "epoch": 0.4, - "learning_rate": 3.0132848767251333e-05, - "loss": 2.5129, - "step": 227850 - }, - { - "epoch": 0.4, - "learning_rate": 3.0131976827324503e-05, - "loss": 2.3793, - "step": 227860 - }, - { - "epoch": 0.4, - "learning_rate": 3.0131104887397684e-05, - "loss": 2.3622, - "step": 227870 - }, - { - "epoch": 0.4, - "learning_rate": 3.0130232947470854e-05, - "loss": 2.387, - "step": 227880 - }, - { - "epoch": 0.4, - "learning_rate": 3.0129361007544028e-05, - "loss": 2.4549, - "step": 227890 - }, - { - "epoch": 0.4, - "learning_rate": 3.0128489067617198e-05, - "loss": 2.2664, - "step": 227900 - }, - { - "epoch": 0.4, - "learning_rate": 3.0127617127690372e-05, - "loss": 2.3122, - "step": 227910 - }, - { - "epoch": 0.4, - "learning_rate": 3.0126745187763546e-05, - "loss": 2.3408, - "step": 227920 - }, - { - "epoch": 0.4, - "learning_rate": 3.0125873247836716e-05, - "loss": 2.4657, - "step": 227930 - }, - { - "epoch": 0.4, - "learning_rate": 3.012500130790989e-05, - "loss": 2.3683, - "step": 227940 - }, - { - "epoch": 0.4, - "learning_rate": 3.0124129367983067e-05, - "loss": 2.3707, - "step": 227950 - }, - { - "epoch": 0.4, - "learning_rate": 3.012325742805624e-05, - "loss": 2.3308, - "step": 227960 - }, - { - "epoch": 0.4, - "learning_rate": 3.012238548812941e-05, - "loss": 2.4199, - "step": 227970 - }, - { - "epoch": 0.4, - "learning_rate": 3.0121513548202585e-05, - "loss": 2.3599, - "step": 227980 - }, - { - "epoch": 0.4, - "learning_rate": 3.012064160827576e-05, - "loss": 2.4091, - "step": 227990 - }, - { - "epoch": 0.4, - "learning_rate": 3.011976966834893e-05, - "loss": 2.3792, - "step": 228000 - }, - { - "epoch": 0.4, - "learning_rate": 3.0118897728422103e-05, - "loss": 2.3181, - "step": 228010 - }, - { - "epoch": 0.4, - "learning_rate": 3.011802578849528e-05, - "loss": 2.4577, - "step": 228020 - }, - { - "epoch": 0.4, - "learning_rate": 3.0117153848568454e-05, - "loss": 2.3489, - "step": 228030 - }, - { - "epoch": 0.4, - "learning_rate": 3.0116281908641624e-05, - "loss": 2.427, - "step": 228040 - }, - { - "epoch": 0.4, - "learning_rate": 3.0115409968714798e-05, - "loss": 2.3569, - "step": 228050 - }, - { - "epoch": 0.4, - "learning_rate": 3.0114538028787968e-05, - "loss": 2.4005, - "step": 228060 - }, - { - "epoch": 0.4, - "learning_rate": 3.0113666088861142e-05, - "loss": 2.4095, - "step": 228070 - }, - { - "epoch": 0.4, - "learning_rate": 3.0112794148934316e-05, - "loss": 2.4533, - "step": 228080 - }, - { - "epoch": 0.4, - "learning_rate": 3.0111922209007486e-05, - "loss": 2.4458, - "step": 228090 - }, - { - "epoch": 0.4, - "learning_rate": 3.0111050269080667e-05, - "loss": 2.3545, - "step": 228100 - }, - { - "epoch": 0.4, - "learning_rate": 3.0110178329153837e-05, - "loss": 2.4627, - "step": 228110 - }, - { - "epoch": 0.4, - "learning_rate": 3.010930638922701e-05, - "loss": 2.4283, - "step": 228120 - }, - { - "epoch": 0.4, - "learning_rate": 3.010843444930018e-05, - "loss": 2.4013, - "step": 228130 - }, - { - "epoch": 0.4, - "learning_rate": 3.0107562509373355e-05, - "loss": 2.5265, - "step": 228140 - }, - { - "epoch": 0.4, - "learning_rate": 3.010669056944653e-05, - "loss": 2.3931, - "step": 228150 - }, - { - "epoch": 0.4, - "learning_rate": 3.01058186295197e-05, - "loss": 2.4469, - "step": 228160 - }, - { - "epoch": 0.4, - "learning_rate": 3.0104946689592876e-05, - "loss": 2.3986, - "step": 228170 - }, - { - "epoch": 0.4, - "learning_rate": 3.010407474966605e-05, - "loss": 2.3571, - "step": 228180 - }, - { - "epoch": 0.4, - "learning_rate": 3.0103202809739224e-05, - "loss": 2.4391, - "step": 228190 - }, - { - "epoch": 0.4, - "learning_rate": 3.0102330869812394e-05, - "loss": 2.2686, - "step": 228200 - }, - { - "epoch": 0.4, - "learning_rate": 3.0101458929885568e-05, - "loss": 2.3176, - "step": 228210 - }, - { - "epoch": 0.4, - "learning_rate": 3.010058698995874e-05, - "loss": 2.3909, - "step": 228220 - }, - { - "epoch": 0.4, - "learning_rate": 3.0099715050031912e-05, - "loss": 2.4523, - "step": 228230 - }, - { - "epoch": 0.4, - "learning_rate": 3.0098843110105086e-05, - "loss": 2.3511, - "step": 228240 - }, - { - "epoch": 0.4, - "learning_rate": 3.0097971170178263e-05, - "loss": 2.4388, - "step": 228250 - }, - { - "epoch": 0.4, - "learning_rate": 3.0097099230251437e-05, - "loss": 2.4159, - "step": 228260 - }, - { - "epoch": 0.4, - "learning_rate": 3.0096227290324607e-05, - "loss": 2.4936, - "step": 228270 - }, - { - "epoch": 0.4, - "learning_rate": 3.009535535039778e-05, - "loss": 2.4067, - "step": 228280 - }, - { - "epoch": 0.4, - "learning_rate": 3.009448341047095e-05, - "loss": 2.4244, - "step": 228290 - }, - { - "epoch": 0.4, - "learning_rate": 3.0093611470544125e-05, - "loss": 2.4004, - "step": 228300 - }, - { - "epoch": 0.4, - "learning_rate": 3.00927395306173e-05, - "loss": 2.3827, - "step": 228310 - }, - { - "epoch": 0.4, - "learning_rate": 3.0091867590690476e-05, - "loss": 2.4014, - "step": 228320 - }, - { - "epoch": 0.4, - "learning_rate": 3.0090995650763646e-05, - "loss": 2.3108, - "step": 228330 - }, - { - "epoch": 0.4, - "learning_rate": 3.009012371083682e-05, - "loss": 2.3752, - "step": 228340 - }, - { - "epoch": 0.4, - "learning_rate": 3.0089251770909994e-05, - "loss": 2.383, - "step": 228350 - }, - { - "epoch": 0.4, - "learning_rate": 3.0088379830983164e-05, - "loss": 2.4643, - "step": 228360 - }, - { - "epoch": 0.4, - "learning_rate": 3.0087507891056338e-05, - "loss": 2.3931, - "step": 228370 - }, - { - "epoch": 0.4, - "learning_rate": 3.0086635951129512e-05, - "loss": 2.4844, - "step": 228380 - }, - { - "epoch": 0.4, - "learning_rate": 3.008576401120269e-05, - "loss": 2.3707, - "step": 228390 - }, - { - "epoch": 0.4, - "learning_rate": 3.008489207127586e-05, - "loss": 2.4261, - "step": 228400 - }, - { - "epoch": 0.4, - "learning_rate": 3.0084020131349033e-05, - "loss": 2.2833, - "step": 228410 - }, - { - "epoch": 0.4, - "learning_rate": 3.0083148191422207e-05, - "loss": 2.4031, - "step": 228420 - }, - { - "epoch": 0.4, - "learning_rate": 3.0082276251495377e-05, - "loss": 2.379, - "step": 228430 - }, - { - "epoch": 0.4, - "learning_rate": 3.008140431156855e-05, - "loss": 2.4282, - "step": 228440 - }, - { - "epoch": 0.4, - "learning_rate": 3.008053237164172e-05, - "loss": 2.4186, - "step": 228450 - }, - { - "epoch": 0.4, - "learning_rate": 3.0079660431714895e-05, - "loss": 2.4015, - "step": 228460 - }, - { - "epoch": 0.4, - "learning_rate": 3.0078788491788072e-05, - "loss": 2.3768, - "step": 228470 - }, - { - "epoch": 0.4, - "learning_rate": 3.0077916551861246e-05, - "loss": 2.4324, - "step": 228480 - }, - { - "epoch": 0.4, - "learning_rate": 3.007704461193442e-05, - "loss": 2.3539, - "step": 228490 - }, - { - "epoch": 0.4, - "learning_rate": 3.007617267200759e-05, - "loss": 2.4593, - "step": 228500 - }, - { - "epoch": 0.4, - "learning_rate": 3.0075300732080764e-05, - "loss": 2.3541, - "step": 228510 - }, - { - "epoch": 0.4, - "learning_rate": 3.0074428792153935e-05, - "loss": 2.4687, - "step": 228520 - }, - { - "epoch": 0.4, - "learning_rate": 3.0073556852227108e-05, - "loss": 2.2957, - "step": 228530 - }, - { - "epoch": 0.4, - "learning_rate": 3.0072684912300285e-05, - "loss": 2.3712, - "step": 228540 - }, - { - "epoch": 0.4, - "learning_rate": 3.007181297237346e-05, - "loss": 2.3883, - "step": 228550 - }, - { - "epoch": 0.4, - "learning_rate": 3.007094103244663e-05, - "loss": 2.3947, - "step": 228560 - }, - { - "epoch": 0.4, - "learning_rate": 3.0070069092519803e-05, - "loss": 2.5382, - "step": 228570 - }, - { - "epoch": 0.4, - "learning_rate": 3.0069197152592977e-05, - "loss": 2.4176, - "step": 228580 - }, - { - "epoch": 0.4, - "learning_rate": 3.0068325212666148e-05, - "loss": 2.3864, - "step": 228590 - }, - { - "epoch": 0.4, - "learning_rate": 3.006745327273932e-05, - "loss": 2.3765, - "step": 228600 - }, - { - "epoch": 0.4, - "learning_rate": 3.0066581332812495e-05, - "loss": 2.501, - "step": 228610 - }, - { - "epoch": 0.4, - "learning_rate": 3.0065709392885672e-05, - "loss": 2.4984, - "step": 228620 - }, - { - "epoch": 0.4, - "learning_rate": 3.0064837452958843e-05, - "loss": 2.3528, - "step": 228630 - }, - { - "epoch": 0.4, - "learning_rate": 3.0063965513032016e-05, - "loss": 2.4372, - "step": 228640 - }, - { - "epoch": 0.4, - "learning_rate": 3.006309357310519e-05, - "loss": 2.4225, - "step": 228650 - }, - { - "epoch": 0.4, - "learning_rate": 3.006222163317836e-05, - "loss": 2.319, - "step": 228660 - }, - { - "epoch": 0.4, - "learning_rate": 3.0061349693251534e-05, - "loss": 2.2999, - "step": 228670 - }, - { - "epoch": 0.4, - "learning_rate": 3.0060477753324705e-05, - "loss": 2.4998, - "step": 228680 - }, - { - "epoch": 0.4, - "learning_rate": 3.0059605813397885e-05, - "loss": 2.4799, - "step": 228690 - }, - { - "epoch": 0.4, - "learning_rate": 3.0058733873471056e-05, - "loss": 2.3579, - "step": 228700 - }, - { - "epoch": 0.4, - "learning_rate": 3.005786193354423e-05, - "loss": 2.3289, - "step": 228710 - }, - { - "epoch": 0.4, - "learning_rate": 3.0056989993617403e-05, - "loss": 2.4426, - "step": 228720 - }, - { - "epoch": 0.4, - "learning_rate": 3.0056118053690574e-05, - "loss": 2.2476, - "step": 228730 - }, - { - "epoch": 0.4, - "learning_rate": 3.0055246113763747e-05, - "loss": 2.3682, - "step": 228740 - }, - { - "epoch": 0.4, - "learning_rate": 3.0054374173836918e-05, - "loss": 2.4564, - "step": 228750 - }, - { - "epoch": 0.4, - "learning_rate": 3.005350223391009e-05, - "loss": 2.3832, - "step": 228760 - }, - { - "epoch": 0.4, - "learning_rate": 3.005263029398327e-05, - "loss": 2.2879, - "step": 228770 - }, - { - "epoch": 0.4, - "learning_rate": 3.0051758354056442e-05, - "loss": 2.3397, - "step": 228780 - }, - { - "epoch": 0.4, - "learning_rate": 3.0050886414129613e-05, - "loss": 2.3987, - "step": 228790 - }, - { - "epoch": 0.4, - "learning_rate": 3.0050014474202787e-05, - "loss": 2.4077, - "step": 228800 - }, - { - "epoch": 0.4, - "learning_rate": 3.004914253427596e-05, - "loss": 2.5326, - "step": 228810 - }, - { - "epoch": 0.4, - "learning_rate": 3.004827059434913e-05, - "loss": 2.3357, - "step": 228820 - }, - { - "epoch": 0.4, - "learning_rate": 3.0047398654422304e-05, - "loss": 2.3913, - "step": 228830 - }, - { - "epoch": 0.4, - "learning_rate": 3.004652671449548e-05, - "loss": 2.3902, - "step": 228840 - }, - { - "epoch": 0.4, - "learning_rate": 3.0045654774568655e-05, - "loss": 2.4817, - "step": 228850 - }, - { - "epoch": 0.4, - "learning_rate": 3.0044782834641826e-05, - "loss": 2.4754, - "step": 228860 - }, - { - "epoch": 0.4, - "learning_rate": 3.0043910894715e-05, - "loss": 2.4379, - "step": 228870 - }, - { - "epoch": 0.4, - "learning_rate": 3.0043038954788173e-05, - "loss": 2.3033, - "step": 228880 - }, - { - "epoch": 0.4, - "learning_rate": 3.0042167014861344e-05, - "loss": 2.4105, - "step": 228890 - }, - { - "epoch": 0.4, - "learning_rate": 3.0041295074934517e-05, - "loss": 2.5305, - "step": 228900 - }, - { - "epoch": 0.4, - "learning_rate": 3.0040423135007688e-05, - "loss": 2.3499, - "step": 228910 - }, - { - "epoch": 0.4, - "learning_rate": 3.003955119508087e-05, - "loss": 2.4149, - "step": 228920 - }, - { - "epoch": 0.4, - "learning_rate": 3.003867925515404e-05, - "loss": 2.4941, - "step": 228930 - }, - { - "epoch": 0.4, - "learning_rate": 3.0037807315227213e-05, - "loss": 2.2913, - "step": 228940 - }, - { - "epoch": 0.4, - "learning_rate": 3.0036935375300383e-05, - "loss": 2.3685, - "step": 228950 - }, - { - "epoch": 0.4, - "learning_rate": 3.0036063435373557e-05, - "loss": 2.4812, - "step": 228960 - }, - { - "epoch": 0.4, - "learning_rate": 3.003519149544673e-05, - "loss": 2.3526, - "step": 228970 - }, - { - "epoch": 0.4, - "learning_rate": 3.00343195555199e-05, - "loss": 2.4114, - "step": 228980 - }, - { - "epoch": 0.4, - "learning_rate": 3.003344761559308e-05, - "loss": 2.4372, - "step": 228990 - }, - { - "epoch": 0.4, - "learning_rate": 3.0032575675666252e-05, - "loss": 2.3688, - "step": 229000 - }, - { - "epoch": 0.4, - "learning_rate": 3.0031703735739426e-05, - "loss": 2.5684, - "step": 229010 - }, - { - "epoch": 0.4, - "learning_rate": 3.0030831795812596e-05, - "loss": 2.3578, - "step": 229020 - }, - { - "epoch": 0.4, - "learning_rate": 3.002995985588577e-05, - "loss": 2.4591, - "step": 229030 - }, - { - "epoch": 0.4, - "learning_rate": 3.0029087915958943e-05, - "loss": 2.4633, - "step": 229040 - }, - { - "epoch": 0.4, - "learning_rate": 3.0028215976032114e-05, - "loss": 2.4424, - "step": 229050 - }, - { - "epoch": 0.4, - "learning_rate": 3.002734403610529e-05, - "loss": 2.39, - "step": 229060 - }, - { - "epoch": 0.4, - "learning_rate": 3.0026472096178465e-05, - "loss": 2.36, - "step": 229070 - }, - { - "epoch": 0.4, - "learning_rate": 3.002560015625164e-05, - "loss": 2.3392, - "step": 229080 - }, - { - "epoch": 0.4, - "learning_rate": 3.002472821632481e-05, - "loss": 2.4401, - "step": 229090 - }, - { - "epoch": 0.4, - "learning_rate": 3.0023856276397983e-05, - "loss": 2.4074, - "step": 229100 - }, - { - "epoch": 0.4, - "learning_rate": 3.0022984336471156e-05, - "loss": 2.4014, - "step": 229110 - }, - { - "epoch": 0.4, - "learning_rate": 3.0022112396544327e-05, - "loss": 2.4165, - "step": 229120 - }, - { - "epoch": 0.4, - "learning_rate": 3.00212404566175e-05, - "loss": 2.3409, - "step": 229130 - }, - { - "epoch": 0.4, - "learning_rate": 3.0020368516690678e-05, - "loss": 2.5605, - "step": 229140 - }, - { - "epoch": 0.4, - "learning_rate": 3.001949657676385e-05, - "loss": 2.41, - "step": 229150 - }, - { - "epoch": 0.4, - "learning_rate": 3.0018624636837022e-05, - "loss": 2.413, - "step": 229160 - }, - { - "epoch": 0.4, - "learning_rate": 3.0017752696910196e-05, - "loss": 2.5036, - "step": 229170 - }, - { - "epoch": 0.4, - "learning_rate": 3.0016880756983366e-05, - "loss": 2.3787, - "step": 229180 - }, - { - "epoch": 0.4, - "learning_rate": 3.001600881705654e-05, - "loss": 2.372, - "step": 229190 - }, - { - "epoch": 0.4, - "learning_rate": 3.0015136877129714e-05, - "loss": 2.5239, - "step": 229200 - }, - { - "epoch": 0.4, - "learning_rate": 3.001426493720289e-05, - "loss": 2.4654, - "step": 229210 - }, - { - "epoch": 0.4, - "learning_rate": 3.0013392997276065e-05, - "loss": 2.3772, - "step": 229220 - }, - { - "epoch": 0.4, - "learning_rate": 3.0012521057349235e-05, - "loss": 2.3126, - "step": 229230 - }, - { - "epoch": 0.4, - "learning_rate": 3.001164911742241e-05, - "loss": 2.2879, - "step": 229240 - }, - { - "epoch": 0.4, - "learning_rate": 3.001077717749558e-05, - "loss": 2.3368, - "step": 229250 - }, - { - "epoch": 0.4, - "learning_rate": 3.0009905237568753e-05, - "loss": 2.5277, - "step": 229260 - }, - { - "epoch": 0.4, - "learning_rate": 3.0009033297641927e-05, - "loss": 2.3847, - "step": 229270 - }, - { - "epoch": 0.4, - "learning_rate": 3.0008161357715097e-05, - "loss": 2.3436, - "step": 229280 - }, - { - "epoch": 0.4, - "learning_rate": 3.0007289417788274e-05, - "loss": 2.3717, - "step": 229290 - }, - { - "epoch": 0.4, - "learning_rate": 3.0006417477861448e-05, - "loss": 2.3324, - "step": 229300 - }, - { - "epoch": 0.4, - "learning_rate": 3.000554553793462e-05, - "loss": 2.3799, - "step": 229310 - }, - { - "epoch": 0.4, - "learning_rate": 3.0004673598007792e-05, - "loss": 2.3948, - "step": 229320 - }, - { - "epoch": 0.4, - "learning_rate": 3.0003801658080966e-05, - "loss": 2.536, - "step": 229330 - }, - { - "epoch": 0.4, - "learning_rate": 3.000292971815414e-05, - "loss": 2.4389, - "step": 229340 - }, - { - "epoch": 0.4, - "learning_rate": 3.000205777822731e-05, - "loss": 2.3748, - "step": 229350 - }, - { - "epoch": 0.4, - "learning_rate": 3.0001185838300487e-05, - "loss": 2.4577, - "step": 229360 - }, - { - "epoch": 0.4, - "learning_rate": 3.000031389837366e-05, - "loss": 2.4191, - "step": 229370 - }, - { - "epoch": 0.4, - "learning_rate": 2.9999441958446835e-05, - "loss": 2.4343, - "step": 229380 - }, - { - "epoch": 0.4, - "learning_rate": 2.9998570018520005e-05, - "loss": 2.3488, - "step": 229390 - }, - { - "epoch": 0.4, - "learning_rate": 2.999769807859318e-05, - "loss": 2.3078, - "step": 229400 - }, - { - "epoch": 0.4, - "learning_rate": 2.999682613866635e-05, - "loss": 2.4495, - "step": 229410 - }, - { - "epoch": 0.4, - "learning_rate": 2.9995954198739523e-05, - "loss": 2.335, - "step": 229420 - }, - { - "epoch": 0.4, - "learning_rate": 2.9995082258812697e-05, - "loss": 2.3768, - "step": 229430 - }, - { - "epoch": 0.4, - "learning_rate": 2.9994210318885874e-05, - "loss": 2.4947, - "step": 229440 - }, - { - "epoch": 0.4, - "learning_rate": 2.9993338378959048e-05, - "loss": 2.5406, - "step": 229450 - }, - { - "epoch": 0.4, - "learning_rate": 2.9992466439032218e-05, - "loss": 2.3812, - "step": 229460 - }, - { - "epoch": 0.4, - "learning_rate": 2.9991594499105392e-05, - "loss": 2.311, - "step": 229470 - }, - { - "epoch": 0.4, - "learning_rate": 2.9990722559178562e-05, - "loss": 2.3023, - "step": 229480 - }, - { - "epoch": 0.4, - "learning_rate": 2.9989850619251736e-05, - "loss": 2.3307, - "step": 229490 - }, - { - "epoch": 0.4, - "learning_rate": 2.998897867932491e-05, - "loss": 2.4229, - "step": 229500 - }, - { - "epoch": 0.4, - "learning_rate": 2.9988106739398087e-05, - "loss": 2.3977, - "step": 229510 - }, - { - "epoch": 0.4, - "learning_rate": 2.9987234799471257e-05, - "loss": 2.4633, - "step": 229520 - }, - { - "epoch": 0.4, - "learning_rate": 2.998636285954443e-05, - "loss": 2.3847, - "step": 229530 - }, - { - "epoch": 0.4, - "learning_rate": 2.9985490919617605e-05, - "loss": 2.3912, - "step": 229540 - }, - { - "epoch": 0.4, - "learning_rate": 2.9984618979690775e-05, - "loss": 2.4079, - "step": 229550 - }, - { - "epoch": 0.4, - "learning_rate": 2.998374703976395e-05, - "loss": 2.4619, - "step": 229560 - }, - { - "epoch": 0.4, - "learning_rate": 2.998287509983712e-05, - "loss": 2.3957, - "step": 229570 - }, - { - "epoch": 0.4, - "learning_rate": 2.9982003159910293e-05, - "loss": 2.5016, - "step": 229580 - }, - { - "epoch": 0.4, - "learning_rate": 2.998113121998347e-05, - "loss": 2.4016, - "step": 229590 - }, - { - "epoch": 0.4, - "learning_rate": 2.9980259280056644e-05, - "loss": 2.3767, - "step": 229600 - }, - { - "epoch": 0.4, - "learning_rate": 2.9979387340129818e-05, - "loss": 2.3527, - "step": 229610 - }, - { - "epoch": 0.4, - "learning_rate": 2.9978515400202988e-05, - "loss": 2.461, - "step": 229620 - }, - { - "epoch": 0.4, - "learning_rate": 2.9977643460276162e-05, - "loss": 2.391, - "step": 229630 - }, - { - "epoch": 0.4, - "learning_rate": 2.9976771520349332e-05, - "loss": 2.4068, - "step": 229640 - }, - { - "epoch": 0.4, - "learning_rate": 2.9975899580422506e-05, - "loss": 2.2723, - "step": 229650 - }, - { - "epoch": 0.4, - "learning_rate": 2.9975027640495683e-05, - "loss": 2.4809, - "step": 229660 - }, - { - "epoch": 0.4, - "learning_rate": 2.9974155700568857e-05, - "loss": 2.418, - "step": 229670 - }, - { - "epoch": 0.4, - "learning_rate": 2.9973283760642027e-05, - "loss": 2.4203, - "step": 229680 - }, - { - "epoch": 0.4, - "learning_rate": 2.99724118207152e-05, - "loss": 2.4684, - "step": 229690 - }, - { - "epoch": 0.4, - "learning_rate": 2.9971539880788375e-05, - "loss": 2.3469, - "step": 229700 - }, - { - "epoch": 0.4, - "learning_rate": 2.9970667940861545e-05, - "loss": 2.3692, - "step": 229710 - }, - { - "epoch": 0.4, - "learning_rate": 2.996979600093472e-05, - "loss": 2.4128, - "step": 229720 - }, - { - "epoch": 0.4, - "learning_rate": 2.9968924061007896e-05, - "loss": 2.3543, - "step": 229730 - }, - { - "epoch": 0.4, - "learning_rate": 2.996805212108107e-05, - "loss": 2.2687, - "step": 229740 - }, - { - "epoch": 0.4, - "learning_rate": 2.996718018115424e-05, - "loss": 2.5014, - "step": 229750 - }, - { - "epoch": 0.4, - "learning_rate": 2.9966308241227414e-05, - "loss": 2.4241, - "step": 229760 - }, - { - "epoch": 0.4, - "learning_rate": 2.9965436301300588e-05, - "loss": 2.3707, - "step": 229770 - }, - { - "epoch": 0.4, - "learning_rate": 2.996456436137376e-05, - "loss": 2.4863, - "step": 229780 - }, - { - "epoch": 0.4, - "learning_rate": 2.9963692421446932e-05, - "loss": 2.368, - "step": 229790 - }, - { - "epoch": 0.4, - "learning_rate": 2.9962820481520103e-05, - "loss": 2.3334, - "step": 229800 - }, - { - "epoch": 0.4, - "learning_rate": 2.9961948541593283e-05, - "loss": 2.3477, - "step": 229810 - }, - { - "epoch": 0.4, - "learning_rate": 2.9961076601666453e-05, - "loss": 2.3531, - "step": 229820 - }, - { - "epoch": 0.4, - "learning_rate": 2.9960204661739627e-05, - "loss": 2.41, - "step": 229830 - }, - { - "epoch": 0.4, - "learning_rate": 2.99593327218128e-05, - "loss": 2.3816, - "step": 229840 - }, - { - "epoch": 0.4, - "learning_rate": 2.995846078188597e-05, - "loss": 2.5305, - "step": 229850 - }, - { - "epoch": 0.4, - "learning_rate": 2.9957588841959145e-05, - "loss": 2.4658, - "step": 229860 - }, - { - "epoch": 0.4, - "learning_rate": 2.9956716902032316e-05, - "loss": 2.3685, - "step": 229870 - }, - { - "epoch": 0.4, - "learning_rate": 2.9955844962105496e-05, - "loss": 2.3428, - "step": 229880 - }, - { - "epoch": 0.4, - "learning_rate": 2.9954973022178666e-05, - "loss": 2.3708, - "step": 229890 - }, - { - "epoch": 0.4, - "learning_rate": 2.995410108225184e-05, - "loss": 2.3753, - "step": 229900 - }, - { - "epoch": 0.4, - "learning_rate": 2.995322914232501e-05, - "loss": 2.3653, - "step": 229910 - }, - { - "epoch": 0.4, - "learning_rate": 2.9952357202398184e-05, - "loss": 2.3553, - "step": 229920 - }, - { - "epoch": 0.4, - "learning_rate": 2.9951485262471358e-05, - "loss": 2.3571, - "step": 229930 - }, - { - "epoch": 0.4, - "learning_rate": 2.995061332254453e-05, - "loss": 2.3451, - "step": 229940 - }, - { - "epoch": 0.4, - "learning_rate": 2.9949741382617702e-05, - "loss": 2.4391, - "step": 229950 - }, - { - "epoch": 0.4, - "learning_rate": 2.994886944269088e-05, - "loss": 2.3115, - "step": 229960 - }, - { - "epoch": 0.4, - "learning_rate": 2.9947997502764053e-05, - "loss": 2.4255, - "step": 229970 - }, - { - "epoch": 0.4, - "learning_rate": 2.9947125562837224e-05, - "loss": 2.3074, - "step": 229980 - }, - { - "epoch": 0.4, - "learning_rate": 2.9946253622910397e-05, - "loss": 2.3355, - "step": 229990 - }, - { - "epoch": 0.4, - "learning_rate": 2.994538168298357e-05, - "loss": 2.4978, - "step": 230000 - }, - { - "epoch": 0.4, - "learning_rate": 2.994450974305674e-05, - "loss": 2.3777, - "step": 230010 - }, - { - "epoch": 0.4, - "learning_rate": 2.9943637803129915e-05, - "loss": 2.4549, - "step": 230020 - }, - { - "epoch": 0.4, - "learning_rate": 2.9942765863203092e-05, - "loss": 2.3007, - "step": 230030 - }, - { - "epoch": 0.4, - "learning_rate": 2.9941893923276266e-05, - "loss": 2.4542, - "step": 230040 - }, - { - "epoch": 0.4, - "learning_rate": 2.9941021983349437e-05, - "loss": 2.4662, - "step": 230050 - }, - { - "epoch": 0.4, - "learning_rate": 2.994015004342261e-05, - "loss": 2.2724, - "step": 230060 - }, - { - "epoch": 0.4, - "learning_rate": 2.9939278103495784e-05, - "loss": 2.3585, - "step": 230070 - }, - { - "epoch": 0.4, - "learning_rate": 2.9938406163568955e-05, - "loss": 2.5, - "step": 230080 - }, - { - "epoch": 0.4, - "learning_rate": 2.9937534223642128e-05, - "loss": 2.4529, - "step": 230090 - }, - { - "epoch": 0.4, - "learning_rate": 2.99366622837153e-05, - "loss": 2.3394, - "step": 230100 - }, - { - "epoch": 0.4, - "learning_rate": 2.993579034378848e-05, - "loss": 2.3968, - "step": 230110 - }, - { - "epoch": 0.4, - "learning_rate": 2.993491840386165e-05, - "loss": 2.3874, - "step": 230120 - }, - { - "epoch": 0.4, - "learning_rate": 2.9934046463934823e-05, - "loss": 2.323, - "step": 230130 - }, - { - "epoch": 0.4, - "learning_rate": 2.9933174524007994e-05, - "loss": 2.3708, - "step": 230140 - }, - { - "epoch": 0.4, - "learning_rate": 2.9932302584081168e-05, - "loss": 2.3648, - "step": 230150 - }, - { - "epoch": 0.4, - "learning_rate": 2.993143064415434e-05, - "loss": 2.3297, - "step": 230160 - }, - { - "epoch": 0.4, - "learning_rate": 2.993055870422751e-05, - "loss": 2.3563, - "step": 230170 - }, - { - "epoch": 0.4, - "learning_rate": 2.9929686764300692e-05, - "loss": 2.3346, - "step": 230180 - }, - { - "epoch": 0.4, - "learning_rate": 2.9928814824373863e-05, - "loss": 2.422, - "step": 230190 - }, - { - "epoch": 0.4, - "learning_rate": 2.9927942884447036e-05, - "loss": 2.3892, - "step": 230200 - }, - { - "epoch": 0.4, - "learning_rate": 2.9927070944520207e-05, - "loss": 2.3009, - "step": 230210 - }, - { - "epoch": 0.4, - "learning_rate": 2.992619900459338e-05, - "loss": 2.2901, - "step": 230220 - }, - { - "epoch": 0.4, - "learning_rate": 2.9925327064666554e-05, - "loss": 2.3236, - "step": 230230 - }, - { - "epoch": 0.4, - "learning_rate": 2.9924455124739725e-05, - "loss": 2.4039, - "step": 230240 - }, - { - "epoch": 0.4, - "learning_rate": 2.99235831848129e-05, - "loss": 2.4187, - "step": 230250 - }, - { - "epoch": 0.4, - "learning_rate": 2.9922711244886076e-05, - "loss": 2.3976, - "step": 230260 - }, - { - "epoch": 0.4, - "learning_rate": 2.992183930495925e-05, - "loss": 2.4796, - "step": 230270 - }, - { - "epoch": 0.4, - "learning_rate": 2.992096736503242e-05, - "loss": 2.4787, - "step": 230280 - }, - { - "epoch": 0.4, - "learning_rate": 2.9920095425105594e-05, - "loss": 2.3778, - "step": 230290 - }, - { - "epoch": 0.4, - "learning_rate": 2.9919223485178764e-05, - "loss": 2.3789, - "step": 230300 - }, - { - "epoch": 0.4, - "learning_rate": 2.9918351545251938e-05, - "loss": 2.4116, - "step": 230310 - }, - { - "epoch": 0.4, - "learning_rate": 2.991747960532511e-05, - "loss": 2.4378, - "step": 230320 - }, - { - "epoch": 0.4, - "learning_rate": 2.991660766539829e-05, - "loss": 2.3434, - "step": 230330 - }, - { - "epoch": 0.4, - "learning_rate": 2.9915735725471462e-05, - "loss": 2.3771, - "step": 230340 - }, - { - "epoch": 0.4, - "learning_rate": 2.9914863785544633e-05, - "loss": 2.4692, - "step": 230350 - }, - { - "epoch": 0.4, - "learning_rate": 2.9913991845617807e-05, - "loss": 2.3964, - "step": 230360 - }, - { - "epoch": 0.4, - "learning_rate": 2.9913119905690977e-05, - "loss": 2.4336, - "step": 230370 - }, - { - "epoch": 0.4, - "learning_rate": 2.991224796576415e-05, - "loss": 2.4879, - "step": 230380 - }, - { - "epoch": 0.4, - "learning_rate": 2.9911376025837324e-05, - "loss": 2.3746, - "step": 230390 - }, - { - "epoch": 0.4, - "learning_rate": 2.99105040859105e-05, - "loss": 2.3379, - "step": 230400 - }, - { - "epoch": 0.4, - "learning_rate": 2.9909632145983672e-05, - "loss": 2.321, - "step": 230410 - }, - { - "epoch": 0.4, - "learning_rate": 2.9908760206056846e-05, - "loss": 2.3469, - "step": 230420 - }, - { - "epoch": 0.4, - "learning_rate": 2.990788826613002e-05, - "loss": 2.2469, - "step": 230430 - }, - { - "epoch": 0.4, - "learning_rate": 2.990701632620319e-05, - "loss": 2.2498, - "step": 230440 - }, - { - "epoch": 0.4, - "learning_rate": 2.9906144386276364e-05, - "loss": 2.4172, - "step": 230450 - }, - { - "epoch": 0.4, - "learning_rate": 2.9905272446349537e-05, - "loss": 2.3781, - "step": 230460 - }, - { - "epoch": 0.4, - "learning_rate": 2.9904400506422708e-05, - "loss": 2.3695, - "step": 230470 - }, - { - "epoch": 0.4, - "learning_rate": 2.9903528566495885e-05, - "loss": 2.4668, - "step": 230480 - }, - { - "epoch": 0.4, - "learning_rate": 2.990265662656906e-05, - "loss": 2.3288, - "step": 230490 - }, - { - "epoch": 0.4, - "learning_rate": 2.9901784686642233e-05, - "loss": 2.3539, - "step": 230500 - }, - { - "epoch": 0.4, - "learning_rate": 2.9900912746715403e-05, - "loss": 2.5015, - "step": 230510 - }, - { - "epoch": 0.4, - "learning_rate": 2.9900040806788577e-05, - "loss": 2.4994, - "step": 230520 - }, - { - "epoch": 0.4, - "learning_rate": 2.9899168866861747e-05, - "loss": 2.3228, - "step": 230530 - }, - { - "epoch": 0.4, - "learning_rate": 2.989829692693492e-05, - "loss": 2.4102, - "step": 230540 - }, - { - "epoch": 0.4, - "learning_rate": 2.9897424987008098e-05, - "loss": 2.4166, - "step": 230550 - }, - { - "epoch": 0.4, - "learning_rate": 2.9896553047081272e-05, - "loss": 2.418, - "step": 230560 - }, - { - "epoch": 0.4, - "learning_rate": 2.9895681107154446e-05, - "loss": 2.4007, - "step": 230570 - }, - { - "epoch": 0.4, - "learning_rate": 2.9894809167227616e-05, - "loss": 2.525, - "step": 230580 - }, - { - "epoch": 0.4, - "learning_rate": 2.989393722730079e-05, - "loss": 2.4292, - "step": 230590 - }, - { - "epoch": 0.4, - "learning_rate": 2.989306528737396e-05, - "loss": 2.4097, - "step": 230600 - }, - { - "epoch": 0.4, - "learning_rate": 2.9892193347447134e-05, - "loss": 2.3473, - "step": 230610 - }, - { - "epoch": 0.4, - "learning_rate": 2.9891321407520308e-05, - "loss": 2.4169, - "step": 230620 - }, - { - "epoch": 0.4, - "learning_rate": 2.9890449467593485e-05, - "loss": 2.4131, - "step": 230630 - }, - { - "epoch": 0.4, - "learning_rate": 2.9889577527666655e-05, - "loss": 2.4808, - "step": 230640 - }, - { - "epoch": 0.4, - "learning_rate": 2.988870558773983e-05, - "loss": 2.3472, - "step": 230650 - }, - { - "epoch": 0.4, - "learning_rate": 2.9887833647813003e-05, - "loss": 2.4317, - "step": 230660 - }, - { - "epoch": 0.4, - "learning_rate": 2.9886961707886173e-05, - "loss": 2.3459, - "step": 230670 - }, - { - "epoch": 0.4, - "learning_rate": 2.9886089767959347e-05, - "loss": 2.361, - "step": 230680 - }, - { - "epoch": 0.4, - "learning_rate": 2.988521782803252e-05, - "loss": 2.352, - "step": 230690 - }, - { - "epoch": 0.4, - "learning_rate": 2.9884345888105698e-05, - "loss": 2.3951, - "step": 230700 - }, - { - "epoch": 0.4, - "learning_rate": 2.9883473948178868e-05, - "loss": 2.3896, - "step": 230710 - }, - { - "epoch": 0.4, - "learning_rate": 2.9882602008252042e-05, - "loss": 2.3925, - "step": 230720 - }, - { - "epoch": 0.4, - "learning_rate": 2.9881730068325216e-05, - "loss": 2.3478, - "step": 230730 - }, - { - "epoch": 0.4, - "learning_rate": 2.9880858128398386e-05, - "loss": 2.4617, - "step": 230740 - }, - { - "epoch": 0.4, - "learning_rate": 2.987998618847156e-05, - "loss": 2.4918, - "step": 230750 - }, - { - "epoch": 0.4, - "learning_rate": 2.987911424854473e-05, - "loss": 2.3397, - "step": 230760 - }, - { - "epoch": 0.4, - "learning_rate": 2.9878242308617904e-05, - "loss": 2.3214, - "step": 230770 - }, - { - "epoch": 0.4, - "learning_rate": 2.987737036869108e-05, - "loss": 2.3959, - "step": 230780 - }, - { - "epoch": 0.4, - "learning_rate": 2.9876498428764255e-05, - "loss": 2.5179, - "step": 230790 - }, - { - "epoch": 0.4, - "learning_rate": 2.987562648883743e-05, - "loss": 2.402, - "step": 230800 - }, - { - "epoch": 0.4, - "learning_rate": 2.98747545489106e-05, - "loss": 2.4268, - "step": 230810 - }, - { - "epoch": 0.4, - "learning_rate": 2.9873882608983773e-05, - "loss": 2.4338, - "step": 230820 - }, - { - "epoch": 0.4, - "learning_rate": 2.9873010669056943e-05, - "loss": 2.3373, - "step": 230830 - }, - { - "epoch": 0.4, - "learning_rate": 2.9872138729130117e-05, - "loss": 2.2227, - "step": 230840 - }, - { - "epoch": 0.4, - "learning_rate": 2.9871266789203294e-05, - "loss": 2.3839, - "step": 230850 - }, - { - "epoch": 0.4, - "learning_rate": 2.9870394849276468e-05, - "loss": 2.2575, - "step": 230860 - }, - { - "epoch": 0.4, - "learning_rate": 2.986952290934964e-05, - "loss": 2.5047, - "step": 230870 - }, - { - "epoch": 0.4, - "learning_rate": 2.9868650969422812e-05, - "loss": 2.4687, - "step": 230880 - }, - { - "epoch": 0.4, - "learning_rate": 2.9867779029495986e-05, - "loss": 2.445, - "step": 230890 - }, - { - "epoch": 0.4, - "learning_rate": 2.9866907089569156e-05, - "loss": 2.4922, - "step": 230900 - }, - { - "epoch": 0.4, - "learning_rate": 2.986603514964233e-05, - "loss": 2.4281, - "step": 230910 - }, - { - "epoch": 0.4, - "learning_rate": 2.9865163209715507e-05, - "loss": 2.3408, - "step": 230920 - }, - { - "epoch": 0.4, - "learning_rate": 2.986429126978868e-05, - "loss": 2.3552, - "step": 230930 - }, - { - "epoch": 0.4, - "learning_rate": 2.986341932986185e-05, - "loss": 2.5562, - "step": 230940 - }, - { - "epoch": 0.4, - "learning_rate": 2.9862547389935025e-05, - "loss": 2.299, - "step": 230950 - }, - { - "epoch": 0.4, - "learning_rate": 2.98616754500082e-05, - "loss": 2.357, - "step": 230960 - }, - { - "epoch": 0.4, - "learning_rate": 2.986080351008137e-05, - "loss": 2.4147, - "step": 230970 - }, - { - "epoch": 0.4, - "learning_rate": 2.9859931570154543e-05, - "loss": 2.4306, - "step": 230980 - }, - { - "epoch": 0.4, - "learning_rate": 2.9859059630227713e-05, - "loss": 2.4869, - "step": 230990 - }, - { - "epoch": 0.4, - "learning_rate": 2.9858187690300894e-05, - "loss": 2.4109, - "step": 231000 - }, - { - "epoch": 0.4, - "learning_rate": 2.9857315750374064e-05, - "loss": 2.391, - "step": 231010 - }, - { - "epoch": 0.4, - "learning_rate": 2.9856443810447238e-05, - "loss": 2.4216, - "step": 231020 - }, - { - "epoch": 0.4, - "learning_rate": 2.9855571870520412e-05, - "loss": 2.2887, - "step": 231030 - }, - { - "epoch": 0.4, - "learning_rate": 2.9854699930593582e-05, - "loss": 2.362, - "step": 231040 - }, - { - "epoch": 0.4, - "learning_rate": 2.9853827990666756e-05, - "loss": 2.4044, - "step": 231050 - }, - { - "epoch": 0.4, - "learning_rate": 2.9852956050739926e-05, - "loss": 2.3729, - "step": 231060 - }, - { - "epoch": 0.4, - "learning_rate": 2.9852084110813107e-05, - "loss": 2.3427, - "step": 231070 - }, - { - "epoch": 0.4, - "learning_rate": 2.9851212170886277e-05, - "loss": 2.3985, - "step": 231080 - }, - { - "epoch": 0.4, - "learning_rate": 2.985034023095945e-05, - "loss": 2.4428, - "step": 231090 - }, - { - "epoch": 0.4, - "learning_rate": 2.984946829103262e-05, - "loss": 2.357, - "step": 231100 - }, - { - "epoch": 0.4, - "learning_rate": 2.9848596351105795e-05, - "loss": 2.3619, - "step": 231110 - }, - { - "epoch": 0.4, - "learning_rate": 2.984772441117897e-05, - "loss": 2.3417, - "step": 231120 - }, - { - "epoch": 0.4, - "learning_rate": 2.984685247125214e-05, - "loss": 2.4973, - "step": 231130 - }, - { - "epoch": 0.4, - "learning_rate": 2.9845980531325313e-05, - "loss": 2.2356, - "step": 231140 - }, - { - "epoch": 0.4, - "learning_rate": 2.984510859139849e-05, - "loss": 2.4192, - "step": 231150 - }, - { - "epoch": 0.4, - "learning_rate": 2.9844236651471664e-05, - "loss": 2.3558, - "step": 231160 - }, - { - "epoch": 0.4, - "learning_rate": 2.9843364711544834e-05, - "loss": 2.3991, - "step": 231170 - }, - { - "epoch": 0.4, - "learning_rate": 2.9842492771618008e-05, - "loss": 2.3005, - "step": 231180 - }, - { - "epoch": 0.4, - "learning_rate": 2.9841620831691182e-05, - "loss": 2.3912, - "step": 231190 - }, - { - "epoch": 0.4, - "learning_rate": 2.9840748891764352e-05, - "loss": 2.4654, - "step": 231200 - }, - { - "epoch": 0.4, - "learning_rate": 2.9839876951837526e-05, - "loss": 2.4095, - "step": 231210 - }, - { - "epoch": 0.4, - "learning_rate": 2.9839005011910703e-05, - "loss": 2.4597, - "step": 231220 - }, - { - "epoch": 0.4, - "learning_rate": 2.9838133071983877e-05, - "loss": 2.2971, - "step": 231230 - }, - { - "epoch": 0.4, - "learning_rate": 2.9837261132057047e-05, - "loss": 2.3373, - "step": 231240 - }, - { - "epoch": 0.4, - "learning_rate": 2.983638919213022e-05, - "loss": 2.2804, - "step": 231250 - }, - { - "epoch": 0.4, - "learning_rate": 2.983551725220339e-05, - "loss": 2.3311, - "step": 231260 - }, - { - "epoch": 0.4, - "learning_rate": 2.9834645312276565e-05, - "loss": 2.4305, - "step": 231270 - }, - { - "epoch": 0.4, - "learning_rate": 2.983377337234974e-05, - "loss": 2.4089, - "step": 231280 - }, - { - "epoch": 0.4, - "learning_rate": 2.983290143242291e-05, - "loss": 2.4755, - "step": 231290 - }, - { - "epoch": 0.4, - "learning_rate": 2.983202949249609e-05, - "loss": 2.3235, - "step": 231300 - }, - { - "epoch": 0.4, - "learning_rate": 2.983115755256926e-05, - "loss": 2.3228, - "step": 231310 - }, - { - "epoch": 0.4, - "learning_rate": 2.9830285612642434e-05, - "loss": 2.4026, - "step": 231320 - }, - { - "epoch": 0.4, - "learning_rate": 2.9829413672715605e-05, - "loss": 2.5069, - "step": 231330 - }, - { - "epoch": 0.4, - "learning_rate": 2.982854173278878e-05, - "loss": 2.3467, - "step": 231340 - }, - { - "epoch": 0.4, - "learning_rate": 2.9827669792861952e-05, - "loss": 2.3507, - "step": 231350 - }, - { - "epoch": 0.4, - "learning_rate": 2.9826797852935123e-05, - "loss": 2.5256, - "step": 231360 - }, - { - "epoch": 0.4, - "learning_rate": 2.98259259130083e-05, - "loss": 2.4744, - "step": 231370 - }, - { - "epoch": 0.4, - "learning_rate": 2.9825053973081473e-05, - "loss": 2.4307, - "step": 231380 - }, - { - "epoch": 0.4, - "learning_rate": 2.9824182033154647e-05, - "loss": 2.4986, - "step": 231390 - }, - { - "epoch": 0.4, - "learning_rate": 2.9823310093227818e-05, - "loss": 2.4659, - "step": 231400 - }, - { - "epoch": 0.4, - "learning_rate": 2.982243815330099e-05, - "loss": 2.3549, - "step": 231410 - }, - { - "epoch": 0.4, - "learning_rate": 2.9821566213374165e-05, - "loss": 2.3863, - "step": 231420 - }, - { - "epoch": 0.4, - "learning_rate": 2.9820694273447336e-05, - "loss": 2.3983, - "step": 231430 - }, - { - "epoch": 0.4, - "learning_rate": 2.981982233352051e-05, - "loss": 2.3269, - "step": 231440 - }, - { - "epoch": 0.4, - "learning_rate": 2.9818950393593686e-05, - "loss": 2.351, - "step": 231450 - }, - { - "epoch": 0.4, - "learning_rate": 2.981807845366686e-05, - "loss": 2.3511, - "step": 231460 - }, - { - "epoch": 0.4, - "learning_rate": 2.981720651374003e-05, - "loss": 2.4358, - "step": 231470 - }, - { - "epoch": 0.4, - "learning_rate": 2.9816334573813204e-05, - "loss": 2.369, - "step": 231480 - }, - { - "epoch": 0.4, - "learning_rate": 2.9815462633886375e-05, - "loss": 2.5157, - "step": 231490 - }, - { - "epoch": 0.4, - "learning_rate": 2.981459069395955e-05, - "loss": 2.3762, - "step": 231500 - }, - { - "epoch": 0.4, - "learning_rate": 2.9813718754032722e-05, - "loss": 2.4582, - "step": 231510 - }, - { - "epoch": 0.4, - "learning_rate": 2.98128468141059e-05, - "loss": 2.3831, - "step": 231520 - }, - { - "epoch": 0.4, - "learning_rate": 2.9811974874179073e-05, - "loss": 2.4322, - "step": 231530 - }, - { - "epoch": 0.4, - "learning_rate": 2.9811102934252244e-05, - "loss": 2.2944, - "step": 231540 - }, - { - "epoch": 0.4, - "learning_rate": 2.9810230994325417e-05, - "loss": 2.4614, - "step": 231550 - }, - { - "epoch": 0.4, - "learning_rate": 2.9809359054398588e-05, - "loss": 2.4199, - "step": 231560 - }, - { - "epoch": 0.4, - "learning_rate": 2.980848711447176e-05, - "loss": 2.4346, - "step": 231570 - }, - { - "epoch": 0.4, - "learning_rate": 2.9807615174544935e-05, - "loss": 2.3539, - "step": 231580 - }, - { - "epoch": 0.4, - "learning_rate": 2.9806743234618112e-05, - "loss": 2.4582, - "step": 231590 - }, - { - "epoch": 0.4, - "learning_rate": 2.9805871294691283e-05, - "loss": 2.5053, - "step": 231600 - }, - { - "epoch": 0.4, - "learning_rate": 2.9804999354764457e-05, - "loss": 2.3914, - "step": 231610 - }, - { - "epoch": 0.4, - "learning_rate": 2.980412741483763e-05, - "loss": 2.3949, - "step": 231620 - }, - { - "epoch": 0.4, - "learning_rate": 2.98032554749108e-05, - "loss": 2.2505, - "step": 231630 - }, - { - "epoch": 0.4, - "learning_rate": 2.9802383534983975e-05, - "loss": 2.3573, - "step": 231640 - }, - { - "epoch": 0.4, - "learning_rate": 2.980151159505715e-05, - "loss": 2.3877, - "step": 231650 - }, - { - "epoch": 0.4, - "learning_rate": 2.980063965513032e-05, - "loss": 2.4372, - "step": 231660 - }, - { - "epoch": 0.4, - "learning_rate": 2.9799767715203496e-05, - "loss": 2.3378, - "step": 231670 - }, - { - "epoch": 0.4, - "learning_rate": 2.979889577527667e-05, - "loss": 2.3575, - "step": 231680 - }, - { - "epoch": 0.4, - "learning_rate": 2.9798023835349843e-05, - "loss": 2.3293, - "step": 231690 - }, - { - "epoch": 0.4, - "learning_rate": 2.9797151895423014e-05, - "loss": 2.4183, - "step": 231700 - }, - { - "epoch": 0.4, - "learning_rate": 2.9796279955496188e-05, - "loss": 2.2318, - "step": 231710 - }, - { - "epoch": 0.4, - "learning_rate": 2.9795408015569358e-05, - "loss": 2.3539, - "step": 231720 - }, - { - "epoch": 0.4, - "learning_rate": 2.9794536075642532e-05, - "loss": 2.405, - "step": 231730 - }, - { - "epoch": 0.4, - "learning_rate": 2.979366413571571e-05, - "loss": 2.3797, - "step": 231740 - }, - { - "epoch": 0.4, - "learning_rate": 2.9792792195788883e-05, - "loss": 2.4393, - "step": 231750 - }, - { - "epoch": 0.4, - "learning_rate": 2.9791920255862056e-05, - "loss": 2.5018, - "step": 231760 - }, - { - "epoch": 0.4, - "learning_rate": 2.9791048315935227e-05, - "loss": 2.4739, - "step": 231770 - }, - { - "epoch": 0.4, - "learning_rate": 2.97901763760084e-05, - "loss": 2.4121, - "step": 231780 - }, - { - "epoch": 0.4, - "learning_rate": 2.978930443608157e-05, - "loss": 2.4645, - "step": 231790 - }, - { - "epoch": 0.4, - "learning_rate": 2.9788432496154745e-05, - "loss": 2.3552, - "step": 231800 - }, - { - "epoch": 0.4, - "learning_rate": 2.978756055622792e-05, - "loss": 2.4189, - "step": 231810 - }, - { - "epoch": 0.4, - "learning_rate": 2.9786688616301096e-05, - "loss": 2.4269, - "step": 231820 - }, - { - "epoch": 0.4, - "learning_rate": 2.9785816676374266e-05, - "loss": 2.4539, - "step": 231830 - }, - { - "epoch": 0.4, - "learning_rate": 2.978494473644744e-05, - "loss": 2.3633, - "step": 231840 - }, - { - "epoch": 0.4, - "learning_rate": 2.9784072796520614e-05, - "loss": 2.4301, - "step": 231850 - }, - { - "epoch": 0.4, - "learning_rate": 2.9783200856593784e-05, - "loss": 2.2732, - "step": 231860 - }, - { - "epoch": 0.4, - "learning_rate": 2.9782328916666958e-05, - "loss": 2.3595, - "step": 231870 - }, - { - "epoch": 0.4, - "learning_rate": 2.9781456976740128e-05, - "loss": 2.2825, - "step": 231880 - }, - { - "epoch": 0.4, - "learning_rate": 2.978058503681331e-05, - "loss": 2.3809, - "step": 231890 - }, - { - "epoch": 0.4, - "learning_rate": 2.977971309688648e-05, - "loss": 2.39, - "step": 231900 - }, - { - "epoch": 0.4, - "learning_rate": 2.9778841156959653e-05, - "loss": 2.4304, - "step": 231910 - }, - { - "epoch": 0.4, - "learning_rate": 2.9777969217032827e-05, - "loss": 2.3699, - "step": 231920 - }, - { - "epoch": 0.4, - "learning_rate": 2.9777097277105997e-05, - "loss": 2.4104, - "step": 231930 - }, - { - "epoch": 0.4, - "learning_rate": 2.977622533717917e-05, - "loss": 2.4074, - "step": 231940 - }, - { - "epoch": 0.4, - "learning_rate": 2.977535339725234e-05, - "loss": 2.4415, - "step": 231950 - }, - { - "epoch": 0.4, - "learning_rate": 2.9774481457325515e-05, - "loss": 2.4815, - "step": 231960 - }, - { - "epoch": 0.4, - "learning_rate": 2.9773609517398692e-05, - "loss": 2.5069, - "step": 231970 - }, - { - "epoch": 0.4, - "learning_rate": 2.9772737577471866e-05, - "loss": 2.3322, - "step": 231980 - }, - { - "epoch": 0.4, - "learning_rate": 2.9771865637545036e-05, - "loss": 2.3969, - "step": 231990 - }, - { - "epoch": 0.4, - "learning_rate": 2.977099369761821e-05, - "loss": 2.4008, - "step": 232000 - }, - { - "epoch": 0.4, - "learning_rate": 2.9770121757691384e-05, - "loss": 2.3191, - "step": 232010 - }, - { - "epoch": 0.4, - "learning_rate": 2.9769249817764554e-05, - "loss": 2.4005, - "step": 232020 - }, - { - "epoch": 0.4, - "learning_rate": 2.9768377877837728e-05, - "loss": 2.3146, - "step": 232030 - }, - { - "epoch": 0.4, - "learning_rate": 2.9767505937910905e-05, - "loss": 2.3899, - "step": 232040 - }, - { - "epoch": 0.4, - "learning_rate": 2.976663399798408e-05, - "loss": 2.4567, - "step": 232050 - }, - { - "epoch": 0.4, - "learning_rate": 2.976576205805725e-05, - "loss": 2.4565, - "step": 232060 - }, - { - "epoch": 0.4, - "learning_rate": 2.9764890118130423e-05, - "loss": 2.3935, - "step": 232070 - }, - { - "epoch": 0.4, - "learning_rate": 2.9764018178203597e-05, - "loss": 2.4386, - "step": 232080 - }, - { - "epoch": 0.4, - "learning_rate": 2.9763146238276767e-05, - "loss": 2.3994, - "step": 232090 - }, - { - "epoch": 0.4, - "learning_rate": 2.976227429834994e-05, - "loss": 2.3637, - "step": 232100 - }, - { - "epoch": 0.4, - "learning_rate": 2.976140235842311e-05, - "loss": 2.4205, - "step": 232110 - }, - { - "epoch": 0.4, - "learning_rate": 2.9760530418496292e-05, - "loss": 2.4104, - "step": 232120 - }, - { - "epoch": 0.4, - "learning_rate": 2.9759658478569462e-05, - "loss": 2.3465, - "step": 232130 - }, - { - "epoch": 0.4, - "learning_rate": 2.9758786538642636e-05, - "loss": 2.4043, - "step": 232140 - }, - { - "epoch": 0.4, - "learning_rate": 2.975791459871581e-05, - "loss": 2.3848, - "step": 232150 - }, - { - "epoch": 0.4, - "learning_rate": 2.975704265878898e-05, - "loss": 2.3846, - "step": 232160 - }, - { - "epoch": 0.4, - "learning_rate": 2.9756170718862154e-05, - "loss": 2.4007, - "step": 232170 - }, - { - "epoch": 0.4, - "learning_rate": 2.9755298778935324e-05, - "loss": 2.2471, - "step": 232180 - }, - { - "epoch": 0.4, - "learning_rate": 2.9754426839008505e-05, - "loss": 2.3616, - "step": 232190 - }, - { - "epoch": 0.4, - "learning_rate": 2.9753554899081675e-05, - "loss": 2.3497, - "step": 232200 - }, - { - "epoch": 0.4, - "learning_rate": 2.975268295915485e-05, - "loss": 2.3027, - "step": 232210 - }, - { - "epoch": 0.4, - "learning_rate": 2.975181101922802e-05, - "loss": 2.3087, - "step": 232220 - }, - { - "epoch": 0.4, - "learning_rate": 2.9750939079301193e-05, - "loss": 2.4973, - "step": 232230 - }, - { - "epoch": 0.4, - "learning_rate": 2.9750067139374367e-05, - "loss": 2.3185, - "step": 232240 - }, - { - "epoch": 0.41, - "learning_rate": 2.9749195199447537e-05, - "loss": 2.3104, - "step": 232250 - }, - { - "epoch": 0.41, - "learning_rate": 2.9748323259520718e-05, - "loss": 2.3617, - "step": 232260 - }, - { - "epoch": 0.41, - "learning_rate": 2.9747451319593888e-05, - "loss": 2.3295, - "step": 232270 - }, - { - "epoch": 0.41, - "learning_rate": 2.9746579379667062e-05, - "loss": 2.3568, - "step": 232280 - }, - { - "epoch": 0.41, - "learning_rate": 2.9745707439740232e-05, - "loss": 2.4768, - "step": 232290 - }, - { - "epoch": 0.41, - "learning_rate": 2.9744835499813406e-05, - "loss": 2.4529, - "step": 232300 - }, - { - "epoch": 0.41, - "learning_rate": 2.974396355988658e-05, - "loss": 2.4966, - "step": 232310 - }, - { - "epoch": 0.41, - "learning_rate": 2.974309161995975e-05, - "loss": 2.3394, - "step": 232320 - }, - { - "epoch": 0.41, - "learning_rate": 2.9742219680032924e-05, - "loss": 2.3647, - "step": 232330 - }, - { - "epoch": 0.41, - "learning_rate": 2.97413477401061e-05, - "loss": 2.3572, - "step": 232340 - }, - { - "epoch": 0.41, - "learning_rate": 2.9740475800179275e-05, - "loss": 2.3668, - "step": 232350 - }, - { - "epoch": 0.41, - "learning_rate": 2.9739603860252445e-05, - "loss": 2.5187, - "step": 232360 - }, - { - "epoch": 0.41, - "learning_rate": 2.973873192032562e-05, - "loss": 2.4372, - "step": 232370 - }, - { - "epoch": 0.41, - "learning_rate": 2.9737859980398793e-05, - "loss": 2.3871, - "step": 232380 - }, - { - "epoch": 0.41, - "learning_rate": 2.9736988040471963e-05, - "loss": 2.3562, - "step": 232390 - }, - { - "epoch": 0.41, - "learning_rate": 2.9736116100545137e-05, - "loss": 2.3976, - "step": 232400 - }, - { - "epoch": 0.41, - "learning_rate": 2.9735244160618314e-05, - "loss": 2.4743, - "step": 232410 - }, - { - "epoch": 0.41, - "learning_rate": 2.9734372220691488e-05, - "loss": 2.4963, - "step": 232420 - }, - { - "epoch": 0.41, - "learning_rate": 2.973350028076466e-05, - "loss": 2.404, - "step": 232430 - }, - { - "epoch": 0.41, - "learning_rate": 2.9732628340837832e-05, - "loss": 2.5043, - "step": 232440 - }, - { - "epoch": 0.41, - "learning_rate": 2.9731756400911002e-05, - "loss": 2.3465, - "step": 232450 - }, - { - "epoch": 0.41, - "learning_rate": 2.9730884460984176e-05, - "loss": 2.4492, - "step": 232460 - }, - { - "epoch": 0.41, - "learning_rate": 2.973001252105735e-05, - "loss": 2.4737, - "step": 232470 - }, - { - "epoch": 0.41, - "learning_rate": 2.972914058113052e-05, - "loss": 2.4531, - "step": 232480 - }, - { - "epoch": 0.41, - "learning_rate": 2.97282686412037e-05, - "loss": 2.4255, - "step": 232490 - }, - { - "epoch": 0.41, - "learning_rate": 2.972739670127687e-05, - "loss": 2.4134, - "step": 232500 - }, - { - "epoch": 0.41, - "learning_rate": 2.9726524761350045e-05, - "loss": 2.4101, - "step": 232510 - }, - { - "epoch": 0.41, - "learning_rate": 2.9725652821423215e-05, - "loss": 2.4663, - "step": 232520 - }, - { - "epoch": 0.41, - "learning_rate": 2.972478088149639e-05, - "loss": 2.3292, - "step": 232530 - }, - { - "epoch": 0.41, - "learning_rate": 2.9723908941569563e-05, - "loss": 2.2617, - "step": 232540 - }, - { - "epoch": 0.41, - "learning_rate": 2.9723037001642733e-05, - "loss": 2.3854, - "step": 232550 - }, - { - "epoch": 0.41, - "learning_rate": 2.972216506171591e-05, - "loss": 2.3261, - "step": 232560 - }, - { - "epoch": 0.41, - "learning_rate": 2.9721293121789084e-05, - "loss": 2.3862, - "step": 232570 - }, - { - "epoch": 0.41, - "learning_rate": 2.9720421181862258e-05, - "loss": 2.4385, - "step": 232580 - }, - { - "epoch": 0.41, - "learning_rate": 2.971954924193543e-05, - "loss": 2.318, - "step": 232590 - }, - { - "epoch": 0.41, - "learning_rate": 2.9718677302008602e-05, - "loss": 2.3195, - "step": 232600 - }, - { - "epoch": 0.41, - "learning_rate": 2.9717805362081773e-05, - "loss": 2.3718, - "step": 232610 - }, - { - "epoch": 0.41, - "learning_rate": 2.9716933422154946e-05, - "loss": 2.3789, - "step": 232620 - }, - { - "epoch": 0.41, - "learning_rate": 2.971606148222812e-05, - "loss": 2.4465, - "step": 232630 - }, - { - "epoch": 0.41, - "learning_rate": 2.9715189542301297e-05, - "loss": 2.5131, - "step": 232640 - }, - { - "epoch": 0.41, - "learning_rate": 2.971431760237447e-05, - "loss": 2.4977, - "step": 232650 - }, - { - "epoch": 0.41, - "learning_rate": 2.971344566244764e-05, - "loss": 2.4002, - "step": 232660 - }, - { - "epoch": 0.41, - "learning_rate": 2.9712573722520815e-05, - "loss": 2.4592, - "step": 232670 - }, - { - "epoch": 0.41, - "learning_rate": 2.9711701782593986e-05, - "loss": 2.4945, - "step": 232680 - }, - { - "epoch": 0.41, - "learning_rate": 2.971082984266716e-05, - "loss": 2.3709, - "step": 232690 - }, - { - "epoch": 0.41, - "learning_rate": 2.9709957902740333e-05, - "loss": 2.4394, - "step": 232700 - }, - { - "epoch": 0.41, - "learning_rate": 2.970908596281351e-05, - "loss": 2.4716, - "step": 232710 - }, - { - "epoch": 0.41, - "learning_rate": 2.970821402288668e-05, - "loss": 2.4003, - "step": 232720 - }, - { - "epoch": 0.41, - "learning_rate": 2.9707342082959854e-05, - "loss": 2.4783, - "step": 232730 - }, - { - "epoch": 0.41, - "learning_rate": 2.9706470143033028e-05, - "loss": 2.34, - "step": 232740 - }, - { - "epoch": 0.41, - "learning_rate": 2.97055982031062e-05, - "loss": 2.3739, - "step": 232750 - }, - { - "epoch": 0.41, - "learning_rate": 2.9704726263179372e-05, - "loss": 2.4218, - "step": 232760 - }, - { - "epoch": 0.41, - "learning_rate": 2.9703854323252546e-05, - "loss": 2.4219, - "step": 232770 - }, - { - "epoch": 0.41, - "learning_rate": 2.9702982383325723e-05, - "loss": 2.5032, - "step": 232780 - }, - { - "epoch": 0.41, - "learning_rate": 2.9702110443398894e-05, - "loss": 2.225, - "step": 232790 - }, - { - "epoch": 0.41, - "learning_rate": 2.9701238503472067e-05, - "loss": 2.3975, - "step": 232800 - }, - { - "epoch": 0.41, - "learning_rate": 2.970036656354524e-05, - "loss": 2.4107, - "step": 232810 - }, - { - "epoch": 0.41, - "learning_rate": 2.969949462361841e-05, - "loss": 2.4141, - "step": 232820 - }, - { - "epoch": 0.41, - "learning_rate": 2.9698622683691585e-05, - "loss": 2.4452, - "step": 232830 - }, - { - "epoch": 0.41, - "learning_rate": 2.9697750743764756e-05, - "loss": 2.5351, - "step": 232840 - }, - { - "epoch": 0.41, - "learning_rate": 2.969687880383793e-05, - "loss": 2.2805, - "step": 232850 - }, - { - "epoch": 0.41, - "learning_rate": 2.9696006863911107e-05, - "loss": 2.4724, - "step": 232860 - }, - { - "epoch": 0.41, - "learning_rate": 2.969513492398428e-05, - "loss": 2.4018, - "step": 232870 - }, - { - "epoch": 0.41, - "learning_rate": 2.9694262984057454e-05, - "loss": 2.3756, - "step": 232880 - }, - { - "epoch": 0.41, - "learning_rate": 2.9693391044130625e-05, - "loss": 2.3385, - "step": 232890 - }, - { - "epoch": 0.41, - "learning_rate": 2.96925191042038e-05, - "loss": 2.3627, - "step": 232900 - }, - { - "epoch": 0.41, - "learning_rate": 2.969164716427697e-05, - "loss": 2.3977, - "step": 232910 - }, - { - "epoch": 0.41, - "learning_rate": 2.9690775224350143e-05, - "loss": 2.244, - "step": 232920 - }, - { - "epoch": 0.41, - "learning_rate": 2.968990328442332e-05, - "loss": 2.3146, - "step": 232930 - }, - { - "epoch": 0.41, - "learning_rate": 2.9689031344496493e-05, - "loss": 2.4781, - "step": 232940 - }, - { - "epoch": 0.41, - "learning_rate": 2.9688159404569664e-05, - "loss": 2.4355, - "step": 232950 - }, - { - "epoch": 0.41, - "learning_rate": 2.9687287464642838e-05, - "loss": 2.5337, - "step": 232960 - }, - { - "epoch": 0.41, - "learning_rate": 2.968641552471601e-05, - "loss": 2.4296, - "step": 232970 - }, - { - "epoch": 0.41, - "learning_rate": 2.9685543584789182e-05, - "loss": 2.3877, - "step": 232980 - }, - { - "epoch": 0.41, - "learning_rate": 2.9684671644862356e-05, - "loss": 2.3443, - "step": 232990 - }, - { - "epoch": 0.41, - "learning_rate": 2.968379970493553e-05, - "loss": 2.3289, - "step": 233000 - }, - { - "epoch": 0.41, - "learning_rate": 2.9682927765008706e-05, - "loss": 2.4002, - "step": 233010 - }, - { - "epoch": 0.41, - "learning_rate": 2.9682055825081877e-05, - "loss": 2.4719, - "step": 233020 - }, - { - "epoch": 0.41, - "learning_rate": 2.968118388515505e-05, - "loss": 2.3914, - "step": 233030 - }, - { - "epoch": 0.41, - "learning_rate": 2.9680311945228224e-05, - "loss": 2.5329, - "step": 233040 - }, - { - "epoch": 0.41, - "learning_rate": 2.9679440005301395e-05, - "loss": 2.4657, - "step": 233050 - }, - { - "epoch": 0.41, - "learning_rate": 2.967856806537457e-05, - "loss": 2.418, - "step": 233060 - }, - { - "epoch": 0.41, - "learning_rate": 2.967769612544774e-05, - "loss": 2.2901, - "step": 233070 - }, - { - "epoch": 0.41, - "learning_rate": 2.967682418552092e-05, - "loss": 2.3669, - "step": 233080 - }, - { - "epoch": 0.41, - "learning_rate": 2.967595224559409e-05, - "loss": 2.3624, - "step": 233090 - }, - { - "epoch": 0.41, - "learning_rate": 2.9675080305667264e-05, - "loss": 2.3629, - "step": 233100 - }, - { - "epoch": 0.41, - "learning_rate": 2.9674208365740437e-05, - "loss": 2.4021, - "step": 233110 - }, - { - "epoch": 0.41, - "learning_rate": 2.9673336425813608e-05, - "loss": 2.2978, - "step": 233120 - }, - { - "epoch": 0.41, - "learning_rate": 2.967246448588678e-05, - "loss": 2.453, - "step": 233130 - }, - { - "epoch": 0.41, - "learning_rate": 2.9671592545959952e-05, - "loss": 2.4268, - "step": 233140 - }, - { - "epoch": 0.41, - "learning_rate": 2.9670720606033126e-05, - "loss": 2.4048, - "step": 233150 - }, - { - "epoch": 0.41, - "learning_rate": 2.9669848666106303e-05, - "loss": 2.4796, - "step": 233160 - }, - { - "epoch": 0.41, - "learning_rate": 2.9668976726179477e-05, - "loss": 2.3157, - "step": 233170 - }, - { - "epoch": 0.41, - "learning_rate": 2.9668104786252647e-05, - "loss": 2.2492, - "step": 233180 - }, - { - "epoch": 0.41, - "learning_rate": 2.966723284632582e-05, - "loss": 2.4996, - "step": 233190 - }, - { - "epoch": 0.41, - "learning_rate": 2.9666360906398995e-05, - "loss": 2.3948, - "step": 233200 - }, - { - "epoch": 0.41, - "learning_rate": 2.9665488966472165e-05, - "loss": 2.4068, - "step": 233210 - }, - { - "epoch": 0.41, - "learning_rate": 2.966461702654534e-05, - "loss": 2.4175, - "step": 233220 - }, - { - "epoch": 0.41, - "learning_rate": 2.9663745086618516e-05, - "loss": 2.4709, - "step": 233230 - }, - { - "epoch": 0.41, - "learning_rate": 2.966287314669169e-05, - "loss": 2.3847, - "step": 233240 - }, - { - "epoch": 0.41, - "learning_rate": 2.966200120676486e-05, - "loss": 2.333, - "step": 233250 - }, - { - "epoch": 0.41, - "learning_rate": 2.9661129266838034e-05, - "loss": 2.4185, - "step": 233260 - }, - { - "epoch": 0.41, - "learning_rate": 2.9660257326911208e-05, - "loss": 2.4615, - "step": 233270 - }, - { - "epoch": 0.41, - "learning_rate": 2.9659385386984378e-05, - "loss": 2.347, - "step": 233280 - }, - { - "epoch": 0.41, - "learning_rate": 2.9658513447057552e-05, - "loss": 2.3577, - "step": 233290 - }, - { - "epoch": 0.41, - "learning_rate": 2.9657641507130722e-05, - "loss": 2.4092, - "step": 233300 - }, - { - "epoch": 0.41, - "learning_rate": 2.9656769567203903e-05, - "loss": 2.4222, - "step": 233310 - }, - { - "epoch": 0.41, - "learning_rate": 2.9655897627277073e-05, - "loss": 2.4685, - "step": 233320 - }, - { - "epoch": 0.41, - "learning_rate": 2.9655025687350247e-05, - "loss": 2.3828, - "step": 233330 - }, - { - "epoch": 0.41, - "learning_rate": 2.9654153747423417e-05, - "loss": 2.388, - "step": 233340 - }, - { - "epoch": 0.41, - "learning_rate": 2.965328180749659e-05, - "loss": 2.4207, - "step": 233350 - }, - { - "epoch": 0.41, - "learning_rate": 2.9652409867569765e-05, - "loss": 2.4461, - "step": 233360 - }, - { - "epoch": 0.41, - "learning_rate": 2.9651537927642935e-05, - "loss": 2.4066, - "step": 233370 - }, - { - "epoch": 0.41, - "learning_rate": 2.9650665987716116e-05, - "loss": 2.4639, - "step": 233380 - }, - { - "epoch": 0.41, - "learning_rate": 2.9649794047789286e-05, - "loss": 2.3624, - "step": 233390 - }, - { - "epoch": 0.41, - "learning_rate": 2.964892210786246e-05, - "loss": 2.4013, - "step": 233400 - }, - { - "epoch": 0.41, - "learning_rate": 2.964805016793563e-05, - "loss": 2.3587, - "step": 233410 - }, - { - "epoch": 0.41, - "learning_rate": 2.9647178228008804e-05, - "loss": 2.3012, - "step": 233420 - }, - { - "epoch": 0.41, - "learning_rate": 2.9646306288081978e-05, - "loss": 2.3997, - "step": 233430 - }, - { - "epoch": 0.41, - "learning_rate": 2.9645434348155148e-05, - "loss": 2.2657, - "step": 233440 - }, - { - "epoch": 0.41, - "learning_rate": 2.9644562408228325e-05, - "loss": 2.4237, - "step": 233450 - }, - { - "epoch": 0.41, - "learning_rate": 2.96436904683015e-05, - "loss": 2.4603, - "step": 233460 - }, - { - "epoch": 0.41, - "learning_rate": 2.9642818528374673e-05, - "loss": 2.3181, - "step": 233470 - }, - { - "epoch": 0.41, - "learning_rate": 2.9641946588447843e-05, - "loss": 2.3892, - "step": 233480 - }, - { - "epoch": 0.41, - "learning_rate": 2.9641074648521017e-05, - "loss": 2.3856, - "step": 233490 - }, - { - "epoch": 0.41, - "learning_rate": 2.964020270859419e-05, - "loss": 2.462, - "step": 233500 - }, - { - "epoch": 0.41, - "learning_rate": 2.963933076866736e-05, - "loss": 2.4495, - "step": 233510 - }, - { - "epoch": 0.41, - "learning_rate": 2.9638458828740535e-05, - "loss": 2.437, - "step": 233520 - }, - { - "epoch": 0.41, - "learning_rate": 2.9637586888813712e-05, - "loss": 2.3672, - "step": 233530 - }, - { - "epoch": 0.41, - "learning_rate": 2.9636714948886886e-05, - "loss": 2.4906, - "step": 233540 - }, - { - "epoch": 0.41, - "learning_rate": 2.9635843008960056e-05, - "loss": 2.318, - "step": 233550 - }, - { - "epoch": 0.41, - "learning_rate": 2.963497106903323e-05, - "loss": 2.451, - "step": 233560 - }, - { - "epoch": 0.41, - "learning_rate": 2.96340991291064e-05, - "loss": 2.336, - "step": 233570 - }, - { - "epoch": 0.41, - "learning_rate": 2.9633227189179574e-05, - "loss": 2.4885, - "step": 233580 - }, - { - "epoch": 0.41, - "learning_rate": 2.9632355249252748e-05, - "loss": 2.3822, - "step": 233590 - }, - { - "epoch": 0.41, - "learning_rate": 2.9631483309325925e-05, - "loss": 2.3679, - "step": 233600 - }, - { - "epoch": 0.41, - "learning_rate": 2.96306113693991e-05, - "loss": 2.2957, - "step": 233610 - }, - { - "epoch": 0.41, - "learning_rate": 2.962973942947227e-05, - "loss": 2.3134, - "step": 233620 - }, - { - "epoch": 0.41, - "learning_rate": 2.9628867489545443e-05, - "loss": 2.4471, - "step": 233630 - }, - { - "epoch": 0.41, - "learning_rate": 2.9627995549618613e-05, - "loss": 2.4624, - "step": 233640 - }, - { - "epoch": 0.41, - "learning_rate": 2.9627123609691787e-05, - "loss": 2.4666, - "step": 233650 - }, - { - "epoch": 0.41, - "learning_rate": 2.962625166976496e-05, - "loss": 2.3422, - "step": 233660 - }, - { - "epoch": 0.41, - "learning_rate": 2.962537972983813e-05, - "loss": 2.4098, - "step": 233670 - }, - { - "epoch": 0.41, - "learning_rate": 2.962450778991131e-05, - "loss": 2.399, - "step": 233680 - }, - { - "epoch": 0.41, - "learning_rate": 2.9623635849984482e-05, - "loss": 2.378, - "step": 233690 - }, - { - "epoch": 0.41, - "learning_rate": 2.9622763910057656e-05, - "loss": 2.3559, - "step": 233700 - }, - { - "epoch": 0.41, - "learning_rate": 2.9621891970130826e-05, - "loss": 2.421, - "step": 233710 - }, - { - "epoch": 0.41, - "learning_rate": 2.9621020030204e-05, - "loss": 2.473, - "step": 233720 - }, - { - "epoch": 0.41, - "learning_rate": 2.9620148090277174e-05, - "loss": 2.4666, - "step": 233730 - }, - { - "epoch": 0.41, - "learning_rate": 2.9619276150350344e-05, - "loss": 2.3793, - "step": 233740 - }, - { - "epoch": 0.41, - "learning_rate": 2.961840421042352e-05, - "loss": 2.2496, - "step": 233750 - }, - { - "epoch": 0.41, - "learning_rate": 2.9617532270496695e-05, - "loss": 2.3586, - "step": 233760 - }, - { - "epoch": 0.41, - "learning_rate": 2.961666033056987e-05, - "loss": 2.3318, - "step": 233770 - }, - { - "epoch": 0.41, - "learning_rate": 2.961578839064304e-05, - "loss": 2.3702, - "step": 233780 - }, - { - "epoch": 0.41, - "learning_rate": 2.9614916450716213e-05, - "loss": 2.3867, - "step": 233790 - }, - { - "epoch": 0.41, - "learning_rate": 2.9614044510789383e-05, - "loss": 2.4584, - "step": 233800 - }, - { - "epoch": 0.41, - "learning_rate": 2.9613172570862557e-05, - "loss": 2.5695, - "step": 233810 - }, - { - "epoch": 0.41, - "learning_rate": 2.961230063093573e-05, - "loss": 2.3707, - "step": 233820 - }, - { - "epoch": 0.41, - "learning_rate": 2.9611428691008908e-05, - "loss": 2.372, - "step": 233830 - }, - { - "epoch": 0.41, - "learning_rate": 2.9610556751082082e-05, - "loss": 2.3405, - "step": 233840 - }, - { - "epoch": 0.41, - "learning_rate": 2.9609684811155252e-05, - "loss": 2.429, - "step": 233850 - }, - { - "epoch": 0.41, - "learning_rate": 2.9608812871228426e-05, - "loss": 2.5022, - "step": 233860 - }, - { - "epoch": 0.41, - "learning_rate": 2.9607940931301596e-05, - "loss": 2.3545, - "step": 233870 - }, - { - "epoch": 0.41, - "learning_rate": 2.960706899137477e-05, - "loss": 2.3677, - "step": 233880 - }, - { - "epoch": 0.41, - "learning_rate": 2.9606197051447944e-05, - "loss": 2.3394, - "step": 233890 - }, - { - "epoch": 0.41, - "learning_rate": 2.960532511152112e-05, - "loss": 2.3345, - "step": 233900 - }, - { - "epoch": 0.41, - "learning_rate": 2.960445317159429e-05, - "loss": 2.2831, - "step": 233910 - }, - { - "epoch": 0.41, - "learning_rate": 2.9603581231667465e-05, - "loss": 2.2499, - "step": 233920 - }, - { - "epoch": 0.41, - "learning_rate": 2.960270929174064e-05, - "loss": 2.2572, - "step": 233930 - }, - { - "epoch": 0.41, - "learning_rate": 2.960183735181381e-05, - "loss": 2.3456, - "step": 233940 - }, - { - "epoch": 0.41, - "learning_rate": 2.9600965411886983e-05, - "loss": 2.3693, - "step": 233950 - }, - { - "epoch": 0.41, - "learning_rate": 2.9600093471960154e-05, - "loss": 2.4423, - "step": 233960 - }, - { - "epoch": 0.41, - "learning_rate": 2.9599221532033327e-05, - "loss": 2.3689, - "step": 233970 - }, - { - "epoch": 0.41, - "learning_rate": 2.9598349592106505e-05, - "loss": 2.4394, - "step": 233980 - }, - { - "epoch": 0.41, - "learning_rate": 2.959747765217968e-05, - "loss": 2.4189, - "step": 233990 - }, - { - "epoch": 0.41, - "learning_rate": 2.9596605712252852e-05, - "loss": 2.2991, - "step": 234000 - }, - { - "epoch": 0.41, - "learning_rate": 2.9595733772326022e-05, - "loss": 2.355, - "step": 234010 - }, - { - "epoch": 0.41, - "learning_rate": 2.9594861832399196e-05, - "loss": 2.3971, - "step": 234020 - }, - { - "epoch": 0.41, - "learning_rate": 2.9593989892472367e-05, - "loss": 2.3868, - "step": 234030 - }, - { - "epoch": 0.41, - "learning_rate": 2.959311795254554e-05, - "loss": 2.4157, - "step": 234040 - }, - { - "epoch": 0.41, - "learning_rate": 2.9592246012618718e-05, - "loss": 2.3994, - "step": 234050 - }, - { - "epoch": 0.41, - "learning_rate": 2.959137407269189e-05, - "loss": 2.4444, - "step": 234060 - }, - { - "epoch": 0.41, - "learning_rate": 2.9590502132765062e-05, - "loss": 2.3647, - "step": 234070 - }, - { - "epoch": 0.41, - "learning_rate": 2.9589630192838235e-05, - "loss": 2.4066, - "step": 234080 - }, - { - "epoch": 0.41, - "learning_rate": 2.958875825291141e-05, - "loss": 2.3599, - "step": 234090 - }, - { - "epoch": 0.41, - "learning_rate": 2.958788631298458e-05, - "loss": 2.4739, - "step": 234100 - }, - { - "epoch": 0.41, - "learning_rate": 2.9587014373057753e-05, - "loss": 2.5006, - "step": 234110 - }, - { - "epoch": 0.41, - "learning_rate": 2.958614243313093e-05, - "loss": 2.3361, - "step": 234120 - }, - { - "epoch": 0.41, - "learning_rate": 2.9585270493204104e-05, - "loss": 2.408, - "step": 234130 - }, - { - "epoch": 0.41, - "learning_rate": 2.9584398553277275e-05, - "loss": 2.2921, - "step": 234140 - }, - { - "epoch": 0.41, - "learning_rate": 2.958352661335045e-05, - "loss": 2.3878, - "step": 234150 - }, - { - "epoch": 0.41, - "learning_rate": 2.9582654673423622e-05, - "loss": 2.4109, - "step": 234160 - }, - { - "epoch": 0.41, - "learning_rate": 2.9581782733496793e-05, - "loss": 2.3528, - "step": 234170 - }, - { - "epoch": 0.41, - "learning_rate": 2.9580910793569966e-05, - "loss": 2.3969, - "step": 234180 - }, - { - "epoch": 0.41, - "learning_rate": 2.9580038853643137e-05, - "loss": 2.4039, - "step": 234190 - }, - { - "epoch": 0.41, - "learning_rate": 2.9579166913716317e-05, - "loss": 2.4285, - "step": 234200 - }, - { - "epoch": 0.41, - "learning_rate": 2.9578294973789488e-05, - "loss": 2.2862, - "step": 234210 - }, - { - "epoch": 0.41, - "learning_rate": 2.957742303386266e-05, - "loss": 2.3507, - "step": 234220 - }, - { - "epoch": 0.41, - "learning_rate": 2.9576551093935835e-05, - "loss": 2.4598, - "step": 234230 - }, - { - "epoch": 0.41, - "learning_rate": 2.9575679154009006e-05, - "loss": 2.3721, - "step": 234240 - }, - { - "epoch": 0.41, - "learning_rate": 2.957480721408218e-05, - "loss": 2.3358, - "step": 234250 - }, - { - "epoch": 0.41, - "learning_rate": 2.957393527415535e-05, - "loss": 2.3672, - "step": 234260 - }, - { - "epoch": 0.41, - "learning_rate": 2.957306333422853e-05, - "loss": 2.4097, - "step": 234270 - }, - { - "epoch": 0.41, - "learning_rate": 2.95721913943017e-05, - "loss": 2.452, - "step": 234280 - }, - { - "epoch": 0.41, - "learning_rate": 2.9571319454374874e-05, - "loss": 2.3986, - "step": 234290 - }, - { - "epoch": 0.41, - "learning_rate": 2.9570447514448045e-05, - "loss": 2.3206, - "step": 234300 - }, - { - "epoch": 0.41, - "learning_rate": 2.956957557452122e-05, - "loss": 2.3782, - "step": 234310 - }, - { - "epoch": 0.41, - "learning_rate": 2.9568703634594392e-05, - "loss": 2.3263, - "step": 234320 - }, - { - "epoch": 0.41, - "learning_rate": 2.9567831694667563e-05, - "loss": 2.3769, - "step": 234330 - }, - { - "epoch": 0.41, - "learning_rate": 2.9566959754740737e-05, - "loss": 2.2547, - "step": 234340 - }, - { - "epoch": 0.41, - "learning_rate": 2.9566087814813914e-05, - "loss": 2.4158, - "step": 234350 - }, - { - "epoch": 0.41, - "learning_rate": 2.9565215874887087e-05, - "loss": 2.4831, - "step": 234360 - }, - { - "epoch": 0.41, - "learning_rate": 2.9564343934960258e-05, - "loss": 2.4046, - "step": 234370 - }, - { - "epoch": 0.41, - "learning_rate": 2.956347199503343e-05, - "loss": 2.476, - "step": 234380 - }, - { - "epoch": 0.41, - "learning_rate": 2.9562600055106605e-05, - "loss": 2.4372, - "step": 234390 - }, - { - "epoch": 0.41, - "learning_rate": 2.9561728115179776e-05, - "loss": 2.4252, - "step": 234400 - }, - { - "epoch": 0.41, - "learning_rate": 2.956085617525295e-05, - "loss": 2.3569, - "step": 234410 - }, - { - "epoch": 0.41, - "learning_rate": 2.9559984235326127e-05, - "loss": 2.3998, - "step": 234420 - }, - { - "epoch": 0.41, - "learning_rate": 2.95591122953993e-05, - "loss": 2.3969, - "step": 234430 - }, - { - "epoch": 0.41, - "learning_rate": 2.955824035547247e-05, - "loss": 2.4176, - "step": 234440 - }, - { - "epoch": 0.41, - "learning_rate": 2.9557368415545645e-05, - "loss": 2.3537, - "step": 234450 - }, - { - "epoch": 0.41, - "learning_rate": 2.955649647561882e-05, - "loss": 2.401, - "step": 234460 - }, - { - "epoch": 0.41, - "learning_rate": 2.955562453569199e-05, - "loss": 2.4148, - "step": 234470 - }, - { - "epoch": 0.41, - "learning_rate": 2.9554752595765163e-05, - "loss": 2.3824, - "step": 234480 - }, - { - "epoch": 0.41, - "learning_rate": 2.9553880655838333e-05, - "loss": 2.4048, - "step": 234490 - }, - { - "epoch": 0.41, - "learning_rate": 2.9553008715911513e-05, - "loss": 2.4588, - "step": 234500 - }, - { - "epoch": 0.41, - "learning_rate": 2.9552136775984684e-05, - "loss": 2.4158, - "step": 234510 - }, - { - "epoch": 0.41, - "learning_rate": 2.9551264836057858e-05, - "loss": 2.3219, - "step": 234520 - }, - { - "epoch": 0.41, - "learning_rate": 2.9550392896131028e-05, - "loss": 2.52, - "step": 234530 - }, - { - "epoch": 0.41, - "learning_rate": 2.9549520956204202e-05, - "loss": 2.4422, - "step": 234540 - }, - { - "epoch": 0.41, - "learning_rate": 2.9548649016277376e-05, - "loss": 2.3634, - "step": 234550 - }, - { - "epoch": 0.41, - "learning_rate": 2.9547777076350546e-05, - "loss": 2.4873, - "step": 234560 - }, - { - "epoch": 0.41, - "learning_rate": 2.9546905136423726e-05, - "loss": 2.4685, - "step": 234570 - }, - { - "epoch": 0.41, - "learning_rate": 2.9546033196496897e-05, - "loss": 2.4227, - "step": 234580 - }, - { - "epoch": 0.41, - "learning_rate": 2.954516125657007e-05, - "loss": 2.3557, - "step": 234590 - }, - { - "epoch": 0.41, - "learning_rate": 2.954428931664324e-05, - "loss": 2.3568, - "step": 234600 - }, - { - "epoch": 0.41, - "learning_rate": 2.9543417376716415e-05, - "loss": 2.3512, - "step": 234610 - }, - { - "epoch": 0.41, - "learning_rate": 2.954254543678959e-05, - "loss": 2.3824, - "step": 234620 - }, - { - "epoch": 0.41, - "learning_rate": 2.954167349686276e-05, - "loss": 2.3547, - "step": 234630 - }, - { - "epoch": 0.41, - "learning_rate": 2.9540801556935933e-05, - "loss": 2.483, - "step": 234640 - }, - { - "epoch": 0.41, - "learning_rate": 2.953992961700911e-05, - "loss": 2.4763, - "step": 234650 - }, - { - "epoch": 0.41, - "learning_rate": 2.9539057677082284e-05, - "loss": 2.3554, - "step": 234660 - }, - { - "epoch": 0.41, - "learning_rate": 2.9538185737155454e-05, - "loss": 2.4865, - "step": 234670 - }, - { - "epoch": 0.41, - "learning_rate": 2.9537313797228628e-05, - "loss": 2.3278, - "step": 234680 - }, - { - "epoch": 0.41, - "learning_rate": 2.9536441857301798e-05, - "loss": 2.3791, - "step": 234690 - }, - { - "epoch": 0.41, - "learning_rate": 2.9535569917374972e-05, - "loss": 2.2929, - "step": 234700 - }, - { - "epoch": 0.41, - "learning_rate": 2.9534697977448146e-05, - "loss": 2.441, - "step": 234710 - }, - { - "epoch": 0.41, - "learning_rate": 2.9533826037521323e-05, - "loss": 2.4053, - "step": 234720 - }, - { - "epoch": 0.41, - "learning_rate": 2.9532954097594497e-05, - "loss": 2.3983, - "step": 234730 - }, - { - "epoch": 0.41, - "learning_rate": 2.9532082157667667e-05, - "loss": 2.5164, - "step": 234740 - }, - { - "epoch": 0.41, - "learning_rate": 2.953121021774084e-05, - "loss": 2.3957, - "step": 234750 - }, - { - "epoch": 0.41, - "learning_rate": 2.953033827781401e-05, - "loss": 2.2731, - "step": 234760 - }, - { - "epoch": 0.41, - "learning_rate": 2.9529466337887185e-05, - "loss": 2.4944, - "step": 234770 - }, - { - "epoch": 0.41, - "learning_rate": 2.952859439796036e-05, - "loss": 2.2288, - "step": 234780 - }, - { - "epoch": 0.41, - "learning_rate": 2.9527722458033536e-05, - "loss": 2.3233, - "step": 234790 - }, - { - "epoch": 0.41, - "learning_rate": 2.9526850518106706e-05, - "loss": 2.3926, - "step": 234800 - }, - { - "epoch": 0.41, - "learning_rate": 2.952597857817988e-05, - "loss": 2.255, - "step": 234810 - }, - { - "epoch": 0.41, - "learning_rate": 2.9525106638253054e-05, - "loss": 2.423, - "step": 234820 - }, - { - "epoch": 0.41, - "learning_rate": 2.9524234698326224e-05, - "loss": 2.4449, - "step": 234830 - }, - { - "epoch": 0.41, - "learning_rate": 2.9523362758399398e-05, - "loss": 2.32, - "step": 234840 - }, - { - "epoch": 0.41, - "learning_rate": 2.9522490818472572e-05, - "loss": 2.3395, - "step": 234850 - }, - { - "epoch": 0.41, - "learning_rate": 2.9521618878545742e-05, - "loss": 2.4355, - "step": 234860 - }, - { - "epoch": 0.41, - "learning_rate": 2.952074693861892e-05, - "loss": 2.3701, - "step": 234870 - }, - { - "epoch": 0.41, - "learning_rate": 2.9519874998692093e-05, - "loss": 2.2632, - "step": 234880 - }, - { - "epoch": 0.41, - "learning_rate": 2.9519003058765267e-05, - "loss": 2.4041, - "step": 234890 - }, - { - "epoch": 0.41, - "learning_rate": 2.9518131118838437e-05, - "loss": 2.3449, - "step": 234900 - }, - { - "epoch": 0.41, - "learning_rate": 2.951725917891161e-05, - "loss": 2.4732, - "step": 234910 - }, - { - "epoch": 0.41, - "learning_rate": 2.951638723898478e-05, - "loss": 2.3266, - "step": 234920 - }, - { - "epoch": 0.41, - "learning_rate": 2.9515515299057955e-05, - "loss": 2.421, - "step": 234930 - }, - { - "epoch": 0.41, - "learning_rate": 2.9514643359131132e-05, - "loss": 2.2991, - "step": 234940 - }, - { - "epoch": 0.41, - "learning_rate": 2.9513771419204306e-05, - "loss": 2.3633, - "step": 234950 - }, - { - "epoch": 0.41, - "learning_rate": 2.951289947927748e-05, - "loss": 2.4084, - "step": 234960 - }, - { - "epoch": 0.41, - "learning_rate": 2.951202753935065e-05, - "loss": 2.325, - "step": 234970 - }, - { - "epoch": 0.41, - "learning_rate": 2.9511155599423824e-05, - "loss": 2.4805, - "step": 234980 - }, - { - "epoch": 0.41, - "learning_rate": 2.9510283659496994e-05, - "loss": 2.33, - "step": 234990 - }, - { - "epoch": 0.41, - "learning_rate": 2.9509411719570168e-05, - "loss": 2.4136, - "step": 235000 - }, - { - "epoch": 0.41, - "learning_rate": 2.9508539779643342e-05, - "loss": 2.4063, - "step": 235010 - }, - { - "epoch": 0.41, - "learning_rate": 2.950766783971652e-05, - "loss": 2.3702, - "step": 235020 - }, - { - "epoch": 0.41, - "learning_rate": 2.950679589978969e-05, - "loss": 2.4129, - "step": 235030 - }, - { - "epoch": 0.41, - "learning_rate": 2.9505923959862863e-05, - "loss": 2.3539, - "step": 235040 - }, - { - "epoch": 0.41, - "learning_rate": 2.9505052019936037e-05, - "loss": 2.4322, - "step": 235050 - }, - { - "epoch": 0.41, - "learning_rate": 2.9504180080009207e-05, - "loss": 2.3004, - "step": 235060 - }, - { - "epoch": 0.41, - "learning_rate": 2.950330814008238e-05, - "loss": 2.2658, - "step": 235070 - }, - { - "epoch": 0.41, - "learning_rate": 2.9502436200155555e-05, - "loss": 2.3656, - "step": 235080 - }, - { - "epoch": 0.41, - "learning_rate": 2.9501564260228732e-05, - "loss": 2.3173, - "step": 235090 - }, - { - "epoch": 0.41, - "learning_rate": 2.9500692320301902e-05, - "loss": 2.3968, - "step": 235100 - }, - { - "epoch": 0.41, - "learning_rate": 2.9499820380375076e-05, - "loss": 2.3676, - "step": 235110 - }, - { - "epoch": 0.41, - "learning_rate": 2.949894844044825e-05, - "loss": 2.3349, - "step": 235120 - }, - { - "epoch": 0.41, - "learning_rate": 2.949807650052142e-05, - "loss": 2.42, - "step": 235130 - }, - { - "epoch": 0.41, - "learning_rate": 2.9497204560594594e-05, - "loss": 2.4713, - "step": 235140 - }, - { - "epoch": 0.41, - "learning_rate": 2.9496332620667764e-05, - "loss": 2.4617, - "step": 235150 - }, - { - "epoch": 0.41, - "learning_rate": 2.9495460680740938e-05, - "loss": 2.3466, - "step": 235160 - }, - { - "epoch": 0.41, - "learning_rate": 2.9494588740814115e-05, - "loss": 2.3872, - "step": 235170 - }, - { - "epoch": 0.41, - "learning_rate": 2.949371680088729e-05, - "loss": 2.6229, - "step": 235180 - }, - { - "epoch": 0.41, - "learning_rate": 2.9492844860960463e-05, - "loss": 2.5272, - "step": 235190 - }, - { - "epoch": 0.41, - "learning_rate": 2.9491972921033633e-05, - "loss": 2.4356, - "step": 235200 - }, - { - "epoch": 0.41, - "learning_rate": 2.9491100981106807e-05, - "loss": 2.4239, - "step": 235210 - }, - { - "epoch": 0.41, - "learning_rate": 2.9490229041179977e-05, - "loss": 2.2739, - "step": 235220 - }, - { - "epoch": 0.41, - "learning_rate": 2.948935710125315e-05, - "loss": 2.3398, - "step": 235230 - }, - { - "epoch": 0.41, - "learning_rate": 2.948848516132633e-05, - "loss": 2.4946, - "step": 235240 - }, - { - "epoch": 0.41, - "learning_rate": 2.9487613221399502e-05, - "loss": 2.3601, - "step": 235250 - }, - { - "epoch": 0.41, - "learning_rate": 2.9486741281472673e-05, - "loss": 2.4343, - "step": 235260 - }, - { - "epoch": 0.41, - "learning_rate": 2.9485869341545846e-05, - "loss": 2.43, - "step": 235270 - }, - { - "epoch": 0.41, - "learning_rate": 2.948499740161902e-05, - "loss": 2.3123, - "step": 235280 - }, - { - "epoch": 0.41, - "learning_rate": 2.948412546169219e-05, - "loss": 2.4382, - "step": 235290 - }, - { - "epoch": 0.41, - "learning_rate": 2.9483253521765364e-05, - "loss": 2.3458, - "step": 235300 - }, - { - "epoch": 0.41, - "learning_rate": 2.948238158183854e-05, - "loss": 2.4602, - "step": 235310 - }, - { - "epoch": 0.41, - "learning_rate": 2.9481509641911715e-05, - "loss": 2.3824, - "step": 235320 - }, - { - "epoch": 0.41, - "learning_rate": 2.9480637701984886e-05, - "loss": 2.3487, - "step": 235330 - }, - { - "epoch": 0.41, - "learning_rate": 2.947976576205806e-05, - "loss": 2.3962, - "step": 235340 - }, - { - "epoch": 0.41, - "learning_rate": 2.9478893822131233e-05, - "loss": 2.4352, - "step": 235350 - }, - { - "epoch": 0.41, - "learning_rate": 2.9478021882204403e-05, - "loss": 2.3684, - "step": 235360 - }, - { - "epoch": 0.41, - "learning_rate": 2.9477149942277577e-05, - "loss": 2.4329, - "step": 235370 - }, - { - "epoch": 0.41, - "learning_rate": 2.9476278002350748e-05, - "loss": 2.2928, - "step": 235380 - }, - { - "epoch": 0.41, - "learning_rate": 2.9475406062423928e-05, - "loss": 2.4479, - "step": 235390 - }, - { - "epoch": 0.41, - "learning_rate": 2.94745341224971e-05, - "loss": 2.457, - "step": 235400 - }, - { - "epoch": 0.41, - "learning_rate": 2.9473662182570272e-05, - "loss": 2.3817, - "step": 235410 - }, - { - "epoch": 0.41, - "learning_rate": 2.9472790242643443e-05, - "loss": 2.5211, - "step": 235420 - }, - { - "epoch": 0.41, - "learning_rate": 2.9471918302716617e-05, - "loss": 2.4398, - "step": 235430 - }, - { - "epoch": 0.41, - "learning_rate": 2.947104636278979e-05, - "loss": 2.375, - "step": 235440 - }, - { - "epoch": 0.41, - "learning_rate": 2.947017442286296e-05, - "loss": 2.5181, - "step": 235450 - }, - { - "epoch": 0.41, - "learning_rate": 2.946930248293614e-05, - "loss": 2.47, - "step": 235460 - }, - { - "epoch": 0.41, - "learning_rate": 2.946843054300931e-05, - "loss": 2.3759, - "step": 235470 - }, - { - "epoch": 0.41, - "learning_rate": 2.9467558603082485e-05, - "loss": 2.4283, - "step": 235480 - }, - { - "epoch": 0.41, - "learning_rate": 2.9466686663155656e-05, - "loss": 2.4469, - "step": 235490 - }, - { - "epoch": 0.41, - "learning_rate": 2.946581472322883e-05, - "loss": 2.3151, - "step": 235500 - }, - { - "epoch": 0.41, - "learning_rate": 2.9464942783302003e-05, - "loss": 2.3652, - "step": 235510 - }, - { - "epoch": 0.41, - "learning_rate": 2.9464070843375174e-05, - "loss": 2.3782, - "step": 235520 - }, - { - "epoch": 0.41, - "learning_rate": 2.9463198903448347e-05, - "loss": 2.4485, - "step": 235530 - }, - { - "epoch": 0.41, - "learning_rate": 2.9462326963521525e-05, - "loss": 2.3142, - "step": 235540 - }, - { - "epoch": 0.41, - "learning_rate": 2.94614550235947e-05, - "loss": 2.2824, - "step": 235550 - }, - { - "epoch": 0.41, - "learning_rate": 2.946058308366787e-05, - "loss": 2.4601, - "step": 235560 - }, - { - "epoch": 0.41, - "learning_rate": 2.9459711143741043e-05, - "loss": 2.2625, - "step": 235570 - }, - { - "epoch": 0.41, - "learning_rate": 2.9458839203814216e-05, - "loss": 2.4156, - "step": 235580 - }, - { - "epoch": 0.41, - "learning_rate": 2.9457967263887387e-05, - "loss": 2.3631, - "step": 235590 - }, - { - "epoch": 0.41, - "learning_rate": 2.945709532396056e-05, - "loss": 2.3686, - "step": 235600 - }, - { - "epoch": 0.41, - "learning_rate": 2.9456223384033738e-05, - "loss": 2.2936, - "step": 235610 - }, - { - "epoch": 0.41, - "learning_rate": 2.945535144410691e-05, - "loss": 2.3095, - "step": 235620 - }, - { - "epoch": 0.41, - "learning_rate": 2.9454479504180082e-05, - "loss": 2.2928, - "step": 235630 - }, - { - "epoch": 0.41, - "learning_rate": 2.9453607564253256e-05, - "loss": 2.4402, - "step": 235640 - }, - { - "epoch": 0.41, - "learning_rate": 2.9452735624326426e-05, - "loss": 2.4739, - "step": 235650 - }, - { - "epoch": 0.41, - "learning_rate": 2.94518636843996e-05, - "loss": 2.5571, - "step": 235660 - }, - { - "epoch": 0.41, - "learning_rate": 2.9450991744472773e-05, - "loss": 2.2897, - "step": 235670 - }, - { - "epoch": 0.41, - "learning_rate": 2.9450119804545944e-05, - "loss": 2.4955, - "step": 235680 - }, - { - "epoch": 0.41, - "learning_rate": 2.9449247864619124e-05, - "loss": 2.3325, - "step": 235690 - }, - { - "epoch": 0.41, - "learning_rate": 2.9448375924692295e-05, - "loss": 2.5032, - "step": 235700 - }, - { - "epoch": 0.41, - "learning_rate": 2.944750398476547e-05, - "loss": 2.3842, - "step": 235710 - }, - { - "epoch": 0.41, - "learning_rate": 2.944663204483864e-05, - "loss": 2.3237, - "step": 235720 - }, - { - "epoch": 0.41, - "learning_rate": 2.9445760104911813e-05, - "loss": 2.3979, - "step": 235730 - }, - { - "epoch": 0.41, - "learning_rate": 2.9444888164984986e-05, - "loss": 2.3975, - "step": 235740 - }, - { - "epoch": 0.41, - "learning_rate": 2.9444016225058157e-05, - "loss": 2.4317, - "step": 235750 - }, - { - "epoch": 0.41, - "learning_rate": 2.9443144285131334e-05, - "loss": 2.2487, - "step": 235760 - }, - { - "epoch": 0.41, - "learning_rate": 2.9442272345204508e-05, - "loss": 2.4143, - "step": 235770 - }, - { - "epoch": 0.41, - "learning_rate": 2.944140040527768e-05, - "loss": 2.4529, - "step": 235780 - }, - { - "epoch": 0.41, - "learning_rate": 2.9440528465350852e-05, - "loss": 2.3522, - "step": 235790 - }, - { - "epoch": 0.41, - "learning_rate": 2.9439656525424026e-05, - "loss": 2.4838, - "step": 235800 - }, - { - "epoch": 0.41, - "learning_rate": 2.94387845854972e-05, - "loss": 2.3905, - "step": 235810 - }, - { - "epoch": 0.41, - "learning_rate": 2.943791264557037e-05, - "loss": 2.3377, - "step": 235820 - }, - { - "epoch": 0.41, - "learning_rate": 2.9437040705643544e-05, - "loss": 2.3223, - "step": 235830 - }, - { - "epoch": 0.41, - "learning_rate": 2.943616876571672e-05, - "loss": 2.3337, - "step": 235840 - }, - { - "epoch": 0.41, - "learning_rate": 2.9435296825789895e-05, - "loss": 2.3394, - "step": 235850 - }, - { - "epoch": 0.41, - "learning_rate": 2.9434424885863065e-05, - "loss": 2.4904, - "step": 235860 - }, - { - "epoch": 0.41, - "learning_rate": 2.943355294593624e-05, - "loss": 2.4398, - "step": 235870 - }, - { - "epoch": 0.41, - "learning_rate": 2.943268100600941e-05, - "loss": 2.4717, - "step": 235880 - }, - { - "epoch": 0.41, - "learning_rate": 2.9431809066082583e-05, - "loss": 2.4286, - "step": 235890 - }, - { - "epoch": 0.41, - "learning_rate": 2.9430937126155757e-05, - "loss": 2.4394, - "step": 235900 - }, - { - "epoch": 0.41, - "learning_rate": 2.9430065186228934e-05, - "loss": 2.3964, - "step": 235910 - }, - { - "epoch": 0.41, - "learning_rate": 2.9429193246302108e-05, - "loss": 2.3184, - "step": 235920 - }, - { - "epoch": 0.41, - "learning_rate": 2.9428321306375278e-05, - "loss": 2.3735, - "step": 235930 - }, - { - "epoch": 0.41, - "learning_rate": 2.942744936644845e-05, - "loss": 2.4144, - "step": 235940 - }, - { - "epoch": 0.41, - "learning_rate": 2.9426577426521622e-05, - "loss": 2.3835, - "step": 235950 - }, - { - "epoch": 0.41, - "learning_rate": 2.9425705486594796e-05, - "loss": 2.2854, - "step": 235960 - }, - { - "epoch": 0.41, - "learning_rate": 2.942483354666797e-05, - "loss": 2.363, - "step": 235970 - }, - { - "epoch": 0.41, - "learning_rate": 2.9423961606741147e-05, - "loss": 2.4019, - "step": 235980 - }, - { - "epoch": 0.41, - "learning_rate": 2.9423089666814317e-05, - "loss": 2.3689, - "step": 235990 - }, - { - "epoch": 0.41, - "learning_rate": 2.942221772688749e-05, - "loss": 2.4048, - "step": 236000 - }, - { - "epoch": 0.41, - "learning_rate": 2.9421345786960665e-05, - "loss": 2.4043, - "step": 236010 - }, - { - "epoch": 0.41, - "learning_rate": 2.9420473847033835e-05, - "loss": 2.3788, - "step": 236020 - }, - { - "epoch": 0.41, - "learning_rate": 2.941960190710701e-05, - "loss": 2.4901, - "step": 236030 - }, - { - "epoch": 0.41, - "learning_rate": 2.941872996718018e-05, - "loss": 2.382, - "step": 236040 - }, - { - "epoch": 0.41, - "learning_rate": 2.9417858027253353e-05, - "loss": 2.3533, - "step": 236050 - }, - { - "epoch": 0.41, - "learning_rate": 2.941698608732653e-05, - "loss": 2.3853, - "step": 236060 - }, - { - "epoch": 0.41, - "learning_rate": 2.9416114147399704e-05, - "loss": 2.474, - "step": 236070 - }, - { - "epoch": 0.41, - "learning_rate": 2.9415242207472878e-05, - "loss": 2.4072, - "step": 236080 - }, - { - "epoch": 0.41, - "learning_rate": 2.9414370267546048e-05, - "loss": 2.3214, - "step": 236090 - }, - { - "epoch": 0.41, - "learning_rate": 2.9413498327619222e-05, - "loss": 2.3831, - "step": 236100 - }, - { - "epoch": 0.41, - "learning_rate": 2.9412626387692392e-05, - "loss": 2.3469, - "step": 236110 - }, - { - "epoch": 0.41, - "learning_rate": 2.9411754447765566e-05, - "loss": 2.5003, - "step": 236120 - }, - { - "epoch": 0.41, - "learning_rate": 2.9410882507838743e-05, - "loss": 2.5013, - "step": 236130 - }, - { - "epoch": 0.41, - "learning_rate": 2.9410010567911917e-05, - "loss": 2.4922, - "step": 236140 - }, - { - "epoch": 0.41, - "learning_rate": 2.9409138627985087e-05, - "loss": 2.3403, - "step": 236150 - }, - { - "epoch": 0.41, - "learning_rate": 2.940826668805826e-05, - "loss": 2.3666, - "step": 236160 - }, - { - "epoch": 0.41, - "learning_rate": 2.9407394748131435e-05, - "loss": 2.3742, - "step": 236170 - }, - { - "epoch": 0.41, - "learning_rate": 2.9406522808204605e-05, - "loss": 2.3755, - "step": 236180 - }, - { - "epoch": 0.41, - "learning_rate": 2.940565086827778e-05, - "loss": 2.3174, - "step": 236190 - }, - { - "epoch": 0.41, - "learning_rate": 2.9404778928350953e-05, - "loss": 2.3187, - "step": 236200 - }, - { - "epoch": 0.41, - "learning_rate": 2.940390698842413e-05, - "loss": 2.4722, - "step": 236210 - }, - { - "epoch": 0.41, - "learning_rate": 2.94030350484973e-05, - "loss": 2.4563, - "step": 236220 - }, - { - "epoch": 0.41, - "learning_rate": 2.9402163108570474e-05, - "loss": 2.4057, - "step": 236230 - }, - { - "epoch": 0.41, - "learning_rate": 2.9401291168643648e-05, - "loss": 2.3461, - "step": 236240 - }, - { - "epoch": 0.41, - "learning_rate": 2.9400419228716818e-05, - "loss": 2.3573, - "step": 236250 - }, - { - "epoch": 0.41, - "learning_rate": 2.9399547288789992e-05, - "loss": 2.4001, - "step": 236260 - }, - { - "epoch": 0.41, - "learning_rate": 2.9398675348863162e-05, - "loss": 2.3258, - "step": 236270 - }, - { - "epoch": 0.41, - "learning_rate": 2.9397803408936343e-05, - "loss": 2.3592, - "step": 236280 - }, - { - "epoch": 0.41, - "learning_rate": 2.9396931469009513e-05, - "loss": 2.4474, - "step": 236290 - }, - { - "epoch": 0.41, - "learning_rate": 2.9396059529082687e-05, - "loss": 2.3023, - "step": 236300 - }, - { - "epoch": 0.41, - "learning_rate": 2.939518758915586e-05, - "loss": 2.3694, - "step": 236310 - }, - { - "epoch": 0.41, - "learning_rate": 2.939431564922903e-05, - "loss": 2.3935, - "step": 236320 - }, - { - "epoch": 0.41, - "learning_rate": 2.9393443709302205e-05, - "loss": 2.3885, - "step": 236330 - }, - { - "epoch": 0.41, - "learning_rate": 2.9392571769375375e-05, - "loss": 2.2771, - "step": 236340 - }, - { - "epoch": 0.41, - "learning_rate": 2.939169982944855e-05, - "loss": 2.3316, - "step": 236350 - }, - { - "epoch": 0.41, - "learning_rate": 2.9390827889521726e-05, - "loss": 2.4624, - "step": 236360 - }, - { - "epoch": 0.41, - "learning_rate": 2.93899559495949e-05, - "loss": 2.338, - "step": 236370 - }, - { - "epoch": 0.41, - "learning_rate": 2.938908400966807e-05, - "loss": 2.3712, - "step": 236380 - }, - { - "epoch": 0.41, - "learning_rate": 2.9388212069741244e-05, - "loss": 2.425, - "step": 236390 - }, - { - "epoch": 0.41, - "learning_rate": 2.9387340129814418e-05, - "loss": 2.45, - "step": 236400 - }, - { - "epoch": 0.41, - "learning_rate": 2.938646818988759e-05, - "loss": 2.3967, - "step": 236410 - }, - { - "epoch": 0.41, - "learning_rate": 2.9385596249960762e-05, - "loss": 2.4948, - "step": 236420 - }, - { - "epoch": 0.41, - "learning_rate": 2.938472431003394e-05, - "loss": 2.4723, - "step": 236430 - }, - { - "epoch": 0.41, - "learning_rate": 2.9383852370107113e-05, - "loss": 2.417, - "step": 236440 - }, - { - "epoch": 0.41, - "learning_rate": 2.9382980430180283e-05, - "loss": 2.2689, - "step": 236450 - }, - { - "epoch": 0.41, - "learning_rate": 2.9382108490253457e-05, - "loss": 2.2028, - "step": 236460 - }, - { - "epoch": 0.41, - "learning_rate": 2.938123655032663e-05, - "loss": 2.4457, - "step": 236470 - }, - { - "epoch": 0.41, - "learning_rate": 2.93803646103998e-05, - "loss": 2.3357, - "step": 236480 - }, - { - "epoch": 0.41, - "learning_rate": 2.9379492670472975e-05, - "loss": 2.4153, - "step": 236490 - }, - { - "epoch": 0.41, - "learning_rate": 2.9378620730546146e-05, - "loss": 2.3187, - "step": 236500 - }, - { - "epoch": 0.41, - "learning_rate": 2.9377748790619326e-05, - "loss": 2.4323, - "step": 236510 - }, - { - "epoch": 0.41, - "learning_rate": 2.9376876850692496e-05, - "loss": 2.4039, - "step": 236520 - }, - { - "epoch": 0.41, - "learning_rate": 2.937600491076567e-05, - "loss": 2.2963, - "step": 236530 - }, - { - "epoch": 0.41, - "learning_rate": 2.9375132970838844e-05, - "loss": 2.4163, - "step": 236540 - }, - { - "epoch": 0.41, - "learning_rate": 2.9374261030912014e-05, - "loss": 2.4503, - "step": 236550 - }, - { - "epoch": 0.41, - "learning_rate": 2.9373389090985188e-05, - "loss": 2.371, - "step": 236560 - }, - { - "epoch": 0.41, - "learning_rate": 2.937251715105836e-05, - "loss": 2.4097, - "step": 236570 - }, - { - "epoch": 0.41, - "learning_rate": 2.937164521113154e-05, - "loss": 2.4088, - "step": 236580 - }, - { - "epoch": 0.41, - "learning_rate": 2.937077327120471e-05, - "loss": 2.4245, - "step": 236590 - }, - { - "epoch": 0.41, - "learning_rate": 2.9369901331277883e-05, - "loss": 2.3989, - "step": 236600 - }, - { - "epoch": 0.41, - "learning_rate": 2.9369029391351054e-05, - "loss": 2.4816, - "step": 236610 - }, - { - "epoch": 0.41, - "learning_rate": 2.9368157451424227e-05, - "loss": 2.4096, - "step": 236620 - }, - { - "epoch": 0.41, - "learning_rate": 2.93672855114974e-05, - "loss": 2.5361, - "step": 236630 - }, - { - "epoch": 0.41, - "learning_rate": 2.936641357157057e-05, - "loss": 2.4331, - "step": 236640 - }, - { - "epoch": 0.41, - "learning_rate": 2.9365541631643752e-05, - "loss": 2.4104, - "step": 236650 - }, - { - "epoch": 0.41, - "learning_rate": 2.9364669691716922e-05, - "loss": 2.3751, - "step": 236660 - }, - { - "epoch": 0.41, - "learning_rate": 2.9363797751790096e-05, - "loss": 2.3968, - "step": 236670 - }, - { - "epoch": 0.41, - "learning_rate": 2.9362925811863267e-05, - "loss": 2.3548, - "step": 236680 - }, - { - "epoch": 0.41, - "learning_rate": 2.936205387193644e-05, - "loss": 2.4794, - "step": 236690 - }, - { - "epoch": 0.41, - "learning_rate": 2.9361181932009614e-05, - "loss": 2.4413, - "step": 236700 - }, - { - "epoch": 0.41, - "learning_rate": 2.9360309992082785e-05, - "loss": 2.4248, - "step": 236710 - }, - { - "epoch": 0.41, - "learning_rate": 2.9359438052155958e-05, - "loss": 2.5247, - "step": 236720 - }, - { - "epoch": 0.41, - "learning_rate": 2.9358566112229135e-05, - "loss": 2.419, - "step": 236730 - }, - { - "epoch": 0.41, - "learning_rate": 2.935769417230231e-05, - "loss": 2.4375, - "step": 236740 - }, - { - "epoch": 0.41, - "learning_rate": 2.935682223237548e-05, - "loss": 2.4782, - "step": 236750 - }, - { - "epoch": 0.41, - "learning_rate": 2.9355950292448653e-05, - "loss": 2.5053, - "step": 236760 - }, - { - "epoch": 0.41, - "learning_rate": 2.9355078352521824e-05, - "loss": 2.3042, - "step": 236770 - }, - { - "epoch": 0.41, - "learning_rate": 2.9354206412594998e-05, - "loss": 2.4659, - "step": 236780 - }, - { - "epoch": 0.41, - "learning_rate": 2.935333447266817e-05, - "loss": 2.3824, - "step": 236790 - }, - { - "epoch": 0.41, - "learning_rate": 2.935246253274135e-05, - "loss": 2.466, - "step": 236800 - }, - { - "epoch": 0.41, - "learning_rate": 2.9351590592814522e-05, - "loss": 2.3871, - "step": 236810 - }, - { - "epoch": 0.41, - "learning_rate": 2.9350718652887693e-05, - "loss": 2.3095, - "step": 236820 - }, - { - "epoch": 0.41, - "learning_rate": 2.9349846712960866e-05, - "loss": 2.3974, - "step": 236830 - }, - { - "epoch": 0.41, - "learning_rate": 2.9348974773034037e-05, - "loss": 2.3956, - "step": 236840 - }, - { - "epoch": 0.41, - "learning_rate": 2.934810283310721e-05, - "loss": 2.2888, - "step": 236850 - }, - { - "epoch": 0.41, - "learning_rate": 2.9347230893180384e-05, - "loss": 2.3868, - "step": 236860 - }, - { - "epoch": 0.41, - "learning_rate": 2.9346358953253555e-05, - "loss": 2.4271, - "step": 236870 - }, - { - "epoch": 0.41, - "learning_rate": 2.9345487013326732e-05, - "loss": 2.3831, - "step": 236880 - }, - { - "epoch": 0.41, - "learning_rate": 2.9344615073399906e-05, - "loss": 2.2806, - "step": 236890 - }, - { - "epoch": 0.41, - "learning_rate": 2.934374313347308e-05, - "loss": 2.2106, - "step": 236900 - }, - { - "epoch": 0.41, - "learning_rate": 2.934287119354625e-05, - "loss": 2.5218, - "step": 236910 - }, - { - "epoch": 0.41, - "learning_rate": 2.9341999253619424e-05, - "loss": 2.3455, - "step": 236920 - }, - { - "epoch": 0.41, - "learning_rate": 2.9341127313692597e-05, - "loss": 2.2995, - "step": 236930 - }, - { - "epoch": 0.41, - "learning_rate": 2.9340255373765768e-05, - "loss": 2.4892, - "step": 236940 - }, - { - "epoch": 0.41, - "learning_rate": 2.9339383433838945e-05, - "loss": 2.3813, - "step": 236950 - }, - { - "epoch": 0.41, - "learning_rate": 2.933851149391212e-05, - "loss": 2.4378, - "step": 236960 - }, - { - "epoch": 0.41, - "learning_rate": 2.9337639553985292e-05, - "loss": 2.3774, - "step": 236970 - }, - { - "epoch": 0.41, - "learning_rate": 2.9336767614058463e-05, - "loss": 2.3287, - "step": 236980 - }, - { - "epoch": 0.41, - "learning_rate": 2.9335895674131637e-05, - "loss": 2.4332, - "step": 236990 - }, - { - "epoch": 0.41, - "learning_rate": 2.9335023734204807e-05, - "loss": 2.2918, - "step": 237000 - }, - { - "epoch": 0.41, - "learning_rate": 2.933415179427798e-05, - "loss": 2.4609, - "step": 237010 - }, - { - "epoch": 0.41, - "learning_rate": 2.9333279854351154e-05, - "loss": 2.4278, - "step": 237020 - }, - { - "epoch": 0.41, - "learning_rate": 2.933240791442433e-05, - "loss": 2.4239, - "step": 237030 - }, - { - "epoch": 0.41, - "learning_rate": 2.9331535974497505e-05, - "loss": 2.4249, - "step": 237040 - }, - { - "epoch": 0.41, - "learning_rate": 2.9330664034570676e-05, - "loss": 2.3649, - "step": 237050 - }, - { - "epoch": 0.41, - "learning_rate": 2.932979209464385e-05, - "loss": 2.3927, - "step": 237060 - }, - { - "epoch": 0.41, - "learning_rate": 2.932892015471702e-05, - "loss": 2.3161, - "step": 237070 - }, - { - "epoch": 0.41, - "learning_rate": 2.9328048214790194e-05, - "loss": 2.3861, - "step": 237080 - }, - { - "epoch": 0.41, - "learning_rate": 2.9327176274863367e-05, - "loss": 2.4218, - "step": 237090 - }, - { - "epoch": 0.41, - "learning_rate": 2.9326304334936545e-05, - "loss": 2.381, - "step": 237100 - }, - { - "epoch": 0.41, - "learning_rate": 2.9325432395009715e-05, - "loss": 2.4393, - "step": 237110 - }, - { - "epoch": 0.41, - "learning_rate": 2.932456045508289e-05, - "loss": 2.3374, - "step": 237120 - }, - { - "epoch": 0.41, - "learning_rate": 2.9323688515156063e-05, - "loss": 2.3187, - "step": 237130 - }, - { - "epoch": 0.41, - "learning_rate": 2.9322816575229233e-05, - "loss": 2.5044, - "step": 237140 - }, - { - "epoch": 0.41, - "learning_rate": 2.9321944635302407e-05, - "loss": 2.4001, - "step": 237150 - }, - { - "epoch": 0.41, - "learning_rate": 2.932107269537558e-05, - "loss": 2.3035, - "step": 237160 - }, - { - "epoch": 0.41, - "learning_rate": 2.9320200755448758e-05, - "loss": 2.4837, - "step": 237170 - }, - { - "epoch": 0.41, - "learning_rate": 2.9319328815521928e-05, - "loss": 2.4393, - "step": 237180 - }, - { - "epoch": 0.41, - "learning_rate": 2.9318456875595102e-05, - "loss": 2.3699, - "step": 237190 - }, - { - "epoch": 0.41, - "learning_rate": 2.9317584935668276e-05, - "loss": 2.4046, - "step": 237200 - }, - { - "epoch": 0.41, - "learning_rate": 2.9316712995741446e-05, - "loss": 2.4905, - "step": 237210 - }, - { - "epoch": 0.41, - "learning_rate": 2.931584105581462e-05, - "loss": 2.3552, - "step": 237220 - }, - { - "epoch": 0.41, - "learning_rate": 2.931496911588779e-05, - "loss": 2.3985, - "step": 237230 - }, - { - "epoch": 0.41, - "learning_rate": 2.9314097175960964e-05, - "loss": 2.3754, - "step": 237240 - }, - { - "epoch": 0.41, - "learning_rate": 2.931322523603414e-05, - "loss": 2.4035, - "step": 237250 - }, - { - "epoch": 0.41, - "learning_rate": 2.9312353296107315e-05, - "loss": 2.4221, - "step": 237260 - }, - { - "epoch": 0.41, - "learning_rate": 2.931148135618049e-05, - "loss": 2.3712, - "step": 237270 - }, - { - "epoch": 0.41, - "learning_rate": 2.931060941625366e-05, - "loss": 2.3144, - "step": 237280 - }, - { - "epoch": 0.41, - "learning_rate": 2.9309737476326833e-05, - "loss": 2.3994, - "step": 237290 - }, - { - "epoch": 0.41, - "learning_rate": 2.9308865536400003e-05, - "loss": 2.3494, - "step": 237300 - }, - { - "epoch": 0.41, - "learning_rate": 2.9307993596473177e-05, - "loss": 2.3443, - "step": 237310 - }, - { - "epoch": 0.41, - "learning_rate": 2.9307121656546354e-05, - "loss": 2.4817, - "step": 237320 - }, - { - "epoch": 0.41, - "learning_rate": 2.9306249716619528e-05, - "loss": 2.4217, - "step": 237330 - }, - { - "epoch": 0.41, - "learning_rate": 2.9305377776692698e-05, - "loss": 2.2881, - "step": 237340 - }, - { - "epoch": 0.41, - "learning_rate": 2.9304505836765872e-05, - "loss": 2.3443, - "step": 237350 - }, - { - "epoch": 0.41, - "learning_rate": 2.9303633896839046e-05, - "loss": 2.33, - "step": 237360 - }, - { - "epoch": 0.41, - "learning_rate": 2.9302761956912216e-05, - "loss": 2.3148, - "step": 237370 - }, - { - "epoch": 0.41, - "learning_rate": 2.930189001698539e-05, - "loss": 2.4183, - "step": 237380 - }, - { - "epoch": 0.41, - "learning_rate": 2.930101807705856e-05, - "loss": 2.3629, - "step": 237390 - }, - { - "epoch": 0.41, - "learning_rate": 2.930014613713174e-05, - "loss": 2.328, - "step": 237400 - }, - { - "epoch": 0.41, - "learning_rate": 2.929927419720491e-05, - "loss": 2.4122, - "step": 237410 - }, - { - "epoch": 0.41, - "learning_rate": 2.9298402257278085e-05, - "loss": 2.3661, - "step": 237420 - }, - { - "epoch": 0.41, - "learning_rate": 2.929753031735126e-05, - "loss": 2.3692, - "step": 237430 - }, - { - "epoch": 0.41, - "learning_rate": 2.929665837742443e-05, - "loss": 2.3147, - "step": 237440 - }, - { - "epoch": 0.41, - "learning_rate": 2.9295786437497603e-05, - "loss": 2.3919, - "step": 237450 - }, - { - "epoch": 0.41, - "learning_rate": 2.9294914497570773e-05, - "loss": 2.4541, - "step": 237460 - }, - { - "epoch": 0.41, - "learning_rate": 2.9294042557643954e-05, - "loss": 2.2652, - "step": 237470 - }, - { - "epoch": 0.41, - "learning_rate": 2.9293170617717124e-05, - "loss": 2.3913, - "step": 237480 - }, - { - "epoch": 0.41, - "learning_rate": 2.9292298677790298e-05, - "loss": 2.4, - "step": 237490 - }, - { - "epoch": 0.41, - "learning_rate": 2.9291426737863468e-05, - "loss": 2.3718, - "step": 237500 - }, - { - "epoch": 0.41, - "learning_rate": 2.9290554797936642e-05, - "loss": 2.3493, - "step": 237510 - }, - { - "epoch": 0.41, - "learning_rate": 2.9289682858009816e-05, - "loss": 2.3376, - "step": 237520 - }, - { - "epoch": 0.41, - "learning_rate": 2.9288810918082986e-05, - "loss": 2.4232, - "step": 237530 - }, - { - "epoch": 0.41, - "learning_rate": 2.928793897815616e-05, - "loss": 2.5617, - "step": 237540 - }, - { - "epoch": 0.41, - "learning_rate": 2.9287067038229337e-05, - "loss": 2.3158, - "step": 237550 - }, - { - "epoch": 0.41, - "learning_rate": 2.928619509830251e-05, - "loss": 2.3896, - "step": 237560 - }, - { - "epoch": 0.41, - "learning_rate": 2.928532315837568e-05, - "loss": 2.3799, - "step": 237570 - }, - { - "epoch": 0.41, - "learning_rate": 2.9284451218448855e-05, - "loss": 2.3308, - "step": 237580 - }, - { - "epoch": 0.41, - "learning_rate": 2.928357927852203e-05, - "loss": 2.4216, - "step": 237590 - }, - { - "epoch": 0.41, - "learning_rate": 2.92827073385952e-05, - "loss": 2.3383, - "step": 237600 - }, - { - "epoch": 0.41, - "learning_rate": 2.9281835398668373e-05, - "loss": 2.3547, - "step": 237610 - }, - { - "epoch": 0.41, - "learning_rate": 2.928096345874155e-05, - "loss": 2.4319, - "step": 237620 - }, - { - "epoch": 0.41, - "learning_rate": 2.9280091518814724e-05, - "loss": 2.4224, - "step": 237630 - }, - { - "epoch": 0.41, - "learning_rate": 2.9279219578887894e-05, - "loss": 2.4205, - "step": 237640 - }, - { - "epoch": 0.41, - "learning_rate": 2.9278347638961068e-05, - "loss": 2.3139, - "step": 237650 - }, - { - "epoch": 0.41, - "learning_rate": 2.9277475699034242e-05, - "loss": 2.3994, - "step": 237660 - }, - { - "epoch": 0.41, - "learning_rate": 2.9276603759107412e-05, - "loss": 2.3822, - "step": 237670 - }, - { - "epoch": 0.41, - "learning_rate": 2.9275731819180586e-05, - "loss": 2.5138, - "step": 237680 - }, - { - "epoch": 0.41, - "learning_rate": 2.9274859879253756e-05, - "loss": 2.4465, - "step": 237690 - }, - { - "epoch": 0.41, - "learning_rate": 2.9273987939326937e-05, - "loss": 2.3314, - "step": 237700 - }, - { - "epoch": 0.41, - "learning_rate": 2.9273115999400107e-05, - "loss": 2.4248, - "step": 237710 - }, - { - "epoch": 0.41, - "learning_rate": 2.927224405947328e-05, - "loss": 2.4055, - "step": 237720 - }, - { - "epoch": 0.41, - "learning_rate": 2.927137211954645e-05, - "loss": 2.4205, - "step": 237730 - }, - { - "epoch": 0.41, - "learning_rate": 2.9270500179619625e-05, - "loss": 2.4611, - "step": 237740 - }, - { - "epoch": 0.41, - "learning_rate": 2.92696282396928e-05, - "loss": 2.3047, - "step": 237750 - }, - { - "epoch": 0.41, - "learning_rate": 2.926875629976597e-05, - "loss": 2.5047, - "step": 237760 - }, - { - "epoch": 0.41, - "learning_rate": 2.926788435983915e-05, - "loss": 2.2291, - "step": 237770 - }, - { - "epoch": 0.41, - "learning_rate": 2.926701241991232e-05, - "loss": 2.4082, - "step": 237780 - }, - { - "epoch": 0.41, - "learning_rate": 2.9266140479985494e-05, - "loss": 2.2968, - "step": 237790 - }, - { - "epoch": 0.41, - "learning_rate": 2.9265268540058664e-05, - "loss": 2.4294, - "step": 237800 - }, - { - "epoch": 0.41, - "learning_rate": 2.9264396600131838e-05, - "loss": 2.39, - "step": 237810 - }, - { - "epoch": 0.41, - "learning_rate": 2.9263524660205012e-05, - "loss": 2.4464, - "step": 237820 - }, - { - "epoch": 0.41, - "learning_rate": 2.9262652720278182e-05, - "loss": 2.4251, - "step": 237830 - }, - { - "epoch": 0.41, - "learning_rate": 2.926178078035136e-05, - "loss": 2.3756, - "step": 237840 - }, - { - "epoch": 0.41, - "learning_rate": 2.9260908840424533e-05, - "loss": 2.4473, - "step": 237850 - }, - { - "epoch": 0.41, - "learning_rate": 2.9260036900497707e-05, - "loss": 2.3588, - "step": 237860 - }, - { - "epoch": 0.41, - "learning_rate": 2.9259164960570877e-05, - "loss": 2.3602, - "step": 237870 - }, - { - "epoch": 0.41, - "learning_rate": 2.925829302064405e-05, - "loss": 2.3947, - "step": 237880 - }, - { - "epoch": 0.41, - "learning_rate": 2.9257421080717225e-05, - "loss": 2.3711, - "step": 237890 - }, - { - "epoch": 0.41, - "learning_rate": 2.9256549140790395e-05, - "loss": 2.3412, - "step": 237900 - }, - { - "epoch": 0.41, - "learning_rate": 2.925567720086357e-05, - "loss": 2.368, - "step": 237910 - }, - { - "epoch": 0.41, - "learning_rate": 2.9254805260936746e-05, - "loss": 2.4569, - "step": 237920 - }, - { - "epoch": 0.41, - "learning_rate": 2.925393332100992e-05, - "loss": 2.4088, - "step": 237930 - }, - { - "epoch": 0.41, - "learning_rate": 2.925306138108309e-05, - "loss": 2.438, - "step": 237940 - }, - { - "epoch": 0.41, - "learning_rate": 2.9252189441156264e-05, - "loss": 2.3205, - "step": 237950 - }, - { - "epoch": 0.41, - "learning_rate": 2.9251317501229435e-05, - "loss": 2.3804, - "step": 237960 - }, - { - "epoch": 0.41, - "learning_rate": 2.925044556130261e-05, - "loss": 2.3843, - "step": 237970 - }, - { - "epoch": 0.42, - "learning_rate": 2.9249573621375782e-05, - "loss": 2.4832, - "step": 237980 - }, - { - "epoch": 0.42, - "learning_rate": 2.924870168144896e-05, - "loss": 2.3415, - "step": 237990 - }, - { - "epoch": 0.42, - "learning_rate": 2.9247829741522133e-05, - "loss": 2.3879, - "step": 238000 - }, - { - "epoch": 0.42, - "learning_rate": 2.9246957801595303e-05, - "loss": 2.437, - "step": 238010 - }, - { - "epoch": 0.42, - "learning_rate": 2.9246085861668477e-05, - "loss": 2.4185, - "step": 238020 - }, - { - "epoch": 0.42, - "learning_rate": 2.9245213921741648e-05, - "loss": 2.3437, - "step": 238030 - }, - { - "epoch": 0.42, - "learning_rate": 2.924434198181482e-05, - "loss": 2.2486, - "step": 238040 - }, - { - "epoch": 0.42, - "learning_rate": 2.9243470041887995e-05, - "loss": 2.3235, - "step": 238050 - }, - { - "epoch": 0.42, - "learning_rate": 2.9242598101961166e-05, - "loss": 2.3867, - "step": 238060 - }, - { - "epoch": 0.42, - "learning_rate": 2.9241726162034343e-05, - "loss": 2.3513, - "step": 238070 - }, - { - "epoch": 0.42, - "learning_rate": 2.9240854222107516e-05, - "loss": 2.4442, - "step": 238080 - }, - { - "epoch": 0.42, - "learning_rate": 2.923998228218069e-05, - "loss": 2.422, - "step": 238090 - }, - { - "epoch": 0.42, - "learning_rate": 2.923911034225386e-05, - "loss": 2.4632, - "step": 238100 - }, - { - "epoch": 0.42, - "learning_rate": 2.9238238402327034e-05, - "loss": 2.3991, - "step": 238110 - }, - { - "epoch": 0.42, - "learning_rate": 2.9237366462400205e-05, - "loss": 2.3726, - "step": 238120 - }, - { - "epoch": 0.42, - "learning_rate": 2.923649452247338e-05, - "loss": 2.5, - "step": 238130 - }, - { - "epoch": 0.42, - "learning_rate": 2.9235622582546556e-05, - "loss": 2.3964, - "step": 238140 - }, - { - "epoch": 0.42, - "learning_rate": 2.923475064261973e-05, - "loss": 2.3241, - "step": 238150 - }, - { - "epoch": 0.42, - "learning_rate": 2.9233878702692903e-05, - "loss": 2.4459, - "step": 238160 - }, - { - "epoch": 0.42, - "learning_rate": 2.9233006762766074e-05, - "loss": 2.5051, - "step": 238170 - }, - { - "epoch": 0.42, - "learning_rate": 2.9232134822839247e-05, - "loss": 2.3571, - "step": 238180 - }, - { - "epoch": 0.42, - "learning_rate": 2.9231262882912418e-05, - "loss": 2.4574, - "step": 238190 - }, - { - "epoch": 0.42, - "learning_rate": 2.923039094298559e-05, - "loss": 2.2677, - "step": 238200 - }, - { - "epoch": 0.42, - "learning_rate": 2.9229519003058765e-05, - "loss": 2.3521, - "step": 238210 - }, - { - "epoch": 0.42, - "learning_rate": 2.9228647063131942e-05, - "loss": 2.4982, - "step": 238220 - }, - { - "epoch": 0.42, - "learning_rate": 2.9227775123205113e-05, - "loss": 2.373, - "step": 238230 - }, - { - "epoch": 0.42, - "learning_rate": 2.9226903183278287e-05, - "loss": 2.341, - "step": 238240 - }, - { - "epoch": 0.42, - "learning_rate": 2.922603124335146e-05, - "loss": 2.4684, - "step": 238250 - }, - { - "epoch": 0.42, - "learning_rate": 2.922515930342463e-05, - "loss": 2.4095, - "step": 238260 - }, - { - "epoch": 0.42, - "learning_rate": 2.9224287363497805e-05, - "loss": 2.311, - "step": 238270 - }, - { - "epoch": 0.42, - "learning_rate": 2.9223415423570978e-05, - "loss": 2.3428, - "step": 238280 - }, - { - "epoch": 0.42, - "learning_rate": 2.9222543483644155e-05, - "loss": 2.437, - "step": 238290 - }, - { - "epoch": 0.42, - "learning_rate": 2.9221671543717326e-05, - "loss": 2.3692, - "step": 238300 - }, - { - "epoch": 0.42, - "learning_rate": 2.92207996037905e-05, - "loss": 2.2942, - "step": 238310 - }, - { - "epoch": 0.42, - "learning_rate": 2.9219927663863673e-05, - "loss": 2.4719, - "step": 238320 - }, - { - "epoch": 0.42, - "learning_rate": 2.9219055723936844e-05, - "loss": 2.3067, - "step": 238330 - }, - { - "epoch": 0.42, - "learning_rate": 2.9218183784010018e-05, - "loss": 2.4313, - "step": 238340 - }, - { - "epoch": 0.42, - "learning_rate": 2.9217311844083188e-05, - "loss": 2.3465, - "step": 238350 - }, - { - "epoch": 0.42, - "learning_rate": 2.921643990415636e-05, - "loss": 2.3753, - "step": 238360 - }, - { - "epoch": 0.42, - "learning_rate": 2.921556796422954e-05, - "loss": 2.293, - "step": 238370 - }, - { - "epoch": 0.42, - "learning_rate": 2.9214696024302713e-05, - "loss": 2.4028, - "step": 238380 - }, - { - "epoch": 0.42, - "learning_rate": 2.9213824084375886e-05, - "loss": 2.2972, - "step": 238390 - }, - { - "epoch": 0.42, - "learning_rate": 2.9212952144449057e-05, - "loss": 2.4677, - "step": 238400 - }, - { - "epoch": 0.42, - "learning_rate": 2.921208020452223e-05, - "loss": 2.3901, - "step": 238410 - }, - { - "epoch": 0.42, - "learning_rate": 2.92112082645954e-05, - "loss": 2.4534, - "step": 238420 - }, - { - "epoch": 0.42, - "learning_rate": 2.9210336324668575e-05, - "loss": 2.4185, - "step": 238430 - }, - { - "epoch": 0.42, - "learning_rate": 2.9209464384741752e-05, - "loss": 2.4077, - "step": 238440 - }, - { - "epoch": 0.42, - "learning_rate": 2.9208592444814926e-05, - "loss": 2.3722, - "step": 238450 - }, - { - "epoch": 0.42, - "learning_rate": 2.9207720504888096e-05, - "loss": 2.4618, - "step": 238460 - }, - { - "epoch": 0.42, - "learning_rate": 2.920684856496127e-05, - "loss": 2.3831, - "step": 238470 - }, - { - "epoch": 0.42, - "learning_rate": 2.9205976625034444e-05, - "loss": 2.4038, - "step": 238480 - }, - { - "epoch": 0.42, - "learning_rate": 2.9205104685107614e-05, - "loss": 2.4305, - "step": 238490 - }, - { - "epoch": 0.42, - "learning_rate": 2.9204232745180788e-05, - "loss": 2.4499, - "step": 238500 - }, - { - "epoch": 0.42, - "learning_rate": 2.9203360805253965e-05, - "loss": 2.3322, - "step": 238510 - }, - { - "epoch": 0.42, - "learning_rate": 2.920248886532714e-05, - "loss": 2.3466, - "step": 238520 - }, - { - "epoch": 0.42, - "learning_rate": 2.920161692540031e-05, - "loss": 2.378, - "step": 238530 - }, - { - "epoch": 0.42, - "learning_rate": 2.9200744985473483e-05, - "loss": 2.4425, - "step": 238540 - }, - { - "epoch": 0.42, - "learning_rate": 2.9199873045546657e-05, - "loss": 2.3472, - "step": 238550 - }, - { - "epoch": 0.42, - "learning_rate": 2.9199001105619827e-05, - "loss": 2.4893, - "step": 238560 - }, - { - "epoch": 0.42, - "learning_rate": 2.9198129165693e-05, - "loss": 2.3195, - "step": 238570 - }, - { - "epoch": 0.42, - "learning_rate": 2.919725722576617e-05, - "loss": 2.4792, - "step": 238580 - }, - { - "epoch": 0.42, - "learning_rate": 2.919638528583935e-05, - "loss": 2.4492, - "step": 238590 - }, - { - "epoch": 0.42, - "learning_rate": 2.9195513345912522e-05, - "loss": 2.3127, - "step": 238600 - }, - { - "epoch": 0.42, - "learning_rate": 2.9194641405985696e-05, - "loss": 2.3265, - "step": 238610 - }, - { - "epoch": 0.42, - "learning_rate": 2.919376946605887e-05, - "loss": 2.4, - "step": 238620 - }, - { - "epoch": 0.42, - "learning_rate": 2.919289752613204e-05, - "loss": 2.4229, - "step": 238630 - }, - { - "epoch": 0.42, - "learning_rate": 2.9192025586205214e-05, - "loss": 2.4685, - "step": 238640 - }, - { - "epoch": 0.42, - "learning_rate": 2.9191153646278384e-05, - "loss": 2.5046, - "step": 238650 - }, - { - "epoch": 0.42, - "learning_rate": 2.9190281706351565e-05, - "loss": 2.5483, - "step": 238660 - }, - { - "epoch": 0.42, - "learning_rate": 2.9189409766424735e-05, - "loss": 2.2917, - "step": 238670 - }, - { - "epoch": 0.42, - "learning_rate": 2.918853782649791e-05, - "loss": 2.4847, - "step": 238680 - }, - { - "epoch": 0.42, - "learning_rate": 2.918766588657108e-05, - "loss": 2.3472, - "step": 238690 - }, - { - "epoch": 0.42, - "learning_rate": 2.9186793946644253e-05, - "loss": 2.4718, - "step": 238700 - }, - { - "epoch": 0.42, - "learning_rate": 2.9185922006717427e-05, - "loss": 2.4393, - "step": 238710 - }, - { - "epoch": 0.42, - "learning_rate": 2.9185050066790597e-05, - "loss": 2.3681, - "step": 238720 - }, - { - "epoch": 0.42, - "learning_rate": 2.918417812686377e-05, - "loss": 2.36, - "step": 238730 - }, - { - "epoch": 0.42, - "learning_rate": 2.9183306186936948e-05, - "loss": 2.4042, - "step": 238740 - }, - { - "epoch": 0.42, - "learning_rate": 2.9182434247010122e-05, - "loss": 2.3747, - "step": 238750 - }, - { - "epoch": 0.42, - "learning_rate": 2.9181562307083292e-05, - "loss": 2.385, - "step": 238760 - }, - { - "epoch": 0.42, - "learning_rate": 2.9180690367156466e-05, - "loss": 2.4182, - "step": 238770 - }, - { - "epoch": 0.42, - "learning_rate": 2.917981842722964e-05, - "loss": 2.3819, - "step": 238780 - }, - { - "epoch": 0.42, - "learning_rate": 2.917894648730281e-05, - "loss": 2.4402, - "step": 238790 - }, - { - "epoch": 0.42, - "learning_rate": 2.9178074547375984e-05, - "loss": 2.3862, - "step": 238800 - }, - { - "epoch": 0.42, - "learning_rate": 2.917720260744916e-05, - "loss": 2.4354, - "step": 238810 - }, - { - "epoch": 0.42, - "learning_rate": 2.9176330667522335e-05, - "loss": 2.4346, - "step": 238820 - }, - { - "epoch": 0.42, - "learning_rate": 2.9175458727595505e-05, - "loss": 2.4086, - "step": 238830 - }, - { - "epoch": 0.42, - "learning_rate": 2.917458678766868e-05, - "loss": 2.2857, - "step": 238840 - }, - { - "epoch": 0.42, - "learning_rate": 2.917371484774185e-05, - "loss": 2.3502, - "step": 238850 - }, - { - "epoch": 0.42, - "learning_rate": 2.9172842907815023e-05, - "loss": 2.4347, - "step": 238860 - }, - { - "epoch": 0.42, - "learning_rate": 2.9171970967888197e-05, - "loss": 2.2518, - "step": 238870 - }, - { - "epoch": 0.42, - "learning_rate": 2.9171099027961367e-05, - "loss": 2.4405, - "step": 238880 - }, - { - "epoch": 0.42, - "learning_rate": 2.9170227088034548e-05, - "loss": 2.3944, - "step": 238890 - }, - { - "epoch": 0.42, - "learning_rate": 2.9169355148107718e-05, - "loss": 2.4256, - "step": 238900 - }, - { - "epoch": 0.42, - "learning_rate": 2.9168483208180892e-05, - "loss": 2.4276, - "step": 238910 - }, - { - "epoch": 0.42, - "learning_rate": 2.9167611268254062e-05, - "loss": 2.4906, - "step": 238920 - }, - { - "epoch": 0.42, - "learning_rate": 2.9166739328327236e-05, - "loss": 2.4043, - "step": 238930 - }, - { - "epoch": 0.42, - "learning_rate": 2.916586738840041e-05, - "loss": 2.2642, - "step": 238940 - }, - { - "epoch": 0.42, - "learning_rate": 2.916499544847358e-05, - "loss": 2.4363, - "step": 238950 - }, - { - "epoch": 0.42, - "learning_rate": 2.9164123508546757e-05, - "loss": 2.4167, - "step": 238960 - }, - { - "epoch": 0.42, - "learning_rate": 2.916325156861993e-05, - "loss": 2.2866, - "step": 238970 - }, - { - "epoch": 0.42, - "learning_rate": 2.9162379628693105e-05, - "loss": 2.3342, - "step": 238980 - }, - { - "epoch": 0.42, - "learning_rate": 2.9161507688766275e-05, - "loss": 2.4198, - "step": 238990 - }, - { - "epoch": 0.42, - "learning_rate": 2.916063574883945e-05, - "loss": 2.3961, - "step": 239000 - }, - { - "epoch": 0.42, - "learning_rate": 2.9159763808912623e-05, - "loss": 2.3733, - "step": 239010 - }, - { - "epoch": 0.42, - "learning_rate": 2.9158891868985793e-05, - "loss": 2.2849, - "step": 239020 - }, - { - "epoch": 0.42, - "learning_rate": 2.9158019929058967e-05, - "loss": 2.3816, - "step": 239030 - }, - { - "epoch": 0.42, - "learning_rate": 2.9157147989132144e-05, - "loss": 2.2625, - "step": 239040 - }, - { - "epoch": 0.42, - "learning_rate": 2.9156276049205318e-05, - "loss": 2.3739, - "step": 239050 - }, - { - "epoch": 0.42, - "learning_rate": 2.9155404109278488e-05, - "loss": 2.4938, - "step": 239060 - }, - { - "epoch": 0.42, - "learning_rate": 2.9154532169351662e-05, - "loss": 2.3295, - "step": 239070 - }, - { - "epoch": 0.42, - "learning_rate": 2.9153660229424832e-05, - "loss": 2.4174, - "step": 239080 - }, - { - "epoch": 0.42, - "learning_rate": 2.9152788289498006e-05, - "loss": 2.348, - "step": 239090 - }, - { - "epoch": 0.42, - "learning_rate": 2.915191634957118e-05, - "loss": 2.3729, - "step": 239100 - }, - { - "epoch": 0.42, - "learning_rate": 2.9151044409644357e-05, - "loss": 2.5517, - "step": 239110 - }, - { - "epoch": 0.42, - "learning_rate": 2.915017246971753e-05, - "loss": 2.3401, - "step": 239120 - }, - { - "epoch": 0.42, - "learning_rate": 2.91493005297907e-05, - "loss": 2.3624, - "step": 239130 - }, - { - "epoch": 0.42, - "learning_rate": 2.9148428589863875e-05, - "loss": 2.3888, - "step": 239140 - }, - { - "epoch": 0.42, - "learning_rate": 2.9147556649937045e-05, - "loss": 2.2736, - "step": 239150 - }, - { - "epoch": 0.42, - "learning_rate": 2.914668471001022e-05, - "loss": 2.4588, - "step": 239160 - }, - { - "epoch": 0.42, - "learning_rate": 2.9145812770083393e-05, - "loss": 2.3848, - "step": 239170 - }, - { - "epoch": 0.42, - "learning_rate": 2.914494083015657e-05, - "loss": 2.3441, - "step": 239180 - }, - { - "epoch": 0.42, - "learning_rate": 2.914406889022974e-05, - "loss": 2.3476, - "step": 239190 - }, - { - "epoch": 0.42, - "learning_rate": 2.9143196950302914e-05, - "loss": 2.3834, - "step": 239200 - }, - { - "epoch": 0.42, - "learning_rate": 2.9142325010376088e-05, - "loss": 2.4691, - "step": 239210 - }, - { - "epoch": 0.42, - "learning_rate": 2.914145307044926e-05, - "loss": 2.3655, - "step": 239220 - }, - { - "epoch": 0.42, - "learning_rate": 2.9140581130522432e-05, - "loss": 2.417, - "step": 239230 - }, - { - "epoch": 0.42, - "learning_rate": 2.9139709190595606e-05, - "loss": 2.4124, - "step": 239240 - }, - { - "epoch": 0.42, - "learning_rate": 2.9138837250668776e-05, - "loss": 2.4806, - "step": 239250 - }, - { - "epoch": 0.42, - "learning_rate": 2.9137965310741954e-05, - "loss": 2.3046, - "step": 239260 - }, - { - "epoch": 0.42, - "learning_rate": 2.9137093370815127e-05, - "loss": 2.405, - "step": 239270 - }, - { - "epoch": 0.42, - "learning_rate": 2.91362214308883e-05, - "loss": 2.284, - "step": 239280 - }, - { - "epoch": 0.42, - "learning_rate": 2.913534949096147e-05, - "loss": 2.3905, - "step": 239290 - }, - { - "epoch": 0.42, - "learning_rate": 2.9134477551034645e-05, - "loss": 2.3945, - "step": 239300 - }, - { - "epoch": 0.42, - "learning_rate": 2.9133605611107816e-05, - "loss": 2.4368, - "step": 239310 - }, - { - "epoch": 0.42, - "learning_rate": 2.913273367118099e-05, - "loss": 2.3966, - "step": 239320 - }, - { - "epoch": 0.42, - "learning_rate": 2.9131861731254167e-05, - "loss": 2.4935, - "step": 239330 - }, - { - "epoch": 0.42, - "learning_rate": 2.913098979132734e-05, - "loss": 2.4395, - "step": 239340 - }, - { - "epoch": 0.42, - "learning_rate": 2.9130117851400514e-05, - "loss": 2.3837, - "step": 239350 - }, - { - "epoch": 0.42, - "learning_rate": 2.9129245911473684e-05, - "loss": 2.3037, - "step": 239360 - }, - { - "epoch": 0.42, - "learning_rate": 2.9128373971546858e-05, - "loss": 2.337, - "step": 239370 - }, - { - "epoch": 0.42, - "learning_rate": 2.912750203162003e-05, - "loss": 2.3917, - "step": 239380 - }, - { - "epoch": 0.42, - "learning_rate": 2.9126630091693202e-05, - "loss": 2.401, - "step": 239390 - }, - { - "epoch": 0.42, - "learning_rate": 2.9125758151766376e-05, - "loss": 2.4685, - "step": 239400 - }, - { - "epoch": 0.42, - "learning_rate": 2.9124886211839553e-05, - "loss": 2.3237, - "step": 239410 - }, - { - "epoch": 0.42, - "learning_rate": 2.9124014271912724e-05, - "loss": 2.3475, - "step": 239420 - }, - { - "epoch": 0.42, - "learning_rate": 2.9123142331985897e-05, - "loss": 2.3358, - "step": 239430 - }, - { - "epoch": 0.42, - "learning_rate": 2.912227039205907e-05, - "loss": 2.3515, - "step": 239440 - }, - { - "epoch": 0.42, - "learning_rate": 2.912139845213224e-05, - "loss": 2.4703, - "step": 239450 - }, - { - "epoch": 0.42, - "learning_rate": 2.9120526512205415e-05, - "loss": 2.4485, - "step": 239460 - }, - { - "epoch": 0.42, - "learning_rate": 2.9119654572278586e-05, - "loss": 2.2462, - "step": 239470 - }, - { - "epoch": 0.42, - "learning_rate": 2.9118782632351766e-05, - "loss": 2.4112, - "step": 239480 - }, - { - "epoch": 0.42, - "learning_rate": 2.9117910692424937e-05, - "loss": 2.4307, - "step": 239490 - }, - { - "epoch": 0.42, - "learning_rate": 2.911703875249811e-05, - "loss": 2.3161, - "step": 239500 - }, - { - "epoch": 0.42, - "learning_rate": 2.9116166812571284e-05, - "loss": 2.457, - "step": 239510 - }, - { - "epoch": 0.42, - "learning_rate": 2.9115294872644455e-05, - "loss": 2.3689, - "step": 239520 - }, - { - "epoch": 0.42, - "learning_rate": 2.911442293271763e-05, - "loss": 2.4055, - "step": 239530 - }, - { - "epoch": 0.42, - "learning_rate": 2.91135509927908e-05, - "loss": 2.4109, - "step": 239540 - }, - { - "epoch": 0.42, - "learning_rate": 2.9112679052863973e-05, - "loss": 2.3062, - "step": 239550 - }, - { - "epoch": 0.42, - "learning_rate": 2.911180711293715e-05, - "loss": 2.3764, - "step": 239560 - }, - { - "epoch": 0.42, - "learning_rate": 2.9110935173010323e-05, - "loss": 2.4595, - "step": 239570 - }, - { - "epoch": 0.42, - "learning_rate": 2.9110063233083494e-05, - "loss": 2.354, - "step": 239580 - }, - { - "epoch": 0.42, - "learning_rate": 2.9109191293156668e-05, - "loss": 2.4047, - "step": 239590 - }, - { - "epoch": 0.42, - "learning_rate": 2.910831935322984e-05, - "loss": 2.4392, - "step": 239600 - }, - { - "epoch": 0.42, - "learning_rate": 2.9107447413303012e-05, - "loss": 2.3576, - "step": 239610 - }, - { - "epoch": 0.42, - "learning_rate": 2.9106575473376186e-05, - "loss": 2.3663, - "step": 239620 - }, - { - "epoch": 0.42, - "learning_rate": 2.9105703533449363e-05, - "loss": 2.4206, - "step": 239630 - }, - { - "epoch": 0.42, - "learning_rate": 2.9104831593522536e-05, - "loss": 2.4841, - "step": 239640 - }, - { - "epoch": 0.42, - "learning_rate": 2.9103959653595707e-05, - "loss": 2.3819, - "step": 239650 - }, - { - "epoch": 0.42, - "learning_rate": 2.910308771366888e-05, - "loss": 2.3399, - "step": 239660 - }, - { - "epoch": 0.42, - "learning_rate": 2.9102215773742054e-05, - "loss": 2.3748, - "step": 239670 - }, - { - "epoch": 0.42, - "learning_rate": 2.9101343833815225e-05, - "loss": 2.4261, - "step": 239680 - }, - { - "epoch": 0.42, - "learning_rate": 2.91004718938884e-05, - "loss": 2.3549, - "step": 239690 - }, - { - "epoch": 0.42, - "learning_rate": 2.9099599953961576e-05, - "loss": 2.3646, - "step": 239700 - }, - { - "epoch": 0.42, - "learning_rate": 2.909872801403475e-05, - "loss": 2.4632, - "step": 239710 - }, - { - "epoch": 0.42, - "learning_rate": 2.909785607410792e-05, - "loss": 2.3731, - "step": 239720 - }, - { - "epoch": 0.42, - "learning_rate": 2.9096984134181094e-05, - "loss": 2.3874, - "step": 239730 - }, - { - "epoch": 0.42, - "learning_rate": 2.9096112194254267e-05, - "loss": 2.4158, - "step": 239740 - }, - { - "epoch": 0.42, - "learning_rate": 2.9095240254327438e-05, - "loss": 2.2808, - "step": 239750 - }, - { - "epoch": 0.42, - "learning_rate": 2.909436831440061e-05, - "loss": 2.441, - "step": 239760 - }, - { - "epoch": 0.42, - "learning_rate": 2.9093496374473782e-05, - "loss": 2.3754, - "step": 239770 - }, - { - "epoch": 0.42, - "learning_rate": 2.9092624434546962e-05, - "loss": 2.3066, - "step": 239780 - }, - { - "epoch": 0.42, - "learning_rate": 2.9091752494620133e-05, - "loss": 2.3698, - "step": 239790 - }, - { - "epoch": 0.42, - "learning_rate": 2.9090880554693307e-05, - "loss": 2.3503, - "step": 239800 - }, - { - "epoch": 0.42, - "learning_rate": 2.9090008614766477e-05, - "loss": 2.4087, - "step": 239810 - }, - { - "epoch": 0.42, - "learning_rate": 2.908913667483965e-05, - "loss": 2.3628, - "step": 239820 - }, - { - "epoch": 0.42, - "learning_rate": 2.9088264734912825e-05, - "loss": 2.4483, - "step": 239830 - }, - { - "epoch": 0.42, - "learning_rate": 2.9087392794985995e-05, - "loss": 2.3699, - "step": 239840 - }, - { - "epoch": 0.42, - "learning_rate": 2.9086520855059175e-05, - "loss": 2.4233, - "step": 239850 - }, - { - "epoch": 0.42, - "learning_rate": 2.9085648915132346e-05, - "loss": 2.3676, - "step": 239860 - }, - { - "epoch": 0.42, - "learning_rate": 2.908477697520552e-05, - "loss": 2.3782, - "step": 239870 - }, - { - "epoch": 0.42, - "learning_rate": 2.908390503527869e-05, - "loss": 2.2704, - "step": 239880 - }, - { - "epoch": 0.42, - "learning_rate": 2.9083033095351864e-05, - "loss": 2.4395, - "step": 239890 - }, - { - "epoch": 0.42, - "learning_rate": 2.9082161155425038e-05, - "loss": 2.2844, - "step": 239900 - }, - { - "epoch": 0.42, - "learning_rate": 2.9081289215498208e-05, - "loss": 2.1865, - "step": 239910 - }, - { - "epoch": 0.42, - "learning_rate": 2.908041727557138e-05, - "loss": 2.4691, - "step": 239920 - }, - { - "epoch": 0.42, - "learning_rate": 2.907954533564456e-05, - "loss": 2.4039, - "step": 239930 - }, - { - "epoch": 0.42, - "learning_rate": 2.9078673395717733e-05, - "loss": 2.3618, - "step": 239940 - }, - { - "epoch": 0.42, - "learning_rate": 2.9077801455790903e-05, - "loss": 2.3784, - "step": 239950 - }, - { - "epoch": 0.42, - "learning_rate": 2.9076929515864077e-05, - "loss": 2.4692, - "step": 239960 - }, - { - "epoch": 0.42, - "learning_rate": 2.907605757593725e-05, - "loss": 2.3593, - "step": 239970 - }, - { - "epoch": 0.42, - "learning_rate": 2.907518563601042e-05, - "loss": 2.4526, - "step": 239980 - }, - { - "epoch": 0.42, - "learning_rate": 2.9074313696083595e-05, - "loss": 2.3641, - "step": 239990 - }, - { - "epoch": 0.42, - "learning_rate": 2.9073441756156772e-05, - "loss": 2.3669, - "step": 240000 - }, - { - "epoch": 0.42, - "learning_rate": 2.9072569816229946e-05, - "loss": 2.4356, - "step": 240010 - }, - { - "epoch": 0.42, - "learning_rate": 2.9071697876303116e-05, - "loss": 2.3789, - "step": 240020 - }, - { - "epoch": 0.42, - "learning_rate": 2.907082593637629e-05, - "loss": 2.2849, - "step": 240030 - }, - { - "epoch": 0.42, - "learning_rate": 2.906995399644946e-05, - "loss": 2.346, - "step": 240040 - }, - { - "epoch": 0.42, - "learning_rate": 2.9069082056522634e-05, - "loss": 2.4042, - "step": 240050 - }, - { - "epoch": 0.42, - "learning_rate": 2.9068210116595808e-05, - "loss": 2.426, - "step": 240060 - }, - { - "epoch": 0.42, - "learning_rate": 2.9067338176668978e-05, - "loss": 2.3516, - "step": 240070 - }, - { - "epoch": 0.42, - "learning_rate": 2.906646623674216e-05, - "loss": 2.3219, - "step": 240080 - }, - { - "epoch": 0.42, - "learning_rate": 2.906559429681533e-05, - "loss": 2.3432, - "step": 240090 - }, - { - "epoch": 0.42, - "learning_rate": 2.9064722356888503e-05, - "loss": 2.3158, - "step": 240100 - }, - { - "epoch": 0.42, - "learning_rate": 2.9063850416961673e-05, - "loss": 2.4156, - "step": 240110 - }, - { - "epoch": 0.42, - "learning_rate": 2.9062978477034847e-05, - "loss": 2.3767, - "step": 240120 - }, - { - "epoch": 0.42, - "learning_rate": 2.906210653710802e-05, - "loss": 2.3017, - "step": 240130 - }, - { - "epoch": 0.42, - "learning_rate": 2.906123459718119e-05, - "loss": 2.5153, - "step": 240140 - }, - { - "epoch": 0.42, - "learning_rate": 2.9060362657254368e-05, - "loss": 2.4824, - "step": 240150 - }, - { - "epoch": 0.42, - "learning_rate": 2.9059490717327542e-05, - "loss": 2.3451, - "step": 240160 - }, - { - "epoch": 0.42, - "learning_rate": 2.9058618777400716e-05, - "loss": 2.2553, - "step": 240170 - }, - { - "epoch": 0.42, - "learning_rate": 2.9057746837473886e-05, - "loss": 2.349, - "step": 240180 - }, - { - "epoch": 0.42, - "learning_rate": 2.905687489754706e-05, - "loss": 2.3836, - "step": 240190 - }, - { - "epoch": 0.42, - "learning_rate": 2.905600295762023e-05, - "loss": 2.4297, - "step": 240200 - }, - { - "epoch": 0.42, - "learning_rate": 2.9055131017693404e-05, - "loss": 2.4146, - "step": 240210 - }, - { - "epoch": 0.42, - "learning_rate": 2.9054259077766578e-05, - "loss": 2.3766, - "step": 240220 - }, - { - "epoch": 0.42, - "learning_rate": 2.9053387137839755e-05, - "loss": 2.2934, - "step": 240230 - }, - { - "epoch": 0.42, - "learning_rate": 2.905251519791293e-05, - "loss": 2.3753, - "step": 240240 - }, - { - "epoch": 0.42, - "learning_rate": 2.90516432579861e-05, - "loss": 2.3743, - "step": 240250 - }, - { - "epoch": 0.42, - "learning_rate": 2.9050771318059273e-05, - "loss": 2.3056, - "step": 240260 - }, - { - "epoch": 0.42, - "learning_rate": 2.9049899378132443e-05, - "loss": 2.4693, - "step": 240270 - }, - { - "epoch": 0.42, - "learning_rate": 2.9049027438205617e-05, - "loss": 2.2917, - "step": 240280 - }, - { - "epoch": 0.42, - "learning_rate": 2.904815549827879e-05, - "loss": 2.2688, - "step": 240290 - }, - { - "epoch": 0.42, - "learning_rate": 2.9047283558351968e-05, - "loss": 2.4809, - "step": 240300 - }, - { - "epoch": 0.42, - "learning_rate": 2.904641161842514e-05, - "loss": 2.3358, - "step": 240310 - }, - { - "epoch": 0.42, - "learning_rate": 2.9045539678498312e-05, - "loss": 2.4659, - "step": 240320 - }, - { - "epoch": 0.42, - "learning_rate": 2.9044667738571486e-05, - "loss": 2.3836, - "step": 240330 - }, - { - "epoch": 0.42, - "learning_rate": 2.9043795798644656e-05, - "loss": 2.3633, - "step": 240340 - }, - { - "epoch": 0.42, - "learning_rate": 2.904292385871783e-05, - "loss": 2.2431, - "step": 240350 - }, - { - "epoch": 0.42, - "learning_rate": 2.9042051918791004e-05, - "loss": 2.3358, - "step": 240360 - }, - { - "epoch": 0.42, - "learning_rate": 2.904117997886418e-05, - "loss": 2.3386, - "step": 240370 - }, - { - "epoch": 0.42, - "learning_rate": 2.904030803893735e-05, - "loss": 2.3953, - "step": 240380 - }, - { - "epoch": 0.42, - "learning_rate": 2.9039436099010525e-05, - "loss": 2.3352, - "step": 240390 - }, - { - "epoch": 0.42, - "learning_rate": 2.90385641590837e-05, - "loss": 2.4012, - "step": 240400 - }, - { - "epoch": 0.42, - "learning_rate": 2.903769221915687e-05, - "loss": 2.3989, - "step": 240410 - }, - { - "epoch": 0.42, - "learning_rate": 2.9036820279230043e-05, - "loss": 2.3692, - "step": 240420 - }, - { - "epoch": 0.42, - "learning_rate": 2.9035948339303213e-05, - "loss": 2.3177, - "step": 240430 - }, - { - "epoch": 0.42, - "learning_rate": 2.9035076399376387e-05, - "loss": 2.3806, - "step": 240440 - }, - { - "epoch": 0.42, - "learning_rate": 2.9034204459449564e-05, - "loss": 2.4321, - "step": 240450 - }, - { - "epoch": 0.42, - "learning_rate": 2.9033332519522738e-05, - "loss": 2.3518, - "step": 240460 - }, - { - "epoch": 0.42, - "learning_rate": 2.9032460579595912e-05, - "loss": 2.4407, - "step": 240470 - }, - { - "epoch": 0.42, - "learning_rate": 2.9031588639669082e-05, - "loss": 2.3587, - "step": 240480 - }, - { - "epoch": 0.42, - "learning_rate": 2.9030716699742256e-05, - "loss": 2.4474, - "step": 240490 - }, - { - "epoch": 0.42, - "learning_rate": 2.9029844759815426e-05, - "loss": 2.4228, - "step": 240500 - }, - { - "epoch": 0.42, - "learning_rate": 2.90289728198886e-05, - "loss": 2.3481, - "step": 240510 - }, - { - "epoch": 0.42, - "learning_rate": 2.9028100879961777e-05, - "loss": 2.3818, - "step": 240520 - }, - { - "epoch": 0.42, - "learning_rate": 2.902722894003495e-05, - "loss": 2.2582, - "step": 240530 - }, - { - "epoch": 0.42, - "learning_rate": 2.902635700010812e-05, - "loss": 2.4116, - "step": 240540 - }, - { - "epoch": 0.42, - "learning_rate": 2.9025485060181295e-05, - "loss": 2.4131, - "step": 240550 - }, - { - "epoch": 0.42, - "learning_rate": 2.902461312025447e-05, - "loss": 2.4273, - "step": 240560 - }, - { - "epoch": 0.42, - "learning_rate": 2.902374118032764e-05, - "loss": 2.418, - "step": 240570 - }, - { - "epoch": 0.42, - "learning_rate": 2.9022869240400813e-05, - "loss": 2.3828, - "step": 240580 - }, - { - "epoch": 0.42, - "learning_rate": 2.9021997300473987e-05, - "loss": 2.3458, - "step": 240590 - }, - { - "epoch": 0.42, - "learning_rate": 2.9021125360547164e-05, - "loss": 2.366, - "step": 240600 - }, - { - "epoch": 0.42, - "learning_rate": 2.9020253420620335e-05, - "loss": 2.4555, - "step": 240610 - }, - { - "epoch": 0.42, - "learning_rate": 2.901938148069351e-05, - "loss": 2.4137, - "step": 240620 - }, - { - "epoch": 0.42, - "learning_rate": 2.9018509540766682e-05, - "loss": 2.1648, - "step": 240630 - }, - { - "epoch": 0.42, - "learning_rate": 2.9017637600839852e-05, - "loss": 2.2962, - "step": 240640 - }, - { - "epoch": 0.42, - "learning_rate": 2.9016765660913026e-05, - "loss": 2.4545, - "step": 240650 - }, - { - "epoch": 0.42, - "learning_rate": 2.9015893720986197e-05, - "loss": 2.5402, - "step": 240660 - }, - { - "epoch": 0.42, - "learning_rate": 2.9015021781059377e-05, - "loss": 2.4916, - "step": 240670 - }, - { - "epoch": 0.42, - "learning_rate": 2.9014149841132548e-05, - "loss": 2.2588, - "step": 240680 - }, - { - "epoch": 0.42, - "learning_rate": 2.901327790120572e-05, - "loss": 2.4678, - "step": 240690 - }, - { - "epoch": 0.42, - "learning_rate": 2.9012405961278895e-05, - "loss": 2.3103, - "step": 240700 - }, - { - "epoch": 0.42, - "learning_rate": 2.9011534021352065e-05, - "loss": 2.3152, - "step": 240710 - }, - { - "epoch": 0.42, - "learning_rate": 2.901066208142524e-05, - "loss": 2.4707, - "step": 240720 - }, - { - "epoch": 0.42, - "learning_rate": 2.900979014149841e-05, - "loss": 2.3653, - "step": 240730 - }, - { - "epoch": 0.42, - "learning_rate": 2.9008918201571583e-05, - "loss": 2.4509, - "step": 240740 - }, - { - "epoch": 0.42, - "learning_rate": 2.900804626164476e-05, - "loss": 2.4814, - "step": 240750 - }, - { - "epoch": 0.42, - "learning_rate": 2.9007174321717934e-05, - "loss": 2.4015, - "step": 240760 - }, - { - "epoch": 0.42, - "learning_rate": 2.9006302381791105e-05, - "loss": 2.3491, - "step": 240770 - }, - { - "epoch": 0.42, - "learning_rate": 2.900543044186428e-05, - "loss": 2.3451, - "step": 240780 - }, - { - "epoch": 0.42, - "learning_rate": 2.9004558501937452e-05, - "loss": 2.4359, - "step": 240790 - }, - { - "epoch": 0.42, - "learning_rate": 2.9003686562010623e-05, - "loss": 2.3662, - "step": 240800 - }, - { - "epoch": 0.42, - "learning_rate": 2.9002814622083796e-05, - "loss": 2.3246, - "step": 240810 - }, - { - "epoch": 0.42, - "learning_rate": 2.9001942682156974e-05, - "loss": 2.4025, - "step": 240820 - }, - { - "epoch": 0.42, - "learning_rate": 2.9001070742230147e-05, - "loss": 2.4356, - "step": 240830 - }, - { - "epoch": 0.42, - "learning_rate": 2.9000198802303318e-05, - "loss": 2.4912, - "step": 240840 - }, - { - "epoch": 0.42, - "learning_rate": 2.899932686237649e-05, - "loss": 2.4188, - "step": 240850 - }, - { - "epoch": 0.42, - "learning_rate": 2.8998454922449665e-05, - "loss": 2.3095, - "step": 240860 - }, - { - "epoch": 0.42, - "learning_rate": 2.8997582982522836e-05, - "loss": 2.5075, - "step": 240870 - }, - { - "epoch": 0.42, - "learning_rate": 2.899671104259601e-05, - "loss": 2.4123, - "step": 240880 - }, - { - "epoch": 0.42, - "learning_rate": 2.899583910266918e-05, - "loss": 2.431, - "step": 240890 - }, - { - "epoch": 0.42, - "learning_rate": 2.899496716274236e-05, - "loss": 2.4141, - "step": 240900 - }, - { - "epoch": 0.42, - "learning_rate": 2.899409522281553e-05, - "loss": 2.3895, - "step": 240910 - }, - { - "epoch": 0.42, - "learning_rate": 2.8993223282888704e-05, - "loss": 2.5775, - "step": 240920 - }, - { - "epoch": 0.42, - "learning_rate": 2.8992351342961875e-05, - "loss": 2.3259, - "step": 240930 - }, - { - "epoch": 0.42, - "learning_rate": 2.899147940303505e-05, - "loss": 2.2832, - "step": 240940 - }, - { - "epoch": 0.42, - "learning_rate": 2.8990607463108222e-05, - "loss": 2.3756, - "step": 240950 - }, - { - "epoch": 0.42, - "learning_rate": 2.8989735523181393e-05, - "loss": 2.3944, - "step": 240960 - }, - { - "epoch": 0.42, - "learning_rate": 2.8988863583254573e-05, - "loss": 2.4668, - "step": 240970 - }, - { - "epoch": 0.42, - "learning_rate": 2.8987991643327744e-05, - "loss": 2.4354, - "step": 240980 - }, - { - "epoch": 0.42, - "learning_rate": 2.8987119703400917e-05, - "loss": 2.355, - "step": 240990 - }, - { - "epoch": 0.42, - "learning_rate": 2.8986247763474088e-05, - "loss": 2.2255, - "step": 241000 - }, - { - "epoch": 0.42, - "learning_rate": 2.898537582354726e-05, - "loss": 2.382, - "step": 241010 - }, - { - "epoch": 0.42, - "learning_rate": 2.8984503883620435e-05, - "loss": 2.396, - "step": 241020 - }, - { - "epoch": 0.42, - "learning_rate": 2.8983631943693606e-05, - "loss": 2.4144, - "step": 241030 - }, - { - "epoch": 0.42, - "learning_rate": 2.8982760003766783e-05, - "loss": 2.3581, - "step": 241040 - }, - { - "epoch": 0.42, - "learning_rate": 2.8981888063839957e-05, - "loss": 2.4143, - "step": 241050 - }, - { - "epoch": 0.42, - "learning_rate": 2.898101612391313e-05, - "loss": 2.3001, - "step": 241060 - }, - { - "epoch": 0.42, - "learning_rate": 2.89801441839863e-05, - "loss": 2.4422, - "step": 241070 - }, - { - "epoch": 0.42, - "learning_rate": 2.8979272244059475e-05, - "loss": 2.4038, - "step": 241080 - }, - { - "epoch": 0.42, - "learning_rate": 2.897840030413265e-05, - "loss": 2.4836, - "step": 241090 - }, - { - "epoch": 0.42, - "learning_rate": 2.897752836420582e-05, - "loss": 2.392, - "step": 241100 - }, - { - "epoch": 0.42, - "learning_rate": 2.8976656424278993e-05, - "loss": 2.311, - "step": 241110 - }, - { - "epoch": 0.42, - "learning_rate": 2.897578448435217e-05, - "loss": 2.4834, - "step": 241120 - }, - { - "epoch": 0.42, - "learning_rate": 2.8974912544425343e-05, - "loss": 2.4569, - "step": 241130 - }, - { - "epoch": 0.42, - "learning_rate": 2.8974040604498514e-05, - "loss": 2.3939, - "step": 241140 - }, - { - "epoch": 0.42, - "learning_rate": 2.8973168664571688e-05, - "loss": 2.3777, - "step": 241150 - }, - { - "epoch": 0.42, - "learning_rate": 2.8972296724644858e-05, - "loss": 2.4384, - "step": 241160 - }, - { - "epoch": 0.42, - "learning_rate": 2.8971424784718032e-05, - "loss": 2.4686, - "step": 241170 - }, - { - "epoch": 0.42, - "learning_rate": 2.8970552844791206e-05, - "loss": 2.3907, - "step": 241180 - }, - { - "epoch": 0.42, - "learning_rate": 2.8969680904864383e-05, - "loss": 2.3792, - "step": 241190 - }, - { - "epoch": 0.42, - "learning_rate": 2.8968808964937556e-05, - "loss": 2.3587, - "step": 241200 - }, - { - "epoch": 0.42, - "learning_rate": 2.8967937025010727e-05, - "loss": 2.3305, - "step": 241210 - }, - { - "epoch": 0.42, - "learning_rate": 2.89670650850839e-05, - "loss": 2.3412, - "step": 241220 - }, - { - "epoch": 0.42, - "learning_rate": 2.896619314515707e-05, - "loss": 2.4129, - "step": 241230 - }, - { - "epoch": 0.42, - "learning_rate": 2.8965321205230245e-05, - "loss": 2.5495, - "step": 241240 - }, - { - "epoch": 0.42, - "learning_rate": 2.896444926530342e-05, - "loss": 2.2836, - "step": 241250 - }, - { - "epoch": 0.42, - "learning_rate": 2.896357732537659e-05, - "loss": 2.3903, - "step": 241260 - }, - { - "epoch": 0.42, - "learning_rate": 2.8962705385449766e-05, - "loss": 2.3419, - "step": 241270 - }, - { - "epoch": 0.42, - "learning_rate": 2.896183344552294e-05, - "loss": 2.3215, - "step": 241280 - }, - { - "epoch": 0.42, - "learning_rate": 2.8960961505596114e-05, - "loss": 2.3772, - "step": 241290 - }, - { - "epoch": 0.42, - "learning_rate": 2.8960089565669284e-05, - "loss": 2.4587, - "step": 241300 - }, - { - "epoch": 0.42, - "learning_rate": 2.8959217625742458e-05, - "loss": 2.4961, - "step": 241310 - }, - { - "epoch": 0.42, - "learning_rate": 2.895834568581563e-05, - "loss": 2.4115, - "step": 241320 - }, - { - "epoch": 0.42, - "learning_rate": 2.8957473745888802e-05, - "loss": 2.3678, - "step": 241330 - }, - { - "epoch": 0.42, - "learning_rate": 2.895660180596198e-05, - "loss": 2.4734, - "step": 241340 - }, - { - "epoch": 0.42, - "learning_rate": 2.8955729866035153e-05, - "loss": 2.3316, - "step": 241350 - }, - { - "epoch": 0.42, - "learning_rate": 2.8954857926108327e-05, - "loss": 2.4115, - "step": 241360 - }, - { - "epoch": 0.42, - "learning_rate": 2.8953985986181497e-05, - "loss": 2.3587, - "step": 241370 - }, - { - "epoch": 0.42, - "learning_rate": 2.895311404625467e-05, - "loss": 2.452, - "step": 241380 - }, - { - "epoch": 0.42, - "learning_rate": 2.895224210632784e-05, - "loss": 2.4767, - "step": 241390 - }, - { - "epoch": 0.42, - "learning_rate": 2.8951370166401015e-05, - "loss": 2.4583, - "step": 241400 - }, - { - "epoch": 0.42, - "learning_rate": 2.895049822647419e-05, - "loss": 2.4032, - "step": 241410 - }, - { - "epoch": 0.42, - "learning_rate": 2.8949626286547366e-05, - "loss": 2.4183, - "step": 241420 - }, - { - "epoch": 0.42, - "learning_rate": 2.894875434662054e-05, - "loss": 2.4216, - "step": 241430 - }, - { - "epoch": 0.42, - "learning_rate": 2.894788240669371e-05, - "loss": 2.4068, - "step": 241440 - }, - { - "epoch": 0.42, - "learning_rate": 2.8947010466766884e-05, - "loss": 2.3032, - "step": 241450 - }, - { - "epoch": 0.42, - "learning_rate": 2.8946138526840054e-05, - "loss": 2.3408, - "step": 241460 - }, - { - "epoch": 0.42, - "learning_rate": 2.8945266586913228e-05, - "loss": 2.3889, - "step": 241470 - }, - { - "epoch": 0.42, - "learning_rate": 2.8944394646986402e-05, - "loss": 2.3249, - "step": 241480 - }, - { - "epoch": 0.42, - "learning_rate": 2.894352270705958e-05, - "loss": 2.4366, - "step": 241490 - }, - { - "epoch": 0.42, - "learning_rate": 2.894265076713275e-05, - "loss": 2.4657, - "step": 241500 - }, - { - "epoch": 0.42, - "learning_rate": 2.8941778827205923e-05, - "loss": 2.1678, - "step": 241510 - }, - { - "epoch": 0.42, - "learning_rate": 2.8940906887279097e-05, - "loss": 2.3895, - "step": 241520 - }, - { - "epoch": 0.42, - "learning_rate": 2.8940034947352267e-05, - "loss": 2.4347, - "step": 241530 - }, - { - "epoch": 0.42, - "learning_rate": 2.893916300742544e-05, - "loss": 2.324, - "step": 241540 - }, - { - "epoch": 0.42, - "learning_rate": 2.893829106749861e-05, - "loss": 2.3881, - "step": 241550 - }, - { - "epoch": 0.42, - "learning_rate": 2.8937419127571792e-05, - "loss": 2.4041, - "step": 241560 - }, - { - "epoch": 0.42, - "learning_rate": 2.8936547187644962e-05, - "loss": 2.3731, - "step": 241570 - }, - { - "epoch": 0.42, - "learning_rate": 2.8935675247718136e-05, - "loss": 2.3649, - "step": 241580 - }, - { - "epoch": 0.42, - "learning_rate": 2.893480330779131e-05, - "loss": 2.3051, - "step": 241590 - }, - { - "epoch": 0.42, - "learning_rate": 2.893393136786448e-05, - "loss": 2.3653, - "step": 241600 - }, - { - "epoch": 0.42, - "learning_rate": 2.8933059427937654e-05, - "loss": 2.4003, - "step": 241610 - }, - { - "epoch": 0.42, - "learning_rate": 2.8932187488010824e-05, - "loss": 2.2698, - "step": 241620 - }, - { - "epoch": 0.42, - "learning_rate": 2.8931315548083998e-05, - "loss": 2.4317, - "step": 241630 - }, - { - "epoch": 0.42, - "learning_rate": 2.8930443608157175e-05, - "loss": 2.3491, - "step": 241640 - }, - { - "epoch": 0.42, - "learning_rate": 2.892957166823035e-05, - "loss": 2.2708, - "step": 241650 - }, - { - "epoch": 0.42, - "learning_rate": 2.892869972830352e-05, - "loss": 2.4342, - "step": 241660 - }, - { - "epoch": 0.42, - "learning_rate": 2.8927827788376693e-05, - "loss": 2.2411, - "step": 241670 - }, - { - "epoch": 0.42, - "learning_rate": 2.8926955848449867e-05, - "loss": 2.2845, - "step": 241680 - }, - { - "epoch": 0.42, - "learning_rate": 2.8926083908523037e-05, - "loss": 2.3812, - "step": 241690 - }, - { - "epoch": 0.42, - "learning_rate": 2.892521196859621e-05, - "loss": 2.3819, - "step": 241700 - }, - { - "epoch": 0.42, - "learning_rate": 2.8924340028669388e-05, - "loss": 2.3931, - "step": 241710 - }, - { - "epoch": 0.42, - "learning_rate": 2.8923468088742562e-05, - "loss": 2.3681, - "step": 241720 - }, - { - "epoch": 0.42, - "learning_rate": 2.8922596148815732e-05, - "loss": 2.3741, - "step": 241730 - }, - { - "epoch": 0.42, - "learning_rate": 2.8921724208888906e-05, - "loss": 2.4586, - "step": 241740 - }, - { - "epoch": 0.42, - "learning_rate": 2.892085226896208e-05, - "loss": 2.473, - "step": 241750 - }, - { - "epoch": 0.42, - "learning_rate": 2.891998032903525e-05, - "loss": 2.4593, - "step": 241760 - }, - { - "epoch": 0.42, - "learning_rate": 2.8919108389108424e-05, - "loss": 2.391, - "step": 241770 - }, - { - "epoch": 0.42, - "learning_rate": 2.8918236449181594e-05, - "loss": 2.3853, - "step": 241780 - }, - { - "epoch": 0.42, - "learning_rate": 2.8917364509254775e-05, - "loss": 2.3438, - "step": 241790 - }, - { - "epoch": 0.42, - "learning_rate": 2.8916492569327945e-05, - "loss": 2.2576, - "step": 241800 - }, - { - "epoch": 0.42, - "learning_rate": 2.891562062940112e-05, - "loss": 2.4046, - "step": 241810 - }, - { - "epoch": 0.42, - "learning_rate": 2.8914748689474293e-05, - "loss": 2.4632, - "step": 241820 - }, - { - "epoch": 0.42, - "learning_rate": 2.8913876749547463e-05, - "loss": 2.5135, - "step": 241830 - }, - { - "epoch": 0.42, - "learning_rate": 2.8913004809620637e-05, - "loss": 2.3869, - "step": 241840 - }, - { - "epoch": 0.42, - "learning_rate": 2.8912132869693807e-05, - "loss": 2.4262, - "step": 241850 - }, - { - "epoch": 0.42, - "learning_rate": 2.8911260929766988e-05, - "loss": 2.323, - "step": 241860 - }, - { - "epoch": 0.42, - "learning_rate": 2.891038898984016e-05, - "loss": 2.3039, - "step": 241870 - }, - { - "epoch": 0.42, - "learning_rate": 2.8909517049913332e-05, - "loss": 2.3628, - "step": 241880 - }, - { - "epoch": 0.42, - "learning_rate": 2.8908645109986503e-05, - "loss": 2.3529, - "step": 241890 - }, - { - "epoch": 0.42, - "learning_rate": 2.8907773170059676e-05, - "loss": 2.3706, - "step": 241900 - }, - { - "epoch": 0.42, - "learning_rate": 2.890690123013285e-05, - "loss": 2.4442, - "step": 241910 - }, - { - "epoch": 0.42, - "learning_rate": 2.890602929020602e-05, - "loss": 2.384, - "step": 241920 - }, - { - "epoch": 0.42, - "learning_rate": 2.8905157350279194e-05, - "loss": 2.3146, - "step": 241930 - }, - { - "epoch": 0.42, - "learning_rate": 2.890428541035237e-05, - "loss": 2.4703, - "step": 241940 - }, - { - "epoch": 0.42, - "learning_rate": 2.8903413470425545e-05, - "loss": 2.3793, - "step": 241950 - }, - { - "epoch": 0.42, - "learning_rate": 2.8902541530498716e-05, - "loss": 2.2795, - "step": 241960 - }, - { - "epoch": 0.42, - "learning_rate": 2.890166959057189e-05, - "loss": 2.454, - "step": 241970 - }, - { - "epoch": 0.42, - "learning_rate": 2.8900797650645063e-05, - "loss": 2.4617, - "step": 241980 - }, - { - "epoch": 0.42, - "learning_rate": 2.8899925710718233e-05, - "loss": 2.3187, - "step": 241990 - }, - { - "epoch": 0.42, - "learning_rate": 2.8899053770791407e-05, - "loss": 2.3894, - "step": 242000 - }, - { - "epoch": 0.42, - "learning_rate": 2.8898181830864584e-05, - "loss": 2.4151, - "step": 242010 - }, - { - "epoch": 0.42, - "learning_rate": 2.8897309890937758e-05, - "loss": 2.3255, - "step": 242020 - }, - { - "epoch": 0.42, - "learning_rate": 2.889643795101093e-05, - "loss": 2.4189, - "step": 242030 - }, - { - "epoch": 0.42, - "learning_rate": 2.8895566011084102e-05, - "loss": 2.46, - "step": 242040 - }, - { - "epoch": 0.42, - "learning_rate": 2.8894694071157276e-05, - "loss": 2.5091, - "step": 242050 - }, - { - "epoch": 0.42, - "learning_rate": 2.8893822131230446e-05, - "loss": 2.2513, - "step": 242060 - }, - { - "epoch": 0.42, - "learning_rate": 2.889295019130362e-05, - "loss": 2.3531, - "step": 242070 - }, - { - "epoch": 0.42, - "learning_rate": 2.889207825137679e-05, - "loss": 2.401, - "step": 242080 - }, - { - "epoch": 0.42, - "learning_rate": 2.889120631144997e-05, - "loss": 2.5523, - "step": 242090 - }, - { - "epoch": 0.42, - "learning_rate": 2.889033437152314e-05, - "loss": 2.3241, - "step": 242100 - }, - { - "epoch": 0.42, - "learning_rate": 2.8889462431596315e-05, - "loss": 2.4944, - "step": 242110 - }, - { - "epoch": 0.42, - "learning_rate": 2.8888590491669486e-05, - "loss": 2.4952, - "step": 242120 - }, - { - "epoch": 0.42, - "learning_rate": 2.888771855174266e-05, - "loss": 2.3205, - "step": 242130 - }, - { - "epoch": 0.42, - "learning_rate": 2.8886846611815833e-05, - "loss": 2.3551, - "step": 242140 - }, - { - "epoch": 0.42, - "learning_rate": 2.8885974671889004e-05, - "loss": 2.338, - "step": 242150 - }, - { - "epoch": 0.42, - "learning_rate": 2.8885102731962184e-05, - "loss": 2.4834, - "step": 242160 - }, - { - "epoch": 0.42, - "learning_rate": 2.8884230792035355e-05, - "loss": 2.3835, - "step": 242170 - }, - { - "epoch": 0.42, - "learning_rate": 2.888335885210853e-05, - "loss": 2.3037, - "step": 242180 - }, - { - "epoch": 0.42, - "learning_rate": 2.88824869121817e-05, - "loss": 2.3879, - "step": 242190 - }, - { - "epoch": 0.42, - "learning_rate": 2.8881614972254872e-05, - "loss": 2.2975, - "step": 242200 - }, - { - "epoch": 0.42, - "learning_rate": 2.8880743032328046e-05, - "loss": 2.263, - "step": 242210 - }, - { - "epoch": 0.42, - "learning_rate": 2.8879871092401217e-05, - "loss": 2.4665, - "step": 242220 - }, - { - "epoch": 0.42, - "learning_rate": 2.8878999152474394e-05, - "loss": 2.3564, - "step": 242230 - }, - { - "epoch": 0.42, - "learning_rate": 2.8878127212547568e-05, - "loss": 2.4907, - "step": 242240 - }, - { - "epoch": 0.42, - "learning_rate": 2.887725527262074e-05, - "loss": 2.4327, - "step": 242250 - }, - { - "epoch": 0.42, - "learning_rate": 2.8876383332693912e-05, - "loss": 2.3898, - "step": 242260 - }, - { - "epoch": 0.42, - "learning_rate": 2.8875511392767085e-05, - "loss": 2.4311, - "step": 242270 - }, - { - "epoch": 0.42, - "learning_rate": 2.8874639452840256e-05, - "loss": 2.3433, - "step": 242280 - }, - { - "epoch": 0.42, - "learning_rate": 2.887376751291343e-05, - "loss": 2.4013, - "step": 242290 - }, - { - "epoch": 0.42, - "learning_rate": 2.8872895572986603e-05, - "loss": 2.3672, - "step": 242300 - }, - { - "epoch": 0.42, - "learning_rate": 2.887202363305978e-05, - "loss": 2.3554, - "step": 242310 - }, - { - "epoch": 0.42, - "learning_rate": 2.8871151693132954e-05, - "loss": 2.3816, - "step": 242320 - }, - { - "epoch": 0.42, - "learning_rate": 2.8870279753206125e-05, - "loss": 2.4294, - "step": 242330 - }, - { - "epoch": 0.42, - "learning_rate": 2.88694078132793e-05, - "loss": 2.2984, - "step": 242340 - }, - { - "epoch": 0.42, - "learning_rate": 2.886853587335247e-05, - "loss": 2.4283, - "step": 242350 - }, - { - "epoch": 0.42, - "learning_rate": 2.8867663933425643e-05, - "loss": 2.4723, - "step": 242360 - }, - { - "epoch": 0.42, - "learning_rate": 2.8866791993498816e-05, - "loss": 2.2865, - "step": 242370 - }, - { - "epoch": 0.42, - "learning_rate": 2.8865920053571994e-05, - "loss": 2.3549, - "step": 242380 - }, - { - "epoch": 0.42, - "learning_rate": 2.8865048113645164e-05, - "loss": 2.4292, - "step": 242390 - }, - { - "epoch": 0.42, - "learning_rate": 2.8864176173718338e-05, - "loss": 2.3625, - "step": 242400 - }, - { - "epoch": 0.42, - "learning_rate": 2.886330423379151e-05, - "loss": 2.4159, - "step": 242410 - }, - { - "epoch": 0.42, - "learning_rate": 2.8862432293864682e-05, - "loss": 2.3699, - "step": 242420 - }, - { - "epoch": 0.42, - "learning_rate": 2.8861560353937856e-05, - "loss": 2.3532, - "step": 242430 - }, - { - "epoch": 0.42, - "learning_rate": 2.886068841401103e-05, - "loss": 2.386, - "step": 242440 - }, - { - "epoch": 0.42, - "learning_rate": 2.88598164740842e-05, - "loss": 2.3499, - "step": 242450 - }, - { - "epoch": 0.42, - "learning_rate": 2.8858944534157377e-05, - "loss": 2.3977, - "step": 242460 - }, - { - "epoch": 0.42, - "learning_rate": 2.885807259423055e-05, - "loss": 2.421, - "step": 242470 - }, - { - "epoch": 0.42, - "learning_rate": 2.8857200654303724e-05, - "loss": 2.4267, - "step": 242480 - }, - { - "epoch": 0.42, - "learning_rate": 2.8856328714376895e-05, - "loss": 2.3816, - "step": 242490 - }, - { - "epoch": 0.42, - "learning_rate": 2.885545677445007e-05, - "loss": 2.3375, - "step": 242500 - }, - { - "epoch": 0.42, - "learning_rate": 2.885458483452324e-05, - "loss": 2.2383, - "step": 242510 - }, - { - "epoch": 0.42, - "learning_rate": 2.8853712894596413e-05, - "loss": 2.2448, - "step": 242520 - }, - { - "epoch": 0.42, - "learning_rate": 2.885284095466959e-05, - "loss": 2.3694, - "step": 242530 - }, - { - "epoch": 0.42, - "learning_rate": 2.8851969014742764e-05, - "loss": 2.4244, - "step": 242540 - }, - { - "epoch": 0.42, - "learning_rate": 2.8851097074815937e-05, - "loss": 2.4918, - "step": 242550 - }, - { - "epoch": 0.42, - "learning_rate": 2.8850225134889108e-05, - "loss": 2.5298, - "step": 242560 - }, - { - "epoch": 0.42, - "learning_rate": 2.884935319496228e-05, - "loss": 2.384, - "step": 242570 - }, - { - "epoch": 0.42, - "learning_rate": 2.8848481255035452e-05, - "loss": 2.447, - "step": 242580 - }, - { - "epoch": 0.42, - "learning_rate": 2.8847609315108626e-05, - "loss": 2.3172, - "step": 242590 - }, - { - "epoch": 0.42, - "learning_rate": 2.88467373751818e-05, - "loss": 2.2151, - "step": 242600 - }, - { - "epoch": 0.42, - "learning_rate": 2.8845865435254977e-05, - "loss": 2.3292, - "step": 242610 - }, - { - "epoch": 0.42, - "learning_rate": 2.8844993495328147e-05, - "loss": 2.3937, - "step": 242620 - }, - { - "epoch": 0.42, - "learning_rate": 2.884412155540132e-05, - "loss": 2.2716, - "step": 242630 - }, - { - "epoch": 0.42, - "learning_rate": 2.8843249615474495e-05, - "loss": 2.4902, - "step": 242640 - }, - { - "epoch": 0.42, - "learning_rate": 2.8842377675547665e-05, - "loss": 2.3741, - "step": 242650 - }, - { - "epoch": 0.42, - "learning_rate": 2.884150573562084e-05, - "loss": 2.4248, - "step": 242660 - }, - { - "epoch": 0.42, - "learning_rate": 2.8840633795694013e-05, - "loss": 2.3473, - "step": 242670 - }, - { - "epoch": 0.42, - "learning_rate": 2.883976185576719e-05, - "loss": 2.3329, - "step": 242680 - }, - { - "epoch": 0.42, - "learning_rate": 2.883888991584036e-05, - "loss": 2.2839, - "step": 242690 - }, - { - "epoch": 0.42, - "learning_rate": 2.8838017975913534e-05, - "loss": 2.3774, - "step": 242700 - }, - { - "epoch": 0.42, - "learning_rate": 2.8837146035986708e-05, - "loss": 2.2626, - "step": 242710 - }, - { - "epoch": 0.42, - "learning_rate": 2.8836274096059878e-05, - "loss": 2.2615, - "step": 242720 - }, - { - "epoch": 0.42, - "learning_rate": 2.8835402156133052e-05, - "loss": 2.3267, - "step": 242730 - }, - { - "epoch": 0.42, - "learning_rate": 2.8834530216206222e-05, - "loss": 2.4299, - "step": 242740 - }, - { - "epoch": 0.42, - "learning_rate": 2.8833658276279396e-05, - "loss": 2.3517, - "step": 242750 - }, - { - "epoch": 0.42, - "learning_rate": 2.8832786336352573e-05, - "loss": 2.2856, - "step": 242760 - }, - { - "epoch": 0.42, - "learning_rate": 2.8831914396425747e-05, - "loss": 2.3651, - "step": 242770 - }, - { - "epoch": 0.42, - "learning_rate": 2.883104245649892e-05, - "loss": 2.4572, - "step": 242780 - }, - { - "epoch": 0.42, - "learning_rate": 2.883017051657209e-05, - "loss": 2.339, - "step": 242790 - }, - { - "epoch": 0.42, - "learning_rate": 2.8829298576645265e-05, - "loss": 2.4179, - "step": 242800 - }, - { - "epoch": 0.42, - "learning_rate": 2.8828426636718435e-05, - "loss": 2.3583, - "step": 242810 - }, - { - "epoch": 0.42, - "learning_rate": 2.882755469679161e-05, - "loss": 2.3792, - "step": 242820 - }, - { - "epoch": 0.42, - "learning_rate": 2.8826682756864786e-05, - "loss": 2.4316, - "step": 242830 - }, - { - "epoch": 0.42, - "learning_rate": 2.882581081693796e-05, - "loss": 2.4264, - "step": 242840 - }, - { - "epoch": 0.42, - "learning_rate": 2.882493887701113e-05, - "loss": 2.3819, - "step": 242850 - }, - { - "epoch": 0.42, - "learning_rate": 2.8824066937084304e-05, - "loss": 2.4002, - "step": 242860 - }, - { - "epoch": 0.42, - "learning_rate": 2.8823194997157478e-05, - "loss": 2.4763, - "step": 242870 - }, - { - "epoch": 0.42, - "learning_rate": 2.8822323057230648e-05, - "loss": 2.408, - "step": 242880 - }, - { - "epoch": 0.42, - "learning_rate": 2.8821451117303822e-05, - "loss": 2.3874, - "step": 242890 - }, - { - "epoch": 0.42, - "learning_rate": 2.8820579177377e-05, - "loss": 2.262, - "step": 242900 - }, - { - "epoch": 0.42, - "learning_rate": 2.8819707237450173e-05, - "loss": 2.3515, - "step": 242910 - }, - { - "epoch": 0.42, - "learning_rate": 2.8818835297523343e-05, - "loss": 2.5326, - "step": 242920 - }, - { - "epoch": 0.42, - "learning_rate": 2.8817963357596517e-05, - "loss": 2.5119, - "step": 242930 - }, - { - "epoch": 0.42, - "learning_rate": 2.881709141766969e-05, - "loss": 2.4481, - "step": 242940 - }, - { - "epoch": 0.42, - "learning_rate": 2.881621947774286e-05, - "loss": 2.4358, - "step": 242950 - }, - { - "epoch": 0.42, - "learning_rate": 2.8815347537816035e-05, - "loss": 2.339, - "step": 242960 - }, - { - "epoch": 0.42, - "learning_rate": 2.8814475597889205e-05, - "loss": 2.2429, - "step": 242970 - }, - { - "epoch": 0.42, - "learning_rate": 2.8813603657962386e-05, - "loss": 2.4893, - "step": 242980 - }, - { - "epoch": 0.42, - "learning_rate": 2.8812731718035556e-05, - "loss": 2.3094, - "step": 242990 - }, - { - "epoch": 0.42, - "learning_rate": 2.881185977810873e-05, - "loss": 2.2788, - "step": 243000 - }, - { - "epoch": 0.42, - "learning_rate": 2.88109878381819e-05, - "loss": 2.3976, - "step": 243010 - }, - { - "epoch": 0.42, - "learning_rate": 2.8810115898255074e-05, - "loss": 2.2593, - "step": 243020 - }, - { - "epoch": 0.42, - "learning_rate": 2.8809243958328248e-05, - "loss": 2.3883, - "step": 243030 - }, - { - "epoch": 0.42, - "learning_rate": 2.880837201840142e-05, - "loss": 2.391, - "step": 243040 - }, - { - "epoch": 0.42, - "learning_rate": 2.88075000784746e-05, - "loss": 2.4815, - "step": 243050 - }, - { - "epoch": 0.42, - "learning_rate": 2.880662813854777e-05, - "loss": 2.5227, - "step": 243060 - }, - { - "epoch": 0.42, - "learning_rate": 2.8805756198620943e-05, - "loss": 2.4929, - "step": 243070 - }, - { - "epoch": 0.42, - "learning_rate": 2.8804884258694113e-05, - "loss": 2.3404, - "step": 243080 - }, - { - "epoch": 0.42, - "learning_rate": 2.8804012318767287e-05, - "loss": 2.3832, - "step": 243090 - }, - { - "epoch": 0.42, - "learning_rate": 2.880314037884046e-05, - "loss": 2.3447, - "step": 243100 - }, - { - "epoch": 0.42, - "learning_rate": 2.880226843891363e-05, - "loss": 2.3747, - "step": 243110 - }, - { - "epoch": 0.42, - "learning_rate": 2.8801396498986805e-05, - "loss": 2.4929, - "step": 243120 - }, - { - "epoch": 0.42, - "learning_rate": 2.8800524559059982e-05, - "loss": 2.417, - "step": 243130 - }, - { - "epoch": 0.42, - "learning_rate": 2.8799652619133156e-05, - "loss": 2.4128, - "step": 243140 - }, - { - "epoch": 0.42, - "learning_rate": 2.8798780679206326e-05, - "loss": 2.2712, - "step": 243150 - }, - { - "epoch": 0.42, - "learning_rate": 2.87979087392795e-05, - "loss": 2.2602, - "step": 243160 - }, - { - "epoch": 0.42, - "learning_rate": 2.8797036799352674e-05, - "loss": 2.2729, - "step": 243170 - }, - { - "epoch": 0.42, - "learning_rate": 2.8796164859425844e-05, - "loss": 2.4664, - "step": 243180 - }, - { - "epoch": 0.42, - "learning_rate": 2.8795292919499018e-05, - "loss": 2.3744, - "step": 243190 - }, - { - "epoch": 0.42, - "learning_rate": 2.8794420979572195e-05, - "loss": 2.352, - "step": 243200 - }, - { - "epoch": 0.42, - "learning_rate": 2.879354903964537e-05, - "loss": 2.372, - "step": 243210 - }, - { - "epoch": 0.42, - "learning_rate": 2.879267709971854e-05, - "loss": 2.3551, - "step": 243220 - }, - { - "epoch": 0.42, - "learning_rate": 2.8791805159791713e-05, - "loss": 2.3261, - "step": 243230 - }, - { - "epoch": 0.42, - "learning_rate": 2.8790933219864884e-05, - "loss": 2.4232, - "step": 243240 - }, - { - "epoch": 0.42, - "learning_rate": 2.8790061279938057e-05, - "loss": 2.3877, - "step": 243250 - }, - { - "epoch": 0.42, - "learning_rate": 2.878918934001123e-05, - "loss": 2.3462, - "step": 243260 - }, - { - "epoch": 0.42, - "learning_rate": 2.87883174000844e-05, - "loss": 2.3924, - "step": 243270 - }, - { - "epoch": 0.42, - "learning_rate": 2.8787445460157582e-05, - "loss": 2.3917, - "step": 243280 - }, - { - "epoch": 0.42, - "learning_rate": 2.8786573520230752e-05, - "loss": 2.5033, - "step": 243290 - }, - { - "epoch": 0.42, - "learning_rate": 2.8785701580303926e-05, - "loss": 2.4202, - "step": 243300 - }, - { - "epoch": 0.42, - "learning_rate": 2.8784829640377097e-05, - "loss": 2.3099, - "step": 243310 - }, - { - "epoch": 0.42, - "learning_rate": 2.878395770045027e-05, - "loss": 2.3687, - "step": 243320 - }, - { - "epoch": 0.42, - "learning_rate": 2.8783085760523444e-05, - "loss": 2.3328, - "step": 243330 - }, - { - "epoch": 0.42, - "learning_rate": 2.8782213820596614e-05, - "loss": 2.3834, - "step": 243340 - }, - { - "epoch": 0.42, - "learning_rate": 2.878134188066979e-05, - "loss": 2.2959, - "step": 243350 - }, - { - "epoch": 0.42, - "learning_rate": 2.8780469940742965e-05, - "loss": 2.4275, - "step": 243360 - }, - { - "epoch": 0.42, - "learning_rate": 2.877959800081614e-05, - "loss": 2.3651, - "step": 243370 - }, - { - "epoch": 0.42, - "learning_rate": 2.877872606088931e-05, - "loss": 2.361, - "step": 243380 - }, - { - "epoch": 0.42, - "learning_rate": 2.8777854120962483e-05, - "loss": 2.387, - "step": 243390 - }, - { - "epoch": 0.42, - "learning_rate": 2.8776982181035657e-05, - "loss": 2.3448, - "step": 243400 - }, - { - "epoch": 0.42, - "learning_rate": 2.8776110241108827e-05, - "loss": 2.3447, - "step": 243410 - }, - { - "epoch": 0.42, - "learning_rate": 2.8775238301182e-05, - "loss": 2.404, - "step": 243420 - }, - { - "epoch": 0.42, - "learning_rate": 2.877436636125518e-05, - "loss": 2.3214, - "step": 243430 - }, - { - "epoch": 0.42, - "learning_rate": 2.8773494421328352e-05, - "loss": 2.397, - "step": 243440 - }, - { - "epoch": 0.42, - "learning_rate": 2.8772622481401523e-05, - "loss": 2.3086, - "step": 243450 - }, - { - "epoch": 0.42, - "learning_rate": 2.8771750541474696e-05, - "loss": 2.3473, - "step": 243460 - }, - { - "epoch": 0.42, - "learning_rate": 2.8770878601547867e-05, - "loss": 2.2899, - "step": 243470 - }, - { - "epoch": 0.42, - "learning_rate": 2.877000666162104e-05, - "loss": 2.3985, - "step": 243480 - }, - { - "epoch": 0.42, - "learning_rate": 2.8769134721694214e-05, - "loss": 2.4717, - "step": 243490 - }, - { - "epoch": 0.42, - "learning_rate": 2.876826278176739e-05, - "loss": 2.5098, - "step": 243500 - }, - { - "epoch": 0.42, - "learning_rate": 2.8767390841840565e-05, - "loss": 2.4205, - "step": 243510 - }, - { - "epoch": 0.42, - "learning_rate": 2.8766518901913736e-05, - "loss": 2.33, - "step": 243520 - }, - { - "epoch": 0.42, - "learning_rate": 2.876564696198691e-05, - "loss": 2.302, - "step": 243530 - }, - { - "epoch": 0.42, - "learning_rate": 2.876477502206008e-05, - "loss": 2.3307, - "step": 243540 - }, - { - "epoch": 0.42, - "learning_rate": 2.8763903082133253e-05, - "loss": 2.3921, - "step": 243550 - }, - { - "epoch": 0.42, - "learning_rate": 2.8763031142206427e-05, - "loss": 2.385, - "step": 243560 - }, - { - "epoch": 0.42, - "learning_rate": 2.8762159202279604e-05, - "loss": 2.422, - "step": 243570 - }, - { - "epoch": 0.42, - "learning_rate": 2.8761287262352775e-05, - "loss": 2.272, - "step": 243580 - }, - { - "epoch": 0.42, - "learning_rate": 2.876041532242595e-05, - "loss": 2.3894, - "step": 243590 - }, - { - "epoch": 0.42, - "learning_rate": 2.8759543382499122e-05, - "loss": 2.3781, - "step": 243600 - }, - { - "epoch": 0.42, - "learning_rate": 2.8758671442572293e-05, - "loss": 2.486, - "step": 243610 - }, - { - "epoch": 0.42, - "learning_rate": 2.8757799502645466e-05, - "loss": 2.377, - "step": 243620 - }, - { - "epoch": 0.42, - "learning_rate": 2.8756927562718637e-05, - "loss": 2.3293, - "step": 243630 - }, - { - "epoch": 0.42, - "learning_rate": 2.875605562279181e-05, - "loss": 2.4007, - "step": 243640 - }, - { - "epoch": 0.42, - "learning_rate": 2.8755183682864988e-05, - "loss": 2.2327, - "step": 243650 - }, - { - "epoch": 0.42, - "learning_rate": 2.875431174293816e-05, - "loss": 2.4741, - "step": 243660 - }, - { - "epoch": 0.42, - "learning_rate": 2.8753439803011335e-05, - "loss": 2.4451, - "step": 243670 - }, - { - "epoch": 0.42, - "learning_rate": 2.8752567863084506e-05, - "loss": 2.3866, - "step": 243680 - }, - { - "epoch": 0.42, - "learning_rate": 2.875169592315768e-05, - "loss": 2.4598, - "step": 243690 - }, - { - "epoch": 0.42, - "learning_rate": 2.875082398323085e-05, - "loss": 2.4917, - "step": 243700 - }, - { - "epoch": 0.43, - "learning_rate": 2.8749952043304024e-05, - "loss": 2.2569, - "step": 243710 - }, - { - "epoch": 0.43, - "learning_rate": 2.87490801033772e-05, - "loss": 2.355, - "step": 243720 - }, - { - "epoch": 0.43, - "learning_rate": 2.8748208163450375e-05, - "loss": 2.3995, - "step": 243730 - }, - { - "epoch": 0.43, - "learning_rate": 2.8747336223523545e-05, - "loss": 2.4082, - "step": 243740 - }, - { - "epoch": 0.43, - "learning_rate": 2.874646428359672e-05, - "loss": 2.3837, - "step": 243750 - }, - { - "epoch": 0.43, - "learning_rate": 2.8745592343669892e-05, - "loss": 2.2877, - "step": 243760 - }, - { - "epoch": 0.43, - "learning_rate": 2.8744720403743063e-05, - "loss": 2.4297, - "step": 243770 - }, - { - "epoch": 0.43, - "learning_rate": 2.8743848463816237e-05, - "loss": 2.3633, - "step": 243780 - }, - { - "epoch": 0.43, - "learning_rate": 2.874297652388941e-05, - "loss": 2.3723, - "step": 243790 - }, - { - "epoch": 0.43, - "learning_rate": 2.8742104583962588e-05, - "loss": 2.4662, - "step": 243800 - }, - { - "epoch": 0.43, - "learning_rate": 2.8741232644035758e-05, - "loss": 2.3443, - "step": 243810 - }, - { - "epoch": 0.43, - "learning_rate": 2.8740360704108932e-05, - "loss": 2.3372, - "step": 243820 - }, - { - "epoch": 0.43, - "learning_rate": 2.8739488764182105e-05, - "loss": 2.4123, - "step": 243830 - }, - { - "epoch": 0.43, - "learning_rate": 2.8738616824255276e-05, - "loss": 2.5435, - "step": 243840 - }, - { - "epoch": 0.43, - "learning_rate": 2.873774488432845e-05, - "loss": 2.428, - "step": 243850 - }, - { - "epoch": 0.43, - "learning_rate": 2.873687294440162e-05, - "loss": 2.5078, - "step": 243860 - }, - { - "epoch": 0.43, - "learning_rate": 2.87360010044748e-05, - "loss": 2.3218, - "step": 243870 - }, - { - "epoch": 0.43, - "learning_rate": 2.873512906454797e-05, - "loss": 2.4922, - "step": 243880 - }, - { - "epoch": 0.43, - "learning_rate": 2.8734257124621145e-05, - "loss": 2.2812, - "step": 243890 - }, - { - "epoch": 0.43, - "learning_rate": 2.873338518469432e-05, - "loss": 2.3141, - "step": 243900 - }, - { - "epoch": 0.43, - "learning_rate": 2.873251324476749e-05, - "loss": 2.3125, - "step": 243910 - }, - { - "epoch": 0.43, - "learning_rate": 2.8731641304840663e-05, - "loss": 2.389, - "step": 243920 - }, - { - "epoch": 0.43, - "learning_rate": 2.8730769364913833e-05, - "loss": 2.4683, - "step": 243930 - }, - { - "epoch": 0.43, - "learning_rate": 2.8729897424987007e-05, - "loss": 2.3818, - "step": 243940 - }, - { - "epoch": 0.43, - "learning_rate": 2.8729025485060184e-05, - "loss": 2.3475, - "step": 243950 - }, - { - "epoch": 0.43, - "learning_rate": 2.8728153545133358e-05, - "loss": 2.4741, - "step": 243960 - }, - { - "epoch": 0.43, - "learning_rate": 2.8727281605206528e-05, - "loss": 2.4408, - "step": 243970 - }, - { - "epoch": 0.43, - "learning_rate": 2.8726409665279702e-05, - "loss": 2.5526, - "step": 243980 - }, - { - "epoch": 0.43, - "learning_rate": 2.8725537725352876e-05, - "loss": 2.4844, - "step": 243990 - }, - { - "epoch": 0.43, - "learning_rate": 2.8724665785426046e-05, - "loss": 2.3131, - "step": 244000 - }, - { - "epoch": 0.43, - "learning_rate": 2.872379384549922e-05, - "loss": 2.3365, - "step": 244010 - }, - { - "epoch": 0.43, - "learning_rate": 2.8722921905572397e-05, - "loss": 2.3863, - "step": 244020 - }, - { - "epoch": 0.43, - "learning_rate": 2.872204996564557e-05, - "loss": 2.3975, - "step": 244030 - }, - { - "epoch": 0.43, - "learning_rate": 2.872117802571874e-05, - "loss": 2.4345, - "step": 244040 - }, - { - "epoch": 0.43, - "learning_rate": 2.8720306085791915e-05, - "loss": 2.3679, - "step": 244050 - }, - { - "epoch": 0.43, - "learning_rate": 2.871943414586509e-05, - "loss": 2.3484, - "step": 244060 - }, - { - "epoch": 0.43, - "learning_rate": 2.871856220593826e-05, - "loss": 2.3087, - "step": 244070 - }, - { - "epoch": 0.43, - "learning_rate": 2.8717690266011433e-05, - "loss": 2.2959, - "step": 244080 - }, - { - "epoch": 0.43, - "learning_rate": 2.871681832608461e-05, - "loss": 2.5016, - "step": 244090 - }, - { - "epoch": 0.43, - "learning_rate": 2.8715946386157784e-05, - "loss": 2.446, - "step": 244100 - }, - { - "epoch": 0.43, - "learning_rate": 2.8715074446230954e-05, - "loss": 2.3425, - "step": 244110 - }, - { - "epoch": 0.43, - "learning_rate": 2.8714202506304128e-05, - "loss": 2.3637, - "step": 244120 - }, - { - "epoch": 0.43, - "learning_rate": 2.87133305663773e-05, - "loss": 2.3208, - "step": 244130 - }, - { - "epoch": 0.43, - "learning_rate": 2.8712458626450472e-05, - "loss": 2.2981, - "step": 244140 - }, - { - "epoch": 0.43, - "learning_rate": 2.8711586686523646e-05, - "loss": 2.4238, - "step": 244150 - }, - { - "epoch": 0.43, - "learning_rate": 2.8710714746596816e-05, - "loss": 2.3327, - "step": 244160 - }, - { - "epoch": 0.43, - "learning_rate": 2.8709842806669997e-05, - "loss": 2.4794, - "step": 244170 - }, - { - "epoch": 0.43, - "learning_rate": 2.8708970866743167e-05, - "loss": 2.35, - "step": 244180 - }, - { - "epoch": 0.43, - "learning_rate": 2.870809892681634e-05, - "loss": 2.3804, - "step": 244190 - }, - { - "epoch": 0.43, - "learning_rate": 2.870722698688951e-05, - "loss": 2.4817, - "step": 244200 - }, - { - "epoch": 0.43, - "learning_rate": 2.8706355046962685e-05, - "loss": 2.4568, - "step": 244210 - }, - { - "epoch": 0.43, - "learning_rate": 2.870548310703586e-05, - "loss": 2.3968, - "step": 244220 - }, - { - "epoch": 0.43, - "learning_rate": 2.870461116710903e-05, - "loss": 2.4747, - "step": 244230 - }, - { - "epoch": 0.43, - "learning_rate": 2.870373922718221e-05, - "loss": 2.4147, - "step": 244240 - }, - { - "epoch": 0.43, - "learning_rate": 2.870286728725538e-05, - "loss": 2.3786, - "step": 244250 - }, - { - "epoch": 0.43, - "learning_rate": 2.8701995347328554e-05, - "loss": 2.4033, - "step": 244260 - }, - { - "epoch": 0.43, - "learning_rate": 2.8701123407401724e-05, - "loss": 2.35, - "step": 244270 - }, - { - "epoch": 0.43, - "learning_rate": 2.8700251467474898e-05, - "loss": 2.4449, - "step": 244280 - }, - { - "epoch": 0.43, - "learning_rate": 2.8699379527548072e-05, - "loss": 2.3394, - "step": 244290 - }, - { - "epoch": 0.43, - "learning_rate": 2.8698507587621242e-05, - "loss": 2.4428, - "step": 244300 - }, - { - "epoch": 0.43, - "learning_rate": 2.8697635647694416e-05, - "loss": 2.3809, - "step": 244310 - }, - { - "epoch": 0.43, - "learning_rate": 2.8696763707767593e-05, - "loss": 2.303, - "step": 244320 - }, - { - "epoch": 0.43, - "learning_rate": 2.8695891767840767e-05, - "loss": 2.3261, - "step": 244330 - }, - { - "epoch": 0.43, - "learning_rate": 2.8695019827913937e-05, - "loss": 2.3751, - "step": 244340 - }, - { - "epoch": 0.43, - "learning_rate": 2.869414788798711e-05, - "loss": 2.344, - "step": 244350 - }, - { - "epoch": 0.43, - "learning_rate": 2.869327594806028e-05, - "loss": 2.2781, - "step": 244360 - }, - { - "epoch": 0.43, - "learning_rate": 2.8692404008133455e-05, - "loss": 2.1759, - "step": 244370 - }, - { - "epoch": 0.43, - "learning_rate": 2.869153206820663e-05, - "loss": 2.2733, - "step": 244380 - }, - { - "epoch": 0.43, - "learning_rate": 2.8690660128279806e-05, - "loss": 2.3764, - "step": 244390 - }, - { - "epoch": 0.43, - "learning_rate": 2.868978818835298e-05, - "loss": 2.3409, - "step": 244400 - }, - { - "epoch": 0.43, - "learning_rate": 2.868891624842615e-05, - "loss": 2.5366, - "step": 244410 - }, - { - "epoch": 0.43, - "learning_rate": 2.8688044308499324e-05, - "loss": 2.4427, - "step": 244420 - }, - { - "epoch": 0.43, - "learning_rate": 2.8687172368572494e-05, - "loss": 2.422, - "step": 244430 - }, - { - "epoch": 0.43, - "learning_rate": 2.8686300428645668e-05, - "loss": 2.4382, - "step": 244440 - }, - { - "epoch": 0.43, - "learning_rate": 2.8685428488718842e-05, - "loss": 2.4329, - "step": 244450 - }, - { - "epoch": 0.43, - "learning_rate": 2.8684556548792012e-05, - "loss": 2.3787, - "step": 244460 - }, - { - "epoch": 0.43, - "learning_rate": 2.868368460886519e-05, - "loss": 2.4584, - "step": 244470 - }, - { - "epoch": 0.43, - "learning_rate": 2.8682812668938363e-05, - "loss": 2.343, - "step": 244480 - }, - { - "epoch": 0.43, - "learning_rate": 2.8681940729011537e-05, - "loss": 2.3098, - "step": 244490 - }, - { - "epoch": 0.43, - "learning_rate": 2.8681068789084707e-05, - "loss": 2.4451, - "step": 244500 - }, - { - "epoch": 0.43, - "learning_rate": 2.868019684915788e-05, - "loss": 2.4524, - "step": 244510 - }, - { - "epoch": 0.43, - "learning_rate": 2.8679324909231055e-05, - "loss": 2.2532, - "step": 244520 - }, - { - "epoch": 0.43, - "learning_rate": 2.8678452969304225e-05, - "loss": 2.3947, - "step": 244530 - }, - { - "epoch": 0.43, - "learning_rate": 2.8677581029377403e-05, - "loss": 2.3974, - "step": 244540 - }, - { - "epoch": 0.43, - "learning_rate": 2.8676709089450576e-05, - "loss": 2.2899, - "step": 244550 - }, - { - "epoch": 0.43, - "learning_rate": 2.867583714952375e-05, - "loss": 2.3319, - "step": 244560 - }, - { - "epoch": 0.43, - "learning_rate": 2.867496520959692e-05, - "loss": 2.3784, - "step": 244570 - }, - { - "epoch": 0.43, - "learning_rate": 2.8674093269670094e-05, - "loss": 2.3137, - "step": 244580 - }, - { - "epoch": 0.43, - "learning_rate": 2.8673221329743265e-05, - "loss": 2.3874, - "step": 244590 - }, - { - "epoch": 0.43, - "learning_rate": 2.867234938981644e-05, - "loss": 2.514, - "step": 244600 - }, - { - "epoch": 0.43, - "learning_rate": 2.8671477449889612e-05, - "loss": 2.4534, - "step": 244610 - }, - { - "epoch": 0.43, - "learning_rate": 2.867060550996279e-05, - "loss": 2.4049, - "step": 244620 - }, - { - "epoch": 0.43, - "learning_rate": 2.8669733570035963e-05, - "loss": 2.454, - "step": 244630 - }, - { - "epoch": 0.43, - "learning_rate": 2.8668861630109133e-05, - "loss": 2.3701, - "step": 244640 - }, - { - "epoch": 0.43, - "learning_rate": 2.8667989690182307e-05, - "loss": 2.4076, - "step": 244650 - }, - { - "epoch": 0.43, - "learning_rate": 2.8667117750255478e-05, - "loss": 2.5464, - "step": 244660 - }, - { - "epoch": 0.43, - "learning_rate": 2.866624581032865e-05, - "loss": 2.3694, - "step": 244670 - }, - { - "epoch": 0.43, - "learning_rate": 2.8665373870401825e-05, - "loss": 2.1961, - "step": 244680 - }, - { - "epoch": 0.43, - "learning_rate": 2.8664501930475002e-05, - "loss": 2.3195, - "step": 244690 - }, - { - "epoch": 0.43, - "learning_rate": 2.8663629990548173e-05, - "loss": 2.2084, - "step": 244700 - }, - { - "epoch": 0.43, - "learning_rate": 2.8662758050621346e-05, - "loss": 2.5108, - "step": 244710 - }, - { - "epoch": 0.43, - "learning_rate": 2.866188611069452e-05, - "loss": 2.4287, - "step": 244720 - }, - { - "epoch": 0.43, - "learning_rate": 2.866101417076769e-05, - "loss": 2.4373, - "step": 244730 - }, - { - "epoch": 0.43, - "learning_rate": 2.8660142230840864e-05, - "loss": 2.4274, - "step": 244740 - }, - { - "epoch": 0.43, - "learning_rate": 2.8659270290914038e-05, - "loss": 2.3805, - "step": 244750 - }, - { - "epoch": 0.43, - "learning_rate": 2.8658398350987215e-05, - "loss": 2.3345, - "step": 244760 - }, - { - "epoch": 0.43, - "learning_rate": 2.8657526411060386e-05, - "loss": 2.3844, - "step": 244770 - }, - { - "epoch": 0.43, - "learning_rate": 2.865665447113356e-05, - "loss": 2.4139, - "step": 244780 - }, - { - "epoch": 0.43, - "learning_rate": 2.8655782531206733e-05, - "loss": 2.4192, - "step": 244790 - }, - { - "epoch": 0.43, - "learning_rate": 2.8654910591279904e-05, - "loss": 2.3867, - "step": 244800 - }, - { - "epoch": 0.43, - "learning_rate": 2.8654038651353077e-05, - "loss": 2.3812, - "step": 244810 - }, - { - "epoch": 0.43, - "learning_rate": 2.8653166711426248e-05, - "loss": 2.3663, - "step": 244820 - }, - { - "epoch": 0.43, - "learning_rate": 2.865229477149942e-05, - "loss": 2.3667, - "step": 244830 - }, - { - "epoch": 0.43, - "learning_rate": 2.86514228315726e-05, - "loss": 2.3643, - "step": 244840 - }, - { - "epoch": 0.43, - "learning_rate": 2.8650550891645772e-05, - "loss": 2.365, - "step": 244850 - }, - { - "epoch": 0.43, - "learning_rate": 2.8649678951718946e-05, - "loss": 2.3812, - "step": 244860 - }, - { - "epoch": 0.43, - "learning_rate": 2.8648807011792117e-05, - "loss": 2.2818, - "step": 244870 - }, - { - "epoch": 0.43, - "learning_rate": 2.864793507186529e-05, - "loss": 2.3547, - "step": 244880 - }, - { - "epoch": 0.43, - "learning_rate": 2.864706313193846e-05, - "loss": 2.4103, - "step": 244890 - }, - { - "epoch": 0.43, - "learning_rate": 2.8646191192011635e-05, - "loss": 2.3453, - "step": 244900 - }, - { - "epoch": 0.43, - "learning_rate": 2.864531925208481e-05, - "loss": 2.3509, - "step": 244910 - }, - { - "epoch": 0.43, - "learning_rate": 2.8644447312157985e-05, - "loss": 2.3677, - "step": 244920 - }, - { - "epoch": 0.43, - "learning_rate": 2.8643575372231156e-05, - "loss": 2.3724, - "step": 244930 - }, - { - "epoch": 0.43, - "learning_rate": 2.864270343230433e-05, - "loss": 2.5169, - "step": 244940 - }, - { - "epoch": 0.43, - "learning_rate": 2.8641831492377503e-05, - "loss": 2.3966, - "step": 244950 - }, - { - "epoch": 0.43, - "learning_rate": 2.8640959552450674e-05, - "loss": 2.2184, - "step": 244960 - }, - { - "epoch": 0.43, - "learning_rate": 2.8640087612523848e-05, - "loss": 2.341, - "step": 244970 - }, - { - "epoch": 0.43, - "learning_rate": 2.8639215672597018e-05, - "loss": 2.4406, - "step": 244980 - }, - { - "epoch": 0.43, - "learning_rate": 2.86383437326702e-05, - "loss": 2.2794, - "step": 244990 - }, - { - "epoch": 0.43, - "learning_rate": 2.863747179274337e-05, - "loss": 2.3613, - "step": 245000 - }, - { - "epoch": 0.43, - "learning_rate": 2.8636599852816543e-05, - "loss": 2.4719, - "step": 245010 - }, - { - "epoch": 0.43, - "learning_rate": 2.8635727912889716e-05, - "loss": 2.323, - "step": 245020 - }, - { - "epoch": 0.43, - "learning_rate": 2.8634855972962887e-05, - "loss": 2.4129, - "step": 245030 - }, - { - "epoch": 0.43, - "learning_rate": 2.863398403303606e-05, - "loss": 2.2737, - "step": 245040 - }, - { - "epoch": 0.43, - "learning_rate": 2.863311209310923e-05, - "loss": 2.4593, - "step": 245050 - }, - { - "epoch": 0.43, - "learning_rate": 2.863224015318241e-05, - "loss": 2.5225, - "step": 245060 - }, - { - "epoch": 0.43, - "learning_rate": 2.8631368213255582e-05, - "loss": 2.3856, - "step": 245070 - }, - { - "epoch": 0.43, - "learning_rate": 2.8630496273328756e-05, - "loss": 2.3508, - "step": 245080 - }, - { - "epoch": 0.43, - "learning_rate": 2.8629624333401926e-05, - "loss": 2.3612, - "step": 245090 - }, - { - "epoch": 0.43, - "learning_rate": 2.86287523934751e-05, - "loss": 2.3273, - "step": 245100 - }, - { - "epoch": 0.43, - "learning_rate": 2.8627880453548274e-05, - "loss": 2.4202, - "step": 245110 - }, - { - "epoch": 0.43, - "learning_rate": 2.8627008513621444e-05, - "loss": 2.4248, - "step": 245120 - }, - { - "epoch": 0.43, - "learning_rate": 2.8626136573694618e-05, - "loss": 2.3357, - "step": 245130 - }, - { - "epoch": 0.43, - "learning_rate": 2.8625264633767795e-05, - "loss": 2.3336, - "step": 245140 - }, - { - "epoch": 0.43, - "learning_rate": 2.862439269384097e-05, - "loss": 2.3837, - "step": 245150 - }, - { - "epoch": 0.43, - "learning_rate": 2.862352075391414e-05, - "loss": 2.3691, - "step": 245160 - }, - { - "epoch": 0.43, - "learning_rate": 2.8622648813987313e-05, - "loss": 2.4129, - "step": 245170 - }, - { - "epoch": 0.43, - "learning_rate": 2.8621776874060487e-05, - "loss": 2.449, - "step": 245180 - }, - { - "epoch": 0.43, - "learning_rate": 2.8620904934133657e-05, - "loss": 2.2806, - "step": 245190 - }, - { - "epoch": 0.43, - "learning_rate": 2.862003299420683e-05, - "loss": 2.3603, - "step": 245200 - }, - { - "epoch": 0.43, - "learning_rate": 2.8619161054280008e-05, - "loss": 2.3466, - "step": 245210 - }, - { - "epoch": 0.43, - "learning_rate": 2.861828911435318e-05, - "loss": 2.2745, - "step": 245220 - }, - { - "epoch": 0.43, - "learning_rate": 2.8617417174426352e-05, - "loss": 2.3912, - "step": 245230 - }, - { - "epoch": 0.43, - "learning_rate": 2.8616545234499526e-05, - "loss": 2.4375, - "step": 245240 - }, - { - "epoch": 0.43, - "learning_rate": 2.86156732945727e-05, - "loss": 2.3684, - "step": 245250 - }, - { - "epoch": 0.43, - "learning_rate": 2.861480135464587e-05, - "loss": 2.44, - "step": 245260 - }, - { - "epoch": 0.43, - "learning_rate": 2.8613929414719044e-05, - "loss": 2.3516, - "step": 245270 - }, - { - "epoch": 0.43, - "learning_rate": 2.8613057474792214e-05, - "loss": 2.2466, - "step": 245280 - }, - { - "epoch": 0.43, - "learning_rate": 2.8612185534865395e-05, - "loss": 2.5626, - "step": 245290 - }, - { - "epoch": 0.43, - "learning_rate": 2.8611313594938565e-05, - "loss": 2.3116, - "step": 245300 - }, - { - "epoch": 0.43, - "learning_rate": 2.861044165501174e-05, - "loss": 2.3261, - "step": 245310 - }, - { - "epoch": 0.43, - "learning_rate": 2.860956971508491e-05, - "loss": 2.4273, - "step": 245320 - }, - { - "epoch": 0.43, - "learning_rate": 2.8608697775158083e-05, - "loss": 2.2773, - "step": 245330 - }, - { - "epoch": 0.43, - "learning_rate": 2.8607825835231257e-05, - "loss": 2.3581, - "step": 245340 - }, - { - "epoch": 0.43, - "learning_rate": 2.8606953895304427e-05, - "loss": 2.4054, - "step": 245350 - }, - { - "epoch": 0.43, - "learning_rate": 2.8606081955377608e-05, - "loss": 2.2441, - "step": 245360 - }, - { - "epoch": 0.43, - "learning_rate": 2.8605210015450778e-05, - "loss": 2.4066, - "step": 245370 - }, - { - "epoch": 0.43, - "learning_rate": 2.8604338075523952e-05, - "loss": 2.3905, - "step": 245380 - }, - { - "epoch": 0.43, - "learning_rate": 2.8603466135597122e-05, - "loss": 2.4322, - "step": 245390 - }, - { - "epoch": 0.43, - "learning_rate": 2.8602594195670296e-05, - "loss": 2.2582, - "step": 245400 - }, - { - "epoch": 0.43, - "learning_rate": 2.860172225574347e-05, - "loss": 2.3232, - "step": 245410 - }, - { - "epoch": 0.43, - "learning_rate": 2.860085031581664e-05, - "loss": 2.3879, - "step": 245420 - }, - { - "epoch": 0.43, - "learning_rate": 2.8599978375889817e-05, - "loss": 2.3019, - "step": 245430 - }, - { - "epoch": 0.43, - "learning_rate": 2.859910643596299e-05, - "loss": 2.1526, - "step": 245440 - }, - { - "epoch": 0.43, - "learning_rate": 2.8598234496036165e-05, - "loss": 2.3872, - "step": 245450 - }, - { - "epoch": 0.43, - "learning_rate": 2.8597362556109335e-05, - "loss": 2.3229, - "step": 245460 - }, - { - "epoch": 0.43, - "learning_rate": 2.859649061618251e-05, - "loss": 2.4571, - "step": 245470 - }, - { - "epoch": 0.43, - "learning_rate": 2.8595618676255683e-05, - "loss": 2.3602, - "step": 245480 - }, - { - "epoch": 0.43, - "learning_rate": 2.8594746736328853e-05, - "loss": 2.4445, - "step": 245490 - }, - { - "epoch": 0.43, - "learning_rate": 2.8593874796402027e-05, - "loss": 2.294, - "step": 245500 - }, - { - "epoch": 0.43, - "learning_rate": 2.8593002856475204e-05, - "loss": 2.408, - "step": 245510 - }, - { - "epoch": 0.43, - "learning_rate": 2.8592130916548378e-05, - "loss": 2.4139, - "step": 245520 - }, - { - "epoch": 0.43, - "learning_rate": 2.8591258976621548e-05, - "loss": 2.3671, - "step": 245530 - }, - { - "epoch": 0.43, - "learning_rate": 2.8590387036694722e-05, - "loss": 2.3951, - "step": 245540 - }, - { - "epoch": 0.43, - "learning_rate": 2.8589515096767892e-05, - "loss": 2.2899, - "step": 245550 - }, - { - "epoch": 0.43, - "learning_rate": 2.8588643156841066e-05, - "loss": 2.3811, - "step": 245560 - }, - { - "epoch": 0.43, - "learning_rate": 2.858777121691424e-05, - "loss": 2.4457, - "step": 245570 - }, - { - "epoch": 0.43, - "learning_rate": 2.8586899276987417e-05, - "loss": 2.2992, - "step": 245580 - }, - { - "epoch": 0.43, - "learning_rate": 2.858602733706059e-05, - "loss": 2.3177, - "step": 245590 - }, - { - "epoch": 0.43, - "learning_rate": 2.858515539713376e-05, - "loss": 2.4617, - "step": 245600 - }, - { - "epoch": 0.43, - "learning_rate": 2.8584283457206935e-05, - "loss": 2.359, - "step": 245610 - }, - { - "epoch": 0.43, - "learning_rate": 2.8583411517280105e-05, - "loss": 2.3159, - "step": 245620 - }, - { - "epoch": 0.43, - "learning_rate": 2.858253957735328e-05, - "loss": 2.3328, - "step": 245630 - }, - { - "epoch": 0.43, - "learning_rate": 2.8581667637426453e-05, - "loss": 2.3006, - "step": 245640 - }, - { - "epoch": 0.43, - "learning_rate": 2.8580795697499623e-05, - "loss": 2.3202, - "step": 245650 - }, - { - "epoch": 0.43, - "learning_rate": 2.85799237575728e-05, - "loss": 2.1917, - "step": 245660 - }, - { - "epoch": 0.43, - "learning_rate": 2.8579051817645974e-05, - "loss": 2.3469, - "step": 245670 - }, - { - "epoch": 0.43, - "learning_rate": 2.8578179877719148e-05, - "loss": 2.4715, - "step": 245680 - }, - { - "epoch": 0.43, - "learning_rate": 2.8577307937792318e-05, - "loss": 2.3354, - "step": 245690 - }, - { - "epoch": 0.43, - "learning_rate": 2.8576435997865492e-05, - "loss": 2.3257, - "step": 245700 - }, - { - "epoch": 0.43, - "learning_rate": 2.8575564057938662e-05, - "loss": 2.3769, - "step": 245710 - }, - { - "epoch": 0.43, - "learning_rate": 2.8574692118011836e-05, - "loss": 2.3835, - "step": 245720 - }, - { - "epoch": 0.43, - "learning_rate": 2.8573820178085013e-05, - "loss": 2.4494, - "step": 245730 - }, - { - "epoch": 0.43, - "learning_rate": 2.8572948238158187e-05, - "loss": 2.3979, - "step": 245740 - }, - { - "epoch": 0.43, - "learning_rate": 2.857207629823136e-05, - "loss": 2.4004, - "step": 245750 - }, - { - "epoch": 0.43, - "learning_rate": 2.857120435830453e-05, - "loss": 2.3302, - "step": 245760 - }, - { - "epoch": 0.43, - "learning_rate": 2.8570332418377705e-05, - "loss": 2.3137, - "step": 245770 - }, - { - "epoch": 0.43, - "learning_rate": 2.8569460478450875e-05, - "loss": 2.3733, - "step": 245780 - }, - { - "epoch": 0.43, - "learning_rate": 2.856858853852405e-05, - "loss": 2.3152, - "step": 245790 - }, - { - "epoch": 0.43, - "learning_rate": 2.8567716598597223e-05, - "loss": 2.4759, - "step": 245800 - }, - { - "epoch": 0.43, - "learning_rate": 2.85668446586704e-05, - "loss": 2.4111, - "step": 245810 - }, - { - "epoch": 0.43, - "learning_rate": 2.856597271874357e-05, - "loss": 2.3235, - "step": 245820 - }, - { - "epoch": 0.43, - "learning_rate": 2.8565100778816744e-05, - "loss": 2.2963, - "step": 245830 - }, - { - "epoch": 0.43, - "learning_rate": 2.8564228838889918e-05, - "loss": 2.3509, - "step": 245840 - }, - { - "epoch": 0.43, - "learning_rate": 2.856335689896309e-05, - "loss": 2.5217, - "step": 245850 - }, - { - "epoch": 0.43, - "learning_rate": 2.8562484959036262e-05, - "loss": 2.4098, - "step": 245860 - }, - { - "epoch": 0.43, - "learning_rate": 2.8561613019109436e-05, - "loss": 2.366, - "step": 245870 - }, - { - "epoch": 0.43, - "learning_rate": 2.8560741079182613e-05, - "loss": 2.3873, - "step": 245880 - }, - { - "epoch": 0.43, - "learning_rate": 2.8559869139255784e-05, - "loss": 2.3782, - "step": 245890 - }, - { - "epoch": 0.43, - "learning_rate": 2.8558997199328957e-05, - "loss": 2.2906, - "step": 245900 - }, - { - "epoch": 0.43, - "learning_rate": 2.855812525940213e-05, - "loss": 2.3531, - "step": 245910 - }, - { - "epoch": 0.43, - "learning_rate": 2.85572533194753e-05, - "loss": 2.4112, - "step": 245920 - }, - { - "epoch": 0.43, - "learning_rate": 2.8556381379548475e-05, - "loss": 2.4118, - "step": 245930 - }, - { - "epoch": 0.43, - "learning_rate": 2.8555509439621646e-05, - "loss": 2.3564, - "step": 245940 - }, - { - "epoch": 0.43, - "learning_rate": 2.8554637499694826e-05, - "loss": 2.4667, - "step": 245950 - }, - { - "epoch": 0.43, - "learning_rate": 2.8553765559767997e-05, - "loss": 2.4213, - "step": 245960 - }, - { - "epoch": 0.43, - "learning_rate": 2.855289361984117e-05, - "loss": 2.3991, - "step": 245970 - }, - { - "epoch": 0.43, - "learning_rate": 2.8552021679914344e-05, - "loss": 2.4328, - "step": 245980 - }, - { - "epoch": 0.43, - "learning_rate": 2.8551149739987514e-05, - "loss": 2.294, - "step": 245990 - }, - { - "epoch": 0.43, - "learning_rate": 2.8550277800060688e-05, - "loss": 2.3862, - "step": 246000 - }, - { - "epoch": 0.43, - "learning_rate": 2.854940586013386e-05, - "loss": 2.3631, - "step": 246010 - }, - { - "epoch": 0.43, - "learning_rate": 2.8548533920207032e-05, - "loss": 2.3904, - "step": 246020 - }, - { - "epoch": 0.43, - "learning_rate": 2.854766198028021e-05, - "loss": 2.3509, - "step": 246030 - }, - { - "epoch": 0.43, - "learning_rate": 2.8546790040353383e-05, - "loss": 2.3014, - "step": 246040 - }, - { - "epoch": 0.43, - "learning_rate": 2.8545918100426554e-05, - "loss": 2.3454, - "step": 246050 - }, - { - "epoch": 0.43, - "learning_rate": 2.8545046160499727e-05, - "loss": 2.4714, - "step": 246060 - }, - { - "epoch": 0.43, - "learning_rate": 2.85441742205729e-05, - "loss": 2.4039, - "step": 246070 - }, - { - "epoch": 0.43, - "learning_rate": 2.854330228064607e-05, - "loss": 2.3748, - "step": 246080 - }, - { - "epoch": 0.43, - "learning_rate": 2.8542430340719245e-05, - "loss": 2.4107, - "step": 246090 - }, - { - "epoch": 0.43, - "learning_rate": 2.8541558400792423e-05, - "loss": 2.3621, - "step": 246100 - }, - { - "epoch": 0.43, - "learning_rate": 2.8540686460865596e-05, - "loss": 2.4451, - "step": 246110 - }, - { - "epoch": 0.43, - "learning_rate": 2.8539814520938767e-05, - "loss": 2.3735, - "step": 246120 - }, - { - "epoch": 0.43, - "learning_rate": 2.853894258101194e-05, - "loss": 2.3675, - "step": 246130 - }, - { - "epoch": 0.43, - "learning_rate": 2.8538070641085114e-05, - "loss": 2.4945, - "step": 246140 - }, - { - "epoch": 0.43, - "learning_rate": 2.8537198701158285e-05, - "loss": 2.4685, - "step": 246150 - }, - { - "epoch": 0.43, - "learning_rate": 2.853632676123146e-05, - "loss": 2.4322, - "step": 246160 - }, - { - "epoch": 0.43, - "learning_rate": 2.853545482130463e-05, - "loss": 2.3231, - "step": 246170 - }, - { - "epoch": 0.43, - "learning_rate": 2.853458288137781e-05, - "loss": 2.3617, - "step": 246180 - }, - { - "epoch": 0.43, - "learning_rate": 2.853371094145098e-05, - "loss": 2.4968, - "step": 246190 - }, - { - "epoch": 0.43, - "learning_rate": 2.8532839001524153e-05, - "loss": 2.3979, - "step": 246200 - }, - { - "epoch": 0.43, - "learning_rate": 2.8531967061597327e-05, - "loss": 2.4505, - "step": 246210 - }, - { - "epoch": 0.43, - "learning_rate": 2.8531095121670498e-05, - "loss": 2.4659, - "step": 246220 - }, - { - "epoch": 0.43, - "learning_rate": 2.853022318174367e-05, - "loss": 2.3657, - "step": 246230 - }, - { - "epoch": 0.43, - "learning_rate": 2.8529351241816842e-05, - "loss": 2.3808, - "step": 246240 - }, - { - "epoch": 0.43, - "learning_rate": 2.8528479301890022e-05, - "loss": 2.3541, - "step": 246250 - }, - { - "epoch": 0.43, - "learning_rate": 2.8527607361963193e-05, - "loss": 2.4519, - "step": 246260 - }, - { - "epoch": 0.43, - "learning_rate": 2.8526735422036366e-05, - "loss": 2.2436, - "step": 246270 - }, - { - "epoch": 0.43, - "learning_rate": 2.8525863482109537e-05, - "loss": 2.4062, - "step": 246280 - }, - { - "epoch": 0.43, - "learning_rate": 2.852499154218271e-05, - "loss": 2.4275, - "step": 246290 - }, - { - "epoch": 0.43, - "learning_rate": 2.8524119602255884e-05, - "loss": 2.3935, - "step": 246300 - }, - { - "epoch": 0.43, - "learning_rate": 2.8523247662329055e-05, - "loss": 2.356, - "step": 246310 - }, - { - "epoch": 0.43, - "learning_rate": 2.852237572240223e-05, - "loss": 2.3472, - "step": 246320 - }, - { - "epoch": 0.43, - "learning_rate": 2.8521503782475406e-05, - "loss": 2.346, - "step": 246330 - }, - { - "epoch": 0.43, - "learning_rate": 2.852063184254858e-05, - "loss": 2.4861, - "step": 246340 - }, - { - "epoch": 0.43, - "learning_rate": 2.851975990262175e-05, - "loss": 2.3553, - "step": 246350 - }, - { - "epoch": 0.43, - "learning_rate": 2.8518887962694924e-05, - "loss": 2.3715, - "step": 246360 - }, - { - "epoch": 0.43, - "learning_rate": 2.8518016022768097e-05, - "loss": 2.2936, - "step": 246370 - }, - { - "epoch": 0.43, - "learning_rate": 2.8517144082841268e-05, - "loss": 2.4267, - "step": 246380 - }, - { - "epoch": 0.43, - "learning_rate": 2.851627214291444e-05, - "loss": 2.3603, - "step": 246390 - }, - { - "epoch": 0.43, - "learning_rate": 2.851540020298762e-05, - "loss": 2.4139, - "step": 246400 - }, - { - "epoch": 0.43, - "learning_rate": 2.8514528263060792e-05, - "loss": 2.2985, - "step": 246410 - }, - { - "epoch": 0.43, - "learning_rate": 2.8513656323133963e-05, - "loss": 2.5067, - "step": 246420 - }, - { - "epoch": 0.43, - "learning_rate": 2.8512784383207137e-05, - "loss": 2.359, - "step": 246430 - }, - { - "epoch": 0.43, - "learning_rate": 2.8511912443280307e-05, - "loss": 2.392, - "step": 246440 - }, - { - "epoch": 0.43, - "learning_rate": 2.851104050335348e-05, - "loss": 2.4611, - "step": 246450 - }, - { - "epoch": 0.43, - "learning_rate": 2.8510168563426655e-05, - "loss": 2.337, - "step": 246460 - }, - { - "epoch": 0.43, - "learning_rate": 2.8509296623499825e-05, - "loss": 2.3506, - "step": 246470 - }, - { - "epoch": 0.43, - "learning_rate": 2.8508424683573005e-05, - "loss": 2.446, - "step": 246480 - }, - { - "epoch": 0.43, - "learning_rate": 2.8507552743646176e-05, - "loss": 2.3342, - "step": 246490 - }, - { - "epoch": 0.43, - "learning_rate": 2.850668080371935e-05, - "loss": 2.431, - "step": 246500 - }, - { - "epoch": 0.43, - "learning_rate": 2.850580886379252e-05, - "loss": 2.259, - "step": 246510 - }, - { - "epoch": 0.43, - "learning_rate": 2.8504936923865694e-05, - "loss": 2.3228, - "step": 246520 - }, - { - "epoch": 0.43, - "learning_rate": 2.8504064983938868e-05, - "loss": 2.4769, - "step": 246530 - }, - { - "epoch": 0.43, - "learning_rate": 2.8503193044012038e-05, - "loss": 2.4144, - "step": 246540 - }, - { - "epoch": 0.43, - "learning_rate": 2.8502321104085215e-05, - "loss": 2.4424, - "step": 246550 - }, - { - "epoch": 0.43, - "learning_rate": 2.850144916415839e-05, - "loss": 2.4265, - "step": 246560 - }, - { - "epoch": 0.43, - "learning_rate": 2.8500577224231563e-05, - "loss": 2.4053, - "step": 246570 - }, - { - "epoch": 0.43, - "learning_rate": 2.8499705284304733e-05, - "loss": 2.4265, - "step": 246580 - }, - { - "epoch": 0.43, - "learning_rate": 2.8498833344377907e-05, - "loss": 2.453, - "step": 246590 - }, - { - "epoch": 0.43, - "learning_rate": 2.849796140445108e-05, - "loss": 2.4088, - "step": 246600 - }, - { - "epoch": 0.43, - "learning_rate": 2.849708946452425e-05, - "loss": 2.3816, - "step": 246610 - }, - { - "epoch": 0.43, - "learning_rate": 2.8496217524597428e-05, - "loss": 2.4214, - "step": 246620 - }, - { - "epoch": 0.43, - "learning_rate": 2.8495345584670602e-05, - "loss": 2.3285, - "step": 246630 - }, - { - "epoch": 0.43, - "learning_rate": 2.8494473644743776e-05, - "loss": 2.3287, - "step": 246640 - }, - { - "epoch": 0.43, - "learning_rate": 2.8493601704816946e-05, - "loss": 2.3505, - "step": 246650 - }, - { - "epoch": 0.43, - "learning_rate": 2.849272976489012e-05, - "loss": 2.3778, - "step": 246660 - }, - { - "epoch": 0.43, - "learning_rate": 2.849185782496329e-05, - "loss": 2.3955, - "step": 246670 - }, - { - "epoch": 0.43, - "learning_rate": 2.8490985885036464e-05, - "loss": 2.352, - "step": 246680 - }, - { - "epoch": 0.43, - "learning_rate": 2.8490113945109638e-05, - "loss": 2.3233, - "step": 246690 - }, - { - "epoch": 0.43, - "learning_rate": 2.8489242005182815e-05, - "loss": 2.4982, - "step": 246700 - }, - { - "epoch": 0.43, - "learning_rate": 2.848837006525599e-05, - "loss": 2.4446, - "step": 246710 - }, - { - "epoch": 0.43, - "learning_rate": 2.848749812532916e-05, - "loss": 2.3796, - "step": 246720 - }, - { - "epoch": 0.43, - "learning_rate": 2.8486626185402333e-05, - "loss": 2.3838, - "step": 246730 - }, - { - "epoch": 0.43, - "learning_rate": 2.8485754245475503e-05, - "loss": 2.3252, - "step": 246740 - }, - { - "epoch": 0.43, - "learning_rate": 2.8484882305548677e-05, - "loss": 2.3377, - "step": 246750 - }, - { - "epoch": 0.43, - "learning_rate": 2.848401036562185e-05, - "loss": 2.3469, - "step": 246760 - }, - { - "epoch": 0.43, - "learning_rate": 2.8483138425695028e-05, - "loss": 2.4251, - "step": 246770 - }, - { - "epoch": 0.43, - "learning_rate": 2.8482266485768198e-05, - "loss": 2.3938, - "step": 246780 - }, - { - "epoch": 0.43, - "learning_rate": 2.8481394545841372e-05, - "loss": 2.3894, - "step": 246790 - }, - { - "epoch": 0.43, - "learning_rate": 2.8480522605914546e-05, - "loss": 2.3409, - "step": 246800 - }, - { - "epoch": 0.43, - "learning_rate": 2.8479650665987716e-05, - "loss": 2.4042, - "step": 246810 - }, - { - "epoch": 0.43, - "learning_rate": 2.847877872606089e-05, - "loss": 2.3666, - "step": 246820 - }, - { - "epoch": 0.43, - "learning_rate": 2.8477906786134064e-05, - "loss": 2.3685, - "step": 246830 - }, - { - "epoch": 0.43, - "learning_rate": 2.8477034846207234e-05, - "loss": 2.4069, - "step": 246840 - }, - { - "epoch": 0.43, - "learning_rate": 2.847616290628041e-05, - "loss": 2.3832, - "step": 246850 - }, - { - "epoch": 0.43, - "learning_rate": 2.8475290966353585e-05, - "loss": 2.4186, - "step": 246860 - }, - { - "epoch": 0.43, - "learning_rate": 2.847441902642676e-05, - "loss": 2.4157, - "step": 246870 - }, - { - "epoch": 0.43, - "learning_rate": 2.847354708649993e-05, - "loss": 2.355, - "step": 246880 - }, - { - "epoch": 0.43, - "learning_rate": 2.8472675146573103e-05, - "loss": 2.3311, - "step": 246890 - }, - { - "epoch": 0.43, - "learning_rate": 2.8471803206646273e-05, - "loss": 2.2961, - "step": 246900 - }, - { - "epoch": 0.43, - "learning_rate": 2.8470931266719447e-05, - "loss": 2.3866, - "step": 246910 - }, - { - "epoch": 0.43, - "learning_rate": 2.8470059326792624e-05, - "loss": 2.4452, - "step": 246920 - }, - { - "epoch": 0.43, - "learning_rate": 2.8469187386865798e-05, - "loss": 2.351, - "step": 246930 - }, - { - "epoch": 0.43, - "learning_rate": 2.8468315446938972e-05, - "loss": 2.395, - "step": 246940 - }, - { - "epoch": 0.43, - "learning_rate": 2.8467443507012142e-05, - "loss": 2.3455, - "step": 246950 - }, - { - "epoch": 0.43, - "learning_rate": 2.8466571567085316e-05, - "loss": 2.2824, - "step": 246960 - }, - { - "epoch": 0.43, - "learning_rate": 2.8465699627158486e-05, - "loss": 2.3906, - "step": 246970 - }, - { - "epoch": 0.43, - "learning_rate": 2.846482768723166e-05, - "loss": 2.316, - "step": 246980 - }, - { - "epoch": 0.43, - "learning_rate": 2.8463955747304834e-05, - "loss": 2.3936, - "step": 246990 - }, - { - "epoch": 0.43, - "learning_rate": 2.846308380737801e-05, - "loss": 2.3979, - "step": 247000 - }, - { - "epoch": 0.43, - "learning_rate": 2.846221186745118e-05, - "loss": 2.3305, - "step": 247010 - }, - { - "epoch": 0.43, - "learning_rate": 2.8461339927524355e-05, - "loss": 2.3954, - "step": 247020 - }, - { - "epoch": 0.43, - "learning_rate": 2.846046798759753e-05, - "loss": 2.4613, - "step": 247030 - }, - { - "epoch": 0.43, - "learning_rate": 2.84595960476707e-05, - "loss": 2.337, - "step": 247040 - }, - { - "epoch": 0.43, - "learning_rate": 2.8458724107743873e-05, - "loss": 2.345, - "step": 247050 - }, - { - "epoch": 0.43, - "learning_rate": 2.8457852167817043e-05, - "loss": 2.3961, - "step": 247060 - }, - { - "epoch": 0.43, - "learning_rate": 2.8456980227890224e-05, - "loss": 2.5158, - "step": 247070 - }, - { - "epoch": 0.43, - "learning_rate": 2.8456108287963394e-05, - "loss": 2.3591, - "step": 247080 - }, - { - "epoch": 0.43, - "learning_rate": 2.8455236348036568e-05, - "loss": 2.3727, - "step": 247090 - }, - { - "epoch": 0.43, - "learning_rate": 2.8454364408109742e-05, - "loss": 2.3069, - "step": 247100 - }, - { - "epoch": 0.43, - "learning_rate": 2.8453492468182912e-05, - "loss": 2.3783, - "step": 247110 - }, - { - "epoch": 0.43, - "learning_rate": 2.8452620528256086e-05, - "loss": 2.42, - "step": 247120 - }, - { - "epoch": 0.43, - "learning_rate": 2.8451748588329256e-05, - "loss": 2.3585, - "step": 247130 - }, - { - "epoch": 0.43, - "learning_rate": 2.845087664840243e-05, - "loss": 2.2831, - "step": 247140 - }, - { - "epoch": 0.43, - "learning_rate": 2.8450004708475607e-05, - "loss": 2.3898, - "step": 247150 - }, - { - "epoch": 0.43, - "learning_rate": 2.844913276854878e-05, - "loss": 2.3134, - "step": 247160 - }, - { - "epoch": 0.43, - "learning_rate": 2.844826082862195e-05, - "loss": 2.3582, - "step": 247170 - }, - { - "epoch": 0.43, - "learning_rate": 2.8447388888695125e-05, - "loss": 2.2181, - "step": 247180 - }, - { - "epoch": 0.43, - "learning_rate": 2.84465169487683e-05, - "loss": 2.3148, - "step": 247190 - }, - { - "epoch": 0.43, - "learning_rate": 2.844564500884147e-05, - "loss": 2.3315, - "step": 247200 - }, - { - "epoch": 0.43, - "learning_rate": 2.8444773068914643e-05, - "loss": 2.3988, - "step": 247210 - }, - { - "epoch": 0.43, - "learning_rate": 2.844390112898782e-05, - "loss": 2.4284, - "step": 247220 - }, - { - "epoch": 0.43, - "learning_rate": 2.8443029189060994e-05, - "loss": 2.3869, - "step": 247230 - }, - { - "epoch": 0.43, - "learning_rate": 2.8442157249134165e-05, - "loss": 2.4832, - "step": 247240 - }, - { - "epoch": 0.43, - "learning_rate": 2.8441285309207338e-05, - "loss": 2.3316, - "step": 247250 - }, - { - "epoch": 0.43, - "learning_rate": 2.8440413369280512e-05, - "loss": 2.4013, - "step": 247260 - }, - { - "epoch": 0.43, - "learning_rate": 2.8439541429353682e-05, - "loss": 2.3485, - "step": 247270 - }, - { - "epoch": 0.43, - "learning_rate": 2.8438669489426856e-05, - "loss": 2.3558, - "step": 247280 - }, - { - "epoch": 0.43, - "learning_rate": 2.8437797549500033e-05, - "loss": 2.4394, - "step": 247290 - }, - { - "epoch": 0.43, - "learning_rate": 2.8436925609573207e-05, - "loss": 2.3872, - "step": 247300 - }, - { - "epoch": 0.43, - "learning_rate": 2.8436053669646378e-05, - "loss": 2.402, - "step": 247310 - }, - { - "epoch": 0.43, - "learning_rate": 2.843518172971955e-05, - "loss": 2.3365, - "step": 247320 - }, - { - "epoch": 0.43, - "learning_rate": 2.8434309789792725e-05, - "loss": 2.3707, - "step": 247330 - }, - { - "epoch": 0.43, - "learning_rate": 2.8433437849865895e-05, - "loss": 2.4207, - "step": 247340 - }, - { - "epoch": 0.43, - "learning_rate": 2.843256590993907e-05, - "loss": 2.4339, - "step": 247350 - }, - { - "epoch": 0.43, - "learning_rate": 2.843169397001224e-05, - "loss": 2.373, - "step": 247360 - }, - { - "epoch": 0.43, - "learning_rate": 2.843082203008542e-05, - "loss": 2.3579, - "step": 247370 - }, - { - "epoch": 0.43, - "learning_rate": 2.842995009015859e-05, - "loss": 2.3893, - "step": 247380 - }, - { - "epoch": 0.43, - "learning_rate": 2.8429078150231764e-05, - "loss": 2.3315, - "step": 247390 - }, - { - "epoch": 0.43, - "learning_rate": 2.8428206210304935e-05, - "loss": 2.345, - "step": 247400 - }, - { - "epoch": 0.43, - "learning_rate": 2.842733427037811e-05, - "loss": 2.4022, - "step": 247410 - }, - { - "epoch": 0.43, - "learning_rate": 2.8426462330451282e-05, - "loss": 2.3633, - "step": 247420 - }, - { - "epoch": 0.43, - "learning_rate": 2.8425590390524453e-05, - "loss": 2.4421, - "step": 247430 - }, - { - "epoch": 0.43, - "learning_rate": 2.8424718450597633e-05, - "loss": 2.4681, - "step": 247440 - }, - { - "epoch": 0.43, - "learning_rate": 2.8423846510670804e-05, - "loss": 2.4905, - "step": 247450 - }, - { - "epoch": 0.43, - "learning_rate": 2.8422974570743977e-05, - "loss": 2.406, - "step": 247460 - }, - { - "epoch": 0.43, - "learning_rate": 2.8422102630817148e-05, - "loss": 2.3654, - "step": 247470 - }, - { - "epoch": 0.43, - "learning_rate": 2.842123069089032e-05, - "loss": 2.3935, - "step": 247480 - }, - { - "epoch": 0.43, - "learning_rate": 2.8420358750963495e-05, - "loss": 2.3913, - "step": 247490 - }, - { - "epoch": 0.43, - "learning_rate": 2.8419486811036666e-05, - "loss": 2.3924, - "step": 247500 - }, - { - "epoch": 0.43, - "learning_rate": 2.841861487110984e-05, - "loss": 2.3949, - "step": 247510 - }, - { - "epoch": 0.43, - "learning_rate": 2.8417742931183017e-05, - "loss": 2.3842, - "step": 247520 - }, - { - "epoch": 0.43, - "learning_rate": 2.841687099125619e-05, - "loss": 2.4553, - "step": 247530 - }, - { - "epoch": 0.43, - "learning_rate": 2.841599905132936e-05, - "loss": 2.3899, - "step": 247540 - }, - { - "epoch": 0.43, - "learning_rate": 2.8415127111402534e-05, - "loss": 2.5026, - "step": 247550 - }, - { - "epoch": 0.43, - "learning_rate": 2.8414255171475708e-05, - "loss": 2.4101, - "step": 247560 - }, - { - "epoch": 0.43, - "learning_rate": 2.841338323154888e-05, - "loss": 2.3494, - "step": 247570 - }, - { - "epoch": 0.43, - "learning_rate": 2.8412511291622052e-05, - "loss": 2.4109, - "step": 247580 - }, - { - "epoch": 0.43, - "learning_rate": 2.841163935169523e-05, - "loss": 2.5008, - "step": 247590 - }, - { - "epoch": 0.43, - "learning_rate": 2.8410767411768403e-05, - "loss": 2.3658, - "step": 247600 - }, - { - "epoch": 0.43, - "learning_rate": 2.8409895471841574e-05, - "loss": 2.393, - "step": 247610 - }, - { - "epoch": 0.43, - "learning_rate": 2.8409023531914747e-05, - "loss": 2.3815, - "step": 247620 - }, - { - "epoch": 0.43, - "learning_rate": 2.8408151591987918e-05, - "loss": 2.2829, - "step": 247630 - }, - { - "epoch": 0.43, - "learning_rate": 2.840727965206109e-05, - "loss": 2.3521, - "step": 247640 - }, - { - "epoch": 0.43, - "learning_rate": 2.8406407712134265e-05, - "loss": 2.321, - "step": 247650 - }, - { - "epoch": 0.43, - "learning_rate": 2.8405535772207436e-05, - "loss": 2.3331, - "step": 247660 - }, - { - "epoch": 0.43, - "learning_rate": 2.8404663832280616e-05, - "loss": 2.4419, - "step": 247670 - }, - { - "epoch": 0.43, - "learning_rate": 2.8403791892353787e-05, - "loss": 2.404, - "step": 247680 - }, - { - "epoch": 0.43, - "learning_rate": 2.840291995242696e-05, - "loss": 2.3056, - "step": 247690 - }, - { - "epoch": 0.43, - "learning_rate": 2.840204801250013e-05, - "loss": 2.4164, - "step": 247700 - }, - { - "epoch": 0.43, - "learning_rate": 2.8401176072573305e-05, - "loss": 2.369, - "step": 247710 - }, - { - "epoch": 0.43, - "learning_rate": 2.840030413264648e-05, - "loss": 2.5083, - "step": 247720 - }, - { - "epoch": 0.43, - "learning_rate": 2.839943219271965e-05, - "loss": 2.4005, - "step": 247730 - }, - { - "epoch": 0.43, - "learning_rate": 2.8398560252792826e-05, - "loss": 2.3664, - "step": 247740 - }, - { - "epoch": 0.43, - "learning_rate": 2.8397688312866e-05, - "loss": 2.3989, - "step": 247750 - }, - { - "epoch": 0.43, - "learning_rate": 2.8396816372939173e-05, - "loss": 2.4617, - "step": 247760 - }, - { - "epoch": 0.43, - "learning_rate": 2.8395944433012344e-05, - "loss": 2.4553, - "step": 247770 - }, - { - "epoch": 0.43, - "learning_rate": 2.8395072493085518e-05, - "loss": 2.3548, - "step": 247780 - }, - { - "epoch": 0.43, - "learning_rate": 2.8394200553158688e-05, - "loss": 2.3612, - "step": 247790 - }, - { - "epoch": 0.43, - "learning_rate": 2.8393328613231862e-05, - "loss": 2.4687, - "step": 247800 - }, - { - "epoch": 0.43, - "learning_rate": 2.839245667330504e-05, - "loss": 2.3697, - "step": 247810 - }, - { - "epoch": 0.43, - "learning_rate": 2.8391584733378213e-05, - "loss": 2.3686, - "step": 247820 - }, - { - "epoch": 0.43, - "learning_rate": 2.8390712793451386e-05, - "loss": 2.5143, - "step": 247830 - }, - { - "epoch": 0.43, - "learning_rate": 2.8389840853524557e-05, - "loss": 2.3993, - "step": 247840 - }, - { - "epoch": 0.43, - "learning_rate": 2.838896891359773e-05, - "loss": 2.3793, - "step": 247850 - }, - { - "epoch": 0.43, - "learning_rate": 2.83880969736709e-05, - "loss": 2.3831, - "step": 247860 - }, - { - "epoch": 0.43, - "learning_rate": 2.8387225033744075e-05, - "loss": 2.3943, - "step": 247870 - }, - { - "epoch": 0.43, - "learning_rate": 2.838635309381725e-05, - "loss": 2.4123, - "step": 247880 - }, - { - "epoch": 0.43, - "learning_rate": 2.8385481153890426e-05, - "loss": 2.3444, - "step": 247890 - }, - { - "epoch": 0.43, - "learning_rate": 2.8384609213963596e-05, - "loss": 2.5063, - "step": 247900 - }, - { - "epoch": 0.43, - "learning_rate": 2.838373727403677e-05, - "loss": 2.4652, - "step": 247910 - }, - { - "epoch": 0.43, - "learning_rate": 2.8382865334109944e-05, - "loss": 2.3035, - "step": 247920 - }, - { - "epoch": 0.43, - "learning_rate": 2.8381993394183114e-05, - "loss": 2.5045, - "step": 247930 - }, - { - "epoch": 0.43, - "learning_rate": 2.8381121454256288e-05, - "loss": 2.5161, - "step": 247940 - }, - { - "epoch": 0.43, - "learning_rate": 2.838024951432946e-05, - "loss": 2.442, - "step": 247950 - }, - { - "epoch": 0.43, - "learning_rate": 2.837937757440264e-05, - "loss": 2.4643, - "step": 247960 - }, - { - "epoch": 0.43, - "learning_rate": 2.837850563447581e-05, - "loss": 2.4149, - "step": 247970 - }, - { - "epoch": 0.43, - "learning_rate": 2.8377633694548983e-05, - "loss": 2.32, - "step": 247980 - }, - { - "epoch": 0.43, - "learning_rate": 2.8376761754622157e-05, - "loss": 2.3077, - "step": 247990 - }, - { - "epoch": 0.43, - "learning_rate": 2.8375889814695327e-05, - "loss": 2.3522, - "step": 248000 - }, - { - "epoch": 0.43, - "learning_rate": 2.83750178747685e-05, - "loss": 2.4452, - "step": 248010 - }, - { - "epoch": 0.43, - "learning_rate": 2.837414593484167e-05, - "loss": 2.3612, - "step": 248020 - }, - { - "epoch": 0.43, - "learning_rate": 2.8373273994914845e-05, - "loss": 2.4995, - "step": 248030 - }, - { - "epoch": 0.43, - "learning_rate": 2.8372402054988022e-05, - "loss": 2.3867, - "step": 248040 - }, - { - "epoch": 0.43, - "learning_rate": 2.8371530115061196e-05, - "loss": 2.386, - "step": 248050 - }, - { - "epoch": 0.43, - "learning_rate": 2.837065817513437e-05, - "loss": 2.479, - "step": 248060 - }, - { - "epoch": 0.43, - "learning_rate": 2.836978623520754e-05, - "loss": 2.4566, - "step": 248070 - }, - { - "epoch": 0.43, - "learning_rate": 2.8368914295280714e-05, - "loss": 2.3765, - "step": 248080 - }, - { - "epoch": 0.43, - "learning_rate": 2.8368042355353884e-05, - "loss": 2.3941, - "step": 248090 - }, - { - "epoch": 0.43, - "learning_rate": 2.8367170415427058e-05, - "loss": 2.5683, - "step": 248100 - }, - { - "epoch": 0.43, - "learning_rate": 2.8366298475500235e-05, - "loss": 2.3681, - "step": 248110 - }, - { - "epoch": 0.43, - "learning_rate": 2.836542653557341e-05, - "loss": 2.397, - "step": 248120 - }, - { - "epoch": 0.43, - "learning_rate": 2.836455459564658e-05, - "loss": 2.4261, - "step": 248130 - }, - { - "epoch": 0.43, - "learning_rate": 2.8363682655719753e-05, - "loss": 2.3197, - "step": 248140 - }, - { - "epoch": 0.43, - "learning_rate": 2.8362810715792927e-05, - "loss": 2.4592, - "step": 248150 - }, - { - "epoch": 0.43, - "learning_rate": 2.8361938775866097e-05, - "loss": 2.3454, - "step": 248160 - }, - { - "epoch": 0.43, - "learning_rate": 2.836106683593927e-05, - "loss": 2.4207, - "step": 248170 - }, - { - "epoch": 0.43, - "learning_rate": 2.8360194896012445e-05, - "loss": 2.3068, - "step": 248180 - }, - { - "epoch": 0.43, - "learning_rate": 2.8359322956085622e-05, - "loss": 2.4476, - "step": 248190 - }, - { - "epoch": 0.43, - "learning_rate": 2.8358451016158792e-05, - "loss": 2.4316, - "step": 248200 - }, - { - "epoch": 0.43, - "learning_rate": 2.8357579076231966e-05, - "loss": 2.4903, - "step": 248210 - }, - { - "epoch": 0.43, - "learning_rate": 2.835670713630514e-05, - "loss": 2.399, - "step": 248220 - }, - { - "epoch": 0.43, - "learning_rate": 2.835583519637831e-05, - "loss": 2.3034, - "step": 248230 - }, - { - "epoch": 0.43, - "learning_rate": 2.8354963256451484e-05, - "loss": 2.3937, - "step": 248240 - }, - { - "epoch": 0.43, - "learning_rate": 2.8354091316524654e-05, - "loss": 2.4275, - "step": 248250 - }, - { - "epoch": 0.43, - "learning_rate": 2.8353219376597835e-05, - "loss": 2.3094, - "step": 248260 - }, - { - "epoch": 0.43, - "learning_rate": 2.8352347436671005e-05, - "loss": 2.5134, - "step": 248270 - }, - { - "epoch": 0.43, - "learning_rate": 2.835147549674418e-05, - "loss": 2.3144, - "step": 248280 - }, - { - "epoch": 0.43, - "learning_rate": 2.8350603556817353e-05, - "loss": 2.3895, - "step": 248290 - }, - { - "epoch": 0.43, - "learning_rate": 2.8349731616890523e-05, - "loss": 2.429, - "step": 248300 - }, - { - "epoch": 0.43, - "learning_rate": 2.8348859676963697e-05, - "loss": 2.4318, - "step": 248310 - }, - { - "epoch": 0.43, - "learning_rate": 2.8347987737036867e-05, - "loss": 2.3973, - "step": 248320 - }, - { - "epoch": 0.43, - "learning_rate": 2.834711579711004e-05, - "loss": 2.3875, - "step": 248330 - }, - { - "epoch": 0.43, - "learning_rate": 2.8346243857183218e-05, - "loss": 2.4332, - "step": 248340 - }, - { - "epoch": 0.43, - "learning_rate": 2.8345371917256392e-05, - "loss": 2.4313, - "step": 248350 - }, - { - "epoch": 0.43, - "learning_rate": 2.8344499977329562e-05, - "loss": 2.3162, - "step": 248360 - }, - { - "epoch": 0.43, - "learning_rate": 2.8343628037402736e-05, - "loss": 2.2923, - "step": 248370 - }, - { - "epoch": 0.43, - "learning_rate": 2.834275609747591e-05, - "loss": 2.2926, - "step": 248380 - }, - { - "epoch": 0.43, - "learning_rate": 2.834188415754908e-05, - "loss": 2.477, - "step": 248390 - }, - { - "epoch": 0.43, - "learning_rate": 2.8341012217622254e-05, - "loss": 2.4268, - "step": 248400 - }, - { - "epoch": 0.43, - "learning_rate": 2.834014027769543e-05, - "loss": 2.272, - "step": 248410 - }, - { - "epoch": 0.43, - "learning_rate": 2.8339268337768605e-05, - "loss": 2.3832, - "step": 248420 - }, - { - "epoch": 0.43, - "learning_rate": 2.8338396397841775e-05, - "loss": 2.4697, - "step": 248430 - }, - { - "epoch": 0.43, - "learning_rate": 2.833752445791495e-05, - "loss": 2.3767, - "step": 248440 - }, - { - "epoch": 0.43, - "learning_rate": 2.8336652517988123e-05, - "loss": 2.402, - "step": 248450 - }, - { - "epoch": 0.43, - "learning_rate": 2.8335780578061293e-05, - "loss": 2.4095, - "step": 248460 - }, - { - "epoch": 0.43, - "learning_rate": 2.8334908638134467e-05, - "loss": 2.4492, - "step": 248470 - }, - { - "epoch": 0.43, - "learning_rate": 2.8334036698207644e-05, - "loss": 2.3899, - "step": 248480 - }, - { - "epoch": 0.43, - "learning_rate": 2.8333164758280818e-05, - "loss": 2.3423, - "step": 248490 - }, - { - "epoch": 0.43, - "learning_rate": 2.833229281835399e-05, - "loss": 2.2997, - "step": 248500 - }, - { - "epoch": 0.43, - "learning_rate": 2.8331420878427162e-05, - "loss": 2.3794, - "step": 248510 - }, - { - "epoch": 0.43, - "learning_rate": 2.8330548938500333e-05, - "loss": 2.3663, - "step": 248520 - }, - { - "epoch": 0.43, - "learning_rate": 2.8329676998573506e-05, - "loss": 2.4387, - "step": 248530 - }, - { - "epoch": 0.43, - "learning_rate": 2.832880505864668e-05, - "loss": 2.3133, - "step": 248540 - }, - { - "epoch": 0.43, - "learning_rate": 2.832793311871985e-05, - "loss": 2.3398, - "step": 248550 - }, - { - "epoch": 0.43, - "learning_rate": 2.832706117879303e-05, - "loss": 2.4907, - "step": 248560 - }, - { - "epoch": 0.43, - "learning_rate": 2.83261892388662e-05, - "loss": 2.3282, - "step": 248570 - }, - { - "epoch": 0.43, - "learning_rate": 2.8325317298939375e-05, - "loss": 2.3631, - "step": 248580 - }, - { - "epoch": 0.43, - "learning_rate": 2.8324445359012546e-05, - "loss": 2.4429, - "step": 248590 - }, - { - "epoch": 0.43, - "learning_rate": 2.832357341908572e-05, - "loss": 2.5103, - "step": 248600 - }, - { - "epoch": 0.43, - "learning_rate": 2.8322701479158893e-05, - "loss": 2.3561, - "step": 248610 - }, - { - "epoch": 0.43, - "learning_rate": 2.8321829539232063e-05, - "loss": 2.3621, - "step": 248620 - }, - { - "epoch": 0.43, - "learning_rate": 2.832095759930524e-05, - "loss": 2.3646, - "step": 248630 - }, - { - "epoch": 0.43, - "learning_rate": 2.8320085659378414e-05, - "loss": 2.3799, - "step": 248640 - }, - { - "epoch": 0.43, - "learning_rate": 2.8319213719451588e-05, - "loss": 2.3734, - "step": 248650 - }, - { - "epoch": 0.43, - "learning_rate": 2.831834177952476e-05, - "loss": 2.4498, - "step": 248660 - }, - { - "epoch": 0.43, - "learning_rate": 2.8317469839597932e-05, - "loss": 2.3996, - "step": 248670 - }, - { - "epoch": 0.43, - "learning_rate": 2.8316597899671106e-05, - "loss": 2.365, - "step": 248680 - }, - { - "epoch": 0.43, - "learning_rate": 2.8315725959744276e-05, - "loss": 2.3475, - "step": 248690 - }, - { - "epoch": 0.43, - "learning_rate": 2.831485401981745e-05, - "loss": 2.4035, - "step": 248700 - }, - { - "epoch": 0.43, - "learning_rate": 2.8313982079890627e-05, - "loss": 2.3927, - "step": 248710 - }, - { - "epoch": 0.43, - "learning_rate": 2.83131101399638e-05, - "loss": 2.3642, - "step": 248720 - }, - { - "epoch": 0.43, - "learning_rate": 2.831223820003697e-05, - "loss": 2.4836, - "step": 248730 - }, - { - "epoch": 0.43, - "learning_rate": 2.8311366260110145e-05, - "loss": 2.3605, - "step": 248740 - }, - { - "epoch": 0.43, - "learning_rate": 2.8310494320183316e-05, - "loss": 2.5012, - "step": 248750 - }, - { - "epoch": 0.43, - "learning_rate": 2.830962238025649e-05, - "loss": 2.3535, - "step": 248760 - }, - { - "epoch": 0.43, - "learning_rate": 2.8308750440329663e-05, - "loss": 2.3435, - "step": 248770 - }, - { - "epoch": 0.43, - "learning_rate": 2.830787850040284e-05, - "loss": 2.2883, - "step": 248780 - }, - { - "epoch": 0.43, - "learning_rate": 2.8307006560476014e-05, - "loss": 2.4659, - "step": 248790 - }, - { - "epoch": 0.43, - "learning_rate": 2.8306134620549185e-05, - "loss": 2.4712, - "step": 248800 - }, - { - "epoch": 0.43, - "learning_rate": 2.830526268062236e-05, - "loss": 2.4074, - "step": 248810 - }, - { - "epoch": 0.43, - "learning_rate": 2.830439074069553e-05, - "loss": 2.455, - "step": 248820 - }, - { - "epoch": 0.43, - "learning_rate": 2.8303518800768702e-05, - "loss": 2.4181, - "step": 248830 - }, - { - "epoch": 0.43, - "learning_rate": 2.8302646860841876e-05, - "loss": 2.3692, - "step": 248840 - }, - { - "epoch": 0.43, - "learning_rate": 2.8301774920915047e-05, - "loss": 2.2579, - "step": 248850 - }, - { - "epoch": 0.43, - "learning_rate": 2.8300902980988224e-05, - "loss": 2.3381, - "step": 248860 - }, - { - "epoch": 0.43, - "learning_rate": 2.8300031041061398e-05, - "loss": 2.3975, - "step": 248870 - }, - { - "epoch": 0.43, - "learning_rate": 2.829915910113457e-05, - "loss": 2.4753, - "step": 248880 - }, - { - "epoch": 0.43, - "learning_rate": 2.829828716120774e-05, - "loss": 2.3337, - "step": 248890 - }, - { - "epoch": 0.43, - "learning_rate": 2.8297415221280915e-05, - "loss": 2.3176, - "step": 248900 - }, - { - "epoch": 0.43, - "learning_rate": 2.829654328135409e-05, - "loss": 2.3428, - "step": 248910 - }, - { - "epoch": 0.43, - "learning_rate": 2.829567134142726e-05, - "loss": 2.3428, - "step": 248920 - }, - { - "epoch": 0.43, - "learning_rate": 2.8294799401500437e-05, - "loss": 2.2915, - "step": 248930 - }, - { - "epoch": 0.43, - "learning_rate": 2.829392746157361e-05, - "loss": 2.4295, - "step": 248940 - }, - { - "epoch": 0.43, - "learning_rate": 2.8293055521646784e-05, - "loss": 2.4371, - "step": 248950 - }, - { - "epoch": 0.43, - "learning_rate": 2.8292183581719955e-05, - "loss": 2.297, - "step": 248960 - }, - { - "epoch": 0.43, - "learning_rate": 2.829131164179313e-05, - "loss": 2.2187, - "step": 248970 - }, - { - "epoch": 0.43, - "learning_rate": 2.82904397018663e-05, - "loss": 2.4937, - "step": 248980 - }, - { - "epoch": 0.43, - "learning_rate": 2.8289567761939473e-05, - "loss": 2.4701, - "step": 248990 - }, - { - "epoch": 0.43, - "learning_rate": 2.8288695822012646e-05, - "loss": 2.2846, - "step": 249000 - }, - { - "epoch": 0.43, - "learning_rate": 2.8287823882085824e-05, - "loss": 2.458, - "step": 249010 - }, - { - "epoch": 0.43, - "learning_rate": 2.8286951942158997e-05, - "loss": 2.344, - "step": 249020 - }, - { - "epoch": 0.43, - "learning_rate": 2.8286080002232168e-05, - "loss": 2.4567, - "step": 249030 - }, - { - "epoch": 0.43, - "learning_rate": 2.828520806230534e-05, - "loss": 2.47, - "step": 249040 - }, - { - "epoch": 0.43, - "learning_rate": 2.8284336122378512e-05, - "loss": 2.5644, - "step": 249050 - }, - { - "epoch": 0.43, - "learning_rate": 2.8283464182451686e-05, - "loss": 2.3866, - "step": 249060 - }, - { - "epoch": 0.43, - "learning_rate": 2.828259224252486e-05, - "loss": 2.4076, - "step": 249070 - }, - { - "epoch": 0.43, - "learning_rate": 2.8281720302598037e-05, - "loss": 2.398, - "step": 249080 - }, - { - "epoch": 0.43, - "learning_rate": 2.8280848362671207e-05, - "loss": 2.4526, - "step": 249090 - }, - { - "epoch": 0.43, - "learning_rate": 2.827997642274438e-05, - "loss": 2.4631, - "step": 249100 - }, - { - "epoch": 0.43, - "learning_rate": 2.8279104482817554e-05, - "loss": 2.3608, - "step": 249110 - }, - { - "epoch": 0.43, - "learning_rate": 2.8278232542890725e-05, - "loss": 2.4666, - "step": 249120 - }, - { - "epoch": 0.43, - "learning_rate": 2.82773606029639e-05, - "loss": 2.431, - "step": 249130 - }, - { - "epoch": 0.43, - "learning_rate": 2.827648866303707e-05, - "loss": 2.3059, - "step": 249140 - }, - { - "epoch": 0.43, - "learning_rate": 2.827561672311025e-05, - "loss": 2.3784, - "step": 249150 - }, - { - "epoch": 0.43, - "learning_rate": 2.827474478318342e-05, - "loss": 2.3872, - "step": 249160 - }, - { - "epoch": 0.43, - "learning_rate": 2.8273872843256594e-05, - "loss": 2.4111, - "step": 249170 - }, - { - "epoch": 0.43, - "learning_rate": 2.8273000903329767e-05, - "loss": 2.4353, - "step": 249180 - }, - { - "epoch": 0.43, - "learning_rate": 2.8272128963402938e-05, - "loss": 2.3155, - "step": 249190 - }, - { - "epoch": 0.43, - "learning_rate": 2.827125702347611e-05, - "loss": 2.3918, - "step": 249200 - }, - { - "epoch": 0.43, - "learning_rate": 2.8270385083549282e-05, - "loss": 2.325, - "step": 249210 - }, - { - "epoch": 0.43, - "learning_rate": 2.8269513143622456e-05, - "loss": 2.4625, - "step": 249220 - }, - { - "epoch": 0.43, - "learning_rate": 2.8268641203695633e-05, - "loss": 2.3801, - "step": 249230 - }, - { - "epoch": 0.43, - "learning_rate": 2.8267769263768807e-05, - "loss": 2.4026, - "step": 249240 - }, - { - "epoch": 0.43, - "learning_rate": 2.8266897323841977e-05, - "loss": 2.3312, - "step": 249250 - }, - { - "epoch": 0.43, - "learning_rate": 2.826602538391515e-05, - "loss": 2.4112, - "step": 249260 - }, - { - "epoch": 0.43, - "learning_rate": 2.8265153443988325e-05, - "loss": 2.3629, - "step": 249270 - }, - { - "epoch": 0.43, - "learning_rate": 2.8264281504061495e-05, - "loss": 2.4734, - "step": 249280 - }, - { - "epoch": 0.43, - "learning_rate": 2.826340956413467e-05, - "loss": 2.2905, - "step": 249290 - }, - { - "epoch": 0.43, - "learning_rate": 2.8262537624207846e-05, - "loss": 2.3896, - "step": 249300 - }, - { - "epoch": 0.43, - "learning_rate": 2.826166568428102e-05, - "loss": 2.3844, - "step": 249310 - }, - { - "epoch": 0.43, - "learning_rate": 2.826079374435419e-05, - "loss": 2.3669, - "step": 249320 - }, - { - "epoch": 0.43, - "learning_rate": 2.8259921804427364e-05, - "loss": 2.335, - "step": 249330 - }, - { - "epoch": 0.43, - "learning_rate": 2.8259049864500538e-05, - "loss": 2.3055, - "step": 249340 - }, - { - "epoch": 0.43, - "learning_rate": 2.8258177924573708e-05, - "loss": 2.4332, - "step": 249350 - }, - { - "epoch": 0.43, - "learning_rate": 2.8257305984646882e-05, - "loss": 2.5294, - "step": 249360 - }, - { - "epoch": 0.43, - "learning_rate": 2.8256434044720052e-05, - "loss": 2.4437, - "step": 249370 - }, - { - "epoch": 0.43, - "learning_rate": 2.8255562104793233e-05, - "loss": 2.5043, - "step": 249380 - }, - { - "epoch": 0.43, - "learning_rate": 2.8254690164866403e-05, - "loss": 2.3785, - "step": 249390 - }, - { - "epoch": 0.43, - "learning_rate": 2.8253818224939577e-05, - "loss": 2.5137, - "step": 249400 - }, - { - "epoch": 0.43, - "learning_rate": 2.825294628501275e-05, - "loss": 2.384, - "step": 249410 - }, - { - "epoch": 0.43, - "learning_rate": 2.825207434508592e-05, - "loss": 2.413, - "step": 249420 - }, - { - "epoch": 0.43, - "learning_rate": 2.8251202405159095e-05, - "loss": 2.3799, - "step": 249430 - }, - { - "epoch": 0.43, - "learning_rate": 2.8250330465232265e-05, - "loss": 2.3674, - "step": 249440 - }, - { - "epoch": 0.44, - "learning_rate": 2.8249458525305446e-05, - "loss": 2.3922, - "step": 249450 - }, - { - "epoch": 0.44, - "learning_rate": 2.8248586585378616e-05, - "loss": 2.4736, - "step": 249460 - }, - { - "epoch": 0.44, - "learning_rate": 2.824771464545179e-05, - "loss": 2.3516, - "step": 249470 - }, - { - "epoch": 0.44, - "learning_rate": 2.824684270552496e-05, - "loss": 2.4209, - "step": 249480 - }, - { - "epoch": 0.44, - "learning_rate": 2.8245970765598134e-05, - "loss": 2.3157, - "step": 249490 - }, - { - "epoch": 0.44, - "learning_rate": 2.8245098825671308e-05, - "loss": 2.3629, - "step": 249500 - }, - { - "epoch": 0.44, - "learning_rate": 2.8244226885744478e-05, - "loss": 2.3229, - "step": 249510 - }, - { - "epoch": 0.44, - "learning_rate": 2.8243354945817652e-05, - "loss": 2.3577, - "step": 249520 - }, - { - "epoch": 0.44, - "learning_rate": 2.824248300589083e-05, - "loss": 2.429, - "step": 249530 - }, - { - "epoch": 0.44, - "learning_rate": 2.8241611065964003e-05, - "loss": 2.3918, - "step": 249540 - }, - { - "epoch": 0.44, - "learning_rate": 2.8240739126037173e-05, - "loss": 2.4326, - "step": 249550 - }, - { - "epoch": 0.44, - "learning_rate": 2.8239867186110347e-05, - "loss": 2.3339, - "step": 249560 - }, - { - "epoch": 0.44, - "learning_rate": 2.823899524618352e-05, - "loss": 2.38, - "step": 249570 - }, - { - "epoch": 0.44, - "learning_rate": 2.823812330625669e-05, - "loss": 2.3335, - "step": 249580 - }, - { - "epoch": 0.44, - "learning_rate": 2.8237251366329865e-05, - "loss": 2.3282, - "step": 249590 - }, - { - "epoch": 0.44, - "learning_rate": 2.8236379426403042e-05, - "loss": 2.3702, - "step": 249600 - }, - { - "epoch": 0.44, - "learning_rate": 2.8235507486476216e-05, - "loss": 2.4401, - "step": 249610 - }, - { - "epoch": 0.44, - "learning_rate": 2.8234635546549386e-05, - "loss": 2.5287, - "step": 249620 - }, - { - "epoch": 0.44, - "learning_rate": 2.823376360662256e-05, - "loss": 2.4044, - "step": 249630 - }, - { - "epoch": 0.44, - "learning_rate": 2.8232891666695734e-05, - "loss": 2.3797, - "step": 249640 - }, - { - "epoch": 0.44, - "learning_rate": 2.8232019726768904e-05, - "loss": 2.3912, - "step": 249650 - }, - { - "epoch": 0.44, - "learning_rate": 2.8231147786842078e-05, - "loss": 2.2302, - "step": 249660 - }, - { - "epoch": 0.44, - "learning_rate": 2.823027584691525e-05, - "loss": 2.4194, - "step": 249670 - }, - { - "epoch": 0.44, - "learning_rate": 2.822940390698843e-05, - "loss": 2.3336, - "step": 249680 - }, - { - "epoch": 0.44, - "learning_rate": 2.82285319670616e-05, - "loss": 2.3014, - "step": 249690 - }, - { - "epoch": 0.44, - "learning_rate": 2.8227660027134773e-05, - "loss": 2.3539, - "step": 249700 - }, - { - "epoch": 0.44, - "learning_rate": 2.8226788087207943e-05, - "loss": 2.4192, - "step": 249710 - }, - { - "epoch": 0.44, - "learning_rate": 2.8225916147281117e-05, - "loss": 2.409, - "step": 249720 - }, - { - "epoch": 0.44, - "learning_rate": 2.822504420735429e-05, - "loss": 2.3183, - "step": 249730 - }, - { - "epoch": 0.44, - "learning_rate": 2.822417226742746e-05, - "loss": 2.365, - "step": 249740 - }, - { - "epoch": 0.44, - "learning_rate": 2.8223300327500642e-05, - "loss": 2.3742, - "step": 249750 - }, - { - "epoch": 0.44, - "learning_rate": 2.8222428387573812e-05, - "loss": 2.4174, - "step": 249760 - }, - { - "epoch": 0.44, - "learning_rate": 2.8221556447646986e-05, - "loss": 2.3699, - "step": 249770 - }, - { - "epoch": 0.44, - "learning_rate": 2.8220684507720156e-05, - "loss": 2.4081, - "step": 249780 - }, - { - "epoch": 0.44, - "learning_rate": 2.821981256779333e-05, - "loss": 2.4019, - "step": 249790 - }, - { - "epoch": 0.44, - "learning_rate": 2.8218940627866504e-05, - "loss": 2.3005, - "step": 249800 - }, - { - "epoch": 0.44, - "learning_rate": 2.8218068687939674e-05, - "loss": 2.3798, - "step": 249810 - }, - { - "epoch": 0.44, - "learning_rate": 2.821719674801285e-05, - "loss": 2.275, - "step": 249820 - }, - { - "epoch": 0.44, - "learning_rate": 2.8216324808086025e-05, - "loss": 2.3642, - "step": 249830 - }, - { - "epoch": 0.44, - "learning_rate": 2.82154528681592e-05, - "loss": 2.2631, - "step": 249840 - }, - { - "epoch": 0.44, - "learning_rate": 2.821458092823237e-05, - "loss": 2.3691, - "step": 249850 - }, - { - "epoch": 0.44, - "learning_rate": 2.8213708988305543e-05, - "loss": 2.3994, - "step": 249860 - }, - { - "epoch": 0.44, - "learning_rate": 2.8212837048378714e-05, - "loss": 2.3554, - "step": 249870 - }, - { - "epoch": 0.44, - "learning_rate": 2.8211965108451887e-05, - "loss": 2.223, - "step": 249880 - }, - { - "epoch": 0.44, - "learning_rate": 2.821109316852506e-05, - "loss": 2.3068, - "step": 249890 - }, - { - "epoch": 0.44, - "learning_rate": 2.8210221228598238e-05, - "loss": 2.3744, - "step": 249900 - }, - { - "epoch": 0.44, - "learning_rate": 2.8209349288671412e-05, - "loss": 2.4611, - "step": 249910 - }, - { - "epoch": 0.44, - "learning_rate": 2.8208477348744582e-05, - "loss": 2.4337, - "step": 249920 - }, - { - "epoch": 0.44, - "learning_rate": 2.8207605408817756e-05, - "loss": 2.3842, - "step": 249930 - }, - { - "epoch": 0.44, - "learning_rate": 2.8206733468890927e-05, - "loss": 2.4696, - "step": 249940 - }, - { - "epoch": 0.44, - "learning_rate": 2.82058615289641e-05, - "loss": 2.3131, - "step": 249950 - }, - { - "epoch": 0.44, - "learning_rate": 2.8204989589037274e-05, - "loss": 2.3421, - "step": 249960 - }, - { - "epoch": 0.44, - "learning_rate": 2.820411764911045e-05, - "loss": 2.3899, - "step": 249970 - }, - { - "epoch": 0.44, - "learning_rate": 2.820324570918362e-05, - "loss": 2.3702, - "step": 249980 - }, - { - "epoch": 0.44, - "learning_rate": 2.8202373769256795e-05, - "loss": 2.3528, - "step": 249990 - }, - { - "epoch": 0.44, - "learning_rate": 2.820150182932997e-05, - "loss": 2.4109, - "step": 250000 - }, - { - "epoch": 0.44, - "learning_rate": 2.820062988940314e-05, - "loss": 2.4066, - "step": 250010 - }, - { - "epoch": 0.44, - "learning_rate": 2.8199757949476313e-05, - "loss": 2.3437, - "step": 250020 - }, - { - "epoch": 0.44, - "learning_rate": 2.8198886009549487e-05, - "loss": 2.4409, - "step": 250030 - }, - { - "epoch": 0.44, - "learning_rate": 2.8198014069622657e-05, - "loss": 2.4333, - "step": 250040 - }, - { - "epoch": 0.44, - "learning_rate": 2.8197142129695835e-05, - "loss": 2.3758, - "step": 250050 - }, - { - "epoch": 0.44, - "learning_rate": 2.819627018976901e-05, - "loss": 2.4991, - "step": 250060 - }, - { - "epoch": 0.44, - "learning_rate": 2.8195398249842182e-05, - "loss": 2.3851, - "step": 250070 - }, - { - "epoch": 0.44, - "learning_rate": 2.8194526309915353e-05, - "loss": 2.4059, - "step": 250080 - }, - { - "epoch": 0.44, - "learning_rate": 2.8193654369988526e-05, - "loss": 2.3711, - "step": 250090 - }, - { - "epoch": 0.44, - "learning_rate": 2.8192782430061697e-05, - "loss": 2.283, - "step": 250100 - }, - { - "epoch": 0.44, - "learning_rate": 2.819191049013487e-05, - "loss": 2.3302, - "step": 250110 - }, - { - "epoch": 0.44, - "learning_rate": 2.8191038550208048e-05, - "loss": 2.3547, - "step": 250120 - }, - { - "epoch": 0.44, - "learning_rate": 2.819016661028122e-05, - "loss": 2.3298, - "step": 250130 - }, - { - "epoch": 0.44, - "learning_rate": 2.8189294670354395e-05, - "loss": 2.3518, - "step": 250140 - }, - { - "epoch": 0.44, - "learning_rate": 2.8188422730427566e-05, - "loss": 2.4255, - "step": 250150 - }, - { - "epoch": 0.44, - "learning_rate": 2.818755079050074e-05, - "loss": 2.4486, - "step": 250160 - }, - { - "epoch": 0.44, - "learning_rate": 2.818667885057391e-05, - "loss": 2.3114, - "step": 250170 - }, - { - "epoch": 0.44, - "learning_rate": 2.8185806910647083e-05, - "loss": 2.4562, - "step": 250180 - }, - { - "epoch": 0.44, - "learning_rate": 2.8184934970720257e-05, - "loss": 2.3166, - "step": 250190 - }, - { - "epoch": 0.44, - "learning_rate": 2.8184063030793434e-05, - "loss": 2.2788, - "step": 250200 - }, - { - "epoch": 0.44, - "learning_rate": 2.8183191090866605e-05, - "loss": 2.3477, - "step": 250210 - }, - { - "epoch": 0.44, - "learning_rate": 2.818231915093978e-05, - "loss": 2.3876, - "step": 250220 - }, - { - "epoch": 0.44, - "learning_rate": 2.8181447211012952e-05, - "loss": 2.3946, - "step": 250230 - }, - { - "epoch": 0.44, - "learning_rate": 2.8180575271086123e-05, - "loss": 2.3983, - "step": 250240 - }, - { - "epoch": 0.44, - "learning_rate": 2.8179703331159296e-05, - "loss": 2.3794, - "step": 250250 - }, - { - "epoch": 0.44, - "learning_rate": 2.817883139123247e-05, - "loss": 2.3631, - "step": 250260 - }, - { - "epoch": 0.44, - "learning_rate": 2.8177959451305647e-05, - "loss": 2.3901, - "step": 250270 - }, - { - "epoch": 0.44, - "learning_rate": 2.8177087511378818e-05, - "loss": 2.4371, - "step": 250280 - }, - { - "epoch": 0.44, - "learning_rate": 2.817621557145199e-05, - "loss": 2.3947, - "step": 250290 - }, - { - "epoch": 0.44, - "learning_rate": 2.8175343631525165e-05, - "loss": 2.3943, - "step": 250300 - }, - { - "epoch": 0.44, - "learning_rate": 2.8174471691598336e-05, - "loss": 2.4379, - "step": 250310 - }, - { - "epoch": 0.44, - "learning_rate": 2.817359975167151e-05, - "loss": 2.3251, - "step": 250320 - }, - { - "epoch": 0.44, - "learning_rate": 2.817272781174468e-05, - "loss": 2.4425, - "step": 250330 - }, - { - "epoch": 0.44, - "learning_rate": 2.817185587181786e-05, - "loss": 2.5714, - "step": 250340 - }, - { - "epoch": 0.44, - "learning_rate": 2.817098393189103e-05, - "loss": 2.1696, - "step": 250350 - }, - { - "epoch": 0.44, - "learning_rate": 2.8170111991964205e-05, - "loss": 2.4102, - "step": 250360 - }, - { - "epoch": 0.44, - "learning_rate": 2.816924005203738e-05, - "loss": 2.4223, - "step": 250370 - }, - { - "epoch": 0.44, - "learning_rate": 2.816836811211055e-05, - "loss": 2.3931, - "step": 250380 - }, - { - "epoch": 0.44, - "learning_rate": 2.8167496172183722e-05, - "loss": 2.4592, - "step": 250390 - }, - { - "epoch": 0.44, - "learning_rate": 2.8166624232256893e-05, - "loss": 2.3698, - "step": 250400 - }, - { - "epoch": 0.44, - "learning_rate": 2.8165752292330067e-05, - "loss": 2.4895, - "step": 250410 - }, - { - "epoch": 0.44, - "learning_rate": 2.8164880352403244e-05, - "loss": 2.316, - "step": 250420 - }, - { - "epoch": 0.44, - "learning_rate": 2.8164008412476418e-05, - "loss": 2.4881, - "step": 250430 - }, - { - "epoch": 0.44, - "learning_rate": 2.8163136472549588e-05, - "loss": 2.389, - "step": 250440 - }, - { - "epoch": 0.44, - "learning_rate": 2.8162264532622762e-05, - "loss": 2.4297, - "step": 250450 - }, - { - "epoch": 0.44, - "learning_rate": 2.8161392592695935e-05, - "loss": 2.3178, - "step": 250460 - }, - { - "epoch": 0.44, - "learning_rate": 2.8160520652769106e-05, - "loss": 2.3214, - "step": 250470 - }, - { - "epoch": 0.44, - "learning_rate": 2.815964871284228e-05, - "loss": 2.3869, - "step": 250480 - }, - { - "epoch": 0.44, - "learning_rate": 2.8158776772915457e-05, - "loss": 2.3227, - "step": 250490 - }, - { - "epoch": 0.44, - "learning_rate": 2.815790483298863e-05, - "loss": 2.3362, - "step": 250500 - }, - { - "epoch": 0.44, - "learning_rate": 2.81570328930618e-05, - "loss": 2.3021, - "step": 250510 - }, - { - "epoch": 0.44, - "learning_rate": 2.8156160953134975e-05, - "loss": 2.4497, - "step": 250520 - }, - { - "epoch": 0.44, - "learning_rate": 2.815528901320815e-05, - "loss": 2.3597, - "step": 250530 - }, - { - "epoch": 0.44, - "learning_rate": 2.815441707328132e-05, - "loss": 2.4744, - "step": 250540 - }, - { - "epoch": 0.44, - "learning_rate": 2.8153545133354493e-05, - "loss": 2.3717, - "step": 250550 - }, - { - "epoch": 0.44, - "learning_rate": 2.8152673193427663e-05, - "loss": 2.4429, - "step": 250560 - }, - { - "epoch": 0.44, - "learning_rate": 2.8151801253500844e-05, - "loss": 2.4086, - "step": 250570 - }, - { - "epoch": 0.44, - "learning_rate": 2.8150929313574014e-05, - "loss": 2.4956, - "step": 250580 - }, - { - "epoch": 0.44, - "learning_rate": 2.8150057373647188e-05, - "loss": 2.4202, - "step": 250590 - }, - { - "epoch": 0.44, - "learning_rate": 2.8149185433720358e-05, - "loss": 2.4012, - "step": 250600 - }, - { - "epoch": 0.44, - "learning_rate": 2.8148313493793532e-05, - "loss": 2.4827, - "step": 250610 - }, - { - "epoch": 0.44, - "learning_rate": 2.8147441553866706e-05, - "loss": 2.3177, - "step": 250620 - }, - { - "epoch": 0.44, - "learning_rate": 2.8146569613939876e-05, - "loss": 2.4161, - "step": 250630 - }, - { - "epoch": 0.44, - "learning_rate": 2.8145697674013057e-05, - "loss": 2.4524, - "step": 250640 - }, - { - "epoch": 0.44, - "learning_rate": 2.8144825734086227e-05, - "loss": 2.2542, - "step": 250650 - }, - { - "epoch": 0.44, - "learning_rate": 2.81439537941594e-05, - "loss": 2.3453, - "step": 250660 - }, - { - "epoch": 0.44, - "learning_rate": 2.814308185423257e-05, - "loss": 2.3545, - "step": 250670 - }, - { - "epoch": 0.44, - "learning_rate": 2.8142209914305745e-05, - "loss": 2.4145, - "step": 250680 - }, - { - "epoch": 0.44, - "learning_rate": 2.814133797437892e-05, - "loss": 2.4047, - "step": 250690 - }, - { - "epoch": 0.44, - "learning_rate": 2.814046603445209e-05, - "loss": 2.24, - "step": 250700 - }, - { - "epoch": 0.44, - "learning_rate": 2.8139594094525263e-05, - "loss": 2.3585, - "step": 250710 - }, - { - "epoch": 0.44, - "learning_rate": 2.813872215459844e-05, - "loss": 2.336, - "step": 250720 - }, - { - "epoch": 0.44, - "learning_rate": 2.8137850214671614e-05, - "loss": 2.4156, - "step": 250730 - }, - { - "epoch": 0.44, - "learning_rate": 2.8136978274744784e-05, - "loss": 2.3499, - "step": 250740 - }, - { - "epoch": 0.44, - "learning_rate": 2.8136106334817958e-05, - "loss": 2.3701, - "step": 250750 - }, - { - "epoch": 0.44, - "learning_rate": 2.813523439489113e-05, - "loss": 2.3332, - "step": 250760 - }, - { - "epoch": 0.44, - "learning_rate": 2.8134362454964302e-05, - "loss": 2.3162, - "step": 250770 - }, - { - "epoch": 0.44, - "learning_rate": 2.8133490515037476e-05, - "loss": 2.3157, - "step": 250780 - }, - { - "epoch": 0.44, - "learning_rate": 2.8132618575110653e-05, - "loss": 2.3869, - "step": 250790 - }, - { - "epoch": 0.44, - "learning_rate": 2.8131746635183827e-05, - "loss": 2.3601, - "step": 250800 - }, - { - "epoch": 0.44, - "learning_rate": 2.8130874695256997e-05, - "loss": 2.4291, - "step": 250810 - }, - { - "epoch": 0.44, - "learning_rate": 2.813000275533017e-05, - "loss": 2.4127, - "step": 250820 - }, - { - "epoch": 0.44, - "learning_rate": 2.812913081540334e-05, - "loss": 2.3183, - "step": 250830 - }, - { - "epoch": 0.44, - "learning_rate": 2.8128258875476515e-05, - "loss": 2.4982, - "step": 250840 - }, - { - "epoch": 0.44, - "learning_rate": 2.812738693554969e-05, - "loss": 2.4576, - "step": 250850 - }, - { - "epoch": 0.44, - "learning_rate": 2.812651499562286e-05, - "loss": 2.4828, - "step": 250860 - }, - { - "epoch": 0.44, - "learning_rate": 2.812564305569604e-05, - "loss": 2.5099, - "step": 250870 - }, - { - "epoch": 0.44, - "learning_rate": 2.812477111576921e-05, - "loss": 2.3744, - "step": 250880 - }, - { - "epoch": 0.44, - "learning_rate": 2.8123899175842384e-05, - "loss": 2.3456, - "step": 250890 - }, - { - "epoch": 0.44, - "learning_rate": 2.8123027235915554e-05, - "loss": 2.3745, - "step": 250900 - }, - { - "epoch": 0.44, - "learning_rate": 2.8122155295988728e-05, - "loss": 2.3907, - "step": 250910 - }, - { - "epoch": 0.44, - "learning_rate": 2.8121283356061902e-05, - "loss": 2.3744, - "step": 250920 - }, - { - "epoch": 0.44, - "learning_rate": 2.8120411416135072e-05, - "loss": 2.3239, - "step": 250930 - }, - { - "epoch": 0.44, - "learning_rate": 2.811953947620825e-05, - "loss": 2.3716, - "step": 250940 - }, - { - "epoch": 0.44, - "learning_rate": 2.8118667536281423e-05, - "loss": 2.3529, - "step": 250950 - }, - { - "epoch": 0.44, - "learning_rate": 2.8117795596354597e-05, - "loss": 2.3612, - "step": 250960 - }, - { - "epoch": 0.44, - "learning_rate": 2.8116923656427767e-05, - "loss": 2.2948, - "step": 250970 - }, - { - "epoch": 0.44, - "learning_rate": 2.811605171650094e-05, - "loss": 2.3537, - "step": 250980 - }, - { - "epoch": 0.44, - "learning_rate": 2.8115179776574115e-05, - "loss": 2.3536, - "step": 250990 - }, - { - "epoch": 0.44, - "learning_rate": 2.8114307836647285e-05, - "loss": 2.3416, - "step": 251000 - }, - { - "epoch": 0.44, - "learning_rate": 2.8113435896720462e-05, - "loss": 2.2796, - "step": 251010 - }, - { - "epoch": 0.44, - "learning_rate": 2.8112563956793636e-05, - "loss": 2.1598, - "step": 251020 - }, - { - "epoch": 0.44, - "learning_rate": 2.811169201686681e-05, - "loss": 2.3941, - "step": 251030 - }, - { - "epoch": 0.44, - "learning_rate": 2.811082007693998e-05, - "loss": 2.4109, - "step": 251040 - }, - { - "epoch": 0.44, - "learning_rate": 2.8109948137013154e-05, - "loss": 2.3269, - "step": 251050 - }, - { - "epoch": 0.44, - "learning_rate": 2.8109076197086324e-05, - "loss": 2.4919, - "step": 251060 - }, - { - "epoch": 0.44, - "learning_rate": 2.8108204257159498e-05, - "loss": 2.3991, - "step": 251070 - }, - { - "epoch": 0.44, - "learning_rate": 2.8107332317232672e-05, - "loss": 2.3607, - "step": 251080 - }, - { - "epoch": 0.44, - "learning_rate": 2.810646037730585e-05, - "loss": 2.3327, - "step": 251090 - }, - { - "epoch": 0.44, - "learning_rate": 2.8105588437379023e-05, - "loss": 2.4526, - "step": 251100 - }, - { - "epoch": 0.44, - "learning_rate": 2.8104716497452193e-05, - "loss": 2.4055, - "step": 251110 - }, - { - "epoch": 0.44, - "learning_rate": 2.8103844557525367e-05, - "loss": 2.4559, - "step": 251120 - }, - { - "epoch": 0.44, - "learning_rate": 2.8102972617598537e-05, - "loss": 2.3667, - "step": 251130 - }, - { - "epoch": 0.44, - "learning_rate": 2.810210067767171e-05, - "loss": 2.2985, - "step": 251140 - }, - { - "epoch": 0.44, - "learning_rate": 2.8101228737744885e-05, - "loss": 2.4075, - "step": 251150 - }, - { - "epoch": 0.44, - "learning_rate": 2.8100356797818062e-05, - "loss": 2.4902, - "step": 251160 - }, - { - "epoch": 0.44, - "learning_rate": 2.8099484857891232e-05, - "loss": 2.3624, - "step": 251170 - }, - { - "epoch": 0.44, - "learning_rate": 2.8098612917964406e-05, - "loss": 2.3139, - "step": 251180 - }, - { - "epoch": 0.44, - "learning_rate": 2.809774097803758e-05, - "loss": 2.4476, - "step": 251190 - }, - { - "epoch": 0.44, - "learning_rate": 2.809686903811075e-05, - "loss": 2.406, - "step": 251200 - }, - { - "epoch": 0.44, - "learning_rate": 2.8095997098183924e-05, - "loss": 2.4883, - "step": 251210 - }, - { - "epoch": 0.44, - "learning_rate": 2.8095125158257095e-05, - "loss": 2.4377, - "step": 251220 - }, - { - "epoch": 0.44, - "learning_rate": 2.809425321833027e-05, - "loss": 2.3754, - "step": 251230 - }, - { - "epoch": 0.44, - "learning_rate": 2.8093381278403445e-05, - "loss": 2.3678, - "step": 251240 - }, - { - "epoch": 0.44, - "learning_rate": 2.809250933847662e-05, - "loss": 2.4361, - "step": 251250 - }, - { - "epoch": 0.44, - "learning_rate": 2.8091637398549793e-05, - "loss": 2.4963, - "step": 251260 - }, - { - "epoch": 0.44, - "learning_rate": 2.8090765458622963e-05, - "loss": 2.3533, - "step": 251270 - }, - { - "epoch": 0.44, - "learning_rate": 2.8089893518696137e-05, - "loss": 2.3312, - "step": 251280 - }, - { - "epoch": 0.44, - "learning_rate": 2.8089021578769308e-05, - "loss": 2.3356, - "step": 251290 - }, - { - "epoch": 0.44, - "learning_rate": 2.808814963884248e-05, - "loss": 2.4532, - "step": 251300 - }, - { - "epoch": 0.44, - "learning_rate": 2.808727769891566e-05, - "loss": 2.4308, - "step": 251310 - }, - { - "epoch": 0.44, - "learning_rate": 2.8086405758988832e-05, - "loss": 2.4363, - "step": 251320 - }, - { - "epoch": 0.44, - "learning_rate": 2.8085533819062003e-05, - "loss": 2.3676, - "step": 251330 - }, - { - "epoch": 0.44, - "learning_rate": 2.8084661879135176e-05, - "loss": 2.3274, - "step": 251340 - }, - { - "epoch": 0.44, - "learning_rate": 2.808378993920835e-05, - "loss": 2.4045, - "step": 251350 - }, - { - "epoch": 0.44, - "learning_rate": 2.808291799928152e-05, - "loss": 2.3822, - "step": 251360 - }, - { - "epoch": 0.44, - "learning_rate": 2.8082046059354694e-05, - "loss": 2.3902, - "step": 251370 - }, - { - "epoch": 0.44, - "learning_rate": 2.8081174119427868e-05, - "loss": 2.411, - "step": 251380 - }, - { - "epoch": 0.44, - "learning_rate": 2.8080302179501045e-05, - "loss": 2.4034, - "step": 251390 - }, - { - "epoch": 0.44, - "learning_rate": 2.8079430239574216e-05, - "loss": 2.2519, - "step": 251400 - }, - { - "epoch": 0.44, - "learning_rate": 2.807855829964739e-05, - "loss": 2.3523, - "step": 251410 - }, - { - "epoch": 0.44, - "learning_rate": 2.8077686359720563e-05, - "loss": 2.3418, - "step": 251420 - }, - { - "epoch": 0.44, - "learning_rate": 2.8076814419793734e-05, - "loss": 2.3161, - "step": 251430 - }, - { - "epoch": 0.44, - "learning_rate": 2.8075942479866907e-05, - "loss": 2.4225, - "step": 251440 - }, - { - "epoch": 0.44, - "learning_rate": 2.8075070539940078e-05, - "loss": 2.3955, - "step": 251450 - }, - { - "epoch": 0.44, - "learning_rate": 2.8074198600013258e-05, - "loss": 2.2751, - "step": 251460 - }, - { - "epoch": 0.44, - "learning_rate": 2.807332666008643e-05, - "loss": 2.4628, - "step": 251470 - }, - { - "epoch": 0.44, - "learning_rate": 2.8072454720159602e-05, - "loss": 2.2813, - "step": 251480 - }, - { - "epoch": 0.44, - "learning_rate": 2.8071582780232776e-05, - "loss": 2.4014, - "step": 251490 - }, - { - "epoch": 0.44, - "learning_rate": 2.8070710840305947e-05, - "loss": 2.324, - "step": 251500 - }, - { - "epoch": 0.44, - "learning_rate": 2.806983890037912e-05, - "loss": 2.4562, - "step": 251510 - }, - { - "epoch": 0.44, - "learning_rate": 2.806896696045229e-05, - "loss": 2.4011, - "step": 251520 - }, - { - "epoch": 0.44, - "learning_rate": 2.8068095020525464e-05, - "loss": 2.3785, - "step": 251530 - }, - { - "epoch": 0.44, - "learning_rate": 2.806722308059864e-05, - "loss": 2.43, - "step": 251540 - }, - { - "epoch": 0.44, - "learning_rate": 2.8066351140671815e-05, - "loss": 2.4289, - "step": 251550 - }, - { - "epoch": 0.44, - "learning_rate": 2.8065479200744986e-05, - "loss": 2.3036, - "step": 251560 - }, - { - "epoch": 0.44, - "learning_rate": 2.806460726081816e-05, - "loss": 2.234, - "step": 251570 - }, - { - "epoch": 0.44, - "learning_rate": 2.8063735320891333e-05, - "loss": 2.4378, - "step": 251580 - }, - { - "epoch": 0.44, - "learning_rate": 2.8062863380964504e-05, - "loss": 2.4778, - "step": 251590 - }, - { - "epoch": 0.44, - "learning_rate": 2.8061991441037677e-05, - "loss": 2.2756, - "step": 251600 - }, - { - "epoch": 0.44, - "learning_rate": 2.8061119501110855e-05, - "loss": 2.4013, - "step": 251610 - }, - { - "epoch": 0.44, - "learning_rate": 2.806024756118403e-05, - "loss": 2.4779, - "step": 251620 - }, - { - "epoch": 0.44, - "learning_rate": 2.80593756212572e-05, - "loss": 2.4289, - "step": 251630 - }, - { - "epoch": 0.44, - "learning_rate": 2.8058503681330373e-05, - "loss": 2.4476, - "step": 251640 - }, - { - "epoch": 0.44, - "learning_rate": 2.8057631741403546e-05, - "loss": 2.3937, - "step": 251650 - }, - { - "epoch": 0.44, - "learning_rate": 2.8056759801476717e-05, - "loss": 2.2632, - "step": 251660 - }, - { - "epoch": 0.44, - "learning_rate": 2.805588786154989e-05, - "loss": 2.4158, - "step": 251670 - }, - { - "epoch": 0.44, - "learning_rate": 2.8055015921623068e-05, - "loss": 2.4459, - "step": 251680 - }, - { - "epoch": 0.44, - "learning_rate": 2.805414398169624e-05, - "loss": 2.3605, - "step": 251690 - }, - { - "epoch": 0.44, - "learning_rate": 2.8053272041769412e-05, - "loss": 2.4386, - "step": 251700 - }, - { - "epoch": 0.44, - "learning_rate": 2.8052400101842586e-05, - "loss": 2.5348, - "step": 251710 - }, - { - "epoch": 0.44, - "learning_rate": 2.805152816191576e-05, - "loss": 2.2894, - "step": 251720 - }, - { - "epoch": 0.44, - "learning_rate": 2.805065622198893e-05, - "loss": 2.4002, - "step": 251730 - }, - { - "epoch": 0.44, - "learning_rate": 2.8049784282062103e-05, - "loss": 2.41, - "step": 251740 - }, - { - "epoch": 0.44, - "learning_rate": 2.8048912342135274e-05, - "loss": 2.3929, - "step": 251750 - }, - { - "epoch": 0.44, - "learning_rate": 2.8048040402208454e-05, - "loss": 2.3957, - "step": 251760 - }, - { - "epoch": 0.44, - "learning_rate": 2.8047168462281625e-05, - "loss": 2.3754, - "step": 251770 - }, - { - "epoch": 0.44, - "learning_rate": 2.80462965223548e-05, - "loss": 2.2663, - "step": 251780 - }, - { - "epoch": 0.44, - "learning_rate": 2.804542458242797e-05, - "loss": 2.263, - "step": 251790 - }, - { - "epoch": 0.44, - "learning_rate": 2.8044552642501143e-05, - "loss": 2.4132, - "step": 251800 - }, - { - "epoch": 0.44, - "learning_rate": 2.8043680702574316e-05, - "loss": 2.348, - "step": 251810 - }, - { - "epoch": 0.44, - "learning_rate": 2.8042808762647487e-05, - "loss": 2.313, - "step": 251820 - }, - { - "epoch": 0.44, - "learning_rate": 2.8041936822720667e-05, - "loss": 2.354, - "step": 251830 - }, - { - "epoch": 0.44, - "learning_rate": 2.8041064882793838e-05, - "loss": 2.3332, - "step": 251840 - }, - { - "epoch": 0.44, - "learning_rate": 2.804019294286701e-05, - "loss": 2.3926, - "step": 251850 - }, - { - "epoch": 0.44, - "learning_rate": 2.8039321002940182e-05, - "loss": 2.3949, - "step": 251860 - }, - { - "epoch": 0.44, - "learning_rate": 2.8038449063013356e-05, - "loss": 2.4041, - "step": 251870 - }, - { - "epoch": 0.44, - "learning_rate": 2.803757712308653e-05, - "loss": 2.4173, - "step": 251880 - }, - { - "epoch": 0.44, - "learning_rate": 2.80367051831597e-05, - "loss": 2.3757, - "step": 251890 - }, - { - "epoch": 0.44, - "learning_rate": 2.8035833243232874e-05, - "loss": 2.3737, - "step": 251900 - }, - { - "epoch": 0.44, - "learning_rate": 2.803496130330605e-05, - "loss": 2.4748, - "step": 251910 - }, - { - "epoch": 0.44, - "learning_rate": 2.8034089363379225e-05, - "loss": 2.1998, - "step": 251920 - }, - { - "epoch": 0.44, - "learning_rate": 2.8033217423452395e-05, - "loss": 2.3128, - "step": 251930 - }, - { - "epoch": 0.44, - "learning_rate": 2.803234548352557e-05, - "loss": 2.3982, - "step": 251940 - }, - { - "epoch": 0.44, - "learning_rate": 2.803147354359874e-05, - "loss": 2.4231, - "step": 251950 - }, - { - "epoch": 0.44, - "learning_rate": 2.8030601603671913e-05, - "loss": 2.3601, - "step": 251960 - }, - { - "epoch": 0.44, - "learning_rate": 2.8029729663745087e-05, - "loss": 2.3963, - "step": 251970 - }, - { - "epoch": 0.44, - "learning_rate": 2.8028857723818264e-05, - "loss": 2.4489, - "step": 251980 - }, - { - "epoch": 0.44, - "learning_rate": 2.8027985783891438e-05, - "loss": 2.3805, - "step": 251990 - }, - { - "epoch": 0.44, - "learning_rate": 2.8027113843964608e-05, - "loss": 2.3272, - "step": 252000 - }, - { - "epoch": 0.44, - "learning_rate": 2.8026241904037782e-05, - "loss": 2.4034, - "step": 252010 - }, - { - "epoch": 0.44, - "learning_rate": 2.8025369964110952e-05, - "loss": 2.3077, - "step": 252020 - }, - { - "epoch": 0.44, - "learning_rate": 2.8024498024184126e-05, - "loss": 2.4061, - "step": 252030 - }, - { - "epoch": 0.44, - "learning_rate": 2.80236260842573e-05, - "loss": 2.4026, - "step": 252040 - }, - { - "epoch": 0.44, - "learning_rate": 2.802275414433047e-05, - "loss": 2.3885, - "step": 252050 - }, - { - "epoch": 0.44, - "learning_rate": 2.8021882204403647e-05, - "loss": 2.4024, - "step": 252060 - }, - { - "epoch": 0.44, - "learning_rate": 2.802101026447682e-05, - "loss": 2.5136, - "step": 252070 - }, - { - "epoch": 0.44, - "learning_rate": 2.8020138324549995e-05, - "loss": 2.3906, - "step": 252080 - }, - { - "epoch": 0.44, - "learning_rate": 2.8019266384623165e-05, - "loss": 2.3702, - "step": 252090 - }, - { - "epoch": 0.44, - "learning_rate": 2.801839444469634e-05, - "loss": 2.3901, - "step": 252100 - }, - { - "epoch": 0.44, - "learning_rate": 2.8017522504769513e-05, - "loss": 2.3298, - "step": 252110 - }, - { - "epoch": 0.44, - "learning_rate": 2.8016650564842683e-05, - "loss": 2.456, - "step": 252120 - }, - { - "epoch": 0.44, - "learning_rate": 2.801577862491586e-05, - "loss": 2.4105, - "step": 252130 - }, - { - "epoch": 0.44, - "learning_rate": 2.8014906684989034e-05, - "loss": 2.3389, - "step": 252140 - }, - { - "epoch": 0.44, - "learning_rate": 2.8014034745062208e-05, - "loss": 2.2879, - "step": 252150 - }, - { - "epoch": 0.44, - "learning_rate": 2.8013162805135378e-05, - "loss": 2.3225, - "step": 252160 - }, - { - "epoch": 0.44, - "learning_rate": 2.8012290865208552e-05, - "loss": 2.3801, - "step": 252170 - }, - { - "epoch": 0.44, - "learning_rate": 2.8011418925281722e-05, - "loss": 2.5363, - "step": 252180 - }, - { - "epoch": 0.44, - "learning_rate": 2.8010546985354896e-05, - "loss": 2.3707, - "step": 252190 - }, - { - "epoch": 0.44, - "learning_rate": 2.8009675045428073e-05, - "loss": 2.2859, - "step": 252200 - }, - { - "epoch": 0.44, - "learning_rate": 2.8008803105501247e-05, - "loss": 2.2788, - "step": 252210 - }, - { - "epoch": 0.44, - "learning_rate": 2.800793116557442e-05, - "loss": 2.3235, - "step": 252220 - }, - { - "epoch": 0.44, - "learning_rate": 2.800705922564759e-05, - "loss": 2.3716, - "step": 252230 - }, - { - "epoch": 0.44, - "learning_rate": 2.8006187285720765e-05, - "loss": 2.3452, - "step": 252240 - }, - { - "epoch": 0.44, - "learning_rate": 2.8005315345793935e-05, - "loss": 2.3842, - "step": 252250 - }, - { - "epoch": 0.44, - "learning_rate": 2.800444340586711e-05, - "loss": 2.4005, - "step": 252260 - }, - { - "epoch": 0.44, - "learning_rate": 2.8003571465940283e-05, - "loss": 2.3521, - "step": 252270 - }, - { - "epoch": 0.44, - "learning_rate": 2.800269952601346e-05, - "loss": 2.3703, - "step": 252280 - }, - { - "epoch": 0.44, - "learning_rate": 2.800182758608663e-05, - "loss": 2.4675, - "step": 252290 - }, - { - "epoch": 0.44, - "learning_rate": 2.8000955646159804e-05, - "loss": 2.404, - "step": 252300 - }, - { - "epoch": 0.44, - "learning_rate": 2.8000083706232978e-05, - "loss": 2.4154, - "step": 252310 - }, - { - "epoch": 0.44, - "learning_rate": 2.7999211766306148e-05, - "loss": 2.3558, - "step": 252320 - }, - { - "epoch": 0.44, - "learning_rate": 2.7998339826379322e-05, - "loss": 2.4599, - "step": 252330 - }, - { - "epoch": 0.44, - "learning_rate": 2.7997467886452496e-05, - "loss": 2.337, - "step": 252340 - }, - { - "epoch": 0.44, - "learning_rate": 2.7996595946525673e-05, - "loss": 2.2892, - "step": 252350 - }, - { - "epoch": 0.44, - "learning_rate": 2.7995724006598843e-05, - "loss": 2.4715, - "step": 252360 - }, - { - "epoch": 0.44, - "learning_rate": 2.7994852066672017e-05, - "loss": 2.2382, - "step": 252370 - }, - { - "epoch": 0.44, - "learning_rate": 2.799398012674519e-05, - "loss": 2.4403, - "step": 252380 - }, - { - "epoch": 0.44, - "learning_rate": 2.799310818681836e-05, - "loss": 2.2983, - "step": 252390 - }, - { - "epoch": 0.44, - "learning_rate": 2.7992236246891535e-05, - "loss": 2.4681, - "step": 252400 - }, - { - "epoch": 0.44, - "learning_rate": 2.7991364306964705e-05, - "loss": 2.3082, - "step": 252410 - }, - { - "epoch": 0.44, - "learning_rate": 2.799049236703788e-05, - "loss": 2.4649, - "step": 252420 - }, - { - "epoch": 0.44, - "learning_rate": 2.7989620427111056e-05, - "loss": 2.3244, - "step": 252430 - }, - { - "epoch": 0.44, - "learning_rate": 2.798874848718423e-05, - "loss": 2.4487, - "step": 252440 - }, - { - "epoch": 0.44, - "learning_rate": 2.7987876547257404e-05, - "loss": 2.3717, - "step": 252450 - }, - { - "epoch": 0.44, - "learning_rate": 2.7987004607330574e-05, - "loss": 2.3927, - "step": 252460 - }, - { - "epoch": 0.44, - "learning_rate": 2.7986132667403748e-05, - "loss": 2.4354, - "step": 252470 - }, - { - "epoch": 0.44, - "learning_rate": 2.798526072747692e-05, - "loss": 2.4476, - "step": 252480 - }, - { - "epoch": 0.44, - "learning_rate": 2.7984388787550092e-05, - "loss": 2.3703, - "step": 252490 - }, - { - "epoch": 0.44, - "learning_rate": 2.798351684762327e-05, - "loss": 2.4411, - "step": 252500 - }, - { - "epoch": 0.44, - "learning_rate": 2.7982644907696443e-05, - "loss": 2.4613, - "step": 252510 - }, - { - "epoch": 0.44, - "learning_rate": 2.7981772967769613e-05, - "loss": 2.3301, - "step": 252520 - }, - { - "epoch": 0.44, - "learning_rate": 2.7980901027842787e-05, - "loss": 2.4951, - "step": 252530 - }, - { - "epoch": 0.44, - "learning_rate": 2.798002908791596e-05, - "loss": 2.3589, - "step": 252540 - }, - { - "epoch": 0.44, - "learning_rate": 2.797915714798913e-05, - "loss": 2.3965, - "step": 252550 - }, - { - "epoch": 0.44, - "learning_rate": 2.7978285208062305e-05, - "loss": 2.303, - "step": 252560 - }, - { - "epoch": 0.44, - "learning_rate": 2.7977413268135476e-05, - "loss": 2.2844, - "step": 252570 - }, - { - "epoch": 0.44, - "learning_rate": 2.7976541328208656e-05, - "loss": 2.3835, - "step": 252580 - }, - { - "epoch": 0.44, - "learning_rate": 2.7975669388281826e-05, - "loss": 2.3843, - "step": 252590 - }, - { - "epoch": 0.44, - "learning_rate": 2.7974797448355e-05, - "loss": 2.3619, - "step": 252600 - }, - { - "epoch": 0.44, - "learning_rate": 2.7973925508428174e-05, - "loss": 2.3819, - "step": 252610 - }, - { - "epoch": 0.44, - "learning_rate": 2.7973053568501344e-05, - "loss": 2.3811, - "step": 252620 - }, - { - "epoch": 0.44, - "learning_rate": 2.7972181628574518e-05, - "loss": 2.4021, - "step": 252630 - }, - { - "epoch": 0.44, - "learning_rate": 2.797130968864769e-05, - "loss": 2.381, - "step": 252640 - }, - { - "epoch": 0.44, - "learning_rate": 2.797043774872087e-05, - "loss": 2.4214, - "step": 252650 - }, - { - "epoch": 0.44, - "learning_rate": 2.796956580879404e-05, - "loss": 2.4281, - "step": 252660 - }, - { - "epoch": 0.44, - "learning_rate": 2.7968693868867213e-05, - "loss": 2.5293, - "step": 252670 - }, - { - "epoch": 0.44, - "learning_rate": 2.7967821928940384e-05, - "loss": 2.4871, - "step": 252680 - }, - { - "epoch": 0.44, - "learning_rate": 2.7966949989013557e-05, - "loss": 2.3632, - "step": 252690 - }, - { - "epoch": 0.44, - "learning_rate": 2.796607804908673e-05, - "loss": 2.433, - "step": 252700 - }, - { - "epoch": 0.44, - "learning_rate": 2.79652061091599e-05, - "loss": 2.2376, - "step": 252710 - }, - { - "epoch": 0.44, - "learning_rate": 2.7964334169233075e-05, - "loss": 2.4449, - "step": 252720 - }, - { - "epoch": 0.44, - "learning_rate": 2.7963462229306252e-05, - "loss": 2.3139, - "step": 252730 - }, - { - "epoch": 0.44, - "learning_rate": 2.7962590289379426e-05, - "loss": 2.3087, - "step": 252740 - }, - { - "epoch": 0.44, - "learning_rate": 2.7961718349452597e-05, - "loss": 2.3744, - "step": 252750 - }, - { - "epoch": 0.44, - "learning_rate": 2.796084640952577e-05, - "loss": 2.2595, - "step": 252760 - }, - { - "epoch": 0.44, - "learning_rate": 2.7959974469598944e-05, - "loss": 2.4185, - "step": 252770 - }, - { - "epoch": 0.44, - "learning_rate": 2.7959102529672115e-05, - "loss": 2.4459, - "step": 252780 - }, - { - "epoch": 0.44, - "learning_rate": 2.795823058974529e-05, - "loss": 2.3861, - "step": 252790 - }, - { - "epoch": 0.44, - "learning_rate": 2.7957358649818466e-05, - "loss": 2.2961, - "step": 252800 - }, - { - "epoch": 0.44, - "learning_rate": 2.795648670989164e-05, - "loss": 2.4259, - "step": 252810 - }, - { - "epoch": 0.44, - "learning_rate": 2.795561476996481e-05, - "loss": 2.3727, - "step": 252820 - }, - { - "epoch": 0.44, - "learning_rate": 2.7954742830037983e-05, - "loss": 2.3013, - "step": 252830 - }, - { - "epoch": 0.44, - "learning_rate": 2.7953870890111157e-05, - "loss": 2.455, - "step": 252840 - }, - { - "epoch": 0.44, - "learning_rate": 2.7952998950184328e-05, - "loss": 2.3217, - "step": 252850 - }, - { - "epoch": 0.44, - "learning_rate": 2.79521270102575e-05, - "loss": 2.3621, - "step": 252860 - }, - { - "epoch": 0.44, - "learning_rate": 2.795125507033068e-05, - "loss": 2.4164, - "step": 252870 - }, - { - "epoch": 0.44, - "learning_rate": 2.7950383130403852e-05, - "loss": 2.3609, - "step": 252880 - }, - { - "epoch": 0.44, - "learning_rate": 2.7949511190477023e-05, - "loss": 2.2224, - "step": 252890 - }, - { - "epoch": 0.44, - "learning_rate": 2.7948639250550196e-05, - "loss": 2.4953, - "step": 252900 - }, - { - "epoch": 0.44, - "learning_rate": 2.7947767310623367e-05, - "loss": 2.3584, - "step": 252910 - }, - { - "epoch": 0.44, - "learning_rate": 2.794689537069654e-05, - "loss": 2.2805, - "step": 252920 - }, - { - "epoch": 0.44, - "learning_rate": 2.7946023430769714e-05, - "loss": 2.3276, - "step": 252930 - }, - { - "epoch": 0.44, - "learning_rate": 2.7945151490842885e-05, - "loss": 2.3945, - "step": 252940 - }, - { - "epoch": 0.44, - "learning_rate": 2.7944279550916065e-05, - "loss": 2.3548, - "step": 252950 - }, - { - "epoch": 0.44, - "learning_rate": 2.7943407610989236e-05, - "loss": 2.4061, - "step": 252960 - }, - { - "epoch": 0.44, - "learning_rate": 2.794253567106241e-05, - "loss": 2.3883, - "step": 252970 - }, - { - "epoch": 0.44, - "learning_rate": 2.794166373113558e-05, - "loss": 2.4618, - "step": 252980 - }, - { - "epoch": 0.44, - "learning_rate": 2.7940791791208754e-05, - "loss": 2.3111, - "step": 252990 - }, - { - "epoch": 0.44, - "learning_rate": 2.7939919851281927e-05, - "loss": 2.4725, - "step": 253000 - }, - { - "epoch": 0.44, - "learning_rate": 2.7939047911355098e-05, - "loss": 2.4055, - "step": 253010 - }, - { - "epoch": 0.44, - "learning_rate": 2.7938175971428275e-05, - "loss": 2.3291, - "step": 253020 - }, - { - "epoch": 0.44, - "learning_rate": 2.793730403150145e-05, - "loss": 2.3875, - "step": 253030 - }, - { - "epoch": 0.44, - "learning_rate": 2.7936432091574622e-05, - "loss": 2.3455, - "step": 253040 - }, - { - "epoch": 0.44, - "learning_rate": 2.7935560151647793e-05, - "loss": 2.2478, - "step": 253050 - }, - { - "epoch": 0.44, - "learning_rate": 2.7934688211720967e-05, - "loss": 2.2531, - "step": 253060 - }, - { - "epoch": 0.44, - "learning_rate": 2.793381627179414e-05, - "loss": 2.4143, - "step": 253070 - }, - { - "epoch": 0.44, - "learning_rate": 2.793294433186731e-05, - "loss": 2.4918, - "step": 253080 - }, - { - "epoch": 0.44, - "learning_rate": 2.7932072391940484e-05, - "loss": 2.3475, - "step": 253090 - }, - { - "epoch": 0.44, - "learning_rate": 2.793120045201366e-05, - "loss": 2.4201, - "step": 253100 - }, - { - "epoch": 0.44, - "learning_rate": 2.7930328512086835e-05, - "loss": 2.3384, - "step": 253110 - }, - { - "epoch": 0.44, - "learning_rate": 2.7929456572160006e-05, - "loss": 2.4081, - "step": 253120 - }, - { - "epoch": 0.44, - "learning_rate": 2.792858463223318e-05, - "loss": 2.3123, - "step": 253130 - }, - { - "epoch": 0.44, - "learning_rate": 2.792771269230635e-05, - "loss": 2.4216, - "step": 253140 - }, - { - "epoch": 0.44, - "learning_rate": 2.7926840752379524e-05, - "loss": 2.4099, - "step": 253150 - }, - { - "epoch": 0.44, - "learning_rate": 2.7925968812452697e-05, - "loss": 2.4541, - "step": 253160 - }, - { - "epoch": 0.44, - "learning_rate": 2.7925096872525875e-05, - "loss": 2.3362, - "step": 253170 - }, - { - "epoch": 0.44, - "learning_rate": 2.792422493259905e-05, - "loss": 2.3136, - "step": 253180 - }, - { - "epoch": 0.44, - "learning_rate": 2.792335299267222e-05, - "loss": 2.3909, - "step": 253190 - }, - { - "epoch": 0.44, - "learning_rate": 2.7922481052745393e-05, - "loss": 2.2755, - "step": 253200 - }, - { - "epoch": 0.44, - "learning_rate": 2.7921609112818563e-05, - "loss": 2.3424, - "step": 253210 - }, - { - "epoch": 0.44, - "learning_rate": 2.7920737172891737e-05, - "loss": 2.253, - "step": 253220 - }, - { - "epoch": 0.44, - "learning_rate": 2.791986523296491e-05, - "loss": 2.4602, - "step": 253230 - }, - { - "epoch": 0.44, - "learning_rate": 2.791899329303808e-05, - "loss": 2.2618, - "step": 253240 - }, - { - "epoch": 0.44, - "learning_rate": 2.7918121353111258e-05, - "loss": 2.3649, - "step": 253250 - }, - { - "epoch": 0.44, - "learning_rate": 2.7917249413184432e-05, - "loss": 2.3618, - "step": 253260 - }, - { - "epoch": 0.44, - "learning_rate": 2.7916377473257606e-05, - "loss": 2.3909, - "step": 253270 - }, - { - "epoch": 0.44, - "learning_rate": 2.7915505533330776e-05, - "loss": 2.3346, - "step": 253280 - }, - { - "epoch": 0.44, - "learning_rate": 2.791463359340395e-05, - "loss": 2.3196, - "step": 253290 - }, - { - "epoch": 0.44, - "learning_rate": 2.791376165347712e-05, - "loss": 2.3897, - "step": 253300 - }, - { - "epoch": 0.44, - "learning_rate": 2.7912889713550294e-05, - "loss": 2.2841, - "step": 253310 - }, - { - "epoch": 0.44, - "learning_rate": 2.791201777362347e-05, - "loss": 2.5143, - "step": 253320 - }, - { - "epoch": 0.44, - "learning_rate": 2.7911145833696645e-05, - "loss": 2.3907, - "step": 253330 - }, - { - "epoch": 0.44, - "learning_rate": 2.791027389376982e-05, - "loss": 2.4014, - "step": 253340 - }, - { - "epoch": 0.44, - "learning_rate": 2.790940195384299e-05, - "loss": 2.3574, - "step": 253350 - }, - { - "epoch": 0.44, - "learning_rate": 2.7908530013916163e-05, - "loss": 2.3802, - "step": 253360 - }, - { - "epoch": 0.44, - "learning_rate": 2.7907658073989333e-05, - "loss": 2.4666, - "step": 253370 - }, - { - "epoch": 0.44, - "learning_rate": 2.7906786134062507e-05, - "loss": 2.2977, - "step": 253380 - }, - { - "epoch": 0.44, - "learning_rate": 2.790591419413568e-05, - "loss": 2.325, - "step": 253390 - }, - { - "epoch": 0.44, - "learning_rate": 2.7905042254208858e-05, - "loss": 2.3386, - "step": 253400 - }, - { - "epoch": 0.44, - "learning_rate": 2.7904170314282028e-05, - "loss": 2.4159, - "step": 253410 - }, - { - "epoch": 0.44, - "learning_rate": 2.7903298374355202e-05, - "loss": 2.3303, - "step": 253420 - }, - { - "epoch": 0.44, - "learning_rate": 2.7902426434428376e-05, - "loss": 2.43, - "step": 253430 - }, - { - "epoch": 0.44, - "learning_rate": 2.7901554494501546e-05, - "loss": 2.345, - "step": 253440 - }, - { - "epoch": 0.44, - "learning_rate": 2.790068255457472e-05, - "loss": 2.4161, - "step": 253450 - }, - { - "epoch": 0.44, - "learning_rate": 2.7899810614647894e-05, - "loss": 2.4638, - "step": 253460 - }, - { - "epoch": 0.44, - "learning_rate": 2.789893867472107e-05, - "loss": 2.4566, - "step": 253470 - }, - { - "epoch": 0.44, - "learning_rate": 2.789806673479424e-05, - "loss": 2.3846, - "step": 253480 - }, - { - "epoch": 0.44, - "learning_rate": 2.7897194794867415e-05, - "loss": 2.4392, - "step": 253490 - }, - { - "epoch": 0.44, - "learning_rate": 2.789632285494059e-05, - "loss": 2.3946, - "step": 253500 - }, - { - "epoch": 0.44, - "learning_rate": 2.789545091501376e-05, - "loss": 2.3398, - "step": 253510 - }, - { - "epoch": 0.44, - "learning_rate": 2.7894578975086933e-05, - "loss": 2.2993, - "step": 253520 - }, - { - "epoch": 0.44, - "learning_rate": 2.7893707035160103e-05, - "loss": 2.3719, - "step": 253530 - }, - { - "epoch": 0.44, - "learning_rate": 2.7892835095233284e-05, - "loss": 2.3123, - "step": 253540 - }, - { - "epoch": 0.44, - "learning_rate": 2.7891963155306454e-05, - "loss": 2.4793, - "step": 253550 - }, - { - "epoch": 0.44, - "learning_rate": 2.7891091215379628e-05, - "loss": 2.4993, - "step": 253560 - }, - { - "epoch": 0.44, - "learning_rate": 2.7890219275452802e-05, - "loss": 2.4228, - "step": 253570 - }, - { - "epoch": 0.44, - "learning_rate": 2.7889347335525972e-05, - "loss": 2.4126, - "step": 253580 - }, - { - "epoch": 0.44, - "learning_rate": 2.7888475395599146e-05, - "loss": 2.4234, - "step": 253590 - }, - { - "epoch": 0.44, - "learning_rate": 2.7887603455672316e-05, - "loss": 2.4589, - "step": 253600 - }, - { - "epoch": 0.44, - "learning_rate": 2.788673151574549e-05, - "loss": 2.4502, - "step": 253610 - }, - { - "epoch": 0.44, - "learning_rate": 2.7885859575818667e-05, - "loss": 2.4486, - "step": 253620 - }, - { - "epoch": 0.44, - "learning_rate": 2.788498763589184e-05, - "loss": 2.3778, - "step": 253630 - }, - { - "epoch": 0.44, - "learning_rate": 2.788411569596501e-05, - "loss": 2.3555, - "step": 253640 - }, - { - "epoch": 0.44, - "learning_rate": 2.7883243756038185e-05, - "loss": 2.2546, - "step": 253650 - }, - { - "epoch": 0.44, - "learning_rate": 2.788237181611136e-05, - "loss": 2.371, - "step": 253660 - }, - { - "epoch": 0.44, - "learning_rate": 2.788149987618453e-05, - "loss": 2.2535, - "step": 253670 - }, - { - "epoch": 0.44, - "learning_rate": 2.7880627936257703e-05, - "loss": 2.2754, - "step": 253680 - }, - { - "epoch": 0.44, - "learning_rate": 2.787975599633088e-05, - "loss": 2.4369, - "step": 253690 - }, - { - "epoch": 0.44, - "learning_rate": 2.7878884056404054e-05, - "loss": 2.4667, - "step": 253700 - }, - { - "epoch": 0.44, - "learning_rate": 2.7878012116477224e-05, - "loss": 2.3364, - "step": 253710 - }, - { - "epoch": 0.44, - "learning_rate": 2.7877140176550398e-05, - "loss": 2.3633, - "step": 253720 - }, - { - "epoch": 0.44, - "learning_rate": 2.7876268236623572e-05, - "loss": 2.4322, - "step": 253730 - }, - { - "epoch": 0.44, - "learning_rate": 2.7875396296696742e-05, - "loss": 2.4737, - "step": 253740 - }, - { - "epoch": 0.44, - "learning_rate": 2.7874524356769916e-05, - "loss": 2.3413, - "step": 253750 - }, - { - "epoch": 0.44, - "learning_rate": 2.7873652416843086e-05, - "loss": 2.4138, - "step": 253760 - }, - { - "epoch": 0.44, - "learning_rate": 2.7872780476916267e-05, - "loss": 2.2766, - "step": 253770 - }, - { - "epoch": 0.44, - "learning_rate": 2.7871908536989437e-05, - "loss": 2.3735, - "step": 253780 - }, - { - "epoch": 0.44, - "learning_rate": 2.787103659706261e-05, - "loss": 2.3712, - "step": 253790 - }, - { - "epoch": 0.44, - "learning_rate": 2.7870164657135785e-05, - "loss": 2.3357, - "step": 253800 - }, - { - "epoch": 0.44, - "learning_rate": 2.7869292717208955e-05, - "loss": 2.4494, - "step": 253810 - }, - { - "epoch": 0.44, - "learning_rate": 2.786842077728213e-05, - "loss": 2.3612, - "step": 253820 - }, - { - "epoch": 0.44, - "learning_rate": 2.78675488373553e-05, - "loss": 2.4451, - "step": 253830 - }, - { - "epoch": 0.44, - "learning_rate": 2.786667689742848e-05, - "loss": 2.2992, - "step": 253840 - }, - { - "epoch": 0.44, - "learning_rate": 2.786580495750165e-05, - "loss": 2.379, - "step": 253850 - }, - { - "epoch": 0.44, - "learning_rate": 2.7864933017574824e-05, - "loss": 2.299, - "step": 253860 - }, - { - "epoch": 0.44, - "learning_rate": 2.7864061077647995e-05, - "loss": 2.4501, - "step": 253870 - }, - { - "epoch": 0.44, - "learning_rate": 2.7863189137721168e-05, - "loss": 2.3457, - "step": 253880 - }, - { - "epoch": 0.44, - "learning_rate": 2.7862317197794342e-05, - "loss": 2.3343, - "step": 253890 - }, - { - "epoch": 0.44, - "learning_rate": 2.7861445257867512e-05, - "loss": 2.4601, - "step": 253900 - }, - { - "epoch": 0.44, - "learning_rate": 2.7860573317940686e-05, - "loss": 2.3991, - "step": 253910 - }, - { - "epoch": 0.44, - "learning_rate": 2.7859701378013863e-05, - "loss": 2.3811, - "step": 253920 - }, - { - "epoch": 0.44, - "learning_rate": 2.7858829438087037e-05, - "loss": 2.477, - "step": 253930 - }, - { - "epoch": 0.44, - "learning_rate": 2.7857957498160208e-05, - "loss": 2.3679, - "step": 253940 - }, - { - "epoch": 0.44, - "learning_rate": 2.785708555823338e-05, - "loss": 2.3116, - "step": 253950 - }, - { - "epoch": 0.44, - "learning_rate": 2.7856213618306555e-05, - "loss": 2.3504, - "step": 253960 - }, - { - "epoch": 0.44, - "learning_rate": 2.7855341678379725e-05, - "loss": 2.4954, - "step": 253970 - }, - { - "epoch": 0.44, - "learning_rate": 2.78544697384529e-05, - "loss": 2.3926, - "step": 253980 - }, - { - "epoch": 0.44, - "learning_rate": 2.7853597798526076e-05, - "loss": 2.3871, - "step": 253990 - }, - { - "epoch": 0.44, - "learning_rate": 2.785272585859925e-05, - "loss": 2.3618, - "step": 254000 - }, - { - "epoch": 0.44, - "learning_rate": 2.785185391867242e-05, - "loss": 2.4318, - "step": 254010 - }, - { - "epoch": 0.44, - "learning_rate": 2.7850981978745594e-05, - "loss": 2.2959, - "step": 254020 - }, - { - "epoch": 0.44, - "learning_rate": 2.7850110038818765e-05, - "loss": 2.2827, - "step": 254030 - }, - { - "epoch": 0.44, - "learning_rate": 2.784923809889194e-05, - "loss": 2.4988, - "step": 254040 - }, - { - "epoch": 0.44, - "learning_rate": 2.7848366158965112e-05, - "loss": 2.4331, - "step": 254050 - }, - { - "epoch": 0.44, - "learning_rate": 2.7847494219038283e-05, - "loss": 2.4791, - "step": 254060 - }, - { - "epoch": 0.44, - "learning_rate": 2.7846622279111463e-05, - "loss": 2.2758, - "step": 254070 - }, - { - "epoch": 0.44, - "learning_rate": 2.7845750339184634e-05, - "loss": 2.4256, - "step": 254080 - }, - { - "epoch": 0.44, - "learning_rate": 2.7844878399257807e-05, - "loss": 2.351, - "step": 254090 - }, - { - "epoch": 0.44, - "learning_rate": 2.7844006459330978e-05, - "loss": 2.2288, - "step": 254100 - }, - { - "epoch": 0.44, - "learning_rate": 2.784313451940415e-05, - "loss": 2.4971, - "step": 254110 - }, - { - "epoch": 0.44, - "learning_rate": 2.7842262579477325e-05, - "loss": 2.3977, - "step": 254120 - }, - { - "epoch": 0.44, - "learning_rate": 2.7841390639550496e-05, - "loss": 2.3597, - "step": 254130 - }, - { - "epoch": 0.44, - "learning_rate": 2.7840518699623673e-05, - "loss": 2.3695, - "step": 254140 - }, - { - "epoch": 0.44, - "learning_rate": 2.7839646759696847e-05, - "loss": 2.2908, - "step": 254150 - }, - { - "epoch": 0.44, - "learning_rate": 2.783877481977002e-05, - "loss": 2.3935, - "step": 254160 - }, - { - "epoch": 0.44, - "learning_rate": 2.783790287984319e-05, - "loss": 2.4235, - "step": 254170 - }, - { - "epoch": 0.44, - "learning_rate": 2.7837030939916364e-05, - "loss": 2.454, - "step": 254180 - }, - { - "epoch": 0.44, - "learning_rate": 2.7836158999989538e-05, - "loss": 2.4713, - "step": 254190 - }, - { - "epoch": 0.44, - "learning_rate": 2.783528706006271e-05, - "loss": 2.419, - "step": 254200 - }, - { - "epoch": 0.44, - "learning_rate": 2.7834415120135886e-05, - "loss": 2.243, - "step": 254210 - }, - { - "epoch": 0.44, - "learning_rate": 2.783354318020906e-05, - "loss": 2.2918, - "step": 254220 - }, - { - "epoch": 0.44, - "learning_rate": 2.7832671240282233e-05, - "loss": 2.3447, - "step": 254230 - }, - { - "epoch": 0.44, - "learning_rate": 2.7831799300355404e-05, - "loss": 2.4251, - "step": 254240 - }, - { - "epoch": 0.44, - "learning_rate": 2.7830927360428577e-05, - "loss": 2.4489, - "step": 254250 - }, - { - "epoch": 0.44, - "learning_rate": 2.7830055420501748e-05, - "loss": 2.3353, - "step": 254260 - }, - { - "epoch": 0.44, - "learning_rate": 2.782918348057492e-05, - "loss": 2.4211, - "step": 254270 - }, - { - "epoch": 0.44, - "learning_rate": 2.7828311540648095e-05, - "loss": 2.4775, - "step": 254280 - }, - { - "epoch": 0.44, - "learning_rate": 2.7827439600721273e-05, - "loss": 2.4081, - "step": 254290 - }, - { - "epoch": 0.44, - "learning_rate": 2.7826567660794446e-05, - "loss": 2.3604, - "step": 254300 - }, - { - "epoch": 0.44, - "learning_rate": 2.7825695720867617e-05, - "loss": 2.3533, - "step": 254310 - }, - { - "epoch": 0.44, - "learning_rate": 2.782482378094079e-05, - "loss": 2.4634, - "step": 254320 - }, - { - "epoch": 0.44, - "learning_rate": 2.782395184101396e-05, - "loss": 2.4165, - "step": 254330 - }, - { - "epoch": 0.44, - "learning_rate": 2.7823079901087135e-05, - "loss": 2.3333, - "step": 254340 - }, - { - "epoch": 0.44, - "learning_rate": 2.782220796116031e-05, - "loss": 2.3115, - "step": 254350 - }, - { - "epoch": 0.44, - "learning_rate": 2.7821336021233486e-05, - "loss": 2.3354, - "step": 254360 - }, - { - "epoch": 0.44, - "learning_rate": 2.7820464081306656e-05, - "loss": 2.3869, - "step": 254370 - }, - { - "epoch": 0.44, - "learning_rate": 2.781959214137983e-05, - "loss": 2.3917, - "step": 254380 - }, - { - "epoch": 0.44, - "learning_rate": 2.7818720201453003e-05, - "loss": 2.4059, - "step": 254390 - }, - { - "epoch": 0.44, - "learning_rate": 2.7817848261526174e-05, - "loss": 2.4696, - "step": 254400 - }, - { - "epoch": 0.44, - "learning_rate": 2.7816976321599348e-05, - "loss": 2.4153, - "step": 254410 - }, - { - "epoch": 0.44, - "learning_rate": 2.781610438167252e-05, - "loss": 2.2645, - "step": 254420 - }, - { - "epoch": 0.44, - "learning_rate": 2.7815232441745692e-05, - "loss": 2.4301, - "step": 254430 - }, - { - "epoch": 0.44, - "learning_rate": 2.781436050181887e-05, - "loss": 2.4772, - "step": 254440 - }, - { - "epoch": 0.44, - "learning_rate": 2.7813488561892043e-05, - "loss": 2.2635, - "step": 254450 - }, - { - "epoch": 0.44, - "learning_rate": 2.7812616621965216e-05, - "loss": 2.4847, - "step": 254460 - }, - { - "epoch": 0.44, - "learning_rate": 2.7811744682038387e-05, - "loss": 2.466, - "step": 254470 - }, - { - "epoch": 0.44, - "learning_rate": 2.781087274211156e-05, - "loss": 2.2566, - "step": 254480 - }, - { - "epoch": 0.44, - "learning_rate": 2.781000080218473e-05, - "loss": 2.4071, - "step": 254490 - }, - { - "epoch": 0.44, - "learning_rate": 2.7809128862257905e-05, - "loss": 2.4377, - "step": 254500 - }, - { - "epoch": 0.44, - "learning_rate": 2.7808256922331082e-05, - "loss": 2.496, - "step": 254510 - }, - { - "epoch": 0.44, - "learning_rate": 2.7807384982404256e-05, - "loss": 2.3797, - "step": 254520 - }, - { - "epoch": 0.44, - "learning_rate": 2.780651304247743e-05, - "loss": 2.3672, - "step": 254530 - }, - { - "epoch": 0.44, - "learning_rate": 2.78056411025506e-05, - "loss": 2.4311, - "step": 254540 - }, - { - "epoch": 0.44, - "learning_rate": 2.7804769162623774e-05, - "loss": 2.5014, - "step": 254550 - }, - { - "epoch": 0.44, - "learning_rate": 2.7803897222696944e-05, - "loss": 2.4056, - "step": 254560 - }, - { - "epoch": 0.44, - "learning_rate": 2.7803025282770118e-05, - "loss": 2.3525, - "step": 254570 - }, - { - "epoch": 0.44, - "learning_rate": 2.780215334284329e-05, - "loss": 2.438, - "step": 254580 - }, - { - "epoch": 0.44, - "learning_rate": 2.780128140291647e-05, - "loss": 2.3297, - "step": 254590 - }, - { - "epoch": 0.44, - "learning_rate": 2.780040946298964e-05, - "loss": 2.4038, - "step": 254600 - }, - { - "epoch": 0.44, - "learning_rate": 2.7799537523062813e-05, - "loss": 2.4223, - "step": 254610 - }, - { - "epoch": 0.44, - "learning_rate": 2.7798665583135987e-05, - "loss": 2.2514, - "step": 254620 - }, - { - "epoch": 0.44, - "learning_rate": 2.7797793643209157e-05, - "loss": 2.3068, - "step": 254630 - }, - { - "epoch": 0.44, - "learning_rate": 2.779692170328233e-05, - "loss": 2.3871, - "step": 254640 - }, - { - "epoch": 0.44, - "learning_rate": 2.77960497633555e-05, - "loss": 2.4723, - "step": 254650 - }, - { - "epoch": 0.44, - "learning_rate": 2.779517782342868e-05, - "loss": 2.2598, - "step": 254660 - }, - { - "epoch": 0.44, - "learning_rate": 2.7794305883501852e-05, - "loss": 2.3702, - "step": 254670 - }, - { - "epoch": 0.44, - "learning_rate": 2.7793433943575026e-05, - "loss": 2.4173, - "step": 254680 - }, - { - "epoch": 0.44, - "learning_rate": 2.77925620036482e-05, - "loss": 2.4696, - "step": 254690 - }, - { - "epoch": 0.44, - "learning_rate": 2.779169006372137e-05, - "loss": 2.415, - "step": 254700 - }, - { - "epoch": 0.44, - "learning_rate": 2.7790818123794544e-05, - "loss": 2.297, - "step": 254710 - }, - { - "epoch": 0.44, - "learning_rate": 2.7789946183867714e-05, - "loss": 2.3732, - "step": 254720 - }, - { - "epoch": 0.44, - "learning_rate": 2.7789074243940895e-05, - "loss": 2.2799, - "step": 254730 - }, - { - "epoch": 0.44, - "learning_rate": 2.7788202304014065e-05, - "loss": 2.4427, - "step": 254740 - }, - { - "epoch": 0.44, - "learning_rate": 2.778733036408724e-05, - "loss": 2.3389, - "step": 254750 - }, - { - "epoch": 0.44, - "learning_rate": 2.778645842416041e-05, - "loss": 2.3127, - "step": 254760 - }, - { - "epoch": 0.44, - "learning_rate": 2.7785586484233583e-05, - "loss": 2.3231, - "step": 254770 - }, - { - "epoch": 0.44, - "learning_rate": 2.7784714544306757e-05, - "loss": 2.4384, - "step": 254780 - }, - { - "epoch": 0.44, - "learning_rate": 2.7783842604379927e-05, - "loss": 2.3482, - "step": 254790 - }, - { - "epoch": 0.44, - "learning_rate": 2.77829706644531e-05, - "loss": 2.3672, - "step": 254800 - }, - { - "epoch": 0.44, - "learning_rate": 2.7782098724526278e-05, - "loss": 2.3287, - "step": 254810 - }, - { - "epoch": 0.44, - "learning_rate": 2.7781226784599452e-05, - "loss": 2.3299, - "step": 254820 - }, - { - "epoch": 0.44, - "learning_rate": 2.7780354844672622e-05, - "loss": 2.4149, - "step": 254830 - }, - { - "epoch": 0.44, - "learning_rate": 2.7779482904745796e-05, - "loss": 2.453, - "step": 254840 - }, - { - "epoch": 0.44, - "learning_rate": 2.777861096481897e-05, - "loss": 2.3995, - "step": 254850 - }, - { - "epoch": 0.44, - "learning_rate": 2.777773902489214e-05, - "loss": 2.3704, - "step": 254860 - }, - { - "epoch": 0.44, - "learning_rate": 2.7776867084965314e-05, - "loss": 2.3278, - "step": 254870 - }, - { - "epoch": 0.44, - "learning_rate": 2.777599514503849e-05, - "loss": 2.306, - "step": 254880 - }, - { - "epoch": 0.44, - "learning_rate": 2.7775123205111665e-05, - "loss": 2.3666, - "step": 254890 - }, - { - "epoch": 0.44, - "learning_rate": 2.7774251265184835e-05, - "loss": 2.448, - "step": 254900 - }, - { - "epoch": 0.44, - "learning_rate": 2.777337932525801e-05, - "loss": 2.2609, - "step": 254910 - }, - { - "epoch": 0.44, - "learning_rate": 2.7772507385331183e-05, - "loss": 2.3974, - "step": 254920 - }, - { - "epoch": 0.44, - "learning_rate": 2.7771635445404353e-05, - "loss": 2.4358, - "step": 254930 - }, - { - "epoch": 0.44, - "learning_rate": 2.7770763505477527e-05, - "loss": 2.3303, - "step": 254940 - }, - { - "epoch": 0.44, - "learning_rate": 2.7769891565550697e-05, - "loss": 2.4265, - "step": 254950 - }, - { - "epoch": 0.44, - "learning_rate": 2.7769019625623878e-05, - "loss": 2.3487, - "step": 254960 - }, - { - "epoch": 0.44, - "learning_rate": 2.7768147685697048e-05, - "loss": 2.4594, - "step": 254970 - }, - { - "epoch": 0.44, - "learning_rate": 2.7767275745770222e-05, - "loss": 2.3718, - "step": 254980 - }, - { - "epoch": 0.44, - "learning_rate": 2.7766403805843392e-05, - "loss": 2.3995, - "step": 254990 - }, - { - "epoch": 0.44, - "learning_rate": 2.7765531865916566e-05, - "loss": 2.3212, - "step": 255000 - }, - { - "epoch": 0.44, - "learning_rate": 2.776465992598974e-05, - "loss": 2.4538, - "step": 255010 - }, - { - "epoch": 0.44, - "learning_rate": 2.776378798606291e-05, - "loss": 2.3578, - "step": 255020 - }, - { - "epoch": 0.44, - "learning_rate": 2.776291604613609e-05, - "loss": 2.275, - "step": 255030 - }, - { - "epoch": 0.44, - "learning_rate": 2.776204410620926e-05, - "loss": 2.4287, - "step": 255040 - }, - { - "epoch": 0.44, - "learning_rate": 2.7761172166282435e-05, - "loss": 2.4343, - "step": 255050 - }, - { - "epoch": 0.44, - "learning_rate": 2.7760300226355605e-05, - "loss": 2.4222, - "step": 255060 - }, - { - "epoch": 0.44, - "learning_rate": 2.775942828642878e-05, - "loss": 2.2925, - "step": 255070 - }, - { - "epoch": 0.44, - "learning_rate": 2.7758556346501953e-05, - "loss": 2.4017, - "step": 255080 - }, - { - "epoch": 0.44, - "learning_rate": 2.7757684406575123e-05, - "loss": 2.3306, - "step": 255090 - }, - { - "epoch": 0.44, - "learning_rate": 2.7756812466648297e-05, - "loss": 2.2624, - "step": 255100 - }, - { - "epoch": 0.44, - "learning_rate": 2.7755940526721474e-05, - "loss": 2.3064, - "step": 255110 - }, - { - "epoch": 0.44, - "learning_rate": 2.7755068586794648e-05, - "loss": 2.3719, - "step": 255120 - }, - { - "epoch": 0.44, - "learning_rate": 2.775419664686782e-05, - "loss": 2.4286, - "step": 255130 - }, - { - "epoch": 0.44, - "learning_rate": 2.7753324706940992e-05, - "loss": 2.3838, - "step": 255140 - }, - { - "epoch": 0.44, - "learning_rate": 2.7752452767014166e-05, - "loss": 2.4506, - "step": 255150 - }, - { - "epoch": 0.44, - "learning_rate": 2.7751580827087336e-05, - "loss": 2.5364, - "step": 255160 - }, - { - "epoch": 0.44, - "learning_rate": 2.775070888716051e-05, - "loss": 2.3726, - "step": 255170 - }, - { - "epoch": 0.45, - "learning_rate": 2.7749836947233687e-05, - "loss": 2.3261, - "step": 255180 - }, - { - "epoch": 0.45, - "learning_rate": 2.774896500730686e-05, - "loss": 2.3038, - "step": 255190 - }, - { - "epoch": 0.45, - "learning_rate": 2.774809306738003e-05, - "loss": 2.384, - "step": 255200 - }, - { - "epoch": 0.45, - "learning_rate": 2.7747221127453205e-05, - "loss": 2.4188, - "step": 255210 - }, - { - "epoch": 0.45, - "learning_rate": 2.7746349187526376e-05, - "loss": 2.265, - "step": 255220 - }, - { - "epoch": 0.45, - "learning_rate": 2.774547724759955e-05, - "loss": 2.2837, - "step": 255230 - }, - { - "epoch": 0.45, - "learning_rate": 2.7744605307672723e-05, - "loss": 2.3142, - "step": 255240 - }, - { - "epoch": 0.45, - "learning_rate": 2.7743733367745893e-05, - "loss": 2.4188, - "step": 255250 - }, - { - "epoch": 0.45, - "learning_rate": 2.7742861427819074e-05, - "loss": 2.4214, - "step": 255260 - }, - { - "epoch": 0.45, - "learning_rate": 2.7741989487892244e-05, - "loss": 2.4173, - "step": 255270 - }, - { - "epoch": 0.45, - "learning_rate": 2.7741117547965418e-05, - "loss": 2.3916, - "step": 255280 - }, - { - "epoch": 0.45, - "learning_rate": 2.774024560803859e-05, - "loss": 2.2544, - "step": 255290 - }, - { - "epoch": 0.45, - "learning_rate": 2.7739373668111762e-05, - "loss": 2.4617, - "step": 255300 - }, - { - "epoch": 0.45, - "learning_rate": 2.7738501728184936e-05, - "loss": 2.3542, - "step": 255310 - }, - { - "epoch": 0.45, - "learning_rate": 2.7737629788258106e-05, - "loss": 2.383, - "step": 255320 - }, - { - "epoch": 0.45, - "learning_rate": 2.7736757848331284e-05, - "loss": 2.3188, - "step": 255330 - }, - { - "epoch": 0.45, - "learning_rate": 2.7735885908404457e-05, - "loss": 2.3992, - "step": 255340 - }, - { - "epoch": 0.45, - "learning_rate": 2.773501396847763e-05, - "loss": 2.4868, - "step": 255350 - }, - { - "epoch": 0.45, - "learning_rate": 2.77341420285508e-05, - "loss": 2.4145, - "step": 255360 - }, - { - "epoch": 0.45, - "learning_rate": 2.7733270088623975e-05, - "loss": 2.387, - "step": 255370 - }, - { - "epoch": 0.45, - "learning_rate": 2.7732398148697146e-05, - "loss": 2.177, - "step": 255380 - }, - { - "epoch": 0.45, - "learning_rate": 2.773152620877032e-05, - "loss": 2.4626, - "step": 255390 - }, - { - "epoch": 0.45, - "learning_rate": 2.7730654268843497e-05, - "loss": 2.3987, - "step": 255400 - }, - { - "epoch": 0.45, - "learning_rate": 2.772978232891667e-05, - "loss": 2.4662, - "step": 255410 - }, - { - "epoch": 0.45, - "learning_rate": 2.7728910388989844e-05, - "loss": 2.361, - "step": 255420 - }, - { - "epoch": 0.45, - "learning_rate": 2.7728038449063015e-05, - "loss": 2.2769, - "step": 255430 - }, - { - "epoch": 0.45, - "learning_rate": 2.7727166509136188e-05, - "loss": 2.4207, - "step": 255440 - }, - { - "epoch": 0.45, - "learning_rate": 2.772629456920936e-05, - "loss": 2.3307, - "step": 255450 - }, - { - "epoch": 0.45, - "learning_rate": 2.7725422629282532e-05, - "loss": 2.3883, - "step": 255460 - }, - { - "epoch": 0.45, - "learning_rate": 2.7724550689355706e-05, - "loss": 2.3068, - "step": 255470 - }, - { - "epoch": 0.45, - "learning_rate": 2.7723678749428883e-05, - "loss": 2.3547, - "step": 255480 - }, - { - "epoch": 0.45, - "learning_rate": 2.7722806809502054e-05, - "loss": 2.3186, - "step": 255490 - }, - { - "epoch": 0.45, - "learning_rate": 2.7721934869575228e-05, - "loss": 2.3235, - "step": 255500 - }, - { - "epoch": 0.45, - "learning_rate": 2.77210629296484e-05, - "loss": 2.415, - "step": 255510 - }, - { - "epoch": 0.45, - "learning_rate": 2.772019098972157e-05, - "loss": 2.4369, - "step": 255520 - }, - { - "epoch": 0.45, - "learning_rate": 2.7719319049794745e-05, - "loss": 2.4112, - "step": 255530 - }, - { - "epoch": 0.45, - "learning_rate": 2.771844710986792e-05, - "loss": 2.3755, - "step": 255540 - }, - { - "epoch": 0.45, - "learning_rate": 2.7717575169941096e-05, - "loss": 2.3892, - "step": 255550 - }, - { - "epoch": 0.45, - "learning_rate": 2.7716703230014267e-05, - "loss": 2.4331, - "step": 255560 - }, - { - "epoch": 0.45, - "learning_rate": 2.771583129008744e-05, - "loss": 2.3771, - "step": 255570 - }, - { - "epoch": 0.45, - "learning_rate": 2.7714959350160614e-05, - "loss": 2.3788, - "step": 255580 - }, - { - "epoch": 0.45, - "learning_rate": 2.7714087410233785e-05, - "loss": 2.303, - "step": 255590 - }, - { - "epoch": 0.45, - "learning_rate": 2.771321547030696e-05, - "loss": 2.3653, - "step": 255600 - }, - { - "epoch": 0.45, - "learning_rate": 2.771234353038013e-05, - "loss": 2.3513, - "step": 255610 - }, - { - "epoch": 0.45, - "learning_rate": 2.7711471590453303e-05, - "loss": 2.4204, - "step": 255620 - }, - { - "epoch": 0.45, - "learning_rate": 2.771059965052648e-05, - "loss": 2.3672, - "step": 255630 - }, - { - "epoch": 0.45, - "learning_rate": 2.7709727710599654e-05, - "loss": 2.4254, - "step": 255640 - }, - { - "epoch": 0.45, - "learning_rate": 2.7708855770672827e-05, - "loss": 2.3851, - "step": 255650 - }, - { - "epoch": 0.45, - "learning_rate": 2.7707983830745998e-05, - "loss": 2.4203, - "step": 255660 - }, - { - "epoch": 0.45, - "learning_rate": 2.770711189081917e-05, - "loss": 2.4277, - "step": 255670 - }, - { - "epoch": 0.45, - "learning_rate": 2.7706239950892342e-05, - "loss": 2.3575, - "step": 255680 - }, - { - "epoch": 0.45, - "learning_rate": 2.7705368010965516e-05, - "loss": 2.4017, - "step": 255690 - }, - { - "epoch": 0.45, - "learning_rate": 2.7704496071038693e-05, - "loss": 2.4569, - "step": 255700 - }, - { - "epoch": 0.45, - "learning_rate": 2.7703624131111867e-05, - "loss": 2.392, - "step": 255710 - }, - { - "epoch": 0.45, - "learning_rate": 2.7702752191185037e-05, - "loss": 2.3708, - "step": 255720 - }, - { - "epoch": 0.45, - "learning_rate": 2.770188025125821e-05, - "loss": 2.4555, - "step": 255730 - }, - { - "epoch": 0.45, - "learning_rate": 2.7701008311331384e-05, - "loss": 2.3402, - "step": 255740 - }, - { - "epoch": 0.45, - "learning_rate": 2.7700136371404555e-05, - "loss": 2.3395, - "step": 255750 - }, - { - "epoch": 0.45, - "learning_rate": 2.769926443147773e-05, - "loss": 2.3709, - "step": 255760 - }, - { - "epoch": 0.45, - "learning_rate": 2.7698392491550902e-05, - "loss": 2.3854, - "step": 255770 - }, - { - "epoch": 0.45, - "learning_rate": 2.769752055162408e-05, - "loss": 2.2644, - "step": 255780 - }, - { - "epoch": 0.45, - "learning_rate": 2.769664861169725e-05, - "loss": 2.499, - "step": 255790 - }, - { - "epoch": 0.45, - "learning_rate": 2.7695776671770424e-05, - "loss": 2.3663, - "step": 255800 - }, - { - "epoch": 0.45, - "learning_rate": 2.7694904731843597e-05, - "loss": 2.376, - "step": 255810 - }, - { - "epoch": 0.45, - "learning_rate": 2.7694032791916768e-05, - "loss": 2.4105, - "step": 255820 - }, - { - "epoch": 0.45, - "learning_rate": 2.769316085198994e-05, - "loss": 2.4572, - "step": 255830 - }, - { - "epoch": 0.45, - "learning_rate": 2.7692288912063112e-05, - "loss": 2.3715, - "step": 255840 - }, - { - "epoch": 0.45, - "learning_rate": 2.7691416972136293e-05, - "loss": 2.5044, - "step": 255850 - }, - { - "epoch": 0.45, - "learning_rate": 2.7690545032209463e-05, - "loss": 2.34, - "step": 255860 - }, - { - "epoch": 0.45, - "learning_rate": 2.7689673092282637e-05, - "loss": 2.2933, - "step": 255870 - }, - { - "epoch": 0.45, - "learning_rate": 2.768880115235581e-05, - "loss": 2.3849, - "step": 255880 - }, - { - "epoch": 0.45, - "learning_rate": 2.768792921242898e-05, - "loss": 2.3227, - "step": 255890 - }, - { - "epoch": 0.45, - "learning_rate": 2.7687057272502155e-05, - "loss": 2.3589, - "step": 255900 - }, - { - "epoch": 0.45, - "learning_rate": 2.7686185332575325e-05, - "loss": 2.3998, - "step": 255910 - }, - { - "epoch": 0.45, - "learning_rate": 2.76853133926485e-05, - "loss": 2.4371, - "step": 255920 - }, - { - "epoch": 0.45, - "learning_rate": 2.7684441452721676e-05, - "loss": 2.3606, - "step": 255930 - }, - { - "epoch": 0.45, - "learning_rate": 2.768356951279485e-05, - "loss": 2.3365, - "step": 255940 - }, - { - "epoch": 0.45, - "learning_rate": 2.768269757286802e-05, - "loss": 2.367, - "step": 255950 - }, - { - "epoch": 0.45, - "learning_rate": 2.7681825632941194e-05, - "loss": 2.4008, - "step": 255960 - }, - { - "epoch": 0.45, - "learning_rate": 2.7680953693014368e-05, - "loss": 2.2758, - "step": 255970 - }, - { - "epoch": 0.45, - "learning_rate": 2.7680081753087538e-05, - "loss": 2.3095, - "step": 255980 - }, - { - "epoch": 0.45, - "learning_rate": 2.7679209813160712e-05, - "loss": 2.3736, - "step": 255990 - }, - { - "epoch": 0.45, - "learning_rate": 2.767833787323389e-05, - "loss": 2.3646, - "step": 256000 - }, - { - "epoch": 0.89, - "learning_rate": 5.354931866614118e-06, - "loss": 2.3582, - "step": 256010 - }, - { - "epoch": 0.89, - "learning_rate": 5.353187986760464e-06, - "loss": 2.3675, - "step": 256020 - }, - { - "epoch": 0.89, - "learning_rate": 5.351444106906811e-06, - "loss": 2.4478, - "step": 256030 - }, - { - "epoch": 0.89, - "learning_rate": 5.349700227053157e-06, - "loss": 2.4297, - "step": 256040 - }, - { - "epoch": 0.89, - "learning_rate": 5.347956347199504e-06, - "loss": 2.4002, - "step": 256050 - }, - { - "epoch": 0.89, - "learning_rate": 5.34621246734585e-06, - "loss": 2.3831, - "step": 256060 - }, - { - "epoch": 0.89, - "learning_rate": 5.344468587492196e-06, - "loss": 2.3242, - "step": 256070 - }, - { - "epoch": 0.89, - "learning_rate": 5.342724707638542e-06, - "loss": 2.3855, - "step": 256080 - }, - { - "epoch": 0.89, - "learning_rate": 5.34098082778489e-06, - "loss": 2.3627, - "step": 256090 - }, - { - "epoch": 0.89, - "learning_rate": 5.339236947931236e-06, - "loss": 2.3849, - "step": 256100 - }, - { - "epoch": 0.89, - "learning_rate": 5.337493068077582e-06, - "loss": 2.4403, - "step": 256110 - }, - { - "epoch": 0.89, - "learning_rate": 5.335749188223928e-06, - "loss": 2.4415, - "step": 256120 - }, - { - "epoch": 0.89, - "learning_rate": 5.334005308370275e-06, - "loss": 2.3887, - "step": 256130 - }, - { - "epoch": 0.89, - "learning_rate": 5.332261428516621e-06, - "loss": 2.455, - "step": 256140 - }, - { - "epoch": 0.89, - "learning_rate": 5.330517548662967e-06, - "loss": 2.3745, - "step": 256150 - }, - { - "epoch": 0.89, - "learning_rate": 5.328773668809314e-06, - "loss": 2.4248, - "step": 256160 - }, - { - "epoch": 0.89, - "learning_rate": 5.327029788955661e-06, - "loss": 2.3738, - "step": 256170 - }, - { - "epoch": 0.89, - "learning_rate": 5.325285909102007e-06, - "loss": 2.3599, - "step": 256180 - }, - { - "epoch": 0.89, - "learning_rate": 5.323542029248353e-06, - "loss": 2.3814, - "step": 256190 - }, - { - "epoch": 0.89, - "learning_rate": 5.321798149394699e-06, - "loss": 2.3544, - "step": 256200 - }, - { - "epoch": 0.89, - "learning_rate": 5.320054269541046e-06, - "loss": 2.342, - "step": 256210 - }, - { - "epoch": 0.89, - "learning_rate": 5.318310389687392e-06, - "loss": 2.3765, - "step": 256220 - }, - { - "epoch": 0.89, - "learning_rate": 5.316566509833739e-06, - "loss": 2.4637, - "step": 256230 - }, - { - "epoch": 0.89, - "learning_rate": 5.314822629980085e-06, - "loss": 2.2951, - "step": 256240 - }, - { - "epoch": 0.89, - "learning_rate": 5.313078750126432e-06, - "loss": 2.3562, - "step": 256250 - }, - { - "epoch": 0.89, - "learning_rate": 5.311334870272778e-06, - "loss": 2.3041, - "step": 256260 - }, - { - "epoch": 0.89, - "learning_rate": 5.309590990419124e-06, - "loss": 2.342, - "step": 256270 - }, - { - "epoch": 0.89, - "learning_rate": 5.30784711056547e-06, - "loss": 2.3967, - "step": 256280 - }, - { - "epoch": 0.89, - "learning_rate": 5.306103230711818e-06, - "loss": 2.3413, - "step": 256290 - }, - { - "epoch": 0.89, - "learning_rate": 5.3043593508581635e-06, - "loss": 2.3959, - "step": 256300 - }, - { - "epoch": 0.89, - "learning_rate": 5.30261547100451e-06, - "loss": 2.4433, - "step": 256310 - }, - { - "epoch": 0.89, - "learning_rate": 5.300871591150856e-06, - "loss": 2.3768, - "step": 256320 - }, - { - "epoch": 0.89, - "learning_rate": 5.299127711297203e-06, - "loss": 2.2736, - "step": 256330 - }, - { - "epoch": 0.89, - "learning_rate": 5.297383831443549e-06, - "loss": 2.4386, - "step": 256340 - }, - { - "epoch": 0.89, - "learning_rate": 5.295639951589895e-06, - "loss": 2.3786, - "step": 256350 - }, - { - "epoch": 0.89, - "learning_rate": 5.293896071736242e-06, - "loss": 2.3633, - "step": 256360 - }, - { - "epoch": 0.89, - "learning_rate": 5.292152191882589e-06, - "loss": 2.3843, - "step": 256370 - }, - { - "epoch": 0.89, - "learning_rate": 5.2904083120289345e-06, - "loss": 2.424, - "step": 256380 - }, - { - "epoch": 0.89, - "learning_rate": 5.288664432175281e-06, - "loss": 2.375, - "step": 256390 - }, - { - "epoch": 0.89, - "learning_rate": 5.286920552321627e-06, - "loss": 2.2736, - "step": 256400 - }, - { - "epoch": 0.89, - "learning_rate": 5.285176672467974e-06, - "loss": 2.4225, - "step": 256410 - }, - { - "epoch": 0.89, - "learning_rate": 5.28343279261432e-06, - "loss": 2.3215, - "step": 256420 - }, - { - "epoch": 0.89, - "learning_rate": 5.281688912760667e-06, - "loss": 2.3795, - "step": 256430 - }, - { - "epoch": 0.89, - "learning_rate": 5.279945032907013e-06, - "loss": 2.3795, - "step": 256440 - }, - { - "epoch": 0.89, - "learning_rate": 5.27820115305336e-06, - "loss": 2.338, - "step": 256450 - }, - { - "epoch": 0.89, - "learning_rate": 5.2764572731997055e-06, - "loss": 2.3321, - "step": 256460 - }, - { - "epoch": 0.89, - "learning_rate": 5.274713393346052e-06, - "loss": 2.4215, - "step": 256470 - }, - { - "epoch": 0.89, - "learning_rate": 5.272969513492398e-06, - "loss": 2.4639, - "step": 256480 - }, - { - "epoch": 0.89, - "learning_rate": 5.271225633638746e-06, - "loss": 2.3912, - "step": 256490 - }, - { - "epoch": 0.89, - "learning_rate": 5.2694817537850914e-06, - "loss": 2.3259, - "step": 256500 - }, - { - "epoch": 0.89, - "learning_rate": 5.267737873931438e-06, - "loss": 2.319, - "step": 256510 - }, - { - "epoch": 0.89, - "learning_rate": 5.265993994077784e-06, - "loss": 2.3882, - "step": 256520 - }, - { - "epoch": 0.89, - "learning_rate": 5.264250114224131e-06, - "loss": 2.3908, - "step": 256530 - }, - { - "epoch": 0.89, - "learning_rate": 5.2625062343704765e-06, - "loss": 2.4055, - "step": 256540 - }, - { - "epoch": 0.89, - "learning_rate": 5.260762354516823e-06, - "loss": 2.3113, - "step": 256550 - }, - { - "epoch": 0.89, - "learning_rate": 5.25901847466317e-06, - "loss": 2.3672, - "step": 256560 - }, - { - "epoch": 0.89, - "learning_rate": 5.257274594809517e-06, - "loss": 2.3848, - "step": 256570 - }, - { - "epoch": 0.89, - "learning_rate": 5.2555307149558624e-06, - "loss": 2.4087, - "step": 256580 - }, - { - "epoch": 0.89, - "learning_rate": 5.253786835102209e-06, - "loss": 2.329, - "step": 256590 - }, - { - "epoch": 0.89, - "learning_rate": 5.252042955248555e-06, - "loss": 2.3174, - "step": 256600 - }, - { - "epoch": 0.89, - "learning_rate": 5.250299075394902e-06, - "loss": 2.3467, - "step": 256610 - }, - { - "epoch": 0.9, - "learning_rate": 5.2485551955412475e-06, - "loss": 2.3472, - "step": 256620 - }, - { - "epoch": 0.9, - "learning_rate": 5.246811315687595e-06, - "loss": 2.2868, - "step": 256630 - }, - { - "epoch": 0.9, - "learning_rate": 5.245067435833941e-06, - "loss": 2.3208, - "step": 256640 - }, - { - "epoch": 0.9, - "learning_rate": 5.243323555980288e-06, - "loss": 2.3691, - "step": 256650 - }, - { - "epoch": 0.9, - "learning_rate": 5.2415796761266334e-06, - "loss": 2.4033, - "step": 256660 - }, - { - "epoch": 0.9, - "learning_rate": 5.23983579627298e-06, - "loss": 2.3467, - "step": 256670 - }, - { - "epoch": 0.9, - "learning_rate": 5.238091916419326e-06, - "loss": 2.371, - "step": 256680 - }, - { - "epoch": 0.9, - "learning_rate": 5.2363480365656735e-06, - "loss": 2.3569, - "step": 256690 - }, - { - "epoch": 0.9, - "learning_rate": 5.234604156712019e-06, - "loss": 2.3565, - "step": 256700 - }, - { - "epoch": 0.9, - "learning_rate": 5.232860276858366e-06, - "loss": 2.3014, - "step": 256710 - }, - { - "epoch": 0.9, - "learning_rate": 5.231116397004712e-06, - "loss": 2.3847, - "step": 256720 - }, - { - "epoch": 0.9, - "learning_rate": 5.229372517151059e-06, - "loss": 2.339, - "step": 256730 - }, - { - "epoch": 0.9, - "learning_rate": 5.2276286372974044e-06, - "loss": 2.3468, - "step": 256740 - }, - { - "epoch": 0.9, - "learning_rate": 5.225884757443751e-06, - "loss": 2.3991, - "step": 256750 - }, - { - "epoch": 0.9, - "learning_rate": 5.224140877590098e-06, - "loss": 2.3706, - "step": 256760 - }, - { - "epoch": 0.9, - "learning_rate": 5.2223969977364445e-06, - "loss": 2.3427, - "step": 256770 - }, - { - "epoch": 0.9, - "learning_rate": 5.22065311788279e-06, - "loss": 2.3872, - "step": 256780 - }, - { - "epoch": 0.9, - "learning_rate": 5.218909238029137e-06, - "loss": 2.3275, - "step": 256790 - }, - { - "epoch": 0.9, - "learning_rate": 5.217165358175483e-06, - "loss": 2.3744, - "step": 256800 - }, - { - "epoch": 0.9, - "learning_rate": 5.21542147832183e-06, - "loss": 2.369, - "step": 256810 - }, - { - "epoch": 0.9, - "learning_rate": 5.2136775984681754e-06, - "loss": 2.3179, - "step": 256820 - }, - { - "epoch": 0.9, - "learning_rate": 5.211933718614523e-06, - "loss": 2.362, - "step": 256830 - }, - { - "epoch": 0.9, - "learning_rate": 5.210189838760869e-06, - "loss": 2.3696, - "step": 256840 - }, - { - "epoch": 0.9, - "learning_rate": 5.2084459589072155e-06, - "loss": 2.3714, - "step": 256850 - }, - { - "epoch": 0.9, - "learning_rate": 5.206702079053561e-06, - "loss": 2.3509, - "step": 256860 - }, - { - "epoch": 0.9, - "learning_rate": 5.204958199199908e-06, - "loss": 2.3564, - "step": 256870 - }, - { - "epoch": 0.9, - "learning_rate": 5.203214319346254e-06, - "loss": 2.3223, - "step": 256880 - }, - { - "epoch": 0.9, - "learning_rate": 5.2014704394926014e-06, - "loss": 2.3757, - "step": 256890 - }, - { - "epoch": 0.9, - "learning_rate": 5.199726559638947e-06, - "loss": 2.3983, - "step": 256900 - }, - { - "epoch": 0.9, - "learning_rate": 5.197982679785294e-06, - "loss": 2.367, - "step": 256910 - }, - { - "epoch": 0.9, - "learning_rate": 5.19623879993164e-06, - "loss": 2.3722, - "step": 256920 - }, - { - "epoch": 0.9, - "learning_rate": 5.1944949200779865e-06, - "loss": 2.2908, - "step": 256930 - }, - { - "epoch": 0.9, - "learning_rate": 5.192751040224332e-06, - "loss": 2.4104, - "step": 256940 - }, - { - "epoch": 0.9, - "learning_rate": 5.191007160370679e-06, - "loss": 2.3264, - "step": 256950 - }, - { - "epoch": 0.9, - "learning_rate": 5.189263280517026e-06, - "loss": 2.3562, - "step": 256960 - }, - { - "epoch": 0.9, - "learning_rate": 5.1875194006633724e-06, - "loss": 2.305, - "step": 256970 - }, - { - "epoch": 0.9, - "learning_rate": 5.185775520809718e-06, - "loss": 2.4383, - "step": 256980 - }, - { - "epoch": 0.9, - "learning_rate": 5.184031640956065e-06, - "loss": 2.2791, - "step": 256990 - }, - { - "epoch": 0.9, - "learning_rate": 5.182287761102411e-06, - "loss": 2.4113, - "step": 257000 - }, - { - "epoch": 0.9, - "learning_rate": 5.1805438812487575e-06, - "loss": 2.3209, - "step": 257010 - }, - { - "epoch": 0.9, - "learning_rate": 5.178800001395104e-06, - "loss": 2.427, - "step": 257020 - }, - { - "epoch": 0.9, - "learning_rate": 5.177056121541451e-06, - "loss": 2.4318, - "step": 257030 - }, - { - "epoch": 0.9, - "learning_rate": 5.175312241687797e-06, - "loss": 2.3616, - "step": 257040 - }, - { - "epoch": 0.9, - "learning_rate": 5.1735683618341434e-06, - "loss": 2.3726, - "step": 257050 - }, - { - "epoch": 0.9, - "learning_rate": 5.171824481980489e-06, - "loss": 2.4024, - "step": 257060 - }, - { - "epoch": 0.9, - "learning_rate": 5.170080602126836e-06, - "loss": 2.3935, - "step": 257070 - }, - { - "epoch": 0.9, - "learning_rate": 5.168336722273182e-06, - "loss": 2.3543, - "step": 257080 - }, - { - "epoch": 0.9, - "learning_rate": 5.166592842419529e-06, - "loss": 2.318, - "step": 257090 - }, - { - "epoch": 0.9, - "learning_rate": 5.164848962565875e-06, - "loss": 2.3125, - "step": 257100 - }, - { - "epoch": 0.9, - "learning_rate": 5.163105082712222e-06, - "loss": 2.3714, - "step": 257110 - }, - { - "epoch": 0.9, - "learning_rate": 5.161361202858568e-06, - "loss": 2.3635, - "step": 257120 - }, - { - "epoch": 0.9, - "learning_rate": 5.1596173230049144e-06, - "loss": 2.39, - "step": 257130 - }, - { - "epoch": 0.9, - "learning_rate": 5.15787344315126e-06, - "loss": 2.3963, - "step": 257140 - }, - { - "epoch": 0.9, - "learning_rate": 5.156129563297607e-06, - "loss": 2.3936, - "step": 257150 - }, - { - "epoch": 0.9, - "learning_rate": 5.154385683443954e-06, - "loss": 2.4016, - "step": 257160 - }, - { - "epoch": 0.9, - "learning_rate": 5.1526418035903e-06, - "loss": 2.2812, - "step": 257170 - }, - { - "epoch": 0.9, - "learning_rate": 5.150897923736646e-06, - "loss": 2.3631, - "step": 257180 - }, - { - "epoch": 0.9, - "learning_rate": 5.149154043882993e-06, - "loss": 2.4348, - "step": 257190 - }, - { - "epoch": 0.9, - "learning_rate": 5.147410164029339e-06, - "loss": 2.3934, - "step": 257200 - }, - { - "epoch": 0.9, - "learning_rate": 5.1456662841756854e-06, - "loss": 2.3166, - "step": 257210 - }, - { - "epoch": 0.9, - "learning_rate": 5.143922404322032e-06, - "loss": 2.3631, - "step": 257220 - }, - { - "epoch": 0.9, - "learning_rate": 5.142178524468379e-06, - "loss": 2.4293, - "step": 257230 - }, - { - "epoch": 0.9, - "learning_rate": 5.140434644614725e-06, - "loss": 2.3747, - "step": 257240 - }, - { - "epoch": 0.9, - "learning_rate": 5.138690764761071e-06, - "loss": 2.3977, - "step": 257250 - }, - { - "epoch": 0.9, - "learning_rate": 5.136946884907417e-06, - "loss": 2.2926, - "step": 257260 - }, - { - "epoch": 0.9, - "learning_rate": 5.135203005053764e-06, - "loss": 2.323, - "step": 257270 - }, - { - "epoch": 0.9, - "learning_rate": 5.133459125200111e-06, - "loss": 2.376, - "step": 257280 - }, - { - "epoch": 0.9, - "learning_rate": 5.131715245346457e-06, - "loss": 2.3071, - "step": 257290 - }, - { - "epoch": 0.9, - "learning_rate": 5.129971365492803e-06, - "loss": 2.2773, - "step": 257300 - }, - { - "epoch": 0.9, - "learning_rate": 5.12822748563915e-06, - "loss": 2.3829, - "step": 257310 - }, - { - "epoch": 0.9, - "learning_rate": 5.126483605785496e-06, - "loss": 2.41, - "step": 257320 - }, - { - "epoch": 0.9, - "learning_rate": 5.124739725931842e-06, - "loss": 2.3027, - "step": 257330 - }, - { - "epoch": 0.9, - "learning_rate": 5.122995846078188e-06, - "loss": 2.2588, - "step": 257340 - }, - { - "epoch": 0.9, - "learning_rate": 5.121251966224535e-06, - "loss": 2.2358, - "step": 257350 - }, - { - "epoch": 0.9, - "learning_rate": 5.119508086370882e-06, - "loss": 2.3593, - "step": 257360 - }, - { - "epoch": 0.9, - "learning_rate": 5.117764206517228e-06, - "loss": 2.3454, - "step": 257370 - }, - { - "epoch": 0.9, - "learning_rate": 5.116020326663574e-06, - "loss": 2.3462, - "step": 257380 - }, - { - "epoch": 0.9, - "learning_rate": 5.114276446809921e-06, - "loss": 2.4014, - "step": 257390 - }, - { - "epoch": 0.9, - "learning_rate": 5.112532566956267e-06, - "loss": 2.2754, - "step": 257400 - }, - { - "epoch": 0.9, - "learning_rate": 5.110788687102613e-06, - "loss": 2.3404, - "step": 257410 - }, - { - "epoch": 0.9, - "learning_rate": 5.10904480724896e-06, - "loss": 2.3427, - "step": 257420 - }, - { - "epoch": 0.9, - "learning_rate": 5.107300927395307e-06, - "loss": 2.3379, - "step": 257430 - }, - { - "epoch": 0.9, - "learning_rate": 5.105557047541653e-06, - "loss": 2.3091, - "step": 257440 - }, - { - "epoch": 0.9, - "learning_rate": 5.103813167687999e-06, - "loss": 2.3933, - "step": 257450 - }, - { - "epoch": 0.9, - "learning_rate": 5.102069287834345e-06, - "loss": 2.3192, - "step": 257460 - }, - { - "epoch": 0.9, - "learning_rate": 5.100325407980692e-06, - "loss": 2.4396, - "step": 257470 - }, - { - "epoch": 0.9, - "learning_rate": 5.0985815281270385e-06, - "loss": 2.3595, - "step": 257480 - }, - { - "epoch": 0.9, - "learning_rate": 5.096837648273385e-06, - "loss": 2.3795, - "step": 257490 - }, - { - "epoch": 0.9, - "learning_rate": 5.095093768419731e-06, - "loss": 2.393, - "step": 257500 - }, - { - "epoch": 0.9, - "learning_rate": 5.093349888566078e-06, - "loss": 2.4275, - "step": 257510 - }, - { - "epoch": 0.9, - "learning_rate": 5.091606008712424e-06, - "loss": 2.4011, - "step": 257520 - }, - { - "epoch": 0.9, - "learning_rate": 5.08986212885877e-06, - "loss": 2.3176, - "step": 257530 - }, - { - "epoch": 0.9, - "learning_rate": 5.088118249005117e-06, - "loss": 2.4229, - "step": 257540 - }, - { - "epoch": 0.9, - "learning_rate": 5.086374369151463e-06, - "loss": 2.2913, - "step": 257550 - }, - { - "epoch": 0.9, - "learning_rate": 5.0846304892978095e-06, - "loss": 2.3762, - "step": 257560 - }, - { - "epoch": 0.9, - "learning_rate": 5.082886609444156e-06, - "loss": 2.3367, - "step": 257570 - }, - { - "epoch": 0.9, - "learning_rate": 5.081142729590502e-06, - "loss": 2.3427, - "step": 257580 - }, - { - "epoch": 0.9, - "learning_rate": 5.079398849736849e-06, - "loss": 2.4109, - "step": 257590 - }, - { - "epoch": 0.9, - "learning_rate": 5.0776549698831955e-06, - "loss": 2.3766, - "step": 257600 - }, - { - "epoch": 0.9, - "learning_rate": 5.075911090029541e-06, - "loss": 2.3605, - "step": 257610 - }, - { - "epoch": 0.9, - "learning_rate": 5.074167210175888e-06, - "loss": 2.2901, - "step": 257620 - }, - { - "epoch": 0.9, - "learning_rate": 5.072423330322235e-06, - "loss": 2.2964, - "step": 257630 - }, - { - "epoch": 0.9, - "learning_rate": 5.0706794504685805e-06, - "loss": 2.3229, - "step": 257640 - }, - { - "epoch": 0.9, - "learning_rate": 5.068935570614927e-06, - "loss": 2.3524, - "step": 257650 - }, - { - "epoch": 0.9, - "learning_rate": 5.067191690761273e-06, - "loss": 2.3766, - "step": 257660 - }, - { - "epoch": 0.9, - "learning_rate": 5.06544781090762e-06, - "loss": 2.3261, - "step": 257670 - }, - { - "epoch": 0.9, - "learning_rate": 5.0637039310539665e-06, - "loss": 2.3511, - "step": 257680 - }, - { - "epoch": 0.9, - "learning_rate": 5.061960051200313e-06, - "loss": 2.4216, - "step": 257690 - }, - { - "epoch": 0.9, - "learning_rate": 5.060216171346659e-06, - "loss": 2.4148, - "step": 257700 - }, - { - "epoch": 0.9, - "learning_rate": 5.058472291493006e-06, - "loss": 2.321, - "step": 257710 - }, - { - "epoch": 0.9, - "learning_rate": 5.0567284116393515e-06, - "loss": 2.3601, - "step": 257720 - }, - { - "epoch": 0.9, - "learning_rate": 5.054984531785698e-06, - "loss": 2.3226, - "step": 257730 - }, - { - "epoch": 0.9, - "learning_rate": 5.053240651932045e-06, - "loss": 2.4482, - "step": 257740 - }, - { - "epoch": 0.9, - "learning_rate": 5.051496772078391e-06, - "loss": 2.4066, - "step": 257750 - }, - { - "epoch": 0.9, - "learning_rate": 5.0497528922247375e-06, - "loss": 2.4, - "step": 257760 - }, - { - "epoch": 0.9, - "learning_rate": 5.048009012371084e-06, - "loss": 2.4275, - "step": 257770 - }, - { - "epoch": 0.9, - "learning_rate": 5.04626513251743e-06, - "loss": 2.2931, - "step": 257780 - }, - { - "epoch": 0.9, - "learning_rate": 5.044521252663777e-06, - "loss": 2.2831, - "step": 257790 - }, - { - "epoch": 0.9, - "learning_rate": 5.042777372810123e-06, - "loss": 2.3071, - "step": 257800 - }, - { - "epoch": 0.9, - "learning_rate": 5.041033492956469e-06, - "loss": 2.3743, - "step": 257810 - }, - { - "epoch": 0.9, - "learning_rate": 5.039289613102816e-06, - "loss": 2.3105, - "step": 257820 - }, - { - "epoch": 0.9, - "learning_rate": 5.037545733249163e-06, - "loss": 2.381, - "step": 257830 - }, - { - "epoch": 0.9, - "learning_rate": 5.0358018533955085e-06, - "loss": 2.306, - "step": 257840 - }, - { - "epoch": 0.9, - "learning_rate": 5.034057973541855e-06, - "loss": 2.4386, - "step": 257850 - }, - { - "epoch": 0.9, - "learning_rate": 5.032314093688202e-06, - "loss": 2.2909, - "step": 257860 - }, - { - "epoch": 0.9, - "learning_rate": 5.030570213834548e-06, - "loss": 2.3403, - "step": 257870 - }, - { - "epoch": 0.9, - "learning_rate": 5.028826333980894e-06, - "loss": 2.4475, - "step": 257880 - }, - { - "epoch": 0.9, - "learning_rate": 5.027082454127241e-06, - "loss": 2.3357, - "step": 257890 - }, - { - "epoch": 0.9, - "learning_rate": 5.025338574273587e-06, - "loss": 2.4035, - "step": 257900 - }, - { - "epoch": 0.9, - "learning_rate": 5.023594694419934e-06, - "loss": 2.4184, - "step": 257910 - }, - { - "epoch": 0.9, - "learning_rate": 5.0218508145662795e-06, - "loss": 2.3988, - "step": 257920 - }, - { - "epoch": 0.9, - "learning_rate": 5.020106934712626e-06, - "loss": 2.3095, - "step": 257930 - }, - { - "epoch": 0.9, - "learning_rate": 5.018363054858973e-06, - "loss": 2.3571, - "step": 257940 - }, - { - "epoch": 0.9, - "learning_rate": 5.016619175005319e-06, - "loss": 2.2416, - "step": 257950 - }, - { - "epoch": 0.9, - "learning_rate": 5.014875295151665e-06, - "loss": 2.371, - "step": 257960 - }, - { - "epoch": 0.9, - "learning_rate": 5.013131415298012e-06, - "loss": 2.3062, - "step": 257970 - }, - { - "epoch": 0.9, - "learning_rate": 5.011387535444358e-06, - "loss": 2.383, - "step": 257980 - }, - { - "epoch": 0.9, - "learning_rate": 5.009643655590705e-06, - "loss": 2.3184, - "step": 257990 - }, - { - "epoch": 0.9, - "learning_rate": 5.007899775737051e-06, - "loss": 2.4382, - "step": 258000 - }, - { - "epoch": 0.9, - "learning_rate": 5.006155895883397e-06, - "loss": 2.37, - "step": 258010 - }, - { - "epoch": 0.9, - "learning_rate": 5.004412016029744e-06, - "loss": 2.3484, - "step": 258020 - }, - { - "epoch": 0.9, - "learning_rate": 5.0026681361760905e-06, - "loss": 2.3196, - "step": 258030 - }, - { - "epoch": 0.9, - "learning_rate": 5.000924256322436e-06, - "loss": 2.2903, - "step": 258040 - }, - { - "epoch": 0.9, - "learning_rate": 4.999180376468783e-06, - "loss": 2.4194, - "step": 258050 - }, - { - "epoch": 0.9, - "learning_rate": 4.99743649661513e-06, - "loss": 2.3215, - "step": 258060 - }, - { - "epoch": 0.9, - "learning_rate": 4.995692616761476e-06, - "loss": 2.3148, - "step": 258070 - }, - { - "epoch": 0.9, - "learning_rate": 4.993948736907822e-06, - "loss": 2.4586, - "step": 258080 - }, - { - "epoch": 0.9, - "learning_rate": 4.992204857054169e-06, - "loss": 2.3239, - "step": 258090 - }, - { - "epoch": 0.9, - "learning_rate": 4.990460977200515e-06, - "loss": 2.3785, - "step": 258100 - }, - { - "epoch": 0.9, - "learning_rate": 4.9887170973468615e-06, - "loss": 2.3849, - "step": 258110 - }, - { - "epoch": 0.9, - "learning_rate": 4.986973217493208e-06, - "loss": 2.31, - "step": 258120 - }, - { - "epoch": 0.9, - "learning_rate": 4.985229337639554e-06, - "loss": 2.3325, - "step": 258130 - }, - { - "epoch": 0.9, - "learning_rate": 4.983485457785901e-06, - "loss": 2.3265, - "step": 258140 - }, - { - "epoch": 0.9, - "learning_rate": 4.981741577932247e-06, - "loss": 2.3174, - "step": 258150 - }, - { - "epoch": 0.9, - "learning_rate": 4.979997698078593e-06, - "loss": 2.3649, - "step": 258160 - }, - { - "epoch": 0.9, - "learning_rate": 4.97825381822494e-06, - "loss": 2.3315, - "step": 258170 - }, - { - "epoch": 0.9, - "learning_rate": 4.976509938371286e-06, - "loss": 2.3052, - "step": 258180 - }, - { - "epoch": 0.9, - "learning_rate": 4.9747660585176325e-06, - "loss": 2.2661, - "step": 258190 - }, - { - "epoch": 0.9, - "learning_rate": 4.973022178663979e-06, - "loss": 2.4095, - "step": 258200 - }, - { - "epoch": 0.9, - "learning_rate": 4.971278298810325e-06, - "loss": 2.3187, - "step": 258210 - }, - { - "epoch": 0.9, - "learning_rate": 4.969534418956672e-06, - "loss": 2.3892, - "step": 258220 - }, - { - "epoch": 0.9, - "learning_rate": 4.9677905391030185e-06, - "loss": 2.3149, - "step": 258230 - }, - { - "epoch": 0.9, - "learning_rate": 4.966046659249364e-06, - "loss": 2.3179, - "step": 258240 - }, - { - "epoch": 0.9, - "learning_rate": 4.964302779395711e-06, - "loss": 2.2662, - "step": 258250 - }, - { - "epoch": 0.9, - "learning_rate": 4.962558899542058e-06, - "loss": 2.3628, - "step": 258260 - }, - { - "epoch": 0.9, - "learning_rate": 4.9608150196884035e-06, - "loss": 2.3899, - "step": 258270 - }, - { - "epoch": 0.9, - "learning_rate": 4.95907113983475e-06, - "loss": 2.3703, - "step": 258280 - }, - { - "epoch": 0.9, - "learning_rate": 4.957327259981097e-06, - "loss": 2.3522, - "step": 258290 - }, - { - "epoch": 0.9, - "learning_rate": 4.955583380127443e-06, - "loss": 2.3157, - "step": 258300 - }, - { - "epoch": 0.9, - "learning_rate": 4.9538395002737895e-06, - "loss": 2.3566, - "step": 258310 - }, - { - "epoch": 0.9, - "learning_rate": 4.952095620420136e-06, - "loss": 2.3547, - "step": 258320 - }, - { - "epoch": 0.9, - "learning_rate": 4.950351740566482e-06, - "loss": 2.343, - "step": 258330 - }, - { - "epoch": 0.9, - "learning_rate": 4.948607860712829e-06, - "loss": 2.4028, - "step": 258340 - }, - { - "epoch": 0.9, - "learning_rate": 4.9468639808591745e-06, - "loss": 2.388, - "step": 258350 - }, - { - "epoch": 0.9, - "learning_rate": 4.945120101005521e-06, - "loss": 2.3604, - "step": 258360 - }, - { - "epoch": 0.9, - "learning_rate": 4.943376221151868e-06, - "loss": 2.3053, - "step": 258370 - }, - { - "epoch": 0.9, - "learning_rate": 4.941632341298215e-06, - "loss": 2.3987, - "step": 258380 - }, - { - "epoch": 0.9, - "learning_rate": 4.9398884614445605e-06, - "loss": 2.2759, - "step": 258390 - }, - { - "epoch": 0.9, - "learning_rate": 4.938144581590907e-06, - "loss": 2.3716, - "step": 258400 - }, - { - "epoch": 0.9, - "learning_rate": 4.936400701737253e-06, - "loss": 2.3781, - "step": 258410 - }, - { - "epoch": 0.9, - "learning_rate": 4.9346568218836e-06, - "loss": 2.3589, - "step": 258420 - }, - { - "epoch": 0.9, - "learning_rate": 4.932912942029946e-06, - "loss": 2.3636, - "step": 258430 - }, - { - "epoch": 0.9, - "learning_rate": 4.931169062176292e-06, - "loss": 2.3523, - "step": 258440 - }, - { - "epoch": 0.9, - "learning_rate": 4.929425182322639e-06, - "loss": 2.3438, - "step": 258450 - }, - { - "epoch": 0.9, - "learning_rate": 4.927681302468986e-06, - "loss": 2.3194, - "step": 258460 - }, - { - "epoch": 0.9, - "learning_rate": 4.9259374226153315e-06, - "loss": 2.4383, - "step": 258470 - }, - { - "epoch": 0.9, - "learning_rate": 4.924193542761678e-06, - "loss": 2.2923, - "step": 258480 - }, - { - "epoch": 0.9, - "learning_rate": 4.922449662908025e-06, - "loss": 2.3405, - "step": 258490 - }, - { - "epoch": 0.9, - "learning_rate": 4.920705783054371e-06, - "loss": 2.2166, - "step": 258500 - }, - { - "epoch": 0.9, - "learning_rate": 4.918961903200717e-06, - "loss": 2.4169, - "step": 258510 - }, - { - "epoch": 0.9, - "learning_rate": 4.917218023347064e-06, - "loss": 2.3162, - "step": 258520 - }, - { - "epoch": 0.9, - "learning_rate": 4.91547414349341e-06, - "loss": 2.2827, - "step": 258530 - }, - { - "epoch": 0.9, - "learning_rate": 4.913730263639757e-06, - "loss": 2.3291, - "step": 258540 - }, - { - "epoch": 0.9, - "learning_rate": 4.9119863837861025e-06, - "loss": 2.4561, - "step": 258550 - }, - { - "epoch": 0.9, - "learning_rate": 4.910242503932449e-06, - "loss": 2.3809, - "step": 258560 - }, - { - "epoch": 0.9, - "learning_rate": 4.908498624078796e-06, - "loss": 2.2839, - "step": 258570 - }, - { - "epoch": 0.9, - "learning_rate": 4.9067547442251425e-06, - "loss": 2.2899, - "step": 258580 - }, - { - "epoch": 0.9, - "learning_rate": 4.905010864371488e-06, - "loss": 2.3067, - "step": 258590 - }, - { - "epoch": 0.9, - "learning_rate": 4.903266984517835e-06, - "loss": 2.3839, - "step": 258600 - }, - { - "epoch": 0.9, - "learning_rate": 4.901523104664181e-06, - "loss": 2.3496, - "step": 258610 - }, - { - "epoch": 0.9, - "learning_rate": 4.899779224810528e-06, - "loss": 2.364, - "step": 258620 - }, - { - "epoch": 0.9, - "learning_rate": 4.898035344956874e-06, - "loss": 2.4226, - "step": 258630 - }, - { - "epoch": 0.9, - "learning_rate": 4.896291465103221e-06, - "loss": 2.3899, - "step": 258640 - }, - { - "epoch": 0.9, - "learning_rate": 4.894547585249567e-06, - "loss": 2.476, - "step": 258650 - }, - { - "epoch": 0.9, - "learning_rate": 4.8928037053959135e-06, - "loss": 2.3479, - "step": 258660 - }, - { - "epoch": 0.9, - "learning_rate": 4.891059825542259e-06, - "loss": 2.3859, - "step": 258670 - }, - { - "epoch": 0.9, - "learning_rate": 4.889315945688606e-06, - "loss": 2.4304, - "step": 258680 - }, - { - "epoch": 0.9, - "learning_rate": 4.887572065834953e-06, - "loss": 2.4256, - "step": 258690 - }, - { - "epoch": 0.9, - "learning_rate": 4.885828185981299e-06, - "loss": 2.4201, - "step": 258700 - }, - { - "epoch": 0.9, - "learning_rate": 4.884084306127645e-06, - "loss": 2.3957, - "step": 258710 - }, - { - "epoch": 0.9, - "learning_rate": 4.882340426273992e-06, - "loss": 2.3624, - "step": 258720 - }, - { - "epoch": 0.9, - "learning_rate": 4.880596546420338e-06, - "loss": 2.439, - "step": 258730 - }, - { - "epoch": 0.9, - "learning_rate": 4.8788526665666845e-06, - "loss": 2.3351, - "step": 258740 - }, - { - "epoch": 0.9, - "learning_rate": 4.87710878671303e-06, - "loss": 2.2996, - "step": 258750 - }, - { - "epoch": 0.9, - "learning_rate": 4.875364906859377e-06, - "loss": 2.3144, - "step": 258760 - }, - { - "epoch": 0.9, - "learning_rate": 4.873621027005724e-06, - "loss": 2.3907, - "step": 258770 - }, - { - "epoch": 0.9, - "learning_rate": 4.8718771471520705e-06, - "loss": 2.3612, - "step": 258780 - }, - { - "epoch": 0.9, - "learning_rate": 4.870133267298416e-06, - "loss": 2.3395, - "step": 258790 - }, - { - "epoch": 0.9, - "learning_rate": 4.868389387444763e-06, - "loss": 2.477, - "step": 258800 - }, - { - "epoch": 0.9, - "learning_rate": 4.866645507591109e-06, - "loss": 2.318, - "step": 258810 - }, - { - "epoch": 0.9, - "learning_rate": 4.8649016277374555e-06, - "loss": 2.3336, - "step": 258820 - }, - { - "epoch": 0.9, - "learning_rate": 4.863157747883802e-06, - "loss": 2.4125, - "step": 258830 - }, - { - "epoch": 0.9, - "learning_rate": 4.861413868030149e-06, - "loss": 2.3609, - "step": 258840 - }, - { - "epoch": 0.9, - "learning_rate": 4.859669988176495e-06, - "loss": 2.1989, - "step": 258850 - }, - { - "epoch": 0.9, - "learning_rate": 4.8579261083228415e-06, - "loss": 2.3615, - "step": 258860 - }, - { - "epoch": 0.9, - "learning_rate": 4.856182228469187e-06, - "loss": 2.3676, - "step": 258870 - }, - { - "epoch": 0.9, - "learning_rate": 4.854438348615534e-06, - "loss": 2.3706, - "step": 258880 - }, - { - "epoch": 0.9, - "learning_rate": 4.852694468761881e-06, - "loss": 2.3481, - "step": 258890 - }, - { - "epoch": 0.9, - "learning_rate": 4.850950588908227e-06, - "loss": 2.3869, - "step": 258900 - }, - { - "epoch": 0.9, - "learning_rate": 4.849206709054573e-06, - "loss": 2.2858, - "step": 258910 - }, - { - "epoch": 0.9, - "learning_rate": 4.84746282920092e-06, - "loss": 2.3335, - "step": 258920 - }, - { - "epoch": 0.9, - "learning_rate": 4.845718949347266e-06, - "loss": 2.2927, - "step": 258930 - }, - { - "epoch": 0.9, - "learning_rate": 4.8439750694936125e-06, - "loss": 2.3189, - "step": 258940 - }, - { - "epoch": 0.9, - "learning_rate": 4.842231189639959e-06, - "loss": 2.4216, - "step": 258950 - }, - { - "epoch": 0.9, - "learning_rate": 4.840487309786305e-06, - "loss": 2.3337, - "step": 258960 - }, - { - "epoch": 0.9, - "learning_rate": 4.838743429932652e-06, - "loss": 2.3331, - "step": 258970 - }, - { - "epoch": 0.9, - "learning_rate": 4.836999550078998e-06, - "loss": 2.3653, - "step": 258980 - }, - { - "epoch": 0.9, - "learning_rate": 4.835255670225344e-06, - "loss": 2.3374, - "step": 258990 - }, - { - "epoch": 0.9, - "learning_rate": 4.833511790371691e-06, - "loss": 2.3544, - "step": 259000 - }, - { - "epoch": 0.9, - "learning_rate": 4.831767910518037e-06, - "loss": 2.366, - "step": 259010 - }, - { - "epoch": 0.9, - "learning_rate": 4.8300240306643835e-06, - "loss": 2.2731, - "step": 259020 - }, - { - "epoch": 0.9, - "learning_rate": 4.82828015081073e-06, - "loss": 2.3712, - "step": 259030 - }, - { - "epoch": 0.9, - "learning_rate": 4.826536270957077e-06, - "loss": 2.3226, - "step": 259040 - }, - { - "epoch": 0.9, - "learning_rate": 4.824792391103423e-06, - "loss": 2.4115, - "step": 259050 - }, - { - "epoch": 0.9, - "learning_rate": 4.823048511249769e-06, - "loss": 2.2428, - "step": 259060 - }, - { - "epoch": 0.9, - "learning_rate": 4.821304631396115e-06, - "loss": 2.3345, - "step": 259070 - }, - { - "epoch": 0.9, - "learning_rate": 4.819560751542462e-06, - "loss": 2.3343, - "step": 259080 - }, - { - "epoch": 0.9, - "learning_rate": 4.817816871688809e-06, - "loss": 2.3191, - "step": 259090 - }, - { - "epoch": 0.9, - "learning_rate": 4.816072991835155e-06, - "loss": 2.4026, - "step": 259100 - }, - { - "epoch": 0.9, - "learning_rate": 4.814329111981501e-06, - "loss": 2.3822, - "step": 259110 - }, - { - "epoch": 0.9, - "learning_rate": 4.812585232127848e-06, - "loss": 2.3576, - "step": 259120 - }, - { - "epoch": 0.9, - "learning_rate": 4.810841352274194e-06, - "loss": 2.4168, - "step": 259130 - }, - { - "epoch": 0.9, - "learning_rate": 4.80909747242054e-06, - "loss": 2.4301, - "step": 259140 - }, - { - "epoch": 0.9, - "learning_rate": 4.807353592566887e-06, - "loss": 2.3942, - "step": 259150 - }, - { - "epoch": 0.9, - "learning_rate": 4.805609712713234e-06, - "loss": 2.3377, - "step": 259160 - }, - { - "epoch": 0.9, - "learning_rate": 4.80386583285958e-06, - "loss": 2.3486, - "step": 259170 - }, - { - "epoch": 0.9, - "learning_rate": 4.802121953005926e-06, - "loss": 2.3803, - "step": 259180 - }, - { - "epoch": 0.9, - "learning_rate": 4.800378073152272e-06, - "loss": 2.2363, - "step": 259190 - }, - { - "epoch": 0.9, - "learning_rate": 4.798634193298619e-06, - "loss": 2.3449, - "step": 259200 - }, - { - "epoch": 0.9, - "learning_rate": 4.796890313444965e-06, - "loss": 2.3832, - "step": 259210 - }, - { - "epoch": 0.9, - "learning_rate": 4.795146433591312e-06, - "loss": 2.3288, - "step": 259220 - }, - { - "epoch": 0.9, - "learning_rate": 4.793402553737658e-06, - "loss": 2.3178, - "step": 259230 - }, - { - "epoch": 0.9, - "learning_rate": 4.791658673884005e-06, - "loss": 2.3917, - "step": 259240 - }, - { - "epoch": 0.9, - "learning_rate": 4.789914794030351e-06, - "loss": 2.2798, - "step": 259250 - }, - { - "epoch": 0.9, - "learning_rate": 4.788170914176697e-06, - "loss": 2.38, - "step": 259260 - }, - { - "epoch": 0.9, - "learning_rate": 4.786427034323043e-06, - "loss": 2.2874, - "step": 259270 - }, - { - "epoch": 0.9, - "learning_rate": 4.78468315446939e-06, - "loss": 2.3397, - "step": 259280 - }, - { - "epoch": 0.9, - "learning_rate": 4.7829392746157366e-06, - "loss": 2.3002, - "step": 259290 - }, - { - "epoch": 0.9, - "learning_rate": 4.781195394762083e-06, - "loss": 2.3662, - "step": 259300 - }, - { - "epoch": 0.9, - "learning_rate": 4.779451514908429e-06, - "loss": 2.3571, - "step": 259310 - }, - { - "epoch": 0.9, - "learning_rate": 4.777707635054776e-06, - "loss": 2.3193, - "step": 259320 - }, - { - "epoch": 0.9, - "learning_rate": 4.775963755201122e-06, - "loss": 2.3084, - "step": 259330 - }, - { - "epoch": 0.9, - "learning_rate": 4.774219875347468e-06, - "loss": 2.3055, - "step": 259340 - }, - { - "epoch": 0.9, - "learning_rate": 4.772475995493815e-06, - "loss": 2.3862, - "step": 259350 - }, - { - "epoch": 0.9, - "learning_rate": 4.770732115640162e-06, - "loss": 2.2909, - "step": 259360 - }, - { - "epoch": 0.9, - "learning_rate": 4.7689882357865076e-06, - "loss": 2.3637, - "step": 259370 - }, - { - "epoch": 0.9, - "learning_rate": 4.767244355932854e-06, - "loss": 2.3273, - "step": 259380 - }, - { - "epoch": 0.9, - "learning_rate": 4.7655004760792e-06, - "loss": 2.3745, - "step": 259390 - }, - { - "epoch": 0.9, - "learning_rate": 4.763756596225547e-06, - "loss": 2.344, - "step": 259400 - }, - { - "epoch": 0.9, - "learning_rate": 4.762012716371893e-06, - "loss": 2.3231, - "step": 259410 - }, - { - "epoch": 0.9, - "learning_rate": 4.76026883651824e-06, - "loss": 2.3984, - "step": 259420 - }, - { - "epoch": 0.9, - "learning_rate": 4.758524956664586e-06, - "loss": 2.387, - "step": 259430 - }, - { - "epoch": 0.9, - "learning_rate": 4.756781076810933e-06, - "loss": 2.302, - "step": 259440 - }, - { - "epoch": 0.9, - "learning_rate": 4.7550371969572786e-06, - "loss": 2.2626, - "step": 259450 - }, - { - "epoch": 0.9, - "learning_rate": 4.753293317103625e-06, - "loss": 2.3355, - "step": 259460 - }, - { - "epoch": 0.9, - "learning_rate": 4.751549437249971e-06, - "loss": 2.2764, - "step": 259470 - }, - { - "epoch": 0.91, - "learning_rate": 4.749805557396318e-06, - "loss": 2.3473, - "step": 259480 - }, - { - "epoch": 0.91, - "learning_rate": 4.7480616775426645e-06, - "loss": 2.2861, - "step": 259490 - }, - { - "epoch": 0.91, - "learning_rate": 4.746317797689011e-06, - "loss": 2.3256, - "step": 259500 - }, - { - "epoch": 0.91, - "learning_rate": 4.744573917835357e-06, - "loss": 2.3243, - "step": 259510 - }, - { - "epoch": 0.91, - "learning_rate": 4.742830037981704e-06, - "loss": 2.3573, - "step": 259520 - }, - { - "epoch": 0.91, - "learning_rate": 4.7410861581280496e-06, - "loss": 2.347, - "step": 259530 - }, - { - "epoch": 0.91, - "learning_rate": 4.739342278274396e-06, - "loss": 2.3069, - "step": 259540 - }, - { - "epoch": 0.91, - "learning_rate": 4.737598398420743e-06, - "loss": 2.3542, - "step": 259550 - }, - { - "epoch": 0.91, - "learning_rate": 4.73585451856709e-06, - "loss": 2.3488, - "step": 259560 - }, - { - "epoch": 0.91, - "learning_rate": 4.7341106387134355e-06, - "loss": 2.3554, - "step": 259570 - }, - { - "epoch": 0.91, - "learning_rate": 4.732366758859782e-06, - "loss": 2.4161, - "step": 259580 - }, - { - "epoch": 0.91, - "learning_rate": 4.730622879006128e-06, - "loss": 2.2804, - "step": 259590 - }, - { - "epoch": 0.91, - "learning_rate": 4.728878999152475e-06, - "loss": 2.2962, - "step": 259600 - }, - { - "epoch": 0.91, - "learning_rate": 4.7271351192988206e-06, - "loss": 2.2666, - "step": 259610 - }, - { - "epoch": 0.91, - "learning_rate": 4.725391239445168e-06, - "loss": 2.4088, - "step": 259620 - }, - { - "epoch": 0.91, - "learning_rate": 4.723647359591514e-06, - "loss": 2.3121, - "step": 259630 - }, - { - "epoch": 0.91, - "learning_rate": 4.721903479737861e-06, - "loss": 2.3308, - "step": 259640 - }, - { - "epoch": 0.91, - "learning_rate": 4.7201595998842065e-06, - "loss": 2.4001, - "step": 259650 - }, - { - "epoch": 0.91, - "learning_rate": 4.718415720030553e-06, - "loss": 2.3412, - "step": 259660 - }, - { - "epoch": 0.91, - "learning_rate": 4.716671840176899e-06, - "loss": 2.3498, - "step": 259670 - }, - { - "epoch": 0.91, - "learning_rate": 4.714927960323246e-06, - "loss": 2.3205, - "step": 259680 - }, - { - "epoch": 0.91, - "learning_rate": 4.713184080469592e-06, - "loss": 2.2944, - "step": 259690 - }, - { - "epoch": 0.91, - "learning_rate": 4.711440200615939e-06, - "loss": 2.3969, - "step": 259700 - }, - { - "epoch": 0.91, - "learning_rate": 4.709696320762285e-06, - "loss": 2.3272, - "step": 259710 - }, - { - "epoch": 0.91, - "learning_rate": 4.707952440908632e-06, - "loss": 2.3603, - "step": 259720 - }, - { - "epoch": 0.91, - "learning_rate": 4.7062085610549775e-06, - "loss": 2.3677, - "step": 259730 - }, - { - "epoch": 0.91, - "learning_rate": 4.704464681201324e-06, - "loss": 2.3242, - "step": 259740 - }, - { - "epoch": 0.91, - "learning_rate": 4.702720801347671e-06, - "loss": 2.2827, - "step": 259750 - }, - { - "epoch": 0.91, - "learning_rate": 4.7009769214940176e-06, - "loss": 2.3236, - "step": 259760 - }, - { - "epoch": 0.91, - "learning_rate": 4.699233041640363e-06, - "loss": 2.3765, - "step": 259770 - }, - { - "epoch": 0.91, - "learning_rate": 4.69748916178671e-06, - "loss": 2.3749, - "step": 259780 - }, - { - "epoch": 0.91, - "learning_rate": 4.695745281933056e-06, - "loss": 2.3496, - "step": 259790 - }, - { - "epoch": 0.91, - "learning_rate": 4.694001402079403e-06, - "loss": 2.3346, - "step": 259800 - }, - { - "epoch": 0.91, - "learning_rate": 4.6922575222257485e-06, - "loss": 2.3113, - "step": 259810 - }, - { - "epoch": 0.91, - "learning_rate": 4.690513642372096e-06, - "loss": 2.3166, - "step": 259820 - }, - { - "epoch": 0.91, - "learning_rate": 4.688769762518442e-06, - "loss": 2.328, - "step": 259830 - }, - { - "epoch": 0.91, - "learning_rate": 4.6870258826647886e-06, - "loss": 2.3098, - "step": 259840 - }, - { - "epoch": 0.91, - "learning_rate": 4.685282002811134e-06, - "loss": 2.3288, - "step": 259850 - }, - { - "epoch": 0.91, - "learning_rate": 4.683538122957481e-06, - "loss": 2.3503, - "step": 259860 - }, - { - "epoch": 0.91, - "learning_rate": 4.681794243103827e-06, - "loss": 2.3199, - "step": 259870 - }, - { - "epoch": 0.91, - "learning_rate": 4.680050363250174e-06, - "loss": 2.2534, - "step": 259880 - }, - { - "epoch": 0.91, - "learning_rate": 4.67830648339652e-06, - "loss": 2.3125, - "step": 259890 - }, - { - "epoch": 0.91, - "learning_rate": 4.676562603542867e-06, - "loss": 2.3054, - "step": 259900 - }, - { - "epoch": 0.91, - "learning_rate": 4.674818723689213e-06, - "loss": 2.3888, - "step": 259910 - }, - { - "epoch": 0.91, - "learning_rate": 4.6730748438355596e-06, - "loss": 2.304, - "step": 259920 - }, - { - "epoch": 0.91, - "learning_rate": 4.671330963981905e-06, - "loss": 2.3118, - "step": 259930 - }, - { - "epoch": 0.91, - "learning_rate": 4.669587084128252e-06, - "loss": 2.3723, - "step": 259940 - }, - { - "epoch": 0.91, - "learning_rate": 4.667843204274599e-06, - "loss": 2.3158, - "step": 259950 - }, - { - "epoch": 0.91, - "learning_rate": 4.6660993244209455e-06, - "loss": 2.4279, - "step": 259960 - }, - { - "epoch": 0.91, - "learning_rate": 4.664355444567291e-06, - "loss": 2.3485, - "step": 259970 - }, - { - "epoch": 0.91, - "learning_rate": 4.662611564713638e-06, - "loss": 2.3773, - "step": 259980 - }, - { - "epoch": 0.91, - "learning_rate": 4.660867684859984e-06, - "loss": 2.3709, - "step": 259990 - }, - { - "epoch": 0.91, - "learning_rate": 4.6591238050063306e-06, - "loss": 2.3385, - "step": 260000 - }, - { - "epoch": 0.91, - "learning_rate": 4.657379925152676e-06, - "loss": 2.3604, - "step": 260010 - }, - { - "epoch": 0.91, - "learning_rate": 4.655636045299024e-06, - "loss": 2.3301, - "step": 260020 - }, - { - "epoch": 0.91, - "learning_rate": 4.65389216544537e-06, - "loss": 2.4516, - "step": 260030 - }, - { - "epoch": 0.91, - "learning_rate": 4.6521482855917165e-06, - "loss": 2.2742, - "step": 260040 - }, - { - "epoch": 0.91, - "learning_rate": 4.650404405738062e-06, - "loss": 2.3722, - "step": 260050 - }, - { - "epoch": 0.91, - "learning_rate": 4.648660525884409e-06, - "loss": 2.2697, - "step": 260060 - }, - { - "epoch": 0.91, - "learning_rate": 4.646916646030755e-06, - "loss": 2.2789, - "step": 260070 - }, - { - "epoch": 0.91, - "learning_rate": 4.6451727661771016e-06, - "loss": 2.4295, - "step": 260080 - }, - { - "epoch": 0.91, - "learning_rate": 4.643428886323448e-06, - "loss": 2.3495, - "step": 260090 - }, - { - "epoch": 0.91, - "learning_rate": 4.641685006469795e-06, - "loss": 2.3177, - "step": 260100 - }, - { - "epoch": 0.91, - "learning_rate": 4.639941126616141e-06, - "loss": 2.3613, - "step": 260110 - }, - { - "epoch": 0.91, - "learning_rate": 4.6381972467624875e-06, - "loss": 2.32, - "step": 260120 - }, - { - "epoch": 0.91, - "learning_rate": 4.636453366908833e-06, - "loss": 2.3605, - "step": 260130 - }, - { - "epoch": 0.91, - "learning_rate": 4.63470948705518e-06, - "loss": 2.3197, - "step": 260140 - }, - { - "epoch": 0.91, - "learning_rate": 4.632965607201527e-06, - "loss": 2.3776, - "step": 260150 - }, - { - "epoch": 0.91, - "learning_rate": 4.631221727347873e-06, - "loss": 2.2885, - "step": 260160 - }, - { - "epoch": 0.91, - "learning_rate": 4.629477847494219e-06, - "loss": 2.3737, - "step": 260170 - }, - { - "epoch": 0.91, - "learning_rate": 4.627733967640566e-06, - "loss": 2.3868, - "step": 260180 - }, - { - "epoch": 0.91, - "learning_rate": 4.625990087786912e-06, - "loss": 2.379, - "step": 260190 - }, - { - "epoch": 0.91, - "learning_rate": 4.6242462079332585e-06, - "loss": 2.3408, - "step": 260200 - }, - { - "epoch": 0.91, - "learning_rate": 4.622502328079604e-06, - "loss": 2.4198, - "step": 260210 - }, - { - "epoch": 0.91, - "learning_rate": 4.620758448225952e-06, - "loss": 2.3695, - "step": 260220 - }, - { - "epoch": 0.91, - "learning_rate": 4.619014568372298e-06, - "loss": 2.3107, - "step": 260230 - }, - { - "epoch": 0.91, - "learning_rate": 4.617270688518644e-06, - "loss": 2.3492, - "step": 260240 - }, - { - "epoch": 0.91, - "learning_rate": 4.61552680866499e-06, - "loss": 2.3099, - "step": 260250 - }, - { - "epoch": 0.91, - "learning_rate": 4.613782928811337e-06, - "loss": 2.2823, - "step": 260260 - }, - { - "epoch": 0.91, - "learning_rate": 4.612039048957683e-06, - "loss": 2.3248, - "step": 260270 - }, - { - "epoch": 0.91, - "learning_rate": 4.61029516910403e-06, - "loss": 2.2684, - "step": 260280 - }, - { - "epoch": 0.91, - "learning_rate": 4.608551289250376e-06, - "loss": 2.2762, - "step": 260290 - }, - { - "epoch": 0.91, - "learning_rate": 4.606807409396723e-06, - "loss": 2.4043, - "step": 260300 - }, - { - "epoch": 0.91, - "learning_rate": 4.605063529543069e-06, - "loss": 2.3057, - "step": 260310 - }, - { - "epoch": 0.91, - "learning_rate": 4.603319649689415e-06, - "loss": 2.3005, - "step": 260320 - }, - { - "epoch": 0.91, - "learning_rate": 4.601575769835761e-06, - "loss": 2.4019, - "step": 260330 - }, - { - "epoch": 0.91, - "learning_rate": 4.599831889982108e-06, - "loss": 2.3825, - "step": 260340 - }, - { - "epoch": 0.91, - "learning_rate": 4.598088010128455e-06, - "loss": 2.3293, - "step": 260350 - }, - { - "epoch": 0.91, - "learning_rate": 4.596344130274801e-06, - "loss": 2.3561, - "step": 260360 - }, - { - "epoch": 0.91, - "learning_rate": 4.594600250421147e-06, - "loss": 2.357, - "step": 260370 - }, - { - "epoch": 0.91, - "learning_rate": 4.592856370567494e-06, - "loss": 2.364, - "step": 260380 - }, - { - "epoch": 0.91, - "learning_rate": 4.59111249071384e-06, - "loss": 2.3269, - "step": 260390 - }, - { - "epoch": 0.91, - "learning_rate": 4.589368610860186e-06, - "loss": 2.2807, - "step": 260400 - }, - { - "epoch": 0.91, - "learning_rate": 4.587624731006532e-06, - "loss": 2.3327, - "step": 260410 - }, - { - "epoch": 0.91, - "learning_rate": 4.58588085115288e-06, - "loss": 2.4024, - "step": 260420 - }, - { - "epoch": 0.91, - "learning_rate": 4.584136971299226e-06, - "loss": 2.3821, - "step": 260430 - }, - { - "epoch": 0.91, - "learning_rate": 4.582393091445572e-06, - "loss": 2.3248, - "step": 260440 - }, - { - "epoch": 0.91, - "learning_rate": 4.580649211591918e-06, - "loss": 2.3765, - "step": 260450 - }, - { - "epoch": 0.91, - "learning_rate": 4.578905331738265e-06, - "loss": 2.3548, - "step": 260460 - }, - { - "epoch": 0.91, - "learning_rate": 4.577161451884611e-06, - "loss": 2.3307, - "step": 260470 - }, - { - "epoch": 0.91, - "learning_rate": 4.575417572030958e-06, - "loss": 2.342, - "step": 260480 - }, - { - "epoch": 0.91, - "learning_rate": 4.573673692177304e-06, - "loss": 2.2877, - "step": 260490 - }, - { - "epoch": 0.91, - "learning_rate": 4.571929812323651e-06, - "loss": 2.4089, - "step": 260500 - }, - { - "epoch": 0.91, - "learning_rate": 4.570185932469997e-06, - "loss": 2.304, - "step": 260510 - }, - { - "epoch": 0.91, - "learning_rate": 4.568442052616343e-06, - "loss": 2.3102, - "step": 260520 - }, - { - "epoch": 0.91, - "learning_rate": 4.566698172762689e-06, - "loss": 2.3569, - "step": 260530 - }, - { - "epoch": 0.91, - "learning_rate": 4.564954292909036e-06, - "loss": 2.252, - "step": 260540 - }, - { - "epoch": 0.91, - "learning_rate": 4.563210413055383e-06, - "loss": 2.35, - "step": 260550 - }, - { - "epoch": 0.91, - "learning_rate": 4.561466533201729e-06, - "loss": 2.378, - "step": 260560 - }, - { - "epoch": 0.91, - "learning_rate": 4.559722653348075e-06, - "loss": 2.4026, - "step": 260570 - }, - { - "epoch": 0.91, - "learning_rate": 4.557978773494422e-06, - "loss": 2.3163, - "step": 260580 - }, - { - "epoch": 0.91, - "learning_rate": 4.556234893640768e-06, - "loss": 2.3541, - "step": 260590 - }, - { - "epoch": 0.91, - "learning_rate": 4.554491013787114e-06, - "loss": 2.391, - "step": 260600 - }, - { - "epoch": 0.91, - "learning_rate": 4.55274713393346e-06, - "loss": 2.3464, - "step": 260610 - }, - { - "epoch": 0.91, - "learning_rate": 4.551003254079808e-06, - "loss": 2.3818, - "step": 260620 - }, - { - "epoch": 0.91, - "learning_rate": 4.549259374226154e-06, - "loss": 2.3796, - "step": 260630 - }, - { - "epoch": 0.91, - "learning_rate": 4.5475154943725e-06, - "loss": 2.3831, - "step": 260640 - }, - { - "epoch": 0.91, - "learning_rate": 4.545771614518846e-06, - "loss": 2.3433, - "step": 260650 - }, - { - "epoch": 0.91, - "learning_rate": 4.544027734665193e-06, - "loss": 2.3453, - "step": 260660 - }, - { - "epoch": 0.91, - "learning_rate": 4.542283854811539e-06, - "loss": 2.311, - "step": 260670 - }, - { - "epoch": 0.91, - "learning_rate": 4.540539974957886e-06, - "loss": 2.3437, - "step": 260680 - }, - { - "epoch": 0.91, - "learning_rate": 4.538796095104232e-06, - "loss": 2.3625, - "step": 260690 - }, - { - "epoch": 0.91, - "learning_rate": 4.537052215250579e-06, - "loss": 2.3099, - "step": 260700 - }, - { - "epoch": 0.91, - "learning_rate": 4.535308335396925e-06, - "loss": 2.3377, - "step": 260710 - }, - { - "epoch": 0.91, - "learning_rate": 4.533564455543271e-06, - "loss": 2.2412, - "step": 260720 - }, - { - "epoch": 0.91, - "learning_rate": 4.531820575689617e-06, - "loss": 2.324, - "step": 260730 - }, - { - "epoch": 0.91, - "learning_rate": 4.530076695835964e-06, - "loss": 2.3278, - "step": 260740 - }, - { - "epoch": 0.91, - "learning_rate": 4.5283328159823105e-06, - "loss": 2.3289, - "step": 260750 - }, - { - "epoch": 0.91, - "learning_rate": 4.526588936128657e-06, - "loss": 2.3259, - "step": 260760 - }, - { - "epoch": 0.91, - "learning_rate": 4.524845056275003e-06, - "loss": 2.3945, - "step": 260770 - }, - { - "epoch": 0.91, - "learning_rate": 4.52310117642135e-06, - "loss": 2.3433, - "step": 260780 - }, - { - "epoch": 0.91, - "learning_rate": 4.521357296567696e-06, - "loss": 2.3382, - "step": 260790 - }, - { - "epoch": 0.91, - "learning_rate": 4.519613416714042e-06, - "loss": 2.4201, - "step": 260800 - }, - { - "epoch": 0.91, - "learning_rate": 4.517869536860388e-06, - "loss": 2.3666, - "step": 260810 - }, - { - "epoch": 0.91, - "learning_rate": 4.516125657006736e-06, - "loss": 2.3214, - "step": 260820 - }, - { - "epoch": 0.91, - "learning_rate": 4.5143817771530815e-06, - "loss": 2.2794, - "step": 260830 - }, - { - "epoch": 0.91, - "learning_rate": 4.512637897299428e-06, - "loss": 2.357, - "step": 260840 - }, - { - "epoch": 0.91, - "learning_rate": 4.510894017445774e-06, - "loss": 2.3853, - "step": 260850 - }, - { - "epoch": 0.91, - "learning_rate": 4.509150137592121e-06, - "loss": 2.3714, - "step": 260860 - }, - { - "epoch": 0.91, - "learning_rate": 4.507406257738467e-06, - "loss": 2.3579, - "step": 260870 - }, - { - "epoch": 0.91, - "learning_rate": 4.505662377884814e-06, - "loss": 2.313, - "step": 260880 - }, - { - "epoch": 0.91, - "learning_rate": 4.50391849803116e-06, - "loss": 2.313, - "step": 260890 - }, - { - "epoch": 0.91, - "learning_rate": 4.502174618177507e-06, - "loss": 2.3379, - "step": 260900 - }, - { - "epoch": 0.91, - "learning_rate": 4.5004307383238525e-06, - "loss": 2.3111, - "step": 260910 - }, - { - "epoch": 0.91, - "learning_rate": 4.498686858470199e-06, - "loss": 2.3886, - "step": 260920 - }, - { - "epoch": 0.91, - "learning_rate": 4.496942978616545e-06, - "loss": 2.3052, - "step": 260930 - }, - { - "epoch": 0.91, - "learning_rate": 4.495199098762892e-06, - "loss": 2.3363, - "step": 260940 - }, - { - "epoch": 0.91, - "learning_rate": 4.4934552189092384e-06, - "loss": 2.3539, - "step": 260950 - }, - { - "epoch": 0.91, - "learning_rate": 4.491711339055585e-06, - "loss": 2.4119, - "step": 260960 - }, - { - "epoch": 0.91, - "learning_rate": 4.489967459201931e-06, - "loss": 2.4119, - "step": 260970 - }, - { - "epoch": 0.91, - "learning_rate": 4.488223579348278e-06, - "loss": 2.3076, - "step": 260980 - }, - { - "epoch": 0.91, - "learning_rate": 4.4864796994946235e-06, - "loss": 2.3235, - "step": 260990 - }, - { - "epoch": 0.91, - "learning_rate": 4.48473581964097e-06, - "loss": 2.3114, - "step": 261000 - }, - { - "epoch": 0.91, - "learning_rate": 4.482991939787316e-06, - "loss": 2.3767, - "step": 261010 - }, - { - "epoch": 0.91, - "learning_rate": 4.481248059933664e-06, - "loss": 2.3676, - "step": 261020 - }, - { - "epoch": 0.91, - "learning_rate": 4.4795041800800094e-06, - "loss": 2.3877, - "step": 261030 - }, - { - "epoch": 0.91, - "learning_rate": 4.477760300226356e-06, - "loss": 2.3391, - "step": 261040 - }, - { - "epoch": 0.91, - "learning_rate": 4.476016420372702e-06, - "loss": 2.3292, - "step": 261050 - }, - { - "epoch": 0.91, - "learning_rate": 4.474272540519049e-06, - "loss": 2.3391, - "step": 261060 - }, - { - "epoch": 0.91, - "learning_rate": 4.4725286606653945e-06, - "loss": 2.3339, - "step": 261070 - }, - { - "epoch": 0.91, - "learning_rate": 4.470784780811742e-06, - "loss": 2.315, - "step": 261080 - }, - { - "epoch": 0.91, - "learning_rate": 4.469040900958088e-06, - "loss": 2.4257, - "step": 261090 - }, - { - "epoch": 0.91, - "learning_rate": 4.467297021104435e-06, - "loss": 2.4444, - "step": 261100 - }, - { - "epoch": 0.91, - "learning_rate": 4.4655531412507804e-06, - "loss": 2.3276, - "step": 261110 - }, - { - "epoch": 0.91, - "learning_rate": 4.463809261397127e-06, - "loss": 2.3242, - "step": 261120 - }, - { - "epoch": 0.91, - "learning_rate": 4.462065381543473e-06, - "loss": 2.3685, - "step": 261130 - }, - { - "epoch": 0.91, - "learning_rate": 4.46032150168982e-06, - "loss": 2.3212, - "step": 261140 - }, - { - "epoch": 0.91, - "learning_rate": 4.458577621836166e-06, - "loss": 2.2812, - "step": 261150 - }, - { - "epoch": 0.91, - "learning_rate": 4.456833741982513e-06, - "loss": 2.3493, - "step": 261160 - }, - { - "epoch": 0.91, - "learning_rate": 4.455089862128859e-06, - "loss": 2.3546, - "step": 261170 - }, - { - "epoch": 0.91, - "learning_rate": 4.453345982275206e-06, - "loss": 2.3377, - "step": 261180 - }, - { - "epoch": 0.91, - "learning_rate": 4.4516021024215514e-06, - "loss": 2.3374, - "step": 261190 - }, - { - "epoch": 0.91, - "learning_rate": 4.449858222567898e-06, - "loss": 2.3196, - "step": 261200 - }, - { - "epoch": 0.91, - "learning_rate": 4.448114342714244e-06, - "loss": 2.3462, - "step": 261210 - }, - { - "epoch": 0.91, - "learning_rate": 4.4463704628605915e-06, - "loss": 2.298, - "step": 261220 - }, - { - "epoch": 0.91, - "learning_rate": 4.444626583006937e-06, - "loss": 2.3123, - "step": 261230 - }, - { - "epoch": 0.91, - "learning_rate": 4.442882703153284e-06, - "loss": 2.2913, - "step": 261240 - }, - { - "epoch": 0.91, - "learning_rate": 4.44113882329963e-06, - "loss": 2.4587, - "step": 261250 - }, - { - "epoch": 0.91, - "learning_rate": 4.439394943445977e-06, - "loss": 2.3478, - "step": 261260 - }, - { - "epoch": 0.91, - "learning_rate": 4.4376510635923224e-06, - "loss": 2.4092, - "step": 261270 - }, - { - "epoch": 0.91, - "learning_rate": 4.43590718373867e-06, - "loss": 2.2167, - "step": 261280 - }, - { - "epoch": 0.91, - "learning_rate": 4.434163303885016e-06, - "loss": 2.3615, - "step": 261290 - }, - { - "epoch": 0.91, - "learning_rate": 4.4324194240313625e-06, - "loss": 2.3824, - "step": 261300 - }, - { - "epoch": 0.91, - "learning_rate": 4.430675544177708e-06, - "loss": 2.3713, - "step": 261310 - }, - { - "epoch": 0.91, - "learning_rate": 4.428931664324055e-06, - "loss": 2.276, - "step": 261320 - }, - { - "epoch": 0.91, - "learning_rate": 4.427187784470401e-06, - "loss": 2.4067, - "step": 261330 - }, - { - "epoch": 0.91, - "learning_rate": 4.425443904616748e-06, - "loss": 2.3517, - "step": 261340 - }, - { - "epoch": 0.91, - "learning_rate": 4.423700024763094e-06, - "loss": 2.4016, - "step": 261350 - }, - { - "epoch": 0.91, - "learning_rate": 4.421956144909441e-06, - "loss": 2.2991, - "step": 261360 - }, - { - "epoch": 0.91, - "learning_rate": 4.420212265055787e-06, - "loss": 2.4047, - "step": 261370 - }, - { - "epoch": 0.91, - "learning_rate": 4.4184683852021335e-06, - "loss": 2.3304, - "step": 261380 - }, - { - "epoch": 0.91, - "learning_rate": 4.416724505348479e-06, - "loss": 2.3652, - "step": 261390 - }, - { - "epoch": 0.91, - "learning_rate": 4.414980625494826e-06, - "loss": 2.298, - "step": 261400 - }, - { - "epoch": 0.91, - "learning_rate": 4.413236745641172e-06, - "loss": 2.2839, - "step": 261410 - }, - { - "epoch": 0.91, - "learning_rate": 4.4114928657875194e-06, - "loss": 2.3403, - "step": 261420 - }, - { - "epoch": 0.91, - "learning_rate": 4.409748985933865e-06, - "loss": 2.3475, - "step": 261430 - }, - { - "epoch": 0.91, - "learning_rate": 4.408005106080212e-06, - "loss": 2.354, - "step": 261440 - }, - { - "epoch": 0.91, - "learning_rate": 4.406261226226558e-06, - "loss": 2.3663, - "step": 261450 - }, - { - "epoch": 0.91, - "learning_rate": 4.4045173463729045e-06, - "loss": 2.3451, - "step": 261460 - }, - { - "epoch": 0.91, - "learning_rate": 4.40277346651925e-06, - "loss": 2.3453, - "step": 261470 - }, - { - "epoch": 0.91, - "learning_rate": 4.401029586665598e-06, - "loss": 2.2611, - "step": 261480 - }, - { - "epoch": 0.91, - "learning_rate": 4.399285706811944e-06, - "loss": 2.3622, - "step": 261490 - }, - { - "epoch": 0.91, - "learning_rate": 4.3975418269582904e-06, - "loss": 2.3723, - "step": 261500 - }, - { - "epoch": 0.91, - "learning_rate": 4.395797947104636e-06, - "loss": 2.405, - "step": 261510 - }, - { - "epoch": 0.91, - "learning_rate": 4.394054067250983e-06, - "loss": 2.3213, - "step": 261520 - }, - { - "epoch": 0.91, - "learning_rate": 4.392310187397329e-06, - "loss": 2.3396, - "step": 261530 - }, - { - "epoch": 0.91, - "learning_rate": 4.3905663075436755e-06, - "loss": 2.3476, - "step": 261540 - }, - { - "epoch": 0.91, - "learning_rate": 4.388822427690022e-06, - "loss": 2.2973, - "step": 261550 - }, - { - "epoch": 0.91, - "learning_rate": 4.387078547836369e-06, - "loss": 2.3766, - "step": 261560 - }, - { - "epoch": 0.91, - "learning_rate": 4.385334667982715e-06, - "loss": 2.3364, - "step": 261570 - }, - { - "epoch": 0.91, - "learning_rate": 4.3835907881290614e-06, - "loss": 2.3679, - "step": 261580 - }, - { - "epoch": 0.91, - "learning_rate": 4.381846908275407e-06, - "loss": 2.3401, - "step": 261590 - }, - { - "epoch": 0.91, - "learning_rate": 4.380103028421754e-06, - "loss": 2.2747, - "step": 261600 - }, - { - "epoch": 0.91, - "learning_rate": 4.3783591485681e-06, - "loss": 2.3274, - "step": 261610 - }, - { - "epoch": 0.91, - "learning_rate": 4.376615268714447e-06, - "loss": 2.31, - "step": 261620 - }, - { - "epoch": 0.91, - "learning_rate": 4.374871388860793e-06, - "loss": 2.2706, - "step": 261630 - }, - { - "epoch": 0.91, - "learning_rate": 4.37312750900714e-06, - "loss": 2.3479, - "step": 261640 - }, - { - "epoch": 0.91, - "learning_rate": 4.371383629153486e-06, - "loss": 2.3413, - "step": 261650 - }, - { - "epoch": 0.91, - "learning_rate": 4.3696397492998324e-06, - "loss": 2.3022, - "step": 261660 - }, - { - "epoch": 0.91, - "learning_rate": 4.367895869446178e-06, - "loss": 2.3131, - "step": 261670 - }, - { - "epoch": 0.91, - "learning_rate": 4.366151989592526e-06, - "loss": 2.3363, - "step": 261680 - }, - { - "epoch": 0.91, - "learning_rate": 4.364408109738872e-06, - "loss": 2.2983, - "step": 261690 - }, - { - "epoch": 0.91, - "learning_rate": 4.362664229885218e-06, - "loss": 2.3433, - "step": 261700 - }, - { - "epoch": 0.91, - "learning_rate": 4.360920350031564e-06, - "loss": 2.273, - "step": 261710 - }, - { - "epoch": 0.91, - "learning_rate": 4.359176470177911e-06, - "loss": 2.3276, - "step": 261720 - }, - { - "epoch": 0.91, - "learning_rate": 4.357432590324257e-06, - "loss": 2.353, - "step": 261730 - }, - { - "epoch": 0.91, - "learning_rate": 4.3556887104706034e-06, - "loss": 2.393, - "step": 261740 - }, - { - "epoch": 0.91, - "learning_rate": 4.35394483061695e-06, - "loss": 2.3849, - "step": 261750 - }, - { - "epoch": 0.91, - "learning_rate": 4.352200950763297e-06, - "loss": 2.381, - "step": 261760 - }, - { - "epoch": 0.91, - "learning_rate": 4.350457070909643e-06, - "loss": 2.2692, - "step": 261770 - }, - { - "epoch": 0.91, - "learning_rate": 4.348713191055989e-06, - "loss": 2.3841, - "step": 261780 - }, - { - "epoch": 0.91, - "learning_rate": 4.346969311202335e-06, - "loss": 2.4188, - "step": 261790 - }, - { - "epoch": 0.91, - "learning_rate": 4.345225431348682e-06, - "loss": 2.3197, - "step": 261800 - }, - { - "epoch": 0.91, - "learning_rate": 4.343481551495029e-06, - "loss": 2.3346, - "step": 261810 - }, - { - "epoch": 0.91, - "learning_rate": 4.341737671641375e-06, - "loss": 2.2451, - "step": 261820 - }, - { - "epoch": 0.91, - "learning_rate": 4.339993791787721e-06, - "loss": 2.3623, - "step": 261830 - }, - { - "epoch": 0.91, - "learning_rate": 4.338249911934068e-06, - "loss": 2.304, - "step": 261840 - }, - { - "epoch": 0.91, - "learning_rate": 4.336506032080414e-06, - "loss": 2.2794, - "step": 261850 - }, - { - "epoch": 0.91, - "learning_rate": 4.33476215222676e-06, - "loss": 2.2622, - "step": 261860 - }, - { - "epoch": 0.91, - "learning_rate": 4.333018272373106e-06, - "loss": 2.3138, - "step": 261870 - }, - { - "epoch": 0.91, - "learning_rate": 4.331274392519454e-06, - "loss": 2.3613, - "step": 261880 - }, - { - "epoch": 0.91, - "learning_rate": 4.3295305126658e-06, - "loss": 2.2685, - "step": 261890 - }, - { - "epoch": 0.91, - "learning_rate": 4.327786632812146e-06, - "loss": 2.4418, - "step": 261900 - }, - { - "epoch": 0.91, - "learning_rate": 4.326042752958492e-06, - "loss": 2.2911, - "step": 261910 - }, - { - "epoch": 0.91, - "learning_rate": 4.324298873104839e-06, - "loss": 2.3926, - "step": 261920 - }, - { - "epoch": 0.91, - "learning_rate": 4.322554993251185e-06, - "loss": 2.3643, - "step": 261930 - }, - { - "epoch": 0.91, - "learning_rate": 4.320811113397531e-06, - "loss": 2.3188, - "step": 261940 - }, - { - "epoch": 0.91, - "learning_rate": 4.319067233543878e-06, - "loss": 2.3055, - "step": 261950 - }, - { - "epoch": 0.91, - "learning_rate": 4.317323353690225e-06, - "loss": 2.2993, - "step": 261960 - }, - { - "epoch": 0.91, - "learning_rate": 4.315579473836571e-06, - "loss": 2.3079, - "step": 261970 - }, - { - "epoch": 0.91, - "learning_rate": 4.313835593982917e-06, - "loss": 2.3523, - "step": 261980 - }, - { - "epoch": 0.91, - "learning_rate": 4.312091714129263e-06, - "loss": 2.426, - "step": 261990 - }, - { - "epoch": 0.91, - "learning_rate": 4.31034783427561e-06, - "loss": 2.3084, - "step": 262000 - }, - { - "epoch": 0.91, - "learning_rate": 4.3086039544219565e-06, - "loss": 2.2874, - "step": 262010 - }, - { - "epoch": 0.91, - "learning_rate": 4.306860074568303e-06, - "loss": 2.3822, - "step": 262020 - }, - { - "epoch": 0.91, - "learning_rate": 4.305116194714649e-06, - "loss": 2.3283, - "step": 262030 - }, - { - "epoch": 0.91, - "learning_rate": 4.303372314860996e-06, - "loss": 2.3627, - "step": 262040 - }, - { - "epoch": 0.91, - "learning_rate": 4.301628435007342e-06, - "loss": 2.3847, - "step": 262050 - }, - { - "epoch": 0.91, - "learning_rate": 4.299884555153688e-06, - "loss": 2.2688, - "step": 262060 - }, - { - "epoch": 0.91, - "learning_rate": 4.298140675300034e-06, - "loss": 2.2977, - "step": 262070 - }, - { - "epoch": 0.91, - "learning_rate": 4.296396795446382e-06, - "loss": 2.3685, - "step": 262080 - }, - { - "epoch": 0.91, - "learning_rate": 4.2946529155927275e-06, - "loss": 2.373, - "step": 262090 - }, - { - "epoch": 0.91, - "learning_rate": 4.292909035739074e-06, - "loss": 2.3827, - "step": 262100 - }, - { - "epoch": 0.91, - "learning_rate": 4.29116515588542e-06, - "loss": 2.3523, - "step": 262110 - }, - { - "epoch": 0.91, - "learning_rate": 4.289421276031767e-06, - "loss": 2.3233, - "step": 262120 - }, - { - "epoch": 0.91, - "learning_rate": 4.287677396178113e-06, - "loss": 2.3269, - "step": 262130 - }, - { - "epoch": 0.91, - "learning_rate": 4.285933516324459e-06, - "loss": 2.3678, - "step": 262140 - }, - { - "epoch": 0.91, - "learning_rate": 4.284189636470806e-06, - "loss": 2.4086, - "step": 262150 - }, - { - "epoch": 0.91, - "learning_rate": 4.282445756617153e-06, - "loss": 2.2079, - "step": 262160 - }, - { - "epoch": 0.91, - "learning_rate": 4.2807018767634985e-06, - "loss": 2.3446, - "step": 262170 - }, - { - "epoch": 0.91, - "learning_rate": 4.278957996909845e-06, - "loss": 2.3763, - "step": 262180 - }, - { - "epoch": 0.91, - "learning_rate": 4.277214117056191e-06, - "loss": 2.3336, - "step": 262190 - }, - { - "epoch": 0.91, - "learning_rate": 4.275470237202538e-06, - "loss": 2.3154, - "step": 262200 - }, - { - "epoch": 0.91, - "learning_rate": 4.2737263573488845e-06, - "loss": 2.278, - "step": 262210 - }, - { - "epoch": 0.91, - "learning_rate": 4.271982477495231e-06, - "loss": 2.2952, - "step": 262220 - }, - { - "epoch": 0.91, - "learning_rate": 4.270238597641577e-06, - "loss": 2.3589, - "step": 262230 - }, - { - "epoch": 0.91, - "learning_rate": 4.268494717787924e-06, - "loss": 2.349, - "step": 262240 - }, - { - "epoch": 0.91, - "learning_rate": 4.2667508379342695e-06, - "loss": 2.362, - "step": 262250 - }, - { - "epoch": 0.91, - "learning_rate": 4.265006958080616e-06, - "loss": 2.3746, - "step": 262260 - }, - { - "epoch": 0.91, - "learning_rate": 4.263263078226962e-06, - "loss": 2.3487, - "step": 262270 - }, - { - "epoch": 0.91, - "learning_rate": 4.26151919837331e-06, - "loss": 2.3763, - "step": 262280 - }, - { - "epoch": 0.91, - "learning_rate": 4.2597753185196555e-06, - "loss": 2.4307, - "step": 262290 - }, - { - "epoch": 0.91, - "learning_rate": 4.258031438666002e-06, - "loss": 2.3624, - "step": 262300 - }, - { - "epoch": 0.91, - "learning_rate": 4.256287558812348e-06, - "loss": 2.2976, - "step": 262310 - }, - { - "epoch": 0.91, - "learning_rate": 4.254543678958695e-06, - "loss": 2.3364, - "step": 262320 - }, - { - "epoch": 0.91, - "learning_rate": 4.2527997991050405e-06, - "loss": 2.3508, - "step": 262330 - }, - { - "epoch": 0.91, - "learning_rate": 4.251055919251387e-06, - "loss": 2.3981, - "step": 262340 - }, - { - "epoch": 0.92, - "learning_rate": 4.249312039397734e-06, - "loss": 2.295, - "step": 262350 - }, - { - "epoch": 0.92, - "learning_rate": 4.247568159544081e-06, - "loss": 2.2969, - "step": 262360 - }, - { - "epoch": 0.92, - "learning_rate": 4.2458242796904265e-06, - "loss": 2.3194, - "step": 262370 - }, - { - "epoch": 0.92, - "learning_rate": 4.244080399836773e-06, - "loss": 2.3122, - "step": 262380 - }, - { - "epoch": 0.92, - "learning_rate": 4.242336519983119e-06, - "loss": 2.3445, - "step": 262390 - }, - { - "epoch": 0.92, - "learning_rate": 4.240592640129466e-06, - "loss": 2.3949, - "step": 262400 - }, - { - "epoch": 0.92, - "learning_rate": 4.238848760275812e-06, - "loss": 2.3354, - "step": 262410 - }, - { - "epoch": 0.92, - "learning_rate": 4.237104880422159e-06, - "loss": 2.3003, - "step": 262420 - }, - { - "epoch": 0.92, - "learning_rate": 4.235361000568505e-06, - "loss": 2.3792, - "step": 262430 - }, - { - "epoch": 0.92, - "learning_rate": 4.233617120714852e-06, - "loss": 2.3225, - "step": 262440 - }, - { - "epoch": 0.92, - "learning_rate": 4.2318732408611975e-06, - "loss": 2.3339, - "step": 262450 - }, - { - "epoch": 0.92, - "learning_rate": 4.230129361007544e-06, - "loss": 2.2889, - "step": 262460 - }, - { - "epoch": 0.92, - "learning_rate": 4.22838548115389e-06, - "loss": 2.3707, - "step": 262470 - }, - { - "epoch": 0.92, - "learning_rate": 4.2266416013002375e-06, - "loss": 2.3939, - "step": 262480 - }, - { - "epoch": 0.92, - "learning_rate": 4.224897721446583e-06, - "loss": 2.2476, - "step": 262490 - }, - { - "epoch": 0.92, - "learning_rate": 4.22315384159293e-06, - "loss": 2.3301, - "step": 262500 - }, - { - "epoch": 0.92, - "learning_rate": 4.221409961739276e-06, - "loss": 2.3652, - "step": 262510 - }, - { - "epoch": 0.92, - "learning_rate": 4.219666081885623e-06, - "loss": 2.317, - "step": 262520 - }, - { - "epoch": 0.92, - "learning_rate": 4.2179222020319685e-06, - "loss": 2.3256, - "step": 262530 - }, - { - "epoch": 0.92, - "learning_rate": 4.216178322178315e-06, - "loss": 2.3805, - "step": 262540 - }, - { - "epoch": 0.92, - "learning_rate": 4.214434442324662e-06, - "loss": 2.3207, - "step": 262550 - }, - { - "epoch": 0.92, - "learning_rate": 4.2126905624710085e-06, - "loss": 2.3011, - "step": 262560 - }, - { - "epoch": 0.92, - "learning_rate": 4.210946682617354e-06, - "loss": 2.3197, - "step": 262570 - }, - { - "epoch": 0.92, - "learning_rate": 4.209202802763701e-06, - "loss": 2.3412, - "step": 262580 - }, - { - "epoch": 0.92, - "learning_rate": 4.207458922910047e-06, - "loss": 2.3246, - "step": 262590 - }, - { - "epoch": 0.92, - "learning_rate": 4.205715043056394e-06, - "loss": 2.4308, - "step": 262600 - }, - { - "epoch": 0.92, - "learning_rate": 4.20397116320274e-06, - "loss": 2.3343, - "step": 262610 - }, - { - "epoch": 0.92, - "learning_rate": 4.202227283349087e-06, - "loss": 2.2681, - "step": 262620 - }, - { - "epoch": 0.92, - "learning_rate": 4.200483403495433e-06, - "loss": 2.3522, - "step": 262630 - }, - { - "epoch": 0.92, - "learning_rate": 4.1987395236417795e-06, - "loss": 2.3777, - "step": 262640 - }, - { - "epoch": 0.92, - "learning_rate": 4.196995643788125e-06, - "loss": 2.2508, - "step": 262650 - }, - { - "epoch": 0.92, - "learning_rate": 4.195251763934472e-06, - "loss": 2.3712, - "step": 262660 - }, - { - "epoch": 0.92, - "learning_rate": 4.193507884080818e-06, - "loss": 2.2993, - "step": 262670 - }, - { - "epoch": 0.92, - "learning_rate": 4.1917640042271655e-06, - "loss": 2.343, - "step": 262680 - }, - { - "epoch": 0.92, - "learning_rate": 4.190020124373511e-06, - "loss": 2.3114, - "step": 262690 - }, - { - "epoch": 0.92, - "learning_rate": 4.188276244519858e-06, - "loss": 2.4111, - "step": 262700 - }, - { - "epoch": 0.92, - "learning_rate": 4.186532364666204e-06, - "loss": 2.3451, - "step": 262710 - }, - { - "epoch": 0.92, - "learning_rate": 4.1847884848125505e-06, - "loss": 2.3228, - "step": 262720 - }, - { - "epoch": 0.92, - "learning_rate": 4.183044604958896e-06, - "loss": 2.2874, - "step": 262730 - }, - { - "epoch": 0.92, - "learning_rate": 4.181300725105243e-06, - "loss": 2.3102, - "step": 262740 - }, - { - "epoch": 0.92, - "learning_rate": 4.17955684525159e-06, - "loss": 2.3469, - "step": 262750 - }, - { - "epoch": 0.92, - "learning_rate": 4.1778129653979365e-06, - "loss": 2.3682, - "step": 262760 - }, - { - "epoch": 0.92, - "learning_rate": 4.176069085544282e-06, - "loss": 2.3497, - "step": 262770 - }, - { - "epoch": 0.92, - "learning_rate": 4.174325205690629e-06, - "loss": 2.3546, - "step": 262780 - }, - { - "epoch": 0.92, - "learning_rate": 4.172581325836975e-06, - "loss": 2.4529, - "step": 262790 - }, - { - "epoch": 0.92, - "learning_rate": 4.1708374459833215e-06, - "loss": 2.2522, - "step": 262800 - }, - { - "epoch": 0.92, - "learning_rate": 4.169093566129668e-06, - "loss": 2.3059, - "step": 262810 - }, - { - "epoch": 0.92, - "learning_rate": 4.167349686276015e-06, - "loss": 2.4088, - "step": 262820 - }, - { - "epoch": 0.92, - "learning_rate": 4.165605806422361e-06, - "loss": 2.3307, - "step": 262830 - }, - { - "epoch": 0.92, - "learning_rate": 4.1638619265687075e-06, - "loss": 2.3656, - "step": 262840 - }, - { - "epoch": 0.92, - "learning_rate": 4.162118046715053e-06, - "loss": 2.3476, - "step": 262850 - }, - { - "epoch": 0.92, - "learning_rate": 4.1603741668614e-06, - "loss": 2.3334, - "step": 262860 - }, - { - "epoch": 0.92, - "learning_rate": 4.158630287007746e-06, - "loss": 2.2638, - "step": 262870 - }, - { - "epoch": 0.92, - "learning_rate": 4.156886407154093e-06, - "loss": 2.3666, - "step": 262880 - }, - { - "epoch": 0.92, - "learning_rate": 4.155142527300439e-06, - "loss": 2.3872, - "step": 262890 - }, - { - "epoch": 0.92, - "learning_rate": 4.153398647446786e-06, - "loss": 2.3207, - "step": 262900 - }, - { - "epoch": 0.92, - "learning_rate": 4.151654767593132e-06, - "loss": 2.3152, - "step": 262910 - }, - { - "epoch": 0.92, - "learning_rate": 4.1499108877394785e-06, - "loss": 2.3927, - "step": 262920 - }, - { - "epoch": 0.92, - "learning_rate": 4.148167007885824e-06, - "loss": 2.3011, - "step": 262930 - }, - { - "epoch": 0.92, - "learning_rate": 4.146423128032171e-06, - "loss": 2.3237, - "step": 262940 - }, - { - "epoch": 0.92, - "learning_rate": 4.144679248178518e-06, - "loss": 2.298, - "step": 262950 - }, - { - "epoch": 0.92, - "learning_rate": 4.142935368324864e-06, - "loss": 2.3313, - "step": 262960 - }, - { - "epoch": 0.92, - "learning_rate": 4.14119148847121e-06, - "loss": 2.3022, - "step": 262970 - }, - { - "epoch": 0.92, - "learning_rate": 4.139447608617557e-06, - "loss": 2.362, - "step": 262980 - }, - { - "epoch": 0.92, - "learning_rate": 4.137703728763903e-06, - "loss": 2.3583, - "step": 262990 - }, - { - "epoch": 0.92, - "learning_rate": 4.1359598489102495e-06, - "loss": 2.3251, - "step": 263000 - }, - { - "epoch": 0.92, - "learning_rate": 4.134215969056596e-06, - "loss": 2.3248, - "step": 263010 - }, - { - "epoch": 0.92, - "learning_rate": 4.132472089202943e-06, - "loss": 2.3606, - "step": 263020 - }, - { - "epoch": 0.92, - "learning_rate": 4.130728209349289e-06, - "loss": 2.3407, - "step": 263030 - }, - { - "epoch": 0.92, - "learning_rate": 4.128984329495635e-06, - "loss": 2.3262, - "step": 263040 - }, - { - "epoch": 0.92, - "learning_rate": 4.127240449641981e-06, - "loss": 2.2578, - "step": 263050 - }, - { - "epoch": 0.92, - "learning_rate": 4.125496569788328e-06, - "loss": 2.2956, - "step": 263060 - }, - { - "epoch": 0.92, - "learning_rate": 4.123752689934674e-06, - "loss": 2.2981, - "step": 263070 - }, - { - "epoch": 0.92, - "learning_rate": 4.122008810081021e-06, - "loss": 2.3968, - "step": 263080 - }, - { - "epoch": 0.92, - "learning_rate": 4.120264930227367e-06, - "loss": 2.369, - "step": 263090 - }, - { - "epoch": 0.92, - "learning_rate": 4.118521050373714e-06, - "loss": 2.3547, - "step": 263100 - }, - { - "epoch": 0.92, - "learning_rate": 4.11677717052006e-06, - "loss": 2.3972, - "step": 263110 - }, - { - "epoch": 0.92, - "learning_rate": 4.115033290666406e-06, - "loss": 2.337, - "step": 263120 - }, - { - "epoch": 0.92, - "learning_rate": 4.113289410812752e-06, - "loss": 2.3151, - "step": 263130 - }, - { - "epoch": 0.92, - "learning_rate": 4.1115455309591e-06, - "loss": 2.3547, - "step": 263140 - }, - { - "epoch": 0.92, - "learning_rate": 4.109801651105446e-06, - "loss": 2.2942, - "step": 263150 - }, - { - "epoch": 0.92, - "learning_rate": 4.108057771251792e-06, - "loss": 2.3708, - "step": 263160 - }, - { - "epoch": 0.92, - "learning_rate": 4.106313891398138e-06, - "loss": 2.3687, - "step": 263170 - }, - { - "epoch": 0.92, - "learning_rate": 4.104570011544485e-06, - "loss": 2.4522, - "step": 263180 - }, - { - "epoch": 0.92, - "learning_rate": 4.102826131690831e-06, - "loss": 2.323, - "step": 263190 - }, - { - "epoch": 0.92, - "learning_rate": 4.101082251837177e-06, - "loss": 2.4175, - "step": 263200 - }, - { - "epoch": 0.92, - "learning_rate": 4.099338371983524e-06, - "loss": 2.3018, - "step": 263210 - }, - { - "epoch": 0.92, - "learning_rate": 4.097594492129871e-06, - "loss": 2.3607, - "step": 263220 - }, - { - "epoch": 0.92, - "learning_rate": 4.095850612276217e-06, - "loss": 2.4167, - "step": 263230 - }, - { - "epoch": 0.92, - "learning_rate": 4.094106732422563e-06, - "loss": 2.3524, - "step": 263240 - }, - { - "epoch": 0.92, - "learning_rate": 4.092362852568909e-06, - "loss": 2.3222, - "step": 263250 - }, - { - "epoch": 0.92, - "learning_rate": 4.090618972715256e-06, - "loss": 2.2791, - "step": 263260 - }, - { - "epoch": 0.92, - "learning_rate": 4.088875092861602e-06, - "loss": 2.2899, - "step": 263270 - }, - { - "epoch": 0.92, - "learning_rate": 4.087131213007949e-06, - "loss": 2.3866, - "step": 263280 - }, - { - "epoch": 0.92, - "learning_rate": 4.085387333154295e-06, - "loss": 2.3387, - "step": 263290 - }, - { - "epoch": 0.92, - "learning_rate": 4.083643453300642e-06, - "loss": 2.3567, - "step": 263300 - }, - { - "epoch": 0.92, - "learning_rate": 4.081899573446988e-06, - "loss": 2.3763, - "step": 263310 - }, - { - "epoch": 0.92, - "learning_rate": 4.080155693593334e-06, - "loss": 2.2517, - "step": 263320 - }, - { - "epoch": 0.92, - "learning_rate": 4.07841181373968e-06, - "loss": 2.2759, - "step": 263330 - }, - { - "epoch": 0.92, - "learning_rate": 4.076667933886028e-06, - "loss": 2.364, - "step": 263340 - }, - { - "epoch": 0.92, - "learning_rate": 4.0749240540323736e-06, - "loss": 2.2959, - "step": 263350 - }, - { - "epoch": 0.92, - "learning_rate": 4.07318017417872e-06, - "loss": 2.323, - "step": 263360 - }, - { - "epoch": 0.92, - "learning_rate": 4.071436294325066e-06, - "loss": 2.4053, - "step": 263370 - }, - { - "epoch": 0.92, - "learning_rate": 4.069692414471413e-06, - "loss": 2.2993, - "step": 263380 - }, - { - "epoch": 0.92, - "learning_rate": 4.067948534617759e-06, - "loss": 2.3092, - "step": 263390 - }, - { - "epoch": 0.92, - "learning_rate": 4.066204654764105e-06, - "loss": 2.3892, - "step": 263400 - }, - { - "epoch": 0.92, - "learning_rate": 4.064460774910452e-06, - "loss": 2.3259, - "step": 263410 - }, - { - "epoch": 0.92, - "learning_rate": 4.062716895056799e-06, - "loss": 2.3431, - "step": 263420 - }, - { - "epoch": 0.92, - "learning_rate": 4.0609730152031446e-06, - "loss": 2.3555, - "step": 263430 - }, - { - "epoch": 0.92, - "learning_rate": 4.059229135349491e-06, - "loss": 2.2619, - "step": 263440 - }, - { - "epoch": 0.92, - "learning_rate": 4.057485255495837e-06, - "loss": 2.343, - "step": 263450 - }, - { - "epoch": 0.92, - "learning_rate": 4.055741375642184e-06, - "loss": 2.3969, - "step": 263460 - }, - { - "epoch": 0.92, - "learning_rate": 4.05399749578853e-06, - "loss": 2.3697, - "step": 263470 - }, - { - "epoch": 0.92, - "learning_rate": 4.052253615934877e-06, - "loss": 2.392, - "step": 263480 - }, - { - "epoch": 0.92, - "learning_rate": 4.050509736081223e-06, - "loss": 2.3866, - "step": 263490 - }, - { - "epoch": 0.92, - "learning_rate": 4.04876585622757e-06, - "loss": 2.3541, - "step": 263500 - }, - { - "epoch": 0.92, - "learning_rate": 4.0470219763739156e-06, - "loss": 2.4105, - "step": 263510 - }, - { - "epoch": 0.92, - "learning_rate": 4.045278096520262e-06, - "loss": 2.365, - "step": 263520 - }, - { - "epoch": 0.92, - "learning_rate": 4.043534216666608e-06, - "loss": 2.2937, - "step": 263530 - }, - { - "epoch": 0.92, - "learning_rate": 4.041790336812956e-06, - "loss": 2.301, - "step": 263540 - }, - { - "epoch": 0.92, - "learning_rate": 4.0400464569593015e-06, - "loss": 2.429, - "step": 263550 - }, - { - "epoch": 0.92, - "learning_rate": 4.038302577105648e-06, - "loss": 2.3045, - "step": 263560 - }, - { - "epoch": 0.92, - "learning_rate": 4.036558697251994e-06, - "loss": 2.3929, - "step": 263570 - }, - { - "epoch": 0.92, - "learning_rate": 4.034814817398341e-06, - "loss": 2.284, - "step": 263580 - }, - { - "epoch": 0.92, - "learning_rate": 4.0330709375446866e-06, - "loss": 2.3486, - "step": 263590 - }, - { - "epoch": 0.92, - "learning_rate": 4.031327057691033e-06, - "loss": 2.3002, - "step": 263600 - }, - { - "epoch": 0.92, - "learning_rate": 4.02958317783738e-06, - "loss": 2.379, - "step": 263610 - }, - { - "epoch": 0.92, - "learning_rate": 4.027839297983727e-06, - "loss": 2.3479, - "step": 263620 - }, - { - "epoch": 0.92, - "learning_rate": 4.0260954181300725e-06, - "loss": 2.3824, - "step": 263630 - }, - { - "epoch": 0.92, - "learning_rate": 4.024351538276419e-06, - "loss": 2.286, - "step": 263640 - }, - { - "epoch": 0.92, - "learning_rate": 4.022607658422765e-06, - "loss": 2.3857, - "step": 263650 - }, - { - "epoch": 0.92, - "learning_rate": 4.020863778569112e-06, - "loss": 2.2697, - "step": 263660 - }, - { - "epoch": 0.92, - "learning_rate": 4.0191198987154576e-06, - "loss": 2.3455, - "step": 263670 - }, - { - "epoch": 0.92, - "learning_rate": 4.017376018861805e-06, - "loss": 2.3881, - "step": 263680 - }, - { - "epoch": 0.92, - "learning_rate": 4.015632139008151e-06, - "loss": 2.3679, - "step": 263690 - }, - { - "epoch": 0.92, - "learning_rate": 4.013888259154498e-06, - "loss": 2.3713, - "step": 263700 - }, - { - "epoch": 0.92, - "learning_rate": 4.0121443793008435e-06, - "loss": 2.3311, - "step": 263710 - }, - { - "epoch": 0.92, - "learning_rate": 4.01040049944719e-06, - "loss": 2.363, - "step": 263720 - }, - { - "epoch": 0.92, - "learning_rate": 4.008656619593536e-06, - "loss": 2.3296, - "step": 263730 - }, - { - "epoch": 0.92, - "learning_rate": 4.0069127397398836e-06, - "loss": 2.3856, - "step": 263740 - }, - { - "epoch": 0.92, - "learning_rate": 4.005168859886229e-06, - "loss": 2.3504, - "step": 263750 - }, - { - "epoch": 0.92, - "learning_rate": 4.003424980032576e-06, - "loss": 2.339, - "step": 263760 - }, - { - "epoch": 0.92, - "learning_rate": 4.001681100178922e-06, - "loss": 2.2964, - "step": 263770 - }, - { - "epoch": 0.92, - "learning_rate": 3.999937220325269e-06, - "loss": 2.3172, - "step": 263780 - }, - { - "epoch": 0.92, - "learning_rate": 3.9981933404716145e-06, - "loss": 2.4197, - "step": 263790 - }, - { - "epoch": 0.92, - "learning_rate": 3.996449460617961e-06, - "loss": 2.3102, - "step": 263800 - }, - { - "epoch": 0.92, - "learning_rate": 3.994705580764308e-06, - "loss": 2.3635, - "step": 263810 - }, - { - "epoch": 0.92, - "learning_rate": 3.9929617009106546e-06, - "loss": 2.3284, - "step": 263820 - }, - { - "epoch": 0.92, - "learning_rate": 3.991217821057e-06, - "loss": 2.3255, - "step": 263830 - }, - { - "epoch": 0.92, - "learning_rate": 3.989473941203347e-06, - "loss": 2.3468, - "step": 263840 - }, - { - "epoch": 0.92, - "learning_rate": 3.987730061349693e-06, - "loss": 2.3376, - "step": 263850 - }, - { - "epoch": 0.92, - "learning_rate": 3.98598618149604e-06, - "loss": 2.3345, - "step": 263860 - }, - { - "epoch": 0.92, - "learning_rate": 3.9842423016423855e-06, - "loss": 2.3419, - "step": 263870 - }, - { - "epoch": 0.92, - "learning_rate": 3.982498421788733e-06, - "loss": 2.3282, - "step": 263880 - }, - { - "epoch": 0.92, - "learning_rate": 3.980754541935079e-06, - "loss": 2.4248, - "step": 263890 - }, - { - "epoch": 0.92, - "learning_rate": 3.9790106620814256e-06, - "loss": 2.3664, - "step": 263900 - }, - { - "epoch": 0.92, - "learning_rate": 3.977266782227771e-06, - "loss": 2.3357, - "step": 263910 - }, - { - "epoch": 0.92, - "learning_rate": 3.975522902374118e-06, - "loss": 2.3747, - "step": 263920 - }, - { - "epoch": 0.92, - "learning_rate": 3.973779022520464e-06, - "loss": 2.2631, - "step": 263930 - }, - { - "epoch": 0.92, - "learning_rate": 3.9720351426668115e-06, - "loss": 2.3886, - "step": 263940 - }, - { - "epoch": 0.92, - "learning_rate": 3.970291262813157e-06, - "loss": 2.3887, - "step": 263950 - }, - { - "epoch": 0.92, - "learning_rate": 3.968547382959504e-06, - "loss": 2.2767, - "step": 263960 - }, - { - "epoch": 0.92, - "learning_rate": 3.96680350310585e-06, - "loss": 2.3866, - "step": 263970 - }, - { - "epoch": 0.92, - "learning_rate": 3.9650596232521966e-06, - "loss": 2.3092, - "step": 263980 - }, - { - "epoch": 0.92, - "learning_rate": 3.963315743398542e-06, - "loss": 2.4075, - "step": 263990 - }, - { - "epoch": 0.92, - "learning_rate": 3.961571863544889e-06, - "loss": 2.3982, - "step": 264000 - }, - { - "epoch": 0.92, - "learning_rate": 3.959827983691236e-06, - "loss": 2.3446, - "step": 264010 - }, - { - "epoch": 0.92, - "learning_rate": 3.9580841038375825e-06, - "loss": 2.3195, - "step": 264020 - }, - { - "epoch": 0.92, - "learning_rate": 3.956340223983928e-06, - "loss": 2.2972, - "step": 264030 - }, - { - "epoch": 0.92, - "learning_rate": 3.954596344130275e-06, - "loss": 2.297, - "step": 264040 - }, - { - "epoch": 0.92, - "learning_rate": 3.952852464276621e-06, - "loss": 2.3672, - "step": 264050 - }, - { - "epoch": 0.92, - "learning_rate": 3.9511085844229676e-06, - "loss": 2.3288, - "step": 264060 - }, - { - "epoch": 0.92, - "learning_rate": 3.949364704569314e-06, - "loss": 2.3565, - "step": 264070 - }, - { - "epoch": 0.92, - "learning_rate": 3.947620824715661e-06, - "loss": 2.3376, - "step": 264080 - }, - { - "epoch": 0.92, - "learning_rate": 3.945876944862007e-06, - "loss": 2.3769, - "step": 264090 - }, - { - "epoch": 0.92, - "learning_rate": 3.9441330650083535e-06, - "loss": 2.3342, - "step": 264100 - }, - { - "epoch": 0.92, - "learning_rate": 3.942389185154699e-06, - "loss": 2.3069, - "step": 264110 - }, - { - "epoch": 0.92, - "learning_rate": 3.940645305301046e-06, - "loss": 2.3067, - "step": 264120 - }, - { - "epoch": 0.92, - "learning_rate": 3.938901425447393e-06, - "loss": 2.3776, - "step": 264130 - }, - { - "epoch": 0.92, - "learning_rate": 3.937157545593739e-06, - "loss": 2.337, - "step": 264140 - }, - { - "epoch": 0.92, - "learning_rate": 3.935413665740085e-06, - "loss": 2.3644, - "step": 264150 - }, - { - "epoch": 0.92, - "learning_rate": 3.933669785886432e-06, - "loss": 2.3487, - "step": 264160 - }, - { - "epoch": 0.92, - "learning_rate": 3.931925906032778e-06, - "loss": 2.3456, - "step": 264170 - }, - { - "epoch": 0.92, - "learning_rate": 3.9301820261791245e-06, - "loss": 2.3403, - "step": 264180 - }, - { - "epoch": 0.92, - "learning_rate": 3.92843814632547e-06, - "loss": 2.396, - "step": 264190 - }, - { - "epoch": 0.92, - "learning_rate": 3.926694266471817e-06, - "loss": 2.2129, - "step": 264200 - }, - { - "epoch": 0.92, - "learning_rate": 3.924950386618164e-06, - "loss": 2.2855, - "step": 264210 - }, - { - "epoch": 0.92, - "learning_rate": 3.92320650676451e-06, - "loss": 2.3927, - "step": 264220 - }, - { - "epoch": 0.92, - "learning_rate": 3.921462626910856e-06, - "loss": 2.3499, - "step": 264230 - }, - { - "epoch": 0.92, - "learning_rate": 3.919718747057203e-06, - "loss": 2.3283, - "step": 264240 - }, - { - "epoch": 0.92, - "learning_rate": 3.917974867203549e-06, - "loss": 2.3078, - "step": 264250 - }, - { - "epoch": 0.92, - "learning_rate": 3.9162309873498955e-06, - "loss": 2.3415, - "step": 264260 - }, - { - "epoch": 0.92, - "learning_rate": 3.914487107496242e-06, - "loss": 2.3633, - "step": 264270 - }, - { - "epoch": 0.92, - "learning_rate": 3.912743227642589e-06, - "loss": 2.3757, - "step": 264280 - }, - { - "epoch": 0.92, - "learning_rate": 3.910999347788935e-06, - "loss": 2.3602, - "step": 264290 - }, - { - "epoch": 0.92, - "learning_rate": 3.909255467935281e-06, - "loss": 2.3647, - "step": 264300 - }, - { - "epoch": 0.92, - "learning_rate": 3.907511588081627e-06, - "loss": 2.2689, - "step": 264310 - }, - { - "epoch": 0.92, - "learning_rate": 3.905767708227974e-06, - "loss": 2.4001, - "step": 264320 - }, - { - "epoch": 0.92, - "learning_rate": 3.904023828374321e-06, - "loss": 2.3542, - "step": 264330 - }, - { - "epoch": 0.92, - "learning_rate": 3.902279948520667e-06, - "loss": 2.3069, - "step": 264340 - }, - { - "epoch": 0.92, - "learning_rate": 3.900536068667013e-06, - "loss": 2.3367, - "step": 264350 - }, - { - "epoch": 0.92, - "learning_rate": 3.89879218881336e-06, - "loss": 2.3844, - "step": 264360 - }, - { - "epoch": 0.92, - "learning_rate": 3.897048308959706e-06, - "loss": 2.3939, - "step": 264370 - }, - { - "epoch": 0.92, - "learning_rate": 3.895304429106052e-06, - "loss": 2.3652, - "step": 264380 - }, - { - "epoch": 0.92, - "learning_rate": 3.893560549252399e-06, - "loss": 2.2973, - "step": 264390 - }, - { - "epoch": 0.92, - "learning_rate": 3.891816669398745e-06, - "loss": 2.3474, - "step": 264400 - }, - { - "epoch": 0.92, - "learning_rate": 3.890072789545092e-06, - "loss": 2.4206, - "step": 264410 - }, - { - "epoch": 0.92, - "learning_rate": 3.888328909691438e-06, - "loss": 2.4373, - "step": 264420 - }, - { - "epoch": 0.92, - "learning_rate": 3.886585029837784e-06, - "loss": 2.3135, - "step": 264430 - }, - { - "epoch": 0.92, - "learning_rate": 3.884841149984131e-06, - "loss": 2.3615, - "step": 264440 - }, - { - "epoch": 0.92, - "learning_rate": 3.883097270130477e-06, - "loss": 2.3445, - "step": 264450 - }, - { - "epoch": 0.92, - "learning_rate": 3.881353390276823e-06, - "loss": 2.3221, - "step": 264460 - }, - { - "epoch": 0.92, - "learning_rate": 3.87960951042317e-06, - "loss": 2.394, - "step": 264470 - }, - { - "epoch": 0.92, - "learning_rate": 3.877865630569517e-06, - "loss": 2.3942, - "step": 264480 - }, - { - "epoch": 0.92, - "learning_rate": 3.876121750715863e-06, - "loss": 2.3397, - "step": 264490 - }, - { - "epoch": 0.92, - "learning_rate": 3.874377870862209e-06, - "loss": 2.3002, - "step": 264500 - }, - { - "epoch": 0.92, - "learning_rate": 3.872633991008555e-06, - "loss": 2.3428, - "step": 264510 - }, - { - "epoch": 0.92, - "learning_rate": 3.870890111154902e-06, - "loss": 2.3871, - "step": 264520 - }, - { - "epoch": 0.92, - "learning_rate": 3.8691462313012486e-06, - "loss": 2.437, - "step": 264530 - }, - { - "epoch": 0.92, - "learning_rate": 3.867402351447595e-06, - "loss": 2.4295, - "step": 264540 - }, - { - "epoch": 0.92, - "learning_rate": 3.865658471593941e-06, - "loss": 2.2996, - "step": 264550 - }, - { - "epoch": 0.92, - "learning_rate": 3.863914591740288e-06, - "loss": 2.3448, - "step": 264560 - }, - { - "epoch": 0.92, - "learning_rate": 3.862170711886634e-06, - "loss": 2.2866, - "step": 264570 - }, - { - "epoch": 0.92, - "learning_rate": 3.86042683203298e-06, - "loss": 2.2855, - "step": 264580 - }, - { - "epoch": 0.92, - "learning_rate": 3.858682952179327e-06, - "loss": 2.3627, - "step": 264590 - }, - { - "epoch": 0.92, - "learning_rate": 3.856939072325673e-06, - "loss": 2.3843, - "step": 264600 - }, - { - "epoch": 0.92, - "learning_rate": 3.8551951924720196e-06, - "loss": 2.3303, - "step": 264610 - }, - { - "epoch": 0.92, - "learning_rate": 3.853451312618366e-06, - "loss": 2.3055, - "step": 264620 - }, - { - "epoch": 0.92, - "learning_rate": 3.851707432764712e-06, - "loss": 2.3088, - "step": 264630 - }, - { - "epoch": 0.92, - "learning_rate": 3.849963552911059e-06, - "loss": 2.2491, - "step": 264640 - }, - { - "epoch": 0.92, - "learning_rate": 3.8482196730574055e-06, - "loss": 2.3449, - "step": 264650 - }, - { - "epoch": 0.92, - "learning_rate": 3.846475793203751e-06, - "loss": 2.3297, - "step": 264660 - }, - { - "epoch": 0.92, - "learning_rate": 3.844731913350098e-06, - "loss": 2.3287, - "step": 264670 - }, - { - "epoch": 0.92, - "learning_rate": 3.842988033496445e-06, - "loss": 2.2553, - "step": 264680 - }, - { - "epoch": 0.92, - "learning_rate": 3.8412441536427906e-06, - "loss": 2.3409, - "step": 264690 - }, - { - "epoch": 0.92, - "learning_rate": 3.839500273789137e-06, - "loss": 2.3573, - "step": 264700 - }, - { - "epoch": 0.92, - "learning_rate": 3.837756393935483e-06, - "loss": 2.4352, - "step": 264710 - }, - { - "epoch": 0.92, - "learning_rate": 3.83601251408183e-06, - "loss": 2.311, - "step": 264720 - }, - { - "epoch": 0.92, - "learning_rate": 3.8342686342281765e-06, - "loss": 2.3182, - "step": 264730 - }, - { - "epoch": 0.92, - "learning_rate": 3.832524754374523e-06, - "loss": 2.3018, - "step": 264740 - }, - { - "epoch": 0.92, - "learning_rate": 3.830780874520869e-06, - "loss": 2.3917, - "step": 264750 - }, - { - "epoch": 0.92, - "learning_rate": 3.829036994667216e-06, - "loss": 2.3459, - "step": 264760 - }, - { - "epoch": 0.92, - "learning_rate": 3.8272931148135616e-06, - "loss": 2.3704, - "step": 264770 - }, - { - "epoch": 0.92, - "learning_rate": 3.825549234959908e-06, - "loss": 2.3504, - "step": 264780 - }, - { - "epoch": 0.92, - "learning_rate": 3.823805355106255e-06, - "loss": 2.3117, - "step": 264790 - }, - { - "epoch": 0.92, - "learning_rate": 3.822061475252601e-06, - "loss": 2.3467, - "step": 264800 - }, - { - "epoch": 0.92, - "learning_rate": 3.8203175953989475e-06, - "loss": 2.364, - "step": 264810 - }, - { - "epoch": 0.92, - "learning_rate": 3.818573715545294e-06, - "loss": 2.3797, - "step": 264820 - }, - { - "epoch": 0.92, - "learning_rate": 3.81682983569164e-06, - "loss": 2.282, - "step": 264830 - }, - { - "epoch": 0.92, - "learning_rate": 3.815085955837987e-06, - "loss": 2.4325, - "step": 264840 - }, - { - "epoch": 0.92, - "learning_rate": 3.813342075984333e-06, - "loss": 2.2678, - "step": 264850 - }, - { - "epoch": 0.92, - "learning_rate": 3.8115981961306793e-06, - "loss": 2.2071, - "step": 264860 - }, - { - "epoch": 0.92, - "learning_rate": 3.8098543162770264e-06, - "loss": 2.398, - "step": 264870 - }, - { - "epoch": 0.92, - "learning_rate": 3.8081104364233727e-06, - "loss": 2.3185, - "step": 264880 - }, - { - "epoch": 0.92, - "learning_rate": 3.806366556569719e-06, - "loss": 2.3444, - "step": 264890 - }, - { - "epoch": 0.92, - "learning_rate": 3.804622676716065e-06, - "loss": 2.3493, - "step": 264900 - }, - { - "epoch": 0.92, - "learning_rate": 3.8028787968624115e-06, - "loss": 2.4137, - "step": 264910 - }, - { - "epoch": 0.92, - "learning_rate": 3.8011349170087577e-06, - "loss": 2.3469, - "step": 264920 - }, - { - "epoch": 0.92, - "learning_rate": 3.799391037155104e-06, - "loss": 2.3415, - "step": 264930 - }, - { - "epoch": 0.92, - "learning_rate": 3.797647157301451e-06, - "loss": 2.3261, - "step": 264940 - }, - { - "epoch": 0.92, - "learning_rate": 3.7959032774477974e-06, - "loss": 2.413, - "step": 264950 - }, - { - "epoch": 0.92, - "learning_rate": 3.7941593975941437e-06, - "loss": 2.304, - "step": 264960 - }, - { - "epoch": 0.92, - "learning_rate": 3.79241551774049e-06, - "loss": 2.4432, - "step": 264970 - }, - { - "epoch": 0.92, - "learning_rate": 3.790671637886836e-06, - "loss": 2.3121, - "step": 264980 - }, - { - "epoch": 0.92, - "learning_rate": 3.7889277580331825e-06, - "loss": 2.3189, - "step": 264990 - }, - { - "epoch": 0.92, - "learning_rate": 3.7871838781795287e-06, - "loss": 2.3617, - "step": 265000 - }, - { - "epoch": 0.92, - "learning_rate": 3.785439998325876e-06, - "loss": 2.311, - "step": 265010 - }, - { - "epoch": 0.92, - "learning_rate": 3.783696118472222e-06, - "loss": 2.303, - "step": 265020 - }, - { - "epoch": 0.92, - "learning_rate": 3.7819522386185684e-06, - "loss": 2.3111, - "step": 265030 - }, - { - "epoch": 0.92, - "learning_rate": 3.7802083587649147e-06, - "loss": 2.3427, - "step": 265040 - }, - { - "epoch": 0.92, - "learning_rate": 3.778464478911261e-06, - "loss": 2.2758, - "step": 265050 - }, - { - "epoch": 0.92, - "learning_rate": 3.776720599057607e-06, - "loss": 2.3577, - "step": 265060 - }, - { - "epoch": 0.92, - "learning_rate": 3.7749767192039543e-06, - "loss": 2.3736, - "step": 265070 - }, - { - "epoch": 0.92, - "learning_rate": 3.7732328393503006e-06, - "loss": 2.3013, - "step": 265080 - }, - { - "epoch": 0.92, - "learning_rate": 3.771488959496647e-06, - "loss": 2.3529, - "step": 265090 - }, - { - "epoch": 0.92, - "learning_rate": 3.769745079642993e-06, - "loss": 2.362, - "step": 265100 - }, - { - "epoch": 0.92, - "learning_rate": 3.7680011997893394e-06, - "loss": 2.2488, - "step": 265110 - }, - { - "epoch": 0.92, - "learning_rate": 3.7662573199356857e-06, - "loss": 2.2634, - "step": 265120 - }, - { - "epoch": 0.92, - "learning_rate": 3.764513440082032e-06, - "loss": 2.4154, - "step": 265130 - }, - { - "epoch": 0.92, - "learning_rate": 3.762769560228379e-06, - "loss": 2.3629, - "step": 265140 - }, - { - "epoch": 0.92, - "learning_rate": 3.7610256803747253e-06, - "loss": 2.4116, - "step": 265150 - }, - { - "epoch": 0.92, - "learning_rate": 3.7592818005210716e-06, - "loss": 2.2957, - "step": 265160 - }, - { - "epoch": 0.92, - "learning_rate": 3.757537920667418e-06, - "loss": 2.3014, - "step": 265170 - }, - { - "epoch": 0.92, - "learning_rate": 3.755794040813764e-06, - "loss": 2.3475, - "step": 265180 - }, - { - "epoch": 0.92, - "learning_rate": 3.7540501609601104e-06, - "loss": 2.39, - "step": 265190 - }, - { - "epoch": 0.92, - "learning_rate": 3.7523062811064567e-06, - "loss": 2.3508, - "step": 265200 - }, - { - "epoch": 0.92, - "learning_rate": 3.7505624012528038e-06, - "loss": 2.2954, - "step": 265210 - }, - { - "epoch": 0.93, - "learning_rate": 3.74881852139915e-06, - "loss": 2.302, - "step": 265220 - }, - { - "epoch": 0.93, - "learning_rate": 3.7470746415454963e-06, - "loss": 2.3256, - "step": 265230 - }, - { - "epoch": 0.93, - "learning_rate": 3.7453307616918426e-06, - "loss": 2.3226, - "step": 265240 - }, - { - "epoch": 0.93, - "learning_rate": 3.743586881838189e-06, - "loss": 2.292, - "step": 265250 - }, - { - "epoch": 0.93, - "learning_rate": 3.741843001984535e-06, - "loss": 2.3923, - "step": 265260 - }, - { - "epoch": 0.93, - "learning_rate": 3.7400991221308822e-06, - "loss": 2.2258, - "step": 265270 - }, - { - "epoch": 0.93, - "learning_rate": 3.7383552422772285e-06, - "loss": 2.3653, - "step": 265280 - }, - { - "epoch": 0.93, - "learning_rate": 3.7366113624235748e-06, - "loss": 2.2834, - "step": 265290 - }, - { - "epoch": 0.93, - "learning_rate": 3.734867482569921e-06, - "loss": 2.2833, - "step": 265300 - }, - { - "epoch": 0.93, - "learning_rate": 3.7331236027162673e-06, - "loss": 2.2791, - "step": 265310 - }, - { - "epoch": 0.93, - "learning_rate": 3.7313797228626136e-06, - "loss": 2.3695, - "step": 265320 - }, - { - "epoch": 0.93, - "learning_rate": 3.72963584300896e-06, - "loss": 2.3274, - "step": 265330 - }, - { - "epoch": 0.93, - "learning_rate": 3.727891963155307e-06, - "loss": 2.3903, - "step": 265340 - }, - { - "epoch": 0.93, - "learning_rate": 3.7261480833016532e-06, - "loss": 2.3072, - "step": 265350 - }, - { - "epoch": 0.93, - "learning_rate": 3.7244042034479995e-06, - "loss": 2.322, - "step": 265360 - }, - { - "epoch": 0.93, - "learning_rate": 3.7226603235943458e-06, - "loss": 2.3224, - "step": 265370 - }, - { - "epoch": 0.93, - "learning_rate": 3.720916443740692e-06, - "loss": 2.371, - "step": 265380 - }, - { - "epoch": 0.93, - "learning_rate": 3.7191725638870383e-06, - "loss": 2.3756, - "step": 265390 - }, - { - "epoch": 0.93, - "learning_rate": 3.7174286840333846e-06, - "loss": 2.3078, - "step": 265400 - }, - { - "epoch": 0.93, - "learning_rate": 3.7156848041797317e-06, - "loss": 2.3213, - "step": 265410 - }, - { - "epoch": 0.93, - "learning_rate": 3.713940924326078e-06, - "loss": 2.3089, - "step": 265420 - }, - { - "epoch": 0.93, - "learning_rate": 3.7121970444724242e-06, - "loss": 2.2647, - "step": 265430 - }, - { - "epoch": 0.93, - "learning_rate": 3.7104531646187705e-06, - "loss": 2.3231, - "step": 265440 - }, - { - "epoch": 0.93, - "learning_rate": 3.7087092847651168e-06, - "loss": 2.3257, - "step": 265450 - }, - { - "epoch": 0.93, - "learning_rate": 3.706965404911463e-06, - "loss": 2.2734, - "step": 265460 - }, - { - "epoch": 0.93, - "learning_rate": 3.70522152505781e-06, - "loss": 2.3316, - "step": 265470 - }, - { - "epoch": 0.93, - "learning_rate": 3.7034776452041564e-06, - "loss": 2.3, - "step": 265480 - }, - { - "epoch": 0.93, - "learning_rate": 3.7017337653505027e-06, - "loss": 2.4456, - "step": 265490 - }, - { - "epoch": 0.93, - "learning_rate": 3.699989885496849e-06, - "loss": 2.335, - "step": 265500 - }, - { - "epoch": 0.93, - "learning_rate": 3.6982460056431952e-06, - "loss": 2.3089, - "step": 265510 - }, - { - "epoch": 0.93, - "learning_rate": 3.6965021257895415e-06, - "loss": 2.3952, - "step": 265520 - }, - { - "epoch": 0.93, - "learning_rate": 3.6947582459358878e-06, - "loss": 2.253, - "step": 265530 - }, - { - "epoch": 0.93, - "learning_rate": 3.693014366082235e-06, - "loss": 2.4005, - "step": 265540 - }, - { - "epoch": 0.93, - "learning_rate": 3.691270486228581e-06, - "loss": 2.3434, - "step": 265550 - }, - { - "epoch": 0.93, - "learning_rate": 3.6895266063749274e-06, - "loss": 2.3186, - "step": 265560 - }, - { - "epoch": 0.93, - "learning_rate": 3.6877827265212737e-06, - "loss": 2.3589, - "step": 265570 - }, - { - "epoch": 0.93, - "learning_rate": 3.68603884666762e-06, - "loss": 2.4055, - "step": 265580 - }, - { - "epoch": 0.93, - "learning_rate": 3.6842949668139662e-06, - "loss": 2.3037, - "step": 265590 - }, - { - "epoch": 0.93, - "learning_rate": 3.6825510869603125e-06, - "loss": 2.3587, - "step": 265600 - }, - { - "epoch": 0.93, - "learning_rate": 3.6808072071066596e-06, - "loss": 2.343, - "step": 265610 - }, - { - "epoch": 0.93, - "learning_rate": 3.679063327253006e-06, - "loss": 2.3881, - "step": 265620 - }, - { - "epoch": 0.93, - "learning_rate": 3.677319447399352e-06, - "loss": 2.3408, - "step": 265630 - }, - { - "epoch": 0.93, - "learning_rate": 3.6755755675456984e-06, - "loss": 2.3956, - "step": 265640 - }, - { - "epoch": 0.93, - "learning_rate": 3.6738316876920447e-06, - "loss": 2.3293, - "step": 265650 - }, - { - "epoch": 0.93, - "learning_rate": 3.672087807838391e-06, - "loss": 2.2661, - "step": 265660 - }, - { - "epoch": 0.93, - "learning_rate": 3.670343927984738e-06, - "loss": 2.3063, - "step": 265670 - }, - { - "epoch": 0.93, - "learning_rate": 3.6686000481310844e-06, - "loss": 2.3874, - "step": 265680 - }, - { - "epoch": 0.93, - "learning_rate": 3.6668561682774306e-06, - "loss": 2.3332, - "step": 265690 - }, - { - "epoch": 0.93, - "learning_rate": 3.665112288423777e-06, - "loss": 2.2872, - "step": 265700 - }, - { - "epoch": 0.93, - "learning_rate": 3.663368408570123e-06, - "loss": 2.3892, - "step": 265710 - }, - { - "epoch": 0.93, - "learning_rate": 3.6616245287164694e-06, - "loss": 2.2746, - "step": 265720 - }, - { - "epoch": 0.93, - "learning_rate": 3.6598806488628157e-06, - "loss": 2.3146, - "step": 265730 - }, - { - "epoch": 0.93, - "learning_rate": 3.658136769009163e-06, - "loss": 2.3466, - "step": 265740 - }, - { - "epoch": 0.93, - "learning_rate": 3.656392889155509e-06, - "loss": 2.3252, - "step": 265750 - }, - { - "epoch": 0.93, - "learning_rate": 3.6546490093018554e-06, - "loss": 2.3822, - "step": 265760 - }, - { - "epoch": 0.93, - "learning_rate": 3.6529051294482016e-06, - "loss": 2.3106, - "step": 265770 - }, - { - "epoch": 0.93, - "learning_rate": 3.651161249594548e-06, - "loss": 2.2679, - "step": 265780 - }, - { - "epoch": 0.93, - "learning_rate": 3.649417369740894e-06, - "loss": 2.2942, - "step": 265790 - }, - { - "epoch": 0.93, - "learning_rate": 3.6476734898872404e-06, - "loss": 2.3782, - "step": 265800 - }, - { - "epoch": 0.93, - "learning_rate": 3.6459296100335876e-06, - "loss": 2.3444, - "step": 265810 - }, - { - "epoch": 0.93, - "learning_rate": 3.644185730179934e-06, - "loss": 2.3393, - "step": 265820 - }, - { - "epoch": 0.93, - "learning_rate": 3.64244185032628e-06, - "loss": 2.3585, - "step": 265830 - }, - { - "epoch": 0.93, - "learning_rate": 3.6406979704726264e-06, - "loss": 2.4124, - "step": 265840 - }, - { - "epoch": 0.93, - "learning_rate": 3.6389540906189726e-06, - "loss": 2.3652, - "step": 265850 - }, - { - "epoch": 0.93, - "learning_rate": 3.637210210765319e-06, - "loss": 2.276, - "step": 265860 - }, - { - "epoch": 0.93, - "learning_rate": 3.635466330911666e-06, - "loss": 2.2848, - "step": 265870 - }, - { - "epoch": 0.93, - "learning_rate": 3.6337224510580123e-06, - "loss": 2.3276, - "step": 265880 - }, - { - "epoch": 0.93, - "learning_rate": 3.6319785712043586e-06, - "loss": 2.2898, - "step": 265890 - }, - { - "epoch": 0.93, - "learning_rate": 3.630234691350705e-06, - "loss": 2.281, - "step": 265900 - }, - { - "epoch": 0.93, - "learning_rate": 3.628490811497051e-06, - "loss": 2.3182, - "step": 265910 - }, - { - "epoch": 0.93, - "learning_rate": 3.6267469316433974e-06, - "loss": 2.3461, - "step": 265920 - }, - { - "epoch": 0.93, - "learning_rate": 3.6250030517897436e-06, - "loss": 2.3638, - "step": 265930 - }, - { - "epoch": 0.93, - "learning_rate": 3.6232591719360907e-06, - "loss": 2.2368, - "step": 265940 - }, - { - "epoch": 0.93, - "learning_rate": 3.621515292082437e-06, - "loss": 2.3, - "step": 265950 - }, - { - "epoch": 0.93, - "learning_rate": 3.6197714122287833e-06, - "loss": 2.3248, - "step": 265960 - }, - { - "epoch": 0.93, - "learning_rate": 3.6180275323751296e-06, - "loss": 2.3465, - "step": 265970 - }, - { - "epoch": 0.93, - "learning_rate": 3.616283652521476e-06, - "loss": 2.3111, - "step": 265980 - }, - { - "epoch": 0.93, - "learning_rate": 3.614539772667822e-06, - "loss": 2.4125, - "step": 265990 - }, - { - "epoch": 0.93, - "learning_rate": 3.6127958928141692e-06, - "loss": 2.1898, - "step": 266000 - }, - { - "epoch": 0.93, - "learning_rate": 3.6110520129605155e-06, - "loss": 2.3098, - "step": 266010 - }, - { - "epoch": 0.93, - "learning_rate": 3.6093081331068618e-06, - "loss": 2.2912, - "step": 266020 - }, - { - "epoch": 0.93, - "learning_rate": 3.607564253253208e-06, - "loss": 2.4039, - "step": 266030 - }, - { - "epoch": 0.93, - "learning_rate": 3.6058203733995543e-06, - "loss": 2.4078, - "step": 266040 - }, - { - "epoch": 0.93, - "learning_rate": 3.6040764935459006e-06, - "loss": 2.2981, - "step": 266050 - }, - { - "epoch": 0.93, - "learning_rate": 3.602332613692247e-06, - "loss": 2.3001, - "step": 266060 - }, - { - "epoch": 0.93, - "learning_rate": 3.600588733838594e-06, - "loss": 2.3784, - "step": 266070 - }, - { - "epoch": 0.93, - "learning_rate": 3.5988448539849402e-06, - "loss": 2.3399, - "step": 266080 - }, - { - "epoch": 0.93, - "learning_rate": 3.5971009741312865e-06, - "loss": 2.3308, - "step": 266090 - }, - { - "epoch": 0.93, - "learning_rate": 3.5953570942776328e-06, - "loss": 2.3592, - "step": 266100 - }, - { - "epoch": 0.93, - "learning_rate": 3.593613214423979e-06, - "loss": 2.3796, - "step": 266110 - }, - { - "epoch": 0.93, - "learning_rate": 3.5918693345703253e-06, - "loss": 2.3688, - "step": 266120 - }, - { - "epoch": 0.93, - "learning_rate": 3.5901254547166716e-06, - "loss": 2.3245, - "step": 266130 - }, - { - "epoch": 0.93, - "learning_rate": 3.5883815748630187e-06, - "loss": 2.2686, - "step": 266140 - }, - { - "epoch": 0.93, - "learning_rate": 3.586637695009365e-06, - "loss": 2.3073, - "step": 266150 - }, - { - "epoch": 0.93, - "learning_rate": 3.5848938151557112e-06, - "loss": 2.2903, - "step": 266160 - }, - { - "epoch": 0.93, - "learning_rate": 3.5831499353020575e-06, - "loss": 2.2968, - "step": 266170 - }, - { - "epoch": 0.93, - "learning_rate": 3.5814060554484038e-06, - "loss": 2.3731, - "step": 266180 - }, - { - "epoch": 0.93, - "learning_rate": 3.57966217559475e-06, - "loss": 2.4027, - "step": 266190 - }, - { - "epoch": 0.93, - "learning_rate": 3.577918295741097e-06, - "loss": 2.2898, - "step": 266200 - }, - { - "epoch": 0.93, - "learning_rate": 3.5761744158874434e-06, - "loss": 2.3542, - "step": 266210 - }, - { - "epoch": 0.93, - "learning_rate": 3.5744305360337897e-06, - "loss": 2.3173, - "step": 266220 - }, - { - "epoch": 0.93, - "learning_rate": 3.572686656180136e-06, - "loss": 2.3923, - "step": 266230 - }, - { - "epoch": 0.93, - "learning_rate": 3.5709427763264822e-06, - "loss": 2.3336, - "step": 266240 - }, - { - "epoch": 0.93, - "learning_rate": 3.5691988964728285e-06, - "loss": 2.3609, - "step": 266250 - }, - { - "epoch": 0.93, - "learning_rate": 3.5674550166191748e-06, - "loss": 2.3022, - "step": 266260 - }, - { - "epoch": 0.93, - "learning_rate": 3.565711136765522e-06, - "loss": 2.4148, - "step": 266270 - }, - { - "epoch": 0.93, - "learning_rate": 3.563967256911868e-06, - "loss": 2.3909, - "step": 266280 - }, - { - "epoch": 0.93, - "learning_rate": 3.5622233770582144e-06, - "loss": 2.2906, - "step": 266290 - }, - { - "epoch": 0.93, - "learning_rate": 3.5604794972045607e-06, - "loss": 2.2873, - "step": 266300 - }, - { - "epoch": 0.93, - "learning_rate": 3.558735617350907e-06, - "loss": 2.3069, - "step": 266310 - }, - { - "epoch": 0.93, - "learning_rate": 3.5569917374972532e-06, - "loss": 2.3801, - "step": 266320 - }, - { - "epoch": 0.93, - "learning_rate": 3.5552478576435995e-06, - "loss": 2.3356, - "step": 266330 - }, - { - "epoch": 0.93, - "learning_rate": 3.5535039777899466e-06, - "loss": 2.3705, - "step": 266340 - }, - { - "epoch": 0.93, - "learning_rate": 3.551760097936293e-06, - "loss": 2.249, - "step": 266350 - }, - { - "epoch": 0.93, - "learning_rate": 3.550016218082639e-06, - "loss": 2.353, - "step": 266360 - }, - { - "epoch": 0.93, - "learning_rate": 3.5482723382289854e-06, - "loss": 2.319, - "step": 266370 - }, - { - "epoch": 0.93, - "learning_rate": 3.5465284583753317e-06, - "loss": 2.3714, - "step": 266380 - }, - { - "epoch": 0.93, - "learning_rate": 3.544784578521678e-06, - "loss": 2.2841, - "step": 266390 - }, - { - "epoch": 0.93, - "learning_rate": 3.543040698668025e-06, - "loss": 2.2804, - "step": 266400 - }, - { - "epoch": 0.93, - "learning_rate": 3.5412968188143713e-06, - "loss": 2.3125, - "step": 266410 - }, - { - "epoch": 0.93, - "learning_rate": 3.5395529389607176e-06, - "loss": 2.4291, - "step": 266420 - }, - { - "epoch": 0.93, - "learning_rate": 3.537809059107064e-06, - "loss": 2.3824, - "step": 266430 - }, - { - "epoch": 0.93, - "learning_rate": 3.53606517925341e-06, - "loss": 2.3229, - "step": 266440 - }, - { - "epoch": 0.93, - "learning_rate": 3.5343212993997564e-06, - "loss": 2.4473, - "step": 266450 - }, - { - "epoch": 0.93, - "learning_rate": 3.5325774195461027e-06, - "loss": 2.2893, - "step": 266460 - }, - { - "epoch": 0.93, - "learning_rate": 3.53083353969245e-06, - "loss": 2.383, - "step": 266470 - }, - { - "epoch": 0.93, - "learning_rate": 3.529089659838796e-06, - "loss": 2.299, - "step": 266480 - }, - { - "epoch": 0.93, - "learning_rate": 3.5273457799851423e-06, - "loss": 2.3111, - "step": 266490 - }, - { - "epoch": 0.93, - "learning_rate": 3.5256019001314886e-06, - "loss": 2.2211, - "step": 266500 - }, - { - "epoch": 0.93, - "learning_rate": 3.523858020277835e-06, - "loss": 2.3219, - "step": 266510 - }, - { - "epoch": 0.93, - "learning_rate": 3.522114140424181e-06, - "loss": 2.3303, - "step": 266520 - }, - { - "epoch": 0.93, - "learning_rate": 3.5203702605705274e-06, - "loss": 2.3204, - "step": 266530 - }, - { - "epoch": 0.93, - "learning_rate": 3.5186263807168745e-06, - "loss": 2.3362, - "step": 266540 - }, - { - "epoch": 0.93, - "learning_rate": 3.516882500863221e-06, - "loss": 2.3666, - "step": 266550 - }, - { - "epoch": 0.93, - "learning_rate": 3.515138621009567e-06, - "loss": 2.3897, - "step": 266560 - }, - { - "epoch": 0.93, - "learning_rate": 3.5133947411559133e-06, - "loss": 2.3146, - "step": 266570 - }, - { - "epoch": 0.93, - "learning_rate": 3.5116508613022596e-06, - "loss": 2.363, - "step": 266580 - }, - { - "epoch": 0.93, - "learning_rate": 3.509906981448606e-06, - "loss": 2.3554, - "step": 266590 - }, - { - "epoch": 0.93, - "learning_rate": 3.508163101594953e-06, - "loss": 2.3614, - "step": 266600 - }, - { - "epoch": 0.93, - "learning_rate": 3.5064192217412993e-06, - "loss": 2.3096, - "step": 266610 - }, - { - "epoch": 0.93, - "learning_rate": 3.5046753418876455e-06, - "loss": 2.345, - "step": 266620 - }, - { - "epoch": 0.93, - "learning_rate": 3.502931462033992e-06, - "loss": 2.3429, - "step": 266630 - }, - { - "epoch": 0.93, - "learning_rate": 3.501187582180338e-06, - "loss": 2.3769, - "step": 266640 - }, - { - "epoch": 0.93, - "learning_rate": 3.4994437023266843e-06, - "loss": 2.3159, - "step": 266650 - }, - { - "epoch": 0.93, - "learning_rate": 3.4976998224730306e-06, - "loss": 2.3686, - "step": 266660 - }, - { - "epoch": 0.93, - "learning_rate": 3.4959559426193777e-06, - "loss": 2.3115, - "step": 266670 - }, - { - "epoch": 0.93, - "learning_rate": 3.494212062765724e-06, - "loss": 2.4107, - "step": 266680 - }, - { - "epoch": 0.93, - "learning_rate": 3.4924681829120703e-06, - "loss": 2.4326, - "step": 266690 - }, - { - "epoch": 0.93, - "learning_rate": 3.4907243030584165e-06, - "loss": 2.2815, - "step": 266700 - }, - { - "epoch": 0.93, - "learning_rate": 3.488980423204763e-06, - "loss": 2.3355, - "step": 266710 - }, - { - "epoch": 0.93, - "learning_rate": 3.487236543351109e-06, - "loss": 2.263, - "step": 266720 - }, - { - "epoch": 0.93, - "learning_rate": 3.4854926634974553e-06, - "loss": 2.2563, - "step": 266730 - }, - { - "epoch": 0.93, - "learning_rate": 3.4837487836438025e-06, - "loss": 2.3375, - "step": 266740 - }, - { - "epoch": 0.93, - "learning_rate": 3.4820049037901487e-06, - "loss": 2.3437, - "step": 266750 - }, - { - "epoch": 0.93, - "learning_rate": 3.480261023936495e-06, - "loss": 2.3592, - "step": 266760 - }, - { - "epoch": 0.93, - "learning_rate": 3.4785171440828413e-06, - "loss": 2.3706, - "step": 266770 - }, - { - "epoch": 0.93, - "learning_rate": 3.4767732642291875e-06, - "loss": 2.2843, - "step": 266780 - }, - { - "epoch": 0.93, - "learning_rate": 3.475029384375534e-06, - "loss": 2.3018, - "step": 266790 - }, - { - "epoch": 0.93, - "learning_rate": 3.473285504521881e-06, - "loss": 2.3706, - "step": 266800 - }, - { - "epoch": 0.93, - "learning_rate": 3.471541624668227e-06, - "loss": 2.3475, - "step": 266810 - }, - { - "epoch": 0.93, - "learning_rate": 3.4697977448145735e-06, - "loss": 2.3033, - "step": 266820 - }, - { - "epoch": 0.93, - "learning_rate": 3.4680538649609197e-06, - "loss": 2.3763, - "step": 266830 - }, - { - "epoch": 0.93, - "learning_rate": 3.466309985107266e-06, - "loss": 2.3745, - "step": 266840 - }, - { - "epoch": 0.93, - "learning_rate": 3.4645661052536123e-06, - "loss": 2.3273, - "step": 266850 - }, - { - "epoch": 0.93, - "learning_rate": 3.4628222253999585e-06, - "loss": 2.3591, - "step": 266860 - }, - { - "epoch": 0.93, - "learning_rate": 3.4610783455463057e-06, - "loss": 2.2275, - "step": 266870 - }, - { - "epoch": 0.93, - "learning_rate": 3.459334465692652e-06, - "loss": 2.3162, - "step": 266880 - }, - { - "epoch": 0.93, - "learning_rate": 3.457590585838998e-06, - "loss": 2.2853, - "step": 266890 - }, - { - "epoch": 0.93, - "learning_rate": 3.4558467059853445e-06, - "loss": 2.3643, - "step": 266900 - }, - { - "epoch": 0.93, - "learning_rate": 3.4541028261316907e-06, - "loss": 2.3028, - "step": 266910 - }, - { - "epoch": 0.93, - "learning_rate": 3.452358946278037e-06, - "loss": 2.3613, - "step": 266920 - }, - { - "epoch": 0.93, - "learning_rate": 3.4506150664243833e-06, - "loss": 2.2521, - "step": 266930 - }, - { - "epoch": 0.93, - "learning_rate": 3.4488711865707304e-06, - "loss": 2.3243, - "step": 266940 - }, - { - "epoch": 0.93, - "learning_rate": 3.4471273067170767e-06, - "loss": 2.3382, - "step": 266950 - }, - { - "epoch": 0.93, - "learning_rate": 3.445383426863423e-06, - "loss": 2.3688, - "step": 266960 - }, - { - "epoch": 0.93, - "learning_rate": 3.443639547009769e-06, - "loss": 2.2794, - "step": 266970 - }, - { - "epoch": 0.93, - "learning_rate": 3.4418956671561155e-06, - "loss": 2.3549, - "step": 266980 - }, - { - "epoch": 0.93, - "learning_rate": 3.4401517873024617e-06, - "loss": 2.4083, - "step": 266990 - }, - { - "epoch": 0.93, - "learning_rate": 3.438407907448809e-06, - "loss": 2.3066, - "step": 267000 - }, - { - "epoch": 0.93, - "learning_rate": 3.436664027595155e-06, - "loss": 2.2904, - "step": 267010 - }, - { - "epoch": 0.93, - "learning_rate": 3.4349201477415014e-06, - "loss": 2.3522, - "step": 267020 - }, - { - "epoch": 0.93, - "learning_rate": 3.4331762678878477e-06, - "loss": 2.344, - "step": 267030 - }, - { - "epoch": 0.93, - "learning_rate": 3.431432388034194e-06, - "loss": 2.3757, - "step": 267040 - }, - { - "epoch": 0.93, - "learning_rate": 3.42968850818054e-06, - "loss": 2.3024, - "step": 267050 - }, - { - "epoch": 0.93, - "learning_rate": 3.4279446283268865e-06, - "loss": 2.3597, - "step": 267060 - }, - { - "epoch": 0.93, - "learning_rate": 3.4262007484732336e-06, - "loss": 2.3522, - "step": 267070 - }, - { - "epoch": 0.93, - "learning_rate": 3.42445686861958e-06, - "loss": 2.4137, - "step": 267080 - }, - { - "epoch": 0.93, - "learning_rate": 3.422712988765926e-06, - "loss": 2.3719, - "step": 267090 - }, - { - "epoch": 0.93, - "learning_rate": 3.4209691089122724e-06, - "loss": 2.3035, - "step": 267100 - }, - { - "epoch": 0.93, - "learning_rate": 3.4192252290586187e-06, - "loss": 2.3632, - "step": 267110 - }, - { - "epoch": 0.93, - "learning_rate": 3.417481349204965e-06, - "loss": 2.3134, - "step": 267120 - }, - { - "epoch": 0.93, - "learning_rate": 3.415737469351311e-06, - "loss": 2.335, - "step": 267130 - }, - { - "epoch": 0.93, - "learning_rate": 3.4139935894976583e-06, - "loss": 2.3303, - "step": 267140 - }, - { - "epoch": 0.93, - "learning_rate": 3.4122497096440046e-06, - "loss": 2.318, - "step": 267150 - }, - { - "epoch": 0.93, - "learning_rate": 3.410505829790351e-06, - "loss": 2.2738, - "step": 267160 - }, - { - "epoch": 0.93, - "learning_rate": 3.408761949936697e-06, - "loss": 2.3255, - "step": 267170 - }, - { - "epoch": 0.93, - "learning_rate": 3.4070180700830434e-06, - "loss": 2.322, - "step": 267180 - }, - { - "epoch": 0.93, - "learning_rate": 3.4052741902293897e-06, - "loss": 2.358, - "step": 267190 - }, - { - "epoch": 0.93, - "learning_rate": 3.4035303103757368e-06, - "loss": 2.2675, - "step": 267200 - }, - { - "epoch": 0.93, - "learning_rate": 3.401786430522083e-06, - "loss": 2.226, - "step": 267210 - }, - { - "epoch": 0.93, - "learning_rate": 3.4000425506684293e-06, - "loss": 2.2367, - "step": 267220 - }, - { - "epoch": 0.93, - "learning_rate": 3.3982986708147756e-06, - "loss": 2.3331, - "step": 267230 - }, - { - "epoch": 0.93, - "learning_rate": 3.396554790961122e-06, - "loss": 2.2976, - "step": 267240 - }, - { - "epoch": 0.93, - "learning_rate": 3.394810911107468e-06, - "loss": 2.3992, - "step": 267250 - }, - { - "epoch": 0.93, - "learning_rate": 3.3930670312538144e-06, - "loss": 2.3074, - "step": 267260 - }, - { - "epoch": 0.93, - "learning_rate": 3.3913231514001615e-06, - "loss": 2.3595, - "step": 267270 - }, - { - "epoch": 0.93, - "learning_rate": 3.3895792715465078e-06, - "loss": 2.311, - "step": 267280 - }, - { - "epoch": 0.93, - "learning_rate": 3.387835391692854e-06, - "loss": 2.3818, - "step": 267290 - }, - { - "epoch": 0.93, - "learning_rate": 3.3860915118392003e-06, - "loss": 2.289, - "step": 267300 - }, - { - "epoch": 0.93, - "learning_rate": 3.3843476319855466e-06, - "loss": 2.3316, - "step": 267310 - }, - { - "epoch": 0.93, - "learning_rate": 3.382603752131893e-06, - "loss": 2.2752, - "step": 267320 - }, - { - "epoch": 0.93, - "learning_rate": 3.38085987227824e-06, - "loss": 2.2869, - "step": 267330 - }, - { - "epoch": 0.93, - "learning_rate": 3.3791159924245862e-06, - "loss": 2.3024, - "step": 267340 - }, - { - "epoch": 0.93, - "learning_rate": 3.3773721125709325e-06, - "loss": 2.3786, - "step": 267350 - }, - { - "epoch": 0.93, - "learning_rate": 3.3756282327172788e-06, - "loss": 2.2741, - "step": 267360 - }, - { - "epoch": 0.93, - "learning_rate": 3.373884352863625e-06, - "loss": 2.3737, - "step": 267370 - }, - { - "epoch": 0.93, - "learning_rate": 3.3721404730099713e-06, - "loss": 2.3043, - "step": 267380 - }, - { - "epoch": 0.93, - "learning_rate": 3.3703965931563176e-06, - "loss": 2.3322, - "step": 267390 - }, - { - "epoch": 0.93, - "learning_rate": 3.3686527133026647e-06, - "loss": 2.3883, - "step": 267400 - }, - { - "epoch": 0.93, - "learning_rate": 3.366908833449011e-06, - "loss": 2.3329, - "step": 267410 - }, - { - "epoch": 0.93, - "learning_rate": 3.3651649535953572e-06, - "loss": 2.3555, - "step": 267420 - }, - { - "epoch": 0.93, - "learning_rate": 3.3634210737417035e-06, - "loss": 2.356, - "step": 267430 - }, - { - "epoch": 0.93, - "learning_rate": 3.3616771938880498e-06, - "loss": 2.3098, - "step": 267440 - }, - { - "epoch": 0.93, - "learning_rate": 3.359933314034396e-06, - "loss": 2.2992, - "step": 267450 - }, - { - "epoch": 0.93, - "learning_rate": 3.3581894341807427e-06, - "loss": 2.3365, - "step": 267460 - }, - { - "epoch": 0.93, - "learning_rate": 3.3564455543270894e-06, - "loss": 2.345, - "step": 267470 - }, - { - "epoch": 0.93, - "learning_rate": 3.3547016744734357e-06, - "loss": 2.3076, - "step": 267480 - }, - { - "epoch": 0.93, - "learning_rate": 3.352957794619782e-06, - "loss": 2.3383, - "step": 267490 - }, - { - "epoch": 0.93, - "learning_rate": 3.3512139147661282e-06, - "loss": 2.3646, - "step": 267500 - }, - { - "epoch": 0.93, - "learning_rate": 3.3494700349124745e-06, - "loss": 2.3481, - "step": 267510 - }, - { - "epoch": 0.93, - "learning_rate": 3.3477261550588208e-06, - "loss": 2.3944, - "step": 267520 - }, - { - "epoch": 0.93, - "learning_rate": 3.345982275205168e-06, - "loss": 2.3985, - "step": 267530 - }, - { - "epoch": 0.93, - "learning_rate": 3.344238395351514e-06, - "loss": 2.2963, - "step": 267540 - }, - { - "epoch": 0.93, - "learning_rate": 3.3424945154978604e-06, - "loss": 2.2761, - "step": 267550 - }, - { - "epoch": 0.93, - "learning_rate": 3.3407506356442067e-06, - "loss": 2.2863, - "step": 267560 - }, - { - "epoch": 0.93, - "learning_rate": 3.339006755790553e-06, - "loss": 2.2918, - "step": 267570 - }, - { - "epoch": 0.93, - "learning_rate": 3.3372628759368992e-06, - "loss": 2.3587, - "step": 267580 - }, - { - "epoch": 0.93, - "learning_rate": 3.335518996083246e-06, - "loss": 2.3693, - "step": 267590 - }, - { - "epoch": 0.93, - "learning_rate": 3.3337751162295926e-06, - "loss": 2.3696, - "step": 267600 - }, - { - "epoch": 0.93, - "learning_rate": 3.332031236375939e-06, - "loss": 2.3348, - "step": 267610 - }, - { - "epoch": 0.93, - "learning_rate": 3.330287356522285e-06, - "loss": 2.2981, - "step": 267620 - }, - { - "epoch": 0.93, - "learning_rate": 3.3285434766686314e-06, - "loss": 2.3229, - "step": 267630 - }, - { - "epoch": 0.93, - "learning_rate": 3.3267995968149777e-06, - "loss": 2.2666, - "step": 267640 - }, - { - "epoch": 0.93, - "learning_rate": 3.325055716961324e-06, - "loss": 2.3446, - "step": 267650 - }, - { - "epoch": 0.93, - "learning_rate": 3.3233118371076707e-06, - "loss": 2.3567, - "step": 267660 - }, - { - "epoch": 0.93, - "learning_rate": 3.3215679572540174e-06, - "loss": 2.3447, - "step": 267670 - }, - { - "epoch": 0.93, - "learning_rate": 3.3198240774003636e-06, - "loss": 2.2937, - "step": 267680 - }, - { - "epoch": 0.93, - "learning_rate": 3.31808019754671e-06, - "loss": 2.3696, - "step": 267690 - }, - { - "epoch": 0.93, - "learning_rate": 3.316336317693056e-06, - "loss": 2.2323, - "step": 267700 - }, - { - "epoch": 0.93, - "learning_rate": 3.3145924378394024e-06, - "loss": 2.3762, - "step": 267710 - }, - { - "epoch": 0.93, - "learning_rate": 3.312848557985749e-06, - "loss": 2.346, - "step": 267720 - }, - { - "epoch": 0.93, - "learning_rate": 3.311104678132096e-06, - "loss": 2.3333, - "step": 267730 - }, - { - "epoch": 0.93, - "learning_rate": 3.309360798278442e-06, - "loss": 2.3027, - "step": 267740 - }, - { - "epoch": 0.93, - "learning_rate": 3.3076169184247884e-06, - "loss": 2.2835, - "step": 267750 - }, - { - "epoch": 0.93, - "learning_rate": 3.3058730385711346e-06, - "loss": 2.3054, - "step": 267760 - }, - { - "epoch": 0.93, - "learning_rate": 3.304129158717481e-06, - "loss": 2.3485, - "step": 267770 - }, - { - "epoch": 0.93, - "learning_rate": 3.302385278863827e-06, - "loss": 2.2954, - "step": 267780 - }, - { - "epoch": 0.93, - "learning_rate": 3.300641399010174e-06, - "loss": 2.3449, - "step": 267790 - }, - { - "epoch": 0.93, - "learning_rate": 3.2988975191565206e-06, - "loss": 2.3644, - "step": 267800 - }, - { - "epoch": 0.93, - "learning_rate": 3.297153639302867e-06, - "loss": 2.3879, - "step": 267810 - }, - { - "epoch": 0.93, - "learning_rate": 3.295409759449213e-06, - "loss": 2.3376, - "step": 267820 - }, - { - "epoch": 0.93, - "learning_rate": 3.2936658795955594e-06, - "loss": 2.3645, - "step": 267830 - }, - { - "epoch": 0.93, - "learning_rate": 3.2919219997419056e-06, - "loss": 2.3407, - "step": 267840 - }, - { - "epoch": 0.93, - "learning_rate": 3.2901781198882523e-06, - "loss": 2.3452, - "step": 267850 - }, - { - "epoch": 0.93, - "learning_rate": 3.2884342400345986e-06, - "loss": 2.3048, - "step": 267860 - }, - { - "epoch": 0.93, - "learning_rate": 3.2866903601809453e-06, - "loss": 2.4246, - "step": 267870 - }, - { - "epoch": 0.93, - "learning_rate": 3.2849464803272916e-06, - "loss": 2.2928, - "step": 267880 - }, - { - "epoch": 0.93, - "learning_rate": 3.283202600473638e-06, - "loss": 2.3369, - "step": 267890 - }, - { - "epoch": 0.93, - "learning_rate": 3.281458720619984e-06, - "loss": 2.3034, - "step": 267900 - }, - { - "epoch": 0.93, - "learning_rate": 3.2797148407663304e-06, - "loss": 2.3432, - "step": 267910 - }, - { - "epoch": 0.93, - "learning_rate": 3.277970960912677e-06, - "loss": 2.3047, - "step": 267920 - }, - { - "epoch": 0.93, - "learning_rate": 3.2762270810590237e-06, - "loss": 2.2404, - "step": 267930 - }, - { - "epoch": 0.93, - "learning_rate": 3.27448320120537e-06, - "loss": 2.2812, - "step": 267940 - }, - { - "epoch": 0.93, - "learning_rate": 3.2727393213517163e-06, - "loss": 2.3261, - "step": 267950 - }, - { - "epoch": 0.93, - "learning_rate": 3.2709954414980626e-06, - "loss": 2.376, - "step": 267960 - }, - { - "epoch": 0.93, - "learning_rate": 3.269251561644409e-06, - "loss": 2.2771, - "step": 267970 - }, - { - "epoch": 0.93, - "learning_rate": 3.2675076817907555e-06, - "loss": 2.3382, - "step": 267980 - }, - { - "epoch": 0.93, - "learning_rate": 3.2657638019371018e-06, - "loss": 2.3275, - "step": 267990 - }, - { - "epoch": 0.93, - "learning_rate": 3.2640199220834485e-06, - "loss": 2.3548, - "step": 268000 - }, - { - "epoch": 0.93, - "learning_rate": 3.2622760422297947e-06, - "loss": 2.3071, - "step": 268010 - }, - { - "epoch": 0.93, - "learning_rate": 3.260532162376141e-06, - "loss": 2.4043, - "step": 268020 - }, - { - "epoch": 0.93, - "learning_rate": 3.2587882825224873e-06, - "loss": 2.3464, - "step": 268030 - }, - { - "epoch": 0.93, - "learning_rate": 3.2570444026688336e-06, - "loss": 2.3215, - "step": 268040 - }, - { - "epoch": 0.93, - "learning_rate": 3.2553005228151802e-06, - "loss": 2.3359, - "step": 268050 - }, - { - "epoch": 0.93, - "learning_rate": 3.2535566429615265e-06, - "loss": 2.3352, - "step": 268060 - }, - { - "epoch": 0.93, - "learning_rate": 3.251812763107873e-06, - "loss": 2.3163, - "step": 268070 - }, - { - "epoch": 0.93, - "learning_rate": 3.2500688832542195e-06, - "loss": 2.296, - "step": 268080 - }, - { - "epoch": 0.94, - "learning_rate": 3.2483250034005657e-06, - "loss": 2.2871, - "step": 268090 - }, - { - "epoch": 0.94, - "learning_rate": 3.246581123546912e-06, - "loss": 2.4058, - "step": 268100 - }, - { - "epoch": 0.94, - "learning_rate": 3.2448372436932587e-06, - "loss": 2.3273, - "step": 268110 - }, - { - "epoch": 0.94, - "learning_rate": 3.243093363839605e-06, - "loss": 2.3632, - "step": 268120 - }, - { - "epoch": 0.94, - "learning_rate": 3.2413494839859517e-06, - "loss": 2.3912, - "step": 268130 - }, - { - "epoch": 0.94, - "learning_rate": 3.239605604132298e-06, - "loss": 2.3127, - "step": 268140 - }, - { - "epoch": 0.94, - "learning_rate": 3.237861724278644e-06, - "loss": 2.2076, - "step": 268150 - }, - { - "epoch": 0.94, - "learning_rate": 3.2361178444249905e-06, - "loss": 2.3005, - "step": 268160 - }, - { - "epoch": 0.94, - "learning_rate": 3.2343739645713367e-06, - "loss": 2.3812, - "step": 268170 - }, - { - "epoch": 0.94, - "learning_rate": 3.2326300847176834e-06, - "loss": 2.3721, - "step": 268180 - }, - { - "epoch": 0.94, - "learning_rate": 3.2308862048640297e-06, - "loss": 2.3867, - "step": 268190 - }, - { - "epoch": 0.94, - "learning_rate": 3.2291423250103764e-06, - "loss": 2.2818, - "step": 268200 - }, - { - "epoch": 0.94, - "learning_rate": 3.2273984451567227e-06, - "loss": 2.3186, - "step": 268210 - }, - { - "epoch": 0.94, - "learning_rate": 3.225654565303069e-06, - "loss": 2.3183, - "step": 268220 - }, - { - "epoch": 0.94, - "learning_rate": 3.2239106854494152e-06, - "loss": 2.283, - "step": 268230 - }, - { - "epoch": 0.94, - "learning_rate": 3.222166805595762e-06, - "loss": 2.3152, - "step": 268240 - }, - { - "epoch": 0.94, - "learning_rate": 3.220422925742108e-06, - "loss": 2.2902, - "step": 268250 - }, - { - "epoch": 0.94, - "learning_rate": 3.2186790458884544e-06, - "loss": 2.3699, - "step": 268260 - }, - { - "epoch": 0.94, - "learning_rate": 3.216935166034801e-06, - "loss": 2.3356, - "step": 268270 - }, - { - "epoch": 0.94, - "learning_rate": 3.2151912861811474e-06, - "loss": 2.3143, - "step": 268280 - }, - { - "epoch": 0.94, - "learning_rate": 3.2134474063274937e-06, - "loss": 2.3904, - "step": 268290 - }, - { - "epoch": 0.94, - "learning_rate": 3.21170352647384e-06, - "loss": 2.3018, - "step": 268300 - }, - { - "epoch": 0.94, - "learning_rate": 3.2099596466201866e-06, - "loss": 2.3431, - "step": 268310 - }, - { - "epoch": 0.94, - "learning_rate": 3.208215766766533e-06, - "loss": 2.2835, - "step": 268320 - }, - { - "epoch": 0.94, - "learning_rate": 3.2064718869128796e-06, - "loss": 2.3903, - "step": 268330 - }, - { - "epoch": 0.94, - "learning_rate": 3.204728007059226e-06, - "loss": 2.2608, - "step": 268340 - }, - { - "epoch": 0.94, - "learning_rate": 3.202984127205572e-06, - "loss": 2.3174, - "step": 268350 - }, - { - "epoch": 0.94, - "learning_rate": 3.2012402473519184e-06, - "loss": 2.3496, - "step": 268360 - }, - { - "epoch": 0.94, - "learning_rate": 3.199496367498265e-06, - "loss": 2.3752, - "step": 268370 - }, - { - "epoch": 0.94, - "learning_rate": 3.1977524876446114e-06, - "loss": 2.3236, - "step": 268380 - }, - { - "epoch": 0.94, - "learning_rate": 3.1960086077909576e-06, - "loss": 2.3275, - "step": 268390 - }, - { - "epoch": 0.94, - "learning_rate": 3.1942647279373043e-06, - "loss": 2.3365, - "step": 268400 - }, - { - "epoch": 0.94, - "learning_rate": 3.1925208480836506e-06, - "loss": 2.3484, - "step": 268410 - }, - { - "epoch": 0.94, - "learning_rate": 3.190776968229997e-06, - "loss": 2.3008, - "step": 268420 - }, - { - "epoch": 0.94, - "learning_rate": 3.189033088376343e-06, - "loss": 2.3974, - "step": 268430 - }, - { - "epoch": 0.94, - "learning_rate": 3.18728920852269e-06, - "loss": 2.3647, - "step": 268440 - }, - { - "epoch": 0.94, - "learning_rate": 3.185545328669036e-06, - "loss": 2.3493, - "step": 268450 - }, - { - "epoch": 0.94, - "learning_rate": 3.1838014488153824e-06, - "loss": 2.4011, - "step": 268460 - }, - { - "epoch": 0.94, - "learning_rate": 3.182057568961729e-06, - "loss": 2.3831, - "step": 268470 - }, - { - "epoch": 0.94, - "learning_rate": 3.1803136891080753e-06, - "loss": 2.3335, - "step": 268480 - }, - { - "epoch": 0.94, - "learning_rate": 3.1785698092544216e-06, - "loss": 2.3677, - "step": 268490 - }, - { - "epoch": 0.94, - "learning_rate": 3.1768259294007683e-06, - "loss": 2.2806, - "step": 268500 - }, - { - "epoch": 0.94, - "learning_rate": 3.1750820495471146e-06, - "loss": 2.274, - "step": 268510 - }, - { - "epoch": 0.94, - "learning_rate": 3.173338169693461e-06, - "loss": 2.3286, - "step": 268520 - }, - { - "epoch": 0.94, - "learning_rate": 3.1715942898398075e-06, - "loss": 2.3776, - "step": 268530 - }, - { - "epoch": 0.94, - "learning_rate": 3.169850409986154e-06, - "loss": 2.296, - "step": 268540 - }, - { - "epoch": 0.94, - "learning_rate": 3.1681065301325e-06, - "loss": 2.3454, - "step": 268550 - }, - { - "epoch": 0.94, - "learning_rate": 3.1663626502788463e-06, - "loss": 2.3205, - "step": 268560 - }, - { - "epoch": 0.94, - "learning_rate": 3.164618770425193e-06, - "loss": 2.3179, - "step": 268570 - }, - { - "epoch": 0.94, - "learning_rate": 3.1628748905715393e-06, - "loss": 2.2403, - "step": 268580 - }, - { - "epoch": 0.94, - "learning_rate": 3.1611310107178856e-06, - "loss": 2.2327, - "step": 268590 - }, - { - "epoch": 0.94, - "learning_rate": 3.1593871308642323e-06, - "loss": 2.3172, - "step": 268600 - }, - { - "epoch": 0.94, - "learning_rate": 3.1576432510105785e-06, - "loss": 2.3386, - "step": 268610 - }, - { - "epoch": 0.94, - "learning_rate": 3.155899371156925e-06, - "loss": 2.4413, - "step": 268620 - }, - { - "epoch": 0.94, - "learning_rate": 3.1541554913032715e-06, - "loss": 2.3189, - "step": 268630 - }, - { - "epoch": 0.94, - "learning_rate": 3.1524116114496178e-06, - "loss": 2.2961, - "step": 268640 - }, - { - "epoch": 0.94, - "learning_rate": 3.150667731595964e-06, - "loss": 2.4254, - "step": 268650 - }, - { - "epoch": 0.94, - "learning_rate": 3.1489238517423103e-06, - "loss": 2.3424, - "step": 268660 - }, - { - "epoch": 0.94, - "learning_rate": 3.147179971888657e-06, - "loss": 2.34, - "step": 268670 - }, - { - "epoch": 0.94, - "learning_rate": 3.1454360920350033e-06, - "loss": 2.3444, - "step": 268680 - }, - { - "epoch": 0.94, - "learning_rate": 3.1436922121813495e-06, - "loss": 2.4197, - "step": 268690 - }, - { - "epoch": 0.94, - "learning_rate": 3.1419483323276962e-06, - "loss": 2.2884, - "step": 268700 - }, - { - "epoch": 0.94, - "learning_rate": 3.1402044524740425e-06, - "loss": 2.3535, - "step": 268710 - }, - { - "epoch": 0.94, - "learning_rate": 3.1384605726203888e-06, - "loss": 2.2627, - "step": 268720 - }, - { - "epoch": 0.94, - "learning_rate": 3.1367166927667355e-06, - "loss": 2.313, - "step": 268730 - }, - { - "epoch": 0.94, - "learning_rate": 3.1349728129130817e-06, - "loss": 2.2839, - "step": 268740 - }, - { - "epoch": 0.94, - "learning_rate": 3.133228933059428e-06, - "loss": 2.3278, - "step": 268750 - }, - { - "epoch": 0.94, - "learning_rate": 3.1314850532057747e-06, - "loss": 2.3351, - "step": 268760 - }, - { - "epoch": 0.94, - "learning_rate": 3.129741173352121e-06, - "loss": 2.3313, - "step": 268770 - }, - { - "epoch": 0.94, - "learning_rate": 3.1279972934984672e-06, - "loss": 2.328, - "step": 268780 - }, - { - "epoch": 0.94, - "learning_rate": 3.1262534136448135e-06, - "loss": 2.3402, - "step": 268790 - }, - { - "epoch": 0.94, - "learning_rate": 3.12450953379116e-06, - "loss": 2.3378, - "step": 268800 - }, - { - "epoch": 0.94, - "learning_rate": 3.1227656539375065e-06, - "loss": 2.3087, - "step": 268810 - }, - { - "epoch": 0.94, - "learning_rate": 3.121021774083853e-06, - "loss": 2.299, - "step": 268820 - }, - { - "epoch": 0.94, - "learning_rate": 3.1192778942301994e-06, - "loss": 2.3322, - "step": 268830 - }, - { - "epoch": 0.94, - "learning_rate": 3.1175340143765457e-06, - "loss": 2.3527, - "step": 268840 - }, - { - "epoch": 0.94, - "learning_rate": 3.115790134522892e-06, - "loss": 2.3992, - "step": 268850 - }, - { - "epoch": 0.94, - "learning_rate": 3.1140462546692386e-06, - "loss": 2.3188, - "step": 268860 - }, - { - "epoch": 0.94, - "learning_rate": 3.112302374815585e-06, - "loss": 2.2936, - "step": 268870 - }, - { - "epoch": 0.94, - "learning_rate": 3.110558494961931e-06, - "loss": 2.2889, - "step": 268880 - }, - { - "epoch": 0.94, - "learning_rate": 3.108814615108278e-06, - "loss": 2.4106, - "step": 268890 - }, - { - "epoch": 0.94, - "learning_rate": 3.107070735254624e-06, - "loss": 2.4032, - "step": 268900 - }, - { - "epoch": 0.94, - "learning_rate": 3.1053268554009704e-06, - "loss": 2.3112, - "step": 268910 - }, - { - "epoch": 0.94, - "learning_rate": 3.103582975547317e-06, - "loss": 2.2897, - "step": 268920 - }, - { - "epoch": 0.94, - "learning_rate": 3.1018390956936634e-06, - "loss": 2.2743, - "step": 268930 - }, - { - "epoch": 0.94, - "learning_rate": 3.1000952158400096e-06, - "loss": 2.2386, - "step": 268940 - }, - { - "epoch": 0.94, - "learning_rate": 3.0983513359863563e-06, - "loss": 2.3569, - "step": 268950 - }, - { - "epoch": 0.94, - "learning_rate": 3.0966074561327026e-06, - "loss": 2.301, - "step": 268960 - }, - { - "epoch": 0.94, - "learning_rate": 3.094863576279049e-06, - "loss": 2.3022, - "step": 268970 - }, - { - "epoch": 0.94, - "learning_rate": 3.093119696425395e-06, - "loss": 2.2962, - "step": 268980 - }, - { - "epoch": 0.94, - "learning_rate": 3.091375816571742e-06, - "loss": 2.4098, - "step": 268990 - }, - { - "epoch": 0.94, - "learning_rate": 3.089631936718088e-06, - "loss": 2.3266, - "step": 269000 - }, - { - "epoch": 0.94, - "learning_rate": 3.0878880568644344e-06, - "loss": 2.3752, - "step": 269010 - }, - { - "epoch": 0.94, - "learning_rate": 3.086144177010781e-06, - "loss": 2.4, - "step": 269020 - }, - { - "epoch": 0.94, - "learning_rate": 3.0844002971571273e-06, - "loss": 2.3554, - "step": 269030 - }, - { - "epoch": 0.94, - "learning_rate": 3.0826564173034736e-06, - "loss": 2.3156, - "step": 269040 - }, - { - "epoch": 0.94, - "learning_rate": 3.0809125374498203e-06, - "loss": 2.3556, - "step": 269050 - }, - { - "epoch": 0.94, - "learning_rate": 3.0791686575961666e-06, - "loss": 2.2963, - "step": 269060 - }, - { - "epoch": 0.94, - "learning_rate": 3.077424777742513e-06, - "loss": 2.3522, - "step": 269070 - }, - { - "epoch": 0.94, - "learning_rate": 3.0756808978888595e-06, - "loss": 2.2944, - "step": 269080 - }, - { - "epoch": 0.94, - "learning_rate": 3.073937018035206e-06, - "loss": 2.29, - "step": 269090 - }, - { - "epoch": 0.94, - "learning_rate": 3.072193138181552e-06, - "loss": 2.4056, - "step": 269100 - }, - { - "epoch": 0.94, - "learning_rate": 3.0704492583278983e-06, - "loss": 2.3714, - "step": 269110 - }, - { - "epoch": 0.94, - "learning_rate": 3.068705378474245e-06, - "loss": 2.2994, - "step": 269120 - }, - { - "epoch": 0.94, - "learning_rate": 3.0669614986205913e-06, - "loss": 2.436, - "step": 269130 - }, - { - "epoch": 0.94, - "learning_rate": 3.0652176187669376e-06, - "loss": 2.3371, - "step": 269140 - }, - { - "epoch": 0.94, - "learning_rate": 3.0634737389132843e-06, - "loss": 2.3262, - "step": 269150 - }, - { - "epoch": 0.94, - "learning_rate": 3.0617298590596305e-06, - "loss": 2.3707, - "step": 269160 - }, - { - "epoch": 0.94, - "learning_rate": 3.059985979205977e-06, - "loss": 2.28, - "step": 269170 - }, - { - "epoch": 0.94, - "learning_rate": 3.0582420993523235e-06, - "loss": 2.3005, - "step": 269180 - }, - { - "epoch": 0.94, - "learning_rate": 3.0564982194986698e-06, - "loss": 2.3709, - "step": 269190 - }, - { - "epoch": 0.94, - "learning_rate": 3.054754339645016e-06, - "loss": 2.3341, - "step": 269200 - }, - { - "epoch": 0.94, - "learning_rate": 3.0530104597913627e-06, - "loss": 2.3063, - "step": 269210 - }, - { - "epoch": 0.94, - "learning_rate": 3.051266579937709e-06, - "loss": 2.35, - "step": 269220 - }, - { - "epoch": 0.94, - "learning_rate": 3.0495227000840553e-06, - "loss": 2.3585, - "step": 269230 - }, - { - "epoch": 0.94, - "learning_rate": 3.0477788202304015e-06, - "loss": 2.3599, - "step": 269240 - }, - { - "epoch": 0.94, - "learning_rate": 3.0460349403767482e-06, - "loss": 2.275, - "step": 269250 - }, - { - "epoch": 0.94, - "learning_rate": 3.0442910605230945e-06, - "loss": 2.3699, - "step": 269260 - }, - { - "epoch": 0.94, - "learning_rate": 3.0425471806694408e-06, - "loss": 2.257, - "step": 269270 - }, - { - "epoch": 0.94, - "learning_rate": 3.0408033008157875e-06, - "loss": 2.3226, - "step": 269280 - }, - { - "epoch": 0.94, - "learning_rate": 3.0390594209621337e-06, - "loss": 2.3167, - "step": 269290 - }, - { - "epoch": 0.94, - "learning_rate": 3.03731554110848e-06, - "loss": 2.3049, - "step": 269300 - }, - { - "epoch": 0.94, - "learning_rate": 3.0355716612548267e-06, - "loss": 2.3278, - "step": 269310 - }, - { - "epoch": 0.94, - "learning_rate": 3.033827781401173e-06, - "loss": 2.3351, - "step": 269320 - }, - { - "epoch": 0.94, - "learning_rate": 3.0320839015475192e-06, - "loss": 2.3905, - "step": 269330 - }, - { - "epoch": 0.94, - "learning_rate": 3.0303400216938655e-06, - "loss": 2.317, - "step": 269340 - }, - { - "epoch": 0.94, - "learning_rate": 3.028596141840212e-06, - "loss": 2.3319, - "step": 269350 - }, - { - "epoch": 0.94, - "learning_rate": 3.0268522619865585e-06, - "loss": 2.3439, - "step": 269360 - }, - { - "epoch": 0.94, - "learning_rate": 3.0251083821329047e-06, - "loss": 2.3149, - "step": 269370 - }, - { - "epoch": 0.94, - "learning_rate": 3.0233645022792514e-06, - "loss": 2.35, - "step": 269380 - }, - { - "epoch": 0.94, - "learning_rate": 3.0216206224255977e-06, - "loss": 2.3662, - "step": 269390 - }, - { - "epoch": 0.94, - "learning_rate": 3.019876742571944e-06, - "loss": 2.3149, - "step": 269400 - }, - { - "epoch": 0.94, - "learning_rate": 3.0181328627182907e-06, - "loss": 2.2984, - "step": 269410 - }, - { - "epoch": 0.94, - "learning_rate": 3.016388982864637e-06, - "loss": 2.2738, - "step": 269420 - }, - { - "epoch": 0.94, - "learning_rate": 3.014645103010983e-06, - "loss": 2.2756, - "step": 269430 - }, - { - "epoch": 0.94, - "learning_rate": 3.0129012231573295e-06, - "loss": 2.2727, - "step": 269440 - }, - { - "epoch": 0.94, - "learning_rate": 3.011157343303676e-06, - "loss": 2.2752, - "step": 269450 - }, - { - "epoch": 0.94, - "learning_rate": 3.0094134634500224e-06, - "loss": 2.3502, - "step": 269460 - }, - { - "epoch": 0.94, - "learning_rate": 3.0076695835963687e-06, - "loss": 2.3799, - "step": 269470 - }, - { - "epoch": 0.94, - "learning_rate": 3.0059257037427154e-06, - "loss": 2.3095, - "step": 269480 - }, - { - "epoch": 0.94, - "learning_rate": 3.0041818238890617e-06, - "loss": 2.3235, - "step": 269490 - }, - { - "epoch": 0.94, - "learning_rate": 3.002437944035408e-06, - "loss": 2.3587, - "step": 269500 - }, - { - "epoch": 0.94, - "learning_rate": 3.0006940641817546e-06, - "loss": 2.2959, - "step": 269510 - }, - { - "epoch": 0.94, - "learning_rate": 2.998950184328101e-06, - "loss": 2.2488, - "step": 269520 - }, - { - "epoch": 0.94, - "learning_rate": 2.997206304474447e-06, - "loss": 2.4415, - "step": 269530 - }, - { - "epoch": 0.94, - "learning_rate": 2.9954624246207934e-06, - "loss": 2.3114, - "step": 269540 - }, - { - "epoch": 0.94, - "learning_rate": 2.99371854476714e-06, - "loss": 2.3242, - "step": 269550 - }, - { - "epoch": 0.94, - "learning_rate": 2.9919746649134864e-06, - "loss": 2.2573, - "step": 269560 - }, - { - "epoch": 0.94, - "learning_rate": 2.9902307850598327e-06, - "loss": 2.3017, - "step": 269570 - }, - { - "epoch": 0.94, - "learning_rate": 2.9884869052061794e-06, - "loss": 2.3151, - "step": 269580 - }, - { - "epoch": 0.94, - "learning_rate": 2.9867430253525256e-06, - "loss": 2.2936, - "step": 269590 - }, - { - "epoch": 0.94, - "learning_rate": 2.984999145498872e-06, - "loss": 2.2979, - "step": 269600 - }, - { - "epoch": 0.94, - "learning_rate": 2.9832552656452186e-06, - "loss": 2.2841, - "step": 269610 - }, - { - "epoch": 0.94, - "learning_rate": 2.981511385791565e-06, - "loss": 2.3825, - "step": 269620 - }, - { - "epoch": 0.94, - "learning_rate": 2.979767505937911e-06, - "loss": 2.3372, - "step": 269630 - }, - { - "epoch": 0.94, - "learning_rate": 2.9780236260842574e-06, - "loss": 2.4489, - "step": 269640 - }, - { - "epoch": 0.94, - "learning_rate": 2.976279746230604e-06, - "loss": 2.2436, - "step": 269650 - }, - { - "epoch": 0.94, - "learning_rate": 2.9745358663769504e-06, - "loss": 2.2951, - "step": 269660 - }, - { - "epoch": 0.94, - "learning_rate": 2.9727919865232966e-06, - "loss": 2.4182, - "step": 269670 - }, - { - "epoch": 0.94, - "learning_rate": 2.9710481066696433e-06, - "loss": 2.2777, - "step": 269680 - }, - { - "epoch": 0.94, - "learning_rate": 2.9693042268159896e-06, - "loss": 2.3449, - "step": 269690 - }, - { - "epoch": 0.94, - "learning_rate": 2.967560346962336e-06, - "loss": 2.4102, - "step": 269700 - }, - { - "epoch": 0.94, - "learning_rate": 2.9658164671086825e-06, - "loss": 2.2411, - "step": 269710 - }, - { - "epoch": 0.94, - "learning_rate": 2.964072587255029e-06, - "loss": 2.2837, - "step": 269720 - }, - { - "epoch": 0.94, - "learning_rate": 2.962328707401375e-06, - "loss": 2.3396, - "step": 269730 - }, - { - "epoch": 0.94, - "learning_rate": 2.9605848275477214e-06, - "loss": 2.3519, - "step": 269740 - }, - { - "epoch": 0.94, - "learning_rate": 2.958840947694068e-06, - "loss": 2.3368, - "step": 269750 - }, - { - "epoch": 0.94, - "learning_rate": 2.9570970678404143e-06, - "loss": 2.3734, - "step": 269760 - }, - { - "epoch": 0.94, - "learning_rate": 2.9553531879867606e-06, - "loss": 2.3449, - "step": 269770 - }, - { - "epoch": 0.94, - "learning_rate": 2.9536093081331073e-06, - "loss": 2.3784, - "step": 269780 - }, - { - "epoch": 0.94, - "learning_rate": 2.9518654282794535e-06, - "loss": 2.2199, - "step": 269790 - }, - { - "epoch": 0.94, - "learning_rate": 2.9501215484258e-06, - "loss": 2.2989, - "step": 269800 - }, - { - "epoch": 0.94, - "learning_rate": 2.9483776685721465e-06, - "loss": 2.3559, - "step": 269810 - }, - { - "epoch": 0.94, - "learning_rate": 2.9466337887184928e-06, - "loss": 2.3124, - "step": 269820 - }, - { - "epoch": 0.94, - "learning_rate": 2.944889908864839e-06, - "loss": 2.3662, - "step": 269830 - }, - { - "epoch": 0.94, - "learning_rate": 2.9431460290111853e-06, - "loss": 2.2884, - "step": 269840 - }, - { - "epoch": 0.94, - "learning_rate": 2.941402149157532e-06, - "loss": 2.3413, - "step": 269850 - }, - { - "epoch": 0.94, - "learning_rate": 2.9396582693038783e-06, - "loss": 2.2455, - "step": 269860 - }, - { - "epoch": 0.94, - "learning_rate": 2.9379143894502245e-06, - "loss": 2.3433, - "step": 269870 - }, - { - "epoch": 0.94, - "learning_rate": 2.9361705095965712e-06, - "loss": 2.3557, - "step": 269880 - }, - { - "epoch": 0.94, - "learning_rate": 2.9344266297429175e-06, - "loss": 2.3348, - "step": 269890 - }, - { - "epoch": 0.94, - "learning_rate": 2.9326827498892638e-06, - "loss": 2.3514, - "step": 269900 - }, - { - "epoch": 0.94, - "learning_rate": 2.9309388700356105e-06, - "loss": 2.3032, - "step": 269910 - }, - { - "epoch": 0.94, - "learning_rate": 2.9291949901819567e-06, - "loss": 2.3114, - "step": 269920 - }, - { - "epoch": 0.94, - "learning_rate": 2.927451110328303e-06, - "loss": 2.3436, - "step": 269930 - }, - { - "epoch": 0.94, - "learning_rate": 2.9257072304746493e-06, - "loss": 2.3158, - "step": 269940 - }, - { - "epoch": 0.94, - "learning_rate": 2.923963350620996e-06, - "loss": 2.2469, - "step": 269950 - }, - { - "epoch": 0.94, - "learning_rate": 2.9222194707673422e-06, - "loss": 2.2406, - "step": 269960 - }, - { - "epoch": 0.94, - "learning_rate": 2.9204755909136885e-06, - "loss": 2.4245, - "step": 269970 - }, - { - "epoch": 0.94, - "learning_rate": 2.918731711060035e-06, - "loss": 2.3021, - "step": 269980 - }, - { - "epoch": 0.94, - "learning_rate": 2.9169878312063815e-06, - "loss": 2.3799, - "step": 269990 - }, - { - "epoch": 0.94, - "learning_rate": 2.9152439513527277e-06, - "loss": 2.3248, - "step": 270000 - }, - { - "epoch": 0.94, - "learning_rate": 2.9135000714990744e-06, - "loss": 2.3114, - "step": 270010 - }, - { - "epoch": 0.94, - "learning_rate": 2.9117561916454207e-06, - "loss": 2.3445, - "step": 270020 - }, - { - "epoch": 0.94, - "learning_rate": 2.910012311791767e-06, - "loss": 2.325, - "step": 270030 - }, - { - "epoch": 0.94, - "learning_rate": 2.9082684319381132e-06, - "loss": 2.3891, - "step": 270040 - }, - { - "epoch": 0.94, - "learning_rate": 2.90652455208446e-06, - "loss": 2.2664, - "step": 270050 - }, - { - "epoch": 0.94, - "learning_rate": 2.904780672230806e-06, - "loss": 2.4291, - "step": 270060 - }, - { - "epoch": 0.94, - "learning_rate": 2.9030367923771525e-06, - "loss": 2.2906, - "step": 270070 - }, - { - "epoch": 0.94, - "learning_rate": 2.901292912523499e-06, - "loss": 2.2769, - "step": 270080 - }, - { - "epoch": 0.94, - "learning_rate": 2.8995490326698454e-06, - "loss": 2.3497, - "step": 270090 - }, - { - "epoch": 0.94, - "learning_rate": 2.8978051528161917e-06, - "loss": 2.2963, - "step": 270100 - }, - { - "epoch": 0.94, - "learning_rate": 2.8960612729625384e-06, - "loss": 2.3283, - "step": 270110 - }, - { - "epoch": 0.94, - "learning_rate": 2.8943173931088847e-06, - "loss": 2.3653, - "step": 270120 - }, - { - "epoch": 0.94, - "learning_rate": 2.892573513255231e-06, - "loss": 2.3887, - "step": 270130 - }, - { - "epoch": 0.94, - "learning_rate": 2.8908296334015776e-06, - "loss": 2.3836, - "step": 270140 - }, - { - "epoch": 0.94, - "learning_rate": 2.889085753547924e-06, - "loss": 2.3385, - "step": 270150 - }, - { - "epoch": 0.94, - "learning_rate": 2.88734187369427e-06, - "loss": 2.3122, - "step": 270160 - }, - { - "epoch": 0.94, - "learning_rate": 2.8855979938406164e-06, - "loss": 2.3411, - "step": 270170 - }, - { - "epoch": 0.94, - "learning_rate": 2.883854113986963e-06, - "loss": 2.3776, - "step": 270180 - }, - { - "epoch": 0.94, - "learning_rate": 2.8821102341333094e-06, - "loss": 2.3298, - "step": 270190 - }, - { - "epoch": 0.94, - "learning_rate": 2.8803663542796557e-06, - "loss": 2.3978, - "step": 270200 - }, - { - "epoch": 0.94, - "learning_rate": 2.8786224744260024e-06, - "loss": 2.3419, - "step": 270210 - }, - { - "epoch": 0.94, - "learning_rate": 2.8768785945723486e-06, - "loss": 2.2454, - "step": 270220 - }, - { - "epoch": 0.94, - "learning_rate": 2.875134714718695e-06, - "loss": 2.4229, - "step": 270230 - }, - { - "epoch": 0.94, - "learning_rate": 2.8733908348650416e-06, - "loss": 2.3243, - "step": 270240 - }, - { - "epoch": 0.94, - "learning_rate": 2.871646955011388e-06, - "loss": 2.4248, - "step": 270250 - }, - { - "epoch": 0.94, - "learning_rate": 2.869903075157734e-06, - "loss": 2.3533, - "step": 270260 - }, - { - "epoch": 0.94, - "learning_rate": 2.8681591953040804e-06, - "loss": 2.3551, - "step": 270270 - }, - { - "epoch": 0.94, - "learning_rate": 2.866415315450427e-06, - "loss": 2.3305, - "step": 270280 - }, - { - "epoch": 0.94, - "learning_rate": 2.8646714355967734e-06, - "loss": 2.3669, - "step": 270290 - }, - { - "epoch": 0.94, - "learning_rate": 2.8629275557431196e-06, - "loss": 2.345, - "step": 270300 - }, - { - "epoch": 0.94, - "learning_rate": 2.8611836758894663e-06, - "loss": 2.3724, - "step": 270310 - }, - { - "epoch": 0.94, - "learning_rate": 2.8594397960358126e-06, - "loss": 2.3107, - "step": 270320 - }, - { - "epoch": 0.94, - "learning_rate": 2.857695916182159e-06, - "loss": 2.2408, - "step": 270330 - }, - { - "epoch": 0.94, - "learning_rate": 2.8559520363285056e-06, - "loss": 2.4362, - "step": 270340 - }, - { - "epoch": 0.94, - "learning_rate": 2.854208156474852e-06, - "loss": 2.3744, - "step": 270350 - }, - { - "epoch": 0.94, - "learning_rate": 2.852464276621198e-06, - "loss": 2.4255, - "step": 270360 - }, - { - "epoch": 0.94, - "learning_rate": 2.8507203967675444e-06, - "loss": 2.3815, - "step": 270370 - }, - { - "epoch": 0.94, - "learning_rate": 2.848976516913891e-06, - "loss": 2.3253, - "step": 270380 - }, - { - "epoch": 0.94, - "learning_rate": 2.8472326370602373e-06, - "loss": 2.3254, - "step": 270390 - }, - { - "epoch": 0.94, - "learning_rate": 2.8454887572065836e-06, - "loss": 2.3259, - "step": 270400 - }, - { - "epoch": 0.94, - "learning_rate": 2.8437448773529303e-06, - "loss": 2.3337, - "step": 270410 - }, - { - "epoch": 0.94, - "learning_rate": 2.8420009974992766e-06, - "loss": 2.3464, - "step": 270420 - }, - { - "epoch": 0.94, - "learning_rate": 2.840257117645623e-06, - "loss": 2.4134, - "step": 270430 - }, - { - "epoch": 0.94, - "learning_rate": 2.8385132377919695e-06, - "loss": 2.2933, - "step": 270440 - }, - { - "epoch": 0.94, - "learning_rate": 2.836769357938316e-06, - "loss": 2.3104, - "step": 270450 - }, - { - "epoch": 0.94, - "learning_rate": 2.835025478084662e-06, - "loss": 2.3252, - "step": 270460 - }, - { - "epoch": 0.94, - "learning_rate": 2.8332815982310083e-06, - "loss": 2.2065, - "step": 270470 - }, - { - "epoch": 0.94, - "learning_rate": 2.831537718377355e-06, - "loss": 2.3405, - "step": 270480 - }, - { - "epoch": 0.94, - "learning_rate": 2.8297938385237013e-06, - "loss": 2.298, - "step": 270490 - }, - { - "epoch": 0.94, - "learning_rate": 2.8280499586700476e-06, - "loss": 2.2619, - "step": 270500 - }, - { - "epoch": 0.94, - "learning_rate": 2.8263060788163943e-06, - "loss": 2.4311, - "step": 270510 - }, - { - "epoch": 0.94, - "learning_rate": 2.8245621989627405e-06, - "loss": 2.2746, - "step": 270520 - }, - { - "epoch": 0.94, - "learning_rate": 2.822818319109087e-06, - "loss": 2.3598, - "step": 270530 - }, - { - "epoch": 0.94, - "learning_rate": 2.8210744392554335e-06, - "loss": 2.313, - "step": 270540 - }, - { - "epoch": 0.94, - "learning_rate": 2.8193305594017798e-06, - "loss": 2.3221, - "step": 270550 - }, - { - "epoch": 0.94, - "learning_rate": 2.817586679548126e-06, - "loss": 2.2554, - "step": 270560 - }, - { - "epoch": 0.94, - "learning_rate": 2.8158427996944723e-06, - "loss": 2.394, - "step": 270570 - }, - { - "epoch": 0.94, - "learning_rate": 2.814098919840819e-06, - "loss": 2.3707, - "step": 270580 - }, - { - "epoch": 0.94, - "learning_rate": 2.8123550399871653e-06, - "loss": 2.3269, - "step": 270590 - }, - { - "epoch": 0.94, - "learning_rate": 2.8106111601335115e-06, - "loss": 2.304, - "step": 270600 - }, - { - "epoch": 0.94, - "learning_rate": 2.8088672802798582e-06, - "loss": 2.3656, - "step": 270610 - }, - { - "epoch": 0.94, - "learning_rate": 2.8071234004262045e-06, - "loss": 2.338, - "step": 270620 - }, - { - "epoch": 0.94, - "learning_rate": 2.8053795205725508e-06, - "loss": 2.3098, - "step": 270630 - }, - { - "epoch": 0.94, - "learning_rate": 2.8036356407188974e-06, - "loss": 2.2503, - "step": 270640 - }, - { - "epoch": 0.94, - "learning_rate": 2.8018917608652437e-06, - "loss": 2.3283, - "step": 270650 - }, - { - "epoch": 0.94, - "learning_rate": 2.80014788101159e-06, - "loss": 2.353, - "step": 270660 - }, - { - "epoch": 0.94, - "learning_rate": 2.7984040011579363e-06, - "loss": 2.3632, - "step": 270670 - }, - { - "epoch": 0.94, - "learning_rate": 2.796660121304283e-06, - "loss": 2.3495, - "step": 270680 - }, - { - "epoch": 0.94, - "learning_rate": 2.7949162414506292e-06, - "loss": 2.3278, - "step": 270690 - }, - { - "epoch": 0.94, - "learning_rate": 2.7931723615969755e-06, - "loss": 2.3607, - "step": 270700 - }, - { - "epoch": 0.94, - "learning_rate": 2.791428481743322e-06, - "loss": 2.3067, - "step": 270710 - }, - { - "epoch": 0.94, - "learning_rate": 2.7896846018896684e-06, - "loss": 2.3528, - "step": 270720 - }, - { - "epoch": 0.94, - "learning_rate": 2.7879407220360147e-06, - "loss": 2.2896, - "step": 270730 - }, - { - "epoch": 0.94, - "learning_rate": 2.7861968421823614e-06, - "loss": 2.3736, - "step": 270740 - }, - { - "epoch": 0.94, - "learning_rate": 2.7844529623287077e-06, - "loss": 2.3546, - "step": 270750 - }, - { - "epoch": 0.94, - "learning_rate": 2.782709082475054e-06, - "loss": 2.3095, - "step": 270760 - }, - { - "epoch": 0.94, - "learning_rate": 2.7809652026214002e-06, - "loss": 2.3289, - "step": 270770 - }, - { - "epoch": 0.94, - "learning_rate": 2.779221322767747e-06, - "loss": 2.3877, - "step": 270780 - }, - { - "epoch": 0.94, - "learning_rate": 2.777477442914093e-06, - "loss": 2.3596, - "step": 270790 - }, - { - "epoch": 0.94, - "learning_rate": 2.7757335630604394e-06, - "loss": 2.3212, - "step": 270800 - }, - { - "epoch": 0.94, - "learning_rate": 2.773989683206786e-06, - "loss": 2.3089, - "step": 270810 - }, - { - "epoch": 0.94, - "learning_rate": 2.7722458033531324e-06, - "loss": 2.316, - "step": 270820 - }, - { - "epoch": 0.94, - "learning_rate": 2.7705019234994787e-06, - "loss": 2.3183, - "step": 270830 - }, - { - "epoch": 0.94, - "learning_rate": 2.7687580436458254e-06, - "loss": 2.3197, - "step": 270840 - }, - { - "epoch": 0.94, - "learning_rate": 2.7670141637921716e-06, - "loss": 2.4082, - "step": 270850 - }, - { - "epoch": 0.94, - "learning_rate": 2.765270283938518e-06, - "loss": 2.2909, - "step": 270860 - }, - { - "epoch": 0.94, - "learning_rate": 2.763526404084864e-06, - "loss": 2.3013, - "step": 270870 - }, - { - "epoch": 0.94, - "learning_rate": 2.761782524231211e-06, - "loss": 2.3013, - "step": 270880 - }, - { - "epoch": 0.94, - "learning_rate": 2.760038644377557e-06, - "loss": 2.3941, - "step": 270890 - }, - { - "epoch": 0.94, - "learning_rate": 2.7582947645239034e-06, - "loss": 2.3225, - "step": 270900 - }, - { - "epoch": 0.94, - "learning_rate": 2.75655088467025e-06, - "loss": 2.3719, - "step": 270910 - }, - { - "epoch": 0.94, - "learning_rate": 2.7548070048165964e-06, - "loss": 2.3885, - "step": 270920 - }, - { - "epoch": 0.94, - "learning_rate": 2.7530631249629426e-06, - "loss": 2.3342, - "step": 270930 - }, - { - "epoch": 0.94, - "learning_rate": 2.7513192451092893e-06, - "loss": 2.3459, - "step": 270940 - }, - { - "epoch": 0.95, - "learning_rate": 2.7495753652556356e-06, - "loss": 2.2301, - "step": 270950 - }, - { - "epoch": 0.95, - "learning_rate": 2.747831485401982e-06, - "loss": 2.3882, - "step": 270960 - }, - { - "epoch": 0.95, - "learning_rate": 2.746087605548328e-06, - "loss": 2.3156, - "step": 270970 - }, - { - "epoch": 0.95, - "learning_rate": 2.744343725694675e-06, - "loss": 2.3097, - "step": 270980 - }, - { - "epoch": 0.95, - "learning_rate": 2.742599845841021e-06, - "loss": 2.2995, - "step": 270990 - }, - { - "epoch": 0.95, - "learning_rate": 2.7408559659873674e-06, - "loss": 2.37, - "step": 271000 - }, - { - "epoch": 0.95, - "learning_rate": 2.739112086133714e-06, - "loss": 2.2871, - "step": 271010 - }, - { - "epoch": 0.95, - "learning_rate": 2.7373682062800603e-06, - "loss": 2.3205, - "step": 271020 - }, - { - "epoch": 0.95, - "learning_rate": 2.7356243264264066e-06, - "loss": 2.3332, - "step": 271030 - }, - { - "epoch": 0.95, - "learning_rate": 2.7338804465727533e-06, - "loss": 2.3461, - "step": 271040 - }, - { - "epoch": 0.95, - "learning_rate": 2.7321365667190996e-06, - "loss": 2.3063, - "step": 271050 - }, - { - "epoch": 0.95, - "learning_rate": 2.730392686865446e-06, - "loss": 2.436, - "step": 271060 - }, - { - "epoch": 0.95, - "learning_rate": 2.728648807011792e-06, - "loss": 2.3583, - "step": 271070 - }, - { - "epoch": 0.95, - "learning_rate": 2.726904927158139e-06, - "loss": 2.3167, - "step": 271080 - }, - { - "epoch": 0.95, - "learning_rate": 2.725161047304485e-06, - "loss": 2.3398, - "step": 271090 - }, - { - "epoch": 0.95, - "learning_rate": 2.7234171674508313e-06, - "loss": 2.4425, - "step": 271100 - }, - { - "epoch": 0.95, - "learning_rate": 2.721673287597178e-06, - "loss": 2.35, - "step": 271110 - }, - { - "epoch": 0.95, - "learning_rate": 2.7199294077435243e-06, - "loss": 2.3008, - "step": 271120 - }, - { - "epoch": 0.95, - "learning_rate": 2.7181855278898706e-06, - "loss": 2.3306, - "step": 271130 - }, - { - "epoch": 0.95, - "learning_rate": 2.7164416480362173e-06, - "loss": 2.3078, - "step": 271140 - }, - { - "epoch": 0.95, - "learning_rate": 2.7146977681825635e-06, - "loss": 2.3845, - "step": 271150 - }, - { - "epoch": 0.95, - "learning_rate": 2.71295388832891e-06, - "loss": 2.3766, - "step": 271160 - }, - { - "epoch": 0.95, - "learning_rate": 2.711210008475256e-06, - "loss": 2.4144, - "step": 271170 - }, - { - "epoch": 0.95, - "learning_rate": 2.7094661286216028e-06, - "loss": 2.2634, - "step": 271180 - }, - { - "epoch": 0.95, - "learning_rate": 2.707722248767949e-06, - "loss": 2.4086, - "step": 271190 - }, - { - "epoch": 0.95, - "learning_rate": 2.7059783689142953e-06, - "loss": 2.3091, - "step": 271200 - }, - { - "epoch": 0.95, - "learning_rate": 2.704234489060642e-06, - "loss": 2.2234, - "step": 271210 - }, - { - "epoch": 0.95, - "learning_rate": 2.7024906092069883e-06, - "loss": 2.2804, - "step": 271220 - }, - { - "epoch": 0.95, - "learning_rate": 2.7007467293533345e-06, - "loss": 2.2997, - "step": 271230 - }, - { - "epoch": 0.95, - "learning_rate": 2.6990028494996812e-06, - "loss": 2.3765, - "step": 271240 - }, - { - "epoch": 0.95, - "learning_rate": 2.6972589696460275e-06, - "loss": 2.3811, - "step": 271250 - }, - { - "epoch": 0.95, - "learning_rate": 2.6955150897923738e-06, - "loss": 2.2881, - "step": 271260 - }, - { - "epoch": 0.95, - "learning_rate": 2.69377120993872e-06, - "loss": 2.3132, - "step": 271270 - }, - { - "epoch": 0.95, - "learning_rate": 2.6920273300850667e-06, - "loss": 2.245, - "step": 271280 - }, - { - "epoch": 0.95, - "learning_rate": 2.690283450231413e-06, - "loss": 2.3532, - "step": 271290 - }, - { - "epoch": 0.95, - "learning_rate": 2.6885395703777593e-06, - "loss": 2.335, - "step": 271300 - }, - { - "epoch": 0.95, - "learning_rate": 2.686795690524106e-06, - "loss": 2.3658, - "step": 271310 - }, - { - "epoch": 0.95, - "learning_rate": 2.6850518106704522e-06, - "loss": 2.3095, - "step": 271320 - }, - { - "epoch": 0.95, - "learning_rate": 2.6833079308167985e-06, - "loss": 2.2514, - "step": 271330 - }, - { - "epoch": 0.95, - "learning_rate": 2.681564050963145e-06, - "loss": 2.2628, - "step": 271340 - }, - { - "epoch": 0.95, - "learning_rate": 2.6798201711094915e-06, - "loss": 2.3305, - "step": 271350 - }, - { - "epoch": 0.95, - "learning_rate": 2.6780762912558377e-06, - "loss": 2.3406, - "step": 271360 - }, - { - "epoch": 0.95, - "learning_rate": 2.676332411402184e-06, - "loss": 2.3311, - "step": 271370 - }, - { - "epoch": 0.95, - "learning_rate": 2.6745885315485307e-06, - "loss": 2.3472, - "step": 271380 - }, - { - "epoch": 0.95, - "learning_rate": 2.672844651694877e-06, - "loss": 2.2616, - "step": 271390 - }, - { - "epoch": 0.95, - "learning_rate": 2.6711007718412232e-06, - "loss": 2.2225, - "step": 271400 - }, - { - "epoch": 0.95, - "learning_rate": 2.66935689198757e-06, - "loss": 2.2846, - "step": 271410 - }, - { - "epoch": 0.95, - "learning_rate": 2.667613012133916e-06, - "loss": 2.3027, - "step": 271420 - }, - { - "epoch": 0.95, - "learning_rate": 2.6658691322802625e-06, - "loss": 2.3747, - "step": 271430 - }, - { - "epoch": 0.95, - "learning_rate": 2.664125252426609e-06, - "loss": 2.3506, - "step": 271440 - }, - { - "epoch": 0.95, - "learning_rate": 2.6623813725729554e-06, - "loss": 2.3624, - "step": 271450 - }, - { - "epoch": 0.95, - "learning_rate": 2.6606374927193017e-06, - "loss": 2.3299, - "step": 271460 - }, - { - "epoch": 0.95, - "learning_rate": 2.6588936128656484e-06, - "loss": 2.3015, - "step": 271470 - }, - { - "epoch": 0.95, - "learning_rate": 2.6571497330119947e-06, - "loss": 2.2927, - "step": 271480 - }, - { - "epoch": 0.95, - "learning_rate": 2.655405853158341e-06, - "loss": 2.3088, - "step": 271490 - }, - { - "epoch": 0.95, - "learning_rate": 2.653661973304687e-06, - "loss": 2.3335, - "step": 271500 - }, - { - "epoch": 0.95, - "learning_rate": 2.651918093451034e-06, - "loss": 2.3003, - "step": 271510 - }, - { - "epoch": 0.95, - "learning_rate": 2.65017421359738e-06, - "loss": 2.2914, - "step": 271520 - }, - { - "epoch": 0.95, - "learning_rate": 2.6484303337437264e-06, - "loss": 2.2662, - "step": 271530 - }, - { - "epoch": 0.95, - "learning_rate": 2.646686453890073e-06, - "loss": 2.3501, - "step": 271540 - }, - { - "epoch": 0.95, - "learning_rate": 2.6449425740364194e-06, - "loss": 2.3654, - "step": 271550 - }, - { - "epoch": 0.95, - "learning_rate": 2.6431986941827657e-06, - "loss": 2.3714, - "step": 271560 - }, - { - "epoch": 0.95, - "learning_rate": 2.6414548143291123e-06, - "loss": 2.3575, - "step": 271570 - }, - { - "epoch": 0.95, - "learning_rate": 2.6397109344754586e-06, - "loss": 2.3583, - "step": 271580 - }, - { - "epoch": 0.95, - "learning_rate": 2.637967054621805e-06, - "loss": 2.3062, - "step": 271590 - }, - { - "epoch": 0.95, - "learning_rate": 2.636223174768151e-06, - "loss": 2.2755, - "step": 271600 - }, - { - "epoch": 0.95, - "learning_rate": 2.634479294914498e-06, - "loss": 2.3829, - "step": 271610 - }, - { - "epoch": 0.95, - "learning_rate": 2.632735415060844e-06, - "loss": 2.3207, - "step": 271620 - }, - { - "epoch": 0.95, - "learning_rate": 2.6309915352071904e-06, - "loss": 2.3587, - "step": 271630 - }, - { - "epoch": 0.95, - "learning_rate": 2.629247655353537e-06, - "loss": 2.3714, - "step": 271640 - }, - { - "epoch": 0.95, - "learning_rate": 2.6275037754998833e-06, - "loss": 2.2926, - "step": 271650 - }, - { - "epoch": 0.95, - "learning_rate": 2.6257598956462296e-06, - "loss": 2.2678, - "step": 271660 - }, - { - "epoch": 0.95, - "learning_rate": 2.6240160157925763e-06, - "loss": 2.2691, - "step": 271670 - }, - { - "epoch": 0.95, - "learning_rate": 2.6222721359389226e-06, - "loss": 2.298, - "step": 271680 - }, - { - "epoch": 0.95, - "learning_rate": 2.620528256085269e-06, - "loss": 2.3071, - "step": 271690 - }, - { - "epoch": 0.95, - "learning_rate": 2.618784376231615e-06, - "loss": 2.3615, - "step": 271700 - }, - { - "epoch": 0.95, - "learning_rate": 2.617040496377962e-06, - "loss": 2.3659, - "step": 271710 - }, - { - "epoch": 0.95, - "learning_rate": 2.615296616524308e-06, - "loss": 2.3277, - "step": 271720 - }, - { - "epoch": 0.95, - "learning_rate": 2.6135527366706543e-06, - "loss": 2.3123, - "step": 271730 - }, - { - "epoch": 0.95, - "learning_rate": 2.611808856817001e-06, - "loss": 2.3959, - "step": 271740 - }, - { - "epoch": 0.95, - "learning_rate": 2.6100649769633473e-06, - "loss": 2.3088, - "step": 271750 - }, - { - "epoch": 0.95, - "learning_rate": 2.6083210971096936e-06, - "loss": 2.3117, - "step": 271760 - }, - { - "epoch": 0.95, - "learning_rate": 2.6065772172560403e-06, - "loss": 2.3073, - "step": 271770 - }, - { - "epoch": 0.95, - "learning_rate": 2.6048333374023865e-06, - "loss": 2.2573, - "step": 271780 - }, - { - "epoch": 0.95, - "learning_rate": 2.603089457548733e-06, - "loss": 2.3664, - "step": 271790 - }, - { - "epoch": 0.95, - "learning_rate": 2.601345577695079e-06, - "loss": 2.2853, - "step": 271800 - }, - { - "epoch": 0.95, - "learning_rate": 2.5996016978414258e-06, - "loss": 2.3481, - "step": 271810 - }, - { - "epoch": 0.95, - "learning_rate": 2.597857817987772e-06, - "loss": 2.2707, - "step": 271820 - }, - { - "epoch": 0.95, - "learning_rate": 2.5961139381341183e-06, - "loss": 2.4036, - "step": 271830 - }, - { - "epoch": 0.95, - "learning_rate": 2.594370058280465e-06, - "loss": 2.306, - "step": 271840 - }, - { - "epoch": 0.95, - "learning_rate": 2.5926261784268113e-06, - "loss": 2.385, - "step": 271850 - }, - { - "epoch": 0.95, - "learning_rate": 2.5908822985731575e-06, - "loss": 2.2721, - "step": 271860 - }, - { - "epoch": 0.95, - "learning_rate": 2.5891384187195042e-06, - "loss": 2.4067, - "step": 271870 - }, - { - "epoch": 0.95, - "learning_rate": 2.5873945388658505e-06, - "loss": 2.2781, - "step": 271880 - }, - { - "epoch": 0.95, - "learning_rate": 2.5856506590121968e-06, - "loss": 2.3242, - "step": 271890 - }, - { - "epoch": 0.95, - "learning_rate": 2.583906779158543e-06, - "loss": 2.3422, - "step": 271900 - }, - { - "epoch": 0.95, - "learning_rate": 2.5821628993048897e-06, - "loss": 2.3681, - "step": 271910 - }, - { - "epoch": 0.95, - "learning_rate": 2.580419019451236e-06, - "loss": 2.3108, - "step": 271920 - }, - { - "epoch": 0.95, - "learning_rate": 2.5786751395975823e-06, - "loss": 2.2614, - "step": 271930 - }, - { - "epoch": 0.95, - "learning_rate": 2.576931259743929e-06, - "loss": 2.2715, - "step": 271940 - }, - { - "epoch": 0.95, - "learning_rate": 2.5751873798902752e-06, - "loss": 2.3854, - "step": 271950 - }, - { - "epoch": 0.95, - "learning_rate": 2.5734435000366215e-06, - "loss": 2.3528, - "step": 271960 - }, - { - "epoch": 0.95, - "learning_rate": 2.571699620182968e-06, - "loss": 2.2808, - "step": 271970 - }, - { - "epoch": 0.95, - "learning_rate": 2.5699557403293145e-06, - "loss": 2.359, - "step": 271980 - }, - { - "epoch": 0.95, - "learning_rate": 2.5682118604756607e-06, - "loss": 2.2917, - "step": 271990 - }, - { - "epoch": 0.95, - "learning_rate": 2.566467980622007e-06, - "loss": 2.3359, - "step": 272000 - }, - { - "epoch": 0.95, - "learning_rate": 2.5647241007683537e-06, - "loss": 2.3444, - "step": 272010 - }, - { - "epoch": 0.95, - "learning_rate": 2.5629802209147e-06, - "loss": 2.3435, - "step": 272020 - }, - { - "epoch": 0.95, - "learning_rate": 2.5612363410610462e-06, - "loss": 2.3013, - "step": 272030 - }, - { - "epoch": 0.95, - "learning_rate": 2.559492461207393e-06, - "loss": 2.2416, - "step": 272040 - }, - { - "epoch": 0.95, - "learning_rate": 2.557748581353739e-06, - "loss": 2.3011, - "step": 272050 - }, - { - "epoch": 0.95, - "learning_rate": 2.5560047015000855e-06, - "loss": 2.3393, - "step": 272060 - }, - { - "epoch": 0.95, - "learning_rate": 2.554260821646432e-06, - "loss": 2.389, - "step": 272070 - }, - { - "epoch": 0.95, - "learning_rate": 2.5525169417927784e-06, - "loss": 2.3676, - "step": 272080 - }, - { - "epoch": 0.95, - "learning_rate": 2.5507730619391247e-06, - "loss": 2.3476, - "step": 272090 - }, - { - "epoch": 0.95, - "learning_rate": 2.549029182085471e-06, - "loss": 2.3495, - "step": 272100 - }, - { - "epoch": 0.95, - "learning_rate": 2.5472853022318177e-06, - "loss": 2.3751, - "step": 272110 - }, - { - "epoch": 0.95, - "learning_rate": 2.545541422378164e-06, - "loss": 2.2783, - "step": 272120 - }, - { - "epoch": 0.95, - "learning_rate": 2.54379754252451e-06, - "loss": 2.2615, - "step": 272130 - }, - { - "epoch": 0.95, - "learning_rate": 2.542053662670857e-06, - "loss": 2.3595, - "step": 272140 - }, - { - "epoch": 0.95, - "learning_rate": 2.540309782817203e-06, - "loss": 2.4117, - "step": 272150 - }, - { - "epoch": 0.95, - "learning_rate": 2.5385659029635494e-06, - "loss": 2.3642, - "step": 272160 - }, - { - "epoch": 0.95, - "learning_rate": 2.536822023109896e-06, - "loss": 2.3899, - "step": 272170 - }, - { - "epoch": 0.95, - "learning_rate": 2.5350781432562424e-06, - "loss": 2.3652, - "step": 272180 - }, - { - "epoch": 0.95, - "learning_rate": 2.5333342634025887e-06, - "loss": 2.2997, - "step": 272190 - }, - { - "epoch": 0.95, - "learning_rate": 2.531590383548935e-06, - "loss": 2.3388, - "step": 272200 - }, - { - "epoch": 0.95, - "learning_rate": 2.5298465036952816e-06, - "loss": 2.3226, - "step": 272210 - }, - { - "epoch": 0.95, - "learning_rate": 2.528102623841628e-06, - "loss": 2.3382, - "step": 272220 - }, - { - "epoch": 0.95, - "learning_rate": 2.526358743987974e-06, - "loss": 2.3605, - "step": 272230 - }, - { - "epoch": 0.95, - "learning_rate": 2.524614864134321e-06, - "loss": 2.3148, - "step": 272240 - }, - { - "epoch": 0.95, - "learning_rate": 2.522870984280667e-06, - "loss": 2.342, - "step": 272250 - }, - { - "epoch": 0.95, - "learning_rate": 2.5211271044270134e-06, - "loss": 2.2945, - "step": 272260 - }, - { - "epoch": 0.95, - "learning_rate": 2.51938322457336e-06, - "loss": 2.2947, - "step": 272270 - }, - { - "epoch": 0.95, - "learning_rate": 2.5176393447197064e-06, - "loss": 2.3311, - "step": 272280 - }, - { - "epoch": 0.95, - "learning_rate": 2.5158954648660526e-06, - "loss": 2.4195, - "step": 272290 - }, - { - "epoch": 0.95, - "learning_rate": 2.514151585012399e-06, - "loss": 2.3283, - "step": 272300 - }, - { - "epoch": 0.95, - "learning_rate": 2.5124077051587456e-06, - "loss": 2.338, - "step": 272310 - }, - { - "epoch": 0.95, - "learning_rate": 2.510663825305092e-06, - "loss": 2.3117, - "step": 272320 - }, - { - "epoch": 0.95, - "learning_rate": 2.508919945451438e-06, - "loss": 2.3031, - "step": 272330 - }, - { - "epoch": 0.95, - "learning_rate": 2.507176065597785e-06, - "loss": 2.3144, - "step": 272340 - }, - { - "epoch": 0.95, - "learning_rate": 2.505432185744131e-06, - "loss": 2.2741, - "step": 272350 - }, - { - "epoch": 0.95, - "learning_rate": 2.5036883058904774e-06, - "loss": 2.4127, - "step": 272360 - }, - { - "epoch": 0.95, - "learning_rate": 2.501944426036824e-06, - "loss": 2.2104, - "step": 272370 - }, - { - "epoch": 0.95, - "learning_rate": 2.5002005461831703e-06, - "loss": 2.3148, - "step": 272380 - }, - { - "epoch": 0.95, - "learning_rate": 2.4984566663295166e-06, - "loss": 2.3321, - "step": 272390 - }, - { - "epoch": 0.95, - "learning_rate": 2.496712786475863e-06, - "loss": 2.272, - "step": 272400 - }, - { - "epoch": 0.95, - "learning_rate": 2.4949689066222096e-06, - "loss": 2.3213, - "step": 272410 - }, - { - "epoch": 0.95, - "learning_rate": 2.493225026768556e-06, - "loss": 2.2354, - "step": 272420 - }, - { - "epoch": 0.95, - "learning_rate": 2.491481146914902e-06, - "loss": 2.3524, - "step": 272430 - }, - { - "epoch": 0.95, - "learning_rate": 2.4897372670612488e-06, - "loss": 2.3168, - "step": 272440 - }, - { - "epoch": 0.95, - "learning_rate": 2.487993387207595e-06, - "loss": 2.2609, - "step": 272450 - }, - { - "epoch": 0.95, - "learning_rate": 2.4862495073539413e-06, - "loss": 2.2772, - "step": 272460 - }, - { - "epoch": 0.95, - "learning_rate": 2.484505627500288e-06, - "loss": 2.3916, - "step": 272470 - }, - { - "epoch": 0.95, - "learning_rate": 2.4827617476466343e-06, - "loss": 2.295, - "step": 272480 - }, - { - "epoch": 0.95, - "learning_rate": 2.4810178677929806e-06, - "loss": 2.3073, - "step": 272490 - }, - { - "epoch": 0.95, - "learning_rate": 2.479273987939327e-06, - "loss": 2.312, - "step": 272500 - }, - { - "epoch": 0.95, - "learning_rate": 2.4775301080856735e-06, - "loss": 2.3995, - "step": 272510 - }, - { - "epoch": 0.95, - "learning_rate": 2.4757862282320198e-06, - "loss": 2.3092, - "step": 272520 - }, - { - "epoch": 0.95, - "learning_rate": 2.474042348378366e-06, - "loss": 2.2973, - "step": 272530 - }, - { - "epoch": 0.95, - "learning_rate": 2.4722984685247127e-06, - "loss": 2.3502, - "step": 272540 - }, - { - "epoch": 0.95, - "learning_rate": 2.470554588671059e-06, - "loss": 2.3249, - "step": 272550 - }, - { - "epoch": 0.95, - "learning_rate": 2.4688107088174053e-06, - "loss": 2.3259, - "step": 272560 - }, - { - "epoch": 0.95, - "learning_rate": 2.467066828963752e-06, - "loss": 2.3198, - "step": 272570 - }, - { - "epoch": 0.95, - "learning_rate": 2.4653229491100982e-06, - "loss": 2.3808, - "step": 272580 - }, - { - "epoch": 0.95, - "learning_rate": 2.4635790692564445e-06, - "loss": 2.2741, - "step": 272590 - }, - { - "epoch": 0.95, - "learning_rate": 2.4618351894027908e-06, - "loss": 2.3257, - "step": 272600 - }, - { - "epoch": 0.95, - "learning_rate": 2.4600913095491375e-06, - "loss": 2.3466, - "step": 272610 - }, - { - "epoch": 0.95, - "learning_rate": 2.4583474296954837e-06, - "loss": 2.3634, - "step": 272620 - }, - { - "epoch": 0.95, - "learning_rate": 2.45660354984183e-06, - "loss": 2.232, - "step": 272630 - }, - { - "epoch": 0.95, - "learning_rate": 2.4548596699881767e-06, - "loss": 2.303, - "step": 272640 - }, - { - "epoch": 0.95, - "learning_rate": 2.453115790134523e-06, - "loss": 2.3257, - "step": 272650 - }, - { - "epoch": 0.95, - "learning_rate": 2.4513719102808692e-06, - "loss": 2.3724, - "step": 272660 - }, - { - "epoch": 0.95, - "learning_rate": 2.449628030427216e-06, - "loss": 2.297, - "step": 272670 - }, - { - "epoch": 0.95, - "learning_rate": 2.4478841505735622e-06, - "loss": 2.3563, - "step": 272680 - }, - { - "epoch": 0.95, - "learning_rate": 2.4461402707199085e-06, - "loss": 2.2821, - "step": 272690 - }, - { - "epoch": 0.95, - "learning_rate": 2.4443963908662548e-06, - "loss": 2.3591, - "step": 272700 - }, - { - "epoch": 0.95, - "learning_rate": 2.4426525110126014e-06, - "loss": 2.3441, - "step": 272710 - }, - { - "epoch": 0.95, - "learning_rate": 2.4409086311589477e-06, - "loss": 2.2619, - "step": 272720 - }, - { - "epoch": 0.95, - "learning_rate": 2.439164751305294e-06, - "loss": 2.3653, - "step": 272730 - }, - { - "epoch": 0.95, - "learning_rate": 2.4374208714516407e-06, - "loss": 2.326, - "step": 272740 - }, - { - "epoch": 0.95, - "learning_rate": 2.435676991597987e-06, - "loss": 2.3282, - "step": 272750 - }, - { - "epoch": 0.95, - "learning_rate": 2.4339331117443332e-06, - "loss": 2.2854, - "step": 272760 - }, - { - "epoch": 0.95, - "learning_rate": 2.43218923189068e-06, - "loss": 2.3457, - "step": 272770 - }, - { - "epoch": 0.95, - "learning_rate": 2.430445352037026e-06, - "loss": 2.3382, - "step": 272780 - }, - { - "epoch": 0.95, - "learning_rate": 2.4287014721833724e-06, - "loss": 2.2922, - "step": 272790 - }, - { - "epoch": 0.95, - "learning_rate": 2.4269575923297187e-06, - "loss": 2.3434, - "step": 272800 - }, - { - "epoch": 0.95, - "learning_rate": 2.4252137124760654e-06, - "loss": 2.3069, - "step": 272810 - }, - { - "epoch": 0.95, - "learning_rate": 2.4234698326224117e-06, - "loss": 2.3845, - "step": 272820 - }, - { - "epoch": 0.95, - "learning_rate": 2.421725952768758e-06, - "loss": 2.2586, - "step": 272830 - }, - { - "epoch": 0.95, - "learning_rate": 2.4199820729151046e-06, - "loss": 2.3446, - "step": 272840 - }, - { - "epoch": 0.95, - "learning_rate": 2.418238193061451e-06, - "loss": 2.4214, - "step": 272850 - }, - { - "epoch": 0.95, - "learning_rate": 2.416494313207797e-06, - "loss": 2.4293, - "step": 272860 - }, - { - "epoch": 0.95, - "learning_rate": 2.414750433354144e-06, - "loss": 2.3523, - "step": 272870 - }, - { - "epoch": 0.95, - "learning_rate": 2.41300655350049e-06, - "loss": 2.3879, - "step": 272880 - }, - { - "epoch": 0.95, - "learning_rate": 2.4112626736468364e-06, - "loss": 2.3195, - "step": 272890 - }, - { - "epoch": 0.95, - "learning_rate": 2.409518793793183e-06, - "loss": 2.3587, - "step": 272900 - }, - { - "epoch": 0.95, - "learning_rate": 2.4077749139395294e-06, - "loss": 2.2615, - "step": 272910 - }, - { - "epoch": 0.95, - "learning_rate": 2.4060310340858756e-06, - "loss": 2.3716, - "step": 272920 - }, - { - "epoch": 0.95, - "learning_rate": 2.404287154232222e-06, - "loss": 2.3153, - "step": 272930 - }, - { - "epoch": 0.95, - "learning_rate": 2.4025432743785686e-06, - "loss": 2.3802, - "step": 272940 - }, - { - "epoch": 0.95, - "learning_rate": 2.400799394524915e-06, - "loss": 2.4251, - "step": 272950 - }, - { - "epoch": 0.95, - "learning_rate": 2.399055514671261e-06, - "loss": 2.3143, - "step": 272960 - }, - { - "epoch": 0.95, - "learning_rate": 2.397311634817608e-06, - "loss": 2.2254, - "step": 272970 - }, - { - "epoch": 0.95, - "learning_rate": 2.395567754963954e-06, - "loss": 2.3321, - "step": 272980 - }, - { - "epoch": 0.95, - "learning_rate": 2.3938238751103004e-06, - "loss": 2.3005, - "step": 272990 - }, - { - "epoch": 0.95, - "learning_rate": 2.392079995256647e-06, - "loss": 2.2623, - "step": 273000 - }, - { - "epoch": 0.95, - "learning_rate": 2.3903361154029933e-06, - "loss": 2.3408, - "step": 273010 - }, - { - "epoch": 0.95, - "learning_rate": 2.3885922355493396e-06, - "loss": 2.3309, - "step": 273020 - }, - { - "epoch": 0.95, - "learning_rate": 2.386848355695686e-06, - "loss": 2.3185, - "step": 273030 - }, - { - "epoch": 0.95, - "learning_rate": 2.3851044758420326e-06, - "loss": 2.2923, - "step": 273040 - }, - { - "epoch": 0.95, - "learning_rate": 2.383360595988379e-06, - "loss": 2.3042, - "step": 273050 - }, - { - "epoch": 0.95, - "learning_rate": 2.381616716134725e-06, - "loss": 2.3723, - "step": 273060 - }, - { - "epoch": 0.95, - "learning_rate": 2.379872836281072e-06, - "loss": 2.3807, - "step": 273070 - }, - { - "epoch": 0.95, - "learning_rate": 2.378128956427418e-06, - "loss": 2.2967, - "step": 273080 - }, - { - "epoch": 0.95, - "learning_rate": 2.3763850765737643e-06, - "loss": 2.3268, - "step": 273090 - }, - { - "epoch": 0.95, - "learning_rate": 2.374641196720111e-06, - "loss": 2.3374, - "step": 273100 - }, - { - "epoch": 0.95, - "learning_rate": 2.3728973168664573e-06, - "loss": 2.2927, - "step": 273110 - }, - { - "epoch": 0.95, - "learning_rate": 2.3711534370128036e-06, - "loss": 2.3044, - "step": 273120 - }, - { - "epoch": 0.95, - "learning_rate": 2.36940955715915e-06, - "loss": 2.3669, - "step": 273130 - }, - { - "epoch": 0.95, - "learning_rate": 2.3676656773054965e-06, - "loss": 2.3811, - "step": 273140 - }, - { - "epoch": 0.95, - "learning_rate": 2.365921797451843e-06, - "loss": 2.2811, - "step": 273150 - }, - { - "epoch": 0.95, - "learning_rate": 2.364177917598189e-06, - "loss": 2.2704, - "step": 273160 - }, - { - "epoch": 0.95, - "learning_rate": 2.3624340377445358e-06, - "loss": 2.3885, - "step": 273170 - }, - { - "epoch": 0.95, - "learning_rate": 2.360690157890882e-06, - "loss": 2.3676, - "step": 273180 - }, - { - "epoch": 0.95, - "learning_rate": 2.3589462780372283e-06, - "loss": 2.3481, - "step": 273190 - }, - { - "epoch": 0.95, - "learning_rate": 2.357202398183575e-06, - "loss": 2.3718, - "step": 273200 - }, - { - "epoch": 0.95, - "learning_rate": 2.3554585183299213e-06, - "loss": 2.3371, - "step": 273210 - }, - { - "epoch": 0.95, - "learning_rate": 2.3537146384762675e-06, - "loss": 2.3233, - "step": 273220 - }, - { - "epoch": 0.95, - "learning_rate": 2.351970758622614e-06, - "loss": 2.3068, - "step": 273230 - }, - { - "epoch": 0.95, - "learning_rate": 2.3502268787689605e-06, - "loss": 2.3857, - "step": 273240 - }, - { - "epoch": 0.95, - "learning_rate": 2.3484829989153068e-06, - "loss": 2.3148, - "step": 273250 - }, - { - "epoch": 0.95, - "learning_rate": 2.346739119061653e-06, - "loss": 2.2558, - "step": 273260 - }, - { - "epoch": 0.95, - "learning_rate": 2.3449952392079997e-06, - "loss": 2.2878, - "step": 273270 - }, - { - "epoch": 0.95, - "learning_rate": 2.343251359354346e-06, - "loss": 2.3722, - "step": 273280 - }, - { - "epoch": 0.95, - "learning_rate": 2.3415074795006923e-06, - "loss": 2.3527, - "step": 273290 - }, - { - "epoch": 0.95, - "learning_rate": 2.339763599647039e-06, - "loss": 2.3057, - "step": 273300 - }, - { - "epoch": 0.95, - "learning_rate": 2.3380197197933852e-06, - "loss": 2.3358, - "step": 273310 - }, - { - "epoch": 0.95, - "learning_rate": 2.3362758399397315e-06, - "loss": 2.3571, - "step": 273320 - }, - { - "epoch": 0.95, - "learning_rate": 2.3345319600860778e-06, - "loss": 2.3242, - "step": 273330 - }, - { - "epoch": 0.95, - "learning_rate": 2.3327880802324245e-06, - "loss": 2.3866, - "step": 273340 - }, - { - "epoch": 0.95, - "learning_rate": 2.3310442003787707e-06, - "loss": 2.299, - "step": 273350 - }, - { - "epoch": 0.95, - "learning_rate": 2.329300320525117e-06, - "loss": 2.2989, - "step": 273360 - }, - { - "epoch": 0.95, - "learning_rate": 2.3275564406714637e-06, - "loss": 2.3507, - "step": 273370 - }, - { - "epoch": 0.95, - "learning_rate": 2.32581256081781e-06, - "loss": 2.3549, - "step": 273380 - }, - { - "epoch": 0.95, - "learning_rate": 2.3240686809641562e-06, - "loss": 2.3343, - "step": 273390 - }, - { - "epoch": 0.95, - "learning_rate": 2.322324801110503e-06, - "loss": 2.3567, - "step": 273400 - }, - { - "epoch": 0.95, - "learning_rate": 2.320580921256849e-06, - "loss": 2.3371, - "step": 273410 - }, - { - "epoch": 0.95, - "learning_rate": 2.3188370414031955e-06, - "loss": 2.4294, - "step": 273420 - }, - { - "epoch": 0.95, - "learning_rate": 2.3170931615495417e-06, - "loss": 2.3599, - "step": 273430 - }, - { - "epoch": 0.95, - "learning_rate": 2.3153492816958884e-06, - "loss": 2.3629, - "step": 273440 - }, - { - "epoch": 0.95, - "learning_rate": 2.3136054018422347e-06, - "loss": 2.3402, - "step": 273450 - }, - { - "epoch": 0.95, - "learning_rate": 2.311861521988581e-06, - "loss": 2.3366, - "step": 273460 - }, - { - "epoch": 0.95, - "learning_rate": 2.3101176421349276e-06, - "loss": 2.3377, - "step": 273470 - }, - { - "epoch": 0.95, - "learning_rate": 2.308373762281274e-06, - "loss": 2.3716, - "step": 273480 - }, - { - "epoch": 0.95, - "learning_rate": 2.30662988242762e-06, - "loss": 2.3096, - "step": 273490 - }, - { - "epoch": 0.95, - "learning_rate": 2.304886002573967e-06, - "loss": 2.313, - "step": 273500 - }, - { - "epoch": 0.95, - "learning_rate": 2.303142122720313e-06, - "loss": 2.4223, - "step": 273510 - }, - { - "epoch": 0.95, - "learning_rate": 2.3013982428666594e-06, - "loss": 2.3661, - "step": 273520 - }, - { - "epoch": 0.95, - "learning_rate": 2.2996543630130057e-06, - "loss": 2.3461, - "step": 273530 - }, - { - "epoch": 0.95, - "learning_rate": 2.2979104831593524e-06, - "loss": 2.3093, - "step": 273540 - }, - { - "epoch": 0.95, - "learning_rate": 2.2961666033056986e-06, - "loss": 2.312, - "step": 273550 - }, - { - "epoch": 0.95, - "learning_rate": 2.294422723452045e-06, - "loss": 2.3774, - "step": 273560 - }, - { - "epoch": 0.95, - "learning_rate": 2.2926788435983916e-06, - "loss": 2.2529, - "step": 273570 - }, - { - "epoch": 0.95, - "learning_rate": 2.290934963744738e-06, - "loss": 2.2894, - "step": 273580 - }, - { - "epoch": 0.95, - "learning_rate": 2.289191083891084e-06, - "loss": 2.3238, - "step": 273590 - }, - { - "epoch": 0.95, - "learning_rate": 2.287447204037431e-06, - "loss": 2.3109, - "step": 273600 - }, - { - "epoch": 0.95, - "learning_rate": 2.285703324183777e-06, - "loss": 2.27, - "step": 273610 - }, - { - "epoch": 0.95, - "learning_rate": 2.2839594443301234e-06, - "loss": 2.2857, - "step": 273620 - }, - { - "epoch": 0.95, - "learning_rate": 2.2822155644764697e-06, - "loss": 2.4713, - "step": 273630 - }, - { - "epoch": 0.95, - "learning_rate": 2.2804716846228163e-06, - "loss": 2.3202, - "step": 273640 - }, - { - "epoch": 0.95, - "learning_rate": 2.2787278047691626e-06, - "loss": 2.3176, - "step": 273650 - }, - { - "epoch": 0.95, - "learning_rate": 2.276983924915509e-06, - "loss": 2.3788, - "step": 273660 - }, - { - "epoch": 0.95, - "learning_rate": 2.2752400450618556e-06, - "loss": 2.3163, - "step": 273670 - }, - { - "epoch": 0.95, - "learning_rate": 2.273496165208202e-06, - "loss": 2.3158, - "step": 273680 - }, - { - "epoch": 0.95, - "learning_rate": 2.271752285354548e-06, - "loss": 2.336, - "step": 273690 - }, - { - "epoch": 0.95, - "learning_rate": 2.270008405500895e-06, - "loss": 2.3108, - "step": 273700 - }, - { - "epoch": 0.95, - "learning_rate": 2.268264525647241e-06, - "loss": 2.3647, - "step": 273710 - }, - { - "epoch": 0.95, - "learning_rate": 2.2665206457935873e-06, - "loss": 2.3096, - "step": 273720 - }, - { - "epoch": 0.95, - "learning_rate": 2.2647767659399336e-06, - "loss": 2.1996, - "step": 273730 - }, - { - "epoch": 0.95, - "learning_rate": 2.2630328860862803e-06, - "loss": 2.3169, - "step": 273740 - }, - { - "epoch": 0.95, - "learning_rate": 2.2612890062326266e-06, - "loss": 2.2509, - "step": 273750 - }, - { - "epoch": 0.95, - "learning_rate": 2.259545126378973e-06, - "loss": 2.3441, - "step": 273760 - }, - { - "epoch": 0.95, - "learning_rate": 2.2578012465253195e-06, - "loss": 2.3411, - "step": 273770 - }, - { - "epoch": 0.95, - "learning_rate": 2.256057366671666e-06, - "loss": 2.3465, - "step": 273780 - }, - { - "epoch": 0.95, - "learning_rate": 2.254313486818012e-06, - "loss": 2.3026, - "step": 273790 - }, - { - "epoch": 0.95, - "learning_rate": 2.2525696069643588e-06, - "loss": 2.3896, - "step": 273800 - }, - { - "epoch": 0.95, - "learning_rate": 2.250825727110705e-06, - "loss": 2.4198, - "step": 273810 - }, - { - "epoch": 0.96, - "learning_rate": 2.2490818472570513e-06, - "loss": 2.3355, - "step": 273820 - }, - { - "epoch": 0.96, - "learning_rate": 2.2473379674033976e-06, - "loss": 2.286, - "step": 273830 - }, - { - "epoch": 0.96, - "learning_rate": 2.2455940875497443e-06, - "loss": 2.3926, - "step": 273840 - }, - { - "epoch": 0.96, - "learning_rate": 2.2438502076960905e-06, - "loss": 2.3556, - "step": 273850 - }, - { - "epoch": 0.96, - "learning_rate": 2.242106327842437e-06, - "loss": 2.3667, - "step": 273860 - }, - { - "epoch": 0.96, - "learning_rate": 2.2403624479887835e-06, - "loss": 2.3031, - "step": 273870 - }, - { - "epoch": 0.96, - "learning_rate": 2.2386185681351298e-06, - "loss": 2.3479, - "step": 273880 - }, - { - "epoch": 0.96, - "learning_rate": 2.236874688281476e-06, - "loss": 2.3203, - "step": 273890 - }, - { - "epoch": 0.96, - "learning_rate": 2.2351308084278227e-06, - "loss": 2.2561, - "step": 273900 - }, - { - "epoch": 0.96, - "learning_rate": 2.233386928574169e-06, - "loss": 2.2922, - "step": 273910 - }, - { - "epoch": 0.96, - "learning_rate": 2.2316430487205153e-06, - "loss": 2.3061, - "step": 273920 - }, - { - "epoch": 0.96, - "learning_rate": 2.2298991688668615e-06, - "loss": 2.3525, - "step": 273930 - }, - { - "epoch": 0.96, - "learning_rate": 2.2281552890132082e-06, - "loss": 2.297, - "step": 273940 - }, - { - "epoch": 0.96, - "learning_rate": 2.2264114091595545e-06, - "loss": 2.2604, - "step": 273950 - }, - { - "epoch": 0.96, - "learning_rate": 2.2246675293059008e-06, - "loss": 2.3814, - "step": 273960 - }, - { - "epoch": 0.96, - "learning_rate": 2.2229236494522475e-06, - "loss": 2.3741, - "step": 273970 - }, - { - "epoch": 0.96, - "learning_rate": 2.2211797695985937e-06, - "loss": 2.308, - "step": 273980 - }, - { - "epoch": 0.96, - "learning_rate": 2.21943588974494e-06, - "loss": 2.3193, - "step": 273990 - }, - { - "epoch": 0.96, - "learning_rate": 2.2176920098912867e-06, - "loss": 2.3547, - "step": 274000 - }, - { - "epoch": 0.96, - "learning_rate": 2.215948130037633e-06, - "loss": 2.3183, - "step": 274010 - }, - { - "epoch": 0.96, - "learning_rate": 2.2142042501839792e-06, - "loss": 2.2997, - "step": 274020 - }, - { - "epoch": 0.96, - "learning_rate": 2.2124603703303255e-06, - "loss": 2.3355, - "step": 274030 - }, - { - "epoch": 0.96, - "learning_rate": 2.210716490476672e-06, - "loss": 2.3697, - "step": 274040 - }, - { - "epoch": 0.96, - "learning_rate": 2.2089726106230185e-06, - "loss": 2.3243, - "step": 274050 - }, - { - "epoch": 0.96, - "learning_rate": 2.2072287307693647e-06, - "loss": 2.3147, - "step": 274060 - }, - { - "epoch": 0.96, - "learning_rate": 2.2054848509157114e-06, - "loss": 2.261, - "step": 274070 - }, - { - "epoch": 0.96, - "learning_rate": 2.2037409710620577e-06, - "loss": 2.3387, - "step": 274080 - }, - { - "epoch": 0.96, - "learning_rate": 2.201997091208404e-06, - "loss": 2.3752, - "step": 274090 - }, - { - "epoch": 0.96, - "learning_rate": 2.2002532113547507e-06, - "loss": 2.3558, - "step": 274100 - }, - { - "epoch": 0.96, - "learning_rate": 2.198509331501097e-06, - "loss": 2.4127, - "step": 274110 - }, - { - "epoch": 0.96, - "learning_rate": 2.196765451647443e-06, - "loss": 2.2437, - "step": 274120 - }, - { - "epoch": 0.96, - "learning_rate": 2.1950215717937895e-06, - "loss": 2.3375, - "step": 274130 - }, - { - "epoch": 0.96, - "learning_rate": 2.193277691940136e-06, - "loss": 2.2846, - "step": 274140 - }, - { - "epoch": 0.96, - "learning_rate": 2.1915338120864824e-06, - "loss": 2.2826, - "step": 274150 - }, - { - "epoch": 0.96, - "learning_rate": 2.1897899322328287e-06, - "loss": 2.351, - "step": 274160 - }, - { - "epoch": 0.96, - "learning_rate": 2.1880460523791754e-06, - "loss": 2.3876, - "step": 274170 - }, - { - "epoch": 0.96, - "learning_rate": 2.1863021725255217e-06, - "loss": 2.3793, - "step": 274180 - }, - { - "epoch": 0.96, - "learning_rate": 2.184558292671868e-06, - "loss": 2.3074, - "step": 274190 - }, - { - "epoch": 0.96, - "learning_rate": 2.1828144128182146e-06, - "loss": 2.3653, - "step": 274200 - }, - { - "epoch": 0.96, - "learning_rate": 2.181070532964561e-06, - "loss": 2.3009, - "step": 274210 - }, - { - "epoch": 0.96, - "learning_rate": 2.179326653110907e-06, - "loss": 2.3164, - "step": 274220 - }, - { - "epoch": 0.96, - "learning_rate": 2.1775827732572534e-06, - "loss": 2.3166, - "step": 274230 - }, - { - "epoch": 0.96, - "learning_rate": 2.1758388934036e-06, - "loss": 2.3332, - "step": 274240 - }, - { - "epoch": 0.96, - "learning_rate": 2.1740950135499464e-06, - "loss": 2.3572, - "step": 274250 - }, - { - "epoch": 0.96, - "learning_rate": 2.1723511336962927e-06, - "loss": 2.3211, - "step": 274260 - }, - { - "epoch": 0.96, - "learning_rate": 2.1706072538426394e-06, - "loss": 2.4078, - "step": 274270 - }, - { - "epoch": 0.96, - "learning_rate": 2.1688633739889856e-06, - "loss": 2.2922, - "step": 274280 - }, - { - "epoch": 0.96, - "learning_rate": 2.167119494135332e-06, - "loss": 2.3202, - "step": 274290 - }, - { - "epoch": 0.96, - "learning_rate": 2.1653756142816786e-06, - "loss": 2.3592, - "step": 274300 - }, - { - "epoch": 0.96, - "learning_rate": 2.163631734428025e-06, - "loss": 2.3858, - "step": 274310 - }, - { - "epoch": 0.96, - "learning_rate": 2.161887854574371e-06, - "loss": 2.4393, - "step": 274320 - }, - { - "epoch": 0.96, - "learning_rate": 2.160143974720718e-06, - "loss": 2.298, - "step": 274330 - }, - { - "epoch": 0.96, - "learning_rate": 2.158400094867064e-06, - "loss": 2.4091, - "step": 274340 - }, - { - "epoch": 0.96, - "learning_rate": 2.1566562150134104e-06, - "loss": 2.3558, - "step": 274350 - }, - { - "epoch": 0.96, - "learning_rate": 2.1549123351597566e-06, - "loss": 2.298, - "step": 274360 - }, - { - "epoch": 0.96, - "learning_rate": 2.1531684553061033e-06, - "loss": 2.3073, - "step": 274370 - }, - { - "epoch": 0.96, - "learning_rate": 2.1514245754524496e-06, - "loss": 2.3828, - "step": 274380 - }, - { - "epoch": 0.96, - "learning_rate": 2.149680695598796e-06, - "loss": 2.3839, - "step": 274390 - }, - { - "epoch": 0.96, - "learning_rate": 2.1479368157451425e-06, - "loss": 2.3284, - "step": 274400 - }, - { - "epoch": 0.96, - "learning_rate": 2.146192935891489e-06, - "loss": 2.2772, - "step": 274410 - }, - { - "epoch": 0.96, - "learning_rate": 2.144449056037835e-06, - "loss": 2.3047, - "step": 274420 - }, - { - "epoch": 0.96, - "learning_rate": 2.1427051761841818e-06, - "loss": 2.2724, - "step": 274430 - }, - { - "epoch": 0.96, - "learning_rate": 2.140961296330528e-06, - "loss": 2.3424, - "step": 274440 - }, - { - "epoch": 0.96, - "learning_rate": 2.1392174164768743e-06, - "loss": 2.3322, - "step": 274450 - }, - { - "epoch": 0.96, - "learning_rate": 2.1374735366232206e-06, - "loss": 2.3172, - "step": 274460 - }, - { - "epoch": 0.96, - "learning_rate": 2.1357296567695673e-06, - "loss": 2.3071, - "step": 274470 - }, - { - "epoch": 0.96, - "learning_rate": 2.1339857769159136e-06, - "loss": 2.3887, - "step": 274480 - }, - { - "epoch": 0.96, - "learning_rate": 2.13224189706226e-06, - "loss": 2.3214, - "step": 274490 - }, - { - "epoch": 0.96, - "learning_rate": 2.1304980172086065e-06, - "loss": 2.3045, - "step": 274500 - }, - { - "epoch": 0.96, - "learning_rate": 2.1287541373549528e-06, - "loss": 2.396, - "step": 274510 - }, - { - "epoch": 0.96, - "learning_rate": 2.127010257501299e-06, - "loss": 2.3619, - "step": 274520 - }, - { - "epoch": 0.96, - "learning_rate": 2.1252663776476457e-06, - "loss": 2.3419, - "step": 274530 - }, - { - "epoch": 0.96, - "learning_rate": 2.123522497793992e-06, - "loss": 2.2917, - "step": 274540 - }, - { - "epoch": 0.96, - "learning_rate": 2.1217786179403383e-06, - "loss": 2.3453, - "step": 274550 - }, - { - "epoch": 0.96, - "learning_rate": 2.1200347380866846e-06, - "loss": 2.3359, - "step": 274560 - }, - { - "epoch": 0.96, - "learning_rate": 2.1182908582330312e-06, - "loss": 2.3889, - "step": 274570 - }, - { - "epoch": 0.96, - "learning_rate": 2.1165469783793775e-06, - "loss": 2.4124, - "step": 274580 - }, - { - "epoch": 0.96, - "learning_rate": 2.1148030985257238e-06, - "loss": 2.3087, - "step": 274590 - }, - { - "epoch": 0.96, - "learning_rate": 2.1130592186720705e-06, - "loss": 2.3771, - "step": 274600 - }, - { - "epoch": 0.96, - "learning_rate": 2.1113153388184167e-06, - "loss": 2.3879, - "step": 274610 - }, - { - "epoch": 0.96, - "learning_rate": 2.109571458964763e-06, - "loss": 2.2912, - "step": 274620 - }, - { - "epoch": 0.96, - "learning_rate": 2.1078275791111097e-06, - "loss": 2.2613, - "step": 274630 - }, - { - "epoch": 0.96, - "learning_rate": 2.106083699257456e-06, - "loss": 2.404, - "step": 274640 - }, - { - "epoch": 0.96, - "learning_rate": 2.1043398194038022e-06, - "loss": 2.3875, - "step": 274650 - }, - { - "epoch": 0.96, - "learning_rate": 2.1025959395501485e-06, - "loss": 2.3276, - "step": 274660 - }, - { - "epoch": 0.96, - "learning_rate": 2.100852059696495e-06, - "loss": 2.3156, - "step": 274670 - }, - { - "epoch": 0.96, - "learning_rate": 2.0991081798428415e-06, - "loss": 2.3283, - "step": 274680 - }, - { - "epoch": 0.96, - "learning_rate": 2.0973642999891877e-06, - "loss": 2.3721, - "step": 274690 - }, - { - "epoch": 0.96, - "learning_rate": 2.0956204201355344e-06, - "loss": 2.3503, - "step": 274700 - }, - { - "epoch": 0.96, - "learning_rate": 2.0938765402818807e-06, - "loss": 2.3894, - "step": 274710 - }, - { - "epoch": 0.96, - "learning_rate": 2.092132660428227e-06, - "loss": 2.3067, - "step": 274720 - }, - { - "epoch": 0.96, - "learning_rate": 2.0903887805745737e-06, - "loss": 2.3593, - "step": 274730 - }, - { - "epoch": 0.96, - "learning_rate": 2.08864490072092e-06, - "loss": 2.309, - "step": 274740 - }, - { - "epoch": 0.96, - "learning_rate": 2.086901020867266e-06, - "loss": 2.3897, - "step": 274750 - }, - { - "epoch": 0.96, - "learning_rate": 2.0851571410136125e-06, - "loss": 2.3265, - "step": 274760 - }, - { - "epoch": 0.96, - "learning_rate": 2.083413261159959e-06, - "loss": 2.3059, - "step": 274770 - }, - { - "epoch": 0.96, - "learning_rate": 2.0816693813063054e-06, - "loss": 2.3484, - "step": 274780 - }, - { - "epoch": 0.96, - "learning_rate": 2.0799255014526517e-06, - "loss": 2.1853, - "step": 274790 - }, - { - "epoch": 0.96, - "learning_rate": 2.0781816215989984e-06, - "loss": 2.2944, - "step": 274800 - }, - { - "epoch": 0.96, - "learning_rate": 2.0764377417453447e-06, - "loss": 2.3021, - "step": 274810 - }, - { - "epoch": 0.96, - "learning_rate": 2.074693861891691e-06, - "loss": 2.2836, - "step": 274820 - }, - { - "epoch": 0.96, - "learning_rate": 2.0729499820380376e-06, - "loss": 2.3293, - "step": 274830 - }, - { - "epoch": 0.96, - "learning_rate": 2.071206102184384e-06, - "loss": 2.2852, - "step": 274840 - }, - { - "epoch": 0.96, - "learning_rate": 2.06946222233073e-06, - "loss": 2.327, - "step": 274850 - }, - { - "epoch": 0.96, - "learning_rate": 2.0677183424770764e-06, - "loss": 2.3523, - "step": 274860 - }, - { - "epoch": 0.96, - "learning_rate": 2.065974462623423e-06, - "loss": 2.3128, - "step": 274870 - }, - { - "epoch": 0.96, - "learning_rate": 2.0642305827697694e-06, - "loss": 2.275, - "step": 274880 - }, - { - "epoch": 0.96, - "learning_rate": 2.0624867029161157e-06, - "loss": 2.3001, - "step": 274890 - }, - { - "epoch": 0.96, - "learning_rate": 2.0607428230624624e-06, - "loss": 2.3736, - "step": 274900 - }, - { - "epoch": 0.96, - "learning_rate": 2.0589989432088086e-06, - "loss": 2.2424, - "step": 274910 - }, - { - "epoch": 0.96, - "learning_rate": 2.057255063355155e-06, - "loss": 2.2527, - "step": 274920 - }, - { - "epoch": 0.96, - "learning_rate": 2.0555111835015016e-06, - "loss": 2.3981, - "step": 274930 - }, - { - "epoch": 0.96, - "learning_rate": 2.053767303647848e-06, - "loss": 2.3283, - "step": 274940 - }, - { - "epoch": 0.96, - "learning_rate": 2.052023423794194e-06, - "loss": 2.3447, - "step": 274950 - }, - { - "epoch": 0.96, - "learning_rate": 2.0502795439405404e-06, - "loss": 2.3548, - "step": 274960 - }, - { - "epoch": 0.96, - "learning_rate": 2.048535664086887e-06, - "loss": 2.255, - "step": 274970 - }, - { - "epoch": 0.96, - "learning_rate": 2.0467917842332334e-06, - "loss": 2.4082, - "step": 274980 - }, - { - "epoch": 0.96, - "learning_rate": 2.0450479043795796e-06, - "loss": 2.312, - "step": 274990 - }, - { - "epoch": 0.96, - "learning_rate": 2.0433040245259263e-06, - "loss": 2.3026, - "step": 275000 - }, - { - "epoch": 0.96, - "learning_rate": 2.0415601446722726e-06, - "loss": 2.2922, - "step": 275010 - }, - { - "epoch": 0.96, - "learning_rate": 2.039816264818619e-06, - "loss": 2.3222, - "step": 275020 - }, - { - "epoch": 0.96, - "learning_rate": 2.0380723849649656e-06, - "loss": 2.3625, - "step": 275030 - }, - { - "epoch": 0.96, - "learning_rate": 2.036328505111312e-06, - "loss": 2.3323, - "step": 275040 - }, - { - "epoch": 0.96, - "learning_rate": 2.034584625257658e-06, - "loss": 2.3488, - "step": 275050 - }, - { - "epoch": 0.96, - "learning_rate": 2.032840745404005e-06, - "loss": 2.3135, - "step": 275060 - }, - { - "epoch": 0.96, - "learning_rate": 2.031096865550351e-06, - "loss": 2.3037, - "step": 275070 - }, - { - "epoch": 0.96, - "learning_rate": 2.0293529856966973e-06, - "loss": 2.3385, - "step": 275080 - }, - { - "epoch": 0.96, - "learning_rate": 2.0276091058430436e-06, - "loss": 2.394, - "step": 275090 - }, - { - "epoch": 0.96, - "learning_rate": 2.0258652259893903e-06, - "loss": 2.3197, - "step": 275100 - }, - { - "epoch": 0.96, - "learning_rate": 2.0241213461357366e-06, - "loss": 2.3323, - "step": 275110 - }, - { - "epoch": 0.96, - "learning_rate": 2.022377466282083e-06, - "loss": 2.3382, - "step": 275120 - }, - { - "epoch": 0.96, - "learning_rate": 2.0206335864284295e-06, - "loss": 2.3887, - "step": 275130 - }, - { - "epoch": 0.96, - "learning_rate": 2.018889706574776e-06, - "loss": 2.3314, - "step": 275140 - }, - { - "epoch": 0.96, - "learning_rate": 2.017145826721122e-06, - "loss": 2.3205, - "step": 275150 - }, - { - "epoch": 0.96, - "learning_rate": 2.0154019468674688e-06, - "loss": 2.3327, - "step": 275160 - }, - { - "epoch": 0.96, - "learning_rate": 2.013658067013815e-06, - "loss": 2.3482, - "step": 275170 - }, - { - "epoch": 0.96, - "learning_rate": 2.0119141871601613e-06, - "loss": 2.3581, - "step": 275180 - }, - { - "epoch": 0.96, - "learning_rate": 2.010170307306508e-06, - "loss": 2.3118, - "step": 275190 - }, - { - "epoch": 0.96, - "learning_rate": 2.0084264274528543e-06, - "loss": 2.2349, - "step": 275200 - }, - { - "epoch": 0.96, - "learning_rate": 2.0066825475992005e-06, - "loss": 2.2948, - "step": 275210 - }, - { - "epoch": 0.96, - "learning_rate": 2.0049386677455472e-06, - "loss": 2.3567, - "step": 275220 - }, - { - "epoch": 0.96, - "learning_rate": 2.0031947878918935e-06, - "loss": 2.2716, - "step": 275230 - }, - { - "epoch": 0.96, - "learning_rate": 2.0014509080382398e-06, - "loss": 2.2971, - "step": 275240 - }, - { - "epoch": 0.96, - "learning_rate": 1.999707028184586e-06, - "loss": 2.3372, - "step": 275250 - }, - { - "epoch": 0.96, - "learning_rate": 1.9979631483309327e-06, - "loss": 2.3474, - "step": 275260 - }, - { - "epoch": 0.96, - "learning_rate": 1.996219268477279e-06, - "loss": 2.2739, - "step": 275270 - }, - { - "epoch": 0.96, - "learning_rate": 1.9944753886236253e-06, - "loss": 2.3179, - "step": 275280 - }, - { - "epoch": 0.96, - "learning_rate": 1.992731508769972e-06, - "loss": 2.2849, - "step": 275290 - }, - { - "epoch": 0.96, - "learning_rate": 1.9909876289163182e-06, - "loss": 2.3341, - "step": 275300 - }, - { - "epoch": 0.96, - "learning_rate": 1.9892437490626645e-06, - "loss": 2.2688, - "step": 275310 - }, - { - "epoch": 0.96, - "learning_rate": 1.987499869209011e-06, - "loss": 2.3151, - "step": 275320 - }, - { - "epoch": 0.96, - "learning_rate": 1.9857559893553574e-06, - "loss": 2.2506, - "step": 275330 - }, - { - "epoch": 0.96, - "learning_rate": 1.9840121095017037e-06, - "loss": 2.3954, - "step": 275340 - }, - { - "epoch": 0.96, - "learning_rate": 1.9822682296480504e-06, - "loss": 2.4046, - "step": 275350 - }, - { - "epoch": 0.96, - "learning_rate": 1.9805243497943967e-06, - "loss": 2.3448, - "step": 275360 - }, - { - "epoch": 0.96, - "learning_rate": 1.978780469940743e-06, - "loss": 2.3901, - "step": 275370 - }, - { - "epoch": 0.96, - "learning_rate": 1.9770365900870892e-06, - "loss": 2.3331, - "step": 275380 - }, - { - "epoch": 0.96, - "learning_rate": 1.975292710233436e-06, - "loss": 2.4041, - "step": 275390 - }, - { - "epoch": 0.96, - "learning_rate": 1.973548830379782e-06, - "loss": 2.3101, - "step": 275400 - }, - { - "epoch": 0.96, - "learning_rate": 1.9718049505261285e-06, - "loss": 2.3062, - "step": 275410 - }, - { - "epoch": 0.96, - "learning_rate": 1.970061070672475e-06, - "loss": 2.3676, - "step": 275420 - }, - { - "epoch": 0.96, - "learning_rate": 1.9683171908188214e-06, - "loss": 2.2438, - "step": 275430 - }, - { - "epoch": 0.96, - "learning_rate": 1.9665733109651677e-06, - "loss": 2.3814, - "step": 275440 - }, - { - "epoch": 0.96, - "learning_rate": 1.9648294311115144e-06, - "loss": 2.2665, - "step": 275450 - }, - { - "epoch": 0.96, - "learning_rate": 1.9630855512578606e-06, - "loss": 2.3347, - "step": 275460 - }, - { - "epoch": 0.96, - "learning_rate": 1.961341671404207e-06, - "loss": 2.309, - "step": 275470 - }, - { - "epoch": 0.96, - "learning_rate": 1.9595977915505536e-06, - "loss": 2.2642, - "step": 275480 - }, - { - "epoch": 0.96, - "learning_rate": 1.9578539116969e-06, - "loss": 2.3468, - "step": 275490 - }, - { - "epoch": 0.96, - "learning_rate": 1.956110031843246e-06, - "loss": 2.3683, - "step": 275500 - }, - { - "epoch": 0.96, - "learning_rate": 1.9543661519895924e-06, - "loss": 2.3313, - "step": 275510 - }, - { - "epoch": 0.96, - "learning_rate": 1.952622272135939e-06, - "loss": 2.3105, - "step": 275520 - }, - { - "epoch": 0.96, - "learning_rate": 1.9508783922822854e-06, - "loss": 2.411, - "step": 275530 - }, - { - "epoch": 0.96, - "learning_rate": 1.9491345124286316e-06, - "loss": 2.3335, - "step": 275540 - }, - { - "epoch": 0.96, - "learning_rate": 1.9473906325749783e-06, - "loss": 2.2698, - "step": 275550 - }, - { - "epoch": 0.96, - "learning_rate": 1.9456467527213246e-06, - "loss": 2.4546, - "step": 275560 - }, - { - "epoch": 0.96, - "learning_rate": 1.943902872867671e-06, - "loss": 2.3219, - "step": 275570 - }, - { - "epoch": 0.96, - "learning_rate": 1.9421589930140176e-06, - "loss": 2.3859, - "step": 275580 - }, - { - "epoch": 0.96, - "learning_rate": 1.940415113160364e-06, - "loss": 2.2927, - "step": 275590 - }, - { - "epoch": 0.96, - "learning_rate": 1.93867123330671e-06, - "loss": 2.3691, - "step": 275600 - }, - { - "epoch": 0.96, - "learning_rate": 1.936927353453057e-06, - "loss": 2.3029, - "step": 275610 - }, - { - "epoch": 0.96, - "learning_rate": 1.935183473599403e-06, - "loss": 2.3409, - "step": 275620 - }, - { - "epoch": 0.96, - "learning_rate": 1.9334395937457493e-06, - "loss": 2.3698, - "step": 275630 - }, - { - "epoch": 0.96, - "learning_rate": 1.9316957138920956e-06, - "loss": 2.3615, - "step": 275640 - }, - { - "epoch": 0.96, - "learning_rate": 1.9299518340384423e-06, - "loss": 2.3045, - "step": 275650 - }, - { - "epoch": 0.96, - "learning_rate": 1.9282079541847886e-06, - "loss": 2.3302, - "step": 275660 - }, - { - "epoch": 0.96, - "learning_rate": 1.926464074331135e-06, - "loss": 2.329, - "step": 275670 - }, - { - "epoch": 0.96, - "learning_rate": 1.9247201944774815e-06, - "loss": 2.3134, - "step": 275680 - }, - { - "epoch": 0.96, - "learning_rate": 1.922976314623828e-06, - "loss": 2.3282, - "step": 275690 - }, - { - "epoch": 0.96, - "learning_rate": 1.921232434770174e-06, - "loss": 2.2998, - "step": 275700 - }, - { - "epoch": 0.96, - "learning_rate": 1.9194885549165208e-06, - "loss": 2.2873, - "step": 275710 - }, - { - "epoch": 0.96, - "learning_rate": 1.917744675062867e-06, - "loss": 2.3491, - "step": 275720 - }, - { - "epoch": 0.96, - "learning_rate": 1.9160007952092133e-06, - "loss": 2.3489, - "step": 275730 - }, - { - "epoch": 0.96, - "learning_rate": 1.91425691535556e-06, - "loss": 2.337, - "step": 275740 - }, - { - "epoch": 0.96, - "learning_rate": 1.9125130355019063e-06, - "loss": 2.2839, - "step": 275750 - }, - { - "epoch": 0.96, - "learning_rate": 1.9107691556482525e-06, - "loss": 2.3607, - "step": 275760 - }, - { - "epoch": 0.96, - "learning_rate": 1.909025275794599e-06, - "loss": 2.235, - "step": 275770 - }, - { - "epoch": 0.96, - "learning_rate": 1.9072813959409453e-06, - "loss": 2.3272, - "step": 275780 - }, - { - "epoch": 0.96, - "learning_rate": 1.9055375160872916e-06, - "loss": 2.3307, - "step": 275790 - }, - { - "epoch": 0.96, - "learning_rate": 1.9037936362336382e-06, - "loss": 2.37, - "step": 275800 - }, - { - "epoch": 0.96, - "learning_rate": 1.9020497563799845e-06, - "loss": 2.2042, - "step": 275810 - }, - { - "epoch": 0.96, - "learning_rate": 1.9003058765263308e-06, - "loss": 2.3326, - "step": 275820 - }, - { - "epoch": 0.96, - "learning_rate": 1.8985619966726775e-06, - "loss": 2.3651, - "step": 275830 - }, - { - "epoch": 0.96, - "learning_rate": 1.8968181168190237e-06, - "loss": 2.3727, - "step": 275840 - }, - { - "epoch": 0.96, - "learning_rate": 1.89507423696537e-06, - "loss": 2.3866, - "step": 275850 - }, - { - "epoch": 0.96, - "learning_rate": 1.8933303571117167e-06, - "loss": 2.3295, - "step": 275860 - }, - { - "epoch": 0.96, - "learning_rate": 1.891586477258063e-06, - "loss": 2.3098, - "step": 275870 - }, - { - "epoch": 0.96, - "learning_rate": 1.8898425974044092e-06, - "loss": 2.3766, - "step": 275880 - }, - { - "epoch": 0.96, - "learning_rate": 1.8880987175507555e-06, - "loss": 2.2799, - "step": 275890 - }, - { - "epoch": 0.96, - "learning_rate": 1.8863548376971022e-06, - "loss": 2.3846, - "step": 275900 - }, - { - "epoch": 0.96, - "learning_rate": 1.8846109578434485e-06, - "loss": 2.3239, - "step": 275910 - }, - { - "epoch": 0.96, - "learning_rate": 1.8828670779897947e-06, - "loss": 2.3721, - "step": 275920 - }, - { - "epoch": 0.96, - "learning_rate": 1.8811231981361414e-06, - "loss": 2.3207, - "step": 275930 - }, - { - "epoch": 0.96, - "learning_rate": 1.8793793182824877e-06, - "loss": 2.3132, - "step": 275940 - }, - { - "epoch": 0.96, - "learning_rate": 1.877635438428834e-06, - "loss": 2.3017, - "step": 275950 - }, - { - "epoch": 0.96, - "learning_rate": 1.8758915585751807e-06, - "loss": 2.382, - "step": 275960 - }, - { - "epoch": 0.96, - "learning_rate": 1.874147678721527e-06, - "loss": 2.3504, - "step": 275970 - }, - { - "epoch": 0.96, - "learning_rate": 1.8724037988678732e-06, - "loss": 2.2937, - "step": 275980 - }, - { - "epoch": 0.96, - "learning_rate": 1.8706599190142195e-06, - "loss": 2.3851, - "step": 275990 - }, - { - "epoch": 0.96, - "learning_rate": 1.8689160391605662e-06, - "loss": 2.3471, - "step": 276000 - }, - { - "epoch": 0.96, - "learning_rate": 1.8671721593069124e-06, - "loss": 2.3789, - "step": 276010 - }, - { - "epoch": 0.96, - "learning_rate": 1.8654282794532587e-06, - "loss": 2.3189, - "step": 276020 - }, - { - "epoch": 0.96, - "learning_rate": 1.8636843995996054e-06, - "loss": 2.3399, - "step": 276030 - }, - { - "epoch": 0.96, - "learning_rate": 1.8619405197459517e-06, - "loss": 2.2782, - "step": 276040 - }, - { - "epoch": 0.96, - "learning_rate": 1.860196639892298e-06, - "loss": 2.3252, - "step": 276050 - }, - { - "epoch": 0.96, - "learning_rate": 1.8584527600386446e-06, - "loss": 2.3058, - "step": 276060 - }, - { - "epoch": 0.96, - "learning_rate": 1.856708880184991e-06, - "loss": 2.2655, - "step": 276070 - }, - { - "epoch": 0.96, - "learning_rate": 1.8549650003313372e-06, - "loss": 2.3606, - "step": 276080 - }, - { - "epoch": 0.96, - "learning_rate": 1.8532211204776834e-06, - "loss": 2.3828, - "step": 276090 - }, - { - "epoch": 0.96, - "learning_rate": 1.8514772406240301e-06, - "loss": 2.321, - "step": 276100 - }, - { - "epoch": 0.96, - "learning_rate": 1.8497333607703764e-06, - "loss": 2.3105, - "step": 276110 - }, - { - "epoch": 0.96, - "learning_rate": 1.8479894809167227e-06, - "loss": 2.4135, - "step": 276120 - }, - { - "epoch": 0.96, - "learning_rate": 1.8462456010630694e-06, - "loss": 2.2479, - "step": 276130 - }, - { - "epoch": 0.96, - "learning_rate": 1.8445017212094156e-06, - "loss": 2.3275, - "step": 276140 - }, - { - "epoch": 0.96, - "learning_rate": 1.842757841355762e-06, - "loss": 2.3251, - "step": 276150 - }, - { - "epoch": 0.96, - "learning_rate": 1.8410139615021086e-06, - "loss": 2.2878, - "step": 276160 - }, - { - "epoch": 0.96, - "learning_rate": 1.8392700816484549e-06, - "loss": 2.3252, - "step": 276170 - }, - { - "epoch": 0.96, - "learning_rate": 1.8375262017948011e-06, - "loss": 2.3657, - "step": 276180 - }, - { - "epoch": 0.96, - "learning_rate": 1.8357823219411474e-06, - "loss": 2.2991, - "step": 276190 - }, - { - "epoch": 0.96, - "learning_rate": 1.834038442087494e-06, - "loss": 2.3454, - "step": 276200 - }, - { - "epoch": 0.96, - "learning_rate": 1.8322945622338404e-06, - "loss": 2.3604, - "step": 276210 - }, - { - "epoch": 0.96, - "learning_rate": 1.8305506823801866e-06, - "loss": 2.3496, - "step": 276220 - }, - { - "epoch": 0.96, - "learning_rate": 1.8288068025265333e-06, - "loss": 2.3492, - "step": 276230 - }, - { - "epoch": 0.96, - "learning_rate": 1.8270629226728796e-06, - "loss": 2.3135, - "step": 276240 - }, - { - "epoch": 0.96, - "learning_rate": 1.8253190428192259e-06, - "loss": 2.3531, - "step": 276250 - }, - { - "epoch": 0.96, - "learning_rate": 1.8235751629655726e-06, - "loss": 2.2857, - "step": 276260 - }, - { - "epoch": 0.96, - "learning_rate": 1.8218312831119188e-06, - "loss": 2.3243, - "step": 276270 - }, - { - "epoch": 0.96, - "learning_rate": 1.820087403258265e-06, - "loss": 2.3525, - "step": 276280 - }, - { - "epoch": 0.96, - "learning_rate": 1.8183435234046114e-06, - "loss": 2.3343, - "step": 276290 - }, - { - "epoch": 0.96, - "learning_rate": 1.816599643550958e-06, - "loss": 2.3231, - "step": 276300 - }, - { - "epoch": 0.96, - "learning_rate": 1.8148557636973043e-06, - "loss": 2.374, - "step": 276310 - }, - { - "epoch": 0.96, - "learning_rate": 1.8131118838436506e-06, - "loss": 2.2764, - "step": 276320 - }, - { - "epoch": 0.96, - "learning_rate": 1.8113680039899973e-06, - "loss": 2.4468, - "step": 276330 - }, - { - "epoch": 0.96, - "learning_rate": 1.8096241241363436e-06, - "loss": 2.3348, - "step": 276340 - }, - { - "epoch": 0.96, - "learning_rate": 1.8078802442826898e-06, - "loss": 2.3468, - "step": 276350 - }, - { - "epoch": 0.96, - "learning_rate": 1.8061363644290365e-06, - "loss": 2.4003, - "step": 276360 - }, - { - "epoch": 0.96, - "learning_rate": 1.8043924845753828e-06, - "loss": 2.2987, - "step": 276370 - }, - { - "epoch": 0.96, - "learning_rate": 1.802648604721729e-06, - "loss": 2.364, - "step": 276380 - }, - { - "epoch": 0.96, - "learning_rate": 1.8009047248680753e-06, - "loss": 2.2562, - "step": 276390 - }, - { - "epoch": 0.96, - "learning_rate": 1.799160845014422e-06, - "loss": 2.3153, - "step": 276400 - }, - { - "epoch": 0.96, - "learning_rate": 1.7974169651607683e-06, - "loss": 2.3523, - "step": 276410 - }, - { - "epoch": 0.96, - "learning_rate": 1.7956730853071146e-06, - "loss": 2.4001, - "step": 276420 - }, - { - "epoch": 0.96, - "learning_rate": 1.7939292054534613e-06, - "loss": 2.3622, - "step": 276430 - }, - { - "epoch": 0.96, - "learning_rate": 1.7921853255998075e-06, - "loss": 2.3533, - "step": 276440 - }, - { - "epoch": 0.96, - "learning_rate": 1.7904414457461538e-06, - "loss": 2.3299, - "step": 276450 - }, - { - "epoch": 0.96, - "learning_rate": 1.7886975658925005e-06, - "loss": 2.4218, - "step": 276460 - }, - { - "epoch": 0.96, - "learning_rate": 1.7869536860388468e-06, - "loss": 2.3467, - "step": 276470 - }, - { - "epoch": 0.96, - "learning_rate": 1.785209806185193e-06, - "loss": 2.2999, - "step": 276480 - }, - { - "epoch": 0.96, - "learning_rate": 1.7834659263315393e-06, - "loss": 2.3576, - "step": 276490 - }, - { - "epoch": 0.96, - "learning_rate": 1.781722046477886e-06, - "loss": 2.323, - "step": 276500 - }, - { - "epoch": 0.96, - "learning_rate": 1.7799781666242323e-06, - "loss": 2.3741, - "step": 276510 - }, - { - "epoch": 0.96, - "learning_rate": 1.7782342867705785e-06, - "loss": 2.3608, - "step": 276520 - }, - { - "epoch": 0.96, - "learning_rate": 1.7764904069169252e-06, - "loss": 2.3261, - "step": 276530 - }, - { - "epoch": 0.96, - "learning_rate": 1.7747465270632715e-06, - "loss": 2.3398, - "step": 276540 - }, - { - "epoch": 0.96, - "learning_rate": 1.7730026472096178e-06, - "loss": 2.3549, - "step": 276550 - }, - { - "epoch": 0.96, - "learning_rate": 1.7712587673559645e-06, - "loss": 2.2308, - "step": 276560 - }, - { - "epoch": 0.96, - "learning_rate": 1.7695148875023107e-06, - "loss": 2.382, - "step": 276570 - }, - { - "epoch": 0.96, - "learning_rate": 1.767771007648657e-06, - "loss": 2.228, - "step": 276580 - }, - { - "epoch": 0.96, - "learning_rate": 1.7660271277950033e-06, - "loss": 2.2977, - "step": 276590 - }, - { - "epoch": 0.96, - "learning_rate": 1.76428324794135e-06, - "loss": 2.3622, - "step": 276600 - }, - { - "epoch": 0.96, - "learning_rate": 1.7625393680876962e-06, - "loss": 2.3321, - "step": 276610 - }, - { - "epoch": 0.96, - "learning_rate": 1.7607954882340425e-06, - "loss": 2.2714, - "step": 276620 - }, - { - "epoch": 0.96, - "learning_rate": 1.7590516083803892e-06, - "loss": 2.2618, - "step": 276630 - }, - { - "epoch": 0.96, - "learning_rate": 1.7573077285267355e-06, - "loss": 2.393, - "step": 276640 - }, - { - "epoch": 0.96, - "learning_rate": 1.7555638486730817e-06, - "loss": 2.3936, - "step": 276650 - }, - { - "epoch": 0.96, - "learning_rate": 1.7538199688194284e-06, - "loss": 2.3609, - "step": 276660 - }, - { - "epoch": 0.96, - "learning_rate": 1.7520760889657747e-06, - "loss": 2.2251, - "step": 276670 - }, - { - "epoch": 0.96, - "learning_rate": 1.750332209112121e-06, - "loss": 2.4141, - "step": 276680 - }, - { - "epoch": 0.97, - "learning_rate": 1.7485883292584672e-06, - "loss": 2.3278, - "step": 276690 - }, - { - "epoch": 0.97, - "learning_rate": 1.746844449404814e-06, - "loss": 2.3494, - "step": 276700 - }, - { - "epoch": 0.97, - "learning_rate": 1.7451005695511602e-06, - "loss": 2.3395, - "step": 276710 - }, - { - "epoch": 0.97, - "learning_rate": 1.7433566896975065e-06, - "loss": 2.3495, - "step": 276720 - }, - { - "epoch": 0.97, - "learning_rate": 1.7416128098438531e-06, - "loss": 2.3565, - "step": 276730 - }, - { - "epoch": 0.97, - "learning_rate": 1.7398689299901994e-06, - "loss": 2.2603, - "step": 276740 - }, - { - "epoch": 0.97, - "learning_rate": 1.7381250501365457e-06, - "loss": 2.2585, - "step": 276750 - }, - { - "epoch": 0.97, - "learning_rate": 1.7363811702828924e-06, - "loss": 2.3886, - "step": 276760 - }, - { - "epoch": 0.97, - "learning_rate": 1.7346372904292386e-06, - "loss": 2.4339, - "step": 276770 - }, - { - "epoch": 0.97, - "learning_rate": 1.732893410575585e-06, - "loss": 2.3027, - "step": 276780 - }, - { - "epoch": 0.97, - "learning_rate": 1.7311495307219314e-06, - "loss": 2.3191, - "step": 276790 - }, - { - "epoch": 0.97, - "learning_rate": 1.7294056508682779e-06, - "loss": 2.3628, - "step": 276800 - }, - { - "epoch": 0.97, - "learning_rate": 1.7276617710146241e-06, - "loss": 2.3321, - "step": 276810 - }, - { - "epoch": 0.97, - "learning_rate": 1.7259178911609706e-06, - "loss": 2.3095, - "step": 276820 - }, - { - "epoch": 0.97, - "learning_rate": 1.7241740113073171e-06, - "loss": 2.3266, - "step": 276830 - }, - { - "epoch": 0.97, - "learning_rate": 1.7224301314536634e-06, - "loss": 2.3622, - "step": 276840 - }, - { - "epoch": 0.97, - "learning_rate": 1.7206862516000096e-06, - "loss": 2.2989, - "step": 276850 - }, - { - "epoch": 0.97, - "learning_rate": 1.7189423717463563e-06, - "loss": 2.3263, - "step": 276860 - }, - { - "epoch": 0.97, - "learning_rate": 1.7171984918927026e-06, - "loss": 2.3001, - "step": 276870 - }, - { - "epoch": 0.97, - "learning_rate": 1.7154546120390489e-06, - "loss": 2.3504, - "step": 276880 - }, - { - "epoch": 0.97, - "learning_rate": 1.7137107321853954e-06, - "loss": 2.3081, - "step": 276890 - }, - { - "epoch": 0.97, - "learning_rate": 1.7119668523317418e-06, - "loss": 2.271, - "step": 276900 - }, - { - "epoch": 0.97, - "learning_rate": 1.7102229724780881e-06, - "loss": 2.3143, - "step": 276910 - }, - { - "epoch": 0.97, - "learning_rate": 1.7084790926244346e-06, - "loss": 2.2501, - "step": 276920 - }, - { - "epoch": 0.97, - "learning_rate": 1.706735212770781e-06, - "loss": 2.3304, - "step": 276930 - }, - { - "epoch": 0.97, - "learning_rate": 1.7049913329171273e-06, - "loss": 2.3647, - "step": 276940 - }, - { - "epoch": 0.97, - "learning_rate": 1.7032474530634738e-06, - "loss": 2.4319, - "step": 276950 - }, - { - "epoch": 0.97, - "learning_rate": 1.7015035732098203e-06, - "loss": 2.3793, - "step": 276960 - }, - { - "epoch": 0.97, - "learning_rate": 1.6997596933561666e-06, - "loss": 2.3636, - "step": 276970 - }, - { - "epoch": 0.97, - "learning_rate": 1.6980158135025128e-06, - "loss": 2.3312, - "step": 276980 - }, - { - "epoch": 0.97, - "learning_rate": 1.6962719336488593e-06, - "loss": 2.3593, - "step": 276990 - }, - { - "epoch": 0.97, - "learning_rate": 1.6945280537952058e-06, - "loss": 2.2383, - "step": 277000 - }, - { - "epoch": 0.97, - "learning_rate": 1.692784173941552e-06, - "loss": 2.3458, - "step": 277010 - }, - { - "epoch": 0.97, - "learning_rate": 1.6910402940878986e-06, - "loss": 2.3504, - "step": 277020 - }, - { - "epoch": 0.97, - "learning_rate": 1.689296414234245e-06, - "loss": 2.3521, - "step": 277030 - }, - { - "epoch": 0.97, - "learning_rate": 1.6875525343805913e-06, - "loss": 2.2828, - "step": 277040 - }, - { - "epoch": 0.97, - "learning_rate": 1.6858086545269378e-06, - "loss": 2.2399, - "step": 277050 - }, - { - "epoch": 0.97, - "learning_rate": 1.6840647746732843e-06, - "loss": 2.3979, - "step": 277060 - }, - { - "epoch": 0.97, - "learning_rate": 1.6823208948196305e-06, - "loss": 2.3229, - "step": 277070 - }, - { - "epoch": 0.97, - "learning_rate": 1.680577014965977e-06, - "loss": 2.285, - "step": 277080 - }, - { - "epoch": 0.97, - "learning_rate": 1.6788331351123235e-06, - "loss": 2.319, - "step": 277090 - }, - { - "epoch": 0.97, - "learning_rate": 1.6770892552586698e-06, - "loss": 2.3974, - "step": 277100 - }, - { - "epoch": 0.97, - "learning_rate": 1.675345375405016e-06, - "loss": 2.314, - "step": 277110 - }, - { - "epoch": 0.97, - "learning_rate": 1.6736014955513625e-06, - "loss": 2.4143, - "step": 277120 - }, - { - "epoch": 0.97, - "learning_rate": 1.671857615697709e-06, - "loss": 2.3344, - "step": 277130 - }, - { - "epoch": 0.97, - "learning_rate": 1.6701137358440553e-06, - "loss": 2.3571, - "step": 277140 - }, - { - "epoch": 0.97, - "learning_rate": 1.6683698559904018e-06, - "loss": 2.3296, - "step": 277150 - }, - { - "epoch": 0.97, - "learning_rate": 1.6666259761367482e-06, - "loss": 2.2606, - "step": 277160 - }, - { - "epoch": 0.97, - "learning_rate": 1.6648820962830945e-06, - "loss": 2.4344, - "step": 277170 - }, - { - "epoch": 0.97, - "learning_rate": 1.663138216429441e-06, - "loss": 2.3219, - "step": 277180 - }, - { - "epoch": 0.97, - "learning_rate": 1.6613943365757875e-06, - "loss": 2.3587, - "step": 277190 - }, - { - "epoch": 0.97, - "learning_rate": 1.6596504567221337e-06, - "loss": 2.3343, - "step": 277200 - }, - { - "epoch": 0.97, - "learning_rate": 1.6579065768684802e-06, - "loss": 2.337, - "step": 277210 - }, - { - "epoch": 0.97, - "learning_rate": 1.6561626970148265e-06, - "loss": 2.3272, - "step": 277220 - }, - { - "epoch": 0.97, - "learning_rate": 1.654418817161173e-06, - "loss": 2.3238, - "step": 277230 - }, - { - "epoch": 0.97, - "learning_rate": 1.6526749373075192e-06, - "loss": 2.3029, - "step": 277240 - }, - { - "epoch": 0.97, - "learning_rate": 1.6509310574538657e-06, - "loss": 2.2861, - "step": 277250 - }, - { - "epoch": 0.97, - "learning_rate": 1.6491871776002122e-06, - "loss": 2.3319, - "step": 277260 - }, - { - "epoch": 0.97, - "learning_rate": 1.6474432977465585e-06, - "loss": 2.326, - "step": 277270 - }, - { - "epoch": 0.97, - "learning_rate": 1.645699417892905e-06, - "loss": 2.3139, - "step": 277280 - }, - { - "epoch": 0.97, - "learning_rate": 1.6439555380392514e-06, - "loss": 2.3772, - "step": 277290 - }, - { - "epoch": 0.97, - "learning_rate": 1.6422116581855977e-06, - "loss": 2.2054, - "step": 277300 - }, - { - "epoch": 0.97, - "learning_rate": 1.6404677783319442e-06, - "loss": 2.3364, - "step": 277310 - }, - { - "epoch": 0.97, - "learning_rate": 1.6387238984782904e-06, - "loss": 2.3758, - "step": 277320 - }, - { - "epoch": 0.97, - "learning_rate": 1.636980018624637e-06, - "loss": 2.3141, - "step": 277330 - }, - { - "epoch": 0.97, - "learning_rate": 1.6352361387709834e-06, - "loss": 2.3557, - "step": 277340 - }, - { - "epoch": 0.97, - "learning_rate": 1.6334922589173297e-06, - "loss": 2.316, - "step": 277350 - }, - { - "epoch": 0.97, - "learning_rate": 1.6317483790636762e-06, - "loss": 2.3097, - "step": 277360 - }, - { - "epoch": 0.97, - "learning_rate": 1.6300044992100224e-06, - "loss": 2.355, - "step": 277370 - }, - { - "epoch": 0.97, - "learning_rate": 1.628260619356369e-06, - "loss": 2.2859, - "step": 277380 - }, - { - "epoch": 0.97, - "learning_rate": 1.6265167395027154e-06, - "loss": 2.3626, - "step": 277390 - }, - { - "epoch": 0.97, - "learning_rate": 1.6247728596490617e-06, - "loss": 2.3168, - "step": 277400 - }, - { - "epoch": 0.97, - "learning_rate": 1.6230289797954081e-06, - "loss": 2.4259, - "step": 277410 - }, - { - "epoch": 0.97, - "learning_rate": 1.6212850999417544e-06, - "loss": 2.2657, - "step": 277420 - }, - { - "epoch": 0.97, - "learning_rate": 1.6195412200881009e-06, - "loss": 2.3692, - "step": 277430 - }, - { - "epoch": 0.97, - "learning_rate": 1.6177973402344474e-06, - "loss": 2.287, - "step": 277440 - }, - { - "epoch": 0.97, - "learning_rate": 1.6160534603807936e-06, - "loss": 2.325, - "step": 277450 - }, - { - "epoch": 0.97, - "learning_rate": 1.6143095805271401e-06, - "loss": 2.3548, - "step": 277460 - }, - { - "epoch": 0.97, - "learning_rate": 1.6125657006734866e-06, - "loss": 2.2935, - "step": 277470 - }, - { - "epoch": 0.97, - "learning_rate": 1.6108218208198329e-06, - "loss": 2.3515, - "step": 277480 - }, - { - "epoch": 0.97, - "learning_rate": 1.6090779409661794e-06, - "loss": 2.3388, - "step": 277490 - }, - { - "epoch": 0.97, - "learning_rate": 1.6073340611125256e-06, - "loss": 2.4097, - "step": 277500 - }, - { - "epoch": 0.97, - "learning_rate": 1.605590181258872e-06, - "loss": 2.2745, - "step": 277510 - }, - { - "epoch": 0.97, - "learning_rate": 1.6038463014052184e-06, - "loss": 2.3393, - "step": 277520 - }, - { - "epoch": 0.97, - "learning_rate": 1.6021024215515649e-06, - "loss": 2.3539, - "step": 277530 - }, - { - "epoch": 0.97, - "learning_rate": 1.6003585416979113e-06, - "loss": 2.3548, - "step": 277540 - }, - { - "epoch": 0.97, - "learning_rate": 1.5986146618442576e-06, - "loss": 2.3452, - "step": 277550 - }, - { - "epoch": 0.97, - "learning_rate": 1.596870781990604e-06, - "loss": 2.2808, - "step": 277560 - }, - { - "epoch": 0.97, - "learning_rate": 1.5951269021369506e-06, - "loss": 2.3374, - "step": 277570 - }, - { - "epoch": 0.97, - "learning_rate": 1.5933830222832968e-06, - "loss": 2.3638, - "step": 277580 - }, - { - "epoch": 0.97, - "learning_rate": 1.5916391424296433e-06, - "loss": 2.3934, - "step": 277590 - }, - { - "epoch": 0.97, - "learning_rate": 1.5898952625759898e-06, - "loss": 2.3649, - "step": 277600 - }, - { - "epoch": 0.97, - "learning_rate": 1.588151382722336e-06, - "loss": 2.2947, - "step": 277610 - }, - { - "epoch": 0.97, - "learning_rate": 1.5864075028686823e-06, - "loss": 2.3803, - "step": 277620 - }, - { - "epoch": 0.97, - "learning_rate": 1.584663623015029e-06, - "loss": 2.383, - "step": 277630 - }, - { - "epoch": 0.97, - "learning_rate": 1.5829197431613753e-06, - "loss": 2.3436, - "step": 277640 - }, - { - "epoch": 0.97, - "learning_rate": 1.5811758633077216e-06, - "loss": 2.34, - "step": 277650 - }, - { - "epoch": 0.97, - "learning_rate": 1.579431983454068e-06, - "loss": 2.3076, - "step": 277660 - }, - { - "epoch": 0.97, - "learning_rate": 1.5776881036004145e-06, - "loss": 2.3054, - "step": 277670 - }, - { - "epoch": 0.97, - "learning_rate": 1.5759442237467608e-06, - "loss": 2.2583, - "step": 277680 - }, - { - "epoch": 0.97, - "learning_rate": 1.5742003438931073e-06, - "loss": 2.2651, - "step": 277690 - }, - { - "epoch": 0.97, - "learning_rate": 1.5724564640394538e-06, - "loss": 2.3163, - "step": 277700 - }, - { - "epoch": 0.97, - "learning_rate": 1.5707125841858e-06, - "loss": 2.4028, - "step": 277710 - }, - { - "epoch": 0.97, - "learning_rate": 1.5689687043321463e-06, - "loss": 2.4175, - "step": 277720 - }, - { - "epoch": 0.97, - "learning_rate": 1.567224824478493e-06, - "loss": 2.3436, - "step": 277730 - }, - { - "epoch": 0.97, - "learning_rate": 1.5654809446248393e-06, - "loss": 2.2984, - "step": 277740 - }, - { - "epoch": 0.97, - "learning_rate": 1.5637370647711855e-06, - "loss": 2.3267, - "step": 277750 - }, - { - "epoch": 0.97, - "learning_rate": 1.561993184917532e-06, - "loss": 2.2867, - "step": 277760 - }, - { - "epoch": 0.97, - "learning_rate": 1.5602493050638785e-06, - "loss": 2.3264, - "step": 277770 - }, - { - "epoch": 0.97, - "learning_rate": 1.558505425210225e-06, - "loss": 2.3827, - "step": 277780 - }, - { - "epoch": 0.97, - "learning_rate": 1.5567615453565712e-06, - "loss": 2.3638, - "step": 277790 - }, - { - "epoch": 0.97, - "learning_rate": 1.5550176655029177e-06, - "loss": 2.3849, - "step": 277800 - }, - { - "epoch": 0.97, - "learning_rate": 1.553273785649264e-06, - "loss": 2.3541, - "step": 277810 - }, - { - "epoch": 0.97, - "learning_rate": 1.5515299057956105e-06, - "loss": 2.3494, - "step": 277820 - }, - { - "epoch": 0.97, - "learning_rate": 1.549786025941957e-06, - "loss": 2.3292, - "step": 277830 - }, - { - "epoch": 0.97, - "learning_rate": 1.5480421460883032e-06, - "loss": 2.3899, - "step": 277840 - }, - { - "epoch": 0.97, - "learning_rate": 1.5462982662346497e-06, - "loss": 2.2984, - "step": 277850 - }, - { - "epoch": 0.97, - "learning_rate": 1.544554386380996e-06, - "loss": 2.372, - "step": 277860 - }, - { - "epoch": 0.97, - "learning_rate": 1.5428105065273425e-06, - "loss": 2.3663, - "step": 277870 - }, - { - "epoch": 0.97, - "learning_rate": 1.541066626673689e-06, - "loss": 2.3788, - "step": 277880 - }, - { - "epoch": 0.97, - "learning_rate": 1.5393227468200352e-06, - "loss": 2.3532, - "step": 277890 - }, - { - "epoch": 0.97, - "learning_rate": 1.5375788669663817e-06, - "loss": 2.3135, - "step": 277900 - }, - { - "epoch": 0.97, - "learning_rate": 1.535834987112728e-06, - "loss": 2.3348, - "step": 277910 - }, - { - "epoch": 0.97, - "learning_rate": 1.5340911072590744e-06, - "loss": 2.3544, - "step": 277920 - }, - { - "epoch": 0.97, - "learning_rate": 1.532347227405421e-06, - "loss": 2.324, - "step": 277930 - }, - { - "epoch": 0.97, - "learning_rate": 1.5306033475517672e-06, - "loss": 2.3515, - "step": 277940 - }, - { - "epoch": 0.97, - "learning_rate": 1.5288594676981137e-06, - "loss": 2.4157, - "step": 277950 - }, - { - "epoch": 0.97, - "learning_rate": 1.52711558784446e-06, - "loss": 2.3576, - "step": 277960 - }, - { - "epoch": 0.97, - "learning_rate": 1.5253717079908064e-06, - "loss": 2.3078, - "step": 277970 - }, - { - "epoch": 0.97, - "learning_rate": 1.523627828137153e-06, - "loss": 2.2789, - "step": 277980 - }, - { - "epoch": 0.97, - "learning_rate": 1.5218839482834992e-06, - "loss": 2.3361, - "step": 277990 - }, - { - "epoch": 0.97, - "learning_rate": 1.5201400684298456e-06, - "loss": 2.3902, - "step": 278000 - }, - { - "epoch": 0.97, - "learning_rate": 1.518396188576192e-06, - "loss": 2.3209, - "step": 278010 - }, - { - "epoch": 0.97, - "learning_rate": 1.5166523087225384e-06, - "loss": 2.3122, - "step": 278020 - }, - { - "epoch": 0.97, - "learning_rate": 1.5149084288688849e-06, - "loss": 2.3805, - "step": 278030 - }, - { - "epoch": 0.97, - "learning_rate": 1.5131645490152312e-06, - "loss": 2.3204, - "step": 278040 - }, - { - "epoch": 0.97, - "learning_rate": 1.5114206691615776e-06, - "loss": 2.4093, - "step": 278050 - }, - { - "epoch": 0.97, - "learning_rate": 1.509676789307924e-06, - "loss": 2.3556, - "step": 278060 - }, - { - "epoch": 0.97, - "learning_rate": 1.5079329094542704e-06, - "loss": 2.2265, - "step": 278070 - }, - { - "epoch": 0.97, - "learning_rate": 1.5061890296006169e-06, - "loss": 2.2627, - "step": 278080 - }, - { - "epoch": 0.97, - "learning_rate": 1.5044451497469631e-06, - "loss": 2.3667, - "step": 278090 - }, - { - "epoch": 0.97, - "learning_rate": 1.5027012698933096e-06, - "loss": 2.3332, - "step": 278100 - }, - { - "epoch": 0.97, - "learning_rate": 1.5009573900396559e-06, - "loss": 2.3032, - "step": 278110 - }, - { - "epoch": 0.97, - "learning_rate": 1.4992135101860024e-06, - "loss": 2.2543, - "step": 278120 - }, - { - "epoch": 0.97, - "learning_rate": 1.4974696303323488e-06, - "loss": 2.2899, - "step": 278130 - }, - { - "epoch": 0.97, - "learning_rate": 1.4957257504786951e-06, - "loss": 2.3835, - "step": 278140 - }, - { - "epoch": 0.97, - "learning_rate": 1.4939818706250416e-06, - "loss": 2.304, - "step": 278150 - }, - { - "epoch": 0.97, - "learning_rate": 1.4922379907713879e-06, - "loss": 2.3797, - "step": 278160 - }, - { - "epoch": 0.97, - "learning_rate": 1.4904941109177343e-06, - "loss": 2.3348, - "step": 278170 - }, - { - "epoch": 0.97, - "learning_rate": 1.4887502310640808e-06, - "loss": 2.3014, - "step": 278180 - }, - { - "epoch": 0.97, - "learning_rate": 1.487006351210427e-06, - "loss": 2.2613, - "step": 278190 - }, - { - "epoch": 0.97, - "learning_rate": 1.4852624713567736e-06, - "loss": 2.3769, - "step": 278200 - }, - { - "epoch": 0.97, - "learning_rate": 1.4835185915031198e-06, - "loss": 2.2904, - "step": 278210 - }, - { - "epoch": 0.97, - "learning_rate": 1.4817747116494663e-06, - "loss": 2.3174, - "step": 278220 - }, - { - "epoch": 0.97, - "learning_rate": 1.4800308317958128e-06, - "loss": 2.3162, - "step": 278230 - }, - { - "epoch": 0.97, - "learning_rate": 1.478286951942159e-06, - "loss": 2.4036, - "step": 278240 - }, - { - "epoch": 0.97, - "learning_rate": 1.4765430720885056e-06, - "loss": 2.3364, - "step": 278250 - }, - { - "epoch": 0.97, - "learning_rate": 1.4747991922348518e-06, - "loss": 2.2916, - "step": 278260 - }, - { - "epoch": 0.97, - "learning_rate": 1.4730553123811983e-06, - "loss": 2.343, - "step": 278270 - }, - { - "epoch": 0.97, - "learning_rate": 1.4713114325275448e-06, - "loss": 2.2887, - "step": 278280 - }, - { - "epoch": 0.97, - "learning_rate": 1.469567552673891e-06, - "loss": 2.3626, - "step": 278290 - }, - { - "epoch": 0.97, - "learning_rate": 1.4678236728202375e-06, - "loss": 2.3092, - "step": 278300 - }, - { - "epoch": 0.97, - "learning_rate": 1.4660797929665838e-06, - "loss": 2.352, - "step": 278310 - }, - { - "epoch": 0.97, - "learning_rate": 1.4643359131129303e-06, - "loss": 2.3208, - "step": 278320 - }, - { - "epoch": 0.97, - "learning_rate": 1.4625920332592768e-06, - "loss": 2.354, - "step": 278330 - }, - { - "epoch": 0.97, - "learning_rate": 1.460848153405623e-06, - "loss": 2.2933, - "step": 278340 - }, - { - "epoch": 0.97, - "learning_rate": 1.4591042735519695e-06, - "loss": 2.3144, - "step": 278350 - }, - { - "epoch": 0.97, - "learning_rate": 1.4573603936983158e-06, - "loss": 2.337, - "step": 278360 - }, - { - "epoch": 0.97, - "learning_rate": 1.4556165138446623e-06, - "loss": 2.3463, - "step": 278370 - }, - { - "epoch": 0.97, - "learning_rate": 1.4538726339910088e-06, - "loss": 2.3786, - "step": 278380 - }, - { - "epoch": 0.97, - "learning_rate": 1.452128754137355e-06, - "loss": 2.3333, - "step": 278390 - }, - { - "epoch": 0.97, - "learning_rate": 1.4503848742837015e-06, - "loss": 2.3508, - "step": 278400 - }, - { - "epoch": 0.97, - "learning_rate": 1.4486409944300478e-06, - "loss": 2.3259, - "step": 278410 - }, - { - "epoch": 0.97, - "learning_rate": 1.4468971145763943e-06, - "loss": 2.3298, - "step": 278420 - }, - { - "epoch": 0.97, - "learning_rate": 1.4451532347227407e-06, - "loss": 2.3153, - "step": 278430 - }, - { - "epoch": 0.97, - "learning_rate": 1.443409354869087e-06, - "loss": 2.2877, - "step": 278440 - }, - { - "epoch": 0.97, - "learning_rate": 1.4416654750154335e-06, - "loss": 2.3431, - "step": 278450 - }, - { - "epoch": 0.97, - "learning_rate": 1.4399215951617798e-06, - "loss": 2.2773, - "step": 278460 - }, - { - "epoch": 0.97, - "learning_rate": 1.4381777153081262e-06, - "loss": 2.3317, - "step": 278470 - }, - { - "epoch": 0.97, - "learning_rate": 1.4364338354544727e-06, - "loss": 2.3628, - "step": 278480 - }, - { - "epoch": 0.97, - "learning_rate": 1.434689955600819e-06, - "loss": 2.3132, - "step": 278490 - }, - { - "epoch": 0.97, - "learning_rate": 1.4329460757471655e-06, - "loss": 2.2925, - "step": 278500 - }, - { - "epoch": 0.97, - "learning_rate": 1.4312021958935117e-06, - "loss": 2.3429, - "step": 278510 - }, - { - "epoch": 0.97, - "learning_rate": 1.4294583160398582e-06, - "loss": 2.2532, - "step": 278520 - }, - { - "epoch": 0.97, - "learning_rate": 1.4277144361862047e-06, - "loss": 2.3449, - "step": 278530 - }, - { - "epoch": 0.97, - "learning_rate": 1.425970556332551e-06, - "loss": 2.3521, - "step": 278540 - }, - { - "epoch": 0.97, - "learning_rate": 1.4242266764788974e-06, - "loss": 2.3178, - "step": 278550 - }, - { - "epoch": 0.97, - "learning_rate": 1.4224827966252437e-06, - "loss": 2.3759, - "step": 278560 - }, - { - "epoch": 0.97, - "learning_rate": 1.4207389167715902e-06, - "loss": 2.3996, - "step": 278570 - }, - { - "epoch": 0.97, - "learning_rate": 1.4189950369179367e-06, - "loss": 2.3713, - "step": 278580 - }, - { - "epoch": 0.97, - "learning_rate": 1.417251157064283e-06, - "loss": 2.3159, - "step": 278590 - }, - { - "epoch": 0.97, - "learning_rate": 1.4155072772106294e-06, - "loss": 2.3245, - "step": 278600 - }, - { - "epoch": 0.97, - "learning_rate": 1.4137633973569757e-06, - "loss": 2.3682, - "step": 278610 - }, - { - "epoch": 0.97, - "learning_rate": 1.4120195175033222e-06, - "loss": 2.3625, - "step": 278620 - }, - { - "epoch": 0.97, - "learning_rate": 1.4102756376496687e-06, - "loss": 2.3136, - "step": 278630 - }, - { - "epoch": 0.97, - "learning_rate": 1.408531757796015e-06, - "loss": 2.3661, - "step": 278640 - }, - { - "epoch": 0.97, - "learning_rate": 1.4067878779423614e-06, - "loss": 2.3093, - "step": 278650 - }, - { - "epoch": 0.97, - "learning_rate": 1.4050439980887077e-06, - "loss": 2.3357, - "step": 278660 - }, - { - "epoch": 0.97, - "learning_rate": 1.4033001182350542e-06, - "loss": 2.4361, - "step": 278670 - }, - { - "epoch": 0.97, - "learning_rate": 1.4015562383814006e-06, - "loss": 2.3896, - "step": 278680 - }, - { - "epoch": 0.97, - "learning_rate": 1.399812358527747e-06, - "loss": 2.3109, - "step": 278690 - }, - { - "epoch": 0.97, - "learning_rate": 1.3980684786740934e-06, - "loss": 2.318, - "step": 278700 - }, - { - "epoch": 0.97, - "learning_rate": 1.3963245988204397e-06, - "loss": 2.2617, - "step": 278710 - }, - { - "epoch": 0.97, - "learning_rate": 1.3945807189667861e-06, - "loss": 2.258, - "step": 278720 - }, - { - "epoch": 0.97, - "learning_rate": 1.3928368391131326e-06, - "loss": 2.2691, - "step": 278730 - }, - { - "epoch": 0.97, - "learning_rate": 1.3910929592594789e-06, - "loss": 2.3656, - "step": 278740 - }, - { - "epoch": 0.97, - "learning_rate": 1.3893490794058254e-06, - "loss": 2.3934, - "step": 278750 - }, - { - "epoch": 0.97, - "learning_rate": 1.3876051995521716e-06, - "loss": 2.3395, - "step": 278760 - }, - { - "epoch": 0.97, - "learning_rate": 1.3858613196985181e-06, - "loss": 2.2575, - "step": 278770 - }, - { - "epoch": 0.97, - "learning_rate": 1.3841174398448646e-06, - "loss": 2.3381, - "step": 278780 - }, - { - "epoch": 0.97, - "learning_rate": 1.3823735599912109e-06, - "loss": 2.3656, - "step": 278790 - }, - { - "epoch": 0.97, - "learning_rate": 1.3806296801375574e-06, - "loss": 2.3697, - "step": 278800 - }, - { - "epoch": 0.97, - "learning_rate": 1.3788858002839036e-06, - "loss": 2.3138, - "step": 278810 - }, - { - "epoch": 0.97, - "learning_rate": 1.3771419204302501e-06, - "loss": 2.3266, - "step": 278820 - }, - { - "epoch": 0.97, - "learning_rate": 1.3753980405765966e-06, - "loss": 2.3138, - "step": 278830 - }, - { - "epoch": 0.97, - "learning_rate": 1.3736541607229429e-06, - "loss": 2.3549, - "step": 278840 - }, - { - "epoch": 0.97, - "learning_rate": 1.3719102808692893e-06, - "loss": 2.3384, - "step": 278850 - }, - { - "epoch": 0.97, - "learning_rate": 1.3701664010156356e-06, - "loss": 2.2917, - "step": 278860 - }, - { - "epoch": 0.97, - "learning_rate": 1.368422521161982e-06, - "loss": 2.3026, - "step": 278870 - }, - { - "epoch": 0.97, - "learning_rate": 1.3666786413083286e-06, - "loss": 2.3492, - "step": 278880 - }, - { - "epoch": 0.97, - "learning_rate": 1.3649347614546748e-06, - "loss": 2.2768, - "step": 278890 - }, - { - "epoch": 0.97, - "learning_rate": 1.3631908816010213e-06, - "loss": 2.345, - "step": 278900 - }, - { - "epoch": 0.97, - "learning_rate": 1.3614470017473676e-06, - "loss": 2.3044, - "step": 278910 - }, - { - "epoch": 0.97, - "learning_rate": 1.359703121893714e-06, - "loss": 2.3242, - "step": 278920 - }, - { - "epoch": 0.97, - "learning_rate": 1.3579592420400606e-06, - "loss": 2.3329, - "step": 278930 - }, - { - "epoch": 0.97, - "learning_rate": 1.3562153621864068e-06, - "loss": 2.2569, - "step": 278940 - }, - { - "epoch": 0.97, - "learning_rate": 1.3544714823327533e-06, - "loss": 2.2592, - "step": 278950 - }, - { - "epoch": 0.97, - "learning_rate": 1.3527276024790996e-06, - "loss": 2.3681, - "step": 278960 - }, - { - "epoch": 0.97, - "learning_rate": 1.350983722625446e-06, - "loss": 2.3242, - "step": 278970 - }, - { - "epoch": 0.97, - "learning_rate": 1.3492398427717925e-06, - "loss": 2.3777, - "step": 278980 - }, - { - "epoch": 0.97, - "learning_rate": 1.3474959629181388e-06, - "loss": 2.381, - "step": 278990 - }, - { - "epoch": 0.97, - "learning_rate": 1.3457520830644853e-06, - "loss": 2.3802, - "step": 279000 - }, - { - "epoch": 0.97, - "learning_rate": 1.3440082032108316e-06, - "loss": 2.2971, - "step": 279010 - }, - { - "epoch": 0.97, - "learning_rate": 1.342264323357178e-06, - "loss": 2.3322, - "step": 279020 - }, - { - "epoch": 0.97, - "learning_rate": 1.3405204435035245e-06, - "loss": 2.2185, - "step": 279030 - }, - { - "epoch": 0.97, - "learning_rate": 1.3387765636498708e-06, - "loss": 2.3178, - "step": 279040 - }, - { - "epoch": 0.97, - "learning_rate": 1.3370326837962173e-06, - "loss": 2.3357, - "step": 279050 - }, - { - "epoch": 0.97, - "learning_rate": 1.3352888039425635e-06, - "loss": 2.3796, - "step": 279060 - }, - { - "epoch": 0.97, - "learning_rate": 1.33354492408891e-06, - "loss": 2.3719, - "step": 279070 - }, - { - "epoch": 0.97, - "learning_rate": 1.3318010442352565e-06, - "loss": 2.3669, - "step": 279080 - }, - { - "epoch": 0.97, - "learning_rate": 1.3300571643816028e-06, - "loss": 2.3042, - "step": 279090 - }, - { - "epoch": 0.97, - "learning_rate": 1.3283132845279492e-06, - "loss": 2.2563, - "step": 279100 - }, - { - "epoch": 0.97, - "learning_rate": 1.3265694046742955e-06, - "loss": 2.322, - "step": 279110 - }, - { - "epoch": 0.97, - "learning_rate": 1.324825524820642e-06, - "loss": 2.3694, - "step": 279120 - }, - { - "epoch": 0.97, - "learning_rate": 1.3230816449669885e-06, - "loss": 2.3016, - "step": 279130 - }, - { - "epoch": 0.97, - "learning_rate": 1.3213377651133347e-06, - "loss": 2.3438, - "step": 279140 - }, - { - "epoch": 0.97, - "learning_rate": 1.3195938852596812e-06, - "loss": 2.3434, - "step": 279150 - }, - { - "epoch": 0.97, - "learning_rate": 1.3178500054060275e-06, - "loss": 2.3054, - "step": 279160 - }, - { - "epoch": 0.97, - "learning_rate": 1.316106125552374e-06, - "loss": 2.3734, - "step": 279170 - }, - { - "epoch": 0.97, - "learning_rate": 1.3143622456987205e-06, - "loss": 2.4254, - "step": 279180 - }, - { - "epoch": 0.97, - "learning_rate": 1.3126183658450667e-06, - "loss": 2.3152, - "step": 279190 - }, - { - "epoch": 0.97, - "learning_rate": 1.3108744859914132e-06, - "loss": 2.3591, - "step": 279200 - }, - { - "epoch": 0.97, - "learning_rate": 1.3091306061377597e-06, - "loss": 2.3276, - "step": 279210 - }, - { - "epoch": 0.97, - "learning_rate": 1.307386726284106e-06, - "loss": 2.3104, - "step": 279220 - }, - { - "epoch": 0.97, - "learning_rate": 1.3056428464304524e-06, - "loss": 2.2852, - "step": 279230 - }, - { - "epoch": 0.97, - "learning_rate": 1.3038989665767987e-06, - "loss": 2.3251, - "step": 279240 - }, - { - "epoch": 0.97, - "learning_rate": 1.3021550867231452e-06, - "loss": 2.2883, - "step": 279250 - }, - { - "epoch": 0.97, - "learning_rate": 1.3004112068694917e-06, - "loss": 2.3234, - "step": 279260 - }, - { - "epoch": 0.97, - "learning_rate": 1.298667327015838e-06, - "loss": 2.306, - "step": 279270 - }, - { - "epoch": 0.97, - "learning_rate": 1.2969234471621844e-06, - "loss": 2.3825, - "step": 279280 - }, - { - "epoch": 0.97, - "learning_rate": 1.2951795673085307e-06, - "loss": 2.2784, - "step": 279290 - }, - { - "epoch": 0.97, - "learning_rate": 1.2934356874548772e-06, - "loss": 2.3108, - "step": 279300 - }, - { - "epoch": 0.97, - "learning_rate": 1.2916918076012237e-06, - "loss": 2.3376, - "step": 279310 - }, - { - "epoch": 0.97, - "learning_rate": 1.28994792774757e-06, - "loss": 2.3486, - "step": 279320 - }, - { - "epoch": 0.97, - "learning_rate": 1.2882040478939164e-06, - "loss": 2.3376, - "step": 279330 - }, - { - "epoch": 0.97, - "learning_rate": 1.2864601680402627e-06, - "loss": 2.3637, - "step": 279340 - }, - { - "epoch": 0.97, - "learning_rate": 1.2847162881866092e-06, - "loss": 2.3065, - "step": 279350 - }, - { - "epoch": 0.97, - "learning_rate": 1.2829724083329556e-06, - "loss": 2.3613, - "step": 279360 - }, - { - "epoch": 0.97, - "learning_rate": 1.281228528479302e-06, - "loss": 2.3279, - "step": 279370 - }, - { - "epoch": 0.97, - "learning_rate": 1.2794846486256484e-06, - "loss": 2.3155, - "step": 279380 - }, - { - "epoch": 0.97, - "learning_rate": 1.2777407687719947e-06, - "loss": 2.3052, - "step": 279390 - }, - { - "epoch": 0.97, - "learning_rate": 1.2759968889183411e-06, - "loss": 2.2864, - "step": 279400 - }, - { - "epoch": 0.97, - "learning_rate": 1.2742530090646876e-06, - "loss": 2.299, - "step": 279410 - }, - { - "epoch": 0.97, - "learning_rate": 1.2725091292110339e-06, - "loss": 2.3972, - "step": 279420 - }, - { - "epoch": 0.97, - "learning_rate": 1.2707652493573804e-06, - "loss": 2.3763, - "step": 279430 - }, - { - "epoch": 0.97, - "learning_rate": 1.2690213695037266e-06, - "loss": 2.3201, - "step": 279440 - }, - { - "epoch": 0.97, - "learning_rate": 1.2672774896500731e-06, - "loss": 2.3675, - "step": 279450 - }, - { - "epoch": 0.97, - "learning_rate": 1.2655336097964196e-06, - "loss": 2.3333, - "step": 279460 - }, - { - "epoch": 0.97, - "learning_rate": 1.2637897299427659e-06, - "loss": 2.2821, - "step": 279470 - }, - { - "epoch": 0.97, - "learning_rate": 1.2620458500891123e-06, - "loss": 2.2847, - "step": 279480 - }, - { - "epoch": 0.97, - "learning_rate": 1.2603019702354586e-06, - "loss": 2.2814, - "step": 279490 - }, - { - "epoch": 0.97, - "learning_rate": 1.258558090381805e-06, - "loss": 2.307, - "step": 279500 - }, - { - "epoch": 0.97, - "learning_rate": 1.2568142105281516e-06, - "loss": 2.3682, - "step": 279510 - }, - { - "epoch": 0.97, - "learning_rate": 1.2550703306744978e-06, - "loss": 2.3472, - "step": 279520 - }, - { - "epoch": 0.97, - "learning_rate": 1.2533264508208443e-06, - "loss": 2.3717, - "step": 279530 - }, - { - "epoch": 0.97, - "learning_rate": 1.2515825709671906e-06, - "loss": 2.2552, - "step": 279540 - }, - { - "epoch": 0.98, - "learning_rate": 1.249838691113537e-06, - "loss": 2.3178, - "step": 279550 - }, - { - "epoch": 0.98, - "learning_rate": 1.2480948112598836e-06, - "loss": 2.3326, - "step": 279560 - }, - { - "epoch": 0.98, - "learning_rate": 1.2463509314062298e-06, - "loss": 2.3331, - "step": 279570 - }, - { - "epoch": 0.98, - "learning_rate": 1.2446070515525763e-06, - "loss": 2.3915, - "step": 279580 - }, - { - "epoch": 0.98, - "learning_rate": 1.2428631716989226e-06, - "loss": 2.2427, - "step": 279590 - }, - { - "epoch": 0.98, - "learning_rate": 1.241119291845269e-06, - "loss": 2.3555, - "step": 279600 - }, - { - "epoch": 0.98, - "learning_rate": 1.2393754119916155e-06, - "loss": 2.353, - "step": 279610 - }, - { - "epoch": 0.98, - "learning_rate": 1.2376315321379618e-06, - "loss": 2.3514, - "step": 279620 - }, - { - "epoch": 0.98, - "learning_rate": 1.2358876522843083e-06, - "loss": 2.3847, - "step": 279630 - }, - { - "epoch": 0.98, - "learning_rate": 1.2341437724306546e-06, - "loss": 2.2868, - "step": 279640 - }, - { - "epoch": 0.98, - "learning_rate": 1.232399892577001e-06, - "loss": 2.3753, - "step": 279650 - }, - { - "epoch": 0.98, - "learning_rate": 1.2306560127233475e-06, - "loss": 2.3654, - "step": 279660 - }, - { - "epoch": 0.98, - "learning_rate": 1.2289121328696938e-06, - "loss": 2.3612, - "step": 279670 - }, - { - "epoch": 0.98, - "learning_rate": 1.2271682530160403e-06, - "loss": 2.3094, - "step": 279680 - }, - { - "epoch": 0.98, - "learning_rate": 1.2254243731623865e-06, - "loss": 2.2026, - "step": 279690 - }, - { - "epoch": 0.98, - "learning_rate": 1.223680493308733e-06, - "loss": 2.3017, - "step": 279700 - }, - { - "epoch": 0.98, - "learning_rate": 1.2219366134550795e-06, - "loss": 2.333, - "step": 279710 - }, - { - "epoch": 0.98, - "learning_rate": 1.2201927336014258e-06, - "loss": 2.2436, - "step": 279720 - }, - { - "epoch": 0.98, - "learning_rate": 1.2184488537477723e-06, - "loss": 2.4421, - "step": 279730 - }, - { - "epoch": 0.98, - "learning_rate": 1.2167049738941185e-06, - "loss": 2.2402, - "step": 279740 - }, - { - "epoch": 0.98, - "learning_rate": 1.214961094040465e-06, - "loss": 2.3128, - "step": 279750 - }, - { - "epoch": 0.98, - "learning_rate": 1.2132172141868115e-06, - "loss": 2.3544, - "step": 279760 - }, - { - "epoch": 0.98, - "learning_rate": 1.2114733343331578e-06, - "loss": 2.2452, - "step": 279770 - }, - { - "epoch": 0.98, - "learning_rate": 1.2097294544795042e-06, - "loss": 2.3058, - "step": 279780 - }, - { - "epoch": 0.98, - "learning_rate": 1.2079855746258505e-06, - "loss": 2.3217, - "step": 279790 - }, - { - "epoch": 0.98, - "learning_rate": 1.206241694772197e-06, - "loss": 2.2893, - "step": 279800 - }, - { - "epoch": 0.98, - "learning_rate": 1.2044978149185435e-06, - "loss": 2.3332, - "step": 279810 - }, - { - "epoch": 0.98, - "learning_rate": 1.2027539350648897e-06, - "loss": 2.2755, - "step": 279820 - }, - { - "epoch": 0.98, - "learning_rate": 1.2010100552112362e-06, - "loss": 2.2943, - "step": 279830 - }, - { - "epoch": 0.98, - "learning_rate": 1.1992661753575825e-06, - "loss": 2.3852, - "step": 279840 - }, - { - "epoch": 0.98, - "learning_rate": 1.197522295503929e-06, - "loss": 2.3405, - "step": 279850 - }, - { - "epoch": 0.98, - "learning_rate": 1.1957784156502755e-06, - "loss": 2.4067, - "step": 279860 - }, - { - "epoch": 0.98, - "learning_rate": 1.1940345357966217e-06, - "loss": 2.3257, - "step": 279870 - }, - { - "epoch": 0.98, - "learning_rate": 1.1922906559429682e-06, - "loss": 2.3366, - "step": 279880 - }, - { - "epoch": 0.98, - "learning_rate": 1.1905467760893145e-06, - "loss": 2.3337, - "step": 279890 - }, - { - "epoch": 0.98, - "learning_rate": 1.188802896235661e-06, - "loss": 2.3136, - "step": 279900 - }, - { - "epoch": 0.98, - "learning_rate": 1.1870590163820074e-06, - "loss": 2.3004, - "step": 279910 - }, - { - "epoch": 0.98, - "learning_rate": 1.1853151365283537e-06, - "loss": 2.3569, - "step": 279920 - }, - { - "epoch": 0.98, - "learning_rate": 1.1835712566747002e-06, - "loss": 2.3974, - "step": 279930 - }, - { - "epoch": 0.98, - "learning_rate": 1.1818273768210465e-06, - "loss": 2.3285, - "step": 279940 - }, - { - "epoch": 0.98, - "learning_rate": 1.180083496967393e-06, - "loss": 2.2694, - "step": 279950 - }, - { - "epoch": 0.98, - "learning_rate": 1.1783396171137394e-06, - "loss": 2.3329, - "step": 279960 - }, - { - "epoch": 0.98, - "learning_rate": 1.1765957372600857e-06, - "loss": 2.3159, - "step": 279970 - }, - { - "epoch": 0.98, - "learning_rate": 1.1748518574064322e-06, - "loss": 2.3179, - "step": 279980 - }, - { - "epoch": 0.98, - "learning_rate": 1.1731079775527784e-06, - "loss": 2.3373, - "step": 279990 - }, - { - "epoch": 0.98, - "learning_rate": 1.171364097699125e-06, - "loss": 2.25, - "step": 280000 - }, - { - "epoch": 0.98, - "learning_rate": 1.1696202178454714e-06, - "loss": 2.3636, - "step": 280010 - }, - { - "epoch": 0.98, - "learning_rate": 1.1678763379918177e-06, - "loss": 2.3867, - "step": 280020 - }, - { - "epoch": 0.98, - "learning_rate": 1.1661324581381641e-06, - "loss": 2.2982, - "step": 280030 - }, - { - "epoch": 0.98, - "learning_rate": 1.1643885782845104e-06, - "loss": 2.3727, - "step": 280040 - }, - { - "epoch": 0.98, - "learning_rate": 1.162644698430857e-06, - "loss": 2.2825, - "step": 280050 - }, - { - "epoch": 0.98, - "learning_rate": 1.1609008185772034e-06, - "loss": 2.244, - "step": 280060 - }, - { - "epoch": 0.98, - "learning_rate": 1.1591569387235496e-06, - "loss": 2.3003, - "step": 280070 - }, - { - "epoch": 0.98, - "learning_rate": 1.1574130588698961e-06, - "loss": 2.33, - "step": 280080 - }, - { - "epoch": 0.98, - "learning_rate": 1.1556691790162424e-06, - "loss": 2.3407, - "step": 280090 - }, - { - "epoch": 0.98, - "learning_rate": 1.1539252991625889e-06, - "loss": 2.2636, - "step": 280100 - }, - { - "epoch": 0.98, - "learning_rate": 1.1521814193089354e-06, - "loss": 2.3598, - "step": 280110 - }, - { - "epoch": 0.98, - "learning_rate": 1.1504375394552816e-06, - "loss": 2.3698, - "step": 280120 - }, - { - "epoch": 0.98, - "learning_rate": 1.1486936596016281e-06, - "loss": 2.268, - "step": 280130 - }, - { - "epoch": 0.98, - "learning_rate": 1.1469497797479744e-06, - "loss": 2.2854, - "step": 280140 - }, - { - "epoch": 0.98, - "learning_rate": 1.1452058998943209e-06, - "loss": 2.341, - "step": 280150 - }, - { - "epoch": 0.98, - "learning_rate": 1.1434620200406673e-06, - "loss": 2.2885, - "step": 280160 - }, - { - "epoch": 0.98, - "learning_rate": 1.1417181401870136e-06, - "loss": 2.2885, - "step": 280170 - }, - { - "epoch": 0.98, - "learning_rate": 1.13997426033336e-06, - "loss": 2.374, - "step": 280180 - }, - { - "epoch": 0.98, - "learning_rate": 1.1382303804797064e-06, - "loss": 2.3493, - "step": 280190 - }, - { - "epoch": 0.98, - "learning_rate": 1.1364865006260528e-06, - "loss": 2.2976, - "step": 280200 - }, - { - "epoch": 0.98, - "learning_rate": 1.1347426207723993e-06, - "loss": 2.3391, - "step": 280210 - }, - { - "epoch": 0.98, - "learning_rate": 1.1329987409187456e-06, - "loss": 2.3192, - "step": 280220 - }, - { - "epoch": 0.98, - "learning_rate": 1.131254861065092e-06, - "loss": 2.2497, - "step": 280230 - }, - { - "epoch": 0.98, - "learning_rate": 1.1295109812114383e-06, - "loss": 2.3443, - "step": 280240 - }, - { - "epoch": 0.98, - "learning_rate": 1.1277671013577848e-06, - "loss": 2.3276, - "step": 280250 - }, - { - "epoch": 0.98, - "learning_rate": 1.1260232215041313e-06, - "loss": 2.4156, - "step": 280260 - }, - { - "epoch": 0.98, - "learning_rate": 1.1242793416504776e-06, - "loss": 2.3265, - "step": 280270 - }, - { - "epoch": 0.98, - "learning_rate": 1.122535461796824e-06, - "loss": 2.2524, - "step": 280280 - }, - { - "epoch": 0.98, - "learning_rate": 1.1207915819431703e-06, - "loss": 2.3486, - "step": 280290 - }, - { - "epoch": 0.98, - "learning_rate": 1.1190477020895168e-06, - "loss": 2.3647, - "step": 280300 - }, - { - "epoch": 0.98, - "learning_rate": 1.1173038222358633e-06, - "loss": 2.3989, - "step": 280310 - }, - { - "epoch": 0.98, - "learning_rate": 1.1155599423822096e-06, - "loss": 2.3715, - "step": 280320 - }, - { - "epoch": 0.98, - "learning_rate": 1.113816062528556e-06, - "loss": 2.2271, - "step": 280330 - }, - { - "epoch": 0.98, - "learning_rate": 1.1120721826749023e-06, - "loss": 2.3418, - "step": 280340 - }, - { - "epoch": 0.98, - "learning_rate": 1.1103283028212488e-06, - "loss": 2.3049, - "step": 280350 - }, - { - "epoch": 0.98, - "learning_rate": 1.1085844229675953e-06, - "loss": 2.2826, - "step": 280360 - }, - { - "epoch": 0.98, - "learning_rate": 1.1068405431139415e-06, - "loss": 2.3888, - "step": 280370 - }, - { - "epoch": 0.98, - "learning_rate": 1.105096663260288e-06, - "loss": 2.3753, - "step": 280380 - }, - { - "epoch": 0.98, - "learning_rate": 1.1033527834066343e-06, - "loss": 2.3884, - "step": 280390 - }, - { - "epoch": 0.98, - "learning_rate": 1.1016089035529808e-06, - "loss": 2.3417, - "step": 280400 - }, - { - "epoch": 0.98, - "learning_rate": 1.0998650236993272e-06, - "loss": 2.2516, - "step": 280410 - }, - { - "epoch": 0.98, - "learning_rate": 1.0981211438456735e-06, - "loss": 2.2852, - "step": 280420 - }, - { - "epoch": 0.98, - "learning_rate": 1.09637726399202e-06, - "loss": 2.3511, - "step": 280430 - }, - { - "epoch": 0.98, - "learning_rate": 1.0946333841383663e-06, - "loss": 2.3162, - "step": 280440 - }, - { - "epoch": 0.98, - "learning_rate": 1.0928895042847127e-06, - "loss": 2.3128, - "step": 280450 - }, - { - "epoch": 0.98, - "learning_rate": 1.0911456244310592e-06, - "loss": 2.3081, - "step": 280460 - }, - { - "epoch": 0.98, - "learning_rate": 1.0894017445774055e-06, - "loss": 2.2366, - "step": 280470 - }, - { - "epoch": 0.98, - "learning_rate": 1.087657864723752e-06, - "loss": 2.3583, - "step": 280480 - }, - { - "epoch": 0.98, - "learning_rate": 1.0859139848700985e-06, - "loss": 2.4366, - "step": 280490 - }, - { - "epoch": 0.98, - "learning_rate": 1.0841701050164447e-06, - "loss": 2.3559, - "step": 280500 - }, - { - "epoch": 0.98, - "learning_rate": 1.0824262251627912e-06, - "loss": 2.3926, - "step": 280510 - }, - { - "epoch": 0.98, - "learning_rate": 1.0806823453091375e-06, - "loss": 2.3255, - "step": 280520 - }, - { - "epoch": 0.98, - "learning_rate": 1.078938465455484e-06, - "loss": 2.2952, - "step": 280530 - }, - { - "epoch": 0.98, - "learning_rate": 1.0771945856018304e-06, - "loss": 2.3156, - "step": 280540 - }, - { - "epoch": 0.98, - "learning_rate": 1.0754507057481767e-06, - "loss": 2.3685, - "step": 280550 - }, - { - "epoch": 0.98, - "learning_rate": 1.0737068258945232e-06, - "loss": 2.3392, - "step": 280560 - }, - { - "epoch": 0.98, - "learning_rate": 1.0719629460408695e-06, - "loss": 2.2513, - "step": 280570 - }, - { - "epoch": 0.98, - "learning_rate": 1.070219066187216e-06, - "loss": 2.3906, - "step": 280580 - }, - { - "epoch": 0.98, - "learning_rate": 1.0684751863335624e-06, - "loss": 2.4292, - "step": 280590 - }, - { - "epoch": 0.98, - "learning_rate": 1.0667313064799087e-06, - "loss": 2.3071, - "step": 280600 - }, - { - "epoch": 0.98, - "learning_rate": 1.0649874266262552e-06, - "loss": 2.2823, - "step": 280610 - }, - { - "epoch": 0.98, - "learning_rate": 1.0632435467726017e-06, - "loss": 2.3918, - "step": 280620 - }, - { - "epoch": 0.98, - "learning_rate": 1.061499666918948e-06, - "loss": 2.373, - "step": 280630 - }, - { - "epoch": 0.98, - "learning_rate": 1.0597557870652944e-06, - "loss": 2.2933, - "step": 280640 - }, - { - "epoch": 0.98, - "learning_rate": 1.0580119072116407e-06, - "loss": 2.3902, - "step": 280650 - }, - { - "epoch": 0.98, - "learning_rate": 1.0562680273579872e-06, - "loss": 2.3038, - "step": 280660 - }, - { - "epoch": 0.98, - "learning_rate": 1.0545241475043336e-06, - "loss": 2.3193, - "step": 280670 - }, - { - "epoch": 0.98, - "learning_rate": 1.05278026765068e-06, - "loss": 2.318, - "step": 280680 - }, - { - "epoch": 0.98, - "learning_rate": 1.0510363877970264e-06, - "loss": 2.2825, - "step": 280690 - }, - { - "epoch": 0.98, - "learning_rate": 1.0492925079433727e-06, - "loss": 2.3866, - "step": 280700 - }, - { - "epoch": 0.98, - "learning_rate": 1.0475486280897191e-06, - "loss": 2.3139, - "step": 280710 - }, - { - "epoch": 0.98, - "learning_rate": 1.0458047482360656e-06, - "loss": 2.3015, - "step": 280720 - }, - { - "epoch": 0.98, - "learning_rate": 1.0440608683824119e-06, - "loss": 2.3487, - "step": 280730 - }, - { - "epoch": 0.98, - "learning_rate": 1.0423169885287584e-06, - "loss": 2.3054, - "step": 280740 - }, - { - "epoch": 0.98, - "learning_rate": 1.0405731086751049e-06, - "loss": 2.3619, - "step": 280750 - }, - { - "epoch": 0.98, - "learning_rate": 1.0388292288214511e-06, - "loss": 2.3117, - "step": 280760 - }, - { - "epoch": 0.98, - "learning_rate": 1.0370853489677976e-06, - "loss": 2.2986, - "step": 280770 - }, - { - "epoch": 0.98, - "learning_rate": 1.0353414691141439e-06, - "loss": 2.38, - "step": 280780 - }, - { - "epoch": 0.98, - "learning_rate": 1.0335975892604904e-06, - "loss": 2.3388, - "step": 280790 - }, - { - "epoch": 0.98, - "learning_rate": 1.0318537094068368e-06, - "loss": 2.3113, - "step": 280800 - }, - { - "epoch": 0.98, - "learning_rate": 1.030109829553183e-06, - "loss": 2.3712, - "step": 280810 - }, - { - "epoch": 0.98, - "learning_rate": 1.0283659496995296e-06, - "loss": 2.3473, - "step": 280820 - }, - { - "epoch": 0.98, - "learning_rate": 1.026622069845876e-06, - "loss": 2.2589, - "step": 280830 - }, - { - "epoch": 0.98, - "learning_rate": 1.0248781899922223e-06, - "loss": 2.3086, - "step": 280840 - }, - { - "epoch": 0.98, - "learning_rate": 1.0231343101385688e-06, - "loss": 2.2784, - "step": 280850 - }, - { - "epoch": 0.98, - "learning_rate": 1.021390430284915e-06, - "loss": 2.3585, - "step": 280860 - }, - { - "epoch": 0.98, - "learning_rate": 1.0196465504312616e-06, - "loss": 2.3574, - "step": 280870 - }, - { - "epoch": 0.98, - "learning_rate": 1.017902670577608e-06, - "loss": 2.3566, - "step": 280880 - }, - { - "epoch": 0.98, - "learning_rate": 1.0161587907239543e-06, - "loss": 2.391, - "step": 280890 - }, - { - "epoch": 0.98, - "learning_rate": 1.0144149108703008e-06, - "loss": 2.327, - "step": 280900 - }, - { - "epoch": 0.98, - "learning_rate": 1.012671031016647e-06, - "loss": 2.3959, - "step": 280910 - }, - { - "epoch": 0.98, - "learning_rate": 1.0109271511629935e-06, - "loss": 2.2774, - "step": 280920 - }, - { - "epoch": 0.98, - "learning_rate": 1.00918327130934e-06, - "loss": 2.3272, - "step": 280930 - }, - { - "epoch": 0.98, - "learning_rate": 1.0074393914556863e-06, - "loss": 2.3326, - "step": 280940 - }, - { - "epoch": 0.98, - "learning_rate": 1.0056955116020328e-06, - "loss": 2.35, - "step": 280950 - }, - { - "epoch": 0.98, - "learning_rate": 1.0039516317483793e-06, - "loss": 2.3604, - "step": 280960 - }, - { - "epoch": 0.98, - "learning_rate": 1.0022077518947255e-06, - "loss": 2.3668, - "step": 280970 - }, - { - "epoch": 0.98, - "learning_rate": 1.000463872041072e-06, - "loss": 2.3462, - "step": 280980 - }, - { - "epoch": 0.98, - "learning_rate": 9.987199921874183e-07, - "loss": 2.3687, - "step": 280990 - }, - { - "epoch": 0.98, - "learning_rate": 9.969761123337648e-07, - "loss": 2.2979, - "step": 281000 - }, - { - "epoch": 0.98, - "learning_rate": 9.952322324801112e-07, - "loss": 2.3385, - "step": 281010 - }, - { - "epoch": 0.98, - "learning_rate": 9.934883526264575e-07, - "loss": 2.4258, - "step": 281020 - }, - { - "epoch": 0.98, - "learning_rate": 9.91744472772804e-07, - "loss": 2.3557, - "step": 281030 - }, - { - "epoch": 0.98, - "learning_rate": 9.900005929191503e-07, - "loss": 2.3582, - "step": 281040 - }, - { - "epoch": 0.98, - "learning_rate": 9.882567130654967e-07, - "loss": 2.4087, - "step": 281050 - }, - { - "epoch": 0.98, - "learning_rate": 9.865128332118432e-07, - "loss": 2.3294, - "step": 281060 - }, - { - "epoch": 0.98, - "learning_rate": 9.847689533581895e-07, - "loss": 2.4166, - "step": 281070 - }, - { - "epoch": 0.98, - "learning_rate": 9.83025073504536e-07, - "loss": 2.3247, - "step": 281080 - }, - { - "epoch": 0.98, - "learning_rate": 9.812811936508825e-07, - "loss": 2.4197, - "step": 281090 - }, - { - "epoch": 0.98, - "learning_rate": 9.795373137972287e-07, - "loss": 2.4286, - "step": 281100 - }, - { - "epoch": 0.98, - "learning_rate": 9.777934339435752e-07, - "loss": 2.3266, - "step": 281110 - }, - { - "epoch": 0.98, - "learning_rate": 9.760495540899215e-07, - "loss": 2.2863, - "step": 281120 - }, - { - "epoch": 0.98, - "learning_rate": 9.74305674236268e-07, - "loss": 2.3422, - "step": 281130 - }, - { - "epoch": 0.98, - "learning_rate": 9.725617943826144e-07, - "loss": 2.2647, - "step": 281140 - }, - { - "epoch": 0.98, - "learning_rate": 9.708179145289607e-07, - "loss": 2.3572, - "step": 281150 - }, - { - "epoch": 0.98, - "learning_rate": 9.690740346753072e-07, - "loss": 2.3612, - "step": 281160 - }, - { - "epoch": 0.98, - "learning_rate": 9.673301548216535e-07, - "loss": 2.3459, - "step": 281170 - }, - { - "epoch": 0.98, - "learning_rate": 9.65586274968e-07, - "loss": 2.343, - "step": 281180 - }, - { - "epoch": 0.98, - "learning_rate": 9.638423951143464e-07, - "loss": 2.3679, - "step": 281190 - }, - { - "epoch": 0.98, - "learning_rate": 9.620985152606927e-07, - "loss": 2.3644, - "step": 281200 - }, - { - "epoch": 0.98, - "learning_rate": 9.603546354070392e-07, - "loss": 2.2363, - "step": 281210 - }, - { - "epoch": 0.98, - "learning_rate": 9.586107555533854e-07, - "loss": 2.3714, - "step": 281220 - }, - { - "epoch": 0.98, - "learning_rate": 9.56866875699732e-07, - "loss": 2.3376, - "step": 281230 - }, - { - "epoch": 0.98, - "learning_rate": 9.551229958460784e-07, - "loss": 2.3771, - "step": 281240 - }, - { - "epoch": 0.98, - "learning_rate": 9.533791159924246e-07, - "loss": 2.3976, - "step": 281250 - }, - { - "epoch": 0.98, - "learning_rate": 9.51635236138771e-07, - "loss": 2.3164, - "step": 281260 - }, - { - "epoch": 0.98, - "learning_rate": 9.498913562851173e-07, - "loss": 2.3819, - "step": 281270 - }, - { - "epoch": 0.98, - "learning_rate": 9.481474764314638e-07, - "loss": 2.2821, - "step": 281280 - }, - { - "epoch": 0.98, - "learning_rate": 9.464035965778103e-07, - "loss": 2.3486, - "step": 281290 - }, - { - "epoch": 0.98, - "learning_rate": 9.446597167241565e-07, - "loss": 2.2531, - "step": 281300 - }, - { - "epoch": 0.98, - "learning_rate": 9.42915836870503e-07, - "loss": 2.3854, - "step": 281310 - }, - { - "epoch": 0.98, - "learning_rate": 9.411719570168493e-07, - "loss": 2.2448, - "step": 281320 - }, - { - "epoch": 0.98, - "learning_rate": 9.394280771631958e-07, - "loss": 2.3203, - "step": 281330 - }, - { - "epoch": 0.98, - "learning_rate": 9.376841973095423e-07, - "loss": 2.3181, - "step": 281340 - }, - { - "epoch": 0.98, - "learning_rate": 9.359403174558885e-07, - "loss": 2.3696, - "step": 281350 - }, - { - "epoch": 0.98, - "learning_rate": 9.34196437602235e-07, - "loss": 2.3394, - "step": 281360 - }, - { - "epoch": 0.98, - "learning_rate": 9.324525577485813e-07, - "loss": 2.3591, - "step": 281370 - }, - { - "epoch": 0.98, - "learning_rate": 9.307086778949278e-07, - "loss": 2.2944, - "step": 281380 - }, - { - "epoch": 0.98, - "learning_rate": 9.289647980412742e-07, - "loss": 2.4315, - "step": 281390 - }, - { - "epoch": 0.98, - "learning_rate": 9.272209181876205e-07, - "loss": 2.3634, - "step": 281400 - }, - { - "epoch": 0.98, - "learning_rate": 9.25477038333967e-07, - "loss": 2.3138, - "step": 281410 - }, - { - "epoch": 0.98, - "learning_rate": 9.237331584803134e-07, - "loss": 2.3839, - "step": 281420 - }, - { - "epoch": 0.98, - "learning_rate": 9.219892786266597e-07, - "loss": 2.3177, - "step": 281430 - }, - { - "epoch": 0.98, - "learning_rate": 9.202453987730062e-07, - "loss": 2.3894, - "step": 281440 - }, - { - "epoch": 0.98, - "learning_rate": 9.185015189193525e-07, - "loss": 2.2278, - "step": 281450 - }, - { - "epoch": 0.98, - "learning_rate": 9.16757639065699e-07, - "loss": 2.2884, - "step": 281460 - }, - { - "epoch": 0.98, - "learning_rate": 9.150137592120453e-07, - "loss": 2.3761, - "step": 281470 - }, - { - "epoch": 0.98, - "learning_rate": 9.132698793583917e-07, - "loss": 2.294, - "step": 281480 - }, - { - "epoch": 0.98, - "learning_rate": 9.115259995047382e-07, - "loss": 2.288, - "step": 281490 - }, - { - "epoch": 0.98, - "learning_rate": 9.097821196510845e-07, - "loss": 2.3138, - "step": 281500 - }, - { - "epoch": 0.98, - "learning_rate": 9.08038239797431e-07, - "loss": 2.3369, - "step": 281510 - }, - { - "epoch": 0.98, - "learning_rate": 9.062943599437773e-07, - "loss": 2.3283, - "step": 281520 - }, - { - "epoch": 0.98, - "learning_rate": 9.045504800901237e-07, - "loss": 2.3233, - "step": 281530 - }, - { - "epoch": 0.98, - "learning_rate": 9.028066002364702e-07, - "loss": 2.2671, - "step": 281540 - }, - { - "epoch": 0.98, - "learning_rate": 9.010627203828166e-07, - "loss": 2.3504, - "step": 281550 - }, - { - "epoch": 0.98, - "learning_rate": 8.993188405291629e-07, - "loss": 2.3056, - "step": 281560 - }, - { - "epoch": 0.98, - "learning_rate": 8.975749606755093e-07, - "loss": 2.4085, - "step": 281570 - }, - { - "epoch": 0.98, - "learning_rate": 8.958310808218557e-07, - "loss": 2.3825, - "step": 281580 - }, - { - "epoch": 0.98, - "learning_rate": 8.940872009682022e-07, - "loss": 2.3499, - "step": 281590 - }, - { - "epoch": 0.98, - "learning_rate": 8.923433211145485e-07, - "loss": 2.3309, - "step": 281600 - }, - { - "epoch": 0.98, - "learning_rate": 8.905994412608949e-07, - "loss": 2.2264, - "step": 281610 - }, - { - "epoch": 0.98, - "learning_rate": 8.888555614072413e-07, - "loss": 2.3761, - "step": 281620 - }, - { - "epoch": 0.98, - "learning_rate": 8.871116815535878e-07, - "loss": 2.335, - "step": 281630 - }, - { - "epoch": 0.98, - "learning_rate": 8.853678016999341e-07, - "loss": 2.3898, - "step": 281640 - }, - { - "epoch": 0.98, - "learning_rate": 8.836239218462805e-07, - "loss": 2.3194, - "step": 281650 - }, - { - "epoch": 0.98, - "learning_rate": 8.818800419926269e-07, - "loss": 2.3476, - "step": 281660 - }, - { - "epoch": 0.98, - "learning_rate": 8.801361621389733e-07, - "loss": 2.3572, - "step": 281670 - }, - { - "epoch": 0.98, - "learning_rate": 8.783922822853198e-07, - "loss": 2.3646, - "step": 281680 - }, - { - "epoch": 0.98, - "learning_rate": 8.766484024316661e-07, - "loss": 2.2714, - "step": 281690 - }, - { - "epoch": 0.98, - "learning_rate": 8.749045225780125e-07, - "loss": 2.3454, - "step": 281700 - }, - { - "epoch": 0.98, - "learning_rate": 8.731606427243589e-07, - "loss": 2.3261, - "step": 281710 - }, - { - "epoch": 0.98, - "learning_rate": 8.714167628707053e-07, - "loss": 2.3365, - "step": 281720 - }, - { - "epoch": 0.98, - "learning_rate": 8.696728830170517e-07, - "loss": 2.3636, - "step": 281730 - }, - { - "epoch": 0.98, - "learning_rate": 8.679290031633981e-07, - "loss": 2.373, - "step": 281740 - }, - { - "epoch": 0.98, - "learning_rate": 8.661851233097445e-07, - "loss": 2.3549, - "step": 281750 - }, - { - "epoch": 0.98, - "learning_rate": 8.64441243456091e-07, - "loss": 2.277, - "step": 281760 - }, - { - "epoch": 0.98, - "learning_rate": 8.626973636024372e-07, - "loss": 2.3167, - "step": 281770 - }, - { - "epoch": 0.98, - "learning_rate": 8.609534837487837e-07, - "loss": 2.2656, - "step": 281780 - }, - { - "epoch": 0.98, - "learning_rate": 8.592096038951301e-07, - "loss": 2.2952, - "step": 281790 - }, - { - "epoch": 0.98, - "learning_rate": 8.574657240414765e-07, - "loss": 2.2873, - "step": 281800 - }, - { - "epoch": 0.98, - "learning_rate": 8.557218441878229e-07, - "loss": 2.3304, - "step": 281810 - }, - { - "epoch": 0.98, - "learning_rate": 8.539779643341692e-07, - "loss": 2.3978, - "step": 281820 - }, - { - "epoch": 0.98, - "learning_rate": 8.522340844805157e-07, - "loss": 2.3379, - "step": 281830 - }, - { - "epoch": 0.98, - "learning_rate": 8.504902046268621e-07, - "loss": 2.2752, - "step": 281840 - }, - { - "epoch": 0.98, - "learning_rate": 8.487463247732084e-07, - "loss": 2.3552, - "step": 281850 - }, - { - "epoch": 0.98, - "learning_rate": 8.470024449195549e-07, - "loss": 2.287, - "step": 281860 - }, - { - "epoch": 0.98, - "learning_rate": 8.452585650659012e-07, - "loss": 2.282, - "step": 281870 - }, - { - "epoch": 0.98, - "learning_rate": 8.435146852122477e-07, - "loss": 2.3143, - "step": 281880 - }, - { - "epoch": 0.98, - "learning_rate": 8.417708053585942e-07, - "loss": 2.3158, - "step": 281890 - }, - { - "epoch": 0.98, - "learning_rate": 8.400269255049404e-07, - "loss": 2.2618, - "step": 281900 - }, - { - "epoch": 0.98, - "learning_rate": 8.382830456512869e-07, - "loss": 2.3409, - "step": 281910 - }, - { - "epoch": 0.98, - "learning_rate": 8.365391657976332e-07, - "loss": 2.3767, - "step": 281920 - }, - { - "epoch": 0.98, - "learning_rate": 8.347952859439797e-07, - "loss": 2.2711, - "step": 281930 - }, - { - "epoch": 0.98, - "learning_rate": 8.330514060903261e-07, - "loss": 2.3815, - "step": 281940 - }, - { - "epoch": 0.98, - "learning_rate": 8.313075262366724e-07, - "loss": 2.2724, - "step": 281950 - }, - { - "epoch": 0.98, - "learning_rate": 8.295636463830189e-07, - "loss": 2.3543, - "step": 281960 - }, - { - "epoch": 0.98, - "learning_rate": 8.278197665293653e-07, - "loss": 2.3453, - "step": 281970 - }, - { - "epoch": 0.98, - "learning_rate": 8.260758866757116e-07, - "loss": 2.3363, - "step": 281980 - }, - { - "epoch": 0.98, - "learning_rate": 8.243320068220581e-07, - "loss": 2.3354, - "step": 281990 - }, - { - "epoch": 0.98, - "learning_rate": 8.225881269684044e-07, - "loss": 2.3087, - "step": 282000 - }, - { - "epoch": 0.98, - "learning_rate": 8.208442471147509e-07, - "loss": 2.3674, - "step": 282010 - }, - { - "epoch": 0.98, - "learning_rate": 8.191003672610974e-07, - "loss": 2.344, - "step": 282020 - }, - { - "epoch": 0.98, - "learning_rate": 8.173564874074436e-07, - "loss": 2.3747, - "step": 282030 - }, - { - "epoch": 0.98, - "learning_rate": 8.156126075537901e-07, - "loss": 2.3266, - "step": 282040 - }, - { - "epoch": 0.98, - "learning_rate": 8.138687277001364e-07, - "loss": 2.3022, - "step": 282050 - }, - { - "epoch": 0.98, - "learning_rate": 8.121248478464829e-07, - "loss": 2.3633, - "step": 282060 - }, - { - "epoch": 0.98, - "learning_rate": 8.103809679928293e-07, - "loss": 2.2927, - "step": 282070 - }, - { - "epoch": 0.98, - "learning_rate": 8.086370881391756e-07, - "loss": 2.3445, - "step": 282080 - }, - { - "epoch": 0.98, - "learning_rate": 8.068932082855221e-07, - "loss": 2.2949, - "step": 282090 - }, - { - "epoch": 0.98, - "learning_rate": 8.051493284318684e-07, - "loss": 2.3551, - "step": 282100 - }, - { - "epoch": 0.98, - "learning_rate": 8.034054485782148e-07, - "loss": 2.3136, - "step": 282110 - }, - { - "epoch": 0.98, - "learning_rate": 8.016615687245613e-07, - "loss": 2.382, - "step": 282120 - }, - { - "epoch": 0.98, - "learning_rate": 7.999176888709076e-07, - "loss": 2.3544, - "step": 282130 - }, - { - "epoch": 0.98, - "learning_rate": 7.981738090172541e-07, - "loss": 2.3458, - "step": 282140 - }, - { - "epoch": 0.98, - "learning_rate": 7.964299291636003e-07, - "loss": 2.2563, - "step": 282150 - }, - { - "epoch": 0.98, - "learning_rate": 7.946860493099468e-07, - "loss": 2.3455, - "step": 282160 - }, - { - "epoch": 0.98, - "learning_rate": 7.929421694562933e-07, - "loss": 2.3211, - "step": 282170 - }, - { - "epoch": 0.98, - "learning_rate": 7.911982896026396e-07, - "loss": 2.3328, - "step": 282180 - }, - { - "epoch": 0.98, - "learning_rate": 7.89454409748986e-07, - "loss": 2.4276, - "step": 282190 - }, - { - "epoch": 0.98, - "learning_rate": 7.877105298953323e-07, - "loss": 2.3753, - "step": 282200 - }, - { - "epoch": 0.98, - "learning_rate": 7.859666500416788e-07, - "loss": 2.3778, - "step": 282210 - }, - { - "epoch": 0.98, - "learning_rate": 7.842227701880253e-07, - "loss": 2.2464, - "step": 282220 - }, - { - "epoch": 0.98, - "learning_rate": 7.824788903343715e-07, - "loss": 2.3475, - "step": 282230 - }, - { - "epoch": 0.98, - "learning_rate": 7.807350104807179e-07, - "loss": 2.2435, - "step": 282240 - }, - { - "epoch": 0.98, - "learning_rate": 7.789911306270644e-07, - "loss": 2.2741, - "step": 282250 - }, - { - "epoch": 0.98, - "learning_rate": 7.772472507734108e-07, - "loss": 2.3004, - "step": 282260 - }, - { - "epoch": 0.98, - "learning_rate": 7.755033709197572e-07, - "loss": 2.2979, - "step": 282270 - }, - { - "epoch": 0.98, - "learning_rate": 7.737594910661035e-07, - "loss": 2.2956, - "step": 282280 - }, - { - "epoch": 0.98, - "learning_rate": 7.720156112124499e-07, - "loss": 2.3233, - "step": 282290 - }, - { - "epoch": 0.98, - "learning_rate": 7.702717313587964e-07, - "loss": 2.2008, - "step": 282300 - }, - { - "epoch": 0.98, - "learning_rate": 7.685278515051428e-07, - "loss": 2.3525, - "step": 282310 - }, - { - "epoch": 0.98, - "learning_rate": 7.667839716514891e-07, - "loss": 2.235, - "step": 282320 - }, - { - "epoch": 0.98, - "learning_rate": 7.650400917978355e-07, - "loss": 2.3593, - "step": 282330 - }, - { - "epoch": 0.98, - "learning_rate": 7.63296211944182e-07, - "loss": 2.3963, - "step": 282340 - }, - { - "epoch": 0.98, - "learning_rate": 7.615523320905284e-07, - "loss": 2.3911, - "step": 282350 - }, - { - "epoch": 0.98, - "learning_rate": 7.598084522368747e-07, - "loss": 2.3703, - "step": 282360 - }, - { - "epoch": 0.98, - "learning_rate": 7.580645723832211e-07, - "loss": 2.3119, - "step": 282370 - }, - { - "epoch": 0.98, - "learning_rate": 7.563206925295675e-07, - "loss": 2.3903, - "step": 282380 - }, - { - "epoch": 0.98, - "learning_rate": 7.54576812675914e-07, - "loss": 2.3027, - "step": 282390 - }, - { - "epoch": 0.98, - "learning_rate": 7.528329328222604e-07, - "loss": 2.3275, - "step": 282400 - }, - { - "epoch": 0.98, - "learning_rate": 7.510890529686067e-07, - "loss": 2.3849, - "step": 282410 - }, - { - "epoch": 0.99, - "learning_rate": 7.493451731149531e-07, - "loss": 2.3039, - "step": 282420 - }, - { - "epoch": 0.99, - "learning_rate": 7.476012932612995e-07, - "loss": 2.377, - "step": 282430 - }, - { - "epoch": 0.99, - "learning_rate": 7.45857413407646e-07, - "loss": 2.2787, - "step": 282440 - }, - { - "epoch": 0.99, - "learning_rate": 7.441135335539923e-07, - "loss": 2.3314, - "step": 282450 - }, - { - "epoch": 0.99, - "learning_rate": 7.423696537003387e-07, - "loss": 2.2548, - "step": 282460 - }, - { - "epoch": 0.99, - "learning_rate": 7.406257738466851e-07, - "loss": 2.3269, - "step": 282470 - }, - { - "epoch": 0.99, - "learning_rate": 7.388818939930315e-07, - "loss": 2.3293, - "step": 282480 - }, - { - "epoch": 0.99, - "learning_rate": 7.371380141393779e-07, - "loss": 2.3191, - "step": 282490 - }, - { - "epoch": 0.99, - "learning_rate": 7.353941342857243e-07, - "loss": 2.228, - "step": 282500 - }, - { - "epoch": 0.99, - "learning_rate": 7.336502544320707e-07, - "loss": 2.4329, - "step": 282510 - }, - { - "epoch": 0.99, - "learning_rate": 7.319063745784171e-07, - "loss": 2.3127, - "step": 282520 - }, - { - "epoch": 0.99, - "learning_rate": 7.301624947247634e-07, - "loss": 2.3122, - "step": 282530 - }, - { - "epoch": 0.99, - "learning_rate": 7.284186148711099e-07, - "loss": 2.3745, - "step": 282540 - }, - { - "epoch": 0.99, - "learning_rate": 7.266747350174563e-07, - "loss": 2.3631, - "step": 282550 - }, - { - "epoch": 0.99, - "learning_rate": 7.249308551638027e-07, - "loss": 2.3507, - "step": 282560 - }, - { - "epoch": 0.99, - "learning_rate": 7.23186975310149e-07, - "loss": 2.41, - "step": 282570 - }, - { - "epoch": 0.99, - "learning_rate": 7.214430954564954e-07, - "loss": 2.2302, - "step": 282580 - }, - { - "epoch": 0.99, - "learning_rate": 7.196992156028419e-07, - "loss": 2.3326, - "step": 282590 - }, - { - "epoch": 0.99, - "learning_rate": 7.179553357491883e-07, - "loss": 2.3485, - "step": 282600 - }, - { - "epoch": 0.99, - "learning_rate": 7.162114558955347e-07, - "loss": 2.2698, - "step": 282610 - }, - { - "epoch": 0.99, - "learning_rate": 7.14467576041881e-07, - "loss": 2.3212, - "step": 282620 - }, - { - "epoch": 0.99, - "learning_rate": 7.127236961882274e-07, - "loss": 2.3231, - "step": 282630 - }, - { - "epoch": 0.99, - "learning_rate": 7.109798163345739e-07, - "loss": 2.3417, - "step": 282640 - }, - { - "epoch": 0.99, - "learning_rate": 7.092359364809203e-07, - "loss": 2.3404, - "step": 282650 - }, - { - "epoch": 0.99, - "learning_rate": 7.074920566272666e-07, - "loss": 2.2906, - "step": 282660 - }, - { - "epoch": 0.99, - "learning_rate": 7.05748176773613e-07, - "loss": 2.3511, - "step": 282670 - }, - { - "epoch": 0.99, - "learning_rate": 7.040042969199594e-07, - "loss": 2.2879, - "step": 282680 - }, - { - "epoch": 0.99, - "learning_rate": 7.022604170663059e-07, - "loss": 2.3241, - "step": 282690 - }, - { - "epoch": 0.99, - "learning_rate": 7.005165372126522e-07, - "loss": 2.2852, - "step": 282700 - }, - { - "epoch": 0.99, - "learning_rate": 6.987726573589986e-07, - "loss": 2.4131, - "step": 282710 - }, - { - "epoch": 0.99, - "learning_rate": 6.97028777505345e-07, - "loss": 2.3323, - "step": 282720 - }, - { - "epoch": 0.99, - "learning_rate": 6.952848976516914e-07, - "loss": 2.3137, - "step": 282730 - }, - { - "epoch": 0.99, - "learning_rate": 6.935410177980378e-07, - "loss": 2.249, - "step": 282740 - }, - { - "epoch": 0.99, - "learning_rate": 6.917971379443842e-07, - "loss": 2.2877, - "step": 282750 - }, - { - "epoch": 0.99, - "learning_rate": 6.900532580907306e-07, - "loss": 2.2895, - "step": 282760 - }, - { - "epoch": 0.99, - "learning_rate": 6.88309378237077e-07, - "loss": 2.3724, - "step": 282770 - }, - { - "epoch": 0.99, - "learning_rate": 6.865654983834233e-07, - "loss": 2.3992, - "step": 282780 - }, - { - "epoch": 0.99, - "learning_rate": 6.848216185297698e-07, - "loss": 2.2934, - "step": 282790 - }, - { - "epoch": 0.99, - "learning_rate": 6.830777386761162e-07, - "loss": 2.3613, - "step": 282800 - }, - { - "epoch": 0.99, - "learning_rate": 6.813338588224626e-07, - "loss": 2.3402, - "step": 282810 - }, - { - "epoch": 0.99, - "learning_rate": 6.79589978968809e-07, - "loss": 2.3588, - "step": 282820 - }, - { - "epoch": 0.99, - "learning_rate": 6.778460991151553e-07, - "loss": 2.319, - "step": 282830 - }, - { - "epoch": 0.99, - "learning_rate": 6.761022192615018e-07, - "loss": 2.3636, - "step": 282840 - }, - { - "epoch": 0.99, - "learning_rate": 6.743583394078482e-07, - "loss": 2.3509, - "step": 282850 - }, - { - "epoch": 0.99, - "learning_rate": 6.726144595541946e-07, - "loss": 2.3746, - "step": 282860 - }, - { - "epoch": 0.99, - "learning_rate": 6.708705797005409e-07, - "loss": 2.3772, - "step": 282870 - }, - { - "epoch": 0.99, - "learning_rate": 6.691266998468873e-07, - "loss": 2.3842, - "step": 282880 - }, - { - "epoch": 0.99, - "learning_rate": 6.673828199932338e-07, - "loss": 2.2784, - "step": 282890 - }, - { - "epoch": 0.99, - "learning_rate": 6.656389401395802e-07, - "loss": 2.3813, - "step": 282900 - }, - { - "epoch": 0.99, - "learning_rate": 6.638950602859265e-07, - "loss": 2.2373, - "step": 282910 - }, - { - "epoch": 0.99, - "learning_rate": 6.621511804322729e-07, - "loss": 2.3699, - "step": 282920 - }, - { - "epoch": 0.99, - "learning_rate": 6.604073005786193e-07, - "loss": 2.3536, - "step": 282930 - }, - { - "epoch": 0.99, - "learning_rate": 6.586634207249658e-07, - "loss": 2.2131, - "step": 282940 - }, - { - "epoch": 0.99, - "learning_rate": 6.569195408713121e-07, - "loss": 2.2766, - "step": 282950 - }, - { - "epoch": 0.99, - "learning_rate": 6.551756610176585e-07, - "loss": 2.4027, - "step": 282960 - }, - { - "epoch": 0.99, - "learning_rate": 6.534317811640049e-07, - "loss": 2.343, - "step": 282970 - }, - { - "epoch": 0.99, - "learning_rate": 6.516879013103513e-07, - "loss": 2.3381, - "step": 282980 - }, - { - "epoch": 0.99, - "learning_rate": 6.499440214566978e-07, - "loss": 2.3429, - "step": 282990 - }, - { - "epoch": 0.99, - "learning_rate": 6.482001416030441e-07, - "loss": 2.3695, - "step": 283000 - }, - { - "epoch": 0.99, - "learning_rate": 6.464562617493905e-07, - "loss": 2.3262, - "step": 283010 - }, - { - "epoch": 0.99, - "learning_rate": 6.447123818957369e-07, - "loss": 2.3401, - "step": 283020 - }, - { - "epoch": 0.99, - "learning_rate": 6.429685020420834e-07, - "loss": 2.3313, - "step": 283030 - }, - { - "epoch": 0.99, - "learning_rate": 6.412246221884297e-07, - "loss": 2.2955, - "step": 283040 - }, - { - "epoch": 0.99, - "learning_rate": 6.394807423347761e-07, - "loss": 2.2764, - "step": 283050 - }, - { - "epoch": 0.99, - "learning_rate": 6.377368624811225e-07, - "loss": 2.2873, - "step": 283060 - }, - { - "epoch": 0.99, - "learning_rate": 6.359929826274689e-07, - "loss": 2.3367, - "step": 283070 - }, - { - "epoch": 0.99, - "learning_rate": 6.342491027738153e-07, - "loss": 2.417, - "step": 283080 - }, - { - "epoch": 0.99, - "learning_rate": 6.325052229201617e-07, - "loss": 2.3281, - "step": 283090 - }, - { - "epoch": 0.99, - "learning_rate": 6.307613430665081e-07, - "loss": 2.2836, - "step": 283100 - }, - { - "epoch": 0.99, - "learning_rate": 6.290174632128545e-07, - "loss": 2.2985, - "step": 283110 - }, - { - "epoch": 0.99, - "learning_rate": 6.272735833592008e-07, - "loss": 2.3593, - "step": 283120 - }, - { - "epoch": 0.99, - "learning_rate": 6.255297035055473e-07, - "loss": 2.3097, - "step": 283130 - }, - { - "epoch": 0.99, - "learning_rate": 6.237858236518937e-07, - "loss": 2.3018, - "step": 283140 - }, - { - "epoch": 0.99, - "learning_rate": 6.220419437982401e-07, - "loss": 2.3755, - "step": 283150 - }, - { - "epoch": 0.99, - "learning_rate": 6.202980639445865e-07, - "loss": 2.3526, - "step": 283160 - }, - { - "epoch": 0.99, - "learning_rate": 6.185541840909328e-07, - "loss": 2.3508, - "step": 283170 - }, - { - "epoch": 0.99, - "learning_rate": 6.168103042372793e-07, - "loss": 2.338, - "step": 283180 - }, - { - "epoch": 0.99, - "learning_rate": 6.150664243836257e-07, - "loss": 2.1332, - "step": 283190 - }, - { - "epoch": 0.99, - "learning_rate": 6.133225445299721e-07, - "loss": 2.3001, - "step": 283200 - }, - { - "epoch": 0.99, - "learning_rate": 6.115786646763184e-07, - "loss": 2.3204, - "step": 283210 - }, - { - "epoch": 0.99, - "learning_rate": 6.098347848226648e-07, - "loss": 2.2727, - "step": 283220 - }, - { - "epoch": 0.99, - "learning_rate": 6.080909049690113e-07, - "loss": 2.3279, - "step": 283230 - }, - { - "epoch": 0.99, - "learning_rate": 6.063470251153577e-07, - "loss": 2.3629, - "step": 283240 - }, - { - "epoch": 0.99, - "learning_rate": 6.04603145261704e-07, - "loss": 2.3158, - "step": 283250 - }, - { - "epoch": 0.99, - "learning_rate": 6.028592654080504e-07, - "loss": 2.3372, - "step": 283260 - }, - { - "epoch": 0.99, - "learning_rate": 6.011153855543968e-07, - "loss": 2.2748, - "step": 283270 - }, - { - "epoch": 0.99, - "learning_rate": 5.993715057007433e-07, - "loss": 2.31, - "step": 283280 - }, - { - "epoch": 0.99, - "learning_rate": 5.976276258470896e-07, - "loss": 2.3231, - "step": 283290 - }, - { - "epoch": 0.99, - "learning_rate": 5.95883745993436e-07, - "loss": 2.286, - "step": 283300 - }, - { - "epoch": 0.99, - "learning_rate": 5.941398661397824e-07, - "loss": 2.3155, - "step": 283310 - }, - { - "epoch": 0.99, - "learning_rate": 5.923959862861289e-07, - "loss": 2.3249, - "step": 283320 - }, - { - "epoch": 0.99, - "learning_rate": 5.906521064324753e-07, - "loss": 2.3789, - "step": 283330 - }, - { - "epoch": 0.99, - "learning_rate": 5.889082265788216e-07, - "loss": 2.3361, - "step": 283340 - }, - { - "epoch": 0.99, - "learning_rate": 5.87164346725168e-07, - "loss": 2.3074, - "step": 283350 - }, - { - "epoch": 0.99, - "learning_rate": 5.854204668715145e-07, - "loss": 2.3405, - "step": 283360 - }, - { - "epoch": 0.99, - "learning_rate": 5.836765870178609e-07, - "loss": 2.3741, - "step": 283370 - }, - { - "epoch": 0.99, - "learning_rate": 5.819327071642072e-07, - "loss": 2.3988, - "step": 283380 - }, - { - "epoch": 0.99, - "learning_rate": 5.801888273105536e-07, - "loss": 2.3032, - "step": 283390 - }, - { - "epoch": 0.99, - "learning_rate": 5.784449474569001e-07, - "loss": 2.3074, - "step": 283400 - }, - { - "epoch": 0.99, - "learning_rate": 5.767010676032465e-07, - "loss": 2.4214, - "step": 283410 - }, - { - "epoch": 0.99, - "learning_rate": 5.749571877495928e-07, - "loss": 2.3618, - "step": 283420 - }, - { - "epoch": 0.99, - "learning_rate": 5.732133078959392e-07, - "loss": 2.2689, - "step": 283430 - }, - { - "epoch": 0.99, - "learning_rate": 5.714694280422856e-07, - "loss": 2.3147, - "step": 283440 - }, - { - "epoch": 0.99, - "learning_rate": 5.697255481886321e-07, - "loss": 2.3397, - "step": 283450 - }, - { - "epoch": 0.99, - "learning_rate": 5.679816683349784e-07, - "loss": 2.3017, - "step": 283460 - }, - { - "epoch": 0.99, - "learning_rate": 5.662377884813248e-07, - "loss": 2.3301, - "step": 283470 - }, - { - "epoch": 0.99, - "learning_rate": 5.644939086276712e-07, - "loss": 2.3528, - "step": 283480 - }, - { - "epoch": 0.99, - "learning_rate": 5.627500287740177e-07, - "loss": 2.2974, - "step": 283490 - }, - { - "epoch": 0.99, - "learning_rate": 5.61006148920364e-07, - "loss": 2.325, - "step": 283500 - }, - { - "epoch": 0.99, - "learning_rate": 5.592622690667104e-07, - "loss": 2.2558, - "step": 283510 - }, - { - "epoch": 0.99, - "learning_rate": 5.575183892130568e-07, - "loss": 2.328, - "step": 283520 - }, - { - "epoch": 0.99, - "learning_rate": 5.557745093594033e-07, - "loss": 2.2929, - "step": 283530 - }, - { - "epoch": 0.99, - "learning_rate": 5.540306295057497e-07, - "loss": 2.3235, - "step": 283540 - }, - { - "epoch": 0.99, - "learning_rate": 5.52286749652096e-07, - "loss": 2.3238, - "step": 283550 - }, - { - "epoch": 0.99, - "learning_rate": 5.505428697984424e-07, - "loss": 2.3884, - "step": 283560 - }, - { - "epoch": 0.99, - "learning_rate": 5.487989899447888e-07, - "loss": 2.3215, - "step": 283570 - }, - { - "epoch": 0.99, - "learning_rate": 5.470551100911353e-07, - "loss": 2.2962, - "step": 283580 - }, - { - "epoch": 0.99, - "learning_rate": 5.453112302374816e-07, - "loss": 2.3559, - "step": 283590 - }, - { - "epoch": 0.99, - "learning_rate": 5.43567350383828e-07, - "loss": 2.4084, - "step": 283600 - }, - { - "epoch": 0.99, - "learning_rate": 5.418234705301744e-07, - "loss": 2.3084, - "step": 283610 - }, - { - "epoch": 0.99, - "learning_rate": 5.400795906765208e-07, - "loss": 2.3351, - "step": 283620 - }, - { - "epoch": 0.99, - "learning_rate": 5.383357108228672e-07, - "loss": 2.2856, - "step": 283630 - }, - { - "epoch": 0.99, - "learning_rate": 5.365918309692136e-07, - "loss": 2.289, - "step": 283640 - }, - { - "epoch": 0.99, - "learning_rate": 5.3484795111556e-07, - "loss": 2.2906, - "step": 283650 - }, - { - "epoch": 0.99, - "learning_rate": 5.331040712619064e-07, - "loss": 2.3654, - "step": 283660 - }, - { - "epoch": 0.99, - "learning_rate": 5.313601914082527e-07, - "loss": 2.3686, - "step": 283670 - }, - { - "epoch": 0.99, - "learning_rate": 5.296163115545992e-07, - "loss": 2.2228, - "step": 283680 - }, - { - "epoch": 0.99, - "learning_rate": 5.278724317009456e-07, - "loss": 2.3487, - "step": 283690 - }, - { - "epoch": 0.99, - "learning_rate": 5.26128551847292e-07, - "loss": 2.3708, - "step": 283700 - }, - { - "epoch": 0.99, - "learning_rate": 5.243846719936384e-07, - "loss": 2.337, - "step": 283710 - }, - { - "epoch": 0.99, - "learning_rate": 5.226407921399848e-07, - "loss": 2.3726, - "step": 283720 - }, - { - "epoch": 0.99, - "learning_rate": 5.208969122863312e-07, - "loss": 2.3544, - "step": 283730 - }, - { - "epoch": 0.99, - "learning_rate": 5.191530324326776e-07, - "loss": 2.3003, - "step": 283740 - }, - { - "epoch": 0.99, - "learning_rate": 5.17409152579024e-07, - "loss": 2.3209, - "step": 283750 - }, - { - "epoch": 0.99, - "learning_rate": 5.156652727253703e-07, - "loss": 2.3011, - "step": 283760 - }, - { - "epoch": 0.99, - "learning_rate": 5.139213928717168e-07, - "loss": 2.3031, - "step": 283770 - }, - { - "epoch": 0.99, - "learning_rate": 5.121775130180632e-07, - "loss": 2.3173, - "step": 283780 - }, - { - "epoch": 0.99, - "learning_rate": 5.104336331644096e-07, - "loss": 2.3157, - "step": 283790 - }, - { - "epoch": 0.99, - "learning_rate": 5.086897533107559e-07, - "loss": 2.3441, - "step": 283800 - }, - { - "epoch": 0.99, - "learning_rate": 5.069458734571023e-07, - "loss": 2.307, - "step": 283810 - }, - { - "epoch": 0.99, - "learning_rate": 5.052019936034488e-07, - "loss": 2.3253, - "step": 283820 - }, - { - "epoch": 0.99, - "learning_rate": 5.034581137497952e-07, - "loss": 2.3387, - "step": 283830 - }, - { - "epoch": 0.99, - "learning_rate": 5.017142338961415e-07, - "loss": 2.3904, - "step": 283840 - }, - { - "epoch": 0.99, - "learning_rate": 4.999703540424879e-07, - "loss": 2.3929, - "step": 283850 - }, - { - "epoch": 0.99, - "learning_rate": 4.982264741888343e-07, - "loss": 2.2951, - "step": 283860 - }, - { - "epoch": 0.99, - "learning_rate": 4.964825943351808e-07, - "loss": 2.3627, - "step": 283870 - }, - { - "epoch": 0.99, - "learning_rate": 4.947387144815272e-07, - "loss": 2.253, - "step": 283880 - }, - { - "epoch": 0.99, - "learning_rate": 4.929948346278735e-07, - "loss": 2.2877, - "step": 283890 - }, - { - "epoch": 0.99, - "learning_rate": 4.912509547742199e-07, - "loss": 2.2268, - "step": 283900 - }, - { - "epoch": 0.99, - "learning_rate": 4.895070749205663e-07, - "loss": 2.4325, - "step": 283910 - }, - { - "epoch": 0.99, - "learning_rate": 4.877631950669128e-07, - "loss": 2.422, - "step": 283920 - }, - { - "epoch": 0.99, - "learning_rate": 4.860193152132591e-07, - "loss": 2.349, - "step": 283930 - }, - { - "epoch": 0.99, - "learning_rate": 4.842754353596055e-07, - "loss": 2.2907, - "step": 283940 - }, - { - "epoch": 0.99, - "learning_rate": 4.825315555059519e-07, - "loss": 2.3822, - "step": 283950 - }, - { - "epoch": 0.99, - "learning_rate": 4.807876756522983e-07, - "loss": 2.2989, - "step": 283960 - }, - { - "epoch": 0.99, - "learning_rate": 4.790437957986447e-07, - "loss": 2.3539, - "step": 283970 - }, - { - "epoch": 0.99, - "learning_rate": 4.772999159449911e-07, - "loss": 2.2657, - "step": 283980 - }, - { - "epoch": 0.99, - "learning_rate": 4.755560360913375e-07, - "loss": 2.2122, - "step": 283990 - }, - { - "epoch": 0.99, - "learning_rate": 4.7381215623768387e-07, - "loss": 2.3463, - "step": 284000 - }, - { - "epoch": 0.99, - "learning_rate": 4.7206827638403024e-07, - "loss": 2.2298, - "step": 284010 - }, - { - "epoch": 0.99, - "learning_rate": 4.703243965303767e-07, - "loss": 2.3329, - "step": 284020 - }, - { - "epoch": 0.99, - "learning_rate": 4.685805166767231e-07, - "loss": 2.3806, - "step": 284030 - }, - { - "epoch": 0.99, - "learning_rate": 4.668366368230695e-07, - "loss": 2.3717, - "step": 284040 - }, - { - "epoch": 0.99, - "learning_rate": 4.6509275696941585e-07, - "loss": 2.2847, - "step": 284050 - }, - { - "epoch": 0.99, - "learning_rate": 4.633488771157622e-07, - "loss": 2.3827, - "step": 284060 - }, - { - "epoch": 0.99, - "learning_rate": 4.616049972621087e-07, - "loss": 2.268, - "step": 284070 - }, - { - "epoch": 0.99, - "learning_rate": 4.598611174084551e-07, - "loss": 2.2801, - "step": 284080 - }, - { - "epoch": 0.99, - "learning_rate": 4.5811723755480146e-07, - "loss": 2.3017, - "step": 284090 - }, - { - "epoch": 0.99, - "learning_rate": 4.5637335770114783e-07, - "loss": 2.3361, - "step": 284100 - }, - { - "epoch": 0.99, - "learning_rate": 4.546294778474942e-07, - "loss": 2.2968, - "step": 284110 - }, - { - "epoch": 0.99, - "learning_rate": 4.528855979938407e-07, - "loss": 2.3798, - "step": 284120 - }, - { - "epoch": 0.99, - "learning_rate": 4.5114171814018706e-07, - "loss": 2.348, - "step": 284130 - }, - { - "epoch": 0.99, - "learning_rate": 4.4939783828653344e-07, - "loss": 2.3687, - "step": 284140 - }, - { - "epoch": 0.99, - "learning_rate": 4.476539584328798e-07, - "loss": 2.2605, - "step": 284150 - }, - { - "epoch": 0.99, - "learning_rate": 4.459100785792262e-07, - "loss": 2.4119, - "step": 284160 - }, - { - "epoch": 0.99, - "learning_rate": 4.4416619872557267e-07, - "loss": 2.3176, - "step": 284170 - }, - { - "epoch": 0.99, - "learning_rate": 4.4242231887191904e-07, - "loss": 2.3288, - "step": 284180 - }, - { - "epoch": 0.99, - "learning_rate": 4.406784390182654e-07, - "loss": 2.348, - "step": 284190 - }, - { - "epoch": 0.99, - "learning_rate": 4.389345591646118e-07, - "loss": 2.4315, - "step": 284200 - }, - { - "epoch": 0.99, - "learning_rate": 4.3719067931095817e-07, - "loss": 2.34, - "step": 284210 - }, - { - "epoch": 0.99, - "learning_rate": 4.3544679945730465e-07, - "loss": 2.3445, - "step": 284220 - }, - { - "epoch": 0.99, - "learning_rate": 4.33702919603651e-07, - "loss": 2.3191, - "step": 284230 - }, - { - "epoch": 0.99, - "learning_rate": 4.319590397499974e-07, - "loss": 2.3146, - "step": 284240 - }, - { - "epoch": 0.99, - "learning_rate": 4.302151598963438e-07, - "loss": 2.3148, - "step": 284250 - }, - { - "epoch": 0.99, - "learning_rate": 4.2847128004269015e-07, - "loss": 2.348, - "step": 284260 - }, - { - "epoch": 0.99, - "learning_rate": 4.2672740018903663e-07, - "loss": 2.3119, - "step": 284270 - }, - { - "epoch": 0.99, - "learning_rate": 4.24983520335383e-07, - "loss": 2.2827, - "step": 284280 - }, - { - "epoch": 0.99, - "learning_rate": 4.232396404817294e-07, - "loss": 2.3554, - "step": 284290 - }, - { - "epoch": 0.99, - "learning_rate": 4.2149576062807576e-07, - "loss": 2.3585, - "step": 284300 - }, - { - "epoch": 0.99, - "learning_rate": 4.1975188077442213e-07, - "loss": 2.3217, - "step": 284310 - }, - { - "epoch": 0.99, - "learning_rate": 4.180080009207686e-07, - "loss": 2.3185, - "step": 284320 - }, - { - "epoch": 0.99, - "learning_rate": 4.16264121067115e-07, - "loss": 2.3849, - "step": 284330 - }, - { - "epoch": 0.99, - "learning_rate": 4.1452024121346136e-07, - "loss": 2.3052, - "step": 284340 - }, - { - "epoch": 0.99, - "learning_rate": 4.1277636135980774e-07, - "loss": 2.3906, - "step": 284350 - }, - { - "epoch": 0.99, - "learning_rate": 4.110324815061541e-07, - "loss": 2.3171, - "step": 284360 - }, - { - "epoch": 0.99, - "learning_rate": 4.092886016525006e-07, - "loss": 2.3196, - "step": 284370 - }, - { - "epoch": 0.99, - "learning_rate": 4.0754472179884697e-07, - "loss": 2.3699, - "step": 284380 - }, - { - "epoch": 0.99, - "learning_rate": 4.0580084194519335e-07, - "loss": 2.2105, - "step": 284390 - }, - { - "epoch": 0.99, - "learning_rate": 4.040569620915397e-07, - "loss": 2.2939, - "step": 284400 - }, - { - "epoch": 0.99, - "learning_rate": 4.023130822378862e-07, - "loss": 2.3235, - "step": 284410 - }, - { - "epoch": 0.99, - "learning_rate": 4.005692023842326e-07, - "loss": 2.3059, - "step": 284420 - }, - { - "epoch": 0.99, - "learning_rate": 3.9882532253057895e-07, - "loss": 2.3178, - "step": 284430 - }, - { - "epoch": 0.99, - "learning_rate": 3.9708144267692533e-07, - "loss": 2.3611, - "step": 284440 - }, - { - "epoch": 0.99, - "learning_rate": 3.953375628232717e-07, - "loss": 2.3311, - "step": 284450 - }, - { - "epoch": 0.99, - "learning_rate": 3.935936829696182e-07, - "loss": 2.3098, - "step": 284460 - }, - { - "epoch": 0.99, - "learning_rate": 3.9184980311596456e-07, - "loss": 2.3504, - "step": 284470 - }, - { - "epoch": 0.99, - "learning_rate": 3.9010592326231093e-07, - "loss": 2.2991, - "step": 284480 - }, - { - "epoch": 0.99, - "learning_rate": 3.883620434086573e-07, - "loss": 2.2902, - "step": 284490 - }, - { - "epoch": 0.99, - "learning_rate": 3.8661816355500374e-07, - "loss": 2.3861, - "step": 284500 - }, - { - "epoch": 0.99, - "learning_rate": 3.848742837013501e-07, - "loss": 2.2868, - "step": 284510 - }, - { - "epoch": 0.99, - "learning_rate": 3.831304038476965e-07, - "loss": 2.2547, - "step": 284520 - }, - { - "epoch": 0.99, - "learning_rate": 3.813865239940429e-07, - "loss": 2.3238, - "step": 284530 - }, - { - "epoch": 0.99, - "learning_rate": 3.796426441403893e-07, - "loss": 2.3756, - "step": 284540 - }, - { - "epoch": 0.99, - "learning_rate": 3.778987642867357e-07, - "loss": 2.2762, - "step": 284550 - }, - { - "epoch": 0.99, - "learning_rate": 3.761548844330821e-07, - "loss": 2.3283, - "step": 284560 - }, - { - "epoch": 0.99, - "learning_rate": 3.7441100457942847e-07, - "loss": 2.2955, - "step": 284570 - }, - { - "epoch": 0.99, - "learning_rate": 3.726671247257749e-07, - "loss": 2.331, - "step": 284580 - }, - { - "epoch": 0.99, - "learning_rate": 3.7092324487212127e-07, - "loss": 2.3289, - "step": 284590 - }, - { - "epoch": 0.99, - "learning_rate": 3.691793650184677e-07, - "loss": 2.3808, - "step": 284600 - }, - { - "epoch": 0.99, - "learning_rate": 3.674354851648141e-07, - "loss": 2.3555, - "step": 284610 - }, - { - "epoch": 0.99, - "learning_rate": 3.656916053111605e-07, - "loss": 2.2899, - "step": 284620 - }, - { - "epoch": 0.99, - "learning_rate": 3.639477254575069e-07, - "loss": 2.3274, - "step": 284630 - }, - { - "epoch": 0.99, - "learning_rate": 3.6220384560385325e-07, - "loss": 2.434, - "step": 284640 - }, - { - "epoch": 0.99, - "learning_rate": 3.604599657501997e-07, - "loss": 2.3477, - "step": 284650 - }, - { - "epoch": 0.99, - "learning_rate": 3.5871608589654606e-07, - "loss": 2.4153, - "step": 284660 - }, - { - "epoch": 0.99, - "learning_rate": 3.569722060428925e-07, - "loss": 2.3372, - "step": 284670 - }, - { - "epoch": 0.99, - "learning_rate": 3.5522832618923886e-07, - "loss": 2.3241, - "step": 284680 - }, - { - "epoch": 0.99, - "learning_rate": 3.534844463355853e-07, - "loss": 2.406, - "step": 284690 - }, - { - "epoch": 0.99, - "learning_rate": 3.5174056648193166e-07, - "loss": 2.3453, - "step": 284700 - }, - { - "epoch": 0.99, - "learning_rate": 3.499966866282781e-07, - "loss": 2.3601, - "step": 284710 - }, - { - "epoch": 0.99, - "learning_rate": 3.4825280677462447e-07, - "loss": 2.3208, - "step": 284720 - }, - { - "epoch": 0.99, - "learning_rate": 3.465089269209709e-07, - "loss": 2.2582, - "step": 284730 - }, - { - "epoch": 0.99, - "learning_rate": 3.4476504706731727e-07, - "loss": 2.3784, - "step": 284740 - }, - { - "epoch": 0.99, - "learning_rate": 3.430211672136637e-07, - "loss": 2.2838, - "step": 284750 - }, - { - "epoch": 0.99, - "learning_rate": 3.412772873600101e-07, - "loss": 2.3326, - "step": 284760 - }, - { - "epoch": 0.99, - "learning_rate": 3.3953340750635645e-07, - "loss": 2.2974, - "step": 284770 - }, - { - "epoch": 0.99, - "learning_rate": 3.377895276527029e-07, - "loss": 2.3348, - "step": 284780 - }, - { - "epoch": 0.99, - "learning_rate": 3.3604564779904925e-07, - "loss": 2.3463, - "step": 284790 - }, - { - "epoch": 0.99, - "learning_rate": 3.343017679453957e-07, - "loss": 2.4124, - "step": 284800 - }, - { - "epoch": 0.99, - "learning_rate": 3.3255788809174206e-07, - "loss": 2.403, - "step": 284810 - }, - { - "epoch": 0.99, - "learning_rate": 3.308140082380885e-07, - "loss": 2.4159, - "step": 284820 - }, - { - "epoch": 0.99, - "learning_rate": 3.2907012838443486e-07, - "loss": 2.3469, - "step": 284830 - }, - { - "epoch": 0.99, - "learning_rate": 3.2732624853078123e-07, - "loss": 2.284, - "step": 284840 - }, - { - "epoch": 0.99, - "learning_rate": 3.2558236867712766e-07, - "loss": 2.3186, - "step": 284850 - }, - { - "epoch": 0.99, - "learning_rate": 3.2383848882347404e-07, - "loss": 2.291, - "step": 284860 - }, - { - "epoch": 0.99, - "learning_rate": 3.2209460896982047e-07, - "loss": 2.3699, - "step": 284870 - }, - { - "epoch": 0.99, - "learning_rate": 3.2035072911616684e-07, - "loss": 2.3248, - "step": 284880 - }, - { - "epoch": 0.99, - "learning_rate": 3.186068492625132e-07, - "loss": 2.2956, - "step": 284890 - }, - { - "epoch": 0.99, - "learning_rate": 3.1686296940885964e-07, - "loss": 2.3296, - "step": 284900 - }, - { - "epoch": 0.99, - "learning_rate": 3.15119089555206e-07, - "loss": 2.3574, - "step": 284910 - }, - { - "epoch": 0.99, - "learning_rate": 3.1337520970155245e-07, - "loss": 2.3039, - "step": 284920 - }, - { - "epoch": 0.99, - "learning_rate": 3.116313298478988e-07, - "loss": 2.2836, - "step": 284930 - }, - { - "epoch": 0.99, - "learning_rate": 3.0988744999424525e-07, - "loss": 2.3209, - "step": 284940 - }, - { - "epoch": 0.99, - "learning_rate": 3.081435701405916e-07, - "loss": 2.3656, - "step": 284950 - }, - { - "epoch": 0.99, - "learning_rate": 3.06399690286938e-07, - "loss": 2.2877, - "step": 284960 - }, - { - "epoch": 0.99, - "learning_rate": 3.0465581043328443e-07, - "loss": 2.2892, - "step": 284970 - }, - { - "epoch": 0.99, - "learning_rate": 3.029119305796308e-07, - "loss": 2.3652, - "step": 284980 - }, - { - "epoch": 0.99, - "learning_rate": 3.0116805072597723e-07, - "loss": 2.3241, - "step": 284990 - }, - { - "epoch": 0.99, - "learning_rate": 2.994241708723236e-07, - "loss": 2.4672, - "step": 285000 - }, - { - "epoch": 0.99, - "learning_rate": 2.9768029101867e-07, - "loss": 2.3113, - "step": 285010 - }, - { - "epoch": 0.99, - "learning_rate": 2.959364111650164e-07, - "loss": 2.3279, - "step": 285020 - }, - { - "epoch": 0.99, - "learning_rate": 2.941925313113628e-07, - "loss": 2.3552, - "step": 285030 - }, - { - "epoch": 0.99, - "learning_rate": 2.924486514577092e-07, - "loss": 2.3431, - "step": 285040 - }, - { - "epoch": 0.99, - "learning_rate": 2.907047716040556e-07, - "loss": 2.3441, - "step": 285050 - }, - { - "epoch": 0.99, - "learning_rate": 2.8896089175040196e-07, - "loss": 2.2145, - "step": 285060 - }, - { - "epoch": 0.99, - "learning_rate": 2.872170118967484e-07, - "loss": 2.2873, - "step": 285070 - }, - { - "epoch": 0.99, - "learning_rate": 2.8547313204309477e-07, - "loss": 2.3932, - "step": 285080 - }, - { - "epoch": 0.99, - "learning_rate": 2.837292521894412e-07, - "loss": 2.3567, - "step": 285090 - }, - { - "epoch": 0.99, - "learning_rate": 2.8198537233578757e-07, - "loss": 2.3222, - "step": 285100 - }, - { - "epoch": 0.99, - "learning_rate": 2.8024149248213395e-07, - "loss": 2.3442, - "step": 285110 - }, - { - "epoch": 0.99, - "learning_rate": 2.7849761262848037e-07, - "loss": 2.264, - "step": 285120 - }, - { - "epoch": 0.99, - "learning_rate": 2.7675373277482675e-07, - "loss": 2.3257, - "step": 285130 - }, - { - "epoch": 0.99, - "learning_rate": 2.750098529211732e-07, - "loss": 2.329, - "step": 285140 - }, - { - "epoch": 0.99, - "learning_rate": 2.7326597306751955e-07, - "loss": 2.2825, - "step": 285150 - }, - { - "epoch": 0.99, - "learning_rate": 2.7152209321386593e-07, - "loss": 2.2741, - "step": 285160 - }, - { - "epoch": 0.99, - "learning_rate": 2.6977821336021236e-07, - "loss": 2.254, - "step": 285170 - }, - { - "epoch": 0.99, - "learning_rate": 2.6803433350655873e-07, - "loss": 2.3768, - "step": 285180 - }, - { - "epoch": 0.99, - "learning_rate": 2.6629045365290516e-07, - "loss": 2.3363, - "step": 285190 - }, - { - "epoch": 0.99, - "learning_rate": 2.6454657379925153e-07, - "loss": 2.2796, - "step": 285200 - }, - { - "epoch": 0.99, - "learning_rate": 2.628026939455979e-07, - "loss": 2.3927, - "step": 285210 - }, - { - "epoch": 0.99, - "learning_rate": 2.6105881409194434e-07, - "loss": 2.3441, - "step": 285220 - }, - { - "epoch": 0.99, - "learning_rate": 2.593149342382907e-07, - "loss": 2.3625, - "step": 285230 - }, - { - "epoch": 0.99, - "learning_rate": 2.5757105438463714e-07, - "loss": 2.305, - "step": 285240 - }, - { - "epoch": 0.99, - "learning_rate": 2.558271745309835e-07, - "loss": 2.3121, - "step": 285250 - }, - { - "epoch": 0.99, - "learning_rate": 2.540832946773299e-07, - "loss": 2.4078, - "step": 285260 - }, - { - "epoch": 0.99, - "learning_rate": 2.523394148236763e-07, - "loss": 2.2495, - "step": 285270 - }, - { - "epoch": 0.99, - "learning_rate": 2.505955349700227e-07, - "loss": 2.3396, - "step": 285280 - }, - { - "epoch": 1.0, - "learning_rate": 2.488516551163691e-07, - "loss": 2.3427, - "step": 285290 - }, - { - "epoch": 1.0, - "learning_rate": 2.471077752627155e-07, - "loss": 2.3511, - "step": 285300 - }, - { - "epoch": 1.0, - "learning_rate": 2.453638954090619e-07, - "loss": 2.3952, - "step": 285310 - }, - { - "epoch": 1.0, - "learning_rate": 2.436200155554083e-07, - "loss": 2.2959, - "step": 285320 - }, - { - "epoch": 1.0, - "learning_rate": 2.418761357017547e-07, - "loss": 2.4302, - "step": 285330 - }, - { - "epoch": 1.0, - "learning_rate": 2.401322558481011e-07, - "loss": 2.3446, - "step": 285340 - }, - { - "epoch": 1.0, - "learning_rate": 2.383883759944475e-07, - "loss": 2.3643, - "step": 285350 - }, - { - "epoch": 1.0, - "learning_rate": 2.366444961407939e-07, - "loss": 2.3104, - "step": 285360 - }, - { - "epoch": 1.0, - "learning_rate": 2.3490061628714028e-07, - "loss": 2.3135, - "step": 285370 - }, - { - "epoch": 1.0, - "learning_rate": 2.3315673643348668e-07, - "loss": 2.2758, - "step": 285380 - }, - { - "epoch": 1.0, - "learning_rate": 2.3141285657983308e-07, - "loss": 2.2784, - "step": 285390 - }, - { - "epoch": 1.0, - "learning_rate": 2.2966897672617949e-07, - "loss": 2.2062, - "step": 285400 - }, - { - "epoch": 1.0, - "learning_rate": 2.279250968725259e-07, - "loss": 2.3775, - "step": 285410 - }, - { - "epoch": 1.0, - "learning_rate": 2.261812170188723e-07, - "loss": 2.3219, - "step": 285420 - }, - { - "epoch": 1.0, - "learning_rate": 2.2443733716521866e-07, - "loss": 2.3049, - "step": 285430 - }, - { - "epoch": 1.0, - "learning_rate": 2.226934573115651e-07, - "loss": 2.325, - "step": 285440 - }, - { - "epoch": 1.0, - "learning_rate": 2.2094957745791147e-07, - "loss": 2.3975, - "step": 285450 - }, - { - "epoch": 1.0, - "learning_rate": 2.192056976042579e-07, - "loss": 2.3468, - "step": 285460 - }, - { - "epoch": 1.0, - "learning_rate": 2.1746181775060427e-07, - "loss": 2.3437, - "step": 285470 - }, - { - "epoch": 1.0, - "learning_rate": 2.1571793789695065e-07, - "loss": 2.3263, - "step": 285480 - }, - { - "epoch": 1.0, - "learning_rate": 2.1397405804329707e-07, - "loss": 2.3357, - "step": 285490 - }, - { - "epoch": 1.0, - "learning_rate": 2.1223017818964345e-07, - "loss": 2.2768, - "step": 285500 - }, - { - "epoch": 1.0, - "learning_rate": 2.1048629833598988e-07, - "loss": 2.356, - "step": 285510 - }, - { - "epoch": 1.0, - "learning_rate": 2.0874241848233625e-07, - "loss": 2.337, - "step": 285520 - }, - { - "epoch": 1.0, - "learning_rate": 2.0699853862868263e-07, - "loss": 2.4426, - "step": 285530 - }, - { - "epoch": 1.0, - "learning_rate": 2.0525465877502906e-07, - "loss": 2.3389, - "step": 285540 - }, - { - "epoch": 1.0, - "learning_rate": 2.0351077892137543e-07, - "loss": 2.3869, - "step": 285550 - }, - { - "epoch": 1.0, - "learning_rate": 2.0176689906772186e-07, - "loss": 2.3117, - "step": 285560 - }, - { - "epoch": 1.0, - "learning_rate": 2.0002301921406823e-07, - "loss": 2.2979, - "step": 285570 - }, - { - "epoch": 1.0, - "learning_rate": 1.982791393604146e-07, - "loss": 2.4086, - "step": 285580 - }, - { - "epoch": 1.0, - "learning_rate": 1.9653525950676104e-07, - "loss": 2.3774, - "step": 285590 - }, - { - "epoch": 1.0, - "learning_rate": 1.9479137965310744e-07, - "loss": 2.3697, - "step": 285600 - }, - { - "epoch": 1.0, - "learning_rate": 1.9304749979945381e-07, - "loss": 2.3417, - "step": 285610 - }, - { - "epoch": 1.0, - "learning_rate": 1.9130361994580022e-07, - "loss": 2.301, - "step": 285620 - }, - { - "epoch": 1.0, - "learning_rate": 1.8955974009214662e-07, - "loss": 2.3374, - "step": 285630 - }, - { - "epoch": 1.0, - "learning_rate": 1.8781586023849302e-07, - "loss": 2.229, - "step": 285640 - }, - { - "epoch": 1.0, - "learning_rate": 1.8607198038483942e-07, - "loss": 2.3062, - "step": 285650 - }, - { - "epoch": 1.0, - "learning_rate": 1.843281005311858e-07, - "loss": 2.2968, - "step": 285660 - }, - { - "epoch": 1.0, - "learning_rate": 1.825842206775322e-07, - "loss": 2.3885, - "step": 285670 - }, - { - "epoch": 1.0, - "learning_rate": 1.808403408238786e-07, - "loss": 2.3288, - "step": 285680 - }, - { - "epoch": 1.0, - "learning_rate": 1.79096460970225e-07, - "loss": 2.2978, - "step": 285690 - }, - { - "epoch": 1.0, - "learning_rate": 1.773525811165714e-07, - "loss": 2.3072, - "step": 285700 - }, - { - "epoch": 1.0, - "learning_rate": 1.7560870126291778e-07, - "loss": 2.3291, - "step": 285710 - }, - { - "epoch": 1.0, - "learning_rate": 1.7386482140926418e-07, - "loss": 2.3093, - "step": 285720 - }, - { - "epoch": 1.0, - "learning_rate": 1.7212094155561058e-07, - "loss": 2.2569, - "step": 285730 - }, - { - "epoch": 1.0, - "learning_rate": 1.7037706170195698e-07, - "loss": 2.3185, - "step": 285740 - }, - { - "epoch": 1.0, - "learning_rate": 1.6863318184830338e-07, - "loss": 2.3159, - "step": 285750 - }, - { - "epoch": 1.0, - "learning_rate": 1.6688930199464979e-07, - "loss": 2.3438, - "step": 285760 - }, - { - "epoch": 1.0, - "learning_rate": 1.6514542214099616e-07, - "loss": 2.3355, - "step": 285770 - }, - { - "epoch": 1.0, - "learning_rate": 1.6340154228734256e-07, - "loss": 2.3262, - "step": 285780 - }, - { - "epoch": 1.0, - "learning_rate": 1.6165766243368896e-07, - "loss": 2.35, - "step": 285790 - }, - { - "epoch": 1.0, - "learning_rate": 1.5991378258003537e-07, - "loss": 2.2904, - "step": 285800 - }, - { - "epoch": 1.0, - "learning_rate": 1.5816990272638177e-07, - "loss": 2.2915, - "step": 285810 - }, - { - "epoch": 1.0, - "learning_rate": 1.5642602287272817e-07, - "loss": 2.2974, - "step": 285820 - }, - { - "epoch": 1.0, - "learning_rate": 1.5468214301907457e-07, - "loss": 2.3712, - "step": 285830 - }, - { - "epoch": 1.0, - "learning_rate": 1.5293826316542097e-07, - "loss": 2.3671, - "step": 285840 - }, - { - "epoch": 1.0, - "learning_rate": 1.5119438331176737e-07, - "loss": 2.3057, - "step": 285850 - }, - { - "epoch": 1.0, - "learning_rate": 1.4945050345811378e-07, - "loss": 2.3911, - "step": 285860 - }, - { - "epoch": 1.0, - "learning_rate": 1.4770662360446015e-07, - "loss": 2.3095, - "step": 285870 - }, - { - "epoch": 1.0, - "learning_rate": 1.4596274375080655e-07, - "loss": 2.3733, - "step": 285880 - }, - { - "epoch": 1.0, - "learning_rate": 1.4421886389715295e-07, - "loss": 2.3348, - "step": 285890 - }, - { - "epoch": 1.0, - "learning_rate": 1.4247498404349936e-07, - "loss": 2.2955, - "step": 285900 - }, - { - "epoch": 1.0, - "learning_rate": 1.4073110418984576e-07, - "loss": 2.3678, - "step": 285910 - }, - { - "epoch": 1.0, - "learning_rate": 1.3898722433619216e-07, - "loss": 2.3681, - "step": 285920 - }, - { - "epoch": 1.0, - "learning_rate": 1.3724334448253853e-07, - "loss": 2.2165, - "step": 285930 - }, - { - "epoch": 1.0, - "learning_rate": 1.3549946462888494e-07, - "loss": 2.3807, - "step": 285940 - }, - { - "epoch": 1.0, - "learning_rate": 1.3375558477523134e-07, - "loss": 2.3771, - "step": 285950 - }, - { - "epoch": 1.0, - "learning_rate": 1.3201170492157774e-07, - "loss": 2.3432, - "step": 285960 - }, - { - "epoch": 1.0, - "learning_rate": 1.3026782506792414e-07, - "loss": 2.3381, - "step": 285970 - }, - { - "epoch": 1.0, - "learning_rate": 1.2852394521427052e-07, - "loss": 2.2467, - "step": 285980 - }, - { - "epoch": 1.0, - "learning_rate": 1.2678006536061692e-07, - "loss": 2.3453, - "step": 285990 - }, - { - "epoch": 1.0, - "learning_rate": 1.2503618550696332e-07, - "loss": 2.3587, - "step": 286000 - }, - { - "epoch": 1.0, - "learning_rate": 1.2329230565330972e-07, - "loss": 2.369, - "step": 286010 - }, - { - "epoch": 1.0, - "learning_rate": 1.2154842579965612e-07, - "loss": 2.3626, - "step": 286020 - }, - { - "epoch": 1.0, - "learning_rate": 1.198045459460025e-07, - "loss": 2.4206, - "step": 286030 - }, - { - "epoch": 1.0, - "learning_rate": 1.180606660923489e-07, - "loss": 2.3219, - "step": 286040 - }, - { - "epoch": 1.0, - "learning_rate": 1.163167862386953e-07, - "loss": 2.2636, - "step": 286050 - }, - { - "epoch": 1.0, - "learning_rate": 1.145729063850417e-07, - "loss": 2.3141, - "step": 286060 - }, - { - "epoch": 1.0, - "learning_rate": 1.128290265313881e-07, - "loss": 2.3573, - "step": 286070 - }, - { - "epoch": 1.0, - "learning_rate": 1.110851466777345e-07, - "loss": 2.3249, - "step": 286080 - }, - { - "epoch": 1.0, - "learning_rate": 1.0934126682408088e-07, - "loss": 2.3467, - "step": 286090 - }, - { - "epoch": 1.0, - "learning_rate": 1.0759738697042728e-07, - "loss": 2.2809, - "step": 286100 - }, - { - "epoch": 1.0, - "learning_rate": 1.0585350711677368e-07, - "loss": 2.2963, - "step": 286110 - }, - { - "epoch": 1.0, - "learning_rate": 1.0410962726312009e-07, - "loss": 2.3127, - "step": 286120 - }, - { - "epoch": 1.0, - "learning_rate": 1.0236574740946649e-07, - "loss": 2.4025, - "step": 286130 - }, - { - "epoch": 1.0, - "learning_rate": 1.0062186755581288e-07, - "loss": 2.3728, - "step": 286140 - }, - { - "epoch": 1.0, - "learning_rate": 9.887798770215928e-08, - "loss": 2.3214, - "step": 286150 - }, - { - "epoch": 1.0, - "learning_rate": 9.713410784850568e-08, - "loss": 2.3407, - "step": 286160 - }, - { - "epoch": 1.0, - "learning_rate": 9.539022799485208e-08, - "loss": 2.363, - "step": 286170 - }, - { - "epoch": 1.0, - "learning_rate": 9.364634814119847e-08, - "loss": 2.3875, - "step": 286180 - }, - { - "epoch": 1.0, - "learning_rate": 9.190246828754487e-08, - "loss": 2.3301, - "step": 286190 - }, - { - "epoch": 1.0, - "learning_rate": 9.015858843389126e-08, - "loss": 2.2799, - "step": 286200 - }, - { - "epoch": 1.0, - "learning_rate": 8.841470858023766e-08, - "loss": 2.3344, - "step": 286210 - }, - { - "epoch": 1.0, - "learning_rate": 8.667082872658406e-08, - "loss": 2.3721, - "step": 286220 - }, - { - "epoch": 1.0, - "learning_rate": 8.492694887293045e-08, - "loss": 2.3437, - "step": 286230 - }, - { - "epoch": 1.0, - "learning_rate": 8.318306901927685e-08, - "loss": 2.3615, - "step": 286240 - }, - { - "epoch": 1.0, - "learning_rate": 8.143918916562325e-08, - "loss": 2.2441, - "step": 286250 - }, - { - "epoch": 1.0, - "learning_rate": 7.969530931196964e-08, - "loss": 2.3586, - "step": 286260 - }, - { - "epoch": 1.0, - "learning_rate": 7.795142945831604e-08, - "loss": 2.3446, - "step": 286270 - }, - { - "epoch": 1.0, - "learning_rate": 7.620754960466243e-08, - "loss": 2.3193, - "step": 286280 - }, - { - "epoch": 1.0, - "learning_rate": 7.446366975100883e-08, - "loss": 2.2415, - "step": 286290 - }, - { - "epoch": 1.0, - "learning_rate": 7.271978989735524e-08, - "loss": 2.375, - "step": 286300 - }, - { - "epoch": 1.0, - "learning_rate": 7.097591004370162e-08, - "loss": 2.3062, - "step": 286310 - }, - { - "epoch": 1.0, - "learning_rate": 6.923203019004803e-08, - "loss": 2.3738, - "step": 286320 - }, - { - "epoch": 1.0, - "learning_rate": 6.748815033639443e-08, - "loss": 2.3729, - "step": 286330 - }, - { - "epoch": 1.0, - "learning_rate": 6.574427048274083e-08, - "loss": 2.4112, - "step": 286340 - }, - { - "epoch": 1.0, - "learning_rate": 6.400039062908722e-08, - "loss": 2.286, - "step": 286350 - }, - { - "epoch": 1.0, - "learning_rate": 6.225651077543362e-08, - "loss": 2.3367, - "step": 286360 - }, - { - "epoch": 1.0, - "learning_rate": 6.051263092178002e-08, - "loss": 2.3127, - "step": 286370 - }, - { - "epoch": 1.0, - "learning_rate": 5.8768751068126415e-08, - "loss": 2.2882, - "step": 286380 - }, - { - "epoch": 1.0, - "learning_rate": 5.702487121447281e-08, - "loss": 2.3549, - "step": 286390 - }, - { - "epoch": 1.0, - "learning_rate": 5.5280991360819205e-08, - "loss": 2.3747, - "step": 286400 - }, - { - "epoch": 1.0, - "learning_rate": 5.3537111507165607e-08, - "loss": 2.304, - "step": 286410 - }, - { - "epoch": 1.0, - "learning_rate": 5.1793231653512e-08, - "loss": 2.2996, - "step": 286420 - }, - { - "epoch": 1.0, - "learning_rate": 5.00493517998584e-08, - "loss": 2.3123, - "step": 286430 - }, - { - "epoch": 1.0, - "learning_rate": 4.83054719462048e-08, - "loss": 2.301, - "step": 286440 - }, - { - "epoch": 1.0, - "learning_rate": 4.656159209255119e-08, - "loss": 2.3676, - "step": 286450 - }, - { - "epoch": 1.0, - "learning_rate": 4.481771223889759e-08, - "loss": 2.298, - "step": 286460 - }, - { - "epoch": 1.0, - "learning_rate": 4.307383238524399e-08, - "loss": 2.3243, - "step": 286470 - }, - { - "epoch": 1.0, - "learning_rate": 4.1329952531590385e-08, - "loss": 2.3733, - "step": 286480 - }, - { - "epoch": 1.0, - "learning_rate": 3.958607267793678e-08, - "loss": 2.3593, - "step": 286490 - }, - { - "epoch": 1.0, - "learning_rate": 3.7842192824283175e-08, - "loss": 2.2642, - "step": 286500 - }, - { - "epoch": 0.5, - "learning_rate": 2.501804915648532e-05, - "loss": 2.2268, - "step": 286510 - }, - { - "epoch": 0.5, - "learning_rate": 2.501717721655849e-05, - "loss": 2.2357, - "step": 286520 - }, - { - "epoch": 0.5, - "learning_rate": 2.5016305276631664e-05, - "loss": 2.2253, - "step": 286530 - }, - { - "epoch": 0.5, - "learning_rate": 2.5015433336704834e-05, - "loss": 2.3401, - "step": 286540 - }, - { - "epoch": 0.5, - "learning_rate": 2.5014561396778008e-05, - "loss": 2.3747, - "step": 286550 - }, - { - "epoch": 0.5, - "learning_rate": 2.501368945685118e-05, - "loss": 2.3105, - "step": 286560 - }, - { - "epoch": 0.5, - "learning_rate": 2.5012817516924352e-05, - "loss": 2.2003, - "step": 286570 - }, - { - "epoch": 0.5, - "learning_rate": 2.5011945576997532e-05, - "loss": 2.3854, - "step": 286580 - }, - { - "epoch": 0.5, - "learning_rate": 2.5011073637070703e-05, - "loss": 2.1984, - "step": 286590 - }, - { - "epoch": 0.5, - "learning_rate": 2.5010201697143877e-05, - "loss": 2.355, - "step": 286600 - }, - { - "epoch": 0.5, - "learning_rate": 2.5009329757217047e-05, - "loss": 2.3667, - "step": 286610 - }, - { - "epoch": 0.5, - "learning_rate": 2.500845781729022e-05, - "loss": 2.2959, - "step": 286620 - }, - { - "epoch": 0.5, - "learning_rate": 2.5007585877363394e-05, - "loss": 2.3303, - "step": 286630 - }, - { - "epoch": 0.5, - "learning_rate": 2.5006713937436565e-05, - "loss": 2.4082, - "step": 286640 - }, - { - "epoch": 0.5, - "learning_rate": 2.500584199750974e-05, - "loss": 2.3471, - "step": 286650 - }, - { - "epoch": 0.5, - "learning_rate": 2.5004970057582916e-05, - "loss": 2.3459, - "step": 286660 - }, - { - "epoch": 0.5, - "learning_rate": 2.500409811765609e-05, - "loss": 2.3638, - "step": 286670 - }, - { - "epoch": 0.5, - "learning_rate": 2.500322617772926e-05, - "loss": 2.4141, - "step": 286680 - }, - { - "epoch": 0.5, - "learning_rate": 2.5002354237802434e-05, - "loss": 2.4243, - "step": 286690 - }, - { - "epoch": 0.5, - "learning_rate": 2.5001482297875607e-05, - "loss": 2.3172, - "step": 286700 - }, - { - "epoch": 0.5, - "learning_rate": 2.5000610357948778e-05, - "loss": 2.2777, - "step": 286710 - }, - { - "epoch": 0.5, - "learning_rate": 2.4999738418021955e-05, - "loss": 2.3301, - "step": 286720 - }, - { - "epoch": 0.5, - "learning_rate": 2.4998866478095125e-05, - "loss": 2.4074, - "step": 286730 - }, - { - "epoch": 0.5, - "learning_rate": 2.49979945381683e-05, - "loss": 2.4159, - "step": 286740 - }, - { - "epoch": 0.5, - "learning_rate": 2.4997122598241473e-05, - "loss": 2.3664, - "step": 286750 - }, - { - "epoch": 0.5, - "learning_rate": 2.4996250658314647e-05, - "loss": 2.425, - "step": 286760 - }, - { - "epoch": 0.5, - "learning_rate": 2.4995378718387817e-05, - "loss": 2.3309, - "step": 286770 - }, - { - "epoch": 0.5, - "learning_rate": 2.499450677846099e-05, - "loss": 2.3227, - "step": 286780 - }, - { - "epoch": 0.5, - "learning_rate": 2.4993634838534165e-05, - "loss": 2.3188, - "step": 286790 - }, - { - "epoch": 0.5, - "learning_rate": 2.499276289860734e-05, - "loss": 2.2535, - "step": 286800 - }, - { - "epoch": 0.5, - "learning_rate": 2.4991890958680512e-05, - "loss": 2.4168, - "step": 286810 - }, - { - "epoch": 0.5, - "learning_rate": 2.4991019018753686e-05, - "loss": 2.3898, - "step": 286820 - }, - { - "epoch": 0.5, - "learning_rate": 2.499014707882686e-05, - "loss": 2.174, - "step": 286830 - }, - { - "epoch": 0.5, - "learning_rate": 2.498927513890003e-05, - "loss": 2.2998, - "step": 286840 - }, - { - "epoch": 0.5, - "learning_rate": 2.4988403198973204e-05, - "loss": 2.4884, - "step": 286850 - }, - { - "epoch": 0.5, - "learning_rate": 2.4987531259046378e-05, - "loss": 2.2641, - "step": 286860 - }, - { - "epoch": 0.5, - "learning_rate": 2.498665931911955e-05, - "loss": 2.2546, - "step": 286870 - }, - { - "epoch": 0.5, - "learning_rate": 2.4985787379192725e-05, - "loss": 2.3294, - "step": 286880 - }, - { - "epoch": 0.5, - "learning_rate": 2.4984915439265896e-05, - "loss": 2.2593, - "step": 286890 - }, - { - "epoch": 0.5, - "learning_rate": 2.4984043499339073e-05, - "loss": 2.3751, - "step": 286900 - }, - { - "epoch": 0.5, - "learning_rate": 2.4983171559412243e-05, - "loss": 2.4327, - "step": 286910 - }, - { - "epoch": 0.5, - "learning_rate": 2.4982299619485417e-05, - "loss": 2.4162, - "step": 286920 - }, - { - "epoch": 0.5, - "learning_rate": 2.498142767955859e-05, - "loss": 2.3835, - "step": 286930 - }, - { - "epoch": 0.5, - "learning_rate": 2.4980555739631764e-05, - "loss": 2.3808, - "step": 286940 - }, - { - "epoch": 0.5, - "learning_rate": 2.4979683799704938e-05, - "loss": 2.4371, - "step": 286950 - }, - { - "epoch": 0.5, - "learning_rate": 2.497881185977811e-05, - "loss": 2.3955, - "step": 286960 - }, - { - "epoch": 0.5, - "learning_rate": 2.4977939919851286e-05, - "loss": 2.3837, - "step": 286970 - }, - { - "epoch": 0.5, - "learning_rate": 2.4977067979924456e-05, - "loss": 2.3439, - "step": 286980 - }, - { - "epoch": 0.5, - "learning_rate": 2.497619603999763e-05, - "loss": 2.3856, - "step": 286990 - }, - { - "epoch": 0.5, - "learning_rate": 2.49753241000708e-05, - "loss": 2.3867, - "step": 287000 - }, - { - "epoch": 0.5, - "learning_rate": 2.4974452160143977e-05, - "loss": 2.2328, - "step": 287010 - }, - { - "epoch": 0.5, - "learning_rate": 2.4973580220217148e-05, - "loss": 2.3675, - "step": 287020 - }, - { - "epoch": 0.5, - "learning_rate": 2.497270828029032e-05, - "loss": 2.4436, - "step": 287030 - }, - { - "epoch": 0.5, - "learning_rate": 2.4971836340363495e-05, - "loss": 2.3239, - "step": 287040 - }, - { - "epoch": 0.5, - "learning_rate": 2.497096440043667e-05, - "loss": 2.4047, - "step": 287050 - }, - { - "epoch": 0.5, - "learning_rate": 2.4970092460509843e-05, - "loss": 2.4817, - "step": 287060 - }, - { - "epoch": 0.5, - "learning_rate": 2.4969220520583013e-05, - "loss": 2.3425, - "step": 287070 - }, - { - "epoch": 0.5, - "learning_rate": 2.496834858065619e-05, - "loss": 2.3675, - "step": 287080 - }, - { - "epoch": 0.5, - "learning_rate": 2.496747664072936e-05, - "loss": 2.386, - "step": 287090 - }, - { - "epoch": 0.5, - "learning_rate": 2.4966604700802535e-05, - "loss": 2.3983, - "step": 287100 - }, - { - "epoch": 0.5, - "learning_rate": 2.496573276087571e-05, - "loss": 2.3558, - "step": 287110 - }, - { - "epoch": 0.5, - "learning_rate": 2.4964860820948882e-05, - "loss": 2.2954, - "step": 287120 - }, - { - "epoch": 0.5, - "learning_rate": 2.4963988881022056e-05, - "loss": 2.4245, - "step": 287130 - }, - { - "epoch": 0.5, - "learning_rate": 2.4963116941095226e-05, - "loss": 2.3726, - "step": 287140 - }, - { - "epoch": 0.5, - "learning_rate": 2.49622450011684e-05, - "loss": 2.4018, - "step": 287150 - }, - { - "epoch": 0.5, - "learning_rate": 2.4961373061241574e-05, - "loss": 2.4077, - "step": 287160 - }, - { - "epoch": 0.5, - "learning_rate": 2.4960501121314748e-05, - "loss": 2.3067, - "step": 287170 - }, - { - "epoch": 0.5, - "learning_rate": 2.4959629181387918e-05, - "loss": 2.4695, - "step": 287180 - }, - { - "epoch": 0.5, - "learning_rate": 2.4958757241461095e-05, - "loss": 2.4182, - "step": 287190 - }, - { - "epoch": 0.5, - "learning_rate": 2.495788530153427e-05, - "loss": 2.3528, - "step": 287200 - }, - { - "epoch": 0.5, - "learning_rate": 2.495701336160744e-05, - "loss": 2.1961, - "step": 287210 - }, - { - "epoch": 0.5, - "learning_rate": 2.4956141421680613e-05, - "loss": 2.4111, - "step": 287220 - }, - { - "epoch": 0.5, - "learning_rate": 2.4955269481753787e-05, - "loss": 2.3462, - "step": 287230 - }, - { - "epoch": 0.5, - "learning_rate": 2.495439754182696e-05, - "loss": 2.4084, - "step": 287240 - }, - { - "epoch": 0.5, - "learning_rate": 2.495352560190013e-05, - "loss": 2.3031, - "step": 287250 - }, - { - "epoch": 0.5, - "learning_rate": 2.4952653661973305e-05, - "loss": 2.4129, - "step": 287260 - }, - { - "epoch": 0.5, - "learning_rate": 2.495178172204648e-05, - "loss": 2.3508, - "step": 287270 - }, - { - "epoch": 0.5, - "learning_rate": 2.4950909782119652e-05, - "loss": 2.2933, - "step": 287280 - }, - { - "epoch": 0.5, - "learning_rate": 2.4950037842192826e-05, - "loss": 2.3969, - "step": 287290 - }, - { - "epoch": 0.5, - "learning_rate": 2.4949165902265996e-05, - "loss": 2.3137, - "step": 287300 - }, - { - "epoch": 0.5, - "learning_rate": 2.4948293962339174e-05, - "loss": 2.3964, - "step": 287310 - }, - { - "epoch": 0.5, - "learning_rate": 2.4947422022412344e-05, - "loss": 2.3855, - "step": 287320 - }, - { - "epoch": 0.5, - "learning_rate": 2.4946550082485518e-05, - "loss": 2.3617, - "step": 287330 - }, - { - "epoch": 0.5, - "learning_rate": 2.494567814255869e-05, - "loss": 2.3448, - "step": 287340 - }, - { - "epoch": 0.5, - "learning_rate": 2.4944806202631865e-05, - "loss": 2.4593, - "step": 287350 - }, - { - "epoch": 0.5, - "learning_rate": 2.494393426270504e-05, - "loss": 2.3693, - "step": 287360 - }, - { - "epoch": 0.5, - "learning_rate": 2.494306232277821e-05, - "loss": 2.3633, - "step": 287370 - }, - { - "epoch": 0.5, - "learning_rate": 2.4942190382851387e-05, - "loss": 2.4289, - "step": 287380 - }, - { - "epoch": 0.5, - "learning_rate": 2.4941318442924557e-05, - "loss": 2.4064, - "step": 287390 - }, - { - "epoch": 0.5, - "learning_rate": 2.494044650299773e-05, - "loss": 2.4214, - "step": 287400 - }, - { - "epoch": 0.5, - "learning_rate": 2.49395745630709e-05, - "loss": 2.3502, - "step": 287410 - }, - { - "epoch": 0.5, - "learning_rate": 2.4938702623144078e-05, - "loss": 2.4025, - "step": 287420 - }, - { - "epoch": 0.5, - "learning_rate": 2.4937830683217252e-05, - "loss": 2.3359, - "step": 287430 - }, - { - "epoch": 0.5, - "learning_rate": 2.4936958743290422e-05, - "loss": 2.4125, - "step": 287440 - }, - { - "epoch": 0.5, - "learning_rate": 2.49360868033636e-05, - "loss": 2.3971, - "step": 287450 - }, - { - "epoch": 0.5, - "learning_rate": 2.493521486343677e-05, - "loss": 2.456, - "step": 287460 - }, - { - "epoch": 0.5, - "learning_rate": 2.4934342923509944e-05, - "loss": 2.4363, - "step": 287470 - }, - { - "epoch": 0.5, - "learning_rate": 2.4933470983583114e-05, - "loss": 2.3761, - "step": 287480 - }, - { - "epoch": 0.5, - "learning_rate": 2.493259904365629e-05, - "loss": 2.4089, - "step": 287490 - }, - { - "epoch": 0.5, - "learning_rate": 2.493172710372946e-05, - "loss": 2.3767, - "step": 287500 - }, - { - "epoch": 0.5, - "learning_rate": 2.4930855163802635e-05, - "loss": 2.3656, - "step": 287510 - }, - { - "epoch": 0.5, - "learning_rate": 2.492998322387581e-05, - "loss": 2.4044, - "step": 287520 - }, - { - "epoch": 0.5, - "learning_rate": 2.4929111283948983e-05, - "loss": 2.4082, - "step": 287530 - }, - { - "epoch": 0.5, - "learning_rate": 2.4928239344022157e-05, - "loss": 2.3255, - "step": 287540 - }, - { - "epoch": 0.5, - "learning_rate": 2.4927367404095327e-05, - "loss": 2.404, - "step": 287550 - }, - { - "epoch": 0.5, - "learning_rate": 2.49264954641685e-05, - "loss": 2.4031, - "step": 287560 - }, - { - "epoch": 0.5, - "learning_rate": 2.4925623524241675e-05, - "loss": 2.4274, - "step": 287570 - }, - { - "epoch": 0.5, - "learning_rate": 2.492475158431485e-05, - "loss": 2.1763, - "step": 287580 - }, - { - "epoch": 0.5, - "learning_rate": 2.4923879644388022e-05, - "loss": 2.3126, - "step": 287590 - }, - { - "epoch": 0.5, - "learning_rate": 2.4923007704461196e-05, - "loss": 2.4297, - "step": 287600 - }, - { - "epoch": 0.5, - "learning_rate": 2.492213576453437e-05, - "loss": 2.3406, - "step": 287610 - }, - { - "epoch": 0.5, - "learning_rate": 2.492126382460754e-05, - "loss": 2.412, - "step": 287620 - }, - { - "epoch": 0.5, - "learning_rate": 2.4920391884680714e-05, - "loss": 2.3748, - "step": 287630 - }, - { - "epoch": 0.5, - "learning_rate": 2.4919519944753888e-05, - "loss": 2.1283, - "step": 287640 - }, - { - "epoch": 0.5, - "learning_rate": 2.491864800482706e-05, - "loss": 2.3526, - "step": 287650 - }, - { - "epoch": 0.5, - "learning_rate": 2.4917776064900232e-05, - "loss": 2.4206, - "step": 287660 - }, - { - "epoch": 0.5, - "learning_rate": 2.4916904124973406e-05, - "loss": 2.351, - "step": 287670 - }, - { - "epoch": 0.5, - "learning_rate": 2.4916032185046583e-05, - "loss": 2.3685, - "step": 287680 - }, - { - "epoch": 0.5, - "learning_rate": 2.4915160245119753e-05, - "loss": 2.338, - "step": 287690 - }, - { - "epoch": 0.5, - "learning_rate": 2.4914288305192927e-05, - "loss": 2.2593, - "step": 287700 - }, - { - "epoch": 0.5, - "learning_rate": 2.4913416365266097e-05, - "loss": 2.3347, - "step": 287710 - }, - { - "epoch": 0.5, - "learning_rate": 2.4912544425339274e-05, - "loss": 2.3992, - "step": 287720 - }, - { - "epoch": 0.5, - "learning_rate": 2.4911672485412445e-05, - "loss": 2.4958, - "step": 287730 - }, - { - "epoch": 0.5, - "learning_rate": 2.491080054548562e-05, - "loss": 2.3532, - "step": 287740 - }, - { - "epoch": 0.5, - "learning_rate": 2.4909928605558792e-05, - "loss": 2.3036, - "step": 287750 - }, - { - "epoch": 0.5, - "learning_rate": 2.4909056665631966e-05, - "loss": 2.3262, - "step": 287760 - }, - { - "epoch": 0.5, - "learning_rate": 2.490818472570514e-05, - "loss": 2.3747, - "step": 287770 - }, - { - "epoch": 0.5, - "learning_rate": 2.490731278577831e-05, - "loss": 2.3014, - "step": 287780 - }, - { - "epoch": 0.5, - "learning_rate": 2.4906440845851487e-05, - "loss": 2.4001, - "step": 287790 - }, - { - "epoch": 0.5, - "learning_rate": 2.4905568905924658e-05, - "loss": 2.3995, - "step": 287800 - }, - { - "epoch": 0.5, - "learning_rate": 2.490469696599783e-05, - "loss": 2.3386, - "step": 287810 - }, - { - "epoch": 0.5, - "learning_rate": 2.4903825026071005e-05, - "loss": 2.4022, - "step": 287820 - }, - { - "epoch": 0.5, - "learning_rate": 2.490295308614418e-05, - "loss": 2.3378, - "step": 287830 - }, - { - "epoch": 0.5, - "learning_rate": 2.4902081146217353e-05, - "loss": 2.3522, - "step": 287840 - }, - { - "epoch": 0.5, - "learning_rate": 2.4901209206290523e-05, - "loss": 2.3204, - "step": 287850 - }, - { - "epoch": 0.5, - "learning_rate": 2.49003372663637e-05, - "loss": 2.3191, - "step": 287860 - }, - { - "epoch": 0.5, - "learning_rate": 2.489946532643687e-05, - "loss": 2.2889, - "step": 287870 - }, - { - "epoch": 0.5, - "learning_rate": 2.4898593386510045e-05, - "loss": 2.3418, - "step": 287880 - }, - { - "epoch": 0.5, - "learning_rate": 2.4897721446583215e-05, - "loss": 2.3664, - "step": 287890 - }, - { - "epoch": 0.5, - "learning_rate": 2.4896849506656392e-05, - "loss": 2.2569, - "step": 287900 - }, - { - "epoch": 0.5, - "learning_rate": 2.4895977566729562e-05, - "loss": 2.3267, - "step": 287910 - }, - { - "epoch": 0.5, - "learning_rate": 2.4895105626802736e-05, - "loss": 2.3981, - "step": 287920 - }, - { - "epoch": 0.5, - "learning_rate": 2.489423368687591e-05, - "loss": 2.4334, - "step": 287930 - }, - { - "epoch": 0.5, - "learning_rate": 2.4893361746949084e-05, - "loss": 2.367, - "step": 287940 - }, - { - "epoch": 0.5, - "learning_rate": 2.4892489807022258e-05, - "loss": 2.5344, - "step": 287950 - }, - { - "epoch": 0.5, - "learning_rate": 2.4891617867095428e-05, - "loss": 2.2886, - "step": 287960 - }, - { - "epoch": 0.5, - "learning_rate": 2.4890745927168602e-05, - "loss": 2.3179, - "step": 287970 - }, - { - "epoch": 0.5, - "learning_rate": 2.4889873987241775e-05, - "loss": 2.3962, - "step": 287980 - }, - { - "epoch": 0.5, - "learning_rate": 2.488900204731495e-05, - "loss": 2.4935, - "step": 287990 - }, - { - "epoch": 0.5, - "learning_rate": 2.4888130107388123e-05, - "loss": 2.3311, - "step": 288000 - }, - { - "epoch": 0.5, - "learning_rate": 2.4887258167461297e-05, - "loss": 2.5074, - "step": 288010 - }, - { - "epoch": 0.5, - "learning_rate": 2.488638622753447e-05, - "loss": 2.4023, - "step": 288020 - }, - { - "epoch": 0.5, - "learning_rate": 2.488551428760764e-05, - "loss": 2.3538, - "step": 288030 - }, - { - "epoch": 0.5, - "learning_rate": 2.4884642347680815e-05, - "loss": 2.3427, - "step": 288040 - }, - { - "epoch": 0.5, - "learning_rate": 2.488377040775399e-05, - "loss": 2.3163, - "step": 288050 - }, - { - "epoch": 0.5, - "learning_rate": 2.4882898467827162e-05, - "loss": 2.4777, - "step": 288060 - }, - { - "epoch": 0.5, - "learning_rate": 2.4882026527900336e-05, - "loss": 2.2752, - "step": 288070 - }, - { - "epoch": 0.5, - "learning_rate": 2.4881154587973506e-05, - "loss": 2.3832, - "step": 288080 - }, - { - "epoch": 0.5, - "learning_rate": 2.4880282648046684e-05, - "loss": 2.4503, - "step": 288090 - }, - { - "epoch": 0.5, - "learning_rate": 2.4879410708119854e-05, - "loss": 2.3353, - "step": 288100 - }, - { - "epoch": 0.5, - "learning_rate": 2.4878538768193028e-05, - "loss": 2.2827, - "step": 288110 - }, - { - "epoch": 0.5, - "learning_rate": 2.48776668282662e-05, - "loss": 2.4014, - "step": 288120 - }, - { - "epoch": 0.5, - "learning_rate": 2.4876794888339375e-05, - "loss": 2.365, - "step": 288130 - }, - { - "epoch": 0.5, - "learning_rate": 2.4875922948412546e-05, - "loss": 2.4174, - "step": 288140 - }, - { - "epoch": 0.5, - "learning_rate": 2.487505100848572e-05, - "loss": 2.3416, - "step": 288150 - }, - { - "epoch": 0.5, - "learning_rate": 2.4874179068558897e-05, - "loss": 2.3422, - "step": 288160 - }, - { - "epoch": 0.5, - "learning_rate": 2.4873307128632067e-05, - "loss": 2.2966, - "step": 288170 - }, - { - "epoch": 0.5, - "learning_rate": 2.487243518870524e-05, - "loss": 2.3593, - "step": 288180 - }, - { - "epoch": 0.5, - "learning_rate": 2.487156324877841e-05, - "loss": 2.2661, - "step": 288190 - }, - { - "epoch": 0.5, - "learning_rate": 2.4870691308851588e-05, - "loss": 2.3521, - "step": 288200 - }, - { - "epoch": 0.5, - "learning_rate": 2.486981936892476e-05, - "loss": 2.4595, - "step": 288210 - }, - { - "epoch": 0.5, - "learning_rate": 2.4868947428997932e-05, - "loss": 2.2664, - "step": 288220 - }, - { - "epoch": 0.5, - "learning_rate": 2.4868075489071106e-05, - "loss": 2.3477, - "step": 288230 - }, - { - "epoch": 0.5, - "learning_rate": 2.486720354914428e-05, - "loss": 2.3825, - "step": 288240 - }, - { - "epoch": 0.5, - "learning_rate": 2.4866331609217454e-05, - "loss": 2.398, - "step": 288250 - }, - { - "epoch": 0.5, - "learning_rate": 2.4865459669290624e-05, - "loss": 2.2126, - "step": 288260 - }, - { - "epoch": 0.5, - "learning_rate": 2.48645877293638e-05, - "loss": 2.4237, - "step": 288270 - }, - { - "epoch": 0.5, - "learning_rate": 2.486371578943697e-05, - "loss": 2.3546, - "step": 288280 - }, - { - "epoch": 0.5, - "learning_rate": 2.4862843849510145e-05, - "loss": 2.3357, - "step": 288290 - }, - { - "epoch": 0.5, - "learning_rate": 2.486197190958332e-05, - "loss": 2.3614, - "step": 288300 - }, - { - "epoch": 0.5, - "learning_rate": 2.4861099969656493e-05, - "loss": 2.4106, - "step": 288310 - }, - { - "epoch": 0.5, - "learning_rate": 2.4860228029729667e-05, - "loss": 2.2382, - "step": 288320 - }, - { - "epoch": 0.5, - "learning_rate": 2.4859356089802837e-05, - "loss": 2.3342, - "step": 288330 - }, - { - "epoch": 0.5, - "learning_rate": 2.485848414987601e-05, - "loss": 2.3817, - "step": 288340 - }, - { - "epoch": 0.5, - "learning_rate": 2.4857612209949185e-05, - "loss": 2.392, - "step": 288350 - }, - { - "epoch": 0.5, - "learning_rate": 2.485674027002236e-05, - "loss": 2.3458, - "step": 288360 - }, - { - "epoch": 0.5, - "learning_rate": 2.485586833009553e-05, - "loss": 2.3879, - "step": 288370 - }, - { - "epoch": 0.5, - "learning_rate": 2.4854996390168706e-05, - "loss": 2.3725, - "step": 288380 - }, - { - "epoch": 0.5, - "learning_rate": 2.4854124450241876e-05, - "loss": 2.3492, - "step": 288390 - }, - { - "epoch": 0.5, - "learning_rate": 2.485325251031505e-05, - "loss": 2.3735, - "step": 288400 - }, - { - "epoch": 0.5, - "learning_rate": 2.4852380570388224e-05, - "loss": 2.3926, - "step": 288410 - }, - { - "epoch": 0.5, - "learning_rate": 2.4851508630461398e-05, - "loss": 2.2688, - "step": 288420 - }, - { - "epoch": 0.5, - "learning_rate": 2.485063669053457e-05, - "loss": 2.295, - "step": 288430 - }, - { - "epoch": 0.5, - "learning_rate": 2.4849764750607742e-05, - "loss": 2.2295, - "step": 288440 - }, - { - "epoch": 0.5, - "learning_rate": 2.4848892810680916e-05, - "loss": 2.2932, - "step": 288450 - }, - { - "epoch": 0.5, - "learning_rate": 2.484802087075409e-05, - "loss": 2.3662, - "step": 288460 - }, - { - "epoch": 0.5, - "learning_rate": 2.4847148930827263e-05, - "loss": 2.4126, - "step": 288470 - }, - { - "epoch": 0.5, - "learning_rate": 2.4846276990900437e-05, - "loss": 2.3616, - "step": 288480 - }, - { - "epoch": 0.5, - "learning_rate": 2.4845405050973607e-05, - "loss": 2.4475, - "step": 288490 - }, - { - "epoch": 0.5, - "learning_rate": 2.4844533111046784e-05, - "loss": 2.2703, - "step": 288500 - }, - { - "epoch": 0.5, - "learning_rate": 2.4843661171119955e-05, - "loss": 2.3055, - "step": 288510 - }, - { - "epoch": 0.5, - "learning_rate": 2.484278923119313e-05, - "loss": 2.3432, - "step": 288520 - }, - { - "epoch": 0.5, - "learning_rate": 2.4841917291266302e-05, - "loss": 2.3521, - "step": 288530 - }, - { - "epoch": 0.5, - "learning_rate": 2.4841045351339476e-05, - "loss": 2.4403, - "step": 288540 - }, - { - "epoch": 0.5, - "learning_rate": 2.484017341141265e-05, - "loss": 2.3355, - "step": 288550 - }, - { - "epoch": 0.5, - "learning_rate": 2.483930147148582e-05, - "loss": 2.3621, - "step": 288560 - }, - { - "epoch": 0.5, - "learning_rate": 2.4838429531558997e-05, - "loss": 2.369, - "step": 288570 - }, - { - "epoch": 0.5, - "learning_rate": 2.4837557591632168e-05, - "loss": 2.2664, - "step": 288580 - }, - { - "epoch": 0.5, - "learning_rate": 2.483668565170534e-05, - "loss": 2.3053, - "step": 288590 - }, - { - "epoch": 0.5, - "learning_rate": 2.4835813711778512e-05, - "loss": 2.345, - "step": 288600 - }, - { - "epoch": 0.5, - "learning_rate": 2.483494177185169e-05, - "loss": 2.376, - "step": 288610 - }, - { - "epoch": 0.5, - "learning_rate": 2.483406983192486e-05, - "loss": 2.3433, - "step": 288620 - }, - { - "epoch": 0.5, - "learning_rate": 2.4833197891998033e-05, - "loss": 2.3061, - "step": 288630 - }, - { - "epoch": 0.5, - "learning_rate": 2.4832325952071207e-05, - "loss": 2.3017, - "step": 288640 - }, - { - "epoch": 0.5, - "learning_rate": 2.483145401214438e-05, - "loss": 2.4045, - "step": 288650 - }, - { - "epoch": 0.5, - "learning_rate": 2.4830582072217555e-05, - "loss": 2.4386, - "step": 288660 - }, - { - "epoch": 0.5, - "learning_rate": 2.4829710132290725e-05, - "loss": 2.3269, - "step": 288670 - }, - { - "epoch": 0.5, - "learning_rate": 2.4828838192363902e-05, - "loss": 2.3436, - "step": 288680 - }, - { - "epoch": 0.5, - "learning_rate": 2.4827966252437072e-05, - "loss": 2.3689, - "step": 288690 - }, - { - "epoch": 0.5, - "learning_rate": 2.4827094312510246e-05, - "loss": 2.343, - "step": 288700 - }, - { - "epoch": 0.5, - "learning_rate": 2.482622237258342e-05, - "loss": 2.4351, - "step": 288710 - }, - { - "epoch": 0.5, - "learning_rate": 2.4825350432656594e-05, - "loss": 2.3617, - "step": 288720 - }, - { - "epoch": 0.5, - "learning_rate": 2.4824478492729768e-05, - "loss": 2.3473, - "step": 288730 - }, - { - "epoch": 0.5, - "learning_rate": 2.4823606552802938e-05, - "loss": 2.3194, - "step": 288740 - }, - { - "epoch": 0.5, - "learning_rate": 2.4822734612876112e-05, - "loss": 2.3265, - "step": 288750 - }, - { - "epoch": 0.5, - "learning_rate": 2.4821862672949286e-05, - "loss": 2.3241, - "step": 288760 - }, - { - "epoch": 0.5, - "learning_rate": 2.482099073302246e-05, - "loss": 2.4199, - "step": 288770 - }, - { - "epoch": 0.5, - "learning_rate": 2.4820118793095633e-05, - "loss": 2.2634, - "step": 288780 - }, - { - "epoch": 0.5, - "learning_rate": 2.4819246853168807e-05, - "loss": 2.4318, - "step": 288790 - }, - { - "epoch": 0.5, - "learning_rate": 2.481837491324198e-05, - "loss": 2.3056, - "step": 288800 - }, - { - "epoch": 0.5, - "learning_rate": 2.481750297331515e-05, - "loss": 2.3648, - "step": 288810 - }, - { - "epoch": 0.5, - "learning_rate": 2.4816631033388325e-05, - "loss": 2.4045, - "step": 288820 - }, - { - "epoch": 0.5, - "learning_rate": 2.48157590934615e-05, - "loss": 2.2624, - "step": 288830 - }, - { - "epoch": 0.5, - "learning_rate": 2.4814887153534672e-05, - "loss": 2.355, - "step": 288840 - }, - { - "epoch": 0.5, - "learning_rate": 2.4814015213607843e-05, - "loss": 2.2775, - "step": 288850 - }, - { - "epoch": 0.5, - "learning_rate": 2.4813143273681016e-05, - "loss": 2.375, - "step": 288860 - }, - { - "epoch": 0.5, - "learning_rate": 2.481227133375419e-05, - "loss": 2.3724, - "step": 288870 - }, - { - "epoch": 0.5, - "learning_rate": 2.4811399393827364e-05, - "loss": 2.4173, - "step": 288880 - }, - { - "epoch": 0.5, - "learning_rate": 2.4810527453900538e-05, - "loss": 2.3648, - "step": 288890 - }, - { - "epoch": 0.5, - "learning_rate": 2.4809655513973708e-05, - "loss": 2.1772, - "step": 288900 - }, - { - "epoch": 0.5, - "learning_rate": 2.4808783574046885e-05, - "loss": 2.4278, - "step": 288910 - }, - { - "epoch": 0.5, - "learning_rate": 2.4807911634120056e-05, - "loss": 2.3561, - "step": 288920 - }, - { - "epoch": 0.5, - "learning_rate": 2.480703969419323e-05, - "loss": 2.2298, - "step": 288930 - }, - { - "epoch": 0.5, - "learning_rate": 2.4806167754266403e-05, - "loss": 2.2692, - "step": 288940 - }, - { - "epoch": 0.5, - "learning_rate": 2.4805295814339577e-05, - "loss": 2.3031, - "step": 288950 - }, - { - "epoch": 0.5, - "learning_rate": 2.480442387441275e-05, - "loss": 2.4073, - "step": 288960 - }, - { - "epoch": 0.5, - "learning_rate": 2.480355193448592e-05, - "loss": 2.4386, - "step": 288970 - }, - { - "epoch": 0.5, - "learning_rate": 2.4802679994559098e-05, - "loss": 2.3414, - "step": 288980 - }, - { - "epoch": 0.5, - "learning_rate": 2.480180805463227e-05, - "loss": 2.3003, - "step": 288990 - }, - { - "epoch": 0.5, - "learning_rate": 2.4800936114705442e-05, - "loss": 2.3353, - "step": 289000 - }, - { - "epoch": 0.5, - "learning_rate": 2.4800064174778613e-05, - "loss": 2.3224, - "step": 289010 - }, - { - "epoch": 0.5, - "learning_rate": 2.479919223485179e-05, - "loss": 2.4021, - "step": 289020 - }, - { - "epoch": 0.5, - "learning_rate": 2.4798320294924964e-05, - "loss": 2.4544, - "step": 289030 - }, - { - "epoch": 0.5, - "learning_rate": 2.4797448354998134e-05, - "loss": 2.4166, - "step": 289040 - }, - { - "epoch": 0.5, - "learning_rate": 2.479657641507131e-05, - "loss": 2.2541, - "step": 289050 - }, - { - "epoch": 0.5, - "learning_rate": 2.479570447514448e-05, - "loss": 2.3954, - "step": 289060 - }, - { - "epoch": 0.5, - "learning_rate": 2.4794832535217655e-05, - "loss": 2.348, - "step": 289070 - }, - { - "epoch": 0.5, - "learning_rate": 2.4793960595290826e-05, - "loss": 2.3917, - "step": 289080 - }, - { - "epoch": 0.5, - "learning_rate": 2.4793088655364003e-05, - "loss": 2.2845, - "step": 289090 - }, - { - "epoch": 0.5, - "learning_rate": 2.4792216715437173e-05, - "loss": 2.3718, - "step": 289100 - }, - { - "epoch": 0.5, - "learning_rate": 2.4791344775510347e-05, - "loss": 2.3641, - "step": 289110 - }, - { - "epoch": 0.5, - "learning_rate": 2.479047283558352e-05, - "loss": 2.3161, - "step": 289120 - }, - { - "epoch": 0.5, - "learning_rate": 2.4789600895656695e-05, - "loss": 2.3821, - "step": 289130 - }, - { - "epoch": 0.5, - "learning_rate": 2.478872895572987e-05, - "loss": 2.3472, - "step": 289140 - }, - { - "epoch": 0.5, - "learning_rate": 2.478785701580304e-05, - "loss": 2.2837, - "step": 289150 - }, - { - "epoch": 0.5, - "learning_rate": 2.4786985075876213e-05, - "loss": 2.2695, - "step": 289160 - }, - { - "epoch": 0.5, - "learning_rate": 2.4786113135949386e-05, - "loss": 2.4039, - "step": 289170 - }, - { - "epoch": 0.5, - "learning_rate": 2.478524119602256e-05, - "loss": 2.3869, - "step": 289180 - }, - { - "epoch": 0.5, - "learning_rate": 2.4784369256095734e-05, - "loss": 2.4482, - "step": 289190 - }, - { - "epoch": 0.5, - "learning_rate": 2.4783497316168908e-05, - "loss": 2.3041, - "step": 289200 - }, - { - "epoch": 0.5, - "learning_rate": 2.478262537624208e-05, - "loss": 2.373, - "step": 289210 - }, - { - "epoch": 0.5, - "learning_rate": 2.4781753436315252e-05, - "loss": 2.2963, - "step": 289220 - }, - { - "epoch": 0.5, - "learning_rate": 2.4780881496388426e-05, - "loss": 2.471, - "step": 289230 - }, - { - "epoch": 0.5, - "learning_rate": 2.47800095564616e-05, - "loss": 2.2769, - "step": 289240 - }, - { - "epoch": 0.5, - "learning_rate": 2.4779137616534773e-05, - "loss": 2.3131, - "step": 289250 - }, - { - "epoch": 0.5, - "learning_rate": 2.4778265676607944e-05, - "loss": 2.2801, - "step": 289260 - }, - { - "epoch": 0.5, - "learning_rate": 2.4777393736681117e-05, - "loss": 2.3475, - "step": 289270 - }, - { - "epoch": 0.5, - "learning_rate": 2.4776521796754294e-05, - "loss": 2.3625, - "step": 289280 - }, - { - "epoch": 0.5, - "learning_rate": 2.4775649856827465e-05, - "loss": 2.2698, - "step": 289290 - }, - { - "epoch": 0.5, - "learning_rate": 2.477477791690064e-05, - "loss": 2.4298, - "step": 289300 - }, - { - "epoch": 0.5, - "learning_rate": 2.477390597697381e-05, - "loss": 2.3185, - "step": 289310 - }, - { - "epoch": 0.5, - "learning_rate": 2.4773034037046986e-05, - "loss": 2.3965, - "step": 289320 - }, - { - "epoch": 0.5, - "learning_rate": 2.4772162097120157e-05, - "loss": 2.3904, - "step": 289330 - }, - { - "epoch": 0.5, - "learning_rate": 2.477129015719333e-05, - "loss": 2.4527, - "step": 289340 - }, - { - "epoch": 0.5, - "learning_rate": 2.4770418217266504e-05, - "loss": 2.3859, - "step": 289350 - }, - { - "epoch": 0.5, - "learning_rate": 2.4769546277339678e-05, - "loss": 2.3495, - "step": 289360 - }, - { - "epoch": 0.5, - "learning_rate": 2.476867433741285e-05, - "loss": 2.1536, - "step": 289370 - }, - { - "epoch": 0.5, - "learning_rate": 2.4767802397486022e-05, - "loss": 2.2443, - "step": 289380 - }, - { - "epoch": 0.5, - "learning_rate": 2.47669304575592e-05, - "loss": 2.3802, - "step": 289390 - }, - { - "epoch": 0.5, - "learning_rate": 2.476605851763237e-05, - "loss": 2.4404, - "step": 289400 - }, - { - "epoch": 0.5, - "learning_rate": 2.4765186577705543e-05, - "loss": 2.3591, - "step": 289410 - }, - { - "epoch": 0.5, - "learning_rate": 2.4764314637778717e-05, - "loss": 2.3411, - "step": 289420 - }, - { - "epoch": 0.5, - "learning_rate": 2.476344269785189e-05, - "loss": 2.3765, - "step": 289430 - }, - { - "epoch": 0.5, - "learning_rate": 2.4762570757925065e-05, - "loss": 2.3931, - "step": 289440 - }, - { - "epoch": 0.5, - "learning_rate": 2.4761698817998235e-05, - "loss": 2.3829, - "step": 289450 - }, - { - "epoch": 0.5, - "learning_rate": 2.4760826878071412e-05, - "loss": 2.4214, - "step": 289460 - }, - { - "epoch": 0.5, - "learning_rate": 2.4759954938144583e-05, - "loss": 2.5588, - "step": 289470 - }, - { - "epoch": 0.5, - "learning_rate": 2.4759082998217756e-05, - "loss": 2.1934, - "step": 289480 - }, - { - "epoch": 0.5, - "learning_rate": 2.4758211058290927e-05, - "loss": 2.3098, - "step": 289490 - }, - { - "epoch": 0.5, - "learning_rate": 2.4757339118364104e-05, - "loss": 2.2045, - "step": 289500 - }, - { - "epoch": 0.5, - "learning_rate": 2.4756467178437278e-05, - "loss": 2.3424, - "step": 289510 - }, - { - "epoch": 0.5, - "learning_rate": 2.4755595238510448e-05, - "loss": 2.3851, - "step": 289520 - }, - { - "epoch": 0.5, - "learning_rate": 2.4754723298583622e-05, - "loss": 2.3599, - "step": 289530 - }, - { - "epoch": 0.5, - "learning_rate": 2.4753851358656796e-05, - "loss": 2.2394, - "step": 289540 - }, - { - "epoch": 0.5, - "learning_rate": 2.475297941872997e-05, - "loss": 2.3502, - "step": 289550 - }, - { - "epoch": 0.5, - "learning_rate": 2.475210747880314e-05, - "loss": 2.2637, - "step": 289560 - }, - { - "epoch": 0.5, - "learning_rate": 2.4751235538876313e-05, - "loss": 2.4154, - "step": 289570 - }, - { - "epoch": 0.5, - "learning_rate": 2.4750363598949487e-05, - "loss": 2.402, - "step": 289580 - }, - { - "epoch": 0.51, - "learning_rate": 2.474949165902266e-05, - "loss": 2.194, - "step": 289590 - }, - { - "epoch": 0.51, - "learning_rate": 2.4748619719095835e-05, - "loss": 2.3227, - "step": 289600 - }, - { - "epoch": 0.51, - "learning_rate": 2.474774777916901e-05, - "loss": 2.3868, - "step": 289610 - }, - { - "epoch": 0.51, - "learning_rate": 2.4746875839242182e-05, - "loss": 2.3488, - "step": 289620 - }, - { - "epoch": 0.51, - "learning_rate": 2.4746003899315353e-05, - "loss": 2.4322, - "step": 289630 - }, - { - "epoch": 0.51, - "learning_rate": 2.4745131959388526e-05, - "loss": 2.5103, - "step": 289640 - }, - { - "epoch": 0.51, - "learning_rate": 2.47442600194617e-05, - "loss": 2.2787, - "step": 289650 - }, - { - "epoch": 0.51, - "learning_rate": 2.4743388079534874e-05, - "loss": 2.3334, - "step": 289660 - }, - { - "epoch": 0.51, - "learning_rate": 2.4742516139608048e-05, - "loss": 2.3668, - "step": 289670 - }, - { - "epoch": 0.51, - "learning_rate": 2.4741644199681218e-05, - "loss": 2.2986, - "step": 289680 - }, - { - "epoch": 0.51, - "learning_rate": 2.4740772259754395e-05, - "loss": 2.3473, - "step": 289690 - }, - { - "epoch": 0.51, - "learning_rate": 2.4739900319827566e-05, - "loss": 2.3773, - "step": 289700 - }, - { - "epoch": 0.51, - "learning_rate": 2.473902837990074e-05, - "loss": 2.4054, - "step": 289710 - }, - { - "epoch": 0.51, - "learning_rate": 2.4738156439973913e-05, - "loss": 2.3478, - "step": 289720 - }, - { - "epoch": 0.51, - "learning_rate": 2.4737284500047087e-05, - "loss": 2.3944, - "step": 289730 - }, - { - "epoch": 0.51, - "learning_rate": 2.4736412560120257e-05, - "loss": 2.2815, - "step": 289740 - }, - { - "epoch": 0.51, - "learning_rate": 2.473554062019343e-05, - "loss": 2.4135, - "step": 289750 - }, - { - "epoch": 0.51, - "learning_rate": 2.4734668680266608e-05, - "loss": 2.3447, - "step": 289760 - }, - { - "epoch": 0.51, - "learning_rate": 2.473379674033978e-05, - "loss": 2.3952, - "step": 289770 - }, - { - "epoch": 0.51, - "learning_rate": 2.4732924800412952e-05, - "loss": 2.371, - "step": 289780 - }, - { - "epoch": 0.51, - "learning_rate": 2.4732052860486123e-05, - "loss": 2.383, - "step": 289790 - }, - { - "epoch": 0.51, - "learning_rate": 2.47311809205593e-05, - "loss": 2.3225, - "step": 289800 - }, - { - "epoch": 0.51, - "learning_rate": 2.473030898063247e-05, - "loss": 2.349, - "step": 289810 - }, - { - "epoch": 0.51, - "learning_rate": 2.4729437040705644e-05, - "loss": 2.4892, - "step": 289820 - }, - { - "epoch": 0.51, - "learning_rate": 2.4728565100778818e-05, - "loss": 2.4997, - "step": 289830 - }, - { - "epoch": 0.51, - "learning_rate": 2.472769316085199e-05, - "loss": 2.2927, - "step": 289840 - }, - { - "epoch": 0.51, - "learning_rate": 2.4726821220925165e-05, - "loss": 2.3983, - "step": 289850 - }, - { - "epoch": 0.51, - "learning_rate": 2.4725949280998336e-05, - "loss": 2.2869, - "step": 289860 - }, - { - "epoch": 0.51, - "learning_rate": 2.4725077341071513e-05, - "loss": 2.2917, - "step": 289870 - }, - { - "epoch": 0.51, - "learning_rate": 2.4724205401144683e-05, - "loss": 2.4332, - "step": 289880 - }, - { - "epoch": 0.51, - "learning_rate": 2.4723333461217857e-05, - "loss": 2.3978, - "step": 289890 - }, - { - "epoch": 0.51, - "learning_rate": 2.472246152129103e-05, - "loss": 2.4321, - "step": 289900 - }, - { - "epoch": 0.51, - "learning_rate": 2.4721589581364205e-05, - "loss": 2.5071, - "step": 289910 - }, - { - "epoch": 0.51, - "learning_rate": 2.472071764143738e-05, - "loss": 2.3462, - "step": 289920 - }, - { - "epoch": 0.51, - "learning_rate": 2.471984570151055e-05, - "loss": 2.4456, - "step": 289930 - }, - { - "epoch": 0.51, - "learning_rate": 2.4718973761583723e-05, - "loss": 2.3691, - "step": 289940 - }, - { - "epoch": 0.51, - "learning_rate": 2.4718101821656896e-05, - "loss": 2.437, - "step": 289950 - }, - { - "epoch": 0.51, - "learning_rate": 2.471722988173007e-05, - "loss": 2.3449, - "step": 289960 - }, - { - "epoch": 0.51, - "learning_rate": 2.471635794180324e-05, - "loss": 2.3039, - "step": 289970 - }, - { - "epoch": 0.51, - "learning_rate": 2.4715486001876418e-05, - "loss": 2.4202, - "step": 289980 - }, - { - "epoch": 0.51, - "learning_rate": 2.4714614061949588e-05, - "loss": 2.3993, - "step": 289990 - }, - { - "epoch": 0.51, - "learning_rate": 2.4713742122022762e-05, - "loss": 2.2215, - "step": 290000 - }, - { - "epoch": 0.51, - "learning_rate": 2.4712870182095936e-05, - "loss": 2.5296, - "step": 290010 - }, - { - "epoch": 0.51, - "learning_rate": 2.471199824216911e-05, - "loss": 2.328, - "step": 290020 - }, - { - "epoch": 0.51, - "learning_rate": 2.4711126302242283e-05, - "loss": 2.3154, - "step": 290030 - }, - { - "epoch": 0.51, - "learning_rate": 2.4710254362315454e-05, - "loss": 2.3397, - "step": 290040 - }, - { - "epoch": 0.51, - "learning_rate": 2.4709382422388627e-05, - "loss": 2.3884, - "step": 290050 - }, - { - "epoch": 0.51, - "learning_rate": 2.47085104824618e-05, - "loss": 2.4105, - "step": 290060 - }, - { - "epoch": 0.51, - "learning_rate": 2.4707638542534975e-05, - "loss": 2.3218, - "step": 290070 - }, - { - "epoch": 0.51, - "learning_rate": 2.470676660260815e-05, - "loss": 2.5264, - "step": 290080 - }, - { - "epoch": 0.51, - "learning_rate": 2.470589466268132e-05, - "loss": 2.2383, - "step": 290090 - }, - { - "epoch": 0.51, - "learning_rate": 2.4705022722754496e-05, - "loss": 2.3599, - "step": 290100 - }, - { - "epoch": 0.51, - "learning_rate": 2.4704150782827667e-05, - "loss": 2.4215, - "step": 290110 - }, - { - "epoch": 0.51, - "learning_rate": 2.470327884290084e-05, - "loss": 2.3351, - "step": 290120 - }, - { - "epoch": 0.51, - "learning_rate": 2.4702406902974014e-05, - "loss": 2.3194, - "step": 290130 - }, - { - "epoch": 0.51, - "learning_rate": 2.4701534963047188e-05, - "loss": 2.3975, - "step": 290140 - }, - { - "epoch": 0.51, - "learning_rate": 2.470066302312036e-05, - "loss": 2.3309, - "step": 290150 - }, - { - "epoch": 0.51, - "learning_rate": 2.4699791083193532e-05, - "loss": 2.4137, - "step": 290160 - }, - { - "epoch": 0.51, - "learning_rate": 2.469891914326671e-05, - "loss": 2.3648, - "step": 290170 - }, - { - "epoch": 0.51, - "learning_rate": 2.469804720333988e-05, - "loss": 2.3223, - "step": 290180 - }, - { - "epoch": 0.51, - "learning_rate": 2.4697175263413053e-05, - "loss": 2.2615, - "step": 290190 - }, - { - "epoch": 0.51, - "learning_rate": 2.4696303323486224e-05, - "loss": 2.2955, - "step": 290200 - }, - { - "epoch": 0.51, - "learning_rate": 2.46954313835594e-05, - "loss": 2.285, - "step": 290210 - }, - { - "epoch": 0.51, - "learning_rate": 2.469455944363257e-05, - "loss": 2.2654, - "step": 290220 - }, - { - "epoch": 0.51, - "learning_rate": 2.4693687503705745e-05, - "loss": 2.4573, - "step": 290230 - }, - { - "epoch": 0.51, - "learning_rate": 2.469281556377892e-05, - "loss": 2.26, - "step": 290240 - }, - { - "epoch": 0.51, - "learning_rate": 2.4691943623852093e-05, - "loss": 2.3259, - "step": 290250 - }, - { - "epoch": 0.51, - "learning_rate": 2.4691071683925266e-05, - "loss": 2.2398, - "step": 290260 - }, - { - "epoch": 0.51, - "learning_rate": 2.4690199743998437e-05, - "loss": 2.3792, - "step": 290270 - }, - { - "epoch": 0.51, - "learning_rate": 2.4689327804071614e-05, - "loss": 2.4395, - "step": 290280 - }, - { - "epoch": 0.51, - "learning_rate": 2.4688455864144784e-05, - "loss": 2.2543, - "step": 290290 - }, - { - "epoch": 0.51, - "learning_rate": 2.4687583924217958e-05, - "loss": 2.3868, - "step": 290300 - }, - { - "epoch": 0.51, - "learning_rate": 2.4686711984291132e-05, - "loss": 2.3944, - "step": 290310 - }, - { - "epoch": 0.51, - "learning_rate": 2.4685840044364306e-05, - "loss": 2.4142, - "step": 290320 - }, - { - "epoch": 0.51, - "learning_rate": 2.468496810443748e-05, - "loss": 2.467, - "step": 290330 - }, - { - "epoch": 0.51, - "learning_rate": 2.468409616451065e-05, - "loss": 2.4157, - "step": 290340 - }, - { - "epoch": 0.51, - "learning_rate": 2.4683224224583823e-05, - "loss": 2.2731, - "step": 290350 - }, - { - "epoch": 0.51, - "learning_rate": 2.4682352284656997e-05, - "loss": 2.4202, - "step": 290360 - }, - { - "epoch": 0.51, - "learning_rate": 2.468148034473017e-05, - "loss": 2.3596, - "step": 290370 - }, - { - "epoch": 0.51, - "learning_rate": 2.4680608404803345e-05, - "loss": 2.2681, - "step": 290380 - }, - { - "epoch": 0.51, - "learning_rate": 2.467973646487652e-05, - "loss": 2.3925, - "step": 290390 - }, - { - "epoch": 0.51, - "learning_rate": 2.4678864524949692e-05, - "loss": 2.4209, - "step": 290400 - }, - { - "epoch": 0.51, - "learning_rate": 2.4677992585022863e-05, - "loss": 2.4489, - "step": 290410 - }, - { - "epoch": 0.51, - "learning_rate": 2.4677120645096036e-05, - "loss": 2.2727, - "step": 290420 - }, - { - "epoch": 0.51, - "learning_rate": 2.467624870516921e-05, - "loss": 2.2134, - "step": 290430 - }, - { - "epoch": 0.51, - "learning_rate": 2.4675376765242384e-05, - "loss": 2.2759, - "step": 290440 - }, - { - "epoch": 0.51, - "learning_rate": 2.4674504825315554e-05, - "loss": 2.3137, - "step": 290450 - }, - { - "epoch": 0.51, - "learning_rate": 2.4673632885388728e-05, - "loss": 2.4497, - "step": 290460 - }, - { - "epoch": 0.51, - "learning_rate": 2.4672760945461902e-05, - "loss": 2.3005, - "step": 290470 - }, - { - "epoch": 0.51, - "learning_rate": 2.4671889005535076e-05, - "loss": 2.3795, - "step": 290480 - }, - { - "epoch": 0.51, - "learning_rate": 2.467101706560825e-05, - "loss": 2.3937, - "step": 290490 - }, - { - "epoch": 0.51, - "learning_rate": 2.467014512568142e-05, - "loss": 2.4106, - "step": 290500 - }, - { - "epoch": 0.51, - "learning_rate": 2.4669273185754597e-05, - "loss": 2.4397, - "step": 290510 - }, - { - "epoch": 0.51, - "learning_rate": 2.4668401245827767e-05, - "loss": 2.3451, - "step": 290520 - }, - { - "epoch": 0.51, - "learning_rate": 2.466752930590094e-05, - "loss": 2.3493, - "step": 290530 - }, - { - "epoch": 0.51, - "learning_rate": 2.4666657365974115e-05, - "loss": 2.3672, - "step": 290540 - }, - { - "epoch": 0.51, - "learning_rate": 2.466578542604729e-05, - "loss": 2.2177, - "step": 290550 - }, - { - "epoch": 0.51, - "learning_rate": 2.4664913486120462e-05, - "loss": 2.3938, - "step": 290560 - }, - { - "epoch": 0.51, - "learning_rate": 2.4664041546193633e-05, - "loss": 2.3694, - "step": 290570 - }, - { - "epoch": 0.51, - "learning_rate": 2.466316960626681e-05, - "loss": 2.3685, - "step": 290580 - }, - { - "epoch": 0.51, - "learning_rate": 2.466229766633998e-05, - "loss": 2.3158, - "step": 290590 - }, - { - "epoch": 0.51, - "learning_rate": 2.4661425726413154e-05, - "loss": 2.4338, - "step": 290600 - }, - { - "epoch": 0.51, - "learning_rate": 2.4660553786486325e-05, - "loss": 2.4061, - "step": 290610 - }, - { - "epoch": 0.51, - "learning_rate": 2.46596818465595e-05, - "loss": 2.4087, - "step": 290620 - }, - { - "epoch": 0.51, - "learning_rate": 2.4658809906632675e-05, - "loss": 2.429, - "step": 290630 - }, - { - "epoch": 0.51, - "learning_rate": 2.4657937966705846e-05, - "loss": 2.3303, - "step": 290640 - }, - { - "epoch": 0.51, - "learning_rate": 2.4657066026779023e-05, - "loss": 2.4193, - "step": 290650 - }, - { - "epoch": 0.51, - "learning_rate": 2.4656194086852193e-05, - "loss": 2.3597, - "step": 290660 - }, - { - "epoch": 0.51, - "learning_rate": 2.4655322146925367e-05, - "loss": 2.3759, - "step": 290670 - }, - { - "epoch": 0.51, - "learning_rate": 2.4654450206998538e-05, - "loss": 2.4201, - "step": 290680 - }, - { - "epoch": 0.51, - "learning_rate": 2.4653578267071715e-05, - "loss": 2.3443, - "step": 290690 - }, - { - "epoch": 0.51, - "learning_rate": 2.4652706327144885e-05, - "loss": 2.3261, - "step": 290700 - }, - { - "epoch": 0.51, - "learning_rate": 2.465183438721806e-05, - "loss": 2.3234, - "step": 290710 - }, - { - "epoch": 0.51, - "learning_rate": 2.4650962447291233e-05, - "loss": 2.4269, - "step": 290720 - }, - { - "epoch": 0.51, - "learning_rate": 2.4650090507364406e-05, - "loss": 2.3269, - "step": 290730 - }, - { - "epoch": 0.51, - "learning_rate": 2.464921856743758e-05, - "loss": 2.3469, - "step": 290740 - }, - { - "epoch": 0.51, - "learning_rate": 2.464834662751075e-05, - "loss": 2.2616, - "step": 290750 - }, - { - "epoch": 0.51, - "learning_rate": 2.4647474687583924e-05, - "loss": 2.4772, - "step": 290760 - }, - { - "epoch": 0.51, - "learning_rate": 2.4646602747657098e-05, - "loss": 2.2957, - "step": 290770 - }, - { - "epoch": 0.51, - "learning_rate": 2.4645730807730272e-05, - "loss": 2.4445, - "step": 290780 - }, - { - "epoch": 0.51, - "learning_rate": 2.4644858867803446e-05, - "loss": 2.2416, - "step": 290790 - }, - { - "epoch": 0.51, - "learning_rate": 2.464398692787662e-05, - "loss": 2.3741, - "step": 290800 - }, - { - "epoch": 0.51, - "learning_rate": 2.4643114987949793e-05, - "loss": 2.4135, - "step": 290810 - }, - { - "epoch": 0.51, - "learning_rate": 2.4642243048022964e-05, - "loss": 2.2906, - "step": 290820 - }, - { - "epoch": 0.51, - "learning_rate": 2.4641371108096137e-05, - "loss": 2.4283, - "step": 290830 - }, - { - "epoch": 0.51, - "learning_rate": 2.464049916816931e-05, - "loss": 2.4637, - "step": 290840 - }, - { - "epoch": 0.51, - "learning_rate": 2.4639627228242485e-05, - "loss": 2.2789, - "step": 290850 - }, - { - "epoch": 0.51, - "learning_rate": 2.463875528831566e-05, - "loss": 2.4686, - "step": 290860 - }, - { - "epoch": 0.51, - "learning_rate": 2.463788334838883e-05, - "loss": 2.4092, - "step": 290870 - }, - { - "epoch": 0.51, - "learning_rate": 2.4637011408462006e-05, - "loss": 2.3775, - "step": 290880 - }, - { - "epoch": 0.51, - "learning_rate": 2.4636139468535177e-05, - "loss": 2.1926, - "step": 290890 - }, - { - "epoch": 0.51, - "learning_rate": 2.463526752860835e-05, - "loss": 2.3059, - "step": 290900 - }, - { - "epoch": 0.51, - "learning_rate": 2.4634395588681524e-05, - "loss": 2.406, - "step": 290910 - }, - { - "epoch": 0.51, - "learning_rate": 2.4633523648754698e-05, - "loss": 2.3754, - "step": 290920 - }, - { - "epoch": 0.51, - "learning_rate": 2.4632651708827868e-05, - "loss": 2.3531, - "step": 290930 - }, - { - "epoch": 0.51, - "learning_rate": 2.4631779768901042e-05, - "loss": 2.3518, - "step": 290940 - }, - { - "epoch": 0.51, - "learning_rate": 2.4630907828974216e-05, - "loss": 2.361, - "step": 290950 - }, - { - "epoch": 0.51, - "learning_rate": 2.463003588904739e-05, - "loss": 2.2983, - "step": 290960 - }, - { - "epoch": 0.51, - "learning_rate": 2.4629163949120563e-05, - "loss": 2.2878, - "step": 290970 - }, - { - "epoch": 0.51, - "learning_rate": 2.4628292009193734e-05, - "loss": 2.2756, - "step": 290980 - }, - { - "epoch": 0.51, - "learning_rate": 2.462742006926691e-05, - "loss": 2.3712, - "step": 290990 - }, - { - "epoch": 0.51, - "learning_rate": 2.462654812934008e-05, - "loss": 2.4059, - "step": 291000 - }, - { - "epoch": 0.51, - "learning_rate": 2.4625676189413255e-05, - "loss": 2.3662, - "step": 291010 - }, - { - "epoch": 0.51, - "learning_rate": 2.462480424948643e-05, - "loss": 2.4489, - "step": 291020 - }, - { - "epoch": 0.51, - "learning_rate": 2.4623932309559603e-05, - "loss": 2.3683, - "step": 291030 - }, - { - "epoch": 0.51, - "learning_rate": 2.4623060369632776e-05, - "loss": 2.3423, - "step": 291040 - }, - { - "epoch": 0.51, - "learning_rate": 2.4622188429705947e-05, - "loss": 2.3977, - "step": 291050 - }, - { - "epoch": 0.51, - "learning_rate": 2.4621316489779124e-05, - "loss": 2.3872, - "step": 291060 - }, - { - "epoch": 0.51, - "learning_rate": 2.4620444549852294e-05, - "loss": 2.2665, - "step": 291070 - }, - { - "epoch": 0.51, - "learning_rate": 2.4619572609925468e-05, - "loss": 2.3818, - "step": 291080 - }, - { - "epoch": 0.51, - "learning_rate": 2.461870066999864e-05, - "loss": 2.3291, - "step": 291090 - }, - { - "epoch": 0.51, - "learning_rate": 2.4617828730071816e-05, - "loss": 2.2563, - "step": 291100 - }, - { - "epoch": 0.51, - "learning_rate": 2.461695679014499e-05, - "loss": 2.4648, - "step": 291110 - }, - { - "epoch": 0.51, - "learning_rate": 2.461608485021816e-05, - "loss": 2.3638, - "step": 291120 - }, - { - "epoch": 0.51, - "learning_rate": 2.4615212910291333e-05, - "loss": 2.4421, - "step": 291130 - }, - { - "epoch": 0.51, - "learning_rate": 2.4614340970364507e-05, - "loss": 2.3165, - "step": 291140 - }, - { - "epoch": 0.51, - "learning_rate": 2.461346903043768e-05, - "loss": 2.2855, - "step": 291150 - }, - { - "epoch": 0.51, - "learning_rate": 2.461259709051085e-05, - "loss": 2.4823, - "step": 291160 - }, - { - "epoch": 0.51, - "learning_rate": 2.4611725150584025e-05, - "loss": 2.3494, - "step": 291170 - }, - { - "epoch": 0.51, - "learning_rate": 2.46108532106572e-05, - "loss": 2.3245, - "step": 291180 - }, - { - "epoch": 0.51, - "learning_rate": 2.4609981270730373e-05, - "loss": 2.3648, - "step": 291190 - }, - { - "epoch": 0.51, - "learning_rate": 2.4609109330803546e-05, - "loss": 2.3025, - "step": 291200 - }, - { - "epoch": 0.51, - "learning_rate": 2.460823739087672e-05, - "loss": 2.3609, - "step": 291210 - }, - { - "epoch": 0.51, - "learning_rate": 2.4607365450949894e-05, - "loss": 2.355, - "step": 291220 - }, - { - "epoch": 0.51, - "learning_rate": 2.4606493511023064e-05, - "loss": 2.3562, - "step": 291230 - }, - { - "epoch": 0.51, - "learning_rate": 2.4605621571096238e-05, - "loss": 2.4601, - "step": 291240 - }, - { - "epoch": 0.51, - "learning_rate": 2.4604749631169412e-05, - "loss": 2.2682, - "step": 291250 - }, - { - "epoch": 0.51, - "learning_rate": 2.4603877691242586e-05, - "loss": 2.3156, - "step": 291260 - }, - { - "epoch": 0.51, - "learning_rate": 2.460300575131576e-05, - "loss": 2.3936, - "step": 291270 - }, - { - "epoch": 0.51, - "learning_rate": 2.460213381138893e-05, - "loss": 2.3774, - "step": 291280 - }, - { - "epoch": 0.51, - "learning_rate": 2.4601261871462107e-05, - "loss": 2.2621, - "step": 291290 - }, - { - "epoch": 0.51, - "learning_rate": 2.4600389931535277e-05, - "loss": 2.4418, - "step": 291300 - }, - { - "epoch": 0.51, - "learning_rate": 2.459951799160845e-05, - "loss": 2.4683, - "step": 291310 - }, - { - "epoch": 0.51, - "learning_rate": 2.4598646051681625e-05, - "loss": 2.4363, - "step": 291320 - }, - { - "epoch": 0.51, - "learning_rate": 2.45977741117548e-05, - "loss": 2.367, - "step": 291330 - }, - { - "epoch": 0.51, - "learning_rate": 2.459690217182797e-05, - "loss": 2.3213, - "step": 291340 - }, - { - "epoch": 0.51, - "learning_rate": 2.4596030231901143e-05, - "loss": 2.3019, - "step": 291350 - }, - { - "epoch": 0.51, - "learning_rate": 2.459515829197432e-05, - "loss": 2.5196, - "step": 291360 - }, - { - "epoch": 0.51, - "learning_rate": 2.459428635204749e-05, - "loss": 2.5076, - "step": 291370 - }, - { - "epoch": 0.51, - "learning_rate": 2.4593414412120664e-05, - "loss": 2.359, - "step": 291380 - }, - { - "epoch": 0.51, - "learning_rate": 2.4592542472193835e-05, - "loss": 2.4206, - "step": 291390 - }, - { - "epoch": 0.51, - "learning_rate": 2.459167053226701e-05, - "loss": 2.4193, - "step": 291400 - }, - { - "epoch": 0.51, - "learning_rate": 2.4590798592340182e-05, - "loss": 2.3422, - "step": 291410 - }, - { - "epoch": 0.51, - "learning_rate": 2.4589926652413356e-05, - "loss": 2.3402, - "step": 291420 - }, - { - "epoch": 0.51, - "learning_rate": 2.458905471248653e-05, - "loss": 2.353, - "step": 291430 - }, - { - "epoch": 0.51, - "learning_rate": 2.4588182772559703e-05, - "loss": 2.477, - "step": 291440 - }, - { - "epoch": 0.51, - "learning_rate": 2.4587310832632877e-05, - "loss": 2.4094, - "step": 291450 - }, - { - "epoch": 0.51, - "learning_rate": 2.4586438892706048e-05, - "loss": 2.4597, - "step": 291460 - }, - { - "epoch": 0.51, - "learning_rate": 2.4585566952779225e-05, - "loss": 2.4476, - "step": 291470 - }, - { - "epoch": 0.51, - "learning_rate": 2.4584695012852395e-05, - "loss": 2.4248, - "step": 291480 - }, - { - "epoch": 0.51, - "learning_rate": 2.458382307292557e-05, - "loss": 2.2478, - "step": 291490 - }, - { - "epoch": 0.51, - "learning_rate": 2.4582951132998743e-05, - "loss": 2.3611, - "step": 291500 - }, - { - "epoch": 0.51, - "learning_rate": 2.4582079193071916e-05, - "loss": 2.3716, - "step": 291510 - }, - { - "epoch": 0.51, - "learning_rate": 2.458120725314509e-05, - "loss": 2.3944, - "step": 291520 - }, - { - "epoch": 0.51, - "learning_rate": 2.458033531321826e-05, - "loss": 2.4157, - "step": 291530 - }, - { - "epoch": 0.51, - "learning_rate": 2.4579463373291434e-05, - "loss": 2.3429, - "step": 291540 - }, - { - "epoch": 0.51, - "learning_rate": 2.4578591433364608e-05, - "loss": 2.2594, - "step": 291550 - }, - { - "epoch": 0.51, - "learning_rate": 2.4577719493437782e-05, - "loss": 2.3294, - "step": 291560 - }, - { - "epoch": 0.51, - "learning_rate": 2.4576847553510952e-05, - "loss": 2.4084, - "step": 291570 - }, - { - "epoch": 0.51, - "learning_rate": 2.457597561358413e-05, - "loss": 2.3373, - "step": 291580 - }, - { - "epoch": 0.51, - "learning_rate": 2.4575103673657303e-05, - "loss": 2.4561, - "step": 291590 - }, - { - "epoch": 0.51, - "learning_rate": 2.4574231733730474e-05, - "loss": 2.297, - "step": 291600 - }, - { - "epoch": 0.51, - "learning_rate": 2.4573359793803647e-05, - "loss": 2.3382, - "step": 291610 - }, - { - "epoch": 0.51, - "learning_rate": 2.457248785387682e-05, - "loss": 2.2478, - "step": 291620 - }, - { - "epoch": 0.51, - "learning_rate": 2.4571615913949995e-05, - "loss": 2.4447, - "step": 291630 - }, - { - "epoch": 0.51, - "learning_rate": 2.4570743974023165e-05, - "loss": 2.2985, - "step": 291640 - }, - { - "epoch": 0.51, - "learning_rate": 2.456987203409634e-05, - "loss": 2.3452, - "step": 291650 - }, - { - "epoch": 0.51, - "learning_rate": 2.4569000094169513e-05, - "loss": 2.3543, - "step": 291660 - }, - { - "epoch": 0.51, - "learning_rate": 2.4568128154242687e-05, - "loss": 2.3935, - "step": 291670 - }, - { - "epoch": 0.51, - "learning_rate": 2.456725621431586e-05, - "loss": 2.4599, - "step": 291680 - }, - { - "epoch": 0.51, - "learning_rate": 2.456638427438903e-05, - "loss": 2.3412, - "step": 291690 - }, - { - "epoch": 0.51, - "learning_rate": 2.4565512334462208e-05, - "loss": 2.3389, - "step": 291700 - }, - { - "epoch": 0.51, - "learning_rate": 2.4564640394535378e-05, - "loss": 2.3661, - "step": 291710 - }, - { - "epoch": 0.51, - "learning_rate": 2.4563768454608552e-05, - "loss": 2.2814, - "step": 291720 - }, - { - "epoch": 0.51, - "learning_rate": 2.4562896514681726e-05, - "loss": 2.2423, - "step": 291730 - }, - { - "epoch": 0.51, - "learning_rate": 2.45620245747549e-05, - "loss": 2.3546, - "step": 291740 - }, - { - "epoch": 0.51, - "learning_rate": 2.4561152634828073e-05, - "loss": 2.3158, - "step": 291750 - }, - { - "epoch": 0.51, - "learning_rate": 2.4560280694901244e-05, - "loss": 2.3967, - "step": 291760 - }, - { - "epoch": 0.51, - "learning_rate": 2.455940875497442e-05, - "loss": 2.2346, - "step": 291770 - }, - { - "epoch": 0.51, - "learning_rate": 2.455853681504759e-05, - "loss": 2.3362, - "step": 291780 - }, - { - "epoch": 0.51, - "learning_rate": 2.4557664875120765e-05, - "loss": 2.2338, - "step": 291790 - }, - { - "epoch": 0.51, - "learning_rate": 2.4556792935193935e-05, - "loss": 2.3445, - "step": 291800 - }, - { - "epoch": 0.51, - "learning_rate": 2.4555920995267113e-05, - "loss": 2.3916, - "step": 291810 - }, - { - "epoch": 0.51, - "learning_rate": 2.4555049055340283e-05, - "loss": 2.3692, - "step": 291820 - }, - { - "epoch": 0.51, - "learning_rate": 2.4554177115413457e-05, - "loss": 2.3902, - "step": 291830 - }, - { - "epoch": 0.51, - "learning_rate": 2.4553305175486634e-05, - "loss": 2.3893, - "step": 291840 - }, - { - "epoch": 0.51, - "learning_rate": 2.4552433235559804e-05, - "loss": 2.4269, - "step": 291850 - }, - { - "epoch": 0.51, - "learning_rate": 2.4551561295632978e-05, - "loss": 2.341, - "step": 291860 - }, - { - "epoch": 0.51, - "learning_rate": 2.455068935570615e-05, - "loss": 2.3313, - "step": 291870 - }, - { - "epoch": 0.51, - "learning_rate": 2.4549817415779326e-05, - "loss": 2.297, - "step": 291880 - }, - { - "epoch": 0.51, - "learning_rate": 2.4548945475852496e-05, - "loss": 2.4171, - "step": 291890 - }, - { - "epoch": 0.51, - "learning_rate": 2.454807353592567e-05, - "loss": 2.3132, - "step": 291900 - }, - { - "epoch": 0.51, - "learning_rate": 2.4547201595998843e-05, - "loss": 2.322, - "step": 291910 - }, - { - "epoch": 0.51, - "learning_rate": 2.4546329656072017e-05, - "loss": 2.5412, - "step": 291920 - }, - { - "epoch": 0.51, - "learning_rate": 2.454545771614519e-05, - "loss": 2.3927, - "step": 291930 - }, - { - "epoch": 0.51, - "learning_rate": 2.454458577621836e-05, - "loss": 2.4048, - "step": 291940 - }, - { - "epoch": 0.51, - "learning_rate": 2.4543713836291535e-05, - "loss": 2.4649, - "step": 291950 - }, - { - "epoch": 0.51, - "learning_rate": 2.454284189636471e-05, - "loss": 2.3086, - "step": 291960 - }, - { - "epoch": 0.51, - "learning_rate": 2.4541969956437883e-05, - "loss": 2.3803, - "step": 291970 - }, - { - "epoch": 0.51, - "learning_rate": 2.4541098016511056e-05, - "loss": 2.4346, - "step": 291980 - }, - { - "epoch": 0.51, - "learning_rate": 2.454022607658423e-05, - "loss": 2.4019, - "step": 291990 - }, - { - "epoch": 0.51, - "learning_rate": 2.4539354136657404e-05, - "loss": 2.3897, - "step": 292000 - }, - { - "epoch": 0.51, - "learning_rate": 2.4538482196730574e-05, - "loss": 2.3577, - "step": 292010 - }, - { - "epoch": 0.51, - "learning_rate": 2.4537610256803748e-05, - "loss": 2.4484, - "step": 292020 - }, - { - "epoch": 0.51, - "learning_rate": 2.4536738316876922e-05, - "loss": 2.297, - "step": 292030 - }, - { - "epoch": 0.51, - "learning_rate": 2.4535866376950096e-05, - "loss": 2.3377, - "step": 292040 - }, - { - "epoch": 0.51, - "learning_rate": 2.4534994437023266e-05, - "loss": 2.3127, - "step": 292050 - }, - { - "epoch": 0.51, - "learning_rate": 2.453412249709644e-05, - "loss": 2.3641, - "step": 292060 - }, - { - "epoch": 0.51, - "learning_rate": 2.4533250557169614e-05, - "loss": 2.4897, - "step": 292070 - }, - { - "epoch": 0.51, - "learning_rate": 2.4532378617242787e-05, - "loss": 2.2379, - "step": 292080 - }, - { - "epoch": 0.51, - "learning_rate": 2.453150667731596e-05, - "loss": 2.3314, - "step": 292090 - }, - { - "epoch": 0.51, - "learning_rate": 2.453063473738913e-05, - "loss": 2.3591, - "step": 292100 - }, - { - "epoch": 0.51, - "learning_rate": 2.452976279746231e-05, - "loss": 2.3668, - "step": 292110 - }, - { - "epoch": 0.51, - "learning_rate": 2.452889085753548e-05, - "loss": 2.2555, - "step": 292120 - }, - { - "epoch": 0.51, - "learning_rate": 2.4528018917608653e-05, - "loss": 2.3345, - "step": 292130 - }, - { - "epoch": 0.51, - "learning_rate": 2.4527146977681827e-05, - "loss": 2.3736, - "step": 292140 - }, - { - "epoch": 0.51, - "learning_rate": 2.4526275037755e-05, - "loss": 2.339, - "step": 292150 - }, - { - "epoch": 0.51, - "learning_rate": 2.4525403097828174e-05, - "loss": 2.4087, - "step": 292160 - }, - { - "epoch": 0.51, - "learning_rate": 2.4524531157901345e-05, - "loss": 2.3367, - "step": 292170 - }, - { - "epoch": 0.51, - "learning_rate": 2.452365921797452e-05, - "loss": 2.4806, - "step": 292180 - }, - { - "epoch": 0.51, - "learning_rate": 2.4522787278047692e-05, - "loss": 2.409, - "step": 292190 - }, - { - "epoch": 0.51, - "learning_rate": 2.4521915338120866e-05, - "loss": 2.3904, - "step": 292200 - }, - { - "epoch": 0.51, - "learning_rate": 2.452104339819404e-05, - "loss": 2.3598, - "step": 292210 - }, - { - "epoch": 0.51, - "learning_rate": 2.4520171458267213e-05, - "loss": 2.3739, - "step": 292220 - }, - { - "epoch": 0.51, - "learning_rate": 2.4519299518340387e-05, - "loss": 2.4826, - "step": 292230 - }, - { - "epoch": 0.51, - "learning_rate": 2.4518427578413558e-05, - "loss": 2.4041, - "step": 292240 - }, - { - "epoch": 0.51, - "learning_rate": 2.4517555638486735e-05, - "loss": 2.3391, - "step": 292250 - }, - { - "epoch": 0.51, - "learning_rate": 2.4516683698559905e-05, - "loss": 2.3471, - "step": 292260 - }, - { - "epoch": 0.51, - "learning_rate": 2.451581175863308e-05, - "loss": 2.3205, - "step": 292270 - }, - { - "epoch": 0.51, - "learning_rate": 2.451493981870625e-05, - "loss": 2.3357, - "step": 292280 - }, - { - "epoch": 0.51, - "learning_rate": 2.4514067878779426e-05, - "loss": 2.3474, - "step": 292290 - }, - { - "epoch": 0.51, - "learning_rate": 2.4513195938852597e-05, - "loss": 2.3294, - "step": 292300 - }, - { - "epoch": 0.51, - "learning_rate": 2.451232399892577e-05, - "loss": 2.3465, - "step": 292310 - }, - { - "epoch": 0.51, - "learning_rate": 2.4511452058998944e-05, - "loss": 2.3982, - "step": 292320 - }, - { - "epoch": 0.51, - "learning_rate": 2.4510580119072118e-05, - "loss": 2.4064, - "step": 292330 - }, - { - "epoch": 0.51, - "learning_rate": 2.4509708179145292e-05, - "loss": 2.43, - "step": 292340 - }, - { - "epoch": 0.51, - "learning_rate": 2.4508836239218462e-05, - "loss": 2.4327, - "step": 292350 - }, - { - "epoch": 0.51, - "learning_rate": 2.4507964299291636e-05, - "loss": 2.36, - "step": 292360 - }, - { - "epoch": 0.51, - "learning_rate": 2.450709235936481e-05, - "loss": 2.3841, - "step": 292370 - }, - { - "epoch": 0.51, - "learning_rate": 2.4506220419437984e-05, - "loss": 2.4096, - "step": 292380 - }, - { - "epoch": 0.51, - "learning_rate": 2.4505348479511157e-05, - "loss": 2.3595, - "step": 292390 - }, - { - "epoch": 0.51, - "learning_rate": 2.450447653958433e-05, - "loss": 2.4283, - "step": 292400 - }, - { - "epoch": 0.51, - "learning_rate": 2.4503604599657505e-05, - "loss": 2.3807, - "step": 292410 - }, - { - "epoch": 0.51, - "learning_rate": 2.4502732659730675e-05, - "loss": 2.4203, - "step": 292420 - }, - { - "epoch": 0.51, - "learning_rate": 2.450186071980385e-05, - "loss": 2.4003, - "step": 292430 - }, - { - "epoch": 0.51, - "learning_rate": 2.4500988779877023e-05, - "loss": 2.4556, - "step": 292440 - }, - { - "epoch": 0.51, - "learning_rate": 2.4500116839950197e-05, - "loss": 2.3077, - "step": 292450 - }, - { - "epoch": 0.51, - "learning_rate": 2.449924490002337e-05, - "loss": 2.2988, - "step": 292460 - }, - { - "epoch": 0.51, - "learning_rate": 2.449837296009654e-05, - "loss": 2.3325, - "step": 292470 - }, - { - "epoch": 0.51, - "learning_rate": 2.4497501020169718e-05, - "loss": 2.3681, - "step": 292480 - }, - { - "epoch": 0.51, - "learning_rate": 2.4496629080242888e-05, - "loss": 2.3967, - "step": 292490 - }, - { - "epoch": 0.51, - "learning_rate": 2.4495757140316062e-05, - "loss": 2.3275, - "step": 292500 - }, - { - "epoch": 0.51, - "learning_rate": 2.4494885200389236e-05, - "loss": 2.4833, - "step": 292510 - }, - { - "epoch": 0.51, - "learning_rate": 2.449401326046241e-05, - "loss": 2.2228, - "step": 292520 - }, - { - "epoch": 0.51, - "learning_rate": 2.449314132053558e-05, - "loss": 2.5103, - "step": 292530 - }, - { - "epoch": 0.51, - "learning_rate": 2.4492269380608754e-05, - "loss": 2.3132, - "step": 292540 - }, - { - "epoch": 0.51, - "learning_rate": 2.4491397440681927e-05, - "loss": 2.3898, - "step": 292550 - }, - { - "epoch": 0.51, - "learning_rate": 2.44905255007551e-05, - "loss": 2.3695, - "step": 292560 - }, - { - "epoch": 0.51, - "learning_rate": 2.4489653560828275e-05, - "loss": 2.4344, - "step": 292570 - }, - { - "epoch": 0.51, - "learning_rate": 2.4488781620901445e-05, - "loss": 2.2135, - "step": 292580 - }, - { - "epoch": 0.51, - "learning_rate": 2.4487909680974623e-05, - "loss": 2.3976, - "step": 292590 - }, - { - "epoch": 0.51, - "learning_rate": 2.4487037741047793e-05, - "loss": 2.2533, - "step": 292600 - }, - { - "epoch": 0.51, - "learning_rate": 2.4486165801120967e-05, - "loss": 2.2601, - "step": 292610 - }, - { - "epoch": 0.51, - "learning_rate": 2.448529386119414e-05, - "loss": 2.4375, - "step": 292620 - }, - { - "epoch": 0.51, - "learning_rate": 2.4484421921267314e-05, - "loss": 2.3092, - "step": 292630 - }, - { - "epoch": 0.51, - "learning_rate": 2.4483549981340488e-05, - "loss": 2.2986, - "step": 292640 - }, - { - "epoch": 0.51, - "learning_rate": 2.448267804141366e-05, - "loss": 2.3482, - "step": 292650 - }, - { - "epoch": 0.51, - "learning_rate": 2.4481806101486836e-05, - "loss": 2.3616, - "step": 292660 - }, - { - "epoch": 0.51, - "learning_rate": 2.4480934161560006e-05, - "loss": 2.2953, - "step": 292670 - }, - { - "epoch": 0.51, - "learning_rate": 2.448006222163318e-05, - "loss": 2.4005, - "step": 292680 - }, - { - "epoch": 0.51, - "learning_rate": 2.447919028170635e-05, - "loss": 2.2635, - "step": 292690 - }, - { - "epoch": 0.51, - "learning_rate": 2.4478318341779527e-05, - "loss": 2.317, - "step": 292700 - }, - { - "epoch": 0.51, - "learning_rate": 2.44774464018527e-05, - "loss": 2.3954, - "step": 292710 - }, - { - "epoch": 0.51, - "learning_rate": 2.447657446192587e-05, - "loss": 2.3817, - "step": 292720 - }, - { - "epoch": 0.51, - "learning_rate": 2.4475702521999045e-05, - "loss": 2.4173, - "step": 292730 - }, - { - "epoch": 0.51, - "learning_rate": 2.447483058207222e-05, - "loss": 2.3736, - "step": 292740 - }, - { - "epoch": 0.51, - "learning_rate": 2.4473958642145393e-05, - "loss": 2.4292, - "step": 292750 - }, - { - "epoch": 0.51, - "learning_rate": 2.4473086702218563e-05, - "loss": 2.4628, - "step": 292760 - }, - { - "epoch": 0.51, - "learning_rate": 2.447221476229174e-05, - "loss": 2.35, - "step": 292770 - }, - { - "epoch": 0.51, - "learning_rate": 2.447134282236491e-05, - "loss": 2.178, - "step": 292780 - }, - { - "epoch": 0.51, - "learning_rate": 2.4470470882438084e-05, - "loss": 2.4586, - "step": 292790 - }, - { - "epoch": 0.51, - "learning_rate": 2.4469598942511258e-05, - "loss": 2.3446, - "step": 292800 - }, - { - "epoch": 0.51, - "learning_rate": 2.4468727002584432e-05, - "loss": 2.376, - "step": 292810 - }, - { - "epoch": 0.51, - "learning_rate": 2.4467855062657606e-05, - "loss": 2.2514, - "step": 292820 - }, - { - "epoch": 0.51, - "learning_rate": 2.4466983122730776e-05, - "loss": 2.3567, - "step": 292830 - }, - { - "epoch": 0.51, - "learning_rate": 2.446611118280395e-05, - "loss": 2.2891, - "step": 292840 - }, - { - "epoch": 0.51, - "learning_rate": 2.4465239242877124e-05, - "loss": 2.4358, - "step": 292850 - }, - { - "epoch": 0.51, - "learning_rate": 2.4464367302950297e-05, - "loss": 2.488, - "step": 292860 - }, - { - "epoch": 0.51, - "learning_rate": 2.446349536302347e-05, - "loss": 2.4034, - "step": 292870 - }, - { - "epoch": 0.51, - "learning_rate": 2.446262342309664e-05, - "loss": 2.4693, - "step": 292880 - }, - { - "epoch": 0.51, - "learning_rate": 2.446175148316982e-05, - "loss": 2.4359, - "step": 292890 - }, - { - "epoch": 0.51, - "learning_rate": 2.446087954324299e-05, - "loss": 2.3533, - "step": 292900 - }, - { - "epoch": 0.51, - "learning_rate": 2.4460007603316163e-05, - "loss": 2.5399, - "step": 292910 - }, - { - "epoch": 0.51, - "learning_rate": 2.4459135663389337e-05, - "loss": 2.3827, - "step": 292920 - }, - { - "epoch": 0.51, - "learning_rate": 2.445826372346251e-05, - "loss": 2.3981, - "step": 292930 - }, - { - "epoch": 0.51, - "learning_rate": 2.4457391783535684e-05, - "loss": 2.3174, - "step": 292940 - }, - { - "epoch": 0.51, - "learning_rate": 2.4456519843608855e-05, - "loss": 2.3619, - "step": 292950 - }, - { - "epoch": 0.51, - "learning_rate": 2.445564790368203e-05, - "loss": 2.4439, - "step": 292960 - }, - { - "epoch": 0.51, - "learning_rate": 2.4454775963755202e-05, - "loss": 2.3195, - "step": 292970 - }, - { - "epoch": 0.51, - "learning_rate": 2.4453904023828376e-05, - "loss": 2.391, - "step": 292980 - }, - { - "epoch": 0.51, - "learning_rate": 2.4453032083901546e-05, - "loss": 2.1927, - "step": 292990 - }, - { - "epoch": 0.51, - "learning_rate": 2.4452160143974723e-05, - "loss": 2.4358, - "step": 293000 - }, - { - "epoch": 0.51, - "learning_rate": 2.4451288204047894e-05, - "loss": 2.3245, - "step": 293010 - }, - { - "epoch": 0.51, - "learning_rate": 2.4450416264121068e-05, - "loss": 2.4803, - "step": 293020 - }, - { - "epoch": 0.51, - "learning_rate": 2.444954432419424e-05, - "loss": 2.3618, - "step": 293030 - }, - { - "epoch": 0.51, - "learning_rate": 2.4448672384267415e-05, - "loss": 2.3453, - "step": 293040 - }, - { - "epoch": 0.51, - "learning_rate": 2.444780044434059e-05, - "loss": 2.3555, - "step": 293050 - }, - { - "epoch": 0.51, - "learning_rate": 2.444692850441376e-05, - "loss": 2.3378, - "step": 293060 - }, - { - "epoch": 0.51, - "learning_rate": 2.4446056564486936e-05, - "loss": 2.3807, - "step": 293070 - }, - { - "epoch": 0.51, - "learning_rate": 2.4445184624560107e-05, - "loss": 2.36, - "step": 293080 - }, - { - "epoch": 0.51, - "learning_rate": 2.444431268463328e-05, - "loss": 2.3589, - "step": 293090 - }, - { - "epoch": 0.51, - "learning_rate": 2.4443440744706454e-05, - "loss": 2.3427, - "step": 293100 - }, - { - "epoch": 0.51, - "learning_rate": 2.4442568804779628e-05, - "loss": 2.3045, - "step": 293110 - }, - { - "epoch": 0.51, - "learning_rate": 2.4441696864852802e-05, - "loss": 2.3685, - "step": 293120 - }, - { - "epoch": 0.51, - "learning_rate": 2.4440824924925972e-05, - "loss": 2.3765, - "step": 293130 - }, - { - "epoch": 0.51, - "learning_rate": 2.4439952984999146e-05, - "loss": 2.4848, - "step": 293140 - }, - { - "epoch": 0.51, - "learning_rate": 2.443908104507232e-05, - "loss": 2.3953, - "step": 293150 - }, - { - "epoch": 0.51, - "learning_rate": 2.4438209105145494e-05, - "loss": 2.3476, - "step": 293160 - }, - { - "epoch": 0.51, - "learning_rate": 2.4437337165218664e-05, - "loss": 2.2844, - "step": 293170 - }, - { - "epoch": 0.51, - "learning_rate": 2.443646522529184e-05, - "loss": 2.26, - "step": 293180 - }, - { - "epoch": 0.51, - "learning_rate": 2.4435593285365015e-05, - "loss": 2.4091, - "step": 293190 - }, - { - "epoch": 0.51, - "learning_rate": 2.4434721345438185e-05, - "loss": 2.3181, - "step": 293200 - }, - { - "epoch": 0.51, - "learning_rate": 2.443384940551136e-05, - "loss": 2.3653, - "step": 293210 - }, - { - "epoch": 0.51, - "learning_rate": 2.4432977465584533e-05, - "loss": 2.3879, - "step": 293220 - }, - { - "epoch": 0.51, - "learning_rate": 2.4432105525657707e-05, - "loss": 2.3799, - "step": 293230 - }, - { - "epoch": 0.51, - "learning_rate": 2.4431233585730877e-05, - "loss": 2.2191, - "step": 293240 - }, - { - "epoch": 0.51, - "learning_rate": 2.443036164580405e-05, - "loss": 2.3914, - "step": 293250 - }, - { - "epoch": 0.51, - "learning_rate": 2.4429489705877224e-05, - "loss": 2.2835, - "step": 293260 - }, - { - "epoch": 0.51, - "learning_rate": 2.4428617765950398e-05, - "loss": 2.4139, - "step": 293270 - }, - { - "epoch": 0.51, - "learning_rate": 2.4427745826023572e-05, - "loss": 2.3899, - "step": 293280 - }, - { - "epoch": 0.51, - "learning_rate": 2.4426873886096742e-05, - "loss": 2.4091, - "step": 293290 - }, - { - "epoch": 0.51, - "learning_rate": 2.442600194616992e-05, - "loss": 2.3656, - "step": 293300 - }, - { - "epoch": 0.51, - "learning_rate": 2.442513000624309e-05, - "loss": 2.3877, - "step": 293310 - }, - { - "epoch": 0.51, - "learning_rate": 2.4424258066316264e-05, - "loss": 2.2914, - "step": 293320 - }, - { - "epoch": 0.51, - "learning_rate": 2.4423386126389437e-05, - "loss": 2.3138, - "step": 293330 - }, - { - "epoch": 0.51, - "learning_rate": 2.442251418646261e-05, - "loss": 2.3753, - "step": 293340 - }, - { - "epoch": 0.51, - "learning_rate": 2.4421642246535785e-05, - "loss": 2.4282, - "step": 293350 - }, - { - "epoch": 0.51, - "learning_rate": 2.4420770306608955e-05, - "loss": 2.4263, - "step": 293360 - }, - { - "epoch": 0.51, - "learning_rate": 2.4419898366682133e-05, - "loss": 2.3755, - "step": 293370 - }, - { - "epoch": 0.51, - "learning_rate": 2.4419026426755303e-05, - "loss": 2.4155, - "step": 293380 - }, - { - "epoch": 0.51, - "learning_rate": 2.4418154486828477e-05, - "loss": 2.3003, - "step": 293390 - }, - { - "epoch": 0.51, - "learning_rate": 2.4417282546901647e-05, - "loss": 2.3015, - "step": 293400 - }, - { - "epoch": 0.51, - "learning_rate": 2.4416410606974824e-05, - "loss": 2.2976, - "step": 293410 - }, - { - "epoch": 0.51, - "learning_rate": 2.4415538667047995e-05, - "loss": 2.4048, - "step": 293420 - }, - { - "epoch": 0.51, - "learning_rate": 2.441466672712117e-05, - "loss": 2.204, - "step": 293430 - }, - { - "epoch": 0.51, - "learning_rate": 2.4413794787194346e-05, - "loss": 2.2934, - "step": 293440 - }, - { - "epoch": 0.51, - "learning_rate": 2.4412922847267516e-05, - "loss": 2.4056, - "step": 293450 - }, - { - "epoch": 0.51, - "learning_rate": 2.441205090734069e-05, - "loss": 2.356, - "step": 293460 - }, - { - "epoch": 0.51, - "learning_rate": 2.441117896741386e-05, - "loss": 2.2916, - "step": 293470 - }, - { - "epoch": 0.51, - "learning_rate": 2.4410307027487037e-05, - "loss": 2.39, - "step": 293480 - }, - { - "epoch": 0.51, - "learning_rate": 2.4409435087560208e-05, - "loss": 2.4137, - "step": 293490 - }, - { - "epoch": 0.51, - "learning_rate": 2.440856314763338e-05, - "loss": 2.4188, - "step": 293500 - }, - { - "epoch": 0.51, - "learning_rate": 2.4407691207706555e-05, - "loss": 2.3316, - "step": 293510 - }, - { - "epoch": 0.51, - "learning_rate": 2.440681926777973e-05, - "loss": 2.4288, - "step": 293520 - }, - { - "epoch": 0.51, - "learning_rate": 2.4405947327852903e-05, - "loss": 2.3076, - "step": 293530 - }, - { - "epoch": 0.51, - "learning_rate": 2.4405075387926073e-05, - "loss": 2.3884, - "step": 293540 - }, - { - "epoch": 0.51, - "learning_rate": 2.4404203447999247e-05, - "loss": 2.3742, - "step": 293550 - }, - { - "epoch": 0.51, - "learning_rate": 2.440333150807242e-05, - "loss": 2.3581, - "step": 293560 - }, - { - "epoch": 0.51, - "learning_rate": 2.4402459568145594e-05, - "loss": 2.3868, - "step": 293570 - }, - { - "epoch": 0.51, - "learning_rate": 2.4401587628218768e-05, - "loss": 2.3257, - "step": 293580 - }, - { - "epoch": 0.51, - "learning_rate": 2.4400715688291942e-05, - "loss": 2.3963, - "step": 293590 - }, - { - "epoch": 0.51, - "learning_rate": 2.4399843748365116e-05, - "loss": 2.4203, - "step": 293600 - }, - { - "epoch": 0.51, - "learning_rate": 2.4398971808438286e-05, - "loss": 2.3502, - "step": 293610 - }, - { - "epoch": 0.51, - "learning_rate": 2.439809986851146e-05, - "loss": 2.3056, - "step": 293620 - }, - { - "epoch": 0.51, - "learning_rate": 2.4397227928584634e-05, - "loss": 2.2855, - "step": 293630 - }, - { - "epoch": 0.51, - "learning_rate": 2.4396355988657807e-05, - "loss": 2.2872, - "step": 293640 - }, - { - "epoch": 0.51, - "learning_rate": 2.4395484048730978e-05, - "loss": 2.3805, - "step": 293650 - }, - { - "epoch": 0.51, - "learning_rate": 2.439461210880415e-05, - "loss": 2.2937, - "step": 293660 - }, - { - "epoch": 0.51, - "learning_rate": 2.439374016887733e-05, - "loss": 2.3208, - "step": 293670 - }, - { - "epoch": 0.51, - "learning_rate": 2.43928682289505e-05, - "loss": 2.2662, - "step": 293680 - }, - { - "epoch": 0.51, - "learning_rate": 2.4391996289023673e-05, - "loss": 2.295, - "step": 293690 - }, - { - "epoch": 0.51, - "learning_rate": 2.4391124349096843e-05, - "loss": 2.4106, - "step": 293700 - }, - { - "epoch": 0.51, - "learning_rate": 2.439025240917002e-05, - "loss": 2.3386, - "step": 293710 - }, - { - "epoch": 0.51, - "learning_rate": 2.438938046924319e-05, - "loss": 2.3495, - "step": 293720 - }, - { - "epoch": 0.51, - "learning_rate": 2.4388508529316365e-05, - "loss": 2.3207, - "step": 293730 - }, - { - "epoch": 0.51, - "learning_rate": 2.438763658938954e-05, - "loss": 2.4888, - "step": 293740 - }, - { - "epoch": 0.51, - "learning_rate": 2.4386764649462712e-05, - "loss": 2.3417, - "step": 293750 - }, - { - "epoch": 0.51, - "learning_rate": 2.4385892709535886e-05, - "loss": 2.2301, - "step": 293760 - }, - { - "epoch": 0.51, - "learning_rate": 2.4385020769609056e-05, - "loss": 2.4015, - "step": 293770 - }, - { - "epoch": 0.51, - "learning_rate": 2.4384148829682233e-05, - "loss": 2.4186, - "step": 293780 - }, - { - "epoch": 0.51, - "learning_rate": 2.4383276889755404e-05, - "loss": 2.3458, - "step": 293790 - }, - { - "epoch": 0.51, - "learning_rate": 2.4382404949828578e-05, - "loss": 2.3081, - "step": 293800 - }, - { - "epoch": 0.51, - "learning_rate": 2.438153300990175e-05, - "loss": 2.4744, - "step": 293810 - }, - { - "epoch": 0.51, - "learning_rate": 2.4380661069974925e-05, - "loss": 2.5508, - "step": 293820 - }, - { - "epoch": 0.51, - "learning_rate": 2.43797891300481e-05, - "loss": 2.4502, - "step": 293830 - }, - { - "epoch": 0.51, - "learning_rate": 2.437891719012127e-05, - "loss": 2.3643, - "step": 293840 - }, - { - "epoch": 0.51, - "learning_rate": 2.4378045250194446e-05, - "loss": 2.3866, - "step": 293850 - }, - { - "epoch": 0.51, - "learning_rate": 2.4377173310267617e-05, - "loss": 2.4414, - "step": 293860 - }, - { - "epoch": 0.51, - "learning_rate": 2.437630137034079e-05, - "loss": 2.3815, - "step": 293870 - }, - { - "epoch": 0.51, - "learning_rate": 2.437542943041396e-05, - "loss": 2.4083, - "step": 293880 - }, - { - "epoch": 0.51, - "learning_rate": 2.4374557490487138e-05, - "loss": 2.4427, - "step": 293890 - }, - { - "epoch": 0.51, - "learning_rate": 2.437368555056031e-05, - "loss": 2.3605, - "step": 293900 - }, - { - "epoch": 0.51, - "learning_rate": 2.4372813610633482e-05, - "loss": 2.3417, - "step": 293910 - }, - { - "epoch": 0.51, - "learning_rate": 2.4371941670706656e-05, - "loss": 2.3296, - "step": 293920 - }, - { - "epoch": 0.51, - "learning_rate": 2.437106973077983e-05, - "loss": 2.3687, - "step": 293930 - }, - { - "epoch": 0.51, - "learning_rate": 2.4370197790853004e-05, - "loss": 2.3422, - "step": 293940 - }, - { - "epoch": 0.51, - "learning_rate": 2.4369325850926174e-05, - "loss": 2.3847, - "step": 293950 - }, - { - "epoch": 0.51, - "learning_rate": 2.4368453910999348e-05, - "loss": 2.3577, - "step": 293960 - }, - { - "epoch": 0.51, - "learning_rate": 2.436758197107252e-05, - "loss": 2.3421, - "step": 293970 - }, - { - "epoch": 0.51, - "learning_rate": 2.4366710031145695e-05, - "loss": 2.1912, - "step": 293980 - }, - { - "epoch": 0.51, - "learning_rate": 2.436583809121887e-05, - "loss": 2.3589, - "step": 293990 - }, - { - "epoch": 0.51, - "learning_rate": 2.4364966151292043e-05, - "loss": 2.3521, - "step": 294000 - }, - { - "epoch": 0.51, - "learning_rate": 2.4364094211365217e-05, - "loss": 2.3625, - "step": 294010 - }, - { - "epoch": 0.51, - "learning_rate": 2.4363222271438387e-05, - "loss": 2.3814, - "step": 294020 - }, - { - "epoch": 0.51, - "learning_rate": 2.436235033151156e-05, - "loss": 2.3563, - "step": 294030 - }, - { - "epoch": 0.51, - "learning_rate": 2.4361478391584734e-05, - "loss": 2.4355, - "step": 294040 - }, - { - "epoch": 0.51, - "learning_rate": 2.4360606451657908e-05, - "loss": 2.4159, - "step": 294050 - }, - { - "epoch": 0.51, - "learning_rate": 2.4359734511731082e-05, - "loss": 2.2859, - "step": 294060 - }, - { - "epoch": 0.51, - "learning_rate": 2.4358862571804252e-05, - "loss": 2.3, - "step": 294070 - }, - { - "epoch": 0.51, - "learning_rate": 2.435799063187743e-05, - "loss": 2.3573, - "step": 294080 - }, - { - "epoch": 0.51, - "learning_rate": 2.43571186919506e-05, - "loss": 2.3259, - "step": 294090 - }, - { - "epoch": 0.51, - "learning_rate": 2.4356246752023774e-05, - "loss": 2.3747, - "step": 294100 - }, - { - "epoch": 0.51, - "learning_rate": 2.4355374812096947e-05, - "loss": 2.4093, - "step": 294110 - }, - { - "epoch": 0.51, - "learning_rate": 2.435450287217012e-05, - "loss": 2.257, - "step": 294120 - }, - { - "epoch": 0.51, - "learning_rate": 2.435363093224329e-05, - "loss": 2.3075, - "step": 294130 - }, - { - "epoch": 0.51, - "learning_rate": 2.4352758992316465e-05, - "loss": 2.3553, - "step": 294140 - }, - { - "epoch": 0.51, - "learning_rate": 2.435188705238964e-05, - "loss": 2.2786, - "step": 294150 - }, - { - "epoch": 0.51, - "learning_rate": 2.4351015112462813e-05, - "loss": 2.3413, - "step": 294160 - }, - { - "epoch": 0.51, - "learning_rate": 2.4350143172535987e-05, - "loss": 2.3248, - "step": 294170 - }, - { - "epoch": 0.51, - "learning_rate": 2.4349271232609157e-05, - "loss": 2.3914, - "step": 294180 - }, - { - "epoch": 0.51, - "learning_rate": 2.4348399292682334e-05, - "loss": 2.3462, - "step": 294190 - }, - { - "epoch": 0.51, - "learning_rate": 2.4347527352755505e-05, - "loss": 2.33, - "step": 294200 - }, - { - "epoch": 0.51, - "learning_rate": 2.434665541282868e-05, - "loss": 2.2559, - "step": 294210 - }, - { - "epoch": 0.51, - "learning_rate": 2.4345783472901852e-05, - "loss": 2.3316, - "step": 294220 - }, - { - "epoch": 0.51, - "learning_rate": 2.4344911532975026e-05, - "loss": 2.3944, - "step": 294230 - }, - { - "epoch": 0.51, - "learning_rate": 2.43440395930482e-05, - "loss": 2.3816, - "step": 294240 - }, - { - "epoch": 0.51, - "learning_rate": 2.434316765312137e-05, - "loss": 2.3007, - "step": 294250 - }, - { - "epoch": 0.51, - "learning_rate": 2.4342295713194547e-05, - "loss": 2.3198, - "step": 294260 - }, - { - "epoch": 0.51, - "learning_rate": 2.4341423773267718e-05, - "loss": 2.4708, - "step": 294270 - }, - { - "epoch": 0.51, - "learning_rate": 2.434055183334089e-05, - "loss": 2.4152, - "step": 294280 - }, - { - "epoch": 0.51, - "learning_rate": 2.4339679893414065e-05, - "loss": 2.3169, - "step": 294290 - }, - { - "epoch": 0.51, - "learning_rate": 2.433880795348724e-05, - "loss": 2.3659, - "step": 294300 - }, - { - "epoch": 0.51, - "learning_rate": 2.4337936013560413e-05, - "loss": 2.4175, - "step": 294310 - }, - { - "epoch": 0.51, - "learning_rate": 2.4337064073633583e-05, - "loss": 2.3175, - "step": 294320 - }, - { - "epoch": 0.51, - "learning_rate": 2.4336192133706757e-05, - "loss": 2.3101, - "step": 294330 - }, - { - "epoch": 0.51, - "learning_rate": 2.433532019377993e-05, - "loss": 2.4071, - "step": 294340 - }, - { - "epoch": 0.51, - "learning_rate": 2.4334448253853104e-05, - "loss": 2.3313, - "step": 294350 - }, - { - "epoch": 0.51, - "learning_rate": 2.4333576313926275e-05, - "loss": 2.4011, - "step": 294360 - }, - { - "epoch": 0.51, - "learning_rate": 2.4332704373999452e-05, - "loss": 2.3934, - "step": 294370 - }, - { - "epoch": 0.51, - "learning_rate": 2.4331832434072622e-05, - "loss": 2.3892, - "step": 294380 - }, - { - "epoch": 0.51, - "learning_rate": 2.4330960494145796e-05, - "loss": 2.3352, - "step": 294390 - }, - { - "epoch": 0.51, - "learning_rate": 2.433008855421897e-05, - "loss": 2.345, - "step": 294400 - }, - { - "epoch": 0.51, - "learning_rate": 2.4329216614292144e-05, - "loss": 2.4206, - "step": 294410 - }, - { - "epoch": 0.51, - "learning_rate": 2.4328344674365317e-05, - "loss": 2.3137, - "step": 294420 - }, - { - "epoch": 0.51, - "learning_rate": 2.4327472734438488e-05, - "loss": 2.4247, - "step": 294430 - }, - { - "epoch": 0.51, - "learning_rate": 2.432660079451166e-05, - "loss": 2.4007, - "step": 294440 - }, - { - "epoch": 0.51, - "learning_rate": 2.4325728854584835e-05, - "loss": 2.2474, - "step": 294450 - }, - { - "epoch": 0.51, - "learning_rate": 2.432485691465801e-05, - "loss": 2.4126, - "step": 294460 - }, - { - "epoch": 0.51, - "learning_rate": 2.4323984974731183e-05, - "loss": 2.2271, - "step": 294470 - }, - { - "epoch": 0.51, - "learning_rate": 2.4323113034804353e-05, - "loss": 2.4587, - "step": 294480 - }, - { - "epoch": 0.51, - "learning_rate": 2.432224109487753e-05, - "loss": 2.3741, - "step": 294490 - }, - { - "epoch": 0.51, - "learning_rate": 2.43213691549507e-05, - "loss": 2.3865, - "step": 294500 - }, - { - "epoch": 0.51, - "learning_rate": 2.4320497215023875e-05, - "loss": 2.3469, - "step": 294510 - }, - { - "epoch": 0.51, - "learning_rate": 2.431962527509705e-05, - "loss": 2.4668, - "step": 294520 - }, - { - "epoch": 0.51, - "learning_rate": 2.4318753335170222e-05, - "loss": 2.2556, - "step": 294530 - }, - { - "epoch": 0.51, - "learning_rate": 2.4317881395243396e-05, - "loss": 2.427, - "step": 294540 - }, - { - "epoch": 0.51, - "learning_rate": 2.4317009455316566e-05, - "loss": 2.4085, - "step": 294550 - }, - { - "epoch": 0.51, - "learning_rate": 2.4316137515389743e-05, - "loss": 2.2341, - "step": 294560 - }, - { - "epoch": 0.51, - "learning_rate": 2.4315265575462914e-05, - "loss": 2.2077, - "step": 294570 - }, - { - "epoch": 0.51, - "learning_rate": 2.4314393635536088e-05, - "loss": 2.272, - "step": 294580 - }, - { - "epoch": 0.51, - "learning_rate": 2.4313521695609258e-05, - "loss": 2.4181, - "step": 294590 - }, - { - "epoch": 0.51, - "learning_rate": 2.4312649755682435e-05, - "loss": 2.4314, - "step": 294600 - }, - { - "epoch": 0.51, - "learning_rate": 2.4311777815755605e-05, - "loss": 2.3632, - "step": 294610 - }, - { - "epoch": 0.51, - "learning_rate": 2.431090587582878e-05, - "loss": 2.2815, - "step": 294620 - }, - { - "epoch": 0.51, - "learning_rate": 2.4310033935901953e-05, - "loss": 2.3291, - "step": 294630 - }, - { - "epoch": 0.51, - "learning_rate": 2.4309161995975127e-05, - "loss": 2.3784, - "step": 294640 - }, - { - "epoch": 0.51, - "learning_rate": 2.43082900560483e-05, - "loss": 2.3663, - "step": 294650 - }, - { - "epoch": 0.51, - "learning_rate": 2.430741811612147e-05, - "loss": 2.2887, - "step": 294660 - }, - { - "epoch": 0.51, - "learning_rate": 2.4306546176194648e-05, - "loss": 2.3531, - "step": 294670 - }, - { - "epoch": 0.51, - "learning_rate": 2.430567423626782e-05, - "loss": 2.3348, - "step": 294680 - }, - { - "epoch": 0.51, - "learning_rate": 2.4304802296340992e-05, - "loss": 2.4173, - "step": 294690 - }, - { - "epoch": 0.51, - "learning_rate": 2.4303930356414166e-05, - "loss": 2.3965, - "step": 294700 - }, - { - "epoch": 0.51, - "learning_rate": 2.430305841648734e-05, - "loss": 2.2771, - "step": 294710 - }, - { - "epoch": 0.51, - "learning_rate": 2.4302186476560514e-05, - "loss": 2.2864, - "step": 294720 - }, - { - "epoch": 0.51, - "learning_rate": 2.4301314536633684e-05, - "loss": 2.3188, - "step": 294730 - }, - { - "epoch": 0.51, - "learning_rate": 2.4300442596706858e-05, - "loss": 2.302, - "step": 294740 - }, - { - "epoch": 0.51, - "learning_rate": 2.429957065678003e-05, - "loss": 2.4366, - "step": 294750 - }, - { - "epoch": 0.51, - "learning_rate": 2.4298698716853205e-05, - "loss": 2.379, - "step": 294760 - }, - { - "epoch": 0.51, - "learning_rate": 2.429782677692638e-05, - "loss": 2.3621, - "step": 294770 - }, - { - "epoch": 0.51, - "learning_rate": 2.4296954836999553e-05, - "loss": 2.3967, - "step": 294780 - }, - { - "epoch": 0.51, - "learning_rate": 2.4296082897072727e-05, - "loss": 2.286, - "step": 294790 - }, - { - "epoch": 0.51, - "learning_rate": 2.4295210957145897e-05, - "loss": 2.378, - "step": 294800 - }, - { - "epoch": 0.51, - "learning_rate": 2.429433901721907e-05, - "loss": 2.2571, - "step": 294810 - }, - { - "epoch": 0.51, - "learning_rate": 2.4293467077292244e-05, - "loss": 2.3375, - "step": 294820 - }, - { - "epoch": 0.51, - "learning_rate": 2.4292595137365418e-05, - "loss": 2.4127, - "step": 294830 - }, - { - "epoch": 0.51, - "learning_rate": 2.429172319743859e-05, - "loss": 2.3337, - "step": 294840 - }, - { - "epoch": 0.51, - "learning_rate": 2.4290851257511762e-05, - "loss": 2.4333, - "step": 294850 - }, - { - "epoch": 0.51, - "learning_rate": 2.4289979317584936e-05, - "loss": 2.3955, - "step": 294860 - }, - { - "epoch": 0.51, - "learning_rate": 2.428910737765811e-05, - "loss": 2.3698, - "step": 294870 - }, - { - "epoch": 0.51, - "learning_rate": 2.4288235437731284e-05, - "loss": 2.345, - "step": 294880 - }, - { - "epoch": 0.51, - "learning_rate": 2.4287363497804454e-05, - "loss": 2.494, - "step": 294890 - }, - { - "epoch": 0.51, - "learning_rate": 2.428649155787763e-05, - "loss": 2.2505, - "step": 294900 - }, - { - "epoch": 0.51, - "learning_rate": 2.42856196179508e-05, - "loss": 2.3602, - "step": 294910 - }, - { - "epoch": 0.51, - "learning_rate": 2.4284747678023975e-05, - "loss": 2.2915, - "step": 294920 - }, - { - "epoch": 0.51, - "learning_rate": 2.428387573809715e-05, - "loss": 2.4685, - "step": 294930 - }, - { - "epoch": 0.51, - "learning_rate": 2.4283003798170323e-05, - "loss": 2.4712, - "step": 294940 - }, - { - "epoch": 0.51, - "learning_rate": 2.4282131858243497e-05, - "loss": 2.4043, - "step": 294950 - }, - { - "epoch": 0.51, - "learning_rate": 2.4281259918316667e-05, - "loss": 2.3163, - "step": 294960 - }, - { - "epoch": 0.51, - "learning_rate": 2.4280387978389844e-05, - "loss": 2.3468, - "step": 294970 - }, - { - "epoch": 0.51, - "learning_rate": 2.4279516038463015e-05, - "loss": 2.358, - "step": 294980 - }, - { - "epoch": 0.51, - "learning_rate": 2.427864409853619e-05, - "loss": 2.2489, - "step": 294990 - }, - { - "epoch": 0.51, - "learning_rate": 2.427777215860936e-05, - "loss": 2.5064, - "step": 295000 - }, - { - "epoch": 0.51, - "learning_rate": 2.4276900218682536e-05, - "loss": 2.4526, - "step": 295010 - }, - { - "epoch": 0.51, - "learning_rate": 2.427602827875571e-05, - "loss": 2.2351, - "step": 295020 - }, - { - "epoch": 0.51, - "learning_rate": 2.427515633882888e-05, - "loss": 2.2259, - "step": 295030 - }, - { - "epoch": 0.51, - "learning_rate": 2.4274284398902057e-05, - "loss": 2.4917, - "step": 295040 - }, - { - "epoch": 0.51, - "learning_rate": 2.4273412458975228e-05, - "loss": 2.2773, - "step": 295050 - }, - { - "epoch": 0.51, - "learning_rate": 2.42725405190484e-05, - "loss": 2.3175, - "step": 295060 - }, - { - "epoch": 0.51, - "learning_rate": 2.4271668579121572e-05, - "loss": 2.3784, - "step": 295070 - }, - { - "epoch": 0.51, - "learning_rate": 2.427079663919475e-05, - "loss": 2.273, - "step": 295080 - }, - { - "epoch": 0.51, - "learning_rate": 2.426992469926792e-05, - "loss": 2.4423, - "step": 295090 - }, - { - "epoch": 0.51, - "learning_rate": 2.4269052759341093e-05, - "loss": 2.2985, - "step": 295100 - }, - { - "epoch": 0.51, - "learning_rate": 2.4268180819414267e-05, - "loss": 2.369, - "step": 295110 - }, - { - "epoch": 0.51, - "learning_rate": 2.426730887948744e-05, - "loss": 2.2971, - "step": 295120 - }, - { - "epoch": 0.51, - "learning_rate": 2.4266436939560614e-05, - "loss": 2.3704, - "step": 295130 - }, - { - "epoch": 0.51, - "learning_rate": 2.4265564999633785e-05, - "loss": 2.3631, - "step": 295140 - }, - { - "epoch": 0.51, - "learning_rate": 2.426469305970696e-05, - "loss": 2.4548, - "step": 295150 - }, - { - "epoch": 0.51, - "learning_rate": 2.4263821119780132e-05, - "loss": 2.3596, - "step": 295160 - }, - { - "epoch": 0.51, - "learning_rate": 2.4262949179853306e-05, - "loss": 2.393, - "step": 295170 - }, - { - "epoch": 0.51, - "learning_rate": 2.426207723992648e-05, - "loss": 2.449, - "step": 295180 - }, - { - "epoch": 0.51, - "learning_rate": 2.4261205299999654e-05, - "loss": 2.3407, - "step": 295190 - }, - { - "epoch": 0.51, - "learning_rate": 2.4260333360072827e-05, - "loss": 2.3338, - "step": 295200 - }, - { - "epoch": 0.51, - "learning_rate": 2.4259461420145998e-05, - "loss": 2.2596, - "step": 295210 - }, - { - "epoch": 0.51, - "learning_rate": 2.425858948021917e-05, - "loss": 2.3164, - "step": 295220 - }, - { - "epoch": 0.51, - "learning_rate": 2.4257717540292345e-05, - "loss": 2.1746, - "step": 295230 - }, - { - "epoch": 0.51, - "learning_rate": 2.425684560036552e-05, - "loss": 2.3627, - "step": 295240 - }, - { - "epoch": 0.51, - "learning_rate": 2.425597366043869e-05, - "loss": 2.4099, - "step": 295250 - }, - { - "epoch": 0.51, - "learning_rate": 2.4255101720511863e-05, - "loss": 2.3606, - "step": 295260 - }, - { - "epoch": 0.51, - "learning_rate": 2.425422978058504e-05, - "loss": 2.3796, - "step": 295270 - }, - { - "epoch": 0.51, - "learning_rate": 2.425335784065821e-05, - "loss": 2.43, - "step": 295280 - }, - { - "epoch": 0.51, - "learning_rate": 2.4252485900731385e-05, - "loss": 2.2416, - "step": 295290 - }, - { - "epoch": 0.51, - "learning_rate": 2.425161396080456e-05, - "loss": 2.371, - "step": 295300 - }, - { - "epoch": 0.51, - "learning_rate": 2.4250742020877732e-05, - "loss": 2.3468, - "step": 295310 - }, - { - "epoch": 0.52, - "learning_rate": 2.4249870080950902e-05, - "loss": 2.397, - "step": 295320 - }, - { - "epoch": 0.52, - "learning_rate": 2.4248998141024076e-05, - "loss": 2.3506, - "step": 295330 - }, - { - "epoch": 0.52, - "learning_rate": 2.424812620109725e-05, - "loss": 2.362, - "step": 295340 - }, - { - "epoch": 0.52, - "learning_rate": 2.4247254261170424e-05, - "loss": 2.3848, - "step": 295350 - }, - { - "epoch": 0.52, - "learning_rate": 2.4246382321243598e-05, - "loss": 2.4137, - "step": 295360 - }, - { - "epoch": 0.52, - "learning_rate": 2.4245510381316768e-05, - "loss": 2.4302, - "step": 295370 - }, - { - "epoch": 0.52, - "learning_rate": 2.4244638441389945e-05, - "loss": 2.3109, - "step": 295380 - }, - { - "epoch": 0.52, - "learning_rate": 2.4243766501463115e-05, - "loss": 2.3739, - "step": 295390 - }, - { - "epoch": 0.52, - "learning_rate": 2.424289456153629e-05, - "loss": 2.49, - "step": 295400 - }, - { - "epoch": 0.52, - "learning_rate": 2.4242022621609463e-05, - "loss": 2.3198, - "step": 295410 - }, - { - "epoch": 0.52, - "learning_rate": 2.4241150681682637e-05, - "loss": 2.3873, - "step": 295420 - }, - { - "epoch": 0.52, - "learning_rate": 2.424027874175581e-05, - "loss": 2.348, - "step": 295430 - }, - { - "epoch": 0.52, - "learning_rate": 2.423940680182898e-05, - "loss": 2.407, - "step": 295440 - }, - { - "epoch": 0.52, - "learning_rate": 2.4238534861902158e-05, - "loss": 2.3074, - "step": 295450 - }, - { - "epoch": 0.52, - "learning_rate": 2.423766292197533e-05, - "loss": 2.3515, - "step": 295460 - }, - { - "epoch": 0.52, - "learning_rate": 2.4236790982048502e-05, - "loss": 2.2991, - "step": 295470 - }, - { - "epoch": 0.52, - "learning_rate": 2.4235919042121673e-05, - "loss": 2.3571, - "step": 295480 - }, - { - "epoch": 0.52, - "learning_rate": 2.423504710219485e-05, - "loss": 2.4773, - "step": 295490 - }, - { - "epoch": 0.52, - "learning_rate": 2.4234175162268024e-05, - "loss": 2.319, - "step": 295500 - }, - { - "epoch": 0.52, - "learning_rate": 2.4233303222341194e-05, - "loss": 2.3215, - "step": 295510 - }, - { - "epoch": 0.52, - "learning_rate": 2.4232431282414368e-05, - "loss": 2.3969, - "step": 295520 - }, - { - "epoch": 0.52, - "learning_rate": 2.423155934248754e-05, - "loss": 2.3433, - "step": 295530 - }, - { - "epoch": 0.52, - "learning_rate": 2.4230687402560715e-05, - "loss": 2.3224, - "step": 295540 - }, - { - "epoch": 0.52, - "learning_rate": 2.4229815462633886e-05, - "loss": 2.4313, - "step": 295550 - }, - { - "epoch": 0.52, - "learning_rate": 2.422894352270706e-05, - "loss": 2.3733, - "step": 295560 - }, - { - "epoch": 0.52, - "learning_rate": 2.4228071582780233e-05, - "loss": 2.3426, - "step": 295570 - }, - { - "epoch": 0.52, - "learning_rate": 2.4227199642853407e-05, - "loss": 2.2331, - "step": 295580 - }, - { - "epoch": 0.52, - "learning_rate": 2.422632770292658e-05, - "loss": 2.3389, - "step": 295590 - }, - { - "epoch": 0.52, - "learning_rate": 2.4225455762999754e-05, - "loss": 2.2931, - "step": 295600 - }, - { - "epoch": 0.52, - "learning_rate": 2.4224583823072928e-05, - "loss": 2.319, - "step": 295610 - }, - { - "epoch": 0.52, - "learning_rate": 2.42237118831461e-05, - "loss": 2.412, - "step": 295620 - }, - { - "epoch": 0.52, - "learning_rate": 2.4222839943219272e-05, - "loss": 2.3956, - "step": 295630 - }, - { - "epoch": 0.52, - "learning_rate": 2.4221968003292446e-05, - "loss": 2.3638, - "step": 295640 - }, - { - "epoch": 0.52, - "learning_rate": 2.422109606336562e-05, - "loss": 2.2816, - "step": 295650 - }, - { - "epoch": 0.52, - "learning_rate": 2.4220224123438794e-05, - "loss": 2.2917, - "step": 295660 - }, - { - "epoch": 0.52, - "learning_rate": 2.4219352183511964e-05, - "loss": 2.3163, - "step": 295670 - }, - { - "epoch": 0.52, - "learning_rate": 2.421848024358514e-05, - "loss": 2.4275, - "step": 295680 - }, - { - "epoch": 0.52, - "learning_rate": 2.421760830365831e-05, - "loss": 2.2805, - "step": 295690 - }, - { - "epoch": 0.52, - "learning_rate": 2.4216736363731485e-05, - "loss": 2.2908, - "step": 295700 - }, - { - "epoch": 0.52, - "learning_rate": 2.421586442380466e-05, - "loss": 2.2296, - "step": 295710 - }, - { - "epoch": 0.52, - "learning_rate": 2.4214992483877833e-05, - "loss": 2.4453, - "step": 295720 - }, - { - "epoch": 0.52, - "learning_rate": 2.4214120543951003e-05, - "loss": 2.3145, - "step": 295730 - }, - { - "epoch": 0.52, - "learning_rate": 2.4213248604024177e-05, - "loss": 2.2828, - "step": 295740 - }, - { - "epoch": 0.52, - "learning_rate": 2.4212376664097354e-05, - "loss": 2.4007, - "step": 295750 - }, - { - "epoch": 0.52, - "learning_rate": 2.4211504724170525e-05, - "loss": 2.3331, - "step": 295760 - }, - { - "epoch": 0.52, - "learning_rate": 2.42106327842437e-05, - "loss": 2.291, - "step": 295770 - }, - { - "epoch": 0.52, - "learning_rate": 2.420976084431687e-05, - "loss": 2.4279, - "step": 295780 - }, - { - "epoch": 0.52, - "learning_rate": 2.4208888904390046e-05, - "loss": 2.3839, - "step": 295790 - }, - { - "epoch": 0.52, - "learning_rate": 2.4208016964463216e-05, - "loss": 2.4101, - "step": 295800 - }, - { - "epoch": 0.52, - "learning_rate": 2.420714502453639e-05, - "loss": 2.1885, - "step": 295810 - }, - { - "epoch": 0.52, - "learning_rate": 2.4206273084609564e-05, - "loss": 2.2554, - "step": 295820 - }, - { - "epoch": 0.52, - "learning_rate": 2.4205401144682738e-05, - "loss": 2.3402, - "step": 295830 - }, - { - "epoch": 0.52, - "learning_rate": 2.420452920475591e-05, - "loss": 2.3298, - "step": 295840 - }, - { - "epoch": 0.52, - "learning_rate": 2.4203657264829082e-05, - "loss": 2.3644, - "step": 295850 - }, - { - "epoch": 0.52, - "learning_rate": 2.420278532490226e-05, - "loss": 2.2729, - "step": 295860 - }, - { - "epoch": 0.52, - "learning_rate": 2.420191338497543e-05, - "loss": 2.4198, - "step": 295870 - }, - { - "epoch": 0.52, - "learning_rate": 2.4201041445048603e-05, - "loss": 2.357, - "step": 295880 - }, - { - "epoch": 0.52, - "learning_rate": 2.4200169505121777e-05, - "loss": 2.3334, - "step": 295890 - }, - { - "epoch": 0.52, - "learning_rate": 2.419929756519495e-05, - "loss": 2.42, - "step": 295900 - }, - { - "epoch": 0.52, - "learning_rate": 2.4198425625268124e-05, - "loss": 2.2355, - "step": 295910 - }, - { - "epoch": 0.52, - "learning_rate": 2.4197553685341295e-05, - "loss": 2.4225, - "step": 295920 - }, - { - "epoch": 0.52, - "learning_rate": 2.419668174541447e-05, - "loss": 2.3122, - "step": 295930 - }, - { - "epoch": 0.52, - "learning_rate": 2.4195809805487642e-05, - "loss": 2.3533, - "step": 295940 - }, - { - "epoch": 0.52, - "learning_rate": 2.4194937865560816e-05, - "loss": 2.3941, - "step": 295950 - }, - { - "epoch": 0.52, - "learning_rate": 2.4194065925633986e-05, - "loss": 2.2337, - "step": 295960 - }, - { - "epoch": 0.52, - "learning_rate": 2.4193193985707164e-05, - "loss": 2.4214, - "step": 295970 - }, - { - "epoch": 0.52, - "learning_rate": 2.4192322045780334e-05, - "loss": 2.3645, - "step": 295980 - }, - { - "epoch": 0.52, - "learning_rate": 2.4191450105853508e-05, - "loss": 2.4198, - "step": 295990 - }, - { - "epoch": 0.52, - "learning_rate": 2.419057816592668e-05, - "loss": 2.3333, - "step": 296000 - }, - { - "epoch": 0.52, - "learning_rate": 2.4189706225999855e-05, - "loss": 2.4367, - "step": 296010 - }, - { - "epoch": 0.52, - "learning_rate": 2.418883428607303e-05, - "loss": 2.3389, - "step": 296020 - }, - { - "epoch": 0.52, - "learning_rate": 2.41879623461462e-05, - "loss": 2.3269, - "step": 296030 - }, - { - "epoch": 0.52, - "learning_rate": 2.4187090406219373e-05, - "loss": 2.4022, - "step": 296040 - }, - { - "epoch": 0.52, - "learning_rate": 2.4186218466292547e-05, - "loss": 2.3568, - "step": 296050 - }, - { - "epoch": 0.52, - "learning_rate": 2.418534652636572e-05, - "loss": 2.3563, - "step": 296060 - }, - { - "epoch": 0.52, - "learning_rate": 2.4184474586438895e-05, - "loss": 2.3961, - "step": 296070 - }, - { - "epoch": 0.52, - "learning_rate": 2.4183602646512065e-05, - "loss": 2.3986, - "step": 296080 - }, - { - "epoch": 0.52, - "learning_rate": 2.4182730706585242e-05, - "loss": 2.3511, - "step": 296090 - }, - { - "epoch": 0.52, - "learning_rate": 2.4181858766658412e-05, - "loss": 2.4208, - "step": 296100 - }, - { - "epoch": 0.52, - "learning_rate": 2.4180986826731586e-05, - "loss": 2.2703, - "step": 296110 - }, - { - "epoch": 0.52, - "learning_rate": 2.418011488680476e-05, - "loss": 2.4193, - "step": 296120 - }, - { - "epoch": 0.52, - "learning_rate": 2.4179242946877934e-05, - "loss": 2.3359, - "step": 296130 - }, - { - "epoch": 0.52, - "learning_rate": 2.4178371006951108e-05, - "loss": 2.5308, - "step": 296140 - }, - { - "epoch": 0.52, - "learning_rate": 2.4177499067024278e-05, - "loss": 2.3087, - "step": 296150 - }, - { - "epoch": 0.52, - "learning_rate": 2.4176627127097455e-05, - "loss": 2.4525, - "step": 296160 - }, - { - "epoch": 0.52, - "learning_rate": 2.4175755187170625e-05, - "loss": 2.4367, - "step": 296170 - }, - { - "epoch": 0.52, - "learning_rate": 2.41748832472438e-05, - "loss": 2.349, - "step": 296180 - }, - { - "epoch": 0.52, - "learning_rate": 2.417401130731697e-05, - "loss": 2.425, - "step": 296190 - }, - { - "epoch": 0.52, - "learning_rate": 2.4173139367390147e-05, - "loss": 2.3491, - "step": 296200 - }, - { - "epoch": 0.52, - "learning_rate": 2.4172267427463317e-05, - "loss": 2.3822, - "step": 296210 - }, - { - "epoch": 0.52, - "learning_rate": 2.417139548753649e-05, - "loss": 2.3717, - "step": 296220 - }, - { - "epoch": 0.52, - "learning_rate": 2.4170523547609668e-05, - "loss": 2.3725, - "step": 296230 - }, - { - "epoch": 0.52, - "learning_rate": 2.416965160768284e-05, - "loss": 2.3642, - "step": 296240 - }, - { - "epoch": 0.52, - "learning_rate": 2.4168779667756012e-05, - "loss": 2.2628, - "step": 296250 - }, - { - "epoch": 0.52, - "learning_rate": 2.4167907727829183e-05, - "loss": 2.3441, - "step": 296260 - }, - { - "epoch": 0.52, - "learning_rate": 2.416703578790236e-05, - "loss": 2.2571, - "step": 296270 - }, - { - "epoch": 0.52, - "learning_rate": 2.416616384797553e-05, - "loss": 2.3014, - "step": 296280 - }, - { - "epoch": 0.52, - "learning_rate": 2.4165291908048704e-05, - "loss": 2.3395, - "step": 296290 - }, - { - "epoch": 0.52, - "learning_rate": 2.4164419968121878e-05, - "loss": 2.3155, - "step": 296300 - }, - { - "epoch": 0.52, - "learning_rate": 2.416354802819505e-05, - "loss": 2.3571, - "step": 296310 - }, - { - "epoch": 0.52, - "learning_rate": 2.4162676088268225e-05, - "loss": 2.4261, - "step": 296320 - }, - { - "epoch": 0.52, - "learning_rate": 2.4161804148341396e-05, - "loss": 2.4282, - "step": 296330 - }, - { - "epoch": 0.52, - "learning_rate": 2.416093220841457e-05, - "loss": 2.3945, - "step": 296340 - }, - { - "epoch": 0.52, - "learning_rate": 2.4160060268487743e-05, - "loss": 2.3914, - "step": 296350 - }, - { - "epoch": 0.52, - "learning_rate": 2.4159188328560917e-05, - "loss": 2.3475, - "step": 296360 - }, - { - "epoch": 0.52, - "learning_rate": 2.415831638863409e-05, - "loss": 2.316, - "step": 296370 - }, - { - "epoch": 0.52, - "learning_rate": 2.4157444448707264e-05, - "loss": 2.3342, - "step": 296380 - }, - { - "epoch": 0.52, - "learning_rate": 2.4156572508780438e-05, - "loss": 2.3956, - "step": 296390 - }, - { - "epoch": 0.52, - "learning_rate": 2.415570056885361e-05, - "loss": 2.3305, - "step": 296400 - }, - { - "epoch": 0.52, - "learning_rate": 2.4154828628926782e-05, - "loss": 2.4679, - "step": 296410 - }, - { - "epoch": 0.52, - "learning_rate": 2.4153956688999956e-05, - "loss": 2.4174, - "step": 296420 - }, - { - "epoch": 0.52, - "learning_rate": 2.415308474907313e-05, - "loss": 2.2616, - "step": 296430 - }, - { - "epoch": 0.52, - "learning_rate": 2.41522128091463e-05, - "loss": 2.3505, - "step": 296440 - }, - { - "epoch": 0.52, - "learning_rate": 2.4151340869219474e-05, - "loss": 2.3103, - "step": 296450 - }, - { - "epoch": 0.52, - "learning_rate": 2.4150468929292648e-05, - "loss": 2.3139, - "step": 296460 - }, - { - "epoch": 0.52, - "learning_rate": 2.414959698936582e-05, - "loss": 2.3818, - "step": 296470 - }, - { - "epoch": 0.52, - "learning_rate": 2.4148725049438995e-05, - "loss": 2.3594, - "step": 296480 - }, - { - "epoch": 0.52, - "learning_rate": 2.4147853109512166e-05, - "loss": 2.2473, - "step": 296490 - }, - { - "epoch": 0.52, - "learning_rate": 2.4146981169585343e-05, - "loss": 2.4907, - "step": 296500 - }, - { - "epoch": 0.52, - "learning_rate": 2.4146109229658513e-05, - "loss": 2.41, - "step": 296510 - }, - { - "epoch": 0.52, - "learning_rate": 2.4145237289731687e-05, - "loss": 2.356, - "step": 296520 - }, - { - "epoch": 0.52, - "learning_rate": 2.414436534980486e-05, - "loss": 2.4267, - "step": 296530 - }, - { - "epoch": 0.52, - "learning_rate": 2.4143493409878035e-05, - "loss": 2.4036, - "step": 296540 - }, - { - "epoch": 0.52, - "learning_rate": 2.414262146995121e-05, - "loss": 2.3708, - "step": 296550 - }, - { - "epoch": 0.52, - "learning_rate": 2.414174953002438e-05, - "loss": 2.3971, - "step": 296560 - }, - { - "epoch": 0.52, - "learning_rate": 2.4140877590097556e-05, - "loss": 2.3912, - "step": 296570 - }, - { - "epoch": 0.52, - "learning_rate": 2.4140005650170726e-05, - "loss": 2.4169, - "step": 296580 - }, - { - "epoch": 0.52, - "learning_rate": 2.41391337102439e-05, - "loss": 2.4244, - "step": 296590 - }, - { - "epoch": 0.52, - "learning_rate": 2.413826177031707e-05, - "loss": 2.4777, - "step": 296600 - }, - { - "epoch": 0.52, - "learning_rate": 2.4137389830390248e-05, - "loss": 2.4467, - "step": 296610 - }, - { - "epoch": 0.52, - "learning_rate": 2.413651789046342e-05, - "loss": 2.4072, - "step": 296620 - }, - { - "epoch": 0.52, - "learning_rate": 2.4135645950536592e-05, - "loss": 2.3297, - "step": 296630 - }, - { - "epoch": 0.52, - "learning_rate": 2.413477401060977e-05, - "loss": 2.4823, - "step": 296640 - }, - { - "epoch": 0.52, - "learning_rate": 2.413390207068294e-05, - "loss": 2.284, - "step": 296650 - }, - { - "epoch": 0.52, - "learning_rate": 2.4133030130756113e-05, - "loss": 2.2946, - "step": 296660 - }, - { - "epoch": 0.52, - "learning_rate": 2.4132158190829283e-05, - "loss": 2.3518, - "step": 296670 - }, - { - "epoch": 0.52, - "learning_rate": 2.413128625090246e-05, - "loss": 2.2944, - "step": 296680 - }, - { - "epoch": 0.52, - "learning_rate": 2.413041431097563e-05, - "loss": 2.4773, - "step": 296690 - }, - { - "epoch": 0.52, - "learning_rate": 2.4129542371048805e-05, - "loss": 2.3016, - "step": 296700 - }, - { - "epoch": 0.52, - "learning_rate": 2.412867043112198e-05, - "loss": 2.3098, - "step": 296710 - }, - { - "epoch": 0.52, - "learning_rate": 2.4127798491195152e-05, - "loss": 2.4037, - "step": 296720 - }, - { - "epoch": 0.52, - "learning_rate": 2.4126926551268326e-05, - "loss": 2.3645, - "step": 296730 - }, - { - "epoch": 0.52, - "learning_rate": 2.4126054611341496e-05, - "loss": 2.2945, - "step": 296740 - }, - { - "epoch": 0.52, - "learning_rate": 2.412518267141467e-05, - "loss": 2.3816, - "step": 296750 - }, - { - "epoch": 0.52, - "learning_rate": 2.4124310731487844e-05, - "loss": 2.4236, - "step": 296760 - }, - { - "epoch": 0.52, - "learning_rate": 2.4123438791561018e-05, - "loss": 2.2445, - "step": 296770 - }, - { - "epoch": 0.52, - "learning_rate": 2.412256685163419e-05, - "loss": 2.3876, - "step": 296780 - }, - { - "epoch": 0.52, - "learning_rate": 2.4121694911707365e-05, - "loss": 2.3426, - "step": 296790 - }, - { - "epoch": 0.52, - "learning_rate": 2.412082297178054e-05, - "loss": 2.2915, - "step": 296800 - }, - { - "epoch": 0.52, - "learning_rate": 2.411995103185371e-05, - "loss": 2.3787, - "step": 296810 - }, - { - "epoch": 0.52, - "learning_rate": 2.4119079091926883e-05, - "loss": 2.3806, - "step": 296820 - }, - { - "epoch": 0.52, - "learning_rate": 2.4118207152000057e-05, - "loss": 2.3306, - "step": 296830 - }, - { - "epoch": 0.52, - "learning_rate": 2.411733521207323e-05, - "loss": 2.4501, - "step": 296840 - }, - { - "epoch": 0.52, - "learning_rate": 2.4116463272146405e-05, - "loss": 2.3546, - "step": 296850 - }, - { - "epoch": 0.52, - "learning_rate": 2.4115591332219575e-05, - "loss": 2.4276, - "step": 296860 - }, - { - "epoch": 0.52, - "learning_rate": 2.4114719392292752e-05, - "loss": 2.3071, - "step": 296870 - }, - { - "epoch": 0.52, - "learning_rate": 2.4113847452365922e-05, - "loss": 2.1949, - "step": 296880 - }, - { - "epoch": 0.52, - "learning_rate": 2.4112975512439096e-05, - "loss": 2.35, - "step": 296890 - }, - { - "epoch": 0.52, - "learning_rate": 2.411210357251227e-05, - "loss": 2.4089, - "step": 296900 - }, - { - "epoch": 0.52, - "learning_rate": 2.4111231632585444e-05, - "loss": 2.3727, - "step": 296910 - }, - { - "epoch": 0.52, - "learning_rate": 2.4110359692658614e-05, - "loss": 2.3974, - "step": 296920 - }, - { - "epoch": 0.52, - "learning_rate": 2.4109487752731788e-05, - "loss": 2.3477, - "step": 296930 - }, - { - "epoch": 0.52, - "learning_rate": 2.4108615812804962e-05, - "loss": 2.4351, - "step": 296940 - }, - { - "epoch": 0.52, - "learning_rate": 2.4107743872878135e-05, - "loss": 2.4083, - "step": 296950 - }, - { - "epoch": 0.52, - "learning_rate": 2.410687193295131e-05, - "loss": 2.4757, - "step": 296960 - }, - { - "epoch": 0.52, - "learning_rate": 2.410599999302448e-05, - "loss": 2.3786, - "step": 296970 - }, - { - "epoch": 0.52, - "learning_rate": 2.4105128053097657e-05, - "loss": 2.3901, - "step": 296980 - }, - { - "epoch": 0.52, - "learning_rate": 2.4104256113170827e-05, - "loss": 2.3225, - "step": 296990 - }, - { - "epoch": 0.52, - "learning_rate": 2.4103384173244e-05, - "loss": 2.3622, - "step": 297000 - }, - { - "epoch": 0.52, - "learning_rate": 2.4102512233317175e-05, - "loss": 2.2861, - "step": 297010 - }, - { - "epoch": 0.52, - "learning_rate": 2.410164029339035e-05, - "loss": 2.3462, - "step": 297020 - }, - { - "epoch": 0.52, - "learning_rate": 2.4100768353463522e-05, - "loss": 2.3164, - "step": 297030 - }, - { - "epoch": 0.52, - "learning_rate": 2.4099896413536693e-05, - "loss": 2.5175, - "step": 297040 - }, - { - "epoch": 0.52, - "learning_rate": 2.409902447360987e-05, - "loss": 2.4223, - "step": 297050 - }, - { - "epoch": 0.52, - "learning_rate": 2.409815253368304e-05, - "loss": 2.3797, - "step": 297060 - }, - { - "epoch": 0.52, - "learning_rate": 2.4097280593756214e-05, - "loss": 2.2892, - "step": 297070 - }, - { - "epoch": 0.52, - "learning_rate": 2.4096408653829384e-05, - "loss": 2.2963, - "step": 297080 - }, - { - "epoch": 0.52, - "learning_rate": 2.409553671390256e-05, - "loss": 2.4475, - "step": 297090 - }, - { - "epoch": 0.52, - "learning_rate": 2.4094664773975735e-05, - "loss": 2.3132, - "step": 297100 - }, - { - "epoch": 0.52, - "learning_rate": 2.4093792834048906e-05, - "loss": 2.3714, - "step": 297110 - }, - { - "epoch": 0.52, - "learning_rate": 2.409292089412208e-05, - "loss": 2.3071, - "step": 297120 - }, - { - "epoch": 0.52, - "learning_rate": 2.4092048954195253e-05, - "loss": 2.3781, - "step": 297130 - }, - { - "epoch": 0.52, - "learning_rate": 2.4091177014268427e-05, - "loss": 2.2608, - "step": 297140 - }, - { - "epoch": 0.52, - "learning_rate": 2.4090305074341597e-05, - "loss": 2.337, - "step": 297150 - }, - { - "epoch": 0.52, - "learning_rate": 2.4089433134414774e-05, - "loss": 2.3308, - "step": 297160 - }, - { - "epoch": 0.52, - "learning_rate": 2.4088561194487945e-05, - "loss": 2.396, - "step": 297170 - }, - { - "epoch": 0.52, - "learning_rate": 2.408768925456112e-05, - "loss": 2.2818, - "step": 297180 - }, - { - "epoch": 0.52, - "learning_rate": 2.4086817314634292e-05, - "loss": 2.3783, - "step": 297190 - }, - { - "epoch": 0.52, - "learning_rate": 2.4085945374707466e-05, - "loss": 2.4016, - "step": 297200 - }, - { - "epoch": 0.52, - "learning_rate": 2.408507343478064e-05, - "loss": 2.3643, - "step": 297210 - }, - { - "epoch": 0.52, - "learning_rate": 2.408420149485381e-05, - "loss": 2.3205, - "step": 297220 - }, - { - "epoch": 0.52, - "learning_rate": 2.4083329554926984e-05, - "loss": 2.3577, - "step": 297230 - }, - { - "epoch": 0.52, - "learning_rate": 2.4082457615000158e-05, - "loss": 2.3293, - "step": 297240 - }, - { - "epoch": 0.52, - "learning_rate": 2.408158567507333e-05, - "loss": 2.4477, - "step": 297250 - }, - { - "epoch": 0.52, - "learning_rate": 2.4080713735146505e-05, - "loss": 2.3044, - "step": 297260 - }, - { - "epoch": 0.52, - "learning_rate": 2.4079841795219676e-05, - "loss": 2.2366, - "step": 297270 - }, - { - "epoch": 0.52, - "learning_rate": 2.4078969855292853e-05, - "loss": 2.349, - "step": 297280 - }, - { - "epoch": 0.52, - "learning_rate": 2.4078097915366023e-05, - "loss": 2.1976, - "step": 297290 - }, - { - "epoch": 0.52, - "learning_rate": 2.4077225975439197e-05, - "loss": 2.3507, - "step": 297300 - }, - { - "epoch": 0.52, - "learning_rate": 2.407635403551237e-05, - "loss": 2.4036, - "step": 297310 - }, - { - "epoch": 0.52, - "learning_rate": 2.4075482095585545e-05, - "loss": 2.406, - "step": 297320 - }, - { - "epoch": 0.52, - "learning_rate": 2.4074610155658715e-05, - "loss": 2.3773, - "step": 297330 - }, - { - "epoch": 0.52, - "learning_rate": 2.407373821573189e-05, - "loss": 2.3741, - "step": 297340 - }, - { - "epoch": 0.52, - "learning_rate": 2.4072866275805066e-05, - "loss": 2.3162, - "step": 297350 - }, - { - "epoch": 0.52, - "learning_rate": 2.4071994335878236e-05, - "loss": 2.3258, - "step": 297360 - }, - { - "epoch": 0.52, - "learning_rate": 2.407112239595141e-05, - "loss": 2.3956, - "step": 297370 - }, - { - "epoch": 0.52, - "learning_rate": 2.407025045602458e-05, - "loss": 2.3212, - "step": 297380 - }, - { - "epoch": 0.52, - "learning_rate": 2.4069378516097758e-05, - "loss": 2.393, - "step": 297390 - }, - { - "epoch": 0.52, - "learning_rate": 2.4068506576170928e-05, - "loss": 2.3889, - "step": 297400 - }, - { - "epoch": 0.52, - "learning_rate": 2.4067634636244102e-05, - "loss": 2.3058, - "step": 297410 - }, - { - "epoch": 0.52, - "learning_rate": 2.4066762696317276e-05, - "loss": 2.4461, - "step": 297420 - }, - { - "epoch": 0.52, - "learning_rate": 2.406589075639045e-05, - "loss": 2.3612, - "step": 297430 - }, - { - "epoch": 0.52, - "learning_rate": 2.4065018816463623e-05, - "loss": 2.3045, - "step": 297440 - }, - { - "epoch": 0.52, - "learning_rate": 2.4064146876536793e-05, - "loss": 2.3221, - "step": 297450 - }, - { - "epoch": 0.52, - "learning_rate": 2.406327493660997e-05, - "loss": 2.3353, - "step": 297460 - }, - { - "epoch": 0.52, - "learning_rate": 2.406240299668314e-05, - "loss": 2.3953, - "step": 297470 - }, - { - "epoch": 0.52, - "learning_rate": 2.4061531056756315e-05, - "loss": 2.4031, - "step": 297480 - }, - { - "epoch": 0.52, - "learning_rate": 2.406065911682949e-05, - "loss": 2.4412, - "step": 297490 - }, - { - "epoch": 0.52, - "learning_rate": 2.4059787176902662e-05, - "loss": 2.3916, - "step": 297500 - }, - { - "epoch": 0.52, - "learning_rate": 2.4058915236975836e-05, - "loss": 2.279, - "step": 297510 - }, - { - "epoch": 0.52, - "learning_rate": 2.4058043297049006e-05, - "loss": 2.4273, - "step": 297520 - }, - { - "epoch": 0.52, - "learning_rate": 2.405717135712218e-05, - "loss": 2.2596, - "step": 297530 - }, - { - "epoch": 0.52, - "learning_rate": 2.4056299417195354e-05, - "loss": 2.3529, - "step": 297540 - }, - { - "epoch": 0.52, - "learning_rate": 2.4055427477268528e-05, - "loss": 2.4115, - "step": 297550 - }, - { - "epoch": 0.52, - "learning_rate": 2.4054555537341698e-05, - "loss": 2.4824, - "step": 297560 - }, - { - "epoch": 0.52, - "learning_rate": 2.4053683597414875e-05, - "loss": 2.3328, - "step": 297570 - }, - { - "epoch": 0.52, - "learning_rate": 2.405281165748805e-05, - "loss": 2.4304, - "step": 297580 - }, - { - "epoch": 0.52, - "learning_rate": 2.405193971756122e-05, - "loss": 2.4048, - "step": 297590 - }, - { - "epoch": 0.52, - "learning_rate": 2.4051067777634393e-05, - "loss": 2.3564, - "step": 297600 - }, - { - "epoch": 0.52, - "learning_rate": 2.4050195837707567e-05, - "loss": 2.234, - "step": 297610 - }, - { - "epoch": 0.52, - "learning_rate": 2.404932389778074e-05, - "loss": 2.4742, - "step": 297620 - }, - { - "epoch": 0.52, - "learning_rate": 2.404845195785391e-05, - "loss": 2.333, - "step": 297630 - }, - { - "epoch": 0.52, - "learning_rate": 2.4047580017927085e-05, - "loss": 2.3936, - "step": 297640 - }, - { - "epoch": 0.52, - "learning_rate": 2.404670807800026e-05, - "loss": 2.3351, - "step": 297650 - }, - { - "epoch": 0.52, - "learning_rate": 2.4045836138073433e-05, - "loss": 2.296, - "step": 297660 - }, - { - "epoch": 0.52, - "learning_rate": 2.4044964198146606e-05, - "loss": 2.3051, - "step": 297670 - }, - { - "epoch": 0.52, - "learning_rate": 2.4044092258219777e-05, - "loss": 2.3947, - "step": 297680 - }, - { - "epoch": 0.52, - "learning_rate": 2.4043220318292954e-05, - "loss": 2.3098, - "step": 297690 - }, - { - "epoch": 0.52, - "learning_rate": 2.4042348378366124e-05, - "loss": 2.3213, - "step": 297700 - }, - { - "epoch": 0.52, - "learning_rate": 2.4041476438439298e-05, - "loss": 2.3768, - "step": 297710 - }, - { - "epoch": 0.52, - "learning_rate": 2.4040604498512472e-05, - "loss": 2.2669, - "step": 297720 - }, - { - "epoch": 0.52, - "learning_rate": 2.4039732558585646e-05, - "loss": 2.4884, - "step": 297730 - }, - { - "epoch": 0.52, - "learning_rate": 2.403886061865882e-05, - "loss": 2.4029, - "step": 297740 - }, - { - "epoch": 0.52, - "learning_rate": 2.403798867873199e-05, - "loss": 2.4367, - "step": 297750 - }, - { - "epoch": 0.52, - "learning_rate": 2.4037116738805167e-05, - "loss": 2.3747, - "step": 297760 - }, - { - "epoch": 0.52, - "learning_rate": 2.4036244798878337e-05, - "loss": 2.3959, - "step": 297770 - }, - { - "epoch": 0.52, - "learning_rate": 2.403537285895151e-05, - "loss": 2.443, - "step": 297780 - }, - { - "epoch": 0.52, - "learning_rate": 2.403450091902468e-05, - "loss": 2.3733, - "step": 297790 - }, - { - "epoch": 0.52, - "learning_rate": 2.403362897909786e-05, - "loss": 2.3583, - "step": 297800 - }, - { - "epoch": 0.52, - "learning_rate": 2.403275703917103e-05, - "loss": 2.3565, - "step": 297810 - }, - { - "epoch": 0.52, - "learning_rate": 2.4031885099244203e-05, - "loss": 2.4303, - "step": 297820 - }, - { - "epoch": 0.52, - "learning_rate": 2.403101315931738e-05, - "loss": 2.3575, - "step": 297830 - }, - { - "epoch": 0.52, - "learning_rate": 2.403014121939055e-05, - "loss": 2.2844, - "step": 297840 - }, - { - "epoch": 0.52, - "learning_rate": 2.4029269279463724e-05, - "loss": 2.413, - "step": 297850 - }, - { - "epoch": 0.52, - "learning_rate": 2.4028397339536894e-05, - "loss": 2.2738, - "step": 297860 - }, - { - "epoch": 0.52, - "learning_rate": 2.402752539961007e-05, - "loss": 2.2955, - "step": 297870 - }, - { - "epoch": 0.52, - "learning_rate": 2.4026653459683242e-05, - "loss": 2.2689, - "step": 297880 - }, - { - "epoch": 0.52, - "learning_rate": 2.4025781519756416e-05, - "loss": 2.2689, - "step": 297890 - }, - { - "epoch": 0.52, - "learning_rate": 2.402490957982959e-05, - "loss": 2.3153, - "step": 297900 - }, - { - "epoch": 0.52, - "learning_rate": 2.4024037639902763e-05, - "loss": 2.386, - "step": 297910 - }, - { - "epoch": 0.52, - "learning_rate": 2.4023165699975937e-05, - "loss": 2.3515, - "step": 297920 - }, - { - "epoch": 0.52, - "learning_rate": 2.4022293760049107e-05, - "loss": 2.3811, - "step": 297930 - }, - { - "epoch": 0.52, - "learning_rate": 2.402142182012228e-05, - "loss": 2.4554, - "step": 297940 - }, - { - "epoch": 0.52, - "learning_rate": 2.4020549880195455e-05, - "loss": 2.3814, - "step": 297950 - }, - { - "epoch": 0.52, - "learning_rate": 2.401967794026863e-05, - "loss": 2.3235, - "step": 297960 - }, - { - "epoch": 0.52, - "learning_rate": 2.4018806000341802e-05, - "loss": 2.3916, - "step": 297970 - }, - { - "epoch": 0.52, - "learning_rate": 2.4017934060414976e-05, - "loss": 2.3604, - "step": 297980 - }, - { - "epoch": 0.52, - "learning_rate": 2.401706212048815e-05, - "loss": 2.3884, - "step": 297990 - }, - { - "epoch": 0.52, - "learning_rate": 2.401619018056132e-05, - "loss": 2.3166, - "step": 298000 - }, - { - "epoch": 0.52, - "learning_rate": 2.4015318240634494e-05, - "loss": 2.3882, - "step": 298010 - }, - { - "epoch": 0.52, - "learning_rate": 2.4014446300707668e-05, - "loss": 2.1687, - "step": 298020 - }, - { - "epoch": 0.52, - "learning_rate": 2.401357436078084e-05, - "loss": 2.3266, - "step": 298030 - }, - { - "epoch": 0.52, - "learning_rate": 2.4012702420854012e-05, - "loss": 2.4029, - "step": 298040 - }, - { - "epoch": 0.52, - "learning_rate": 2.4011830480927186e-05, - "loss": 2.4651, - "step": 298050 - }, - { - "epoch": 0.52, - "learning_rate": 2.401095854100036e-05, - "loss": 2.3789, - "step": 298060 - }, - { - "epoch": 0.52, - "learning_rate": 2.4010086601073533e-05, - "loss": 2.1877, - "step": 298070 - }, - { - "epoch": 0.52, - "learning_rate": 2.4009214661146707e-05, - "loss": 2.2465, - "step": 298080 - }, - { - "epoch": 0.52, - "learning_rate": 2.400834272121988e-05, - "loss": 2.389, - "step": 298090 - }, - { - "epoch": 0.52, - "learning_rate": 2.4007470781293055e-05, - "loss": 2.2933, - "step": 298100 - }, - { - "epoch": 0.52, - "learning_rate": 2.4006598841366225e-05, - "loss": 2.3182, - "step": 298110 - }, - { - "epoch": 0.52, - "learning_rate": 2.40057269014394e-05, - "loss": 2.3552, - "step": 298120 - }, - { - "epoch": 0.52, - "learning_rate": 2.4004854961512573e-05, - "loss": 2.3301, - "step": 298130 - }, - { - "epoch": 0.52, - "learning_rate": 2.4003983021585746e-05, - "loss": 2.2901, - "step": 298140 - }, - { - "epoch": 0.52, - "learning_rate": 2.400311108165892e-05, - "loss": 2.3478, - "step": 298150 - }, - { - "epoch": 0.52, - "learning_rate": 2.400223914173209e-05, - "loss": 2.2687, - "step": 298160 - }, - { - "epoch": 0.52, - "learning_rate": 2.4001367201805268e-05, - "loss": 2.3241, - "step": 298170 - }, - { - "epoch": 0.52, - "learning_rate": 2.4000495261878438e-05, - "loss": 2.4653, - "step": 298180 - }, - { - "epoch": 0.52, - "learning_rate": 2.3999623321951612e-05, - "loss": 2.462, - "step": 298190 - }, - { - "epoch": 0.52, - "learning_rate": 2.3998751382024786e-05, - "loss": 2.3549, - "step": 298200 - }, - { - "epoch": 0.52, - "learning_rate": 2.399787944209796e-05, - "loss": 2.3325, - "step": 298210 - }, - { - "epoch": 0.52, - "learning_rate": 2.3997007502171133e-05, - "loss": 2.3489, - "step": 298220 - }, - { - "epoch": 0.52, - "learning_rate": 2.3996135562244304e-05, - "loss": 2.4747, - "step": 298230 - }, - { - "epoch": 0.52, - "learning_rate": 2.399526362231748e-05, - "loss": 2.3861, - "step": 298240 - }, - { - "epoch": 0.52, - "learning_rate": 2.399439168239065e-05, - "loss": 2.3714, - "step": 298250 - }, - { - "epoch": 0.52, - "learning_rate": 2.3993519742463825e-05, - "loss": 2.3373, - "step": 298260 - }, - { - "epoch": 0.52, - "learning_rate": 2.3992647802536995e-05, - "loss": 2.2479, - "step": 298270 - }, - { - "epoch": 0.52, - "learning_rate": 2.3991775862610172e-05, - "loss": 2.359, - "step": 298280 - }, - { - "epoch": 0.52, - "learning_rate": 2.3990903922683343e-05, - "loss": 2.3528, - "step": 298290 - }, - { - "epoch": 0.52, - "learning_rate": 2.3990031982756517e-05, - "loss": 2.2611, - "step": 298300 - }, - { - "epoch": 0.52, - "learning_rate": 2.398916004282969e-05, - "loss": 2.3599, - "step": 298310 - }, - { - "epoch": 0.52, - "learning_rate": 2.3988288102902864e-05, - "loss": 2.4444, - "step": 298320 - }, - { - "epoch": 0.52, - "learning_rate": 2.3987416162976038e-05, - "loss": 2.3371, - "step": 298330 - }, - { - "epoch": 0.52, - "learning_rate": 2.3986544223049208e-05, - "loss": 2.2852, - "step": 298340 - }, - { - "epoch": 0.52, - "learning_rate": 2.3985672283122382e-05, - "loss": 2.3866, - "step": 298350 - }, - { - "epoch": 0.52, - "learning_rate": 2.3984800343195556e-05, - "loss": 2.332, - "step": 298360 - }, - { - "epoch": 0.52, - "learning_rate": 2.398392840326873e-05, - "loss": 2.2616, - "step": 298370 - }, - { - "epoch": 0.52, - "learning_rate": 2.3983056463341903e-05, - "loss": 2.3193, - "step": 298380 - }, - { - "epoch": 0.52, - "learning_rate": 2.3982184523415077e-05, - "loss": 2.3397, - "step": 298390 - }, - { - "epoch": 0.52, - "learning_rate": 2.398131258348825e-05, - "loss": 2.4031, - "step": 298400 - }, - { - "epoch": 0.52, - "learning_rate": 2.398044064356142e-05, - "loss": 2.4654, - "step": 298410 - }, - { - "epoch": 0.52, - "learning_rate": 2.3979568703634595e-05, - "loss": 2.4139, - "step": 298420 - }, - { - "epoch": 0.52, - "learning_rate": 2.397869676370777e-05, - "loss": 2.4389, - "step": 298430 - }, - { - "epoch": 0.52, - "learning_rate": 2.3977824823780943e-05, - "loss": 2.3445, - "step": 298440 - }, - { - "epoch": 0.52, - "learning_rate": 2.3976952883854116e-05, - "loss": 2.4012, - "step": 298450 - }, - { - "epoch": 0.52, - "learning_rate": 2.3976080943927287e-05, - "loss": 2.392, - "step": 298460 - }, - { - "epoch": 0.52, - "learning_rate": 2.3975209004000464e-05, - "loss": 2.2844, - "step": 298470 - }, - { - "epoch": 0.52, - "learning_rate": 2.3974337064073634e-05, - "loss": 2.3327, - "step": 298480 - }, - { - "epoch": 0.52, - "learning_rate": 2.3973465124146808e-05, - "loss": 2.3495, - "step": 298490 - }, - { - "epoch": 0.52, - "learning_rate": 2.3972593184219982e-05, - "loss": 2.3056, - "step": 298500 - }, - { - "epoch": 0.52, - "learning_rate": 2.3971721244293156e-05, - "loss": 2.3538, - "step": 298510 - }, - { - "epoch": 0.52, - "learning_rate": 2.3970849304366326e-05, - "loss": 2.4222, - "step": 298520 - }, - { - "epoch": 0.52, - "learning_rate": 2.39699773644395e-05, - "loss": 2.3434, - "step": 298530 - }, - { - "epoch": 0.52, - "learning_rate": 2.3969105424512673e-05, - "loss": 2.1794, - "step": 298540 - }, - { - "epoch": 0.52, - "learning_rate": 2.3968233484585847e-05, - "loss": 2.3099, - "step": 298550 - }, - { - "epoch": 0.52, - "learning_rate": 2.396736154465902e-05, - "loss": 2.3143, - "step": 298560 - }, - { - "epoch": 0.52, - "learning_rate": 2.396648960473219e-05, - "loss": 2.4291, - "step": 298570 - }, - { - "epoch": 0.52, - "learning_rate": 2.396561766480537e-05, - "loss": 2.4371, - "step": 298580 - }, - { - "epoch": 0.52, - "learning_rate": 2.396474572487854e-05, - "loss": 2.3971, - "step": 298590 - }, - { - "epoch": 0.52, - "learning_rate": 2.3963873784951713e-05, - "loss": 2.4434, - "step": 298600 - }, - { - "epoch": 0.52, - "learning_rate": 2.3963001845024886e-05, - "loss": 2.3345, - "step": 298610 - }, - { - "epoch": 0.52, - "learning_rate": 2.396212990509806e-05, - "loss": 2.3578, - "step": 298620 - }, - { - "epoch": 0.52, - "learning_rate": 2.3961257965171234e-05, - "loss": 2.4378, - "step": 298630 - }, - { - "epoch": 0.52, - "learning_rate": 2.3960386025244404e-05, - "loss": 2.2763, - "step": 298640 - }, - { - "epoch": 0.52, - "learning_rate": 2.395951408531758e-05, - "loss": 2.3253, - "step": 298650 - }, - { - "epoch": 0.52, - "learning_rate": 2.3958642145390752e-05, - "loss": 2.3756, - "step": 298660 - }, - { - "epoch": 0.52, - "learning_rate": 2.3957770205463926e-05, - "loss": 2.3341, - "step": 298670 - }, - { - "epoch": 0.52, - "learning_rate": 2.3956898265537096e-05, - "loss": 2.3576, - "step": 298680 - }, - { - "epoch": 0.52, - "learning_rate": 2.3956026325610273e-05, - "loss": 2.3172, - "step": 298690 - }, - { - "epoch": 0.52, - "learning_rate": 2.3955154385683447e-05, - "loss": 2.4036, - "step": 298700 - }, - { - "epoch": 0.52, - "learning_rate": 2.3954282445756617e-05, - "loss": 2.4294, - "step": 298710 - }, - { - "epoch": 0.52, - "learning_rate": 2.395341050582979e-05, - "loss": 2.2991, - "step": 298720 - }, - { - "epoch": 0.52, - "learning_rate": 2.3952538565902965e-05, - "loss": 2.2898, - "step": 298730 - }, - { - "epoch": 0.52, - "learning_rate": 2.395166662597614e-05, - "loss": 2.3908, - "step": 298740 - }, - { - "epoch": 0.52, - "learning_rate": 2.395079468604931e-05, - "loss": 2.3507, - "step": 298750 - }, - { - "epoch": 0.52, - "learning_rate": 2.3949922746122486e-05, - "loss": 2.3435, - "step": 298760 - }, - { - "epoch": 0.52, - "learning_rate": 2.3949050806195657e-05, - "loss": 2.3595, - "step": 298770 - }, - { - "epoch": 0.52, - "learning_rate": 2.394817886626883e-05, - "loss": 2.3252, - "step": 298780 - }, - { - "epoch": 0.52, - "learning_rate": 2.3947306926342004e-05, - "loss": 2.3864, - "step": 298790 - }, - { - "epoch": 0.52, - "learning_rate": 2.3946434986415178e-05, - "loss": 2.4623, - "step": 298800 - }, - { - "epoch": 0.52, - "learning_rate": 2.394556304648835e-05, - "loss": 2.3665, - "step": 298810 - }, - { - "epoch": 0.52, - "learning_rate": 2.3944691106561522e-05, - "loss": 2.4105, - "step": 298820 - }, - { - "epoch": 0.52, - "learning_rate": 2.3943819166634696e-05, - "loss": 2.4514, - "step": 298830 - }, - { - "epoch": 0.52, - "learning_rate": 2.394294722670787e-05, - "loss": 2.3404, - "step": 298840 - }, - { - "epoch": 0.52, - "learning_rate": 2.3942075286781043e-05, - "loss": 2.3495, - "step": 298850 - }, - { - "epoch": 0.52, - "learning_rate": 2.3941203346854217e-05, - "loss": 2.2663, - "step": 298860 - }, - { - "epoch": 0.52, - "learning_rate": 2.3940331406927388e-05, - "loss": 2.2043, - "step": 298870 - }, - { - "epoch": 0.52, - "learning_rate": 2.3939459467000565e-05, - "loss": 2.3801, - "step": 298880 - }, - { - "epoch": 0.52, - "learning_rate": 2.3938587527073735e-05, - "loss": 2.3454, - "step": 298890 - }, - { - "epoch": 0.52, - "learning_rate": 2.393771558714691e-05, - "loss": 2.3439, - "step": 298900 - }, - { - "epoch": 0.52, - "learning_rate": 2.3936843647220083e-05, - "loss": 2.4104, - "step": 298910 - }, - { - "epoch": 0.52, - "learning_rate": 2.3935971707293256e-05, - "loss": 2.4333, - "step": 298920 - }, - { - "epoch": 0.52, - "learning_rate": 2.393509976736643e-05, - "loss": 2.4035, - "step": 298930 - }, - { - "epoch": 0.52, - "learning_rate": 2.39342278274396e-05, - "loss": 2.4567, - "step": 298940 - }, - { - "epoch": 0.52, - "learning_rate": 2.3933355887512778e-05, - "loss": 2.3274, - "step": 298950 - }, - { - "epoch": 0.52, - "learning_rate": 2.3932483947585948e-05, - "loss": 2.2209, - "step": 298960 - }, - { - "epoch": 0.52, - "learning_rate": 2.3931612007659122e-05, - "loss": 2.3782, - "step": 298970 - }, - { - "epoch": 0.52, - "learning_rate": 2.3930740067732292e-05, - "loss": 2.4172, - "step": 298980 - }, - { - "epoch": 0.52, - "learning_rate": 2.392986812780547e-05, - "loss": 2.3175, - "step": 298990 - }, - { - "epoch": 0.52, - "learning_rate": 2.392899618787864e-05, - "loss": 2.3399, - "step": 299000 - }, - { - "epoch": 0.52, - "learning_rate": 2.3928124247951814e-05, - "loss": 2.3811, - "step": 299010 - }, - { - "epoch": 0.52, - "learning_rate": 2.3927252308024987e-05, - "loss": 2.3431, - "step": 299020 - }, - { - "epoch": 0.52, - "learning_rate": 2.392638036809816e-05, - "loss": 2.305, - "step": 299030 - }, - { - "epoch": 0.52, - "learning_rate": 2.3925508428171335e-05, - "loss": 2.3377, - "step": 299040 - }, - { - "epoch": 0.52, - "learning_rate": 2.3924636488244505e-05, - "loss": 2.2855, - "step": 299050 - }, - { - "epoch": 0.52, - "learning_rate": 2.3923764548317682e-05, - "loss": 2.3402, - "step": 299060 - }, - { - "epoch": 0.52, - "learning_rate": 2.3922892608390853e-05, - "loss": 2.2562, - "step": 299070 - }, - { - "epoch": 0.52, - "learning_rate": 2.3922020668464027e-05, - "loss": 2.26, - "step": 299080 - }, - { - "epoch": 0.52, - "learning_rate": 2.39211487285372e-05, - "loss": 2.3393, - "step": 299090 - }, - { - "epoch": 0.52, - "learning_rate": 2.3920276788610374e-05, - "loss": 2.2985, - "step": 299100 - }, - { - "epoch": 0.52, - "learning_rate": 2.3919404848683548e-05, - "loss": 2.3349, - "step": 299110 - }, - { - "epoch": 0.52, - "learning_rate": 2.3918532908756718e-05, - "loss": 2.3364, - "step": 299120 - }, - { - "epoch": 0.52, - "learning_rate": 2.3917660968829892e-05, - "loss": 2.4134, - "step": 299130 - }, - { - "epoch": 0.52, - "learning_rate": 2.3916789028903066e-05, - "loss": 2.4021, - "step": 299140 - }, - { - "epoch": 0.52, - "learning_rate": 2.391591708897624e-05, - "loss": 2.2097, - "step": 299150 - }, - { - "epoch": 0.52, - "learning_rate": 2.391504514904941e-05, - "loss": 2.439, - "step": 299160 - }, - { - "epoch": 0.52, - "learning_rate": 2.3914173209122587e-05, - "loss": 2.3635, - "step": 299170 - }, - { - "epoch": 0.52, - "learning_rate": 2.391330126919576e-05, - "loss": 2.4014, - "step": 299180 - }, - { - "epoch": 0.52, - "learning_rate": 2.391242932926893e-05, - "loss": 2.3333, - "step": 299190 - }, - { - "epoch": 0.52, - "learning_rate": 2.3911557389342105e-05, - "loss": 2.3149, - "step": 299200 - }, - { - "epoch": 0.52, - "learning_rate": 2.391068544941528e-05, - "loss": 2.3255, - "step": 299210 - }, - { - "epoch": 0.52, - "learning_rate": 2.3909813509488453e-05, - "loss": 2.2944, - "step": 299220 - }, - { - "epoch": 0.52, - "learning_rate": 2.3908941569561623e-05, - "loss": 2.347, - "step": 299230 - }, - { - "epoch": 0.52, - "learning_rate": 2.3908069629634797e-05, - "loss": 2.379, - "step": 299240 - }, - { - "epoch": 0.52, - "learning_rate": 2.390719768970797e-05, - "loss": 2.3578, - "step": 299250 - }, - { - "epoch": 0.52, - "learning_rate": 2.3906325749781144e-05, - "loss": 2.2682, - "step": 299260 - }, - { - "epoch": 0.52, - "learning_rate": 2.3905453809854318e-05, - "loss": 2.4337, - "step": 299270 - }, - { - "epoch": 0.52, - "learning_rate": 2.390458186992749e-05, - "loss": 2.3057, - "step": 299280 - }, - { - "epoch": 0.52, - "learning_rate": 2.3903709930000666e-05, - "loss": 2.3779, - "step": 299290 - }, - { - "epoch": 0.52, - "learning_rate": 2.3902837990073836e-05, - "loss": 2.3126, - "step": 299300 - }, - { - "epoch": 0.52, - "learning_rate": 2.390196605014701e-05, - "loss": 2.2984, - "step": 299310 - }, - { - "epoch": 0.52, - "learning_rate": 2.3901094110220183e-05, - "loss": 2.4538, - "step": 299320 - }, - { - "epoch": 0.52, - "learning_rate": 2.3900222170293357e-05, - "loss": 2.2232, - "step": 299330 - }, - { - "epoch": 0.52, - "learning_rate": 2.389935023036653e-05, - "loss": 2.218, - "step": 299340 - }, - { - "epoch": 0.52, - "learning_rate": 2.38984782904397e-05, - "loss": 2.3992, - "step": 299350 - }, - { - "epoch": 0.52, - "learning_rate": 2.389760635051288e-05, - "loss": 2.2998, - "step": 299360 - }, - { - "epoch": 0.52, - "learning_rate": 2.389673441058605e-05, - "loss": 2.3024, - "step": 299370 - }, - { - "epoch": 0.52, - "learning_rate": 2.3895862470659223e-05, - "loss": 2.3207, - "step": 299380 - }, - { - "epoch": 0.52, - "learning_rate": 2.3894990530732393e-05, - "loss": 2.3587, - "step": 299390 - }, - { - "epoch": 0.52, - "learning_rate": 2.389411859080557e-05, - "loss": 2.4273, - "step": 299400 - }, - { - "epoch": 0.52, - "learning_rate": 2.389324665087874e-05, - "loss": 2.3814, - "step": 299410 - }, - { - "epoch": 0.52, - "learning_rate": 2.3892374710951914e-05, - "loss": 2.3292, - "step": 299420 - }, - { - "epoch": 0.52, - "learning_rate": 2.389150277102509e-05, - "loss": 2.3233, - "step": 299430 - }, - { - "epoch": 0.52, - "learning_rate": 2.3890630831098262e-05, - "loss": 2.3734, - "step": 299440 - }, - { - "epoch": 0.52, - "learning_rate": 2.3889758891171436e-05, - "loss": 2.3548, - "step": 299450 - }, - { - "epoch": 0.52, - "learning_rate": 2.3888886951244606e-05, - "loss": 2.4766, - "step": 299460 - }, - { - "epoch": 0.52, - "learning_rate": 2.3888015011317783e-05, - "loss": 2.2948, - "step": 299470 - }, - { - "epoch": 0.52, - "learning_rate": 2.3887143071390954e-05, - "loss": 2.3389, - "step": 299480 - }, - { - "epoch": 0.52, - "learning_rate": 2.3886271131464127e-05, - "loss": 2.289, - "step": 299490 - }, - { - "epoch": 0.52, - "learning_rate": 2.38853991915373e-05, - "loss": 2.3675, - "step": 299500 - }, - { - "epoch": 0.52, - "learning_rate": 2.3884527251610475e-05, - "loss": 2.3451, - "step": 299510 - }, - { - "epoch": 0.52, - "learning_rate": 2.388365531168365e-05, - "loss": 2.3353, - "step": 299520 - }, - { - "epoch": 0.52, - "learning_rate": 2.388278337175682e-05, - "loss": 2.3957, - "step": 299530 - }, - { - "epoch": 0.52, - "learning_rate": 2.3881911431829993e-05, - "loss": 2.28, - "step": 299540 - }, - { - "epoch": 0.52, - "learning_rate": 2.3881039491903167e-05, - "loss": 2.2324, - "step": 299550 - }, - { - "epoch": 0.52, - "learning_rate": 2.388016755197634e-05, - "loss": 2.3397, - "step": 299560 - }, - { - "epoch": 0.52, - "learning_rate": 2.3879295612049514e-05, - "loss": 2.3797, - "step": 299570 - }, - { - "epoch": 0.52, - "learning_rate": 2.3878423672122688e-05, - "loss": 2.318, - "step": 299580 - }, - { - "epoch": 0.52, - "learning_rate": 2.387755173219586e-05, - "loss": 2.4466, - "step": 299590 - }, - { - "epoch": 0.52, - "learning_rate": 2.3876679792269032e-05, - "loss": 2.4188, - "step": 299600 - }, - { - "epoch": 0.52, - "learning_rate": 2.3875807852342206e-05, - "loss": 2.4025, - "step": 299610 - }, - { - "epoch": 0.52, - "learning_rate": 2.387493591241538e-05, - "loss": 2.4276, - "step": 299620 - }, - { - "epoch": 0.52, - "learning_rate": 2.3874063972488553e-05, - "loss": 2.1958, - "step": 299630 - }, - { - "epoch": 0.52, - "learning_rate": 2.3873192032561724e-05, - "loss": 2.1722, - "step": 299640 - }, - { - "epoch": 0.52, - "learning_rate": 2.3872320092634898e-05, - "loss": 2.5097, - "step": 299650 - }, - { - "epoch": 0.52, - "learning_rate": 2.3871448152708075e-05, - "loss": 2.3201, - "step": 299660 - }, - { - "epoch": 0.52, - "learning_rate": 2.3870576212781245e-05, - "loss": 2.3811, - "step": 299670 - }, - { - "epoch": 0.52, - "learning_rate": 2.386970427285442e-05, - "loss": 2.3658, - "step": 299680 - }, - { - "epoch": 0.52, - "learning_rate": 2.3868832332927593e-05, - "loss": 2.2777, - "step": 299690 - }, - { - "epoch": 0.52, - "learning_rate": 2.3867960393000766e-05, - "loss": 2.3977, - "step": 299700 - }, - { - "epoch": 0.52, - "learning_rate": 2.3867088453073937e-05, - "loss": 2.4308, - "step": 299710 - }, - { - "epoch": 0.52, - "learning_rate": 2.386621651314711e-05, - "loss": 2.2278, - "step": 299720 - }, - { - "epoch": 0.52, - "learning_rate": 2.3865344573220284e-05, - "loss": 2.3338, - "step": 299730 - }, - { - "epoch": 0.52, - "learning_rate": 2.3864472633293458e-05, - "loss": 2.3737, - "step": 299740 - }, - { - "epoch": 0.52, - "learning_rate": 2.3863600693366632e-05, - "loss": 2.2853, - "step": 299750 - }, - { - "epoch": 0.52, - "learning_rate": 2.3862728753439802e-05, - "loss": 2.3684, - "step": 299760 - }, - { - "epoch": 0.52, - "learning_rate": 2.386185681351298e-05, - "loss": 2.4128, - "step": 299770 - }, - { - "epoch": 0.52, - "learning_rate": 2.386098487358615e-05, - "loss": 2.3138, - "step": 299780 - }, - { - "epoch": 0.52, - "learning_rate": 2.3860112933659324e-05, - "loss": 2.3332, - "step": 299790 - }, - { - "epoch": 0.52, - "learning_rate": 2.3859240993732497e-05, - "loss": 2.3616, - "step": 299800 - }, - { - "epoch": 0.52, - "learning_rate": 2.385836905380567e-05, - "loss": 2.1653, - "step": 299810 - }, - { - "epoch": 0.52, - "learning_rate": 2.3857497113878845e-05, - "loss": 2.371, - "step": 299820 - }, - { - "epoch": 0.52, - "learning_rate": 2.3856625173952015e-05, - "loss": 2.4103, - "step": 299830 - }, - { - "epoch": 0.52, - "learning_rate": 2.3855753234025192e-05, - "loss": 2.2514, - "step": 299840 - }, - { - "epoch": 0.52, - "learning_rate": 2.3854881294098363e-05, - "loss": 2.4345, - "step": 299850 - }, - { - "epoch": 0.52, - "learning_rate": 2.3854009354171537e-05, - "loss": 2.3466, - "step": 299860 - }, - { - "epoch": 0.52, - "learning_rate": 2.3853137414244707e-05, - "loss": 2.3819, - "step": 299870 - }, - { - "epoch": 0.52, - "learning_rate": 2.3852265474317884e-05, - "loss": 2.391, - "step": 299880 - }, - { - "epoch": 0.52, - "learning_rate": 2.3851393534391054e-05, - "loss": 2.4149, - "step": 299890 - }, - { - "epoch": 0.52, - "learning_rate": 2.3850521594464228e-05, - "loss": 2.2777, - "step": 299900 - }, - { - "epoch": 0.52, - "learning_rate": 2.3849649654537402e-05, - "loss": 2.3819, - "step": 299910 - }, - { - "epoch": 0.52, - "learning_rate": 2.3848777714610576e-05, - "loss": 2.3471, - "step": 299920 - }, - { - "epoch": 0.52, - "learning_rate": 2.384790577468375e-05, - "loss": 2.3025, - "step": 299930 - }, - { - "epoch": 0.52, - "learning_rate": 2.384703383475692e-05, - "loss": 2.3968, - "step": 299940 - }, - { - "epoch": 0.52, - "learning_rate": 2.3846161894830094e-05, - "loss": 2.3988, - "step": 299950 - }, - { - "epoch": 0.52, - "learning_rate": 2.3845289954903267e-05, - "loss": 2.3272, - "step": 299960 - }, - { - "epoch": 0.52, - "learning_rate": 2.384441801497644e-05, - "loss": 2.3496, - "step": 299970 - }, - { - "epoch": 0.52, - "learning_rate": 2.3843546075049615e-05, - "loss": 2.4131, - "step": 299980 - }, - { - "epoch": 0.52, - "learning_rate": 2.384267413512279e-05, - "loss": 2.4005, - "step": 299990 - }, - { - "epoch": 0.52, - "learning_rate": 2.3841802195195963e-05, - "loss": 2.3317, - "step": 300000 - }, - { - "epoch": 0.52, - "learning_rate": 2.3840930255269133e-05, - "loss": 2.4029, - "step": 300010 - }, - { - "epoch": 0.52, - "learning_rate": 2.3840058315342307e-05, - "loss": 2.3246, - "step": 300020 - }, - { - "epoch": 0.52, - "learning_rate": 2.383918637541548e-05, - "loss": 2.3127, - "step": 300030 - }, - { - "epoch": 0.52, - "learning_rate": 2.3838314435488654e-05, - "loss": 2.4224, - "step": 300040 - }, - { - "epoch": 0.52, - "learning_rate": 2.3837442495561828e-05, - "loss": 2.3674, - "step": 300050 - }, - { - "epoch": 0.52, - "learning_rate": 2.3836570555635e-05, - "loss": 2.3342, - "step": 300060 - }, - { - "epoch": 0.52, - "learning_rate": 2.3835698615708176e-05, - "loss": 2.4147, - "step": 300070 - }, - { - "epoch": 0.52, - "learning_rate": 2.3834826675781346e-05, - "loss": 2.329, - "step": 300080 - }, - { - "epoch": 0.52, - "learning_rate": 2.383395473585452e-05, - "loss": 2.3219, - "step": 300090 - }, - { - "epoch": 0.52, - "learning_rate": 2.3833082795927693e-05, - "loss": 2.3097, - "step": 300100 - }, - { - "epoch": 0.52, - "learning_rate": 2.3832210856000867e-05, - "loss": 2.4489, - "step": 300110 - }, - { - "epoch": 0.52, - "learning_rate": 2.3831338916074038e-05, - "loss": 2.3109, - "step": 300120 - }, - { - "epoch": 0.52, - "learning_rate": 2.383046697614721e-05, - "loss": 2.3898, - "step": 300130 - }, - { - "epoch": 0.52, - "learning_rate": 2.3829595036220385e-05, - "loss": 2.4545, - "step": 300140 - }, - { - "epoch": 0.52, - "learning_rate": 2.382872309629356e-05, - "loss": 2.3681, - "step": 300150 - }, - { - "epoch": 0.52, - "learning_rate": 2.3827851156366733e-05, - "loss": 2.374, - "step": 300160 - }, - { - "epoch": 0.52, - "learning_rate": 2.3826979216439903e-05, - "loss": 2.3299, - "step": 300170 - }, - { - "epoch": 0.52, - "learning_rate": 2.382610727651308e-05, - "loss": 2.3384, - "step": 300180 - }, - { - "epoch": 0.52, - "learning_rate": 2.382523533658625e-05, - "loss": 2.3792, - "step": 300190 - }, - { - "epoch": 0.52, - "learning_rate": 2.3824363396659424e-05, - "loss": 2.2949, - "step": 300200 - }, - { - "epoch": 0.52, - "learning_rate": 2.3823491456732598e-05, - "loss": 2.4736, - "step": 300210 - }, - { - "epoch": 0.52, - "learning_rate": 2.3822619516805772e-05, - "loss": 2.418, - "step": 300220 - }, - { - "epoch": 0.52, - "learning_rate": 2.3821747576878946e-05, - "loss": 2.4105, - "step": 300230 - }, - { - "epoch": 0.52, - "learning_rate": 2.3820875636952116e-05, - "loss": 2.4319, - "step": 300240 - }, - { - "epoch": 0.52, - "learning_rate": 2.3820003697025293e-05, - "loss": 2.3482, - "step": 300250 - }, - { - "epoch": 0.52, - "learning_rate": 2.3819131757098464e-05, - "loss": 2.375, - "step": 300260 - }, - { - "epoch": 0.52, - "learning_rate": 2.3818259817171637e-05, - "loss": 2.3268, - "step": 300270 - }, - { - "epoch": 0.52, - "learning_rate": 2.381738787724481e-05, - "loss": 2.3331, - "step": 300280 - }, - { - "epoch": 0.52, - "learning_rate": 2.3816515937317985e-05, - "loss": 2.3496, - "step": 300290 - }, - { - "epoch": 0.52, - "learning_rate": 2.381564399739116e-05, - "loss": 2.3152, - "step": 300300 - }, - { - "epoch": 0.52, - "learning_rate": 2.381477205746433e-05, - "loss": 2.2133, - "step": 300310 - }, - { - "epoch": 0.52, - "learning_rate": 2.3813900117537503e-05, - "loss": 2.4334, - "step": 300320 - }, - { - "epoch": 0.52, - "learning_rate": 2.3813028177610677e-05, - "loss": 2.3448, - "step": 300330 - }, - { - "epoch": 0.52, - "learning_rate": 2.381215623768385e-05, - "loss": 2.2927, - "step": 300340 - }, - { - "epoch": 0.52, - "learning_rate": 2.381128429775702e-05, - "loss": 2.3051, - "step": 300350 - }, - { - "epoch": 0.52, - "learning_rate": 2.3810412357830198e-05, - "loss": 2.2859, - "step": 300360 - }, - { - "epoch": 0.52, - "learning_rate": 2.3809540417903368e-05, - "loss": 2.4602, - "step": 300370 - }, - { - "epoch": 0.52, - "learning_rate": 2.3808668477976542e-05, - "loss": 2.295, - "step": 300380 - }, - { - "epoch": 0.52, - "learning_rate": 2.3807796538049716e-05, - "loss": 2.2436, - "step": 300390 - }, - { - "epoch": 0.52, - "learning_rate": 2.380692459812289e-05, - "loss": 2.3343, - "step": 300400 - }, - { - "epoch": 0.52, - "learning_rate": 2.3806052658196063e-05, - "loss": 2.3187, - "step": 300410 - }, - { - "epoch": 0.52, - "learning_rate": 2.3805180718269234e-05, - "loss": 2.4621, - "step": 300420 - }, - { - "epoch": 0.52, - "learning_rate": 2.3804308778342408e-05, - "loss": 2.3796, - "step": 300430 - }, - { - "epoch": 0.52, - "learning_rate": 2.380343683841558e-05, - "loss": 2.3807, - "step": 300440 - }, - { - "epoch": 0.52, - "learning_rate": 2.3802564898488755e-05, - "loss": 2.389, - "step": 300450 - }, - { - "epoch": 0.52, - "learning_rate": 2.380169295856193e-05, - "loss": 2.5112, - "step": 300460 - }, - { - "epoch": 0.52, - "learning_rate": 2.38008210186351e-05, - "loss": 2.3963, - "step": 300470 - }, - { - "epoch": 0.52, - "learning_rate": 2.3799949078708276e-05, - "loss": 2.3261, - "step": 300480 - }, - { - "epoch": 0.52, - "learning_rate": 2.3799077138781447e-05, - "loss": 2.348, - "step": 300490 - }, - { - "epoch": 0.52, - "learning_rate": 2.379820519885462e-05, - "loss": 2.3094, - "step": 300500 - }, - { - "epoch": 0.52, - "learning_rate": 2.3797333258927794e-05, - "loss": 2.3275, - "step": 300510 - }, - { - "epoch": 0.52, - "learning_rate": 2.3796461319000968e-05, - "loss": 2.364, - "step": 300520 - }, - { - "epoch": 0.52, - "learning_rate": 2.3795589379074142e-05, - "loss": 2.4253, - "step": 300530 - }, - { - "epoch": 0.52, - "learning_rate": 2.3794717439147312e-05, - "loss": 2.387, - "step": 300540 - }, - { - "epoch": 0.52, - "learning_rate": 2.379384549922049e-05, - "loss": 2.227, - "step": 300550 - }, - { - "epoch": 0.52, - "learning_rate": 2.379297355929366e-05, - "loss": 2.4034, - "step": 300560 - }, - { - "epoch": 0.52, - "learning_rate": 2.3792101619366834e-05, - "loss": 2.3373, - "step": 300570 - }, - { - "epoch": 0.52, - "learning_rate": 2.3791229679440004e-05, - "loss": 2.2771, - "step": 300580 - }, - { - "epoch": 0.52, - "learning_rate": 2.379035773951318e-05, - "loss": 2.4098, - "step": 300590 - }, - { - "epoch": 0.52, - "learning_rate": 2.378948579958635e-05, - "loss": 2.4892, - "step": 300600 - }, - { - "epoch": 0.52, - "learning_rate": 2.3788613859659525e-05, - "loss": 2.4271, - "step": 300610 - }, - { - "epoch": 0.52, - "learning_rate": 2.37877419197327e-05, - "loss": 2.3235, - "step": 300620 - }, - { - "epoch": 0.52, - "learning_rate": 2.3786869979805873e-05, - "loss": 2.3709, - "step": 300630 - }, - { - "epoch": 0.52, - "learning_rate": 2.3785998039879047e-05, - "loss": 2.3633, - "step": 300640 - }, - { - "epoch": 0.52, - "learning_rate": 2.3785126099952217e-05, - "loss": 2.4392, - "step": 300650 - }, - { - "epoch": 0.52, - "learning_rate": 2.3784254160025394e-05, - "loss": 2.3696, - "step": 300660 - }, - { - "epoch": 0.52, - "learning_rate": 2.3783382220098564e-05, - "loss": 2.4024, - "step": 300670 - }, - { - "epoch": 0.52, - "learning_rate": 2.3782510280171738e-05, - "loss": 2.3702, - "step": 300680 - }, - { - "epoch": 0.52, - "learning_rate": 2.3781638340244912e-05, - "loss": 2.312, - "step": 300690 - }, - { - "epoch": 0.52, - "learning_rate": 2.3780766400318086e-05, - "loss": 2.3198, - "step": 300700 - }, - { - "epoch": 0.52, - "learning_rate": 2.377989446039126e-05, - "loss": 2.3439, - "step": 300710 - }, - { - "epoch": 0.52, - "learning_rate": 2.377902252046443e-05, - "loss": 2.3563, - "step": 300720 - }, - { - "epoch": 0.52, - "learning_rate": 2.3778150580537604e-05, - "loss": 2.4317, - "step": 300730 - }, - { - "epoch": 0.52, - "learning_rate": 2.3777278640610777e-05, - "loss": 2.3422, - "step": 300740 - }, - { - "epoch": 0.52, - "learning_rate": 2.377640670068395e-05, - "loss": 2.3629, - "step": 300750 - }, - { - "epoch": 0.52, - "learning_rate": 2.377553476075712e-05, - "loss": 2.3273, - "step": 300760 - }, - { - "epoch": 0.52, - "learning_rate": 2.37746628208303e-05, - "loss": 2.3552, - "step": 300770 - }, - { - "epoch": 0.52, - "learning_rate": 2.3773790880903473e-05, - "loss": 2.3987, - "step": 300780 - }, - { - "epoch": 0.52, - "learning_rate": 2.3772918940976643e-05, - "loss": 2.4073, - "step": 300790 - }, - { - "epoch": 0.52, - "learning_rate": 2.3772047001049817e-05, - "loss": 2.408, - "step": 300800 - }, - { - "epoch": 0.52, - "learning_rate": 2.377117506112299e-05, - "loss": 2.3465, - "step": 300810 - }, - { - "epoch": 0.52, - "learning_rate": 2.3770303121196164e-05, - "loss": 2.3802, - "step": 300820 - }, - { - "epoch": 0.52, - "learning_rate": 2.3769431181269335e-05, - "loss": 2.4369, - "step": 300830 - }, - { - "epoch": 0.52, - "learning_rate": 2.376855924134251e-05, - "loss": 2.2449, - "step": 300840 - }, - { - "epoch": 0.52, - "learning_rate": 2.3767687301415682e-05, - "loss": 2.2549, - "step": 300850 - }, - { - "epoch": 0.52, - "learning_rate": 2.3766815361488856e-05, - "loss": 2.4913, - "step": 300860 - }, - { - "epoch": 0.52, - "learning_rate": 2.376594342156203e-05, - "loss": 2.2707, - "step": 300870 - }, - { - "epoch": 0.52, - "learning_rate": 2.37650714816352e-05, - "loss": 2.3875, - "step": 300880 - }, - { - "epoch": 0.52, - "learning_rate": 2.3764199541708377e-05, - "loss": 2.392, - "step": 300890 - }, - { - "epoch": 0.52, - "learning_rate": 2.3763327601781548e-05, - "loss": 2.3677, - "step": 300900 - }, - { - "epoch": 0.52, - "learning_rate": 2.376245566185472e-05, - "loss": 2.3618, - "step": 300910 - }, - { - "epoch": 0.52, - "learning_rate": 2.3761583721927895e-05, - "loss": 2.2893, - "step": 300920 - }, - { - "epoch": 0.52, - "learning_rate": 2.376071178200107e-05, - "loss": 2.3625, - "step": 300930 - }, - { - "epoch": 0.52, - "learning_rate": 2.3759839842074243e-05, - "loss": 2.422, - "step": 300940 - }, - { - "epoch": 0.52, - "learning_rate": 2.3758967902147413e-05, - "loss": 2.4033, - "step": 300950 - }, - { - "epoch": 0.52, - "learning_rate": 2.375809596222059e-05, - "loss": 2.399, - "step": 300960 - }, - { - "epoch": 0.52, - "learning_rate": 2.375722402229376e-05, - "loss": 2.4757, - "step": 300970 - }, - { - "epoch": 0.52, - "learning_rate": 2.3756352082366934e-05, - "loss": 2.4271, - "step": 300980 - }, - { - "epoch": 0.52, - "learning_rate": 2.3755480142440105e-05, - "loss": 2.3474, - "step": 300990 - }, - { - "epoch": 0.52, - "learning_rate": 2.3754608202513282e-05, - "loss": 2.3037, - "step": 301000 - }, - { - "epoch": 0.52, - "learning_rate": 2.3753736262586456e-05, - "loss": 2.3524, - "step": 301010 - }, - { - "epoch": 0.52, - "learning_rate": 2.3752864322659626e-05, - "loss": 2.4028, - "step": 301020 - }, - { - "epoch": 0.52, - "learning_rate": 2.3751992382732803e-05, - "loss": 2.3644, - "step": 301030 - }, - { - "epoch": 0.52, - "learning_rate": 2.3751120442805974e-05, - "loss": 2.4088, - "step": 301040 - }, - { - "epoch": 0.52, - "learning_rate": 2.3750248502879147e-05, - "loss": 2.2296, - "step": 301050 - }, - { - "epoch": 0.53, - "learning_rate": 2.3749376562952318e-05, - "loss": 2.4, - "step": 301060 - }, - { - "epoch": 0.53, - "learning_rate": 2.3748504623025495e-05, - "loss": 2.3954, - "step": 301070 - }, - { - "epoch": 0.53, - "learning_rate": 2.3747632683098665e-05, - "loss": 2.3123, - "step": 301080 - }, - { - "epoch": 0.53, - "learning_rate": 2.374676074317184e-05, - "loss": 2.3621, - "step": 301090 - }, - { - "epoch": 0.53, - "learning_rate": 2.3745888803245013e-05, - "loss": 2.4489, - "step": 301100 - }, - { - "epoch": 0.53, - "learning_rate": 2.3745016863318187e-05, - "loss": 2.3608, - "step": 301110 - }, - { - "epoch": 0.53, - "learning_rate": 2.374414492339136e-05, - "loss": 2.3221, - "step": 301120 - }, - { - "epoch": 0.53, - "learning_rate": 2.374327298346453e-05, - "loss": 2.3651, - "step": 301130 - }, - { - "epoch": 0.53, - "learning_rate": 2.3742401043537705e-05, - "loss": 2.3502, - "step": 301140 - }, - { - "epoch": 0.53, - "learning_rate": 2.3741529103610878e-05, - "loss": 2.4234, - "step": 301150 - }, - { - "epoch": 0.53, - "learning_rate": 2.3740657163684052e-05, - "loss": 2.3072, - "step": 301160 - }, - { - "epoch": 0.53, - "learning_rate": 2.3739785223757226e-05, - "loss": 2.3473, - "step": 301170 - }, - { - "epoch": 0.53, - "learning_rate": 2.37389132838304e-05, - "loss": 2.4013, - "step": 301180 - }, - { - "epoch": 0.53, - "learning_rate": 2.3738041343903573e-05, - "loss": 2.3067, - "step": 301190 - }, - { - "epoch": 0.53, - "learning_rate": 2.3737169403976744e-05, - "loss": 2.3212, - "step": 301200 - }, - { - "epoch": 0.53, - "learning_rate": 2.3736297464049918e-05, - "loss": 2.3003, - "step": 301210 - }, - { - "epoch": 0.53, - "learning_rate": 2.373542552412309e-05, - "loss": 2.4968, - "step": 301220 - }, - { - "epoch": 0.53, - "learning_rate": 2.3734553584196265e-05, - "loss": 2.2603, - "step": 301230 - }, - { - "epoch": 0.53, - "learning_rate": 2.3733681644269435e-05, - "loss": 2.3421, - "step": 301240 - }, - { - "epoch": 0.53, - "learning_rate": 2.373280970434261e-05, - "loss": 2.3586, - "step": 301250 - }, - { - "epoch": 0.53, - "learning_rate": 2.3731937764415786e-05, - "loss": 2.3779, - "step": 301260 - }, - { - "epoch": 0.53, - "learning_rate": 2.3731065824488957e-05, - "loss": 2.4461, - "step": 301270 - }, - { - "epoch": 0.53, - "learning_rate": 2.373019388456213e-05, - "loss": 2.3797, - "step": 301280 - }, - { - "epoch": 0.53, - "learning_rate": 2.3729321944635304e-05, - "loss": 2.3383, - "step": 301290 - }, - { - "epoch": 0.53, - "learning_rate": 2.3728450004708478e-05, - "loss": 2.3466, - "step": 301300 - }, - { - "epoch": 0.53, - "learning_rate": 2.372757806478165e-05, - "loss": 2.3369, - "step": 301310 - }, - { - "epoch": 0.53, - "learning_rate": 2.3726706124854822e-05, - "loss": 2.3702, - "step": 301320 - }, - { - "epoch": 0.53, - "learning_rate": 2.3725834184927996e-05, - "loss": 2.3259, - "step": 301330 - }, - { - "epoch": 0.53, - "learning_rate": 2.372496224500117e-05, - "loss": 2.3491, - "step": 301340 - }, - { - "epoch": 0.53, - "learning_rate": 2.3724090305074344e-05, - "loss": 2.3301, - "step": 301350 - }, - { - "epoch": 0.53, - "learning_rate": 2.3723218365147514e-05, - "loss": 2.4424, - "step": 301360 - }, - { - "epoch": 0.53, - "learning_rate": 2.372234642522069e-05, - "loss": 2.4061, - "step": 301370 - }, - { - "epoch": 0.53, - "learning_rate": 2.372147448529386e-05, - "loss": 2.2959, - "step": 301380 - }, - { - "epoch": 0.53, - "learning_rate": 2.3720602545367035e-05, - "loss": 2.3743, - "step": 301390 - }, - { - "epoch": 0.53, - "learning_rate": 2.371973060544021e-05, - "loss": 2.4235, - "step": 301400 - }, - { - "epoch": 0.53, - "learning_rate": 2.3718858665513383e-05, - "loss": 2.3331, - "step": 301410 - }, - { - "epoch": 0.53, - "learning_rate": 2.3717986725586557e-05, - "loss": 2.3316, - "step": 301420 - }, - { - "epoch": 0.53, - "learning_rate": 2.3717114785659727e-05, - "loss": 2.2949, - "step": 301430 - }, - { - "epoch": 0.53, - "learning_rate": 2.3716242845732904e-05, - "loss": 2.3935, - "step": 301440 - }, - { - "epoch": 0.53, - "learning_rate": 2.3715370905806074e-05, - "loss": 2.3381, - "step": 301450 - }, - { - "epoch": 0.53, - "learning_rate": 2.3714498965879248e-05, - "loss": 2.3822, - "step": 301460 - }, - { - "epoch": 0.53, - "learning_rate": 2.371362702595242e-05, - "loss": 2.3171, - "step": 301470 - }, - { - "epoch": 0.53, - "learning_rate": 2.3712755086025596e-05, - "loss": 2.4164, - "step": 301480 - }, - { - "epoch": 0.53, - "learning_rate": 2.3711883146098766e-05, - "loss": 2.4096, - "step": 301490 - }, - { - "epoch": 0.53, - "learning_rate": 2.371101120617194e-05, - "loss": 2.2938, - "step": 301500 - }, - { - "epoch": 0.53, - "learning_rate": 2.3710139266245114e-05, - "loss": 2.2931, - "step": 301510 - }, - { - "epoch": 0.53, - "learning_rate": 2.3709267326318287e-05, - "loss": 2.4137, - "step": 301520 - }, - { - "epoch": 0.53, - "learning_rate": 2.370839538639146e-05, - "loss": 2.3809, - "step": 301530 - }, - { - "epoch": 0.53, - "learning_rate": 2.370752344646463e-05, - "loss": 2.3434, - "step": 301540 - }, - { - "epoch": 0.53, - "learning_rate": 2.370665150653781e-05, - "loss": 2.4694, - "step": 301550 - }, - { - "epoch": 0.53, - "learning_rate": 2.370577956661098e-05, - "loss": 2.2417, - "step": 301560 - }, - { - "epoch": 0.53, - "learning_rate": 2.3704907626684153e-05, - "loss": 2.4017, - "step": 301570 - }, - { - "epoch": 0.53, - "learning_rate": 2.3704035686757327e-05, - "loss": 2.3627, - "step": 301580 - }, - { - "epoch": 0.53, - "learning_rate": 2.37031637468305e-05, - "loss": 2.2268, - "step": 301590 - }, - { - "epoch": 0.53, - "learning_rate": 2.3702291806903674e-05, - "loss": 2.3505, - "step": 301600 - }, - { - "epoch": 0.53, - "learning_rate": 2.3701419866976845e-05, - "loss": 2.2819, - "step": 301610 - }, - { - "epoch": 0.53, - "learning_rate": 2.370054792705002e-05, - "loss": 2.3852, - "step": 301620 - }, - { - "epoch": 0.53, - "learning_rate": 2.3699675987123192e-05, - "loss": 2.3472, - "step": 301630 - }, - { - "epoch": 0.53, - "learning_rate": 2.3698804047196366e-05, - "loss": 2.3174, - "step": 301640 - }, - { - "epoch": 0.53, - "learning_rate": 2.369793210726954e-05, - "loss": 2.3611, - "step": 301650 - }, - { - "epoch": 0.53, - "learning_rate": 2.369706016734271e-05, - "loss": 2.3693, - "step": 301660 - }, - { - "epoch": 0.53, - "learning_rate": 2.3696188227415887e-05, - "loss": 2.3317, - "step": 301670 - }, - { - "epoch": 0.53, - "learning_rate": 2.3695316287489058e-05, - "loss": 2.4929, - "step": 301680 - }, - { - "epoch": 0.53, - "learning_rate": 2.369444434756223e-05, - "loss": 2.4628, - "step": 301690 - }, - { - "epoch": 0.53, - "learning_rate": 2.3693572407635405e-05, - "loss": 2.3623, - "step": 301700 - }, - { - "epoch": 0.53, - "learning_rate": 2.369270046770858e-05, - "loss": 2.2643, - "step": 301710 - }, - { - "epoch": 0.53, - "learning_rate": 2.369182852778175e-05, - "loss": 2.2373, - "step": 301720 - }, - { - "epoch": 0.53, - "learning_rate": 2.3690956587854923e-05, - "loss": 2.3141, - "step": 301730 - }, - { - "epoch": 0.53, - "learning_rate": 2.36900846479281e-05, - "loss": 2.339, - "step": 301740 - }, - { - "epoch": 0.53, - "learning_rate": 2.368921270800127e-05, - "loss": 2.3962, - "step": 301750 - }, - { - "epoch": 0.53, - "learning_rate": 2.3688340768074444e-05, - "loss": 2.2081, - "step": 301760 - }, - { - "epoch": 0.53, - "learning_rate": 2.3687468828147615e-05, - "loss": 2.3665, - "step": 301770 - }, - { - "epoch": 0.53, - "learning_rate": 2.3686596888220792e-05, - "loss": 2.2939, - "step": 301780 - }, - { - "epoch": 0.53, - "learning_rate": 2.3685724948293962e-05, - "loss": 2.4688, - "step": 301790 - }, - { - "epoch": 0.53, - "learning_rate": 2.3684853008367136e-05, - "loss": 2.3763, - "step": 301800 - }, - { - "epoch": 0.53, - "learning_rate": 2.368398106844031e-05, - "loss": 2.3867, - "step": 301810 - }, - { - "epoch": 0.53, - "learning_rate": 2.3683109128513484e-05, - "loss": 2.3927, - "step": 301820 - }, - { - "epoch": 0.53, - "learning_rate": 2.3682237188586657e-05, - "loss": 2.2659, - "step": 301830 - }, - { - "epoch": 0.53, - "learning_rate": 2.3681365248659828e-05, - "loss": 2.3199, - "step": 301840 - }, - { - "epoch": 0.53, - "learning_rate": 2.3680493308733005e-05, - "loss": 2.2609, - "step": 301850 - }, - { - "epoch": 0.53, - "learning_rate": 2.3679621368806175e-05, - "loss": 2.4466, - "step": 301860 - }, - { - "epoch": 0.53, - "learning_rate": 2.367874942887935e-05, - "loss": 2.2935, - "step": 301870 - }, - { - "epoch": 0.53, - "learning_rate": 2.3677877488952523e-05, - "loss": 2.3574, - "step": 301880 - }, - { - "epoch": 0.53, - "learning_rate": 2.3677005549025697e-05, - "loss": 2.4092, - "step": 301890 - }, - { - "epoch": 0.53, - "learning_rate": 2.367613360909887e-05, - "loss": 2.4272, - "step": 301900 - }, - { - "epoch": 0.53, - "learning_rate": 2.367526166917204e-05, - "loss": 2.2743, - "step": 301910 - }, - { - "epoch": 0.53, - "learning_rate": 2.3674389729245215e-05, - "loss": 2.3377, - "step": 301920 - }, - { - "epoch": 0.53, - "learning_rate": 2.367351778931839e-05, - "loss": 2.3911, - "step": 301930 - }, - { - "epoch": 0.53, - "learning_rate": 2.3672645849391562e-05, - "loss": 2.3702, - "step": 301940 - }, - { - "epoch": 0.53, - "learning_rate": 2.3671773909464732e-05, - "loss": 2.4448, - "step": 301950 - }, - { - "epoch": 0.53, - "learning_rate": 2.367090196953791e-05, - "loss": 2.3374, - "step": 301960 - }, - { - "epoch": 0.53, - "learning_rate": 2.367003002961108e-05, - "loss": 2.3366, - "step": 301970 - }, - { - "epoch": 0.53, - "learning_rate": 2.3669158089684254e-05, - "loss": 2.2965, - "step": 301980 - }, - { - "epoch": 0.53, - "learning_rate": 2.3668286149757428e-05, - "loss": 2.3242, - "step": 301990 - }, - { - "epoch": 0.53, - "learning_rate": 2.36674142098306e-05, - "loss": 2.3807, - "step": 302000 - }, - { - "epoch": 0.53, - "learning_rate": 2.3666542269903775e-05, - "loss": 2.2452, - "step": 302010 - }, - { - "epoch": 0.53, - "learning_rate": 2.3665670329976945e-05, - "loss": 2.3459, - "step": 302020 - }, - { - "epoch": 0.53, - "learning_rate": 2.366479839005012e-05, - "loss": 2.4356, - "step": 302030 - }, - { - "epoch": 0.53, - "learning_rate": 2.3663926450123293e-05, - "loss": 2.4115, - "step": 302040 - }, - { - "epoch": 0.53, - "learning_rate": 2.3663054510196467e-05, - "loss": 2.3268, - "step": 302050 - }, - { - "epoch": 0.53, - "learning_rate": 2.366218257026964e-05, - "loss": 2.3882, - "step": 302060 - }, - { - "epoch": 0.53, - "learning_rate": 2.366131063034281e-05, - "loss": 2.3759, - "step": 302070 - }, - { - "epoch": 0.53, - "learning_rate": 2.3660438690415988e-05, - "loss": 2.4027, - "step": 302080 - }, - { - "epoch": 0.53, - "learning_rate": 2.365956675048916e-05, - "loss": 2.392, - "step": 302090 - }, - { - "epoch": 0.53, - "learning_rate": 2.3658694810562332e-05, - "loss": 2.2918, - "step": 302100 - }, - { - "epoch": 0.53, - "learning_rate": 2.3657822870635506e-05, - "loss": 2.334, - "step": 302110 - }, - { - "epoch": 0.53, - "learning_rate": 2.365695093070868e-05, - "loss": 2.3081, - "step": 302120 - }, - { - "epoch": 0.53, - "learning_rate": 2.3656078990781854e-05, - "loss": 2.3328, - "step": 302130 - }, - { - "epoch": 0.53, - "learning_rate": 2.3655207050855024e-05, - "loss": 2.3392, - "step": 302140 - }, - { - "epoch": 0.53, - "learning_rate": 2.36543351109282e-05, - "loss": 2.2693, - "step": 302150 - }, - { - "epoch": 0.53, - "learning_rate": 2.365346317100137e-05, - "loss": 2.4263, - "step": 302160 - }, - { - "epoch": 0.53, - "learning_rate": 2.3652591231074545e-05, - "loss": 2.3253, - "step": 302170 - }, - { - "epoch": 0.53, - "learning_rate": 2.3651719291147716e-05, - "loss": 2.3192, - "step": 302180 - }, - { - "epoch": 0.53, - "learning_rate": 2.3650847351220893e-05, - "loss": 2.323, - "step": 302190 - }, - { - "epoch": 0.53, - "learning_rate": 2.3649975411294063e-05, - "loss": 2.4138, - "step": 302200 - }, - { - "epoch": 0.53, - "learning_rate": 2.3649103471367237e-05, - "loss": 2.4864, - "step": 302210 - }, - { - "epoch": 0.53, - "learning_rate": 2.364823153144041e-05, - "loss": 2.4626, - "step": 302220 - }, - { - "epoch": 0.53, - "learning_rate": 2.3647359591513584e-05, - "loss": 2.3358, - "step": 302230 - }, - { - "epoch": 0.53, - "learning_rate": 2.3646487651586758e-05, - "loss": 2.3601, - "step": 302240 - }, - { - "epoch": 0.53, - "learning_rate": 2.364561571165993e-05, - "loss": 2.3502, - "step": 302250 - }, - { - "epoch": 0.53, - "learning_rate": 2.3644743771733106e-05, - "loss": 2.3826, - "step": 302260 - }, - { - "epoch": 0.53, - "learning_rate": 2.3643871831806276e-05, - "loss": 2.32, - "step": 302270 - }, - { - "epoch": 0.53, - "learning_rate": 2.364299989187945e-05, - "loss": 2.3522, - "step": 302280 - }, - { - "epoch": 0.53, - "learning_rate": 2.3642127951952624e-05, - "loss": 2.3688, - "step": 302290 - }, - { - "epoch": 0.53, - "learning_rate": 2.3641256012025797e-05, - "loss": 2.4282, - "step": 302300 - }, - { - "epoch": 0.53, - "learning_rate": 2.364038407209897e-05, - "loss": 2.3648, - "step": 302310 - }, - { - "epoch": 0.53, - "learning_rate": 2.363951213217214e-05, - "loss": 2.3078, - "step": 302320 - }, - { - "epoch": 0.53, - "learning_rate": 2.3638640192245315e-05, - "loss": 2.3681, - "step": 302330 - }, - { - "epoch": 0.53, - "learning_rate": 2.363776825231849e-05, - "loss": 2.3421, - "step": 302340 - }, - { - "epoch": 0.53, - "learning_rate": 2.3636896312391663e-05, - "loss": 2.3005, - "step": 302350 - }, - { - "epoch": 0.53, - "learning_rate": 2.3636024372464837e-05, - "loss": 2.3122, - "step": 302360 - }, - { - "epoch": 0.53, - "learning_rate": 2.363515243253801e-05, - "loss": 2.4796, - "step": 302370 - }, - { - "epoch": 0.53, - "learning_rate": 2.3634280492611184e-05, - "loss": 2.3926, - "step": 302380 - }, - { - "epoch": 0.53, - "learning_rate": 2.3633408552684355e-05, - "loss": 2.3787, - "step": 302390 - }, - { - "epoch": 0.53, - "learning_rate": 2.363253661275753e-05, - "loss": 2.3531, - "step": 302400 - }, - { - "epoch": 0.53, - "learning_rate": 2.3631664672830702e-05, - "loss": 2.2262, - "step": 302410 - }, - { - "epoch": 0.53, - "learning_rate": 2.3630792732903876e-05, - "loss": 2.2417, - "step": 302420 - }, - { - "epoch": 0.53, - "learning_rate": 2.3629920792977046e-05, - "loss": 2.3424, - "step": 302430 - }, - { - "epoch": 0.53, - "learning_rate": 2.362904885305022e-05, - "loss": 2.3652, - "step": 302440 - }, - { - "epoch": 0.53, - "learning_rate": 2.3628176913123394e-05, - "loss": 2.3944, - "step": 302450 - }, - { - "epoch": 0.53, - "learning_rate": 2.3627304973196568e-05, - "loss": 2.4333, - "step": 302460 - }, - { - "epoch": 0.53, - "learning_rate": 2.362643303326974e-05, - "loss": 2.2318, - "step": 302470 - }, - { - "epoch": 0.53, - "learning_rate": 2.3625561093342915e-05, - "loss": 2.3402, - "step": 302480 - }, - { - "epoch": 0.53, - "learning_rate": 2.362468915341609e-05, - "loss": 2.3971, - "step": 302490 - }, - { - "epoch": 0.53, - "learning_rate": 2.362381721348926e-05, - "loss": 2.4744, - "step": 302500 - }, - { - "epoch": 0.53, - "learning_rate": 2.3622945273562433e-05, - "loss": 2.4682, - "step": 302510 - }, - { - "epoch": 0.53, - "learning_rate": 2.3622073333635607e-05, - "loss": 2.4122, - "step": 302520 - }, - { - "epoch": 0.53, - "learning_rate": 2.362120139370878e-05, - "loss": 2.2915, - "step": 302530 - }, - { - "epoch": 0.53, - "learning_rate": 2.3620329453781954e-05, - "loss": 2.3859, - "step": 302540 - }, - { - "epoch": 0.53, - "learning_rate": 2.3619457513855125e-05, - "loss": 2.4158, - "step": 302550 - }, - { - "epoch": 0.53, - "learning_rate": 2.3618585573928302e-05, - "loss": 2.366, - "step": 302560 - }, - { - "epoch": 0.53, - "learning_rate": 2.3617713634001472e-05, - "loss": 2.4249, - "step": 302570 - }, - { - "epoch": 0.53, - "learning_rate": 2.3616841694074646e-05, - "loss": 2.3413, - "step": 302580 - }, - { - "epoch": 0.53, - "learning_rate": 2.3615969754147816e-05, - "loss": 2.4553, - "step": 302590 - }, - { - "epoch": 0.53, - "learning_rate": 2.3615097814220994e-05, - "loss": 2.4527, - "step": 302600 - }, - { - "epoch": 0.53, - "learning_rate": 2.3614225874294167e-05, - "loss": 2.4346, - "step": 302610 - }, - { - "epoch": 0.53, - "learning_rate": 2.3613353934367338e-05, - "loss": 2.3573, - "step": 302620 - }, - { - "epoch": 0.53, - "learning_rate": 2.3612481994440515e-05, - "loss": 2.3721, - "step": 302630 - }, - { - "epoch": 0.53, - "learning_rate": 2.3611610054513685e-05, - "loss": 2.2834, - "step": 302640 - }, - { - "epoch": 0.53, - "learning_rate": 2.361073811458686e-05, - "loss": 2.3909, - "step": 302650 - }, - { - "epoch": 0.53, - "learning_rate": 2.360986617466003e-05, - "loss": 2.3229, - "step": 302660 - }, - { - "epoch": 0.53, - "learning_rate": 2.3608994234733207e-05, - "loss": 2.238, - "step": 302670 - }, - { - "epoch": 0.53, - "learning_rate": 2.3608122294806377e-05, - "loss": 2.271, - "step": 302680 - }, - { - "epoch": 0.53, - "learning_rate": 2.360725035487955e-05, - "loss": 2.3317, - "step": 302690 - }, - { - "epoch": 0.53, - "learning_rate": 2.3606378414952725e-05, - "loss": 2.3896, - "step": 302700 - }, - { - "epoch": 0.53, - "learning_rate": 2.36055064750259e-05, - "loss": 2.3822, - "step": 302710 - }, - { - "epoch": 0.53, - "learning_rate": 2.3604634535099072e-05, - "loss": 2.2804, - "step": 302720 - }, - { - "epoch": 0.53, - "learning_rate": 2.3603762595172242e-05, - "loss": 2.2609, - "step": 302730 - }, - { - "epoch": 0.53, - "learning_rate": 2.3602890655245416e-05, - "loss": 2.4344, - "step": 302740 - }, - { - "epoch": 0.53, - "learning_rate": 2.360201871531859e-05, - "loss": 2.2908, - "step": 302750 - }, - { - "epoch": 0.53, - "learning_rate": 2.3601146775391764e-05, - "loss": 2.3295, - "step": 302760 - }, - { - "epoch": 0.53, - "learning_rate": 2.3600274835464938e-05, - "loss": 2.3276, - "step": 302770 - }, - { - "epoch": 0.53, - "learning_rate": 2.359940289553811e-05, - "loss": 2.3563, - "step": 302780 - }, - { - "epoch": 0.53, - "learning_rate": 2.3598530955611285e-05, - "loss": 2.3687, - "step": 302790 - }, - { - "epoch": 0.53, - "learning_rate": 2.3597659015684455e-05, - "loss": 2.3655, - "step": 302800 - }, - { - "epoch": 0.53, - "learning_rate": 2.359678707575763e-05, - "loss": 2.3339, - "step": 302810 - }, - { - "epoch": 0.53, - "learning_rate": 2.3595915135830803e-05, - "loss": 2.2707, - "step": 302820 - }, - { - "epoch": 0.53, - "learning_rate": 2.3595043195903977e-05, - "loss": 2.3334, - "step": 302830 - }, - { - "epoch": 0.53, - "learning_rate": 2.3594171255977147e-05, - "loss": 2.3031, - "step": 302840 - }, - { - "epoch": 0.53, - "learning_rate": 2.359329931605032e-05, - "loss": 2.3998, - "step": 302850 - }, - { - "epoch": 0.53, - "learning_rate": 2.3592427376123498e-05, - "loss": 2.3254, - "step": 302860 - }, - { - "epoch": 0.53, - "learning_rate": 2.359155543619667e-05, - "loss": 2.3816, - "step": 302870 - }, - { - "epoch": 0.53, - "learning_rate": 2.3590683496269842e-05, - "loss": 2.4089, - "step": 302880 - }, - { - "epoch": 0.53, - "learning_rate": 2.3589811556343016e-05, - "loss": 2.3967, - "step": 302890 - }, - { - "epoch": 0.53, - "learning_rate": 2.358893961641619e-05, - "loss": 2.4391, - "step": 302900 - }, - { - "epoch": 0.53, - "learning_rate": 2.358806767648936e-05, - "loss": 2.422, - "step": 302910 - }, - { - "epoch": 0.53, - "learning_rate": 2.3587195736562534e-05, - "loss": 2.4401, - "step": 302920 - }, - { - "epoch": 0.53, - "learning_rate": 2.3586323796635708e-05, - "loss": 2.3831, - "step": 302930 - }, - { - "epoch": 0.53, - "learning_rate": 2.358545185670888e-05, - "loss": 2.4387, - "step": 302940 - }, - { - "epoch": 0.53, - "learning_rate": 2.3584579916782055e-05, - "loss": 2.3418, - "step": 302950 - }, - { - "epoch": 0.53, - "learning_rate": 2.3583707976855226e-05, - "loss": 2.256, - "step": 302960 - }, - { - "epoch": 0.53, - "learning_rate": 2.3582836036928403e-05, - "loss": 2.4634, - "step": 302970 - }, - { - "epoch": 0.53, - "learning_rate": 2.3581964097001573e-05, - "loss": 2.2971, - "step": 302980 - }, - { - "epoch": 0.53, - "learning_rate": 2.3581092157074747e-05, - "loss": 2.3762, - "step": 302990 - }, - { - "epoch": 0.53, - "learning_rate": 2.358022021714792e-05, - "loss": 2.3146, - "step": 303000 - }, - { - "epoch": 0.53, - "learning_rate": 2.3579348277221094e-05, - "loss": 2.3465, - "step": 303010 - }, - { - "epoch": 0.53, - "learning_rate": 2.3578476337294268e-05, - "loss": 2.3544, - "step": 303020 - }, - { - "epoch": 0.53, - "learning_rate": 2.357760439736744e-05, - "loss": 2.2447, - "step": 303030 - }, - { - "epoch": 0.53, - "learning_rate": 2.3576732457440616e-05, - "loss": 2.3749, - "step": 303040 - }, - { - "epoch": 0.53, - "learning_rate": 2.3575860517513786e-05, - "loss": 2.2887, - "step": 303050 - }, - { - "epoch": 0.53, - "learning_rate": 2.357498857758696e-05, - "loss": 2.2695, - "step": 303060 - }, - { - "epoch": 0.53, - "learning_rate": 2.357411663766013e-05, - "loss": 2.3104, - "step": 303070 - }, - { - "epoch": 0.53, - "learning_rate": 2.3573244697733307e-05, - "loss": 2.3493, - "step": 303080 - }, - { - "epoch": 0.53, - "learning_rate": 2.357237275780648e-05, - "loss": 2.4712, - "step": 303090 - }, - { - "epoch": 0.53, - "learning_rate": 2.357150081787965e-05, - "loss": 2.3411, - "step": 303100 - }, - { - "epoch": 0.53, - "learning_rate": 2.3570628877952825e-05, - "loss": 2.3155, - "step": 303110 - }, - { - "epoch": 0.53, - "learning_rate": 2.3569756938026e-05, - "loss": 2.4119, - "step": 303120 - }, - { - "epoch": 0.53, - "learning_rate": 2.3568884998099173e-05, - "loss": 2.4102, - "step": 303130 - }, - { - "epoch": 0.53, - "learning_rate": 2.3568013058172343e-05, - "loss": 2.3576, - "step": 303140 - }, - { - "epoch": 0.53, - "learning_rate": 2.356714111824552e-05, - "loss": 2.4071, - "step": 303150 - }, - { - "epoch": 0.53, - "learning_rate": 2.356626917831869e-05, - "loss": 2.4162, - "step": 303160 - }, - { - "epoch": 0.53, - "learning_rate": 2.3565397238391865e-05, - "loss": 2.2413, - "step": 303170 - }, - { - "epoch": 0.53, - "learning_rate": 2.356452529846504e-05, - "loss": 2.363, - "step": 303180 - }, - { - "epoch": 0.53, - "learning_rate": 2.3563653358538212e-05, - "loss": 2.2569, - "step": 303190 - }, - { - "epoch": 0.53, - "learning_rate": 2.3562781418611386e-05, - "loss": 2.3314, - "step": 303200 - }, - { - "epoch": 0.53, - "learning_rate": 2.3561909478684556e-05, - "loss": 2.3624, - "step": 303210 - }, - { - "epoch": 0.53, - "learning_rate": 2.356103753875773e-05, - "loss": 2.3272, - "step": 303220 - }, - { - "epoch": 0.53, - "learning_rate": 2.3560165598830904e-05, - "loss": 2.3366, - "step": 303230 - }, - { - "epoch": 0.53, - "learning_rate": 2.3559293658904078e-05, - "loss": 2.3012, - "step": 303240 - }, - { - "epoch": 0.53, - "learning_rate": 2.355842171897725e-05, - "loss": 2.3195, - "step": 303250 - }, - { - "epoch": 0.53, - "learning_rate": 2.3557549779050422e-05, - "loss": 2.3298, - "step": 303260 - }, - { - "epoch": 0.53, - "learning_rate": 2.35566778391236e-05, - "loss": 2.3087, - "step": 303270 - }, - { - "epoch": 0.53, - "learning_rate": 2.355580589919677e-05, - "loss": 2.3167, - "step": 303280 - }, - { - "epoch": 0.53, - "learning_rate": 2.3554933959269943e-05, - "loss": 2.2715, - "step": 303290 - }, - { - "epoch": 0.53, - "learning_rate": 2.3554062019343117e-05, - "loss": 2.291, - "step": 303300 - }, - { - "epoch": 0.53, - "learning_rate": 2.355319007941629e-05, - "loss": 2.4339, - "step": 303310 - }, - { - "epoch": 0.53, - "learning_rate": 2.355231813948946e-05, - "loss": 2.426, - "step": 303320 - }, - { - "epoch": 0.53, - "learning_rate": 2.3551446199562635e-05, - "loss": 2.3288, - "step": 303330 - }, - { - "epoch": 0.53, - "learning_rate": 2.3550574259635812e-05, - "loss": 2.304, - "step": 303340 - }, - { - "epoch": 0.53, - "learning_rate": 2.3549702319708982e-05, - "loss": 2.2892, - "step": 303350 - }, - { - "epoch": 0.53, - "learning_rate": 2.3548830379782156e-05, - "loss": 2.3325, - "step": 303360 - }, - { - "epoch": 0.53, - "learning_rate": 2.3547958439855326e-05, - "loss": 2.3765, - "step": 303370 - }, - { - "epoch": 0.53, - "learning_rate": 2.3547086499928504e-05, - "loss": 2.366, - "step": 303380 - }, - { - "epoch": 0.53, - "learning_rate": 2.3546214560001674e-05, - "loss": 2.3492, - "step": 303390 - }, - { - "epoch": 0.53, - "learning_rate": 2.3545342620074848e-05, - "loss": 2.354, - "step": 303400 - }, - { - "epoch": 0.53, - "learning_rate": 2.354447068014802e-05, - "loss": 2.3466, - "step": 303410 - }, - { - "epoch": 0.53, - "learning_rate": 2.3543598740221195e-05, - "loss": 2.4431, - "step": 303420 - }, - { - "epoch": 0.53, - "learning_rate": 2.354272680029437e-05, - "loss": 2.3349, - "step": 303430 - }, - { - "epoch": 0.53, - "learning_rate": 2.354185486036754e-05, - "loss": 2.2902, - "step": 303440 - }, - { - "epoch": 0.53, - "learning_rate": 2.3540982920440717e-05, - "loss": 2.31, - "step": 303450 - }, - { - "epoch": 0.53, - "learning_rate": 2.3540110980513887e-05, - "loss": 2.267, - "step": 303460 - }, - { - "epoch": 0.53, - "learning_rate": 2.353923904058706e-05, - "loss": 2.4542, - "step": 303470 - }, - { - "epoch": 0.53, - "learning_rate": 2.3538367100660235e-05, - "loss": 2.2184, - "step": 303480 - }, - { - "epoch": 0.53, - "learning_rate": 2.353749516073341e-05, - "loss": 2.2979, - "step": 303490 - }, - { - "epoch": 0.53, - "learning_rate": 2.3536623220806582e-05, - "loss": 2.4383, - "step": 303500 - }, - { - "epoch": 0.53, - "learning_rate": 2.3535751280879752e-05, - "loss": 2.3656, - "step": 303510 - }, - { - "epoch": 0.53, - "learning_rate": 2.3534879340952926e-05, - "loss": 2.4111, - "step": 303520 - }, - { - "epoch": 0.53, - "learning_rate": 2.35340074010261e-05, - "loss": 2.2684, - "step": 303530 - }, - { - "epoch": 0.53, - "learning_rate": 2.3533135461099274e-05, - "loss": 2.279, - "step": 303540 - }, - { - "epoch": 0.53, - "learning_rate": 2.3532263521172444e-05, - "loss": 2.3443, - "step": 303550 - }, - { - "epoch": 0.53, - "learning_rate": 2.353139158124562e-05, - "loss": 2.385, - "step": 303560 - }, - { - "epoch": 0.53, - "learning_rate": 2.3530519641318792e-05, - "loss": 2.4572, - "step": 303570 - }, - { - "epoch": 0.53, - "learning_rate": 2.3529647701391965e-05, - "loss": 2.3667, - "step": 303580 - }, - { - "epoch": 0.53, - "learning_rate": 2.352877576146514e-05, - "loss": 2.2884, - "step": 303590 - }, - { - "epoch": 0.53, - "learning_rate": 2.3527903821538313e-05, - "loss": 2.413, - "step": 303600 - }, - { - "epoch": 0.53, - "learning_rate": 2.3527031881611487e-05, - "loss": 2.3865, - "step": 303610 - }, - { - "epoch": 0.53, - "learning_rate": 2.3526159941684657e-05, - "loss": 2.4123, - "step": 303620 - }, - { - "epoch": 0.53, - "learning_rate": 2.352528800175783e-05, - "loss": 2.4341, - "step": 303630 - }, - { - "epoch": 0.53, - "learning_rate": 2.3524416061831005e-05, - "loss": 2.2489, - "step": 303640 - }, - { - "epoch": 0.53, - "learning_rate": 2.352354412190418e-05, - "loss": 2.3324, - "step": 303650 - }, - { - "epoch": 0.53, - "learning_rate": 2.3522672181977352e-05, - "loss": 2.4473, - "step": 303660 - }, - { - "epoch": 0.53, - "learning_rate": 2.3521800242050523e-05, - "loss": 2.3907, - "step": 303670 - }, - { - "epoch": 0.53, - "learning_rate": 2.35209283021237e-05, - "loss": 2.3835, - "step": 303680 - }, - { - "epoch": 0.53, - "learning_rate": 2.352005636219687e-05, - "loss": 2.3881, - "step": 303690 - }, - { - "epoch": 0.53, - "learning_rate": 2.3519184422270044e-05, - "loss": 2.3996, - "step": 303700 - }, - { - "epoch": 0.53, - "learning_rate": 2.3518312482343218e-05, - "loss": 2.3181, - "step": 303710 - }, - { - "epoch": 0.53, - "learning_rate": 2.351744054241639e-05, - "loss": 2.4368, - "step": 303720 - }, - { - "epoch": 0.53, - "learning_rate": 2.3516568602489565e-05, - "loss": 2.3566, - "step": 303730 - }, - { - "epoch": 0.53, - "learning_rate": 2.3515696662562736e-05, - "loss": 2.3347, - "step": 303740 - }, - { - "epoch": 0.53, - "learning_rate": 2.3514824722635913e-05, - "loss": 2.368, - "step": 303750 - }, - { - "epoch": 0.53, - "learning_rate": 2.3513952782709083e-05, - "loss": 2.3518, - "step": 303760 - }, - { - "epoch": 0.53, - "learning_rate": 2.3513080842782257e-05, - "loss": 2.2735, - "step": 303770 - }, - { - "epoch": 0.53, - "learning_rate": 2.3512208902855427e-05, - "loss": 2.3975, - "step": 303780 - }, - { - "epoch": 0.53, - "learning_rate": 2.3511336962928604e-05, - "loss": 2.3155, - "step": 303790 - }, - { - "epoch": 0.53, - "learning_rate": 2.3510465023001775e-05, - "loss": 2.3138, - "step": 303800 - }, - { - "epoch": 0.53, - "learning_rate": 2.350959308307495e-05, - "loss": 2.42, - "step": 303810 - }, - { - "epoch": 0.53, - "learning_rate": 2.3508721143148126e-05, - "loss": 2.4714, - "step": 303820 - }, - { - "epoch": 0.53, - "learning_rate": 2.3507849203221296e-05, - "loss": 2.3024, - "step": 303830 - }, - { - "epoch": 0.53, - "learning_rate": 2.350697726329447e-05, - "loss": 2.4194, - "step": 303840 - }, - { - "epoch": 0.53, - "learning_rate": 2.350610532336764e-05, - "loss": 2.4333, - "step": 303850 - }, - { - "epoch": 0.53, - "learning_rate": 2.3505233383440817e-05, - "loss": 2.4367, - "step": 303860 - }, - { - "epoch": 0.53, - "learning_rate": 2.3504361443513988e-05, - "loss": 2.4282, - "step": 303870 - }, - { - "epoch": 0.53, - "learning_rate": 2.350348950358716e-05, - "loss": 2.396, - "step": 303880 - }, - { - "epoch": 0.53, - "learning_rate": 2.3502617563660335e-05, - "loss": 2.2664, - "step": 303890 - }, - { - "epoch": 0.53, - "learning_rate": 2.350174562373351e-05, - "loss": 2.3142, - "step": 303900 - }, - { - "epoch": 0.53, - "learning_rate": 2.3500873683806683e-05, - "loss": 2.3224, - "step": 303910 - }, - { - "epoch": 0.53, - "learning_rate": 2.3500001743879853e-05, - "loss": 2.3727, - "step": 303920 - }, - { - "epoch": 0.53, - "learning_rate": 2.3499129803953027e-05, - "loss": 2.3613, - "step": 303930 - }, - { - "epoch": 0.53, - "learning_rate": 2.34982578640262e-05, - "loss": 2.3297, - "step": 303940 - }, - { - "epoch": 0.53, - "learning_rate": 2.3497385924099375e-05, - "loss": 2.4179, - "step": 303950 - }, - { - "epoch": 0.53, - "learning_rate": 2.349651398417255e-05, - "loss": 2.4246, - "step": 303960 - }, - { - "epoch": 0.53, - "learning_rate": 2.3495642044245722e-05, - "loss": 2.2693, - "step": 303970 - }, - { - "epoch": 0.53, - "learning_rate": 2.3494770104318896e-05, - "loss": 2.2915, - "step": 303980 - }, - { - "epoch": 0.53, - "learning_rate": 2.3493898164392066e-05, - "loss": 2.281, - "step": 303990 - }, - { - "epoch": 0.53, - "learning_rate": 2.349302622446524e-05, - "loss": 2.3728, - "step": 304000 - }, - { - "epoch": 0.53, - "learning_rate": 2.3492154284538414e-05, - "loss": 2.4526, - "step": 304010 - }, - { - "epoch": 0.53, - "learning_rate": 2.3491282344611588e-05, - "loss": 2.4209, - "step": 304020 - }, - { - "epoch": 0.53, - "learning_rate": 2.3490410404684758e-05, - "loss": 2.3715, - "step": 304030 - }, - { - "epoch": 0.53, - "learning_rate": 2.3489538464757932e-05, - "loss": 2.3712, - "step": 304040 - }, - { - "epoch": 0.53, - "learning_rate": 2.3488666524831106e-05, - "loss": 2.3466, - "step": 304050 - }, - { - "epoch": 0.53, - "learning_rate": 2.348779458490428e-05, - "loss": 2.3539, - "step": 304060 - }, - { - "epoch": 0.53, - "learning_rate": 2.3486922644977453e-05, - "loss": 2.3372, - "step": 304070 - }, - { - "epoch": 0.53, - "learning_rate": 2.3486050705050627e-05, - "loss": 2.3369, - "step": 304080 - }, - { - "epoch": 0.53, - "learning_rate": 2.34851787651238e-05, - "loss": 2.2873, - "step": 304090 - }, - { - "epoch": 0.53, - "learning_rate": 2.348430682519697e-05, - "loss": 2.4244, - "step": 304100 - }, - { - "epoch": 0.53, - "learning_rate": 2.3483434885270145e-05, - "loss": 2.4921, - "step": 304110 - }, - { - "epoch": 0.53, - "learning_rate": 2.348256294534332e-05, - "loss": 2.3877, - "step": 304120 - }, - { - "epoch": 0.53, - "learning_rate": 2.3481691005416492e-05, - "loss": 2.3785, - "step": 304130 - }, - { - "epoch": 0.53, - "learning_rate": 2.3480819065489666e-05, - "loss": 2.3163, - "step": 304140 - }, - { - "epoch": 0.53, - "learning_rate": 2.3479947125562836e-05, - "loss": 2.2604, - "step": 304150 - }, - { - "epoch": 0.53, - "learning_rate": 2.3479075185636014e-05, - "loss": 2.3488, - "step": 304160 - }, - { - "epoch": 0.53, - "learning_rate": 2.3478203245709184e-05, - "loss": 2.4512, - "step": 304170 - }, - { - "epoch": 0.53, - "learning_rate": 2.3477331305782358e-05, - "loss": 2.3333, - "step": 304180 - }, - { - "epoch": 0.53, - "learning_rate": 2.3476459365855528e-05, - "loss": 2.4232, - "step": 304190 - }, - { - "epoch": 0.53, - "learning_rate": 2.3475587425928705e-05, - "loss": 2.3311, - "step": 304200 - }, - { - "epoch": 0.53, - "learning_rate": 2.347471548600188e-05, - "loss": 2.3077, - "step": 304210 - }, - { - "epoch": 0.53, - "learning_rate": 2.347384354607505e-05, - "loss": 2.3061, - "step": 304220 - }, - { - "epoch": 0.53, - "learning_rate": 2.3472971606148227e-05, - "loss": 2.4134, - "step": 304230 - }, - { - "epoch": 0.53, - "learning_rate": 2.3472099666221397e-05, - "loss": 2.25, - "step": 304240 - }, - { - "epoch": 0.53, - "learning_rate": 2.347122772629457e-05, - "loss": 2.3004, - "step": 304250 - }, - { - "epoch": 0.53, - "learning_rate": 2.347035578636774e-05, - "loss": 2.4141, - "step": 304260 - }, - { - "epoch": 0.53, - "learning_rate": 2.346948384644092e-05, - "loss": 2.33, - "step": 304270 - }, - { - "epoch": 0.53, - "learning_rate": 2.346861190651409e-05, - "loss": 2.4411, - "step": 304280 - }, - { - "epoch": 0.53, - "learning_rate": 2.3467739966587262e-05, - "loss": 2.3422, - "step": 304290 - }, - { - "epoch": 0.53, - "learning_rate": 2.3466868026660436e-05, - "loss": 2.2222, - "step": 304300 - }, - { - "epoch": 0.53, - "learning_rate": 2.346599608673361e-05, - "loss": 2.4453, - "step": 304310 - }, - { - "epoch": 0.53, - "learning_rate": 2.3465124146806784e-05, - "loss": 2.4185, - "step": 304320 - }, - { - "epoch": 0.53, - "learning_rate": 2.3464252206879954e-05, - "loss": 2.3602, - "step": 304330 - }, - { - "epoch": 0.53, - "learning_rate": 2.3463380266953128e-05, - "loss": 2.3201, - "step": 304340 - }, - { - "epoch": 0.53, - "learning_rate": 2.3462508327026302e-05, - "loss": 2.2294, - "step": 304350 - }, - { - "epoch": 0.53, - "learning_rate": 2.3461636387099475e-05, - "loss": 2.2797, - "step": 304360 - }, - { - "epoch": 0.53, - "learning_rate": 2.346076444717265e-05, - "loss": 2.2957, - "step": 304370 - }, - { - "epoch": 0.53, - "learning_rate": 2.3459892507245823e-05, - "loss": 2.416, - "step": 304380 - }, - { - "epoch": 0.53, - "learning_rate": 2.3459020567318997e-05, - "loss": 2.4102, - "step": 304390 - }, - { - "epoch": 0.53, - "learning_rate": 2.3458148627392167e-05, - "loss": 2.3246, - "step": 304400 - }, - { - "epoch": 0.53, - "learning_rate": 2.345727668746534e-05, - "loss": 2.3112, - "step": 304410 - }, - { - "epoch": 0.53, - "learning_rate": 2.3456404747538515e-05, - "loss": 2.2904, - "step": 304420 - }, - { - "epoch": 0.53, - "learning_rate": 2.345553280761169e-05, - "loss": 2.3722, - "step": 304430 - }, - { - "epoch": 0.53, - "learning_rate": 2.3454660867684862e-05, - "loss": 2.4106, - "step": 304440 - }, - { - "epoch": 0.53, - "learning_rate": 2.3453788927758033e-05, - "loss": 2.2869, - "step": 304450 - }, - { - "epoch": 0.53, - "learning_rate": 2.345291698783121e-05, - "loss": 2.3706, - "step": 304460 - }, - { - "epoch": 0.53, - "learning_rate": 2.345204504790438e-05, - "loss": 2.4087, - "step": 304470 - }, - { - "epoch": 0.53, - "learning_rate": 2.3451173107977554e-05, - "loss": 2.4137, - "step": 304480 - }, - { - "epoch": 0.53, - "learning_rate": 2.3450301168050728e-05, - "loss": 2.4359, - "step": 304490 - }, - { - "epoch": 0.53, - "learning_rate": 2.34494292281239e-05, - "loss": 2.3714, - "step": 304500 - }, - { - "epoch": 0.53, - "learning_rate": 2.3448557288197072e-05, - "loss": 2.3223, - "step": 304510 - }, - { - "epoch": 0.53, - "learning_rate": 2.3447685348270246e-05, - "loss": 2.4282, - "step": 304520 - }, - { - "epoch": 0.53, - "learning_rate": 2.344681340834342e-05, - "loss": 2.3701, - "step": 304530 - }, - { - "epoch": 0.53, - "learning_rate": 2.3445941468416593e-05, - "loss": 2.418, - "step": 304540 - }, - { - "epoch": 0.53, - "learning_rate": 2.3445069528489767e-05, - "loss": 2.2299, - "step": 304550 - }, - { - "epoch": 0.53, - "learning_rate": 2.3444197588562937e-05, - "loss": 2.4502, - "step": 304560 - }, - { - "epoch": 0.53, - "learning_rate": 2.3443325648636114e-05, - "loss": 2.4466, - "step": 304570 - }, - { - "epoch": 0.53, - "learning_rate": 2.3442453708709285e-05, - "loss": 2.3124, - "step": 304580 - }, - { - "epoch": 0.53, - "learning_rate": 2.344158176878246e-05, - "loss": 2.2952, - "step": 304590 - }, - { - "epoch": 0.53, - "learning_rate": 2.3440709828855632e-05, - "loss": 2.3238, - "step": 304600 - }, - { - "epoch": 0.53, - "learning_rate": 2.3439837888928806e-05, - "loss": 2.3543, - "step": 304610 - }, - { - "epoch": 0.53, - "learning_rate": 2.343896594900198e-05, - "loss": 2.3704, - "step": 304620 - }, - { - "epoch": 0.53, - "learning_rate": 2.343809400907515e-05, - "loss": 2.2783, - "step": 304630 - }, - { - "epoch": 0.53, - "learning_rate": 2.3437222069148327e-05, - "loss": 2.4493, - "step": 304640 - }, - { - "epoch": 0.53, - "learning_rate": 2.3436350129221498e-05, - "loss": 2.3167, - "step": 304650 - }, - { - "epoch": 0.53, - "learning_rate": 2.343547818929467e-05, - "loss": 2.3981, - "step": 304660 - }, - { - "epoch": 0.53, - "learning_rate": 2.3434606249367842e-05, - "loss": 2.3315, - "step": 304670 - }, - { - "epoch": 0.53, - "learning_rate": 2.343373430944102e-05, - "loss": 2.3974, - "step": 304680 - }, - { - "epoch": 0.53, - "learning_rate": 2.3432862369514193e-05, - "loss": 2.2042, - "step": 304690 - }, - { - "epoch": 0.53, - "learning_rate": 2.3431990429587363e-05, - "loss": 2.3749, - "step": 304700 - }, - { - "epoch": 0.53, - "learning_rate": 2.3431118489660537e-05, - "loss": 2.3399, - "step": 304710 - }, - { - "epoch": 0.53, - "learning_rate": 2.343024654973371e-05, - "loss": 2.2334, - "step": 304720 - }, - { - "epoch": 0.53, - "learning_rate": 2.3429374609806885e-05, - "loss": 2.3193, - "step": 304730 - }, - { - "epoch": 0.53, - "learning_rate": 2.3428502669880055e-05, - "loss": 2.3672, - "step": 304740 - }, - { - "epoch": 0.53, - "learning_rate": 2.3427630729953232e-05, - "loss": 2.4695, - "step": 304750 - }, - { - "epoch": 0.53, - "learning_rate": 2.3426758790026403e-05, - "loss": 2.3405, - "step": 304760 - }, - { - "epoch": 0.53, - "learning_rate": 2.3425886850099576e-05, - "loss": 2.4381, - "step": 304770 - }, - { - "epoch": 0.53, - "learning_rate": 2.342501491017275e-05, - "loss": 2.3443, - "step": 304780 - }, - { - "epoch": 0.53, - "learning_rate": 2.3424142970245924e-05, - "loss": 2.3277, - "step": 304790 - }, - { - "epoch": 0.53, - "learning_rate": 2.3423271030319098e-05, - "loss": 2.34, - "step": 304800 - }, - { - "epoch": 0.53, - "learning_rate": 2.3422399090392268e-05, - "loss": 2.3158, - "step": 304810 - }, - { - "epoch": 0.53, - "learning_rate": 2.3421527150465442e-05, - "loss": 2.4118, - "step": 304820 - }, - { - "epoch": 0.53, - "learning_rate": 2.3420655210538616e-05, - "loss": 2.2972, - "step": 304830 - }, - { - "epoch": 0.53, - "learning_rate": 2.341978327061179e-05, - "loss": 2.2959, - "step": 304840 - }, - { - "epoch": 0.53, - "learning_rate": 2.3418911330684963e-05, - "loss": 2.3083, - "step": 304850 - }, - { - "epoch": 0.53, - "learning_rate": 2.3418039390758133e-05, - "loss": 2.3564, - "step": 304860 - }, - { - "epoch": 0.53, - "learning_rate": 2.341716745083131e-05, - "loss": 2.3326, - "step": 304870 - }, - { - "epoch": 0.53, - "learning_rate": 2.341629551090448e-05, - "loss": 2.316, - "step": 304880 - }, - { - "epoch": 0.53, - "learning_rate": 2.3415423570977655e-05, - "loss": 2.4068, - "step": 304890 - }, - { - "epoch": 0.53, - "learning_rate": 2.341455163105083e-05, - "loss": 2.4943, - "step": 304900 - }, - { - "epoch": 0.53, - "learning_rate": 2.3413679691124002e-05, - "loss": 2.4787, - "step": 304910 - }, - { - "epoch": 0.53, - "learning_rate": 2.3412807751197173e-05, - "loss": 2.3997, - "step": 304920 - }, - { - "epoch": 0.53, - "learning_rate": 2.3411935811270346e-05, - "loss": 2.275, - "step": 304930 - }, - { - "epoch": 0.53, - "learning_rate": 2.3411063871343524e-05, - "loss": 2.3588, - "step": 304940 - }, - { - "epoch": 0.53, - "learning_rate": 2.3410191931416694e-05, - "loss": 2.4374, - "step": 304950 - }, - { - "epoch": 0.53, - "learning_rate": 2.3409319991489868e-05, - "loss": 2.4661, - "step": 304960 - }, - { - "epoch": 0.53, - "learning_rate": 2.3408448051563038e-05, - "loss": 2.3314, - "step": 304970 - }, - { - "epoch": 0.53, - "learning_rate": 2.3407576111636215e-05, - "loss": 2.3891, - "step": 304980 - }, - { - "epoch": 0.53, - "learning_rate": 2.3406704171709386e-05, - "loss": 2.2607, - "step": 304990 - }, - { - "epoch": 0.53, - "learning_rate": 2.340583223178256e-05, - "loss": 2.2758, - "step": 305000 - }, - { - "epoch": 0.53, - "learning_rate": 2.3404960291855733e-05, - "loss": 2.3161, - "step": 305010 - }, - { - "epoch": 0.53, - "learning_rate": 2.3404088351928907e-05, - "loss": 2.3247, - "step": 305020 - }, - { - "epoch": 0.53, - "learning_rate": 2.340321641200208e-05, - "loss": 2.341, - "step": 305030 - }, - { - "epoch": 0.53, - "learning_rate": 2.340234447207525e-05, - "loss": 2.3846, - "step": 305040 - }, - { - "epoch": 0.53, - "learning_rate": 2.340147253214843e-05, - "loss": 2.3279, - "step": 305050 - }, - { - "epoch": 0.53, - "learning_rate": 2.34006005922216e-05, - "loss": 2.3448, - "step": 305060 - }, - { - "epoch": 0.53, - "learning_rate": 2.3399728652294772e-05, - "loss": 2.4171, - "step": 305070 - }, - { - "epoch": 0.53, - "learning_rate": 2.3398856712367946e-05, - "loss": 2.4226, - "step": 305080 - }, - { - "epoch": 0.53, - "learning_rate": 2.339798477244112e-05, - "loss": 2.3297, - "step": 305090 - }, - { - "epoch": 0.53, - "learning_rate": 2.3397112832514294e-05, - "loss": 2.3843, - "step": 305100 - }, - { - "epoch": 0.53, - "learning_rate": 2.3396240892587464e-05, - "loss": 2.3692, - "step": 305110 - }, - { - "epoch": 0.53, - "learning_rate": 2.3395368952660638e-05, - "loss": 2.4109, - "step": 305120 - }, - { - "epoch": 0.53, - "learning_rate": 2.3394497012733812e-05, - "loss": 2.3301, - "step": 305130 - }, - { - "epoch": 0.53, - "learning_rate": 2.3393625072806985e-05, - "loss": 2.3903, - "step": 305140 - }, - { - "epoch": 0.53, - "learning_rate": 2.3392753132880156e-05, - "loss": 2.3727, - "step": 305150 - }, - { - "epoch": 0.53, - "learning_rate": 2.3391881192953333e-05, - "loss": 2.3635, - "step": 305160 - }, - { - "epoch": 0.53, - "learning_rate": 2.3391009253026507e-05, - "loss": 2.3476, - "step": 305170 - }, - { - "epoch": 0.53, - "learning_rate": 2.3390137313099677e-05, - "loss": 2.3918, - "step": 305180 - }, - { - "epoch": 0.53, - "learning_rate": 2.338926537317285e-05, - "loss": 2.4644, - "step": 305190 - }, - { - "epoch": 0.53, - "learning_rate": 2.3388393433246025e-05, - "loss": 2.4575, - "step": 305200 - }, - { - "epoch": 0.53, - "learning_rate": 2.33875214933192e-05, - "loss": 2.3031, - "step": 305210 - }, - { - "epoch": 0.53, - "learning_rate": 2.338664955339237e-05, - "loss": 2.3484, - "step": 305220 - }, - { - "epoch": 0.53, - "learning_rate": 2.3385777613465543e-05, - "loss": 2.2995, - "step": 305230 - }, - { - "epoch": 0.53, - "learning_rate": 2.3384905673538716e-05, - "loss": 2.3932, - "step": 305240 - }, - { - "epoch": 0.53, - "learning_rate": 2.338403373361189e-05, - "loss": 2.3615, - "step": 305250 - }, - { - "epoch": 0.53, - "learning_rate": 2.3383161793685064e-05, - "loss": 2.3141, - "step": 305260 - }, - { - "epoch": 0.53, - "learning_rate": 2.3382289853758234e-05, - "loss": 2.3311, - "step": 305270 - }, - { - "epoch": 0.53, - "learning_rate": 2.338141791383141e-05, - "loss": 2.3248, - "step": 305280 - }, - { - "epoch": 0.53, - "learning_rate": 2.3380545973904582e-05, - "loss": 2.3792, - "step": 305290 - }, - { - "epoch": 0.53, - "learning_rate": 2.3379674033977756e-05, - "loss": 2.3672, - "step": 305300 - }, - { - "epoch": 0.53, - "learning_rate": 2.337880209405093e-05, - "loss": 2.3641, - "step": 305310 - }, - { - "epoch": 0.53, - "learning_rate": 2.3377930154124103e-05, - "loss": 2.3058, - "step": 305320 - }, - { - "epoch": 0.53, - "learning_rate": 2.3377058214197277e-05, - "loss": 2.411, - "step": 305330 - }, - { - "epoch": 0.53, - "learning_rate": 2.3376186274270447e-05, - "loss": 2.3911, - "step": 305340 - }, - { - "epoch": 0.53, - "learning_rate": 2.3375314334343624e-05, - "loss": 2.4017, - "step": 305350 - }, - { - "epoch": 0.53, - "learning_rate": 2.3374442394416795e-05, - "loss": 2.4498, - "step": 305360 - }, - { - "epoch": 0.53, - "learning_rate": 2.337357045448997e-05, - "loss": 2.3868, - "step": 305370 - }, - { - "epoch": 0.53, - "learning_rate": 2.337269851456314e-05, - "loss": 2.3473, - "step": 305380 - }, - { - "epoch": 0.53, - "learning_rate": 2.3371826574636316e-05, - "loss": 2.4411, - "step": 305390 - }, - { - "epoch": 0.53, - "learning_rate": 2.3370954634709487e-05, - "loss": 2.248, - "step": 305400 - }, - { - "epoch": 0.53, - "learning_rate": 2.337008269478266e-05, - "loss": 2.3263, - "step": 305410 - }, - { - "epoch": 0.53, - "learning_rate": 2.3369210754855837e-05, - "loss": 2.4265, - "step": 305420 - }, - { - "epoch": 0.53, - "learning_rate": 2.3368338814929008e-05, - "loss": 2.3764, - "step": 305430 - }, - { - "epoch": 0.53, - "learning_rate": 2.336746687500218e-05, - "loss": 2.4405, - "step": 305440 - }, - { - "epoch": 0.53, - "learning_rate": 2.3366594935075352e-05, - "loss": 2.2798, - "step": 305450 - }, - { - "epoch": 0.53, - "learning_rate": 2.336572299514853e-05, - "loss": 2.4021, - "step": 305460 - }, - { - "epoch": 0.53, - "learning_rate": 2.33648510552217e-05, - "loss": 2.4359, - "step": 305470 - }, - { - "epoch": 0.53, - "learning_rate": 2.3363979115294873e-05, - "loss": 2.3238, - "step": 305480 - }, - { - "epoch": 0.53, - "learning_rate": 2.3363107175368047e-05, - "loss": 2.3903, - "step": 305490 - }, - { - "epoch": 0.53, - "learning_rate": 2.336223523544122e-05, - "loss": 2.4176, - "step": 305500 - }, - { - "epoch": 0.53, - "learning_rate": 2.3361363295514395e-05, - "loss": 2.3879, - "step": 305510 - }, - { - "epoch": 0.53, - "learning_rate": 2.3360491355587565e-05, - "loss": 2.4457, - "step": 305520 - }, - { - "epoch": 0.53, - "learning_rate": 2.335961941566074e-05, - "loss": 2.3431, - "step": 305530 - }, - { - "epoch": 0.53, - "learning_rate": 2.3358747475733913e-05, - "loss": 2.3429, - "step": 305540 - }, - { - "epoch": 0.53, - "learning_rate": 2.3357875535807086e-05, - "loss": 2.322, - "step": 305550 - }, - { - "epoch": 0.53, - "learning_rate": 2.335700359588026e-05, - "loss": 2.3396, - "step": 305560 - }, - { - "epoch": 0.53, - "learning_rate": 2.3356131655953434e-05, - "loss": 2.4937, - "step": 305570 - }, - { - "epoch": 0.53, - "learning_rate": 2.3355259716026608e-05, - "loss": 2.4149, - "step": 305580 - }, - { - "epoch": 0.53, - "learning_rate": 2.3354387776099778e-05, - "loss": 2.2799, - "step": 305590 - }, - { - "epoch": 0.53, - "learning_rate": 2.3353515836172952e-05, - "loss": 2.3651, - "step": 305600 - }, - { - "epoch": 0.53, - "learning_rate": 2.3352643896246126e-05, - "loss": 2.3432, - "step": 305610 - }, - { - "epoch": 0.53, - "learning_rate": 2.33517719563193e-05, - "loss": 2.3558, - "step": 305620 - }, - { - "epoch": 0.53, - "learning_rate": 2.335090001639247e-05, - "loss": 2.372, - "step": 305630 - }, - { - "epoch": 0.53, - "learning_rate": 2.3350028076465643e-05, - "loss": 2.3735, - "step": 305640 - }, - { - "epoch": 0.53, - "learning_rate": 2.3349156136538817e-05, - "loss": 2.343, - "step": 305650 - }, - { - "epoch": 0.53, - "learning_rate": 2.334828419661199e-05, - "loss": 2.4173, - "step": 305660 - }, - { - "epoch": 0.53, - "learning_rate": 2.3347412256685165e-05, - "loss": 2.3012, - "step": 305670 - }, - { - "epoch": 0.53, - "learning_rate": 2.334654031675834e-05, - "loss": 2.3567, - "step": 305680 - }, - { - "epoch": 0.53, - "learning_rate": 2.3345668376831512e-05, - "loss": 2.3439, - "step": 305690 - }, - { - "epoch": 0.53, - "learning_rate": 2.3344796436904683e-05, - "loss": 2.3233, - "step": 305700 - }, - { - "epoch": 0.53, - "learning_rate": 2.3343924496977856e-05, - "loss": 2.4134, - "step": 305710 - }, - { - "epoch": 0.53, - "learning_rate": 2.334305255705103e-05, - "loss": 2.4283, - "step": 305720 - }, - { - "epoch": 0.53, - "learning_rate": 2.3342180617124204e-05, - "loss": 2.3451, - "step": 305730 - }, - { - "epoch": 0.53, - "learning_rate": 2.3341308677197378e-05, - "loss": 2.3161, - "step": 305740 - }, - { - "epoch": 0.53, - "learning_rate": 2.3340436737270548e-05, - "loss": 2.3403, - "step": 305750 - }, - { - "epoch": 0.53, - "learning_rate": 2.3339564797343725e-05, - "loss": 2.3672, - "step": 305760 - }, - { - "epoch": 0.53, - "learning_rate": 2.3338692857416896e-05, - "loss": 2.3477, - "step": 305770 - }, - { - "epoch": 0.53, - "learning_rate": 2.333782091749007e-05, - "loss": 2.3022, - "step": 305780 - }, - { - "epoch": 0.53, - "learning_rate": 2.3336948977563243e-05, - "loss": 2.3811, - "step": 305790 - }, - { - "epoch": 0.53, - "learning_rate": 2.3336077037636417e-05, - "loss": 2.3271, - "step": 305800 - }, - { - "epoch": 0.53, - "learning_rate": 2.333520509770959e-05, - "loss": 2.4178, - "step": 305810 - }, - { - "epoch": 0.53, - "learning_rate": 2.333433315778276e-05, - "loss": 2.2556, - "step": 305820 - }, - { - "epoch": 0.53, - "learning_rate": 2.333346121785594e-05, - "loss": 2.4738, - "step": 305830 - }, - { - "epoch": 0.53, - "learning_rate": 2.333258927792911e-05, - "loss": 2.2746, - "step": 305840 - }, - { - "epoch": 0.53, - "learning_rate": 2.3331717338002282e-05, - "loss": 2.3853, - "step": 305850 - }, - { - "epoch": 0.53, - "learning_rate": 2.3330845398075453e-05, - "loss": 2.3498, - "step": 305860 - }, - { - "epoch": 0.53, - "learning_rate": 2.332997345814863e-05, - "loss": 2.2895, - "step": 305870 - }, - { - "epoch": 0.53, - "learning_rate": 2.33291015182218e-05, - "loss": 2.3446, - "step": 305880 - }, - { - "epoch": 0.53, - "learning_rate": 2.3328229578294974e-05, - "loss": 2.3856, - "step": 305890 - }, - { - "epoch": 0.53, - "learning_rate": 2.3327357638368148e-05, - "loss": 2.2688, - "step": 305900 - }, - { - "epoch": 0.53, - "learning_rate": 2.3326485698441322e-05, - "loss": 2.3463, - "step": 305910 - }, - { - "epoch": 0.53, - "learning_rate": 2.3325613758514495e-05, - "loss": 2.3384, - "step": 305920 - }, - { - "epoch": 0.53, - "learning_rate": 2.3324741818587666e-05, - "loss": 2.36, - "step": 305930 - }, - { - "epoch": 0.53, - "learning_rate": 2.3323869878660843e-05, - "loss": 2.375, - "step": 305940 - }, - { - "epoch": 0.53, - "learning_rate": 2.3322997938734013e-05, - "loss": 2.4221, - "step": 305950 - }, - { - "epoch": 0.53, - "learning_rate": 2.3322125998807187e-05, - "loss": 2.3571, - "step": 305960 - }, - { - "epoch": 0.53, - "learning_rate": 2.332125405888036e-05, - "loss": 2.5195, - "step": 305970 - }, - { - "epoch": 0.53, - "learning_rate": 2.3320382118953535e-05, - "loss": 2.3496, - "step": 305980 - }, - { - "epoch": 0.53, - "learning_rate": 2.331951017902671e-05, - "loss": 2.3701, - "step": 305990 - }, - { - "epoch": 0.53, - "learning_rate": 2.331863823909988e-05, - "loss": 2.4755, - "step": 306000 - }, - { - "epoch": 0.53, - "learning_rate": 2.3317766299173053e-05, - "loss": 2.26, - "step": 306010 - }, - { - "epoch": 0.53, - "learning_rate": 2.3316894359246226e-05, - "loss": 2.2112, - "step": 306020 - }, - { - "epoch": 0.53, - "learning_rate": 2.33160224193194e-05, - "loss": 2.46, - "step": 306030 - }, - { - "epoch": 0.53, - "learning_rate": 2.3315150479392574e-05, - "loss": 2.3883, - "step": 306040 - }, - { - "epoch": 0.53, - "learning_rate": 2.3314278539465744e-05, - "loss": 2.4129, - "step": 306050 - }, - { - "epoch": 0.53, - "learning_rate": 2.331340659953892e-05, - "loss": 2.3555, - "step": 306060 - }, - { - "epoch": 0.53, - "learning_rate": 2.3312534659612092e-05, - "loss": 2.3615, - "step": 306070 - }, - { - "epoch": 0.53, - "learning_rate": 2.3311662719685266e-05, - "loss": 2.3861, - "step": 306080 - }, - { - "epoch": 0.53, - "learning_rate": 2.331079077975844e-05, - "loss": 2.3499, - "step": 306090 - }, - { - "epoch": 0.53, - "learning_rate": 2.3309918839831613e-05, - "loss": 2.1665, - "step": 306100 - }, - { - "epoch": 0.53, - "learning_rate": 2.3309046899904784e-05, - "loss": 2.2171, - "step": 306110 - }, - { - "epoch": 0.53, - "learning_rate": 2.3308174959977957e-05, - "loss": 2.3761, - "step": 306120 - }, - { - "epoch": 0.53, - "learning_rate": 2.330730302005113e-05, - "loss": 2.331, - "step": 306130 - }, - { - "epoch": 0.53, - "learning_rate": 2.3306431080124305e-05, - "loss": 2.3322, - "step": 306140 - }, - { - "epoch": 0.53, - "learning_rate": 2.330555914019748e-05, - "loss": 2.258, - "step": 306150 - }, - { - "epoch": 0.53, - "learning_rate": 2.330468720027065e-05, - "loss": 2.407, - "step": 306160 - }, - { - "epoch": 0.53, - "learning_rate": 2.3303815260343826e-05, - "loss": 2.4332, - "step": 306170 - }, - { - "epoch": 0.53, - "learning_rate": 2.3302943320416997e-05, - "loss": 2.2975, - "step": 306180 - }, - { - "epoch": 0.53, - "learning_rate": 2.330207138049017e-05, - "loss": 2.3918, - "step": 306190 - }, - { - "epoch": 0.53, - "learning_rate": 2.3301199440563344e-05, - "loss": 2.4251, - "step": 306200 - }, - { - "epoch": 0.53, - "learning_rate": 2.3300327500636518e-05, - "loss": 2.4443, - "step": 306210 - }, - { - "epoch": 0.53, - "learning_rate": 2.329945556070969e-05, - "loss": 2.4317, - "step": 306220 - }, - { - "epoch": 0.53, - "learning_rate": 2.3298583620782862e-05, - "loss": 2.2808, - "step": 306230 - }, - { - "epoch": 0.53, - "learning_rate": 2.329771168085604e-05, - "loss": 2.3702, - "step": 306240 - }, - { - "epoch": 0.53, - "learning_rate": 2.329683974092921e-05, - "loss": 2.29, - "step": 306250 - }, - { - "epoch": 0.53, - "learning_rate": 2.3295967801002383e-05, - "loss": 2.4293, - "step": 306260 - }, - { - "epoch": 0.53, - "learning_rate": 2.3295095861075554e-05, - "loss": 2.3276, - "step": 306270 - }, - { - "epoch": 0.53, - "learning_rate": 2.329422392114873e-05, - "loss": 2.3816, - "step": 306280 - }, - { - "epoch": 0.53, - "learning_rate": 2.3293351981221905e-05, - "loss": 2.3872, - "step": 306290 - }, - { - "epoch": 0.53, - "learning_rate": 2.3292480041295075e-05, - "loss": 2.3305, - "step": 306300 - }, - { - "epoch": 0.53, - "learning_rate": 2.329160810136825e-05, - "loss": 2.2872, - "step": 306310 - }, - { - "epoch": 0.53, - "learning_rate": 2.3290736161441423e-05, - "loss": 2.3478, - "step": 306320 - }, - { - "epoch": 0.53, - "learning_rate": 2.3289864221514596e-05, - "loss": 2.3494, - "step": 306330 - }, - { - "epoch": 0.53, - "learning_rate": 2.3288992281587767e-05, - "loss": 2.4218, - "step": 306340 - }, - { - "epoch": 0.53, - "learning_rate": 2.3288120341660944e-05, - "loss": 2.2799, - "step": 306350 - }, - { - "epoch": 0.53, - "learning_rate": 2.3287248401734114e-05, - "loss": 2.273, - "step": 306360 - }, - { - "epoch": 0.53, - "learning_rate": 2.3286376461807288e-05, - "loss": 2.3505, - "step": 306370 - }, - { - "epoch": 0.53, - "learning_rate": 2.3285504521880462e-05, - "loss": 2.2345, - "step": 306380 - }, - { - "epoch": 0.53, - "learning_rate": 2.3284632581953636e-05, - "loss": 2.3725, - "step": 306390 - }, - { - "epoch": 0.53, - "learning_rate": 2.328376064202681e-05, - "loss": 2.3643, - "step": 306400 - }, - { - "epoch": 0.53, - "learning_rate": 2.328288870209998e-05, - "loss": 2.3694, - "step": 306410 - }, - { - "epoch": 0.53, - "learning_rate": 2.3282016762173153e-05, - "loss": 2.3029, - "step": 306420 - }, - { - "epoch": 0.53, - "learning_rate": 2.3281144822246327e-05, - "loss": 2.2385, - "step": 306430 - }, - { - "epoch": 0.53, - "learning_rate": 2.32802728823195e-05, - "loss": 2.2859, - "step": 306440 - }, - { - "epoch": 0.53, - "learning_rate": 2.3279400942392675e-05, - "loss": 2.5034, - "step": 306450 - }, - { - "epoch": 0.53, - "learning_rate": 2.3278529002465845e-05, - "loss": 2.3145, - "step": 306460 - }, - { - "epoch": 0.53, - "learning_rate": 2.3277657062539022e-05, - "loss": 2.3731, - "step": 306470 - }, - { - "epoch": 0.53, - "learning_rate": 2.3276785122612193e-05, - "loss": 2.3945, - "step": 306480 - }, - { - "epoch": 0.53, - "learning_rate": 2.3275913182685366e-05, - "loss": 2.3619, - "step": 306490 - }, - { - "epoch": 0.53, - "learning_rate": 2.327504124275854e-05, - "loss": 2.3074, - "step": 306500 - }, - { - "epoch": 0.53, - "learning_rate": 2.3274169302831714e-05, - "loss": 2.1831, - "step": 306510 - }, - { - "epoch": 0.53, - "learning_rate": 2.3273297362904888e-05, - "loss": 2.3069, - "step": 306520 - }, - { - "epoch": 0.53, - "learning_rate": 2.3272425422978058e-05, - "loss": 2.3738, - "step": 306530 - }, - { - "epoch": 0.53, - "learning_rate": 2.3271553483051235e-05, - "loss": 2.3375, - "step": 306540 - }, - { - "epoch": 0.53, - "learning_rate": 2.3270681543124406e-05, - "loss": 2.3517, - "step": 306550 - }, - { - "epoch": 0.53, - "learning_rate": 2.326980960319758e-05, - "loss": 2.4286, - "step": 306560 - }, - { - "epoch": 0.53, - "learning_rate": 2.326893766327075e-05, - "loss": 2.3282, - "step": 306570 - }, - { - "epoch": 0.53, - "learning_rate": 2.3268065723343927e-05, - "loss": 2.3311, - "step": 306580 - }, - { - "epoch": 0.53, - "learning_rate": 2.3267193783417097e-05, - "loss": 2.438, - "step": 306590 - }, - { - "epoch": 0.53, - "learning_rate": 2.326632184349027e-05, - "loss": 2.3116, - "step": 306600 - }, - { - "epoch": 0.53, - "learning_rate": 2.3265449903563445e-05, - "loss": 2.4249, - "step": 306610 - }, - { - "epoch": 0.53, - "learning_rate": 2.326457796363662e-05, - "loss": 2.4275, - "step": 306620 - }, - { - "epoch": 0.53, - "learning_rate": 2.3263706023709793e-05, - "loss": 2.218, - "step": 306630 - }, - { - "epoch": 0.53, - "learning_rate": 2.3262834083782963e-05, - "loss": 2.2857, - "step": 306640 - }, - { - "epoch": 0.53, - "learning_rate": 2.326196214385614e-05, - "loss": 2.4008, - "step": 306650 - }, - { - "epoch": 0.53, - "learning_rate": 2.326109020392931e-05, - "loss": 2.2992, - "step": 306660 - }, - { - "epoch": 0.53, - "learning_rate": 2.3260218264002484e-05, - "loss": 2.3449, - "step": 306670 - }, - { - "epoch": 0.53, - "learning_rate": 2.3259346324075658e-05, - "loss": 2.3616, - "step": 306680 - }, - { - "epoch": 0.53, - "learning_rate": 2.3258474384148832e-05, - "loss": 2.4528, - "step": 306690 - }, - { - "epoch": 0.53, - "learning_rate": 2.3257602444222006e-05, - "loss": 2.2744, - "step": 306700 - }, - { - "epoch": 0.53, - "learning_rate": 2.3256730504295176e-05, - "loss": 2.2738, - "step": 306710 - }, - { - "epoch": 0.53, - "learning_rate": 2.325585856436835e-05, - "loss": 2.4185, - "step": 306720 - }, - { - "epoch": 0.53, - "learning_rate": 2.3254986624441523e-05, - "loss": 2.3239, - "step": 306730 - }, - { - "epoch": 0.53, - "learning_rate": 2.3254114684514697e-05, - "loss": 2.3597, - "step": 306740 - }, - { - "epoch": 0.53, - "learning_rate": 2.3253242744587868e-05, - "loss": 2.274, - "step": 306750 - }, - { - "epoch": 0.53, - "learning_rate": 2.3252370804661045e-05, - "loss": 2.2678, - "step": 306760 - }, - { - "epoch": 0.53, - "learning_rate": 2.325149886473422e-05, - "loss": 2.3149, - "step": 306770 - }, - { - "epoch": 0.53, - "learning_rate": 2.325062692480739e-05, - "loss": 2.4488, - "step": 306780 - }, - { - "epoch": 0.54, - "learning_rate": 2.3249754984880563e-05, - "loss": 2.3422, - "step": 306790 - }, - { - "epoch": 0.54, - "learning_rate": 2.3248883044953736e-05, - "loss": 2.3123, - "step": 306800 - }, - { - "epoch": 0.54, - "learning_rate": 2.324801110502691e-05, - "loss": 2.3184, - "step": 306810 - }, - { - "epoch": 0.54, - "learning_rate": 2.324713916510008e-05, - "loss": 2.3598, - "step": 306820 - }, - { - "epoch": 0.54, - "learning_rate": 2.3246267225173254e-05, - "loss": 2.4109, - "step": 306830 - }, - { - "epoch": 0.54, - "learning_rate": 2.3245395285246428e-05, - "loss": 2.4432, - "step": 306840 - }, - { - "epoch": 0.54, - "learning_rate": 2.3244523345319602e-05, - "loss": 2.3933, - "step": 306850 - }, - { - "epoch": 0.54, - "learning_rate": 2.3243651405392776e-05, - "loss": 2.3849, - "step": 306860 - }, - { - "epoch": 0.54, - "learning_rate": 2.324277946546595e-05, - "loss": 2.4041, - "step": 306870 - }, - { - "epoch": 0.54, - "learning_rate": 2.3241907525539123e-05, - "loss": 2.3716, - "step": 306880 - }, - { - "epoch": 0.54, - "learning_rate": 2.3241035585612294e-05, - "loss": 2.4537, - "step": 306890 - }, - { - "epoch": 0.54, - "learning_rate": 2.3240163645685467e-05, - "loss": 2.4438, - "step": 306900 - }, - { - "epoch": 0.54, - "learning_rate": 2.323929170575864e-05, - "loss": 2.3649, - "step": 306910 - }, - { - "epoch": 0.54, - "learning_rate": 2.3238419765831815e-05, - "loss": 2.4837, - "step": 306920 - }, - { - "epoch": 0.54, - "learning_rate": 2.323754782590499e-05, - "loss": 2.3461, - "step": 306930 - }, - { - "epoch": 0.54, - "learning_rate": 2.323667588597816e-05, - "loss": 2.3432, - "step": 306940 - }, - { - "epoch": 0.54, - "learning_rate": 2.3235803946051336e-05, - "loss": 2.4608, - "step": 306950 - }, - { - "epoch": 0.54, - "learning_rate": 2.3234932006124507e-05, - "loss": 2.4227, - "step": 306960 - }, - { - "epoch": 0.54, - "learning_rate": 2.323406006619768e-05, - "loss": 2.3343, - "step": 306970 - }, - { - "epoch": 0.54, - "learning_rate": 2.323318812627085e-05, - "loss": 2.3588, - "step": 306980 - }, - { - "epoch": 0.54, - "learning_rate": 2.3232316186344028e-05, - "loss": 2.3629, - "step": 306990 - }, - { - "epoch": 0.54, - "learning_rate": 2.3231444246417198e-05, - "loss": 2.3383, - "step": 307000 - }, - { - "epoch": 0.54, - "learning_rate": 2.3230572306490372e-05, - "loss": 2.3093, - "step": 307010 - }, - { - "epoch": 0.54, - "learning_rate": 2.322970036656355e-05, - "loss": 2.3129, - "step": 307020 - }, - { - "epoch": 0.54, - "learning_rate": 2.322882842663672e-05, - "loss": 2.2721, - "step": 307030 - }, - { - "epoch": 0.54, - "learning_rate": 2.3227956486709893e-05, - "loss": 2.3325, - "step": 307040 - }, - { - "epoch": 0.54, - "learning_rate": 2.3227084546783064e-05, - "loss": 2.2743, - "step": 307050 - }, - { - "epoch": 0.54, - "learning_rate": 2.322621260685624e-05, - "loss": 2.4088, - "step": 307060 - }, - { - "epoch": 0.54, - "learning_rate": 2.322534066692941e-05, - "loss": 2.3009, - "step": 307070 - }, - { - "epoch": 0.54, - "learning_rate": 2.3224468727002585e-05, - "loss": 2.2164, - "step": 307080 - }, - { - "epoch": 0.54, - "learning_rate": 2.322359678707576e-05, - "loss": 2.2777, - "step": 307090 - }, - { - "epoch": 0.54, - "learning_rate": 2.3222724847148933e-05, - "loss": 2.3933, - "step": 307100 - }, - { - "epoch": 0.54, - "learning_rate": 2.3221852907222106e-05, - "loss": 2.2683, - "step": 307110 - }, - { - "epoch": 0.54, - "learning_rate": 2.3220980967295277e-05, - "loss": 2.2663, - "step": 307120 - }, - { - "epoch": 0.54, - "learning_rate": 2.322010902736845e-05, - "loss": 2.3453, - "step": 307130 - }, - { - "epoch": 0.54, - "learning_rate": 2.3219237087441624e-05, - "loss": 2.3012, - "step": 307140 - }, - { - "epoch": 0.54, - "learning_rate": 2.3218365147514798e-05, - "loss": 2.2845, - "step": 307150 - }, - { - "epoch": 0.54, - "learning_rate": 2.3217493207587972e-05, - "loss": 2.4087, - "step": 307160 - }, - { - "epoch": 0.54, - "learning_rate": 2.3216621267661146e-05, - "loss": 2.3373, - "step": 307170 - }, - { - "epoch": 0.54, - "learning_rate": 2.321574932773432e-05, - "loss": 2.4432, - "step": 307180 - }, - { - "epoch": 0.54, - "learning_rate": 2.321487738780749e-05, - "loss": 2.4192, - "step": 307190 - }, - { - "epoch": 0.54, - "learning_rate": 2.3214005447880664e-05, - "loss": 2.3801, - "step": 307200 - }, - { - "epoch": 0.54, - "learning_rate": 2.3213133507953837e-05, - "loss": 2.3561, - "step": 307210 - }, - { - "epoch": 0.54, - "learning_rate": 2.321226156802701e-05, - "loss": 2.3334, - "step": 307220 - }, - { - "epoch": 0.54, - "learning_rate": 2.321138962810018e-05, - "loss": 2.2995, - "step": 307230 - }, - { - "epoch": 0.54, - "learning_rate": 2.3210517688173355e-05, - "loss": 2.2386, - "step": 307240 - }, - { - "epoch": 0.54, - "learning_rate": 2.3209645748246532e-05, - "loss": 2.2522, - "step": 307250 - }, - { - "epoch": 0.54, - "learning_rate": 2.3208773808319703e-05, - "loss": 2.2986, - "step": 307260 - }, - { - "epoch": 0.54, - "learning_rate": 2.3207901868392877e-05, - "loss": 2.4082, - "step": 307270 - }, - { - "epoch": 0.54, - "learning_rate": 2.320702992846605e-05, - "loss": 2.2183, - "step": 307280 - }, - { - "epoch": 0.54, - "learning_rate": 2.3206157988539224e-05, - "loss": 2.4093, - "step": 307290 - }, - { - "epoch": 0.54, - "learning_rate": 2.3205286048612394e-05, - "loss": 2.2705, - "step": 307300 - }, - { - "epoch": 0.54, - "learning_rate": 2.3204414108685568e-05, - "loss": 2.4365, - "step": 307310 - }, - { - "epoch": 0.54, - "learning_rate": 2.3203542168758742e-05, - "loss": 2.303, - "step": 307320 - }, - { - "epoch": 0.54, - "learning_rate": 2.3202670228831916e-05, - "loss": 2.3416, - "step": 307330 - }, - { - "epoch": 0.54, - "learning_rate": 2.320179828890509e-05, - "loss": 2.3932, - "step": 307340 - }, - { - "epoch": 0.54, - "learning_rate": 2.320092634897826e-05, - "loss": 2.2163, - "step": 307350 - }, - { - "epoch": 0.54, - "learning_rate": 2.3200054409051437e-05, - "loss": 2.4351, - "step": 307360 - }, - { - "epoch": 0.54, - "learning_rate": 2.3199182469124607e-05, - "loss": 2.4136, - "step": 307370 - }, - { - "epoch": 0.54, - "learning_rate": 2.319831052919778e-05, - "loss": 2.3591, - "step": 307380 - }, - { - "epoch": 0.54, - "learning_rate": 2.3197438589270955e-05, - "loss": 2.3674, - "step": 307390 - }, - { - "epoch": 0.54, - "learning_rate": 2.319656664934413e-05, - "loss": 2.349, - "step": 307400 - }, - { - "epoch": 0.54, - "learning_rate": 2.3195694709417303e-05, - "loss": 2.4122, - "step": 307410 - }, - { - "epoch": 0.54, - "learning_rate": 2.3194822769490473e-05, - "loss": 2.2862, - "step": 307420 - }, - { - "epoch": 0.54, - "learning_rate": 2.319395082956365e-05, - "loss": 2.3248, - "step": 307430 - }, - { - "epoch": 0.54, - "learning_rate": 2.319307888963682e-05, - "loss": 2.3845, - "step": 307440 - }, - { - "epoch": 0.54, - "learning_rate": 2.3192206949709994e-05, - "loss": 2.4467, - "step": 307450 - }, - { - "epoch": 0.54, - "learning_rate": 2.3191335009783165e-05, - "loss": 2.3945, - "step": 307460 - }, - { - "epoch": 0.54, - "learning_rate": 2.3190463069856342e-05, - "loss": 2.3087, - "step": 307470 - }, - { - "epoch": 0.54, - "learning_rate": 2.3189591129929512e-05, - "loss": 2.3568, - "step": 307480 - }, - { - "epoch": 0.54, - "learning_rate": 2.3188719190002686e-05, - "loss": 2.3391, - "step": 307490 - }, - { - "epoch": 0.54, - "learning_rate": 2.318784725007586e-05, - "loss": 2.3964, - "step": 307500 - }, - { - "epoch": 0.54, - "learning_rate": 2.3186975310149033e-05, - "loss": 2.3436, - "step": 307510 - }, - { - "epoch": 0.54, - "learning_rate": 2.3186103370222207e-05, - "loss": 2.3028, - "step": 307520 - }, - { - "epoch": 0.54, - "learning_rate": 2.3185231430295378e-05, - "loss": 2.4295, - "step": 307530 - }, - { - "epoch": 0.54, - "learning_rate": 2.3184359490368555e-05, - "loss": 2.365, - "step": 307540 - }, - { - "epoch": 0.54, - "learning_rate": 2.3183487550441725e-05, - "loss": 2.3828, - "step": 307550 - }, - { - "epoch": 0.54, - "learning_rate": 2.31826156105149e-05, - "loss": 2.389, - "step": 307560 - }, - { - "epoch": 0.54, - "learning_rate": 2.3181743670588073e-05, - "loss": 2.3816, - "step": 307570 - }, - { - "epoch": 0.54, - "learning_rate": 2.3180871730661246e-05, - "loss": 2.3344, - "step": 307580 - }, - { - "epoch": 0.54, - "learning_rate": 2.317999979073442e-05, - "loss": 2.3323, - "step": 307590 - }, - { - "epoch": 0.54, - "learning_rate": 2.317912785080759e-05, - "loss": 2.2775, - "step": 307600 - }, - { - "epoch": 0.54, - "learning_rate": 2.3178255910880764e-05, - "loss": 2.3133, - "step": 307610 - }, - { - "epoch": 0.54, - "learning_rate": 2.3177383970953938e-05, - "loss": 2.2677, - "step": 307620 - }, - { - "epoch": 0.54, - "learning_rate": 2.3176512031027112e-05, - "loss": 2.4139, - "step": 307630 - }, - { - "epoch": 0.54, - "learning_rate": 2.3175640091100286e-05, - "loss": 2.4077, - "step": 307640 - }, - { - "epoch": 0.54, - "learning_rate": 2.3174768151173456e-05, - "loss": 2.3651, - "step": 307650 - }, - { - "epoch": 0.54, - "learning_rate": 2.3173896211246633e-05, - "loss": 2.3525, - "step": 307660 - }, - { - "epoch": 0.54, - "learning_rate": 2.3173024271319804e-05, - "loss": 2.2801, - "step": 307670 - }, - { - "epoch": 0.54, - "learning_rate": 2.3172152331392977e-05, - "loss": 2.2808, - "step": 307680 - }, - { - "epoch": 0.54, - "learning_rate": 2.317128039146615e-05, - "loss": 2.3117, - "step": 307690 - }, - { - "epoch": 0.54, - "learning_rate": 2.3170408451539325e-05, - "loss": 2.3952, - "step": 307700 - }, - { - "epoch": 0.54, - "learning_rate": 2.3169536511612495e-05, - "loss": 2.335, - "step": 307710 - }, - { - "epoch": 0.54, - "learning_rate": 2.316866457168567e-05, - "loss": 2.5446, - "step": 307720 - }, - { - "epoch": 0.54, - "learning_rate": 2.3167792631758846e-05, - "loss": 2.3703, - "step": 307730 - }, - { - "epoch": 0.54, - "learning_rate": 2.3166920691832017e-05, - "loss": 2.3234, - "step": 307740 - }, - { - "epoch": 0.54, - "learning_rate": 2.316604875190519e-05, - "loss": 2.3474, - "step": 307750 - }, - { - "epoch": 0.54, - "learning_rate": 2.316517681197836e-05, - "loss": 2.3584, - "step": 307760 - }, - { - "epoch": 0.54, - "learning_rate": 2.3164304872051538e-05, - "loss": 2.3688, - "step": 307770 - }, - { - "epoch": 0.54, - "learning_rate": 2.3163432932124708e-05, - "loss": 2.304, - "step": 307780 - }, - { - "epoch": 0.54, - "learning_rate": 2.3162560992197882e-05, - "loss": 2.3271, - "step": 307790 - }, - { - "epoch": 0.54, - "learning_rate": 2.3161689052271056e-05, - "loss": 2.3117, - "step": 307800 - }, - { - "epoch": 0.54, - "learning_rate": 2.316081711234423e-05, - "loss": 2.3056, - "step": 307810 - }, - { - "epoch": 0.54, - "learning_rate": 2.3159945172417403e-05, - "loss": 2.4345, - "step": 307820 - }, - { - "epoch": 0.54, - "learning_rate": 2.3159073232490574e-05, - "loss": 2.3774, - "step": 307830 - }, - { - "epoch": 0.54, - "learning_rate": 2.315820129256375e-05, - "loss": 2.3886, - "step": 307840 - }, - { - "epoch": 0.54, - "learning_rate": 2.315732935263692e-05, - "loss": 2.3168, - "step": 307850 - }, - { - "epoch": 0.54, - "learning_rate": 2.3156457412710095e-05, - "loss": 2.4064, - "step": 307860 - }, - { - "epoch": 0.54, - "learning_rate": 2.315558547278327e-05, - "loss": 2.4216, - "step": 307870 - }, - { - "epoch": 0.54, - "learning_rate": 2.3154713532856443e-05, - "loss": 2.3461, - "step": 307880 - }, - { - "epoch": 0.54, - "learning_rate": 2.3153841592929616e-05, - "loss": 2.3366, - "step": 307890 - }, - { - "epoch": 0.54, - "learning_rate": 2.3152969653002787e-05, - "loss": 2.3301, - "step": 307900 - }, - { - "epoch": 0.54, - "learning_rate": 2.315209771307596e-05, - "loss": 2.2644, - "step": 307910 - }, - { - "epoch": 0.54, - "learning_rate": 2.3151225773149134e-05, - "loss": 2.3029, - "step": 307920 - }, - { - "epoch": 0.54, - "learning_rate": 2.3150353833222308e-05, - "loss": 2.3099, - "step": 307930 - }, - { - "epoch": 0.54, - "learning_rate": 2.314948189329548e-05, - "loss": 2.2722, - "step": 307940 - }, - { - "epoch": 0.54, - "learning_rate": 2.3148609953368656e-05, - "loss": 2.4429, - "step": 307950 - }, - { - "epoch": 0.54, - "learning_rate": 2.3147738013441826e-05, - "loss": 2.2755, - "step": 307960 - }, - { - "epoch": 0.54, - "learning_rate": 2.3146866073515e-05, - "loss": 2.4211, - "step": 307970 - }, - { - "epoch": 0.54, - "learning_rate": 2.3145994133588174e-05, - "loss": 2.4952, - "step": 307980 - }, - { - "epoch": 0.54, - "learning_rate": 2.3145122193661347e-05, - "loss": 2.2692, - "step": 307990 - }, - { - "epoch": 0.54, - "learning_rate": 2.314425025373452e-05, - "loss": 2.328, - "step": 308000 - }, - { - "epoch": 0.54, - "learning_rate": 2.314337831380769e-05, - "loss": 2.3214, - "step": 308010 - }, - { - "epoch": 0.54, - "learning_rate": 2.3142506373880865e-05, - "loss": 2.2848, - "step": 308020 - }, - { - "epoch": 0.54, - "learning_rate": 2.314163443395404e-05, - "loss": 2.3698, - "step": 308030 - }, - { - "epoch": 0.54, - "learning_rate": 2.3140762494027213e-05, - "loss": 2.4306, - "step": 308040 - }, - { - "epoch": 0.54, - "learning_rate": 2.3139890554100387e-05, - "loss": 2.3984, - "step": 308050 - }, - { - "epoch": 0.54, - "learning_rate": 2.3139018614173557e-05, - "loss": 2.2873, - "step": 308060 - }, - { - "epoch": 0.54, - "learning_rate": 2.3138146674246734e-05, - "loss": 2.3187, - "step": 308070 - }, - { - "epoch": 0.54, - "learning_rate": 2.3137274734319904e-05, - "loss": 2.4468, - "step": 308080 - }, - { - "epoch": 0.54, - "learning_rate": 2.3136402794393078e-05, - "loss": 2.2986, - "step": 308090 - }, - { - "epoch": 0.54, - "learning_rate": 2.3135530854466252e-05, - "loss": 2.3454, - "step": 308100 - }, - { - "epoch": 0.54, - "learning_rate": 2.3134658914539426e-05, - "loss": 2.2789, - "step": 308110 - }, - { - "epoch": 0.54, - "learning_rate": 2.31337869746126e-05, - "loss": 2.2691, - "step": 308120 - }, - { - "epoch": 0.54, - "learning_rate": 2.313291503468577e-05, - "loss": 2.3339, - "step": 308130 - }, - { - "epoch": 0.54, - "learning_rate": 2.3132043094758947e-05, - "loss": 2.362, - "step": 308140 - }, - { - "epoch": 0.54, - "learning_rate": 2.3131171154832117e-05, - "loss": 2.4109, - "step": 308150 - }, - { - "epoch": 0.54, - "learning_rate": 2.313029921490529e-05, - "loss": 2.4519, - "step": 308160 - }, - { - "epoch": 0.54, - "learning_rate": 2.312942727497846e-05, - "loss": 2.3204, - "step": 308170 - }, - { - "epoch": 0.54, - "learning_rate": 2.312855533505164e-05, - "loss": 2.4331, - "step": 308180 - }, - { - "epoch": 0.54, - "learning_rate": 2.312768339512481e-05, - "loss": 2.3897, - "step": 308190 - }, - { - "epoch": 0.54, - "learning_rate": 2.3126811455197983e-05, - "loss": 2.3581, - "step": 308200 - }, - { - "epoch": 0.54, - "learning_rate": 2.3125939515271157e-05, - "loss": 2.4071, - "step": 308210 - }, - { - "epoch": 0.54, - "learning_rate": 2.312506757534433e-05, - "loss": 2.5047, - "step": 308220 - }, - { - "epoch": 0.54, - "learning_rate": 2.3124195635417504e-05, - "loss": 2.3848, - "step": 308230 - }, - { - "epoch": 0.54, - "learning_rate": 2.3123323695490675e-05, - "loss": 2.4267, - "step": 308240 - }, - { - "epoch": 0.54, - "learning_rate": 2.3122451755563852e-05, - "loss": 2.3446, - "step": 308250 - }, - { - "epoch": 0.54, - "learning_rate": 2.3121579815637022e-05, - "loss": 2.2854, - "step": 308260 - }, - { - "epoch": 0.54, - "learning_rate": 2.3120707875710196e-05, - "loss": 2.368, - "step": 308270 - }, - { - "epoch": 0.54, - "learning_rate": 2.311983593578337e-05, - "loss": 2.3558, - "step": 308280 - }, - { - "epoch": 0.54, - "learning_rate": 2.3118963995856543e-05, - "loss": 2.4043, - "step": 308290 - }, - { - "epoch": 0.54, - "learning_rate": 2.3118092055929717e-05, - "loss": 2.3805, - "step": 308300 - }, - { - "epoch": 0.54, - "learning_rate": 2.3117220116002888e-05, - "loss": 2.2663, - "step": 308310 - }, - { - "epoch": 0.54, - "learning_rate": 2.311634817607606e-05, - "loss": 2.3266, - "step": 308320 - }, - { - "epoch": 0.54, - "learning_rate": 2.3115476236149235e-05, - "loss": 2.2826, - "step": 308330 - }, - { - "epoch": 0.54, - "learning_rate": 2.311460429622241e-05, - "loss": 2.34, - "step": 308340 - }, - { - "epoch": 0.54, - "learning_rate": 2.3113732356295583e-05, - "loss": 2.2159, - "step": 308350 - }, - { - "epoch": 0.54, - "learning_rate": 2.3112860416368756e-05, - "loss": 2.2704, - "step": 308360 - }, - { - "epoch": 0.54, - "learning_rate": 2.311198847644193e-05, - "loss": 2.3178, - "step": 308370 - }, - { - "epoch": 0.54, - "learning_rate": 2.31111165365151e-05, - "loss": 2.28, - "step": 308380 - }, - { - "epoch": 0.54, - "learning_rate": 2.3110244596588274e-05, - "loss": 2.4512, - "step": 308390 - }, - { - "epoch": 0.54, - "learning_rate": 2.3109372656661448e-05, - "loss": 2.4277, - "step": 308400 - }, - { - "epoch": 0.54, - "learning_rate": 2.3108500716734622e-05, - "loss": 2.4223, - "step": 308410 - }, - { - "epoch": 0.54, - "learning_rate": 2.3107628776807792e-05, - "loss": 2.4024, - "step": 308420 - }, - { - "epoch": 0.54, - "learning_rate": 2.3106756836880966e-05, - "loss": 2.3133, - "step": 308430 - }, - { - "epoch": 0.54, - "learning_rate": 2.310588489695414e-05, - "loss": 2.4321, - "step": 308440 - }, - { - "epoch": 0.54, - "learning_rate": 2.3105012957027314e-05, - "loss": 2.3256, - "step": 308450 - }, - { - "epoch": 0.54, - "learning_rate": 2.3104141017100487e-05, - "loss": 2.3274, - "step": 308460 - }, - { - "epoch": 0.54, - "learning_rate": 2.310326907717366e-05, - "loss": 2.399, - "step": 308470 - }, - { - "epoch": 0.54, - "learning_rate": 2.3102397137246835e-05, - "loss": 2.2953, - "step": 308480 - }, - { - "epoch": 0.54, - "learning_rate": 2.3101525197320005e-05, - "loss": 2.4566, - "step": 308490 - }, - { - "epoch": 0.54, - "learning_rate": 2.310065325739318e-05, - "loss": 2.2903, - "step": 308500 - }, - { - "epoch": 0.54, - "learning_rate": 2.3099781317466353e-05, - "loss": 2.4233, - "step": 308510 - }, - { - "epoch": 0.54, - "learning_rate": 2.3098909377539527e-05, - "loss": 2.3966, - "step": 308520 - }, - { - "epoch": 0.54, - "learning_rate": 2.30980374376127e-05, - "loss": 2.3474, - "step": 308530 - }, - { - "epoch": 0.54, - "learning_rate": 2.309716549768587e-05, - "loss": 2.2508, - "step": 308540 - }, - { - "epoch": 0.54, - "learning_rate": 2.3096293557759048e-05, - "loss": 2.3078, - "step": 308550 - }, - { - "epoch": 0.54, - "learning_rate": 2.3095421617832218e-05, - "loss": 2.4158, - "step": 308560 - }, - { - "epoch": 0.54, - "learning_rate": 2.3094549677905392e-05, - "loss": 2.3783, - "step": 308570 - }, - { - "epoch": 0.54, - "learning_rate": 2.3093677737978562e-05, - "loss": 2.4238, - "step": 308580 - }, - { - "epoch": 0.54, - "learning_rate": 2.309280579805174e-05, - "loss": 2.3675, - "step": 308590 - }, - { - "epoch": 0.54, - "learning_rate": 2.3091933858124913e-05, - "loss": 2.3529, - "step": 308600 - }, - { - "epoch": 0.54, - "learning_rate": 2.3091061918198084e-05, - "loss": 2.4153, - "step": 308610 - }, - { - "epoch": 0.54, - "learning_rate": 2.309018997827126e-05, - "loss": 2.1741, - "step": 308620 - }, - { - "epoch": 0.54, - "learning_rate": 2.308931803834443e-05, - "loss": 2.345, - "step": 308630 - }, - { - "epoch": 0.54, - "learning_rate": 2.3088446098417605e-05, - "loss": 2.2745, - "step": 308640 - }, - { - "epoch": 0.54, - "learning_rate": 2.3087574158490775e-05, - "loss": 2.2047, - "step": 308650 - }, - { - "epoch": 0.54, - "learning_rate": 2.3086702218563953e-05, - "loss": 2.4047, - "step": 308660 - }, - { - "epoch": 0.54, - "learning_rate": 2.3085830278637123e-05, - "loss": 2.4789, - "step": 308670 - }, - { - "epoch": 0.54, - "learning_rate": 2.3084958338710297e-05, - "loss": 2.3106, - "step": 308680 - }, - { - "epoch": 0.54, - "learning_rate": 2.308408639878347e-05, - "loss": 2.32, - "step": 308690 - }, - { - "epoch": 0.54, - "learning_rate": 2.3083214458856644e-05, - "loss": 2.3605, - "step": 308700 - }, - { - "epoch": 0.54, - "learning_rate": 2.3082342518929818e-05, - "loss": 2.3522, - "step": 308710 - }, - { - "epoch": 0.54, - "learning_rate": 2.308147057900299e-05, - "loss": 2.333, - "step": 308720 - }, - { - "epoch": 0.54, - "learning_rate": 2.3080598639076162e-05, - "loss": 2.3514, - "step": 308730 - }, - { - "epoch": 0.54, - "learning_rate": 2.3079726699149336e-05, - "loss": 2.3047, - "step": 308740 - }, - { - "epoch": 0.54, - "learning_rate": 2.307885475922251e-05, - "loss": 2.4302, - "step": 308750 - }, - { - "epoch": 0.54, - "learning_rate": 2.3077982819295684e-05, - "loss": 2.4445, - "step": 308760 - }, - { - "epoch": 0.54, - "learning_rate": 2.3077110879368857e-05, - "loss": 2.2356, - "step": 308770 - }, - { - "epoch": 0.54, - "learning_rate": 2.307623893944203e-05, - "loss": 2.3144, - "step": 308780 - }, - { - "epoch": 0.54, - "learning_rate": 2.30753669995152e-05, - "loss": 2.327, - "step": 308790 - }, - { - "epoch": 0.54, - "learning_rate": 2.3074495059588375e-05, - "loss": 2.3684, - "step": 308800 - }, - { - "epoch": 0.54, - "learning_rate": 2.307362311966155e-05, - "loss": 2.3763, - "step": 308810 - }, - { - "epoch": 0.54, - "learning_rate": 2.3072751179734723e-05, - "loss": 2.4955, - "step": 308820 - }, - { - "epoch": 0.54, - "learning_rate": 2.3071879239807893e-05, - "loss": 2.217, - "step": 308830 - }, - { - "epoch": 0.54, - "learning_rate": 2.3071007299881067e-05, - "loss": 2.3307, - "step": 308840 - }, - { - "epoch": 0.54, - "learning_rate": 2.3070135359954244e-05, - "loss": 2.3995, - "step": 308850 - }, - { - "epoch": 0.54, - "learning_rate": 2.3069263420027414e-05, - "loss": 2.3188, - "step": 308860 - }, - { - "epoch": 0.54, - "learning_rate": 2.3068391480100588e-05, - "loss": 2.4257, - "step": 308870 - }, - { - "epoch": 0.54, - "learning_rate": 2.3067519540173762e-05, - "loss": 2.358, - "step": 308880 - }, - { - "epoch": 0.54, - "learning_rate": 2.3066647600246936e-05, - "loss": 2.3219, - "step": 308890 - }, - { - "epoch": 0.54, - "learning_rate": 2.3065775660320106e-05, - "loss": 2.3955, - "step": 308900 - }, - { - "epoch": 0.54, - "learning_rate": 2.306490372039328e-05, - "loss": 2.3413, - "step": 308910 - }, - { - "epoch": 0.54, - "learning_rate": 2.3064031780466454e-05, - "loss": 2.2109, - "step": 308920 - }, - { - "epoch": 0.54, - "learning_rate": 2.3063159840539627e-05, - "loss": 2.4715, - "step": 308930 - }, - { - "epoch": 0.54, - "learning_rate": 2.30622879006128e-05, - "loss": 2.4194, - "step": 308940 - }, - { - "epoch": 0.54, - "learning_rate": 2.306141596068597e-05, - "loss": 2.4249, - "step": 308950 - }, - { - "epoch": 0.54, - "learning_rate": 2.306054402075915e-05, - "loss": 2.3834, - "step": 308960 - }, - { - "epoch": 0.54, - "learning_rate": 2.305967208083232e-05, - "loss": 2.3294, - "step": 308970 - }, - { - "epoch": 0.54, - "learning_rate": 2.3058800140905493e-05, - "loss": 2.3259, - "step": 308980 - }, - { - "epoch": 0.54, - "learning_rate": 2.3057928200978667e-05, - "loss": 2.3885, - "step": 308990 - }, - { - "epoch": 0.54, - "learning_rate": 2.305705626105184e-05, - "loss": 2.3564, - "step": 309000 - }, - { - "epoch": 0.54, - "learning_rate": 2.3056184321125014e-05, - "loss": 2.4174, - "step": 309010 - }, - { - "epoch": 0.54, - "learning_rate": 2.3055312381198185e-05, - "loss": 2.3482, - "step": 309020 - }, - { - "epoch": 0.54, - "learning_rate": 2.3054440441271362e-05, - "loss": 2.3369, - "step": 309030 - }, - { - "epoch": 0.54, - "learning_rate": 2.3053568501344532e-05, - "loss": 2.2842, - "step": 309040 - }, - { - "epoch": 0.54, - "learning_rate": 2.3052696561417706e-05, - "loss": 2.3913, - "step": 309050 - }, - { - "epoch": 0.54, - "learning_rate": 2.3051824621490876e-05, - "loss": 2.3162, - "step": 309060 - }, - { - "epoch": 0.54, - "learning_rate": 2.3050952681564053e-05, - "loss": 2.4402, - "step": 309070 - }, - { - "epoch": 0.54, - "learning_rate": 2.3050080741637227e-05, - "loss": 2.3623, - "step": 309080 - }, - { - "epoch": 0.54, - "learning_rate": 2.3049208801710398e-05, - "loss": 2.3617, - "step": 309090 - }, - { - "epoch": 0.54, - "learning_rate": 2.304833686178357e-05, - "loss": 2.2225, - "step": 309100 - }, - { - "epoch": 0.54, - "learning_rate": 2.3047464921856745e-05, - "loss": 2.4258, - "step": 309110 - }, - { - "epoch": 0.54, - "learning_rate": 2.304659298192992e-05, - "loss": 2.2446, - "step": 309120 - }, - { - "epoch": 0.54, - "learning_rate": 2.304572104200309e-05, - "loss": 2.418, - "step": 309130 - }, - { - "epoch": 0.54, - "learning_rate": 2.3044849102076266e-05, - "loss": 2.282, - "step": 309140 - }, - { - "epoch": 0.54, - "learning_rate": 2.3043977162149437e-05, - "loss": 2.3853, - "step": 309150 - }, - { - "epoch": 0.54, - "learning_rate": 2.304310522222261e-05, - "loss": 2.3168, - "step": 309160 - }, - { - "epoch": 0.54, - "learning_rate": 2.3042233282295784e-05, - "loss": 2.3995, - "step": 309170 - }, - { - "epoch": 0.54, - "learning_rate": 2.3041361342368958e-05, - "loss": 2.2738, - "step": 309180 - }, - { - "epoch": 0.54, - "learning_rate": 2.3040489402442132e-05, - "loss": 2.318, - "step": 309190 - }, - { - "epoch": 0.54, - "learning_rate": 2.3039617462515302e-05, - "loss": 2.2969, - "step": 309200 - }, - { - "epoch": 0.54, - "learning_rate": 2.3038745522588476e-05, - "loss": 2.2593, - "step": 309210 - }, - { - "epoch": 0.54, - "learning_rate": 2.303787358266165e-05, - "loss": 2.3654, - "step": 309220 - }, - { - "epoch": 0.54, - "learning_rate": 2.3037001642734824e-05, - "loss": 2.3673, - "step": 309230 - }, - { - "epoch": 0.54, - "learning_rate": 2.3036129702807997e-05, - "loss": 2.3284, - "step": 309240 - }, - { - "epoch": 0.54, - "learning_rate": 2.3035257762881168e-05, - "loss": 2.3593, - "step": 309250 - }, - { - "epoch": 0.54, - "learning_rate": 2.3034385822954345e-05, - "loss": 2.3454, - "step": 309260 - }, - { - "epoch": 0.54, - "learning_rate": 2.3033513883027515e-05, - "loss": 2.3303, - "step": 309270 - }, - { - "epoch": 0.54, - "learning_rate": 2.303264194310069e-05, - "loss": 2.3101, - "step": 309280 - }, - { - "epoch": 0.54, - "learning_rate": 2.3031770003173863e-05, - "loss": 2.3515, - "step": 309290 - }, - { - "epoch": 0.54, - "learning_rate": 2.3030898063247037e-05, - "loss": 2.4038, - "step": 309300 - }, - { - "epoch": 0.54, - "learning_rate": 2.3030026123320207e-05, - "loss": 2.2953, - "step": 309310 - }, - { - "epoch": 0.54, - "learning_rate": 2.302915418339338e-05, - "loss": 2.3679, - "step": 309320 - }, - { - "epoch": 0.54, - "learning_rate": 2.3028282243466558e-05, - "loss": 2.3405, - "step": 309330 - }, - { - "epoch": 0.54, - "learning_rate": 2.3027410303539728e-05, - "loss": 2.395, - "step": 309340 - }, - { - "epoch": 0.54, - "learning_rate": 2.3026538363612902e-05, - "loss": 2.3237, - "step": 309350 - }, - { - "epoch": 0.54, - "learning_rate": 2.3025666423686072e-05, - "loss": 2.3769, - "step": 309360 - }, - { - "epoch": 0.54, - "learning_rate": 2.302479448375925e-05, - "loss": 2.3819, - "step": 309370 - }, - { - "epoch": 0.54, - "learning_rate": 2.302392254383242e-05, - "loss": 2.2777, - "step": 309380 - }, - { - "epoch": 0.54, - "learning_rate": 2.3023050603905594e-05, - "loss": 2.3574, - "step": 309390 - }, - { - "epoch": 0.54, - "learning_rate": 2.3022178663978768e-05, - "loss": 2.2716, - "step": 309400 - }, - { - "epoch": 0.54, - "learning_rate": 2.302130672405194e-05, - "loss": 2.3514, - "step": 309410 - }, - { - "epoch": 0.54, - "learning_rate": 2.3020434784125115e-05, - "loss": 2.2668, - "step": 309420 - }, - { - "epoch": 0.54, - "learning_rate": 2.3019562844198285e-05, - "loss": 2.3517, - "step": 309430 - }, - { - "epoch": 0.54, - "learning_rate": 2.3018690904271463e-05, - "loss": 2.2889, - "step": 309440 - }, - { - "epoch": 0.54, - "learning_rate": 2.3017818964344633e-05, - "loss": 2.3778, - "step": 309450 - }, - { - "epoch": 0.54, - "learning_rate": 2.3016947024417807e-05, - "loss": 2.269, - "step": 309460 - }, - { - "epoch": 0.54, - "learning_rate": 2.301607508449098e-05, - "loss": 2.3228, - "step": 309470 - }, - { - "epoch": 0.54, - "learning_rate": 2.3015203144564154e-05, - "loss": 2.3774, - "step": 309480 - }, - { - "epoch": 0.54, - "learning_rate": 2.3014331204637328e-05, - "loss": 2.4254, - "step": 309490 - }, - { - "epoch": 0.54, - "learning_rate": 2.30134592647105e-05, - "loss": 2.2631, - "step": 309500 - }, - { - "epoch": 0.54, - "learning_rate": 2.3012587324783672e-05, - "loss": 2.4287, - "step": 309510 - }, - { - "epoch": 0.54, - "learning_rate": 2.3011715384856846e-05, - "loss": 2.3152, - "step": 309520 - }, - { - "epoch": 0.54, - "learning_rate": 2.301084344493002e-05, - "loss": 2.344, - "step": 309530 - }, - { - "epoch": 0.54, - "learning_rate": 2.300997150500319e-05, - "loss": 2.2597, - "step": 309540 - }, - { - "epoch": 0.54, - "learning_rate": 2.3009099565076367e-05, - "loss": 2.2466, - "step": 309550 - }, - { - "epoch": 0.54, - "learning_rate": 2.3008227625149538e-05, - "loss": 2.3985, - "step": 309560 - }, - { - "epoch": 0.54, - "learning_rate": 2.300735568522271e-05, - "loss": 2.3702, - "step": 309570 - }, - { - "epoch": 0.54, - "learning_rate": 2.3006483745295885e-05, - "loss": 2.3853, - "step": 309580 - }, - { - "epoch": 0.54, - "learning_rate": 2.300561180536906e-05, - "loss": 2.3261, - "step": 309590 - }, - { - "epoch": 0.54, - "learning_rate": 2.3004739865442233e-05, - "loss": 2.4662, - "step": 309600 - }, - { - "epoch": 0.54, - "learning_rate": 2.3003867925515403e-05, - "loss": 2.2797, - "step": 309610 - }, - { - "epoch": 0.54, - "learning_rate": 2.3002995985588577e-05, - "loss": 2.4746, - "step": 309620 - }, - { - "epoch": 0.54, - "learning_rate": 2.300212404566175e-05, - "loss": 2.2587, - "step": 309630 - }, - { - "epoch": 0.54, - "learning_rate": 2.3001252105734924e-05, - "loss": 2.4215, - "step": 309640 - }, - { - "epoch": 0.54, - "learning_rate": 2.3000380165808098e-05, - "loss": 2.363, - "step": 309650 - }, - { - "epoch": 0.54, - "learning_rate": 2.299950822588127e-05, - "loss": 2.3489, - "step": 309660 - }, - { - "epoch": 0.54, - "learning_rate": 2.2998636285954446e-05, - "loss": 2.4456, - "step": 309670 - }, - { - "epoch": 0.54, - "learning_rate": 2.2997764346027616e-05, - "loss": 2.3488, - "step": 309680 - }, - { - "epoch": 0.54, - "learning_rate": 2.299689240610079e-05, - "loss": 2.454, - "step": 309690 - }, - { - "epoch": 0.54, - "learning_rate": 2.2996020466173964e-05, - "loss": 2.4099, - "step": 309700 - }, - { - "epoch": 0.54, - "learning_rate": 2.2995148526247137e-05, - "loss": 2.5074, - "step": 309710 - }, - { - "epoch": 0.54, - "learning_rate": 2.299427658632031e-05, - "loss": 2.3912, - "step": 309720 - }, - { - "epoch": 0.54, - "learning_rate": 2.299340464639348e-05, - "loss": 2.385, - "step": 309730 - }, - { - "epoch": 0.54, - "learning_rate": 2.299253270646666e-05, - "loss": 2.3678, - "step": 309740 - }, - { - "epoch": 0.54, - "learning_rate": 2.299166076653983e-05, - "loss": 2.4252, - "step": 309750 - }, - { - "epoch": 0.54, - "learning_rate": 2.2990788826613003e-05, - "loss": 2.2554, - "step": 309760 - }, - { - "epoch": 0.54, - "learning_rate": 2.2989916886686173e-05, - "loss": 2.3676, - "step": 309770 - }, - { - "epoch": 0.54, - "learning_rate": 2.298904494675935e-05, - "loss": 2.324, - "step": 309780 - }, - { - "epoch": 0.54, - "learning_rate": 2.298817300683252e-05, - "loss": 2.2739, - "step": 309790 - }, - { - "epoch": 0.54, - "learning_rate": 2.2987301066905695e-05, - "loss": 2.3458, - "step": 309800 - }, - { - "epoch": 0.54, - "learning_rate": 2.2986429126978872e-05, - "loss": 2.4042, - "step": 309810 - }, - { - "epoch": 0.54, - "learning_rate": 2.2985557187052042e-05, - "loss": 2.3376, - "step": 309820 - }, - { - "epoch": 0.54, - "learning_rate": 2.2984685247125216e-05, - "loss": 2.3121, - "step": 309830 - }, - { - "epoch": 0.54, - "learning_rate": 2.2983813307198386e-05, - "loss": 2.438, - "step": 309840 - }, - { - "epoch": 0.54, - "learning_rate": 2.2982941367271563e-05, - "loss": 2.3564, - "step": 309850 - }, - { - "epoch": 0.54, - "learning_rate": 2.2982069427344734e-05, - "loss": 2.4303, - "step": 309860 - }, - { - "epoch": 0.54, - "learning_rate": 2.2981197487417908e-05, - "loss": 2.3761, - "step": 309870 - }, - { - "epoch": 0.54, - "learning_rate": 2.298032554749108e-05, - "loss": 2.365, - "step": 309880 - }, - { - "epoch": 0.54, - "learning_rate": 2.2979453607564255e-05, - "loss": 2.2526, - "step": 309890 - }, - { - "epoch": 0.54, - "learning_rate": 2.297858166763743e-05, - "loss": 2.327, - "step": 309900 - }, - { - "epoch": 0.54, - "learning_rate": 2.29777097277106e-05, - "loss": 2.3498, - "step": 309910 - }, - { - "epoch": 0.54, - "learning_rate": 2.2976837787783773e-05, - "loss": 2.3462, - "step": 309920 - }, - { - "epoch": 0.54, - "learning_rate": 2.2975965847856947e-05, - "loss": 2.3909, - "step": 309930 - }, - { - "epoch": 0.54, - "learning_rate": 2.297509390793012e-05, - "loss": 2.3666, - "step": 309940 - }, - { - "epoch": 0.54, - "learning_rate": 2.2974221968003294e-05, - "loss": 2.4615, - "step": 309950 - }, - { - "epoch": 0.54, - "learning_rate": 2.2973350028076468e-05, - "loss": 2.3342, - "step": 309960 - }, - { - "epoch": 0.54, - "learning_rate": 2.2972478088149642e-05, - "loss": 2.4468, - "step": 309970 - }, - { - "epoch": 0.54, - "learning_rate": 2.2971606148222812e-05, - "loss": 2.3805, - "step": 309980 - }, - { - "epoch": 0.54, - "learning_rate": 2.2970734208295986e-05, - "loss": 2.3317, - "step": 309990 - }, - { - "epoch": 0.54, - "learning_rate": 2.296986226836916e-05, - "loss": 2.3041, - "step": 310000 - }, - { - "epoch": 0.54, - "learning_rate": 2.2968990328442334e-05, - "loss": 2.2814, - "step": 310010 - }, - { - "epoch": 0.54, - "learning_rate": 2.2968118388515504e-05, - "loss": 2.3631, - "step": 310020 - }, - { - "epoch": 0.54, - "learning_rate": 2.2967246448588678e-05, - "loss": 2.3224, - "step": 310030 - }, - { - "epoch": 0.54, - "learning_rate": 2.296637450866185e-05, - "loss": 2.4179, - "step": 310040 - }, - { - "epoch": 0.54, - "learning_rate": 2.2965502568735025e-05, - "loss": 2.2716, - "step": 310050 - }, - { - "epoch": 0.54, - "learning_rate": 2.29646306288082e-05, - "loss": 2.2581, - "step": 310060 - }, - { - "epoch": 0.54, - "learning_rate": 2.2963758688881373e-05, - "loss": 2.3106, - "step": 310070 - }, - { - "epoch": 0.54, - "learning_rate": 2.2962886748954547e-05, - "loss": 2.4251, - "step": 310080 - }, - { - "epoch": 0.54, - "learning_rate": 2.2962014809027717e-05, - "loss": 2.308, - "step": 310090 - }, - { - "epoch": 0.54, - "learning_rate": 2.296114286910089e-05, - "loss": 2.389, - "step": 310100 - }, - { - "epoch": 0.54, - "learning_rate": 2.2960270929174065e-05, - "loss": 2.2577, - "step": 310110 - }, - { - "epoch": 0.54, - "learning_rate": 2.2959398989247238e-05, - "loss": 2.3306, - "step": 310120 - }, - { - "epoch": 0.54, - "learning_rate": 2.2958527049320412e-05, - "loss": 2.3226, - "step": 310130 - }, - { - "epoch": 0.54, - "learning_rate": 2.2957655109393582e-05, - "loss": 2.355, - "step": 310140 - }, - { - "epoch": 0.54, - "learning_rate": 2.295678316946676e-05, - "loss": 2.5563, - "step": 310150 - }, - { - "epoch": 0.54, - "learning_rate": 2.295591122953993e-05, - "loss": 2.3578, - "step": 310160 - }, - { - "epoch": 0.54, - "learning_rate": 2.2955039289613104e-05, - "loss": 2.4279, - "step": 310170 - }, - { - "epoch": 0.54, - "learning_rate": 2.2954167349686274e-05, - "loss": 2.269, - "step": 310180 - }, - { - "epoch": 0.54, - "learning_rate": 2.295329540975945e-05, - "loss": 2.3533, - "step": 310190 - }, - { - "epoch": 0.54, - "learning_rate": 2.2952423469832625e-05, - "loss": 2.2829, - "step": 310200 - }, - { - "epoch": 0.54, - "learning_rate": 2.2951551529905795e-05, - "loss": 2.2822, - "step": 310210 - }, - { - "epoch": 0.54, - "learning_rate": 2.2950679589978973e-05, - "loss": 2.3241, - "step": 310220 - }, - { - "epoch": 0.54, - "learning_rate": 2.2949807650052143e-05, - "loss": 2.2963, - "step": 310230 - }, - { - "epoch": 0.54, - "learning_rate": 2.2948935710125317e-05, - "loss": 2.3264, - "step": 310240 - }, - { - "epoch": 0.54, - "learning_rate": 2.2948063770198487e-05, - "loss": 2.3063, - "step": 310250 - }, - { - "epoch": 0.54, - "learning_rate": 2.2947191830271664e-05, - "loss": 2.299, - "step": 310260 - }, - { - "epoch": 0.54, - "learning_rate": 2.2946319890344835e-05, - "loss": 2.3937, - "step": 310270 - }, - { - "epoch": 0.54, - "learning_rate": 2.294544795041801e-05, - "loss": 2.4553, - "step": 310280 - }, - { - "epoch": 0.54, - "learning_rate": 2.2944576010491182e-05, - "loss": 2.391, - "step": 310290 - }, - { - "epoch": 0.54, - "learning_rate": 2.2943704070564356e-05, - "loss": 2.3434, - "step": 310300 - }, - { - "epoch": 0.54, - "learning_rate": 2.294283213063753e-05, - "loss": 2.296, - "step": 310310 - }, - { - "epoch": 0.54, - "learning_rate": 2.29419601907107e-05, - "loss": 2.3769, - "step": 310320 - }, - { - "epoch": 0.54, - "learning_rate": 2.2941088250783877e-05, - "loss": 2.3734, - "step": 310330 - }, - { - "epoch": 0.54, - "learning_rate": 2.2940216310857048e-05, - "loss": 2.4788, - "step": 310340 - }, - { - "epoch": 0.54, - "learning_rate": 2.293934437093022e-05, - "loss": 2.3037, - "step": 310350 - }, - { - "epoch": 0.54, - "learning_rate": 2.2938472431003395e-05, - "loss": 2.3024, - "step": 310360 - }, - { - "epoch": 0.54, - "learning_rate": 2.293760049107657e-05, - "loss": 2.3725, - "step": 310370 - }, - { - "epoch": 0.54, - "learning_rate": 2.2936728551149743e-05, - "loss": 2.4222, - "step": 310380 - }, - { - "epoch": 0.54, - "learning_rate": 2.2935856611222913e-05, - "loss": 2.4066, - "step": 310390 - }, - { - "epoch": 0.54, - "learning_rate": 2.2934984671296087e-05, - "loss": 2.2567, - "step": 310400 - }, - { - "epoch": 0.54, - "learning_rate": 2.293411273136926e-05, - "loss": 2.3455, - "step": 310410 - }, - { - "epoch": 0.54, - "learning_rate": 2.2933240791442434e-05, - "loss": 2.3122, - "step": 310420 - }, - { - "epoch": 0.54, - "learning_rate": 2.2932368851515608e-05, - "loss": 2.4473, - "step": 310430 - }, - { - "epoch": 0.54, - "learning_rate": 2.293149691158878e-05, - "loss": 2.3213, - "step": 310440 - }, - { - "epoch": 0.54, - "learning_rate": 2.2930624971661956e-05, - "loss": 2.4715, - "step": 310450 - }, - { - "epoch": 0.54, - "learning_rate": 2.2929753031735126e-05, - "loss": 2.3872, - "step": 310460 - }, - { - "epoch": 0.54, - "learning_rate": 2.29288810918083e-05, - "loss": 2.3489, - "step": 310470 - }, - { - "epoch": 0.54, - "learning_rate": 2.2928009151881474e-05, - "loss": 2.3108, - "step": 310480 - }, - { - "epoch": 0.54, - "learning_rate": 2.2927137211954647e-05, - "loss": 2.4139, - "step": 310490 - }, - { - "epoch": 0.54, - "learning_rate": 2.2926265272027818e-05, - "loss": 2.3336, - "step": 310500 - }, - { - "epoch": 0.54, - "learning_rate": 2.292539333210099e-05, - "loss": 2.3945, - "step": 310510 - }, - { - "epoch": 0.54, - "learning_rate": 2.2924521392174165e-05, - "loss": 2.4009, - "step": 310520 - }, - { - "epoch": 0.54, - "learning_rate": 2.292364945224734e-05, - "loss": 2.3049, - "step": 310530 - }, - { - "epoch": 0.54, - "learning_rate": 2.2922777512320513e-05, - "loss": 2.3334, - "step": 310540 - }, - { - "epoch": 0.54, - "learning_rate": 2.2921905572393683e-05, - "loss": 2.3231, - "step": 310550 - }, - { - "epoch": 0.54, - "learning_rate": 2.292103363246686e-05, - "loss": 2.3574, - "step": 310560 - }, - { - "epoch": 0.54, - "learning_rate": 2.292016169254003e-05, - "loss": 2.3374, - "step": 310570 - }, - { - "epoch": 0.54, - "learning_rate": 2.2919289752613205e-05, - "loss": 2.315, - "step": 310580 - }, - { - "epoch": 0.54, - "learning_rate": 2.291841781268638e-05, - "loss": 2.3086, - "step": 310590 - }, - { - "epoch": 0.54, - "learning_rate": 2.2917545872759552e-05, - "loss": 2.2405, - "step": 310600 - }, - { - "epoch": 0.54, - "learning_rate": 2.2916673932832726e-05, - "loss": 2.3102, - "step": 310610 - }, - { - "epoch": 0.54, - "learning_rate": 2.2915801992905896e-05, - "loss": 2.3825, - "step": 310620 - }, - { - "epoch": 0.54, - "learning_rate": 2.2914930052979073e-05, - "loss": 2.2727, - "step": 310630 - }, - { - "epoch": 0.54, - "learning_rate": 2.2914058113052244e-05, - "loss": 2.2433, - "step": 310640 - }, - { - "epoch": 0.54, - "learning_rate": 2.2913186173125418e-05, - "loss": 2.3138, - "step": 310650 - }, - { - "epoch": 0.54, - "learning_rate": 2.2912314233198588e-05, - "loss": 2.363, - "step": 310660 - }, - { - "epoch": 0.54, - "learning_rate": 2.2911442293271765e-05, - "loss": 2.303, - "step": 310670 - }, - { - "epoch": 0.54, - "learning_rate": 2.291057035334494e-05, - "loss": 2.2752, - "step": 310680 - }, - { - "epoch": 0.54, - "learning_rate": 2.290969841341811e-05, - "loss": 2.3406, - "step": 310690 - }, - { - "epoch": 0.54, - "learning_rate": 2.2908826473491283e-05, - "loss": 2.2835, - "step": 310700 - }, - { - "epoch": 0.54, - "learning_rate": 2.2907954533564457e-05, - "loss": 2.2091, - "step": 310710 - }, - { - "epoch": 0.54, - "learning_rate": 2.290708259363763e-05, - "loss": 2.3464, - "step": 310720 - }, - { - "epoch": 0.54, - "learning_rate": 2.29062106537108e-05, - "loss": 2.4372, - "step": 310730 - }, - { - "epoch": 0.54, - "learning_rate": 2.2905338713783978e-05, - "loss": 2.3064, - "step": 310740 - }, - { - "epoch": 0.54, - "learning_rate": 2.290446677385715e-05, - "loss": 2.3329, - "step": 310750 - }, - { - "epoch": 0.54, - "learning_rate": 2.2903594833930322e-05, - "loss": 2.3609, - "step": 310760 - }, - { - "epoch": 0.54, - "learning_rate": 2.2902722894003496e-05, - "loss": 2.3469, - "step": 310770 - }, - { - "epoch": 0.54, - "learning_rate": 2.290185095407667e-05, - "loss": 2.4503, - "step": 310780 - }, - { - "epoch": 0.54, - "learning_rate": 2.2900979014149844e-05, - "loss": 2.3143, - "step": 310790 - }, - { - "epoch": 0.54, - "learning_rate": 2.2900107074223014e-05, - "loss": 2.3876, - "step": 310800 - }, - { - "epoch": 0.54, - "learning_rate": 2.2899235134296188e-05, - "loss": 2.2584, - "step": 310810 - }, - { - "epoch": 0.54, - "learning_rate": 2.289836319436936e-05, - "loss": 2.3295, - "step": 310820 - }, - { - "epoch": 0.54, - "learning_rate": 2.2897491254442535e-05, - "loss": 2.4838, - "step": 310830 - }, - { - "epoch": 0.54, - "learning_rate": 2.289661931451571e-05, - "loss": 2.3394, - "step": 310840 - }, - { - "epoch": 0.54, - "learning_rate": 2.289574737458888e-05, - "loss": 2.2702, - "step": 310850 - }, - { - "epoch": 0.54, - "learning_rate": 2.2894875434662057e-05, - "loss": 2.3025, - "step": 310860 - }, - { - "epoch": 0.54, - "learning_rate": 2.2894003494735227e-05, - "loss": 2.3129, - "step": 310870 - }, - { - "epoch": 0.54, - "learning_rate": 2.28931315548084e-05, - "loss": 2.3993, - "step": 310880 - }, - { - "epoch": 0.54, - "learning_rate": 2.2892259614881575e-05, - "loss": 2.3537, - "step": 310890 - }, - { - "epoch": 0.54, - "learning_rate": 2.289138767495475e-05, - "loss": 2.2166, - "step": 310900 - }, - { - "epoch": 0.54, - "learning_rate": 2.289051573502792e-05, - "loss": 2.3975, - "step": 310910 - }, - { - "epoch": 0.54, - "learning_rate": 2.2889643795101092e-05, - "loss": 2.3784, - "step": 310920 - }, - { - "epoch": 0.54, - "learning_rate": 2.288877185517427e-05, - "loss": 2.3723, - "step": 310930 - }, - { - "epoch": 0.54, - "learning_rate": 2.288789991524744e-05, - "loss": 2.2979, - "step": 310940 - }, - { - "epoch": 0.54, - "learning_rate": 2.2887027975320614e-05, - "loss": 2.2904, - "step": 310950 - }, - { - "epoch": 0.54, - "learning_rate": 2.2886156035393784e-05, - "loss": 2.3426, - "step": 310960 - }, - { - "epoch": 0.54, - "learning_rate": 2.288528409546696e-05, - "loss": 2.2511, - "step": 310970 - }, - { - "epoch": 0.54, - "learning_rate": 2.288441215554013e-05, - "loss": 2.3457, - "step": 310980 - }, - { - "epoch": 0.54, - "learning_rate": 2.2883540215613305e-05, - "loss": 2.2078, - "step": 310990 - }, - { - "epoch": 0.54, - "learning_rate": 2.288266827568648e-05, - "loss": 2.2612, - "step": 311000 - }, - { - "epoch": 0.54, - "learning_rate": 2.2881796335759653e-05, - "loss": 2.5342, - "step": 311010 - }, - { - "epoch": 0.54, - "learning_rate": 2.2880924395832827e-05, - "loss": 2.4467, - "step": 311020 - }, - { - "epoch": 0.54, - "learning_rate": 2.2880052455905997e-05, - "loss": 2.3114, - "step": 311030 - }, - { - "epoch": 0.54, - "learning_rate": 2.2879180515979174e-05, - "loss": 2.2962, - "step": 311040 - }, - { - "epoch": 0.54, - "learning_rate": 2.2878308576052345e-05, - "loss": 2.4604, - "step": 311050 - }, - { - "epoch": 0.54, - "learning_rate": 2.287743663612552e-05, - "loss": 2.4393, - "step": 311060 - }, - { - "epoch": 0.54, - "learning_rate": 2.2876564696198692e-05, - "loss": 2.3673, - "step": 311070 - }, - { - "epoch": 0.54, - "learning_rate": 2.2875692756271866e-05, - "loss": 2.3692, - "step": 311080 - }, - { - "epoch": 0.54, - "learning_rate": 2.287482081634504e-05, - "loss": 2.3674, - "step": 311090 - }, - { - "epoch": 0.54, - "learning_rate": 2.287394887641821e-05, - "loss": 2.3624, - "step": 311100 - }, - { - "epoch": 0.54, - "learning_rate": 2.2873076936491384e-05, - "loss": 2.4216, - "step": 311110 - }, - { - "epoch": 0.54, - "learning_rate": 2.2872204996564558e-05, - "loss": 2.2208, - "step": 311120 - }, - { - "epoch": 0.54, - "learning_rate": 2.287133305663773e-05, - "loss": 2.3237, - "step": 311130 - }, - { - "epoch": 0.54, - "learning_rate": 2.2870461116710902e-05, - "loss": 2.223, - "step": 311140 - }, - { - "epoch": 0.54, - "learning_rate": 2.286958917678408e-05, - "loss": 2.3978, - "step": 311150 - }, - { - "epoch": 0.54, - "learning_rate": 2.2868717236857253e-05, - "loss": 2.378, - "step": 311160 - }, - { - "epoch": 0.54, - "learning_rate": 2.2867845296930423e-05, - "loss": 2.2223, - "step": 311170 - }, - { - "epoch": 0.54, - "learning_rate": 2.2866973357003597e-05, - "loss": 2.4554, - "step": 311180 - }, - { - "epoch": 0.54, - "learning_rate": 2.286610141707677e-05, - "loss": 2.4338, - "step": 311190 - }, - { - "epoch": 0.54, - "learning_rate": 2.2865229477149944e-05, - "loss": 2.3135, - "step": 311200 - }, - { - "epoch": 0.54, - "learning_rate": 2.2864357537223115e-05, - "loss": 2.4422, - "step": 311210 - }, - { - "epoch": 0.54, - "learning_rate": 2.286348559729629e-05, - "loss": 2.2733, - "step": 311220 - }, - { - "epoch": 0.54, - "learning_rate": 2.2862613657369462e-05, - "loss": 2.3215, - "step": 311230 - }, - { - "epoch": 0.54, - "learning_rate": 2.2861741717442636e-05, - "loss": 2.3758, - "step": 311240 - }, - { - "epoch": 0.54, - "learning_rate": 2.286086977751581e-05, - "loss": 2.3548, - "step": 311250 - }, - { - "epoch": 0.54, - "learning_rate": 2.2859997837588984e-05, - "loss": 2.3167, - "step": 311260 - }, - { - "epoch": 0.54, - "learning_rate": 2.2859125897662157e-05, - "loss": 2.315, - "step": 311270 - }, - { - "epoch": 0.54, - "learning_rate": 2.2858253957735328e-05, - "loss": 2.3294, - "step": 311280 - }, - { - "epoch": 0.54, - "learning_rate": 2.28573820178085e-05, - "loss": 2.3582, - "step": 311290 - }, - { - "epoch": 0.54, - "learning_rate": 2.2856510077881675e-05, - "loss": 2.4034, - "step": 311300 - }, - { - "epoch": 0.54, - "learning_rate": 2.285563813795485e-05, - "loss": 2.3458, - "step": 311310 - }, - { - "epoch": 0.54, - "learning_rate": 2.2854766198028023e-05, - "loss": 2.2888, - "step": 311320 - }, - { - "epoch": 0.54, - "learning_rate": 2.2853894258101193e-05, - "loss": 2.4166, - "step": 311330 - }, - { - "epoch": 0.54, - "learning_rate": 2.285302231817437e-05, - "loss": 2.3493, - "step": 311340 - }, - { - "epoch": 0.54, - "learning_rate": 2.285215037824754e-05, - "loss": 2.34, - "step": 311350 - }, - { - "epoch": 0.54, - "learning_rate": 2.2851278438320715e-05, - "loss": 2.3402, - "step": 311360 - }, - { - "epoch": 0.54, - "learning_rate": 2.2850406498393885e-05, - "loss": 2.3165, - "step": 311370 - }, - { - "epoch": 0.54, - "learning_rate": 2.2849534558467062e-05, - "loss": 2.3194, - "step": 311380 - }, - { - "epoch": 0.54, - "learning_rate": 2.2848662618540233e-05, - "loss": 2.407, - "step": 311390 - }, - { - "epoch": 0.54, - "learning_rate": 2.2847790678613406e-05, - "loss": 2.3345, - "step": 311400 - }, - { - "epoch": 0.54, - "learning_rate": 2.2846918738686583e-05, - "loss": 2.3859, - "step": 311410 - }, - { - "epoch": 0.54, - "learning_rate": 2.2846046798759754e-05, - "loss": 2.3354, - "step": 311420 - }, - { - "epoch": 0.54, - "learning_rate": 2.2845174858832928e-05, - "loss": 2.339, - "step": 311430 - }, - { - "epoch": 0.54, - "learning_rate": 2.2844302918906098e-05, - "loss": 2.2823, - "step": 311440 - }, - { - "epoch": 0.54, - "learning_rate": 2.2843430978979275e-05, - "loss": 2.456, - "step": 311450 - }, - { - "epoch": 0.54, - "learning_rate": 2.2842559039052446e-05, - "loss": 2.4084, - "step": 311460 - }, - { - "epoch": 0.54, - "learning_rate": 2.284168709912562e-05, - "loss": 2.2694, - "step": 311470 - }, - { - "epoch": 0.54, - "learning_rate": 2.2840815159198793e-05, - "loss": 2.3406, - "step": 311480 - }, - { - "epoch": 0.54, - "learning_rate": 2.2839943219271967e-05, - "loss": 2.3504, - "step": 311490 - }, - { - "epoch": 0.54, - "learning_rate": 2.283907127934514e-05, - "loss": 2.3869, - "step": 311500 - }, - { - "epoch": 0.54, - "learning_rate": 2.283819933941831e-05, - "loss": 2.4069, - "step": 311510 - }, - { - "epoch": 0.54, - "learning_rate": 2.2837327399491485e-05, - "loss": 2.3829, - "step": 311520 - }, - { - "epoch": 0.54, - "learning_rate": 2.283645545956466e-05, - "loss": 2.3315, - "step": 311530 - }, - { - "epoch": 0.54, - "learning_rate": 2.2835583519637832e-05, - "loss": 2.4456, - "step": 311540 - }, - { - "epoch": 0.54, - "learning_rate": 2.2834711579711006e-05, - "loss": 2.4359, - "step": 311550 - }, - { - "epoch": 0.54, - "learning_rate": 2.283383963978418e-05, - "loss": 2.3643, - "step": 311560 - }, - { - "epoch": 0.54, - "learning_rate": 2.2832967699857354e-05, - "loss": 2.3874, - "step": 311570 - }, - { - "epoch": 0.54, - "learning_rate": 2.2832095759930524e-05, - "loss": 2.2989, - "step": 311580 - }, - { - "epoch": 0.54, - "learning_rate": 2.2831223820003698e-05, - "loss": 2.4085, - "step": 311590 - }, - { - "epoch": 0.54, - "learning_rate": 2.283035188007687e-05, - "loss": 2.3794, - "step": 311600 - }, - { - "epoch": 0.54, - "learning_rate": 2.2829479940150045e-05, - "loss": 2.3747, - "step": 311610 - }, - { - "epoch": 0.54, - "learning_rate": 2.2828608000223216e-05, - "loss": 2.3575, - "step": 311620 - }, - { - "epoch": 0.54, - "learning_rate": 2.282773606029639e-05, - "loss": 2.3367, - "step": 311630 - }, - { - "epoch": 0.54, - "learning_rate": 2.2826864120369563e-05, - "loss": 2.352, - "step": 311640 - }, - { - "epoch": 0.54, - "learning_rate": 2.2825992180442737e-05, - "loss": 2.1931, - "step": 311650 - }, - { - "epoch": 0.54, - "learning_rate": 2.282512024051591e-05, - "loss": 2.4093, - "step": 311660 - }, - { - "epoch": 0.54, - "learning_rate": 2.2824248300589085e-05, - "loss": 2.3494, - "step": 311670 - }, - { - "epoch": 0.54, - "learning_rate": 2.282337636066226e-05, - "loss": 2.3825, - "step": 311680 - }, - { - "epoch": 0.54, - "learning_rate": 2.282250442073543e-05, - "loss": 2.316, - "step": 311690 - }, - { - "epoch": 0.54, - "learning_rate": 2.2821632480808602e-05, - "loss": 2.2928, - "step": 311700 - }, - { - "epoch": 0.54, - "learning_rate": 2.2820760540881776e-05, - "loss": 2.2633, - "step": 311710 - }, - { - "epoch": 0.54, - "learning_rate": 2.281988860095495e-05, - "loss": 2.2747, - "step": 311720 - }, - { - "epoch": 0.54, - "learning_rate": 2.2819016661028124e-05, - "loss": 2.4111, - "step": 311730 - }, - { - "epoch": 0.54, - "learning_rate": 2.2818144721101294e-05, - "loss": 2.3823, - "step": 311740 - }, - { - "epoch": 0.54, - "learning_rate": 2.281727278117447e-05, - "loss": 2.4038, - "step": 311750 - }, - { - "epoch": 0.54, - "learning_rate": 2.2816400841247642e-05, - "loss": 2.4854, - "step": 311760 - }, - { - "epoch": 0.54, - "learning_rate": 2.2815528901320815e-05, - "loss": 2.4312, - "step": 311770 - }, - { - "epoch": 0.54, - "learning_rate": 2.281465696139399e-05, - "loss": 2.2804, - "step": 311780 - }, - { - "epoch": 0.54, - "learning_rate": 2.2813785021467163e-05, - "loss": 2.1642, - "step": 311790 - }, - { - "epoch": 0.54, - "learning_rate": 2.2812913081540337e-05, - "loss": 2.3574, - "step": 311800 - }, - { - "epoch": 0.54, - "learning_rate": 2.2812041141613507e-05, - "loss": 2.3768, - "step": 311810 - }, - { - "epoch": 0.54, - "learning_rate": 2.2811169201686684e-05, - "loss": 2.3778, - "step": 311820 - }, - { - "epoch": 0.54, - "learning_rate": 2.2810297261759855e-05, - "loss": 2.4256, - "step": 311830 - }, - { - "epoch": 0.54, - "learning_rate": 2.280942532183303e-05, - "loss": 2.2905, - "step": 311840 - }, - { - "epoch": 0.54, - "learning_rate": 2.28085533819062e-05, - "loss": 2.3247, - "step": 311850 - }, - { - "epoch": 0.54, - "learning_rate": 2.2807681441979376e-05, - "loss": 2.403, - "step": 311860 - }, - { - "epoch": 0.54, - "learning_rate": 2.2806809502052546e-05, - "loss": 2.5187, - "step": 311870 - }, - { - "epoch": 0.54, - "learning_rate": 2.280593756212572e-05, - "loss": 2.3471, - "step": 311880 - }, - { - "epoch": 0.54, - "learning_rate": 2.2805065622198894e-05, - "loss": 2.3513, - "step": 311890 - }, - { - "epoch": 0.54, - "learning_rate": 2.2804193682272068e-05, - "loss": 2.3286, - "step": 311900 - }, - { - "epoch": 0.54, - "learning_rate": 2.280332174234524e-05, - "loss": 2.4756, - "step": 311910 - }, - { - "epoch": 0.54, - "learning_rate": 2.2802449802418412e-05, - "loss": 2.4419, - "step": 311920 - }, - { - "epoch": 0.54, - "learning_rate": 2.280157786249159e-05, - "loss": 2.2999, - "step": 311930 - }, - { - "epoch": 0.54, - "learning_rate": 2.280070592256476e-05, - "loss": 2.426, - "step": 311940 - }, - { - "epoch": 0.54, - "learning_rate": 2.2799833982637933e-05, - "loss": 2.3991, - "step": 311950 - }, - { - "epoch": 0.54, - "learning_rate": 2.2798962042711107e-05, - "loss": 2.3641, - "step": 311960 - }, - { - "epoch": 0.54, - "learning_rate": 2.279809010278428e-05, - "loss": 2.5196, - "step": 311970 - }, - { - "epoch": 0.54, - "learning_rate": 2.2797218162857454e-05, - "loss": 2.4018, - "step": 311980 - }, - { - "epoch": 0.54, - "learning_rate": 2.2796346222930625e-05, - "loss": 2.3126, - "step": 311990 - }, - { - "epoch": 0.54, - "learning_rate": 2.27954742830038e-05, - "loss": 2.2379, - "step": 312000 - }, - { - "epoch": 0.54, - "learning_rate": 2.2794602343076972e-05, - "loss": 2.4212, - "step": 312010 - }, - { - "epoch": 0.54, - "learning_rate": 2.2793730403150146e-05, - "loss": 2.4378, - "step": 312020 - }, - { - "epoch": 0.54, - "learning_rate": 2.279285846322332e-05, - "loss": 2.3503, - "step": 312030 - }, - { - "epoch": 0.54, - "learning_rate": 2.279198652329649e-05, - "loss": 2.4409, - "step": 312040 - }, - { - "epoch": 0.54, - "learning_rate": 2.2791114583369667e-05, - "loss": 2.3203, - "step": 312050 - }, - { - "epoch": 0.54, - "learning_rate": 2.2790242643442838e-05, - "loss": 2.1087, - "step": 312060 - }, - { - "epoch": 0.54, - "learning_rate": 2.278937070351601e-05, - "loss": 2.4556, - "step": 312070 - }, - { - "epoch": 0.54, - "learning_rate": 2.2788498763589185e-05, - "loss": 2.3684, - "step": 312080 - }, - { - "epoch": 0.54, - "learning_rate": 2.278762682366236e-05, - "loss": 2.4722, - "step": 312090 - }, - { - "epoch": 0.54, - "learning_rate": 2.278675488373553e-05, - "loss": 2.4132, - "step": 312100 - }, - { - "epoch": 0.54, - "learning_rate": 2.2785882943808703e-05, - "loss": 2.3748, - "step": 312110 - }, - { - "epoch": 0.54, - "learning_rate": 2.2785011003881877e-05, - "loss": 2.3852, - "step": 312120 - }, - { - "epoch": 0.54, - "learning_rate": 2.278413906395505e-05, - "loss": 2.4077, - "step": 312130 - }, - { - "epoch": 0.54, - "learning_rate": 2.2783267124028225e-05, - "loss": 2.2971, - "step": 312140 - }, - { - "epoch": 0.54, - "learning_rate": 2.2782395184101395e-05, - "loss": 2.2619, - "step": 312150 - }, - { - "epoch": 0.54, - "learning_rate": 2.2781523244174572e-05, - "loss": 2.3761, - "step": 312160 - }, - { - "epoch": 0.54, - "learning_rate": 2.2780651304247743e-05, - "loss": 2.329, - "step": 312170 - }, - { - "epoch": 0.54, - "learning_rate": 2.2779779364320916e-05, - "loss": 2.3629, - "step": 312180 - }, - { - "epoch": 0.54, - "learning_rate": 2.277890742439409e-05, - "loss": 2.2936, - "step": 312190 - }, - { - "epoch": 0.54, - "learning_rate": 2.2778035484467264e-05, - "loss": 2.4545, - "step": 312200 - }, - { - "epoch": 0.54, - "learning_rate": 2.2777163544540438e-05, - "loss": 2.3475, - "step": 312210 - }, - { - "epoch": 0.54, - "learning_rate": 2.2776291604613608e-05, - "loss": 2.3966, - "step": 312220 - }, - { - "epoch": 0.54, - "learning_rate": 2.2775419664686785e-05, - "loss": 2.4019, - "step": 312230 - }, - { - "epoch": 0.54, - "learning_rate": 2.2774547724759956e-05, - "loss": 2.3677, - "step": 312240 - }, - { - "epoch": 0.54, - "learning_rate": 2.277367578483313e-05, - "loss": 2.3732, - "step": 312250 - }, - { - "epoch": 0.54, - "learning_rate": 2.27728038449063e-05, - "loss": 2.3273, - "step": 312260 - }, - { - "epoch": 0.54, - "learning_rate": 2.2771931904979477e-05, - "loss": 2.3502, - "step": 312270 - }, - { - "epoch": 0.54, - "learning_rate": 2.277105996505265e-05, - "loss": 2.3706, - "step": 312280 - }, - { - "epoch": 0.54, - "learning_rate": 2.277018802512582e-05, - "loss": 2.3331, - "step": 312290 - }, - { - "epoch": 0.54, - "learning_rate": 2.2769316085198995e-05, - "loss": 2.2576, - "step": 312300 - }, - { - "epoch": 0.54, - "learning_rate": 2.276844414527217e-05, - "loss": 2.4447, - "step": 312310 - }, - { - "epoch": 0.54, - "learning_rate": 2.2767572205345342e-05, - "loss": 2.2985, - "step": 312320 - }, - { - "epoch": 0.54, - "learning_rate": 2.2766700265418513e-05, - "loss": 2.4391, - "step": 312330 - }, - { - "epoch": 0.54, - "learning_rate": 2.276582832549169e-05, - "loss": 2.317, - "step": 312340 - }, - { - "epoch": 0.54, - "learning_rate": 2.276495638556486e-05, - "loss": 2.3054, - "step": 312350 - }, - { - "epoch": 0.54, - "learning_rate": 2.2764084445638034e-05, - "loss": 2.2477, - "step": 312360 - }, - { - "epoch": 0.54, - "learning_rate": 2.2763212505711208e-05, - "loss": 2.2919, - "step": 312370 - }, - { - "epoch": 0.54, - "learning_rate": 2.276234056578438e-05, - "loss": 2.3586, - "step": 312380 - }, - { - "epoch": 0.54, - "learning_rate": 2.2761468625857555e-05, - "loss": 2.2678, - "step": 312390 - }, - { - "epoch": 0.54, - "learning_rate": 2.2760596685930726e-05, - "loss": 2.3322, - "step": 312400 - }, - { - "epoch": 0.54, - "learning_rate": 2.27597247460039e-05, - "loss": 2.2897, - "step": 312410 - }, - { - "epoch": 0.54, - "learning_rate": 2.2758852806077073e-05, - "loss": 2.4009, - "step": 312420 - }, - { - "epoch": 0.54, - "learning_rate": 2.2757980866150247e-05, - "loss": 2.4331, - "step": 312430 - }, - { - "epoch": 0.54, - "learning_rate": 2.275710892622342e-05, - "loss": 2.413, - "step": 312440 - }, - { - "epoch": 0.54, - "learning_rate": 2.275623698629659e-05, - "loss": 2.337, - "step": 312450 - }, - { - "epoch": 0.54, - "learning_rate": 2.275536504636977e-05, - "loss": 2.3292, - "step": 312460 - }, - { - "epoch": 0.54, - "learning_rate": 2.275449310644294e-05, - "loss": 2.3816, - "step": 312470 - }, - { - "epoch": 0.54, - "learning_rate": 2.2753621166516112e-05, - "loss": 2.3316, - "step": 312480 - }, - { - "epoch": 0.54, - "learning_rate": 2.2752749226589286e-05, - "loss": 2.2966, - "step": 312490 - }, - { - "epoch": 0.54, - "learning_rate": 2.275187728666246e-05, - "loss": 2.3637, - "step": 312500 - }, - { - "epoch": 0.54, - "learning_rate": 2.2751005346735634e-05, - "loss": 2.2694, - "step": 312510 - }, - { - "epoch": 0.54, - "learning_rate": 2.2750133406808804e-05, - "loss": 2.3574, - "step": 312520 - }, - { - "epoch": 0.55, - "learning_rate": 2.274926146688198e-05, - "loss": 2.3186, - "step": 312530 - }, - { - "epoch": 0.55, - "learning_rate": 2.2748389526955152e-05, - "loss": 2.478, - "step": 312540 - }, - { - "epoch": 0.55, - "learning_rate": 2.2747517587028325e-05, - "loss": 2.3734, - "step": 312550 - }, - { - "epoch": 0.55, - "learning_rate": 2.2746645647101496e-05, - "loss": 2.3221, - "step": 312560 - }, - { - "epoch": 0.55, - "learning_rate": 2.2745773707174673e-05, - "loss": 2.163, - "step": 312570 - }, - { - "epoch": 0.55, - "learning_rate": 2.2744901767247843e-05, - "loss": 2.3498, - "step": 312580 - }, - { - "epoch": 0.55, - "learning_rate": 2.2744029827321017e-05, - "loss": 2.2903, - "step": 312590 - }, - { - "epoch": 0.55, - "learning_rate": 2.274315788739419e-05, - "loss": 2.3541, - "step": 312600 - }, - { - "epoch": 0.55, - "learning_rate": 2.2742285947467365e-05, - "loss": 2.3343, - "step": 312610 - }, - { - "epoch": 0.55, - "learning_rate": 2.274141400754054e-05, - "loss": 2.3407, - "step": 312620 - }, - { - "epoch": 0.55, - "learning_rate": 2.274054206761371e-05, - "loss": 2.3601, - "step": 312630 - }, - { - "epoch": 0.55, - "learning_rate": 2.2739670127686886e-05, - "loss": 2.3501, - "step": 312640 - }, - { - "epoch": 0.55, - "learning_rate": 2.2738798187760056e-05, - "loss": 2.3029, - "step": 312650 - }, - { - "epoch": 0.55, - "learning_rate": 2.273792624783323e-05, - "loss": 2.2851, - "step": 312660 - }, - { - "epoch": 0.55, - "learning_rate": 2.2737054307906404e-05, - "loss": 2.3443, - "step": 312670 - }, - { - "epoch": 0.55, - "learning_rate": 2.2736182367979578e-05, - "loss": 2.3788, - "step": 312680 - }, - { - "epoch": 0.55, - "learning_rate": 2.273531042805275e-05, - "loss": 2.3382, - "step": 312690 - }, - { - "epoch": 0.55, - "learning_rate": 2.2734438488125922e-05, - "loss": 2.1886, - "step": 312700 - }, - { - "epoch": 0.55, - "learning_rate": 2.2733566548199096e-05, - "loss": 2.4349, - "step": 312710 - }, - { - "epoch": 0.55, - "learning_rate": 2.273269460827227e-05, - "loss": 2.2532, - "step": 312720 - }, - { - "epoch": 0.55, - "learning_rate": 2.2731822668345443e-05, - "loss": 2.4559, - "step": 312730 - }, - { - "epoch": 0.55, - "learning_rate": 2.2730950728418614e-05, - "loss": 2.2886, - "step": 312740 - }, - { - "epoch": 0.55, - "learning_rate": 2.273007878849179e-05, - "loss": 2.3527, - "step": 312750 - }, - { - "epoch": 0.55, - "learning_rate": 2.2729206848564964e-05, - "loss": 2.3507, - "step": 312760 - }, - { - "epoch": 0.55, - "learning_rate": 2.2728334908638135e-05, - "loss": 2.4272, - "step": 312770 - }, - { - "epoch": 0.55, - "learning_rate": 2.272746296871131e-05, - "loss": 2.272, - "step": 312780 - }, - { - "epoch": 0.55, - "learning_rate": 2.2726591028784482e-05, - "loss": 2.3665, - "step": 312790 - }, - { - "epoch": 0.55, - "learning_rate": 2.2725719088857656e-05, - "loss": 2.4617, - "step": 312800 - }, - { - "epoch": 0.55, - "learning_rate": 2.2724847148930827e-05, - "loss": 2.3528, - "step": 312810 - }, - { - "epoch": 0.55, - "learning_rate": 2.2723975209004e-05, - "loss": 2.341, - "step": 312820 - }, - { - "epoch": 0.55, - "learning_rate": 2.2723103269077174e-05, - "loss": 2.2878, - "step": 312830 - }, - { - "epoch": 0.55, - "learning_rate": 2.2722231329150348e-05, - "loss": 2.3126, - "step": 312840 - }, - { - "epoch": 0.55, - "learning_rate": 2.272135938922352e-05, - "loss": 2.3771, - "step": 312850 - }, - { - "epoch": 0.55, - "learning_rate": 2.2720487449296695e-05, - "loss": 2.3319, - "step": 312860 - }, - { - "epoch": 0.55, - "learning_rate": 2.271961550936987e-05, - "loss": 2.3409, - "step": 312870 - }, - { - "epoch": 0.55, - "learning_rate": 2.271874356944304e-05, - "loss": 2.406, - "step": 312880 - }, - { - "epoch": 0.55, - "learning_rate": 2.2717871629516213e-05, - "loss": 2.3438, - "step": 312890 - }, - { - "epoch": 0.55, - "learning_rate": 2.2716999689589387e-05, - "loss": 2.3431, - "step": 312900 - }, - { - "epoch": 0.55, - "learning_rate": 2.271612774966256e-05, - "loss": 2.2782, - "step": 312910 - }, - { - "epoch": 0.55, - "learning_rate": 2.2715255809735735e-05, - "loss": 2.3685, - "step": 312920 - }, - { - "epoch": 0.55, - "learning_rate": 2.2714383869808905e-05, - "loss": 2.2011, - "step": 312930 - }, - { - "epoch": 0.55, - "learning_rate": 2.2713511929882082e-05, - "loss": 2.3653, - "step": 312940 - }, - { - "epoch": 0.55, - "learning_rate": 2.2712639989955253e-05, - "loss": 2.3782, - "step": 312950 - }, - { - "epoch": 0.55, - "learning_rate": 2.2711768050028426e-05, - "loss": 2.4416, - "step": 312960 - }, - { - "epoch": 0.55, - "learning_rate": 2.2710896110101597e-05, - "loss": 2.2939, - "step": 312970 - }, - { - "epoch": 0.55, - "learning_rate": 2.2710024170174774e-05, - "loss": 2.3199, - "step": 312980 - }, - { - "epoch": 0.55, - "learning_rate": 2.2709152230247944e-05, - "loss": 2.3631, - "step": 312990 - }, - { - "epoch": 0.55, - "learning_rate": 2.2708280290321118e-05, - "loss": 2.2987, - "step": 313000 - }, - { - "epoch": 0.55, - "learning_rate": 2.2707408350394295e-05, - "loss": 2.2784, - "step": 313010 - }, - { - "epoch": 0.55, - "learning_rate": 2.2706536410467466e-05, - "loss": 2.261, - "step": 313020 - }, - { - "epoch": 0.55, - "learning_rate": 2.270566447054064e-05, - "loss": 2.4226, - "step": 313030 - }, - { - "epoch": 0.55, - "learning_rate": 2.270479253061381e-05, - "loss": 2.3244, - "step": 313040 - }, - { - "epoch": 0.55, - "learning_rate": 2.2703920590686987e-05, - "loss": 2.4178, - "step": 313050 - }, - { - "epoch": 0.55, - "learning_rate": 2.2703048650760157e-05, - "loss": 2.4645, - "step": 313060 - }, - { - "epoch": 0.55, - "learning_rate": 2.270217671083333e-05, - "loss": 2.2625, - "step": 313070 - }, - { - "epoch": 0.55, - "learning_rate": 2.2701304770906505e-05, - "loss": 2.4505, - "step": 313080 - }, - { - "epoch": 0.55, - "learning_rate": 2.270043283097968e-05, - "loss": 2.3709, - "step": 313090 - }, - { - "epoch": 0.55, - "learning_rate": 2.2699560891052852e-05, - "loss": 2.2381, - "step": 313100 - }, - { - "epoch": 0.55, - "learning_rate": 2.2698688951126023e-05, - "loss": 2.2715, - "step": 313110 - }, - { - "epoch": 0.55, - "learning_rate": 2.2697817011199196e-05, - "loss": 2.4123, - "step": 313120 - }, - { - "epoch": 0.55, - "learning_rate": 2.269694507127237e-05, - "loss": 2.3427, - "step": 313130 - }, - { - "epoch": 0.55, - "learning_rate": 2.2696073131345544e-05, - "loss": 2.3766, - "step": 313140 - }, - { - "epoch": 0.55, - "learning_rate": 2.2695201191418718e-05, - "loss": 2.4202, - "step": 313150 - }, - { - "epoch": 0.55, - "learning_rate": 2.269432925149189e-05, - "loss": 2.3421, - "step": 313160 - }, - { - "epoch": 0.55, - "learning_rate": 2.2693457311565065e-05, - "loss": 2.2658, - "step": 313170 - }, - { - "epoch": 0.55, - "learning_rate": 2.2692585371638236e-05, - "loss": 2.2803, - "step": 313180 - }, - { - "epoch": 0.55, - "learning_rate": 2.269171343171141e-05, - "loss": 2.3596, - "step": 313190 - }, - { - "epoch": 0.55, - "learning_rate": 2.2690841491784583e-05, - "loss": 2.2732, - "step": 313200 - }, - { - "epoch": 0.55, - "learning_rate": 2.2689969551857757e-05, - "loss": 2.4464, - "step": 313210 - }, - { - "epoch": 0.55, - "learning_rate": 2.2689097611930927e-05, - "loss": 2.2793, - "step": 313220 - }, - { - "epoch": 0.55, - "learning_rate": 2.26882256720041e-05, - "loss": 2.3806, - "step": 313230 - }, - { - "epoch": 0.55, - "learning_rate": 2.268735373207728e-05, - "loss": 2.3416, - "step": 313240 - }, - { - "epoch": 0.55, - "learning_rate": 2.268648179215045e-05, - "loss": 2.2204, - "step": 313250 - }, - { - "epoch": 0.55, - "learning_rate": 2.2685609852223622e-05, - "loss": 2.2895, - "step": 313260 - }, - { - "epoch": 0.55, - "learning_rate": 2.2684737912296796e-05, - "loss": 2.355, - "step": 313270 - }, - { - "epoch": 0.55, - "learning_rate": 2.268386597236997e-05, - "loss": 2.3114, - "step": 313280 - }, - { - "epoch": 0.55, - "learning_rate": 2.268299403244314e-05, - "loss": 2.3657, - "step": 313290 - }, - { - "epoch": 0.55, - "learning_rate": 2.2682122092516314e-05, - "loss": 2.3091, - "step": 313300 - }, - { - "epoch": 0.55, - "learning_rate": 2.2681250152589488e-05, - "loss": 2.2557, - "step": 313310 - }, - { - "epoch": 0.55, - "learning_rate": 2.2680378212662662e-05, - "loss": 2.2397, - "step": 313320 - }, - { - "epoch": 0.55, - "learning_rate": 2.2679506272735835e-05, - "loss": 2.411, - "step": 313330 - }, - { - "epoch": 0.55, - "learning_rate": 2.2678634332809006e-05, - "loss": 2.3132, - "step": 313340 - }, - { - "epoch": 0.55, - "learning_rate": 2.2677762392882183e-05, - "loss": 2.2849, - "step": 313350 - }, - { - "epoch": 0.55, - "learning_rate": 2.2676890452955353e-05, - "loss": 2.4112, - "step": 313360 - }, - { - "epoch": 0.55, - "learning_rate": 2.2676018513028527e-05, - "loss": 2.3391, - "step": 313370 - }, - { - "epoch": 0.55, - "learning_rate": 2.26751465731017e-05, - "loss": 2.3641, - "step": 313380 - }, - { - "epoch": 0.55, - "learning_rate": 2.2674274633174875e-05, - "loss": 2.249, - "step": 313390 - }, - { - "epoch": 0.55, - "learning_rate": 2.267340269324805e-05, - "loss": 2.3987, - "step": 313400 - }, - { - "epoch": 0.55, - "learning_rate": 2.267253075332122e-05, - "loss": 2.3994, - "step": 313410 - }, - { - "epoch": 0.55, - "learning_rate": 2.2671658813394396e-05, - "loss": 2.345, - "step": 313420 - }, - { - "epoch": 0.55, - "learning_rate": 2.2670786873467566e-05, - "loss": 2.3088, - "step": 313430 - }, - { - "epoch": 0.55, - "learning_rate": 2.266991493354074e-05, - "loss": 2.3802, - "step": 313440 - }, - { - "epoch": 0.55, - "learning_rate": 2.266904299361391e-05, - "loss": 2.2994, - "step": 313450 - }, - { - "epoch": 0.55, - "learning_rate": 2.2668171053687088e-05, - "loss": 2.3061, - "step": 313460 - }, - { - "epoch": 0.55, - "learning_rate": 2.2667299113760258e-05, - "loss": 2.2162, - "step": 313470 - }, - { - "epoch": 0.55, - "learning_rate": 2.2666427173833432e-05, - "loss": 2.2614, - "step": 313480 - }, - { - "epoch": 0.55, - "learning_rate": 2.2665555233906606e-05, - "loss": 2.2692, - "step": 313490 - }, - { - "epoch": 0.55, - "learning_rate": 2.266468329397978e-05, - "loss": 2.3938, - "step": 313500 - }, - { - "epoch": 0.55, - "learning_rate": 2.2663811354052953e-05, - "loss": 2.3281, - "step": 313510 - }, - { - "epoch": 0.55, - "learning_rate": 2.2662939414126124e-05, - "loss": 2.4015, - "step": 313520 - }, - { - "epoch": 0.55, - "learning_rate": 2.26620674741993e-05, - "loss": 2.3454, - "step": 313530 - }, - { - "epoch": 0.55, - "learning_rate": 2.266119553427247e-05, - "loss": 2.3108, - "step": 313540 - }, - { - "epoch": 0.55, - "learning_rate": 2.2660323594345645e-05, - "loss": 2.3644, - "step": 313550 - }, - { - "epoch": 0.55, - "learning_rate": 2.265945165441882e-05, - "loss": 2.3248, - "step": 313560 - }, - { - "epoch": 0.55, - "learning_rate": 2.2658579714491992e-05, - "loss": 2.3353, - "step": 313570 - }, - { - "epoch": 0.55, - "learning_rate": 2.2657707774565166e-05, - "loss": 2.37, - "step": 313580 - }, - { - "epoch": 0.55, - "learning_rate": 2.2656835834638337e-05, - "loss": 2.3323, - "step": 313590 - }, - { - "epoch": 0.55, - "learning_rate": 2.265596389471151e-05, - "loss": 2.2631, - "step": 313600 - }, - { - "epoch": 0.55, - "learning_rate": 2.2655091954784684e-05, - "loss": 2.3017, - "step": 313610 - }, - { - "epoch": 0.55, - "learning_rate": 2.2654220014857858e-05, - "loss": 2.4063, - "step": 313620 - }, - { - "epoch": 0.55, - "learning_rate": 2.265334807493103e-05, - "loss": 2.4248, - "step": 313630 - }, - { - "epoch": 0.55, - "learning_rate": 2.2652476135004202e-05, - "loss": 2.3714, - "step": 313640 - }, - { - "epoch": 0.55, - "learning_rate": 2.265160419507738e-05, - "loss": 2.2849, - "step": 313650 - }, - { - "epoch": 0.55, - "learning_rate": 2.265073225515055e-05, - "loss": 2.3087, - "step": 313660 - }, - { - "epoch": 0.55, - "learning_rate": 2.2649860315223723e-05, - "loss": 2.2466, - "step": 313670 - }, - { - "epoch": 0.55, - "learning_rate": 2.2648988375296897e-05, - "loss": 2.3443, - "step": 313680 - }, - { - "epoch": 0.55, - "learning_rate": 2.264811643537007e-05, - "loss": 2.3187, - "step": 313690 - }, - { - "epoch": 0.55, - "learning_rate": 2.264724449544324e-05, - "loss": 2.2674, - "step": 313700 - }, - { - "epoch": 0.55, - "learning_rate": 2.2646372555516415e-05, - "loss": 2.3645, - "step": 313710 - }, - { - "epoch": 0.55, - "learning_rate": 2.264550061558959e-05, - "loss": 2.4453, - "step": 313720 - }, - { - "epoch": 0.55, - "learning_rate": 2.2644628675662763e-05, - "loss": 2.395, - "step": 313730 - }, - { - "epoch": 0.55, - "learning_rate": 2.2643756735735936e-05, - "loss": 2.3383, - "step": 313740 - }, - { - "epoch": 0.55, - "learning_rate": 2.2642884795809107e-05, - "loss": 2.3368, - "step": 313750 - }, - { - "epoch": 0.55, - "learning_rate": 2.2642012855882284e-05, - "loss": 2.3749, - "step": 313760 - }, - { - "epoch": 0.55, - "learning_rate": 2.2641140915955454e-05, - "loss": 2.3872, - "step": 313770 - }, - { - "epoch": 0.55, - "learning_rate": 2.2640268976028628e-05, - "loss": 2.3082, - "step": 313780 - }, - { - "epoch": 0.55, - "learning_rate": 2.2639397036101802e-05, - "loss": 2.3839, - "step": 313790 - }, - { - "epoch": 0.55, - "learning_rate": 2.2638525096174976e-05, - "loss": 2.3106, - "step": 313800 - }, - { - "epoch": 0.55, - "learning_rate": 2.263765315624815e-05, - "loss": 2.3832, - "step": 313810 - }, - { - "epoch": 0.55, - "learning_rate": 2.263678121632132e-05, - "loss": 2.3185, - "step": 313820 - }, - { - "epoch": 0.55, - "learning_rate": 2.2635909276394497e-05, - "loss": 2.4072, - "step": 313830 - }, - { - "epoch": 0.55, - "learning_rate": 2.2635037336467667e-05, - "loss": 2.3385, - "step": 313840 - }, - { - "epoch": 0.55, - "learning_rate": 2.263416539654084e-05, - "loss": 2.3103, - "step": 313850 - }, - { - "epoch": 0.55, - "learning_rate": 2.2633293456614015e-05, - "loss": 2.3481, - "step": 313860 - }, - { - "epoch": 0.55, - "learning_rate": 2.263242151668719e-05, - "loss": 2.271, - "step": 313870 - }, - { - "epoch": 0.55, - "learning_rate": 2.2631549576760362e-05, - "loss": 2.2799, - "step": 313880 - }, - { - "epoch": 0.55, - "learning_rate": 2.2630677636833533e-05, - "loss": 2.3268, - "step": 313890 - }, - { - "epoch": 0.55, - "learning_rate": 2.2629805696906706e-05, - "loss": 2.2587, - "step": 313900 - }, - { - "epoch": 0.55, - "learning_rate": 2.262893375697988e-05, - "loss": 2.3239, - "step": 313910 - }, - { - "epoch": 0.55, - "learning_rate": 2.2628061817053054e-05, - "loss": 2.3281, - "step": 313920 - }, - { - "epoch": 0.55, - "learning_rate": 2.2627189877126224e-05, - "loss": 2.2842, - "step": 313930 - }, - { - "epoch": 0.55, - "learning_rate": 2.26263179371994e-05, - "loss": 2.3319, - "step": 313940 - }, - { - "epoch": 0.55, - "learning_rate": 2.2625445997272572e-05, - "loss": 2.3536, - "step": 313950 - }, - { - "epoch": 0.55, - "learning_rate": 2.2624574057345746e-05, - "loss": 2.3085, - "step": 313960 - }, - { - "epoch": 0.55, - "learning_rate": 2.262370211741892e-05, - "loss": 2.3999, - "step": 313970 - }, - { - "epoch": 0.55, - "learning_rate": 2.2622830177492093e-05, - "loss": 2.2754, - "step": 313980 - }, - { - "epoch": 0.55, - "learning_rate": 2.2621958237565267e-05, - "loss": 2.3974, - "step": 313990 - }, - { - "epoch": 0.55, - "learning_rate": 2.2621086297638437e-05, - "loss": 2.5112, - "step": 314000 - }, - { - "epoch": 0.55, - "learning_rate": 2.262021435771161e-05, - "loss": 2.3276, - "step": 314010 - }, - { - "epoch": 0.55, - "learning_rate": 2.2619342417784785e-05, - "loss": 2.2369, - "step": 314020 - }, - { - "epoch": 0.55, - "learning_rate": 2.261847047785796e-05, - "loss": 2.3815, - "step": 314030 - }, - { - "epoch": 0.55, - "learning_rate": 2.2617598537931132e-05, - "loss": 2.393, - "step": 314040 - }, - { - "epoch": 0.55, - "learning_rate": 2.2616726598004303e-05, - "loss": 2.3445, - "step": 314050 - }, - { - "epoch": 0.55, - "learning_rate": 2.261585465807748e-05, - "loss": 2.1963, - "step": 314060 - }, - { - "epoch": 0.55, - "learning_rate": 2.261498271815065e-05, - "loss": 2.3228, - "step": 314070 - }, - { - "epoch": 0.55, - "learning_rate": 2.2614110778223824e-05, - "loss": 2.35, - "step": 314080 - }, - { - "epoch": 0.55, - "learning_rate": 2.2613238838296998e-05, - "loss": 2.2615, - "step": 314090 - }, - { - "epoch": 0.55, - "learning_rate": 2.2612366898370172e-05, - "loss": 2.214, - "step": 314100 - }, - { - "epoch": 0.55, - "learning_rate": 2.2611494958443345e-05, - "loss": 2.243, - "step": 314110 - }, - { - "epoch": 0.55, - "learning_rate": 2.2610623018516516e-05, - "loss": 2.3548, - "step": 314120 - }, - { - "epoch": 0.55, - "learning_rate": 2.2609751078589693e-05, - "loss": 2.3954, - "step": 314130 - }, - { - "epoch": 0.55, - "learning_rate": 2.2608879138662863e-05, - "loss": 2.3713, - "step": 314140 - }, - { - "epoch": 0.55, - "learning_rate": 2.2608007198736037e-05, - "loss": 2.4168, - "step": 314150 - }, - { - "epoch": 0.55, - "learning_rate": 2.2607135258809208e-05, - "loss": 2.3869, - "step": 314160 - }, - { - "epoch": 0.55, - "learning_rate": 2.2606263318882385e-05, - "loss": 2.4367, - "step": 314170 - }, - { - "epoch": 0.55, - "learning_rate": 2.2605391378955555e-05, - "loss": 2.4441, - "step": 314180 - }, - { - "epoch": 0.55, - "learning_rate": 2.260451943902873e-05, - "loss": 2.3694, - "step": 314190 - }, - { - "epoch": 0.55, - "learning_rate": 2.2603647499101903e-05, - "loss": 2.4625, - "step": 314200 - }, - { - "epoch": 0.55, - "learning_rate": 2.2602775559175076e-05, - "loss": 2.3353, - "step": 314210 - }, - { - "epoch": 0.55, - "learning_rate": 2.260190361924825e-05, - "loss": 2.2786, - "step": 314220 - }, - { - "epoch": 0.55, - "learning_rate": 2.260103167932142e-05, - "loss": 2.3325, - "step": 314230 - }, - { - "epoch": 0.55, - "learning_rate": 2.2600159739394598e-05, - "loss": 2.2998, - "step": 314240 - }, - { - "epoch": 0.55, - "learning_rate": 2.2599287799467768e-05, - "loss": 2.3386, - "step": 314250 - }, - { - "epoch": 0.55, - "learning_rate": 2.2598415859540942e-05, - "loss": 2.5385, - "step": 314260 - }, - { - "epoch": 0.55, - "learning_rate": 2.2597543919614116e-05, - "loss": 2.3196, - "step": 314270 - }, - { - "epoch": 0.55, - "learning_rate": 2.259667197968729e-05, - "loss": 2.421, - "step": 314280 - }, - { - "epoch": 0.55, - "learning_rate": 2.2595800039760463e-05, - "loss": 2.3855, - "step": 314290 - }, - { - "epoch": 0.55, - "learning_rate": 2.2594928099833634e-05, - "loss": 2.3472, - "step": 314300 - }, - { - "epoch": 0.55, - "learning_rate": 2.2594056159906807e-05, - "loss": 2.4088, - "step": 314310 - }, - { - "epoch": 0.55, - "learning_rate": 2.259318421997998e-05, - "loss": 2.3285, - "step": 314320 - }, - { - "epoch": 0.55, - "learning_rate": 2.2592312280053155e-05, - "loss": 2.2972, - "step": 314330 - }, - { - "epoch": 0.55, - "learning_rate": 2.2591440340126325e-05, - "loss": 2.3606, - "step": 314340 - }, - { - "epoch": 0.55, - "learning_rate": 2.2590568400199502e-05, - "loss": 2.365, - "step": 314350 - }, - { - "epoch": 0.55, - "learning_rate": 2.2589696460272676e-05, - "loss": 2.4118, - "step": 314360 - }, - { - "epoch": 0.55, - "learning_rate": 2.2588824520345847e-05, - "loss": 2.3582, - "step": 314370 - }, - { - "epoch": 0.55, - "learning_rate": 2.258795258041902e-05, - "loss": 2.3403, - "step": 314380 - }, - { - "epoch": 0.55, - "learning_rate": 2.2587080640492194e-05, - "loss": 2.379, - "step": 314390 - }, - { - "epoch": 0.55, - "learning_rate": 2.2586208700565368e-05, - "loss": 2.4509, - "step": 314400 - }, - { - "epoch": 0.55, - "learning_rate": 2.2585336760638538e-05, - "loss": 2.416, - "step": 314410 - }, - { - "epoch": 0.55, - "learning_rate": 2.2584464820711712e-05, - "loss": 2.3756, - "step": 314420 - }, - { - "epoch": 0.55, - "learning_rate": 2.2583592880784886e-05, - "loss": 2.2454, - "step": 314430 - }, - { - "epoch": 0.55, - "learning_rate": 2.258272094085806e-05, - "loss": 2.3783, - "step": 314440 - }, - { - "epoch": 0.55, - "learning_rate": 2.2581849000931233e-05, - "loss": 2.3342, - "step": 314450 - }, - { - "epoch": 0.55, - "learning_rate": 2.2580977061004407e-05, - "loss": 2.2772, - "step": 314460 - }, - { - "epoch": 0.55, - "learning_rate": 2.258010512107758e-05, - "loss": 2.2931, - "step": 314470 - }, - { - "epoch": 0.55, - "learning_rate": 2.257923318115075e-05, - "loss": 2.3205, - "step": 314480 - }, - { - "epoch": 0.55, - "learning_rate": 2.2578361241223925e-05, - "loss": 2.2994, - "step": 314490 - }, - { - "epoch": 0.55, - "learning_rate": 2.25774893012971e-05, - "loss": 2.308, - "step": 314500 - }, - { - "epoch": 0.55, - "learning_rate": 2.2576617361370273e-05, - "loss": 2.3886, - "step": 314510 - }, - { - "epoch": 0.55, - "learning_rate": 2.2575745421443446e-05, - "loss": 2.4213, - "step": 314520 - }, - { - "epoch": 0.55, - "learning_rate": 2.2574873481516617e-05, - "loss": 2.3738, - "step": 314530 - }, - { - "epoch": 0.55, - "learning_rate": 2.2574001541589794e-05, - "loss": 2.2116, - "step": 314540 - }, - { - "epoch": 0.55, - "learning_rate": 2.2573129601662964e-05, - "loss": 2.3064, - "step": 314550 - }, - { - "epoch": 0.55, - "learning_rate": 2.2572257661736138e-05, - "loss": 2.2651, - "step": 314560 - }, - { - "epoch": 0.55, - "learning_rate": 2.257138572180931e-05, - "loss": 2.2532, - "step": 314570 - }, - { - "epoch": 0.55, - "learning_rate": 2.2570513781882486e-05, - "loss": 2.3519, - "step": 314580 - }, - { - "epoch": 0.55, - "learning_rate": 2.256964184195566e-05, - "loss": 2.3007, - "step": 314590 - }, - { - "epoch": 0.55, - "learning_rate": 2.256876990202883e-05, - "loss": 2.2636, - "step": 314600 - }, - { - "epoch": 0.55, - "learning_rate": 2.2567897962102007e-05, - "loss": 2.2958, - "step": 314610 - }, - { - "epoch": 0.55, - "learning_rate": 2.2567026022175177e-05, - "loss": 2.2277, - "step": 314620 - }, - { - "epoch": 0.55, - "learning_rate": 2.256615408224835e-05, - "loss": 2.1732, - "step": 314630 - }, - { - "epoch": 0.55, - "learning_rate": 2.256528214232152e-05, - "loss": 2.3052, - "step": 314640 - }, - { - "epoch": 0.55, - "learning_rate": 2.25644102023947e-05, - "loss": 2.3197, - "step": 314650 - }, - { - "epoch": 0.55, - "learning_rate": 2.256353826246787e-05, - "loss": 2.3446, - "step": 314660 - }, - { - "epoch": 0.55, - "learning_rate": 2.2562666322541043e-05, - "loss": 2.3254, - "step": 314670 - }, - { - "epoch": 0.55, - "learning_rate": 2.2561794382614216e-05, - "loss": 2.2456, - "step": 314680 - }, - { - "epoch": 0.55, - "learning_rate": 2.256092244268739e-05, - "loss": 2.3048, - "step": 314690 - }, - { - "epoch": 0.55, - "learning_rate": 2.2560050502760564e-05, - "loss": 2.3745, - "step": 314700 - }, - { - "epoch": 0.55, - "learning_rate": 2.2559178562833734e-05, - "loss": 2.4663, - "step": 314710 - }, - { - "epoch": 0.55, - "learning_rate": 2.255830662290691e-05, - "loss": 2.2627, - "step": 314720 - }, - { - "epoch": 0.55, - "learning_rate": 2.2557434682980082e-05, - "loss": 2.3445, - "step": 314730 - }, - { - "epoch": 0.55, - "learning_rate": 2.2556562743053256e-05, - "loss": 2.4614, - "step": 314740 - }, - { - "epoch": 0.55, - "learning_rate": 2.255569080312643e-05, - "loss": 2.2756, - "step": 314750 - }, - { - "epoch": 0.55, - "learning_rate": 2.2554818863199603e-05, - "loss": 2.3104, - "step": 314760 - }, - { - "epoch": 0.55, - "learning_rate": 2.2553946923272777e-05, - "loss": 2.2777, - "step": 314770 - }, - { - "epoch": 0.55, - "learning_rate": 2.2553074983345947e-05, - "loss": 2.4317, - "step": 314780 - }, - { - "epoch": 0.55, - "learning_rate": 2.255220304341912e-05, - "loss": 2.3829, - "step": 314790 - }, - { - "epoch": 0.55, - "learning_rate": 2.2551331103492295e-05, - "loss": 2.3904, - "step": 314800 - }, - { - "epoch": 0.55, - "learning_rate": 2.255045916356547e-05, - "loss": 2.3142, - "step": 314810 - }, - { - "epoch": 0.55, - "learning_rate": 2.254958722363864e-05, - "loss": 2.4042, - "step": 314820 - }, - { - "epoch": 0.55, - "learning_rate": 2.2548715283711813e-05, - "loss": 2.4525, - "step": 314830 - }, - { - "epoch": 0.55, - "learning_rate": 2.254784334378499e-05, - "loss": 2.4338, - "step": 314840 - }, - { - "epoch": 0.55, - "learning_rate": 2.254697140385816e-05, - "loss": 2.2556, - "step": 314850 - }, - { - "epoch": 0.55, - "learning_rate": 2.2546099463931334e-05, - "loss": 2.2683, - "step": 314860 - }, - { - "epoch": 0.55, - "learning_rate": 2.2545227524004508e-05, - "loss": 2.3915, - "step": 314870 - }, - { - "epoch": 0.55, - "learning_rate": 2.2544355584077682e-05, - "loss": 2.297, - "step": 314880 - }, - { - "epoch": 0.55, - "learning_rate": 2.2543483644150852e-05, - "loss": 2.3105, - "step": 314890 - }, - { - "epoch": 0.55, - "learning_rate": 2.2542611704224026e-05, - "loss": 2.3908, - "step": 314900 - }, - { - "epoch": 0.55, - "learning_rate": 2.25417397642972e-05, - "loss": 2.2315, - "step": 314910 - }, - { - "epoch": 0.55, - "learning_rate": 2.2540867824370373e-05, - "loss": 2.3294, - "step": 314920 - }, - { - "epoch": 0.55, - "learning_rate": 2.2539995884443547e-05, - "loss": 2.3482, - "step": 314930 - }, - { - "epoch": 0.55, - "learning_rate": 2.2539123944516718e-05, - "loss": 2.2837, - "step": 314940 - }, - { - "epoch": 0.55, - "learning_rate": 2.2538252004589895e-05, - "loss": 2.3622, - "step": 314950 - }, - { - "epoch": 0.55, - "learning_rate": 2.2537380064663065e-05, - "loss": 2.275, - "step": 314960 - }, - { - "epoch": 0.55, - "learning_rate": 2.253650812473624e-05, - "loss": 2.3741, - "step": 314970 - }, - { - "epoch": 0.55, - "learning_rate": 2.2535636184809413e-05, - "loss": 2.3674, - "step": 314980 - }, - { - "epoch": 0.55, - "learning_rate": 2.2534764244882586e-05, - "loss": 2.2629, - "step": 314990 - }, - { - "epoch": 0.55, - "learning_rate": 2.253389230495576e-05, - "loss": 2.3975, - "step": 315000 - }, - { - "epoch": 0.55, - "learning_rate": 2.253302036502893e-05, - "loss": 2.2698, - "step": 315010 - }, - { - "epoch": 0.55, - "learning_rate": 2.2532148425102108e-05, - "loss": 2.3825, - "step": 315020 - }, - { - "epoch": 0.55, - "learning_rate": 2.2531276485175278e-05, - "loss": 2.3417, - "step": 315030 - }, - { - "epoch": 0.55, - "learning_rate": 2.2530404545248452e-05, - "loss": 2.3138, - "step": 315040 - }, - { - "epoch": 0.55, - "learning_rate": 2.2529532605321622e-05, - "loss": 2.3617, - "step": 315050 - }, - { - "epoch": 0.55, - "learning_rate": 2.25286606653948e-05, - "loss": 2.3398, - "step": 315060 - }, - { - "epoch": 0.55, - "learning_rate": 2.252778872546797e-05, - "loss": 2.4565, - "step": 315070 - }, - { - "epoch": 0.55, - "learning_rate": 2.2526916785541144e-05, - "loss": 2.3286, - "step": 315080 - }, - { - "epoch": 0.55, - "learning_rate": 2.2526044845614317e-05, - "loss": 2.3242, - "step": 315090 - }, - { - "epoch": 0.55, - "learning_rate": 2.252517290568749e-05, - "loss": 2.4442, - "step": 315100 - }, - { - "epoch": 0.55, - "learning_rate": 2.2524300965760665e-05, - "loss": 2.2114, - "step": 315110 - }, - { - "epoch": 0.55, - "learning_rate": 2.2523429025833835e-05, - "loss": 2.3648, - "step": 315120 - }, - { - "epoch": 0.55, - "learning_rate": 2.2522557085907012e-05, - "loss": 2.3342, - "step": 315130 - }, - { - "epoch": 0.55, - "learning_rate": 2.2521685145980183e-05, - "loss": 2.3016, - "step": 315140 - }, - { - "epoch": 0.55, - "learning_rate": 2.2520813206053357e-05, - "loss": 2.2343, - "step": 315150 - }, - { - "epoch": 0.55, - "learning_rate": 2.251994126612653e-05, - "loss": 2.2731, - "step": 315160 - }, - { - "epoch": 0.55, - "learning_rate": 2.2519069326199704e-05, - "loss": 2.4034, - "step": 315170 - }, - { - "epoch": 0.55, - "learning_rate": 2.2518197386272878e-05, - "loss": 2.3739, - "step": 315180 - }, - { - "epoch": 0.55, - "learning_rate": 2.2517325446346048e-05, - "loss": 2.4199, - "step": 315190 - }, - { - "epoch": 0.55, - "learning_rate": 2.2516453506419222e-05, - "loss": 2.3775, - "step": 315200 - }, - { - "epoch": 0.55, - "learning_rate": 2.2515581566492396e-05, - "loss": 2.3192, - "step": 315210 - }, - { - "epoch": 0.55, - "learning_rate": 2.251470962656557e-05, - "loss": 2.3017, - "step": 315220 - }, - { - "epoch": 0.55, - "learning_rate": 2.2513837686638743e-05, - "loss": 2.236, - "step": 315230 - }, - { - "epoch": 0.55, - "learning_rate": 2.2512965746711914e-05, - "loss": 2.4782, - "step": 315240 - }, - { - "epoch": 0.55, - "learning_rate": 2.251209380678509e-05, - "loss": 2.3625, - "step": 315250 - }, - { - "epoch": 0.55, - "learning_rate": 2.251122186685826e-05, - "loss": 2.4281, - "step": 315260 - }, - { - "epoch": 0.55, - "learning_rate": 2.2510349926931435e-05, - "loss": 2.316, - "step": 315270 - }, - { - "epoch": 0.55, - "learning_rate": 2.250947798700461e-05, - "loss": 2.3206, - "step": 315280 - }, - { - "epoch": 0.55, - "learning_rate": 2.2508606047077783e-05, - "loss": 2.387, - "step": 315290 - }, - { - "epoch": 0.55, - "learning_rate": 2.2507734107150953e-05, - "loss": 2.4897, - "step": 315300 - }, - { - "epoch": 0.55, - "learning_rate": 2.2506862167224127e-05, - "loss": 2.3392, - "step": 315310 - }, - { - "epoch": 0.55, - "learning_rate": 2.2505990227297304e-05, - "loss": 2.3188, - "step": 315320 - }, - { - "epoch": 0.55, - "learning_rate": 2.2505118287370474e-05, - "loss": 2.4036, - "step": 315330 - }, - { - "epoch": 0.55, - "learning_rate": 2.2504246347443648e-05, - "loss": 2.4711, - "step": 315340 - }, - { - "epoch": 0.55, - "learning_rate": 2.250337440751682e-05, - "loss": 2.2878, - "step": 315350 - }, - { - "epoch": 0.55, - "learning_rate": 2.2502502467589996e-05, - "loss": 2.2966, - "step": 315360 - }, - { - "epoch": 0.55, - "learning_rate": 2.2501630527663166e-05, - "loss": 2.4066, - "step": 315370 - }, - { - "epoch": 0.55, - "learning_rate": 2.250075858773634e-05, - "loss": 2.3954, - "step": 315380 - }, - { - "epoch": 0.55, - "learning_rate": 2.2499886647809513e-05, - "loss": 2.2828, - "step": 315390 - }, - { - "epoch": 0.55, - "learning_rate": 2.2499014707882687e-05, - "loss": 2.4273, - "step": 315400 - }, - { - "epoch": 0.55, - "learning_rate": 2.249814276795586e-05, - "loss": 2.2866, - "step": 315410 - }, - { - "epoch": 0.55, - "learning_rate": 2.249727082802903e-05, - "loss": 2.3235, - "step": 315420 - }, - { - "epoch": 0.55, - "learning_rate": 2.249639888810221e-05, - "loss": 2.3165, - "step": 315430 - }, - { - "epoch": 0.55, - "learning_rate": 2.249552694817538e-05, - "loss": 2.2472, - "step": 315440 - }, - { - "epoch": 0.55, - "learning_rate": 2.2494655008248553e-05, - "loss": 2.3904, - "step": 315450 - }, - { - "epoch": 0.55, - "learning_rate": 2.2493783068321727e-05, - "loss": 2.3681, - "step": 315460 - }, - { - "epoch": 0.55, - "learning_rate": 2.24929111283949e-05, - "loss": 2.3595, - "step": 315470 - }, - { - "epoch": 0.55, - "learning_rate": 2.2492039188468074e-05, - "loss": 2.5414, - "step": 315480 - }, - { - "epoch": 0.55, - "learning_rate": 2.2491167248541244e-05, - "loss": 2.3578, - "step": 315490 - }, - { - "epoch": 0.55, - "learning_rate": 2.2490295308614418e-05, - "loss": 2.2454, - "step": 315500 - }, - { - "epoch": 0.55, - "learning_rate": 2.2489423368687592e-05, - "loss": 2.4158, - "step": 315510 - }, - { - "epoch": 0.55, - "learning_rate": 2.2488551428760766e-05, - "loss": 2.3346, - "step": 315520 - }, - { - "epoch": 0.55, - "learning_rate": 2.2487679488833936e-05, - "loss": 2.2748, - "step": 315530 - }, - { - "epoch": 0.55, - "learning_rate": 2.2486807548907113e-05, - "loss": 2.3915, - "step": 315540 - }, - { - "epoch": 0.55, - "learning_rate": 2.2485935608980284e-05, - "loss": 2.3661, - "step": 315550 - }, - { - "epoch": 0.55, - "learning_rate": 2.2485063669053457e-05, - "loss": 2.3755, - "step": 315560 - }, - { - "epoch": 0.55, - "learning_rate": 2.248419172912663e-05, - "loss": 2.4164, - "step": 315570 - }, - { - "epoch": 0.55, - "learning_rate": 2.2483319789199805e-05, - "loss": 2.3458, - "step": 315580 - }, - { - "epoch": 0.55, - "learning_rate": 2.248244784927298e-05, - "loss": 2.3671, - "step": 315590 - }, - { - "epoch": 0.55, - "learning_rate": 2.248157590934615e-05, - "loss": 2.2906, - "step": 315600 - }, - { - "epoch": 0.55, - "learning_rate": 2.2480703969419323e-05, - "loss": 2.4242, - "step": 315610 - }, - { - "epoch": 0.55, - "learning_rate": 2.2479832029492497e-05, - "loss": 2.2925, - "step": 315620 - }, - { - "epoch": 0.55, - "learning_rate": 2.247896008956567e-05, - "loss": 2.3351, - "step": 315630 - }, - { - "epoch": 0.55, - "learning_rate": 2.2478088149638844e-05, - "loss": 2.3541, - "step": 315640 - }, - { - "epoch": 0.55, - "learning_rate": 2.2477216209712018e-05, - "loss": 2.3871, - "step": 315650 - }, - { - "epoch": 0.55, - "learning_rate": 2.2476344269785192e-05, - "loss": 2.3101, - "step": 315660 - }, - { - "epoch": 0.55, - "learning_rate": 2.2475472329858362e-05, - "loss": 2.3238, - "step": 315670 - }, - { - "epoch": 0.55, - "learning_rate": 2.2474600389931536e-05, - "loss": 2.4171, - "step": 315680 - }, - { - "epoch": 0.55, - "learning_rate": 2.247372845000471e-05, - "loss": 2.4277, - "step": 315690 - }, - { - "epoch": 0.55, - "learning_rate": 2.2472856510077883e-05, - "loss": 2.335, - "step": 315700 - }, - { - "epoch": 0.55, - "learning_rate": 2.2471984570151057e-05, - "loss": 2.4658, - "step": 315710 - }, - { - "epoch": 0.55, - "learning_rate": 2.2471112630224228e-05, - "loss": 2.2941, - "step": 315720 - }, - { - "epoch": 0.55, - "learning_rate": 2.2470240690297405e-05, - "loss": 2.1949, - "step": 315730 - }, - { - "epoch": 0.55, - "learning_rate": 2.2469368750370575e-05, - "loss": 2.3746, - "step": 315740 - }, - { - "epoch": 0.55, - "learning_rate": 2.246849681044375e-05, - "loss": 2.334, - "step": 315750 - }, - { - "epoch": 0.55, - "learning_rate": 2.246762487051692e-05, - "loss": 2.3317, - "step": 315760 - }, - { - "epoch": 0.55, - "learning_rate": 2.2466752930590096e-05, - "loss": 2.3229, - "step": 315770 - }, - { - "epoch": 0.55, - "learning_rate": 2.2465880990663267e-05, - "loss": 2.3577, - "step": 315780 - }, - { - "epoch": 0.55, - "learning_rate": 2.246500905073644e-05, - "loss": 2.2118, - "step": 315790 - }, - { - "epoch": 0.55, - "learning_rate": 2.2464137110809614e-05, - "loss": 2.3778, - "step": 315800 - }, - { - "epoch": 0.55, - "learning_rate": 2.2463265170882788e-05, - "loss": 2.3583, - "step": 315810 - }, - { - "epoch": 0.55, - "learning_rate": 2.2462393230955962e-05, - "loss": 2.4006, - "step": 315820 - }, - { - "epoch": 0.55, - "learning_rate": 2.2461521291029132e-05, - "loss": 2.229, - "step": 315830 - }, - { - "epoch": 0.55, - "learning_rate": 2.246064935110231e-05, - "loss": 2.3129, - "step": 315840 - }, - { - "epoch": 0.55, - "learning_rate": 2.245977741117548e-05, - "loss": 2.3162, - "step": 315850 - }, - { - "epoch": 0.55, - "learning_rate": 2.2458905471248654e-05, - "loss": 2.4268, - "step": 315860 - }, - { - "epoch": 0.55, - "learning_rate": 2.2458033531321827e-05, - "loss": 2.4057, - "step": 315870 - }, - { - "epoch": 0.55, - "learning_rate": 2.2457161591395e-05, - "loss": 2.4097, - "step": 315880 - }, - { - "epoch": 0.55, - "learning_rate": 2.2456289651468175e-05, - "loss": 2.2551, - "step": 315890 - }, - { - "epoch": 0.55, - "learning_rate": 2.2455417711541345e-05, - "loss": 2.2189, - "step": 315900 - }, - { - "epoch": 0.55, - "learning_rate": 2.245454577161452e-05, - "loss": 2.3259, - "step": 315910 - }, - { - "epoch": 0.55, - "learning_rate": 2.2453673831687693e-05, - "loss": 2.3713, - "step": 315920 - }, - { - "epoch": 0.55, - "learning_rate": 2.2452801891760867e-05, - "loss": 2.3185, - "step": 315930 - }, - { - "epoch": 0.55, - "learning_rate": 2.245192995183404e-05, - "loss": 2.3719, - "step": 315940 - }, - { - "epoch": 0.55, - "learning_rate": 2.2451058011907214e-05, - "loss": 2.3073, - "step": 315950 - }, - { - "epoch": 0.55, - "learning_rate": 2.2450186071980388e-05, - "loss": 2.3973, - "step": 315960 - }, - { - "epoch": 0.55, - "learning_rate": 2.2449314132053558e-05, - "loss": 2.351, - "step": 315970 - }, - { - "epoch": 0.55, - "learning_rate": 2.2448442192126732e-05, - "loss": 2.2967, - "step": 315980 - }, - { - "epoch": 0.55, - "learning_rate": 2.2447570252199906e-05, - "loss": 2.4183, - "step": 315990 - }, - { - "epoch": 0.55, - "learning_rate": 2.244669831227308e-05, - "loss": 2.3556, - "step": 316000 - }, - { - "epoch": 0.55, - "learning_rate": 2.244582637234625e-05, - "loss": 2.4114, - "step": 316010 - }, - { - "epoch": 0.55, - "learning_rate": 2.2444954432419424e-05, - "loss": 2.3707, - "step": 316020 - }, - { - "epoch": 0.55, - "learning_rate": 2.2444082492492598e-05, - "loss": 2.4114, - "step": 316030 - }, - { - "epoch": 0.55, - "learning_rate": 2.244321055256577e-05, - "loss": 2.3351, - "step": 316040 - }, - { - "epoch": 0.55, - "learning_rate": 2.2442338612638945e-05, - "loss": 2.3768, - "step": 316050 - }, - { - "epoch": 0.55, - "learning_rate": 2.244146667271212e-05, - "loss": 2.3214, - "step": 316060 - }, - { - "epoch": 0.55, - "learning_rate": 2.2440594732785293e-05, - "loss": 2.3731, - "step": 316070 - }, - { - "epoch": 0.55, - "learning_rate": 2.2439722792858463e-05, - "loss": 2.3255, - "step": 316080 - }, - { - "epoch": 0.55, - "learning_rate": 2.2438850852931637e-05, - "loss": 2.1945, - "step": 316090 - }, - { - "epoch": 0.55, - "learning_rate": 2.243797891300481e-05, - "loss": 2.3499, - "step": 316100 - }, - { - "epoch": 0.55, - "learning_rate": 2.2437106973077984e-05, - "loss": 2.4306, - "step": 316110 - }, - { - "epoch": 0.55, - "learning_rate": 2.2436235033151158e-05, - "loss": 2.313, - "step": 316120 - }, - { - "epoch": 0.55, - "learning_rate": 2.243536309322433e-05, - "loss": 2.3024, - "step": 316130 - }, - { - "epoch": 0.55, - "learning_rate": 2.2434491153297506e-05, - "loss": 2.2512, - "step": 316140 - }, - { - "epoch": 0.55, - "learning_rate": 2.2433619213370676e-05, - "loss": 2.2975, - "step": 316150 - }, - { - "epoch": 0.55, - "learning_rate": 2.243274727344385e-05, - "loss": 2.4051, - "step": 316160 - }, - { - "epoch": 0.55, - "learning_rate": 2.243187533351702e-05, - "loss": 2.2873, - "step": 316170 - }, - { - "epoch": 0.55, - "learning_rate": 2.2431003393590197e-05, - "loss": 2.3373, - "step": 316180 - }, - { - "epoch": 0.55, - "learning_rate": 2.243013145366337e-05, - "loss": 2.4293, - "step": 316190 - }, - { - "epoch": 0.55, - "learning_rate": 2.242925951373654e-05, - "loss": 2.2309, - "step": 316200 - }, - { - "epoch": 0.55, - "learning_rate": 2.242838757380972e-05, - "loss": 2.3317, - "step": 316210 - }, - { - "epoch": 0.55, - "learning_rate": 2.242751563388289e-05, - "loss": 2.3321, - "step": 316220 - }, - { - "epoch": 0.55, - "learning_rate": 2.2426643693956063e-05, - "loss": 2.2578, - "step": 316230 - }, - { - "epoch": 0.55, - "learning_rate": 2.2425771754029233e-05, - "loss": 2.3338, - "step": 316240 - }, - { - "epoch": 0.55, - "learning_rate": 2.242489981410241e-05, - "loss": 2.3166, - "step": 316250 - }, - { - "epoch": 0.55, - "learning_rate": 2.242402787417558e-05, - "loss": 2.315, - "step": 316260 - }, - { - "epoch": 0.55, - "learning_rate": 2.2423155934248754e-05, - "loss": 2.3888, - "step": 316270 - }, - { - "epoch": 0.55, - "learning_rate": 2.2422283994321928e-05, - "loss": 2.2763, - "step": 316280 - }, - { - "epoch": 0.55, - "learning_rate": 2.2421412054395102e-05, - "loss": 2.2771, - "step": 316290 - }, - { - "epoch": 0.55, - "learning_rate": 2.2420540114468276e-05, - "loss": 2.4192, - "step": 316300 - }, - { - "epoch": 0.55, - "learning_rate": 2.2419668174541446e-05, - "loss": 2.2538, - "step": 316310 - }, - { - "epoch": 0.55, - "learning_rate": 2.2418796234614623e-05, - "loss": 2.4536, - "step": 316320 - }, - { - "epoch": 0.55, - "learning_rate": 2.2417924294687794e-05, - "loss": 2.4095, - "step": 316330 - }, - { - "epoch": 0.55, - "learning_rate": 2.2417052354760967e-05, - "loss": 2.3087, - "step": 316340 - }, - { - "epoch": 0.55, - "learning_rate": 2.241618041483414e-05, - "loss": 2.3699, - "step": 316350 - }, - { - "epoch": 0.55, - "learning_rate": 2.2415308474907315e-05, - "loss": 2.3741, - "step": 316360 - }, - { - "epoch": 0.55, - "learning_rate": 2.241443653498049e-05, - "loss": 2.2926, - "step": 316370 - }, - { - "epoch": 0.55, - "learning_rate": 2.241356459505366e-05, - "loss": 2.2625, - "step": 316380 - }, - { - "epoch": 0.55, - "learning_rate": 2.2412692655126833e-05, - "loss": 2.3531, - "step": 316390 - }, - { - "epoch": 0.55, - "learning_rate": 2.2411820715200007e-05, - "loss": 2.2487, - "step": 316400 - }, - { - "epoch": 0.55, - "learning_rate": 2.241094877527318e-05, - "loss": 2.3119, - "step": 316410 - }, - { - "epoch": 0.55, - "learning_rate": 2.241007683534635e-05, - "loss": 2.4335, - "step": 316420 - }, - { - "epoch": 0.55, - "learning_rate": 2.2409204895419525e-05, - "loss": 2.4732, - "step": 316430 - }, - { - "epoch": 0.55, - "learning_rate": 2.2408332955492702e-05, - "loss": 2.3711, - "step": 316440 - }, - { - "epoch": 0.55, - "learning_rate": 2.2407461015565872e-05, - "loss": 2.2668, - "step": 316450 - }, - { - "epoch": 0.55, - "learning_rate": 2.2406589075639046e-05, - "loss": 2.436, - "step": 316460 - }, - { - "epoch": 0.55, - "learning_rate": 2.240571713571222e-05, - "loss": 2.3165, - "step": 316470 - }, - { - "epoch": 0.55, - "learning_rate": 2.2404845195785393e-05, - "loss": 2.2792, - "step": 316480 - }, - { - "epoch": 0.55, - "learning_rate": 2.2403973255858564e-05, - "loss": 2.3029, - "step": 316490 - }, - { - "epoch": 0.55, - "learning_rate": 2.2403101315931738e-05, - "loss": 2.2729, - "step": 316500 - }, - { - "epoch": 0.55, - "learning_rate": 2.240222937600491e-05, - "loss": 2.5285, - "step": 316510 - }, - { - "epoch": 0.55, - "learning_rate": 2.2401357436078085e-05, - "loss": 2.1958, - "step": 316520 - }, - { - "epoch": 0.55, - "learning_rate": 2.240048549615126e-05, - "loss": 2.2366, - "step": 316530 - }, - { - "epoch": 0.55, - "learning_rate": 2.239961355622443e-05, - "loss": 2.3736, - "step": 316540 - }, - { - "epoch": 0.55, - "learning_rate": 2.2398741616297606e-05, - "loss": 2.3696, - "step": 316550 - }, - { - "epoch": 0.55, - "learning_rate": 2.2397869676370777e-05, - "loss": 2.392, - "step": 316560 - }, - { - "epoch": 0.55, - "learning_rate": 2.239699773644395e-05, - "loss": 2.3777, - "step": 316570 - }, - { - "epoch": 0.55, - "learning_rate": 2.2396125796517124e-05, - "loss": 2.353, - "step": 316580 - }, - { - "epoch": 0.55, - "learning_rate": 2.2395253856590298e-05, - "loss": 2.3273, - "step": 316590 - }, - { - "epoch": 0.55, - "learning_rate": 2.2394381916663472e-05, - "loss": 2.3538, - "step": 316600 - }, - { - "epoch": 0.55, - "learning_rate": 2.2393509976736642e-05, - "loss": 2.4374, - "step": 316610 - }, - { - "epoch": 0.55, - "learning_rate": 2.239263803680982e-05, - "loss": 2.3854, - "step": 316620 - }, - { - "epoch": 0.55, - "learning_rate": 2.239176609688299e-05, - "loss": 2.279, - "step": 316630 - }, - { - "epoch": 0.55, - "learning_rate": 2.2390894156956164e-05, - "loss": 2.421, - "step": 316640 - }, - { - "epoch": 0.55, - "learning_rate": 2.2390022217029334e-05, - "loss": 2.2885, - "step": 316650 - }, - { - "epoch": 0.55, - "learning_rate": 2.238915027710251e-05, - "loss": 2.2418, - "step": 316660 - }, - { - "epoch": 0.55, - "learning_rate": 2.2388278337175685e-05, - "loss": 2.2976, - "step": 316670 - }, - { - "epoch": 0.55, - "learning_rate": 2.2387406397248855e-05, - "loss": 2.248, - "step": 316680 - }, - { - "epoch": 0.55, - "learning_rate": 2.238653445732203e-05, - "loss": 2.3827, - "step": 316690 - }, - { - "epoch": 0.55, - "learning_rate": 2.2385662517395203e-05, - "loss": 2.2894, - "step": 316700 - }, - { - "epoch": 0.55, - "learning_rate": 2.2384790577468377e-05, - "loss": 2.3521, - "step": 316710 - }, - { - "epoch": 0.55, - "learning_rate": 2.2383918637541547e-05, - "loss": 2.3344, - "step": 316720 - }, - { - "epoch": 0.55, - "learning_rate": 2.2383046697614724e-05, - "loss": 2.3829, - "step": 316730 - }, - { - "epoch": 0.55, - "learning_rate": 2.2382174757687895e-05, - "loss": 2.3827, - "step": 316740 - }, - { - "epoch": 0.55, - "learning_rate": 2.2381302817761068e-05, - "loss": 2.2964, - "step": 316750 - }, - { - "epoch": 0.55, - "learning_rate": 2.2380430877834242e-05, - "loss": 2.3578, - "step": 316760 - }, - { - "epoch": 0.55, - "learning_rate": 2.2379558937907416e-05, - "loss": 2.3977, - "step": 316770 - }, - { - "epoch": 0.55, - "learning_rate": 2.237868699798059e-05, - "loss": 2.3898, - "step": 316780 - }, - { - "epoch": 0.55, - "learning_rate": 2.237781505805376e-05, - "loss": 2.3822, - "step": 316790 - }, - { - "epoch": 0.55, - "learning_rate": 2.2376943118126934e-05, - "loss": 2.4772, - "step": 316800 - }, - { - "epoch": 0.55, - "learning_rate": 2.2376071178200108e-05, - "loss": 2.304, - "step": 316810 - }, - { - "epoch": 0.55, - "learning_rate": 2.237519923827328e-05, - "loss": 2.3747, - "step": 316820 - }, - { - "epoch": 0.55, - "learning_rate": 2.2374327298346455e-05, - "loss": 2.2857, - "step": 316830 - }, - { - "epoch": 0.55, - "learning_rate": 2.2373455358419625e-05, - "loss": 2.4124, - "step": 316840 - }, - { - "epoch": 0.55, - "learning_rate": 2.2372583418492803e-05, - "loss": 2.3655, - "step": 316850 - }, - { - "epoch": 0.55, - "learning_rate": 2.2371711478565973e-05, - "loss": 2.3696, - "step": 316860 - }, - { - "epoch": 0.55, - "learning_rate": 2.2370839538639147e-05, - "loss": 2.3258, - "step": 316870 - }, - { - "epoch": 0.55, - "learning_rate": 2.236996759871232e-05, - "loss": 2.3341, - "step": 316880 - }, - { - "epoch": 0.55, - "learning_rate": 2.2369095658785494e-05, - "loss": 2.3565, - "step": 316890 - }, - { - "epoch": 0.55, - "learning_rate": 2.2368223718858665e-05, - "loss": 2.445, - "step": 316900 - }, - { - "epoch": 0.55, - "learning_rate": 2.236735177893184e-05, - "loss": 2.2848, - "step": 316910 - }, - { - "epoch": 0.55, - "learning_rate": 2.2366479839005016e-05, - "loss": 2.3512, - "step": 316920 - }, - { - "epoch": 0.55, - "learning_rate": 2.2365607899078186e-05, - "loss": 2.3245, - "step": 316930 - }, - { - "epoch": 0.55, - "learning_rate": 2.236473595915136e-05, - "loss": 2.3897, - "step": 316940 - }, - { - "epoch": 0.55, - "learning_rate": 2.236386401922453e-05, - "loss": 2.315, - "step": 316950 - }, - { - "epoch": 0.55, - "learning_rate": 2.2362992079297707e-05, - "loss": 2.3069, - "step": 316960 - }, - { - "epoch": 0.55, - "learning_rate": 2.2362120139370878e-05, - "loss": 2.3227, - "step": 316970 - }, - { - "epoch": 0.55, - "learning_rate": 2.236124819944405e-05, - "loss": 2.2381, - "step": 316980 - }, - { - "epoch": 0.55, - "learning_rate": 2.2360376259517225e-05, - "loss": 2.4051, - "step": 316990 - }, - { - "epoch": 0.55, - "learning_rate": 2.23595043195904e-05, - "loss": 2.318, - "step": 317000 - }, - { - "epoch": 0.55, - "learning_rate": 2.2358632379663573e-05, - "loss": 2.4065, - "step": 317010 - }, - { - "epoch": 0.55, - "learning_rate": 2.2357760439736743e-05, - "loss": 2.226, - "step": 317020 - }, - { - "epoch": 0.55, - "learning_rate": 2.235688849980992e-05, - "loss": 2.4522, - "step": 317030 - }, - { - "epoch": 0.55, - "learning_rate": 2.235601655988309e-05, - "loss": 2.222, - "step": 317040 - }, - { - "epoch": 0.55, - "learning_rate": 2.2355144619956264e-05, - "loss": 2.3055, - "step": 317050 - }, - { - "epoch": 0.55, - "learning_rate": 2.2354272680029438e-05, - "loss": 2.3006, - "step": 317060 - }, - { - "epoch": 0.55, - "learning_rate": 2.2353400740102612e-05, - "loss": 2.4156, - "step": 317070 - }, - { - "epoch": 0.55, - "learning_rate": 2.2352528800175786e-05, - "loss": 2.4632, - "step": 317080 - }, - { - "epoch": 0.55, - "learning_rate": 2.2351656860248956e-05, - "loss": 2.3122, - "step": 317090 - }, - { - "epoch": 0.55, - "learning_rate": 2.235078492032213e-05, - "loss": 2.3262, - "step": 317100 - }, - { - "epoch": 0.55, - "learning_rate": 2.2349912980395304e-05, - "loss": 2.243, - "step": 317110 - }, - { - "epoch": 0.55, - "learning_rate": 2.2349041040468477e-05, - "loss": 2.4362, - "step": 317120 - }, - { - "epoch": 0.55, - "learning_rate": 2.2348169100541648e-05, - "loss": 2.4393, - "step": 317130 - }, - { - "epoch": 0.55, - "learning_rate": 2.2347297160614825e-05, - "loss": 2.3543, - "step": 317140 - }, - { - "epoch": 0.55, - "learning_rate": 2.2346425220687995e-05, - "loss": 2.4195, - "step": 317150 - }, - { - "epoch": 0.55, - "learning_rate": 2.234555328076117e-05, - "loss": 2.4779, - "step": 317160 - }, - { - "epoch": 0.55, - "learning_rate": 2.2344681340834343e-05, - "loss": 2.4014, - "step": 317170 - }, - { - "epoch": 0.55, - "learning_rate": 2.2343809400907517e-05, - "loss": 2.2794, - "step": 317180 - }, - { - "epoch": 0.55, - "learning_rate": 2.234293746098069e-05, - "loss": 2.3022, - "step": 317190 - }, - { - "epoch": 0.55, - "learning_rate": 2.234206552105386e-05, - "loss": 2.4602, - "step": 317200 - }, - { - "epoch": 0.55, - "learning_rate": 2.2341193581127035e-05, - "loss": 2.3237, - "step": 317210 - }, - { - "epoch": 0.55, - "learning_rate": 2.234032164120021e-05, - "loss": 2.3632, - "step": 317220 - }, - { - "epoch": 0.55, - "learning_rate": 2.2339449701273382e-05, - "loss": 2.2982, - "step": 317230 - }, - { - "epoch": 0.55, - "learning_rate": 2.2338577761346556e-05, - "loss": 2.4608, - "step": 317240 - }, - { - "epoch": 0.55, - "learning_rate": 2.233770582141973e-05, - "loss": 2.3005, - "step": 317250 - }, - { - "epoch": 0.55, - "learning_rate": 2.2336833881492903e-05, - "loss": 2.4035, - "step": 317260 - }, - { - "epoch": 0.55, - "learning_rate": 2.2335961941566074e-05, - "loss": 2.4147, - "step": 317270 - }, - { - "epoch": 0.55, - "learning_rate": 2.2335090001639248e-05, - "loss": 2.3008, - "step": 317280 - }, - { - "epoch": 0.55, - "learning_rate": 2.233421806171242e-05, - "loss": 2.3135, - "step": 317290 - }, - { - "epoch": 0.55, - "learning_rate": 2.2333346121785595e-05, - "loss": 2.3453, - "step": 317300 - }, - { - "epoch": 0.55, - "learning_rate": 2.233247418185877e-05, - "loss": 2.2678, - "step": 317310 - }, - { - "epoch": 0.55, - "learning_rate": 2.233160224193194e-05, - "loss": 2.342, - "step": 317320 - }, - { - "epoch": 0.55, - "learning_rate": 2.2330730302005116e-05, - "loss": 2.3047, - "step": 317330 - }, - { - "epoch": 0.55, - "learning_rate": 2.2329858362078287e-05, - "loss": 2.3495, - "step": 317340 - }, - { - "epoch": 0.55, - "learning_rate": 2.232898642215146e-05, - "loss": 2.3897, - "step": 317350 - }, - { - "epoch": 0.55, - "learning_rate": 2.232811448222463e-05, - "loss": 2.4212, - "step": 317360 - }, - { - "epoch": 0.55, - "learning_rate": 2.2327242542297808e-05, - "loss": 2.339, - "step": 317370 - }, - { - "epoch": 0.55, - "learning_rate": 2.232637060237098e-05, - "loss": 2.4031, - "step": 317380 - }, - { - "epoch": 0.55, - "learning_rate": 2.2325498662444152e-05, - "loss": 2.275, - "step": 317390 - }, - { - "epoch": 0.55, - "learning_rate": 2.232462672251733e-05, - "loss": 2.3781, - "step": 317400 - }, - { - "epoch": 0.55, - "learning_rate": 2.23237547825905e-05, - "loss": 2.4906, - "step": 317410 - }, - { - "epoch": 0.55, - "learning_rate": 2.2322882842663674e-05, - "loss": 2.3438, - "step": 317420 - }, - { - "epoch": 0.55, - "learning_rate": 2.2322010902736844e-05, - "loss": 2.4436, - "step": 317430 - }, - { - "epoch": 0.55, - "learning_rate": 2.232113896281002e-05, - "loss": 2.3118, - "step": 317440 - }, - { - "epoch": 0.55, - "learning_rate": 2.232026702288319e-05, - "loss": 2.332, - "step": 317450 - }, - { - "epoch": 0.55, - "learning_rate": 2.2319395082956365e-05, - "loss": 2.3431, - "step": 317460 - }, - { - "epoch": 0.55, - "learning_rate": 2.231852314302954e-05, - "loss": 2.25, - "step": 317470 - }, - { - "epoch": 0.55, - "learning_rate": 2.2317651203102713e-05, - "loss": 2.3209, - "step": 317480 - }, - { - "epoch": 0.55, - "learning_rate": 2.2316779263175887e-05, - "loss": 2.4146, - "step": 317490 - }, - { - "epoch": 0.55, - "learning_rate": 2.2315907323249057e-05, - "loss": 2.4348, - "step": 317500 - }, - { - "epoch": 0.55, - "learning_rate": 2.231503538332223e-05, - "loss": 2.3966, - "step": 317510 - }, - { - "epoch": 0.55, - "learning_rate": 2.2314163443395405e-05, - "loss": 2.383, - "step": 317520 - }, - { - "epoch": 0.55, - "learning_rate": 2.2313291503468578e-05, - "loss": 2.3926, - "step": 317530 - }, - { - "epoch": 0.55, - "learning_rate": 2.2312419563541752e-05, - "loss": 2.4092, - "step": 317540 - }, - { - "epoch": 0.55, - "learning_rate": 2.2311547623614926e-05, - "loss": 2.3134, - "step": 317550 - }, - { - "epoch": 0.55, - "learning_rate": 2.23106756836881e-05, - "loss": 2.3145, - "step": 317560 - }, - { - "epoch": 0.55, - "learning_rate": 2.230980374376127e-05, - "loss": 2.2945, - "step": 317570 - }, - { - "epoch": 0.55, - "learning_rate": 2.2308931803834444e-05, - "loss": 2.2865, - "step": 317580 - }, - { - "epoch": 0.55, - "learning_rate": 2.2308059863907618e-05, - "loss": 2.4237, - "step": 317590 - }, - { - "epoch": 0.55, - "learning_rate": 2.230718792398079e-05, - "loss": 2.367, - "step": 317600 - }, - { - "epoch": 0.55, - "learning_rate": 2.230631598405396e-05, - "loss": 2.3435, - "step": 317610 - }, - { - "epoch": 0.55, - "learning_rate": 2.2305444044127135e-05, - "loss": 2.3461, - "step": 317620 - }, - { - "epoch": 0.55, - "learning_rate": 2.230457210420031e-05, - "loss": 2.3391, - "step": 317630 - }, - { - "epoch": 0.55, - "learning_rate": 2.2303700164273483e-05, - "loss": 2.2758, - "step": 317640 - }, - { - "epoch": 0.55, - "learning_rate": 2.2302828224346657e-05, - "loss": 2.2627, - "step": 317650 - }, - { - "epoch": 0.55, - "learning_rate": 2.230195628441983e-05, - "loss": 2.3366, - "step": 317660 - }, - { - "epoch": 0.55, - "learning_rate": 2.2301084344493004e-05, - "loss": 2.3684, - "step": 317670 - }, - { - "epoch": 0.55, - "learning_rate": 2.2300212404566175e-05, - "loss": 2.3594, - "step": 317680 - }, - { - "epoch": 0.55, - "learning_rate": 2.229934046463935e-05, - "loss": 2.3101, - "step": 317690 - }, - { - "epoch": 0.55, - "learning_rate": 2.2298468524712522e-05, - "loss": 2.264, - "step": 317700 - }, - { - "epoch": 0.55, - "learning_rate": 2.2297596584785696e-05, - "loss": 2.4543, - "step": 317710 - }, - { - "epoch": 0.55, - "learning_rate": 2.229672464485887e-05, - "loss": 2.3688, - "step": 317720 - }, - { - "epoch": 0.55, - "learning_rate": 2.229585270493204e-05, - "loss": 2.3772, - "step": 317730 - }, - { - "epoch": 0.55, - "learning_rate": 2.2294980765005217e-05, - "loss": 2.3572, - "step": 317740 - }, - { - "epoch": 0.55, - "learning_rate": 2.2294108825078388e-05, - "loss": 2.3625, - "step": 317750 - }, - { - "epoch": 0.55, - "learning_rate": 2.229323688515156e-05, - "loss": 2.3541, - "step": 317760 - }, - { - "epoch": 0.55, - "learning_rate": 2.2292364945224732e-05, - "loss": 2.4044, - "step": 317770 - }, - { - "epoch": 0.55, - "learning_rate": 2.229149300529791e-05, - "loss": 2.3638, - "step": 317780 - }, - { - "epoch": 0.55, - "learning_rate": 2.2290621065371083e-05, - "loss": 2.2829, - "step": 317790 - }, - { - "epoch": 0.55, - "learning_rate": 2.2289749125444253e-05, - "loss": 2.3276, - "step": 317800 - }, - { - "epoch": 0.55, - "learning_rate": 2.228887718551743e-05, - "loss": 2.47, - "step": 317810 - }, - { - "epoch": 0.55, - "learning_rate": 2.22880052455906e-05, - "loss": 2.3498, - "step": 317820 - }, - { - "epoch": 0.55, - "learning_rate": 2.2287133305663774e-05, - "loss": 2.4007, - "step": 317830 - }, - { - "epoch": 0.55, - "learning_rate": 2.2286261365736945e-05, - "loss": 2.4448, - "step": 317840 - }, - { - "epoch": 0.55, - "learning_rate": 2.2285389425810122e-05, - "loss": 2.4125, - "step": 317850 - }, - { - "epoch": 0.55, - "learning_rate": 2.2284517485883292e-05, - "loss": 2.2947, - "step": 317860 - }, - { - "epoch": 0.55, - "learning_rate": 2.2283645545956466e-05, - "loss": 2.4116, - "step": 317870 - }, - { - "epoch": 0.55, - "learning_rate": 2.228277360602964e-05, - "loss": 2.271, - "step": 317880 - }, - { - "epoch": 0.55, - "learning_rate": 2.2281901666102814e-05, - "loss": 2.5024, - "step": 317890 - }, - { - "epoch": 0.55, - "learning_rate": 2.2281029726175987e-05, - "loss": 2.3491, - "step": 317900 - }, - { - "epoch": 0.55, - "learning_rate": 2.2280157786249158e-05, - "loss": 2.2889, - "step": 317910 - }, - { - "epoch": 0.55, - "learning_rate": 2.2279285846322335e-05, - "loss": 2.3039, - "step": 317920 - }, - { - "epoch": 0.55, - "learning_rate": 2.2278413906395505e-05, - "loss": 2.3299, - "step": 317930 - }, - { - "epoch": 0.55, - "learning_rate": 2.227754196646868e-05, - "loss": 2.3497, - "step": 317940 - }, - { - "epoch": 0.55, - "learning_rate": 2.2276670026541853e-05, - "loss": 2.2414, - "step": 317950 - }, - { - "epoch": 0.55, - "learning_rate": 2.2275798086615027e-05, - "loss": 2.4232, - "step": 317960 - }, - { - "epoch": 0.55, - "learning_rate": 2.22749261466882e-05, - "loss": 2.2758, - "step": 317970 - }, - { - "epoch": 0.55, - "learning_rate": 2.227405420676137e-05, - "loss": 2.3025, - "step": 317980 - }, - { - "epoch": 0.55, - "learning_rate": 2.2273182266834545e-05, - "loss": 2.3589, - "step": 317990 - }, - { - "epoch": 0.55, - "learning_rate": 2.227231032690772e-05, - "loss": 2.3658, - "step": 318000 - }, - { - "epoch": 0.55, - "learning_rate": 2.2271438386980892e-05, - "loss": 2.2908, - "step": 318010 - }, - { - "epoch": 0.55, - "learning_rate": 2.2270566447054066e-05, - "loss": 2.4927, - "step": 318020 - }, - { - "epoch": 0.55, - "learning_rate": 2.2269694507127236e-05, - "loss": 2.2872, - "step": 318030 - }, - { - "epoch": 0.55, - "learning_rate": 2.2268822567200413e-05, - "loss": 2.4357, - "step": 318040 - }, - { - "epoch": 0.55, - "learning_rate": 2.2267950627273584e-05, - "loss": 2.3412, - "step": 318050 - }, - { - "epoch": 0.55, - "learning_rate": 2.2267078687346758e-05, - "loss": 2.3953, - "step": 318060 - }, - { - "epoch": 0.55, - "learning_rate": 2.226620674741993e-05, - "loss": 2.3645, - "step": 318070 - }, - { - "epoch": 0.55, - "learning_rate": 2.2265334807493105e-05, - "loss": 2.2403, - "step": 318080 - }, - { - "epoch": 0.55, - "learning_rate": 2.2264462867566276e-05, - "loss": 2.4452, - "step": 318090 - }, - { - "epoch": 0.55, - "learning_rate": 2.226359092763945e-05, - "loss": 2.3932, - "step": 318100 - }, - { - "epoch": 0.55, - "learning_rate": 2.2262718987712623e-05, - "loss": 2.2817, - "step": 318110 - }, - { - "epoch": 0.55, - "learning_rate": 2.2261847047785797e-05, - "loss": 2.3627, - "step": 318120 - }, - { - "epoch": 0.55, - "learning_rate": 2.226097510785897e-05, - "loss": 2.3385, - "step": 318130 - }, - { - "epoch": 0.55, - "learning_rate": 2.226010316793214e-05, - "loss": 2.4189, - "step": 318140 - }, - { - "epoch": 0.55, - "learning_rate": 2.2259231228005318e-05, - "loss": 2.3179, - "step": 318150 - }, - { - "epoch": 0.55, - "learning_rate": 2.225835928807849e-05, - "loss": 2.4425, - "step": 318160 - }, - { - "epoch": 0.55, - "learning_rate": 2.2257487348151662e-05, - "loss": 2.2816, - "step": 318170 - }, - { - "epoch": 0.55, - "learning_rate": 2.2256615408224836e-05, - "loss": 2.3009, - "step": 318180 - }, - { - "epoch": 0.55, - "learning_rate": 2.225574346829801e-05, - "loss": 2.2788, - "step": 318190 - }, - { - "epoch": 0.55, - "learning_rate": 2.2254871528371184e-05, - "loss": 2.3717, - "step": 318200 - }, - { - "epoch": 0.55, - "learning_rate": 2.2253999588444354e-05, - "loss": 2.3794, - "step": 318210 - }, - { - "epoch": 0.55, - "learning_rate": 2.225312764851753e-05, - "loss": 2.2488, - "step": 318220 - }, - { - "epoch": 0.55, - "learning_rate": 2.22522557085907e-05, - "loss": 2.4705, - "step": 318230 - }, - { - "epoch": 0.55, - "learning_rate": 2.2251383768663875e-05, - "loss": 2.3851, - "step": 318240 - }, - { - "epoch": 0.55, - "learning_rate": 2.2250511828737046e-05, - "loss": 2.361, - "step": 318250 - }, - { - "epoch": 0.56, - "learning_rate": 2.2249639888810223e-05, - "loss": 2.3715, - "step": 318260 - }, - { - "epoch": 0.56, - "learning_rate": 2.2248767948883397e-05, - "loss": 2.4219, - "step": 318270 - }, - { - "epoch": 0.56, - "learning_rate": 2.2247896008956567e-05, - "loss": 2.3745, - "step": 318280 - }, - { - "epoch": 0.56, - "learning_rate": 2.224702406902974e-05, - "loss": 2.3387, - "step": 318290 - }, - { - "epoch": 0.56, - "learning_rate": 2.2246152129102915e-05, - "loss": 2.3058, - "step": 318300 - }, - { - "epoch": 0.56, - "learning_rate": 2.2245280189176088e-05, - "loss": 2.3259, - "step": 318310 - }, - { - "epoch": 0.56, - "learning_rate": 2.224440824924926e-05, - "loss": 2.5157, - "step": 318320 - }, - { - "epoch": 0.56, - "learning_rate": 2.2243536309322436e-05, - "loss": 2.3647, - "step": 318330 - }, - { - "epoch": 0.56, - "learning_rate": 2.2242664369395606e-05, - "loss": 2.4175, - "step": 318340 - }, - { - "epoch": 0.56, - "learning_rate": 2.224179242946878e-05, - "loss": 2.4496, - "step": 318350 - }, - { - "epoch": 0.56, - "learning_rate": 2.2240920489541954e-05, - "loss": 2.2956, - "step": 318360 - }, - { - "epoch": 0.56, - "learning_rate": 2.2240048549615128e-05, - "loss": 2.0526, - "step": 318370 - }, - { - "epoch": 0.56, - "learning_rate": 2.22391766096883e-05, - "loss": 2.2604, - "step": 318380 - }, - { - "epoch": 0.56, - "learning_rate": 2.223830466976147e-05, - "loss": 2.5169, - "step": 318390 - }, - { - "epoch": 0.56, - "learning_rate": 2.2237432729834645e-05, - "loss": 2.4378, - "step": 318400 - }, - { - "epoch": 0.56, - "learning_rate": 2.223656078990782e-05, - "loss": 2.3389, - "step": 318410 - }, - { - "epoch": 0.56, - "learning_rate": 2.2235688849980993e-05, - "loss": 2.3136, - "step": 318420 - }, - { - "epoch": 0.56, - "learning_rate": 2.2234816910054167e-05, - "loss": 2.2648, - "step": 318430 - }, - { - "epoch": 0.56, - "learning_rate": 2.2233944970127337e-05, - "loss": 2.3973, - "step": 318440 - }, - { - "epoch": 0.56, - "learning_rate": 2.2233073030200514e-05, - "loss": 2.4024, - "step": 318450 - }, - { - "epoch": 0.56, - "learning_rate": 2.2232201090273685e-05, - "loss": 2.285, - "step": 318460 - }, - { - "epoch": 0.56, - "learning_rate": 2.223132915034686e-05, - "loss": 2.3217, - "step": 318470 - }, - { - "epoch": 0.56, - "learning_rate": 2.2230457210420032e-05, - "loss": 2.2505, - "step": 318480 - }, - { - "epoch": 0.56, - "learning_rate": 2.2229585270493206e-05, - "loss": 2.2464, - "step": 318490 - }, - { - "epoch": 0.56, - "learning_rate": 2.2228713330566376e-05, - "loss": 2.299, - "step": 318500 - }, - { - "epoch": 0.56, - "learning_rate": 2.222784139063955e-05, - "loss": 2.2984, - "step": 318510 - }, - { - "epoch": 0.56, - "learning_rate": 2.2226969450712727e-05, - "loss": 2.2907, - "step": 318520 - }, - { - "epoch": 0.56, - "learning_rate": 2.2226097510785898e-05, - "loss": 2.352, - "step": 318530 - }, - { - "epoch": 0.56, - "learning_rate": 2.222522557085907e-05, - "loss": 2.3077, - "step": 318540 - }, - { - "epoch": 0.56, - "learning_rate": 2.2224353630932242e-05, - "loss": 2.2108, - "step": 318550 - }, - { - "epoch": 0.56, - "learning_rate": 2.222348169100542e-05, - "loss": 2.4585, - "step": 318560 - }, - { - "epoch": 0.56, - "learning_rate": 2.222260975107859e-05, - "loss": 2.3616, - "step": 318570 - }, - { - "epoch": 0.56, - "learning_rate": 2.2221737811151763e-05, - "loss": 2.2455, - "step": 318580 - }, - { - "epoch": 0.56, - "learning_rate": 2.2220865871224937e-05, - "loss": 2.3442, - "step": 318590 - }, - { - "epoch": 0.56, - "learning_rate": 2.221999393129811e-05, - "loss": 2.2599, - "step": 318600 - }, - { - "epoch": 0.56, - "learning_rate": 2.2219121991371284e-05, - "loss": 2.2938, - "step": 318610 - }, - { - "epoch": 0.56, - "learning_rate": 2.2218250051444455e-05, - "loss": 2.3715, - "step": 318620 - }, - { - "epoch": 0.56, - "learning_rate": 2.2217378111517632e-05, - "loss": 2.3437, - "step": 318630 - }, - { - "epoch": 0.56, - "learning_rate": 2.2216506171590802e-05, - "loss": 2.3842, - "step": 318640 - }, - { - "epoch": 0.56, - "learning_rate": 2.2215634231663976e-05, - "loss": 2.379, - "step": 318650 - }, - { - "epoch": 0.56, - "learning_rate": 2.221476229173715e-05, - "loss": 2.2819, - "step": 318660 - }, - { - "epoch": 0.56, - "learning_rate": 2.2213890351810324e-05, - "loss": 2.3621, - "step": 318670 - }, - { - "epoch": 0.56, - "learning_rate": 2.2213018411883497e-05, - "loss": 2.315, - "step": 318680 - }, - { - "epoch": 0.56, - "learning_rate": 2.2212146471956668e-05, - "loss": 2.3439, - "step": 318690 - }, - { - "epoch": 0.56, - "learning_rate": 2.221127453202984e-05, - "loss": 2.2827, - "step": 318700 - }, - { - "epoch": 0.56, - "learning_rate": 2.2210402592103015e-05, - "loss": 2.2616, - "step": 318710 - }, - { - "epoch": 0.56, - "learning_rate": 2.220953065217619e-05, - "loss": 2.3027, - "step": 318720 - }, - { - "epoch": 0.56, - "learning_rate": 2.220865871224936e-05, - "loss": 2.375, - "step": 318730 - }, - { - "epoch": 0.56, - "learning_rate": 2.2207786772322537e-05, - "loss": 2.3976, - "step": 318740 - }, - { - "epoch": 0.56, - "learning_rate": 2.220691483239571e-05, - "loss": 2.4027, - "step": 318750 - }, - { - "epoch": 0.56, - "learning_rate": 2.220604289246888e-05, - "loss": 2.3075, - "step": 318760 - }, - { - "epoch": 0.56, - "learning_rate": 2.2205170952542055e-05, - "loss": 2.2555, - "step": 318770 - }, - { - "epoch": 0.56, - "learning_rate": 2.220429901261523e-05, - "loss": 2.3177, - "step": 318780 - }, - { - "epoch": 0.56, - "learning_rate": 2.2203427072688402e-05, - "loss": 2.3243, - "step": 318790 - }, - { - "epoch": 0.56, - "learning_rate": 2.2202555132761573e-05, - "loss": 2.38, - "step": 318800 - }, - { - "epoch": 0.56, - "learning_rate": 2.2201683192834746e-05, - "loss": 2.2974, - "step": 318810 - }, - { - "epoch": 0.56, - "learning_rate": 2.220081125290792e-05, - "loss": 2.4204, - "step": 318820 - }, - { - "epoch": 0.56, - "learning_rate": 2.2199939312981094e-05, - "loss": 2.392, - "step": 318830 - }, - { - "epoch": 0.56, - "learning_rate": 2.2199067373054268e-05, - "loss": 2.3368, - "step": 318840 - }, - { - "epoch": 0.56, - "learning_rate": 2.219819543312744e-05, - "loss": 2.2559, - "step": 318850 - }, - { - "epoch": 0.56, - "learning_rate": 2.2197323493200615e-05, - "loss": 2.3951, - "step": 318860 - }, - { - "epoch": 0.56, - "learning_rate": 2.2196451553273786e-05, - "loss": 2.3555, - "step": 318870 - }, - { - "epoch": 0.56, - "learning_rate": 2.219557961334696e-05, - "loss": 2.1453, - "step": 318880 - }, - { - "epoch": 0.56, - "learning_rate": 2.2194707673420133e-05, - "loss": 2.5277, - "step": 318890 - }, - { - "epoch": 0.56, - "learning_rate": 2.2193835733493307e-05, - "loss": 2.4172, - "step": 318900 - }, - { - "epoch": 0.56, - "learning_rate": 2.219296379356648e-05, - "loss": 2.3423, - "step": 318910 - }, - { - "epoch": 0.56, - "learning_rate": 2.219209185363965e-05, - "loss": 2.3497, - "step": 318920 - }, - { - "epoch": 0.56, - "learning_rate": 2.2191219913712828e-05, - "loss": 2.3678, - "step": 318930 - }, - { - "epoch": 0.56, - "learning_rate": 2.2190347973786e-05, - "loss": 2.4562, - "step": 318940 - }, - { - "epoch": 0.56, - "learning_rate": 2.2189476033859172e-05, - "loss": 2.2795, - "step": 318950 - }, - { - "epoch": 0.56, - "learning_rate": 2.2188604093932343e-05, - "loss": 2.2934, - "step": 318960 - }, - { - "epoch": 0.56, - "learning_rate": 2.218773215400552e-05, - "loss": 2.453, - "step": 318970 - }, - { - "epoch": 0.56, - "learning_rate": 2.218686021407869e-05, - "loss": 2.271, - "step": 318980 - }, - { - "epoch": 0.56, - "learning_rate": 2.2185988274151864e-05, - "loss": 2.4483, - "step": 318990 - }, - { - "epoch": 0.56, - "learning_rate": 2.218511633422504e-05, - "loss": 2.4944, - "step": 319000 - }, - { - "epoch": 0.56, - "learning_rate": 2.218424439429821e-05, - "loss": 2.444, - "step": 319010 - }, - { - "epoch": 0.56, - "learning_rate": 2.2183372454371385e-05, - "loss": 2.1628, - "step": 319020 - }, - { - "epoch": 0.56, - "learning_rate": 2.2182500514444556e-05, - "loss": 2.2621, - "step": 319030 - }, - { - "epoch": 0.56, - "learning_rate": 2.2181628574517733e-05, - "loss": 2.3111, - "step": 319040 - }, - { - "epoch": 0.56, - "learning_rate": 2.2180756634590903e-05, - "loss": 2.3862, - "step": 319050 - }, - { - "epoch": 0.56, - "learning_rate": 2.2179884694664077e-05, - "loss": 2.2786, - "step": 319060 - }, - { - "epoch": 0.56, - "learning_rate": 2.217901275473725e-05, - "loss": 2.3302, - "step": 319070 - }, - { - "epoch": 0.56, - "learning_rate": 2.2178140814810425e-05, - "loss": 2.3805, - "step": 319080 - }, - { - "epoch": 0.56, - "learning_rate": 2.2177268874883598e-05, - "loss": 2.3411, - "step": 319090 - }, - { - "epoch": 0.56, - "learning_rate": 2.217639693495677e-05, - "loss": 2.3764, - "step": 319100 - }, - { - "epoch": 0.56, - "learning_rate": 2.2175524995029946e-05, - "loss": 2.3173, - "step": 319110 - }, - { - "epoch": 0.56, - "learning_rate": 2.2174653055103116e-05, - "loss": 2.397, - "step": 319120 - }, - { - "epoch": 0.56, - "learning_rate": 2.217378111517629e-05, - "loss": 2.3568, - "step": 319130 - }, - { - "epoch": 0.56, - "learning_rate": 2.2172909175249464e-05, - "loss": 2.2698, - "step": 319140 - }, - { - "epoch": 0.56, - "learning_rate": 2.2172037235322638e-05, - "loss": 2.3397, - "step": 319150 - }, - { - "epoch": 0.56, - "learning_rate": 2.217116529539581e-05, - "loss": 2.3942, - "step": 319160 - }, - { - "epoch": 0.56, - "learning_rate": 2.217029335546898e-05, - "loss": 2.3686, - "step": 319170 - }, - { - "epoch": 0.56, - "learning_rate": 2.2169421415542155e-05, - "loss": 2.4237, - "step": 319180 - }, - { - "epoch": 0.56, - "learning_rate": 2.216854947561533e-05, - "loss": 2.2946, - "step": 319190 - }, - { - "epoch": 0.56, - "learning_rate": 2.2167677535688503e-05, - "loss": 2.31, - "step": 319200 - }, - { - "epoch": 0.56, - "learning_rate": 2.2166805595761673e-05, - "loss": 2.4126, - "step": 319210 - }, - { - "epoch": 0.56, - "learning_rate": 2.2165933655834847e-05, - "loss": 2.3182, - "step": 319220 - }, - { - "epoch": 0.56, - "learning_rate": 2.216506171590802e-05, - "loss": 2.2225, - "step": 319230 - }, - { - "epoch": 0.56, - "learning_rate": 2.2164189775981195e-05, - "loss": 2.2407, - "step": 319240 - }, - { - "epoch": 0.56, - "learning_rate": 2.216331783605437e-05, - "loss": 2.3732, - "step": 319250 - }, - { - "epoch": 0.56, - "learning_rate": 2.2162445896127542e-05, - "loss": 2.2974, - "step": 319260 - }, - { - "epoch": 0.56, - "learning_rate": 2.2161573956200716e-05, - "loss": 2.3994, - "step": 319270 - }, - { - "epoch": 0.56, - "learning_rate": 2.2160702016273886e-05, - "loss": 2.3777, - "step": 319280 - }, - { - "epoch": 0.56, - "learning_rate": 2.215983007634706e-05, - "loss": 2.3297, - "step": 319290 - }, - { - "epoch": 0.56, - "learning_rate": 2.2158958136420234e-05, - "loss": 2.3682, - "step": 319300 - }, - { - "epoch": 0.56, - "learning_rate": 2.2158086196493408e-05, - "loss": 2.3626, - "step": 319310 - }, - { - "epoch": 0.56, - "learning_rate": 2.215721425656658e-05, - "loss": 2.3103, - "step": 319320 - }, - { - "epoch": 0.56, - "learning_rate": 2.2156342316639752e-05, - "loss": 2.3536, - "step": 319330 - }, - { - "epoch": 0.56, - "learning_rate": 2.215547037671293e-05, - "loss": 2.4437, - "step": 319340 - }, - { - "epoch": 0.56, - "learning_rate": 2.21545984367861e-05, - "loss": 2.3866, - "step": 319350 - }, - { - "epoch": 0.56, - "learning_rate": 2.2153726496859273e-05, - "loss": 2.293, - "step": 319360 - }, - { - "epoch": 0.56, - "learning_rate": 2.2152854556932447e-05, - "loss": 2.4152, - "step": 319370 - }, - { - "epoch": 0.56, - "learning_rate": 2.215198261700562e-05, - "loss": 2.4288, - "step": 319380 - }, - { - "epoch": 0.56, - "learning_rate": 2.2151110677078794e-05, - "loss": 2.3295, - "step": 319390 - }, - { - "epoch": 0.56, - "learning_rate": 2.2150238737151965e-05, - "loss": 2.2817, - "step": 319400 - }, - { - "epoch": 0.56, - "learning_rate": 2.2149366797225142e-05, - "loss": 2.2554, - "step": 319410 - }, - { - "epoch": 0.56, - "learning_rate": 2.2148494857298312e-05, - "loss": 2.3334, - "step": 319420 - }, - { - "epoch": 0.56, - "learning_rate": 2.2147622917371486e-05, - "loss": 2.2772, - "step": 319430 - }, - { - "epoch": 0.56, - "learning_rate": 2.2146750977444657e-05, - "loss": 2.459, - "step": 319440 - }, - { - "epoch": 0.56, - "learning_rate": 2.2145879037517834e-05, - "loss": 2.4288, - "step": 319450 - }, - { - "epoch": 0.56, - "learning_rate": 2.2145007097591004e-05, - "loss": 2.3656, - "step": 319460 - }, - { - "epoch": 0.56, - "learning_rate": 2.2144135157664178e-05, - "loss": 2.4663, - "step": 319470 - }, - { - "epoch": 0.56, - "learning_rate": 2.214326321773735e-05, - "loss": 2.3576, - "step": 319480 - }, - { - "epoch": 0.56, - "learning_rate": 2.2142391277810525e-05, - "loss": 2.4527, - "step": 319490 - }, - { - "epoch": 0.56, - "learning_rate": 2.21415193378837e-05, - "loss": 2.3553, - "step": 319500 - }, - { - "epoch": 0.56, - "learning_rate": 2.214064739795687e-05, - "loss": 2.2272, - "step": 319510 - }, - { - "epoch": 0.56, - "learning_rate": 2.2139775458030047e-05, - "loss": 2.2641, - "step": 319520 - }, - { - "epoch": 0.56, - "learning_rate": 2.2138903518103217e-05, - "loss": 2.3054, - "step": 319530 - }, - { - "epoch": 0.56, - "learning_rate": 2.213803157817639e-05, - "loss": 2.2674, - "step": 319540 - }, - { - "epoch": 0.56, - "learning_rate": 2.2137159638249565e-05, - "loss": 2.3325, - "step": 319550 - }, - { - "epoch": 0.56, - "learning_rate": 2.213628769832274e-05, - "loss": 2.4179, - "step": 319560 - }, - { - "epoch": 0.56, - "learning_rate": 2.2135415758395912e-05, - "loss": 2.3024, - "step": 319570 - }, - { - "epoch": 0.56, - "learning_rate": 2.2134543818469083e-05, - "loss": 2.3414, - "step": 319580 - }, - { - "epoch": 0.56, - "learning_rate": 2.2133671878542256e-05, - "loss": 2.4059, - "step": 319590 - }, - { - "epoch": 0.56, - "learning_rate": 2.213279993861543e-05, - "loss": 2.2603, - "step": 319600 - }, - { - "epoch": 0.56, - "learning_rate": 2.2131927998688604e-05, - "loss": 2.3344, - "step": 319610 - }, - { - "epoch": 0.56, - "learning_rate": 2.2131056058761778e-05, - "loss": 2.3425, - "step": 319620 - }, - { - "epoch": 0.56, - "learning_rate": 2.2130184118834948e-05, - "loss": 2.2519, - "step": 319630 - }, - { - "epoch": 0.56, - "learning_rate": 2.2129312178908125e-05, - "loss": 2.3494, - "step": 319640 - }, - { - "epoch": 0.56, - "learning_rate": 2.2128440238981296e-05, - "loss": 2.3569, - "step": 319650 - }, - { - "epoch": 0.56, - "learning_rate": 2.212756829905447e-05, - "loss": 2.3109, - "step": 319660 - }, - { - "epoch": 0.56, - "learning_rate": 2.2126696359127643e-05, - "loss": 2.2998, - "step": 319670 - }, - { - "epoch": 0.56, - "learning_rate": 2.2125824419200817e-05, - "loss": 2.3789, - "step": 319680 - }, - { - "epoch": 0.56, - "learning_rate": 2.2124952479273987e-05, - "loss": 2.3062, - "step": 319690 - }, - { - "epoch": 0.56, - "learning_rate": 2.212408053934716e-05, - "loss": 2.35, - "step": 319700 - }, - { - "epoch": 0.56, - "learning_rate": 2.2123208599420335e-05, - "loss": 2.396, - "step": 319710 - }, - { - "epoch": 0.56, - "learning_rate": 2.212233665949351e-05, - "loss": 2.3283, - "step": 319720 - }, - { - "epoch": 0.56, - "learning_rate": 2.2121464719566682e-05, - "loss": 2.1968, - "step": 319730 - }, - { - "epoch": 0.56, - "learning_rate": 2.2120592779639853e-05, - "loss": 2.4499, - "step": 319740 - }, - { - "epoch": 0.56, - "learning_rate": 2.211972083971303e-05, - "loss": 2.2959, - "step": 319750 - }, - { - "epoch": 0.56, - "learning_rate": 2.21188488997862e-05, - "loss": 2.3699, - "step": 319760 - }, - { - "epoch": 0.56, - "learning_rate": 2.2117976959859374e-05, - "loss": 2.2533, - "step": 319770 - }, - { - "epoch": 0.56, - "learning_rate": 2.2117105019932548e-05, - "loss": 2.4147, - "step": 319780 - }, - { - "epoch": 0.56, - "learning_rate": 2.211623308000572e-05, - "loss": 2.2611, - "step": 319790 - }, - { - "epoch": 0.56, - "learning_rate": 2.2115361140078895e-05, - "loss": 2.395, - "step": 319800 - }, - { - "epoch": 0.56, - "learning_rate": 2.2114489200152066e-05, - "loss": 2.3674, - "step": 319810 - }, - { - "epoch": 0.56, - "learning_rate": 2.2113617260225243e-05, - "loss": 2.3685, - "step": 319820 - }, - { - "epoch": 0.56, - "learning_rate": 2.2112745320298413e-05, - "loss": 2.2834, - "step": 319830 - }, - { - "epoch": 0.56, - "learning_rate": 2.2111873380371587e-05, - "loss": 2.2971, - "step": 319840 - }, - { - "epoch": 0.56, - "learning_rate": 2.2111001440444757e-05, - "loss": 2.2923, - "step": 319850 - }, - { - "epoch": 0.56, - "learning_rate": 2.2110129500517935e-05, - "loss": 2.3142, - "step": 319860 - }, - { - "epoch": 0.56, - "learning_rate": 2.210925756059111e-05, - "loss": 2.3104, - "step": 319870 - }, - { - "epoch": 0.56, - "learning_rate": 2.210838562066428e-05, - "loss": 2.2476, - "step": 319880 - }, - { - "epoch": 0.56, - "learning_rate": 2.2107513680737452e-05, - "loss": 2.3517, - "step": 319890 - }, - { - "epoch": 0.56, - "learning_rate": 2.2106641740810626e-05, - "loss": 2.2838, - "step": 319900 - }, - { - "epoch": 0.56, - "learning_rate": 2.21057698008838e-05, - "loss": 2.3802, - "step": 319910 - }, - { - "epoch": 0.56, - "learning_rate": 2.210489786095697e-05, - "loss": 2.1858, - "step": 319920 - }, - { - "epoch": 0.56, - "learning_rate": 2.2104025921030148e-05, - "loss": 2.4369, - "step": 319930 - }, - { - "epoch": 0.56, - "learning_rate": 2.2103153981103318e-05, - "loss": 2.3436, - "step": 319940 - }, - { - "epoch": 0.56, - "learning_rate": 2.210228204117649e-05, - "loss": 2.2701, - "step": 319950 - }, - { - "epoch": 0.56, - "learning_rate": 2.2101410101249665e-05, - "loss": 2.3148, - "step": 319960 - }, - { - "epoch": 0.56, - "learning_rate": 2.210053816132284e-05, - "loss": 2.3518, - "step": 319970 - }, - { - "epoch": 0.56, - "learning_rate": 2.2099666221396013e-05, - "loss": 2.4018, - "step": 319980 - }, - { - "epoch": 0.56, - "learning_rate": 2.2098794281469183e-05, - "loss": 2.4242, - "step": 319990 - }, - { - "epoch": 0.56, - "learning_rate": 2.2097922341542357e-05, - "loss": 2.2703, - "step": 320000 - }, - { - "epoch": 0.56, - "learning_rate": 2.209705040161553e-05, - "loss": 2.4134, - "step": 320010 - }, - { - "epoch": 0.56, - "learning_rate": 2.2096178461688705e-05, - "loss": 2.3049, - "step": 320020 - }, - { - "epoch": 0.56, - "learning_rate": 2.209530652176188e-05, - "loss": 2.4368, - "step": 320030 - }, - { - "epoch": 0.56, - "learning_rate": 2.2094434581835052e-05, - "loss": 2.4247, - "step": 320040 - }, - { - "epoch": 0.56, - "learning_rate": 2.2093562641908226e-05, - "loss": 2.3378, - "step": 320050 - }, - { - "epoch": 0.56, - "learning_rate": 2.2092690701981396e-05, - "loss": 2.4327, - "step": 320060 - }, - { - "epoch": 0.56, - "learning_rate": 2.209181876205457e-05, - "loss": 2.3488, - "step": 320070 - }, - { - "epoch": 0.56, - "learning_rate": 2.2090946822127744e-05, - "loss": 2.3722, - "step": 320080 - }, - { - "epoch": 0.56, - "learning_rate": 2.2090074882200918e-05, - "loss": 2.42, - "step": 320090 - }, - { - "epoch": 0.56, - "learning_rate": 2.208920294227409e-05, - "loss": 2.4425, - "step": 320100 - }, - { - "epoch": 0.56, - "learning_rate": 2.2088331002347262e-05, - "loss": 2.3405, - "step": 320110 - }, - { - "epoch": 0.56, - "learning_rate": 2.208745906242044e-05, - "loss": 2.2951, - "step": 320120 - }, - { - "epoch": 0.56, - "learning_rate": 2.208658712249361e-05, - "loss": 2.3491, - "step": 320130 - }, - { - "epoch": 0.56, - "learning_rate": 2.2085715182566783e-05, - "loss": 2.3311, - "step": 320140 - }, - { - "epoch": 0.56, - "learning_rate": 2.2084843242639954e-05, - "loss": 2.3843, - "step": 320150 - }, - { - "epoch": 0.56, - "learning_rate": 2.208397130271313e-05, - "loss": 2.3171, - "step": 320160 - }, - { - "epoch": 0.56, - "learning_rate": 2.20830993627863e-05, - "loss": 2.4045, - "step": 320170 - }, - { - "epoch": 0.56, - "learning_rate": 2.2082227422859475e-05, - "loss": 2.3014, - "step": 320180 - }, - { - "epoch": 0.56, - "learning_rate": 2.208135548293265e-05, - "loss": 2.3695, - "step": 320190 - }, - { - "epoch": 0.56, - "learning_rate": 2.2080483543005822e-05, - "loss": 2.4005, - "step": 320200 - }, - { - "epoch": 0.56, - "learning_rate": 2.2079611603078996e-05, - "loss": 2.346, - "step": 320210 - }, - { - "epoch": 0.56, - "learning_rate": 2.2078739663152167e-05, - "loss": 2.2974, - "step": 320220 - }, - { - "epoch": 0.56, - "learning_rate": 2.2077867723225344e-05, - "loss": 2.4039, - "step": 320230 - }, - { - "epoch": 0.56, - "learning_rate": 2.2076995783298514e-05, - "loss": 2.2934, - "step": 320240 - }, - { - "epoch": 0.56, - "learning_rate": 2.2076123843371688e-05, - "loss": 2.4454, - "step": 320250 - }, - { - "epoch": 0.56, - "learning_rate": 2.207525190344486e-05, - "loss": 2.3525, - "step": 320260 - }, - { - "epoch": 0.56, - "learning_rate": 2.2074379963518035e-05, - "loss": 2.3681, - "step": 320270 - }, - { - "epoch": 0.56, - "learning_rate": 2.207350802359121e-05, - "loss": 2.1837, - "step": 320280 - }, - { - "epoch": 0.56, - "learning_rate": 2.207263608366438e-05, - "loss": 2.4031, - "step": 320290 - }, - { - "epoch": 0.56, - "learning_rate": 2.2071764143737553e-05, - "loss": 2.3638, - "step": 320300 - }, - { - "epoch": 0.56, - "learning_rate": 2.2070892203810727e-05, - "loss": 2.4025, - "step": 320310 - }, - { - "epoch": 0.56, - "learning_rate": 2.20700202638839e-05, - "loss": 2.339, - "step": 320320 - }, - { - "epoch": 0.56, - "learning_rate": 2.206914832395707e-05, - "loss": 2.2562, - "step": 320330 - }, - { - "epoch": 0.56, - "learning_rate": 2.206827638403025e-05, - "loss": 2.3263, - "step": 320340 - }, - { - "epoch": 0.56, - "learning_rate": 2.2067404444103422e-05, - "loss": 2.3932, - "step": 320350 - }, - { - "epoch": 0.56, - "learning_rate": 2.2066532504176593e-05, - "loss": 2.2916, - "step": 320360 - }, - { - "epoch": 0.56, - "learning_rate": 2.2065660564249766e-05, - "loss": 2.3762, - "step": 320370 - }, - { - "epoch": 0.56, - "learning_rate": 2.206478862432294e-05, - "loss": 2.4156, - "step": 320380 - }, - { - "epoch": 0.56, - "learning_rate": 2.2063916684396114e-05, - "loss": 2.4563, - "step": 320390 - }, - { - "epoch": 0.56, - "learning_rate": 2.2063044744469284e-05, - "loss": 2.4347, - "step": 320400 - }, - { - "epoch": 0.56, - "learning_rate": 2.2062172804542458e-05, - "loss": 2.2606, - "step": 320410 - }, - { - "epoch": 0.56, - "learning_rate": 2.2061300864615632e-05, - "loss": 2.4164, - "step": 320420 - }, - { - "epoch": 0.56, - "learning_rate": 2.2060428924688806e-05, - "loss": 2.3688, - "step": 320430 - }, - { - "epoch": 0.56, - "learning_rate": 2.205955698476198e-05, - "loss": 2.3822, - "step": 320440 - }, - { - "epoch": 0.56, - "learning_rate": 2.2058685044835153e-05, - "loss": 2.3703, - "step": 320450 - }, - { - "epoch": 0.56, - "learning_rate": 2.2057813104908327e-05, - "loss": 2.2898, - "step": 320460 - }, - { - "epoch": 0.56, - "learning_rate": 2.2056941164981497e-05, - "loss": 2.34, - "step": 320470 - }, - { - "epoch": 0.56, - "learning_rate": 2.205606922505467e-05, - "loss": 2.3431, - "step": 320480 - }, - { - "epoch": 0.56, - "learning_rate": 2.2055197285127845e-05, - "loss": 2.3906, - "step": 320490 - }, - { - "epoch": 0.56, - "learning_rate": 2.205432534520102e-05, - "loss": 2.3471, - "step": 320500 - }, - { - "epoch": 0.56, - "learning_rate": 2.2053453405274192e-05, - "loss": 2.3204, - "step": 320510 - }, - { - "epoch": 0.56, - "learning_rate": 2.2052581465347363e-05, - "loss": 2.2533, - "step": 320520 - }, - { - "epoch": 0.56, - "learning_rate": 2.205170952542054e-05, - "loss": 2.371, - "step": 320530 - }, - { - "epoch": 0.56, - "learning_rate": 2.205083758549371e-05, - "loss": 2.3705, - "step": 320540 - }, - { - "epoch": 0.56, - "learning_rate": 2.2049965645566884e-05, - "loss": 2.3491, - "step": 320550 - }, - { - "epoch": 0.56, - "learning_rate": 2.2049093705640054e-05, - "loss": 2.4094, - "step": 320560 - }, - { - "epoch": 0.56, - "learning_rate": 2.204822176571323e-05, - "loss": 2.3025, - "step": 320570 - }, - { - "epoch": 0.56, - "learning_rate": 2.2047349825786405e-05, - "loss": 2.3921, - "step": 320580 - }, - { - "epoch": 0.56, - "learning_rate": 2.2046477885859576e-05, - "loss": 2.3958, - "step": 320590 - }, - { - "epoch": 0.56, - "learning_rate": 2.2045605945932753e-05, - "loss": 2.388, - "step": 320600 - }, - { - "epoch": 0.56, - "learning_rate": 2.2044734006005923e-05, - "loss": 2.4296, - "step": 320610 - }, - { - "epoch": 0.56, - "learning_rate": 2.2043862066079097e-05, - "loss": 2.3531, - "step": 320620 - }, - { - "epoch": 0.56, - "learning_rate": 2.2042990126152267e-05, - "loss": 2.2403, - "step": 320630 - }, - { - "epoch": 0.56, - "learning_rate": 2.2042118186225445e-05, - "loss": 2.3062, - "step": 320640 - }, - { - "epoch": 0.56, - "learning_rate": 2.2041246246298615e-05, - "loss": 2.3036, - "step": 320650 - }, - { - "epoch": 0.56, - "learning_rate": 2.204037430637179e-05, - "loss": 2.3714, - "step": 320660 - }, - { - "epoch": 0.56, - "learning_rate": 2.2039502366444962e-05, - "loss": 2.3733, - "step": 320670 - }, - { - "epoch": 0.56, - "learning_rate": 2.2038630426518136e-05, - "loss": 2.3704, - "step": 320680 - }, - { - "epoch": 0.56, - "learning_rate": 2.203775848659131e-05, - "loss": 2.3046, - "step": 320690 - }, - { - "epoch": 0.56, - "learning_rate": 2.203688654666448e-05, - "loss": 2.3939, - "step": 320700 - }, - { - "epoch": 0.56, - "learning_rate": 2.2036014606737658e-05, - "loss": 2.3909, - "step": 320710 - }, - { - "epoch": 0.56, - "learning_rate": 2.2035142666810828e-05, - "loss": 2.2506, - "step": 320720 - }, - { - "epoch": 0.56, - "learning_rate": 2.2034270726884002e-05, - "loss": 2.2521, - "step": 320730 - }, - { - "epoch": 0.56, - "learning_rate": 2.2033398786957175e-05, - "loss": 2.2658, - "step": 320740 - }, - { - "epoch": 0.56, - "learning_rate": 2.203252684703035e-05, - "loss": 2.3013, - "step": 320750 - }, - { - "epoch": 0.56, - "learning_rate": 2.2031654907103523e-05, - "loss": 2.2841, - "step": 320760 - }, - { - "epoch": 0.56, - "learning_rate": 2.2030782967176693e-05, - "loss": 2.4694, - "step": 320770 - }, - { - "epoch": 0.56, - "learning_rate": 2.2029911027249867e-05, - "loss": 2.3424, - "step": 320780 - }, - { - "epoch": 0.56, - "learning_rate": 2.202903908732304e-05, - "loss": 2.3298, - "step": 320790 - }, - { - "epoch": 0.56, - "learning_rate": 2.2028167147396215e-05, - "loss": 2.396, - "step": 320800 - }, - { - "epoch": 0.56, - "learning_rate": 2.2027295207469385e-05, - "loss": 2.2581, - "step": 320810 - }, - { - "epoch": 0.56, - "learning_rate": 2.202642326754256e-05, - "loss": 2.4091, - "step": 320820 - }, - { - "epoch": 0.56, - "learning_rate": 2.2025551327615736e-05, - "loss": 2.4688, - "step": 320830 - }, - { - "epoch": 0.56, - "learning_rate": 2.2024679387688906e-05, - "loss": 2.3997, - "step": 320840 - }, - { - "epoch": 0.56, - "learning_rate": 2.202380744776208e-05, - "loss": 2.4519, - "step": 320850 - }, - { - "epoch": 0.56, - "learning_rate": 2.2022935507835254e-05, - "loss": 2.2835, - "step": 320860 - }, - { - "epoch": 0.56, - "learning_rate": 2.2022063567908428e-05, - "loss": 2.1772, - "step": 320870 - }, - { - "epoch": 0.56, - "learning_rate": 2.2021191627981598e-05, - "loss": 2.2179, - "step": 320880 - }, - { - "epoch": 0.56, - "learning_rate": 2.2020319688054772e-05, - "loss": 2.4057, - "step": 320890 - }, - { - "epoch": 0.56, - "learning_rate": 2.2019447748127946e-05, - "loss": 2.3236, - "step": 320900 - }, - { - "epoch": 0.56, - "learning_rate": 2.201857580820112e-05, - "loss": 2.4212, - "step": 320910 - }, - { - "epoch": 0.56, - "learning_rate": 2.2017703868274293e-05, - "loss": 2.3344, - "step": 320920 - }, - { - "epoch": 0.56, - "learning_rate": 2.2016831928347464e-05, - "loss": 2.3234, - "step": 320930 - }, - { - "epoch": 0.56, - "learning_rate": 2.201595998842064e-05, - "loss": 2.2781, - "step": 320940 - }, - { - "epoch": 0.56, - "learning_rate": 2.201508804849381e-05, - "loss": 2.3984, - "step": 320950 - }, - { - "epoch": 0.56, - "learning_rate": 2.2014216108566985e-05, - "loss": 2.3, - "step": 320960 - }, - { - "epoch": 0.56, - "learning_rate": 2.201334416864016e-05, - "loss": 2.3913, - "step": 320970 - }, - { - "epoch": 0.56, - "learning_rate": 2.2012472228713332e-05, - "loss": 2.3993, - "step": 320980 - }, - { - "epoch": 0.56, - "learning_rate": 2.2011600288786506e-05, - "loss": 2.3457, - "step": 320990 - }, - { - "epoch": 0.56, - "learning_rate": 2.2010728348859677e-05, - "loss": 2.3367, - "step": 321000 - }, - { - "epoch": 0.56, - "learning_rate": 2.2009856408932854e-05, - "loss": 2.4385, - "step": 321010 - }, - { - "epoch": 0.56, - "learning_rate": 2.2008984469006024e-05, - "loss": 2.3268, - "step": 321020 - }, - { - "epoch": 0.56, - "learning_rate": 2.2008112529079198e-05, - "loss": 2.3983, - "step": 321030 - }, - { - "epoch": 0.56, - "learning_rate": 2.2007240589152368e-05, - "loss": 2.3782, - "step": 321040 - }, - { - "epoch": 0.56, - "learning_rate": 2.2006368649225545e-05, - "loss": 2.4717, - "step": 321050 - }, - { - "epoch": 0.56, - "learning_rate": 2.2005496709298716e-05, - "loss": 2.3095, - "step": 321060 - }, - { - "epoch": 0.56, - "learning_rate": 2.200462476937189e-05, - "loss": 2.5284, - "step": 321070 - }, - { - "epoch": 0.56, - "learning_rate": 2.2003752829445063e-05, - "loss": 2.3307, - "step": 321080 - }, - { - "epoch": 0.56, - "learning_rate": 2.2002880889518237e-05, - "loss": 2.4189, - "step": 321090 - }, - { - "epoch": 0.56, - "learning_rate": 2.200200894959141e-05, - "loss": 2.3579, - "step": 321100 - }, - { - "epoch": 0.56, - "learning_rate": 2.200113700966458e-05, - "loss": 2.4058, - "step": 321110 - }, - { - "epoch": 0.56, - "learning_rate": 2.200026506973776e-05, - "loss": 2.3628, - "step": 321120 - }, - { - "epoch": 0.56, - "learning_rate": 2.199939312981093e-05, - "loss": 2.2277, - "step": 321130 - }, - { - "epoch": 0.56, - "learning_rate": 2.1998521189884103e-05, - "loss": 2.3224, - "step": 321140 - }, - { - "epoch": 0.56, - "learning_rate": 2.1997649249957276e-05, - "loss": 2.2955, - "step": 321150 - }, - { - "epoch": 0.56, - "learning_rate": 2.199677731003045e-05, - "loss": 2.3742, - "step": 321160 - }, - { - "epoch": 0.56, - "learning_rate": 2.1995905370103624e-05, - "loss": 2.297, - "step": 321170 - }, - { - "epoch": 0.56, - "learning_rate": 2.1995033430176794e-05, - "loss": 2.329, - "step": 321180 - }, - { - "epoch": 0.56, - "learning_rate": 2.1994161490249968e-05, - "loss": 2.4243, - "step": 321190 - }, - { - "epoch": 0.56, - "learning_rate": 2.1993289550323142e-05, - "loss": 2.3112, - "step": 321200 - }, - { - "epoch": 0.56, - "learning_rate": 2.1992417610396316e-05, - "loss": 2.3329, - "step": 321210 - }, - { - "epoch": 0.56, - "learning_rate": 2.199154567046949e-05, - "loss": 2.3333, - "step": 321220 - }, - { - "epoch": 0.56, - "learning_rate": 2.199067373054266e-05, - "loss": 2.3016, - "step": 321230 - }, - { - "epoch": 0.56, - "learning_rate": 2.1989801790615837e-05, - "loss": 2.3122, - "step": 321240 - }, - { - "epoch": 0.56, - "learning_rate": 2.1988929850689007e-05, - "loss": 2.3463, - "step": 321250 - }, - { - "epoch": 0.56, - "learning_rate": 2.198805791076218e-05, - "loss": 2.3238, - "step": 321260 - }, - { - "epoch": 0.56, - "learning_rate": 2.1987185970835355e-05, - "loss": 2.335, - "step": 321270 - }, - { - "epoch": 0.56, - "learning_rate": 2.198631403090853e-05, - "loss": 2.3036, - "step": 321280 - }, - { - "epoch": 0.56, - "learning_rate": 2.19854420909817e-05, - "loss": 2.387, - "step": 321290 - }, - { - "epoch": 0.56, - "learning_rate": 2.1984570151054873e-05, - "loss": 2.229, - "step": 321300 - }, - { - "epoch": 0.56, - "learning_rate": 2.198369821112805e-05, - "loss": 2.4781, - "step": 321310 - }, - { - "epoch": 0.56, - "learning_rate": 2.198282627120122e-05, - "loss": 2.3133, - "step": 321320 - }, - { - "epoch": 0.56, - "learning_rate": 2.1981954331274394e-05, - "loss": 2.3673, - "step": 321330 - }, - { - "epoch": 0.56, - "learning_rate": 2.1981082391347564e-05, - "loss": 2.3563, - "step": 321340 - }, - { - "epoch": 0.56, - "learning_rate": 2.198021045142074e-05, - "loss": 2.3589, - "step": 321350 - }, - { - "epoch": 0.56, - "learning_rate": 2.1979338511493912e-05, - "loss": 2.4577, - "step": 321360 - }, - { - "epoch": 0.56, - "learning_rate": 2.1978466571567086e-05, - "loss": 2.2753, - "step": 321370 - }, - { - "epoch": 0.56, - "learning_rate": 2.197759463164026e-05, - "loss": 2.3411, - "step": 321380 - }, - { - "epoch": 0.56, - "learning_rate": 2.1976722691713433e-05, - "loss": 2.416, - "step": 321390 - }, - { - "epoch": 0.56, - "learning_rate": 2.1975850751786607e-05, - "loss": 2.3922, - "step": 321400 - }, - { - "epoch": 0.56, - "learning_rate": 2.1974978811859777e-05, - "loss": 2.3704, - "step": 321410 - }, - { - "epoch": 0.56, - "learning_rate": 2.1974106871932955e-05, - "loss": 2.3217, - "step": 321420 - }, - { - "epoch": 0.56, - "learning_rate": 2.1973234932006125e-05, - "loss": 2.3295, - "step": 321430 - }, - { - "epoch": 0.56, - "learning_rate": 2.19723629920793e-05, - "loss": 2.3397, - "step": 321440 - }, - { - "epoch": 0.56, - "learning_rate": 2.1971491052152472e-05, - "loss": 2.3364, - "step": 321450 - }, - { - "epoch": 0.56, - "learning_rate": 2.1970619112225646e-05, - "loss": 2.4735, - "step": 321460 - }, - { - "epoch": 0.56, - "learning_rate": 2.196974717229882e-05, - "loss": 2.3586, - "step": 321470 - }, - { - "epoch": 0.56, - "learning_rate": 2.196887523237199e-05, - "loss": 2.3539, - "step": 321480 - }, - { - "epoch": 0.56, - "learning_rate": 2.1968003292445164e-05, - "loss": 2.3672, - "step": 321490 - }, - { - "epoch": 0.56, - "learning_rate": 2.1967131352518338e-05, - "loss": 2.3498, - "step": 321500 - }, - { - "epoch": 0.56, - "learning_rate": 2.1966259412591512e-05, - "loss": 2.4743, - "step": 321510 - }, - { - "epoch": 0.56, - "learning_rate": 2.1965387472664682e-05, - "loss": 2.4237, - "step": 321520 - }, - { - "epoch": 0.56, - "learning_rate": 2.196451553273786e-05, - "loss": 2.3326, - "step": 321530 - }, - { - "epoch": 0.56, - "learning_rate": 2.196364359281103e-05, - "loss": 2.3207, - "step": 321540 - }, - { - "epoch": 0.56, - "learning_rate": 2.1962771652884203e-05, - "loss": 2.3964, - "step": 321550 - }, - { - "epoch": 0.56, - "learning_rate": 2.1961899712957377e-05, - "loss": 2.3343, - "step": 321560 - }, - { - "epoch": 0.56, - "learning_rate": 2.196102777303055e-05, - "loss": 2.4224, - "step": 321570 - }, - { - "epoch": 0.56, - "learning_rate": 2.1960155833103725e-05, - "loss": 2.3177, - "step": 321580 - }, - { - "epoch": 0.56, - "learning_rate": 2.1959283893176895e-05, - "loss": 2.3824, - "step": 321590 - }, - { - "epoch": 0.56, - "learning_rate": 2.195841195325007e-05, - "loss": 2.2812, - "step": 321600 - }, - { - "epoch": 0.56, - "learning_rate": 2.1957540013323243e-05, - "loss": 2.3757, - "step": 321610 - }, - { - "epoch": 0.56, - "learning_rate": 2.1956668073396416e-05, - "loss": 2.3415, - "step": 321620 - }, - { - "epoch": 0.56, - "learning_rate": 2.195579613346959e-05, - "loss": 2.3328, - "step": 321630 - }, - { - "epoch": 0.56, - "learning_rate": 2.1954924193542764e-05, - "loss": 2.391, - "step": 321640 - }, - { - "epoch": 0.56, - "learning_rate": 2.1954052253615938e-05, - "loss": 2.3737, - "step": 321650 - }, - { - "epoch": 0.56, - "learning_rate": 2.1953180313689108e-05, - "loss": 2.3325, - "step": 321660 - }, - { - "epoch": 0.56, - "learning_rate": 2.1952308373762282e-05, - "loss": 2.2921, - "step": 321670 - }, - { - "epoch": 0.56, - "learning_rate": 2.1951436433835456e-05, - "loss": 2.4212, - "step": 321680 - }, - { - "epoch": 0.56, - "learning_rate": 2.195056449390863e-05, - "loss": 2.3571, - "step": 321690 - }, - { - "epoch": 0.56, - "learning_rate": 2.1949692553981803e-05, - "loss": 2.4673, - "step": 321700 - }, - { - "epoch": 0.56, - "learning_rate": 2.1948820614054974e-05, - "loss": 2.3288, - "step": 321710 - }, - { - "epoch": 0.56, - "learning_rate": 2.194794867412815e-05, - "loss": 2.3305, - "step": 321720 - }, - { - "epoch": 0.56, - "learning_rate": 2.194707673420132e-05, - "loss": 2.3305, - "step": 321730 - }, - { - "epoch": 0.56, - "learning_rate": 2.1946204794274495e-05, - "loss": 2.3209, - "step": 321740 - }, - { - "epoch": 0.56, - "learning_rate": 2.1945332854347665e-05, - "loss": 2.3571, - "step": 321750 - }, - { - "epoch": 0.56, - "learning_rate": 2.1944460914420842e-05, - "loss": 2.3101, - "step": 321760 - }, - { - "epoch": 0.56, - "learning_rate": 2.1943588974494013e-05, - "loss": 2.3539, - "step": 321770 - }, - { - "epoch": 0.56, - "learning_rate": 2.1942717034567187e-05, - "loss": 2.3772, - "step": 321780 - }, - { - "epoch": 0.56, - "learning_rate": 2.194184509464036e-05, - "loss": 2.3614, - "step": 321790 - }, - { - "epoch": 0.56, - "learning_rate": 2.1940973154713534e-05, - "loss": 2.3634, - "step": 321800 - }, - { - "epoch": 0.56, - "learning_rate": 2.1940101214786708e-05, - "loss": 2.3255, - "step": 321810 - }, - { - "epoch": 0.56, - "learning_rate": 2.1939229274859878e-05, - "loss": 2.4184, - "step": 321820 - }, - { - "epoch": 0.56, - "learning_rate": 2.1938357334933055e-05, - "loss": 2.2732, - "step": 321830 - }, - { - "epoch": 0.56, - "learning_rate": 2.1937485395006226e-05, - "loss": 2.3667, - "step": 321840 - }, - { - "epoch": 0.56, - "learning_rate": 2.19366134550794e-05, - "loss": 2.3936, - "step": 321850 - }, - { - "epoch": 0.56, - "learning_rate": 2.1935741515152573e-05, - "loss": 2.4113, - "step": 321860 - }, - { - "epoch": 0.56, - "learning_rate": 2.1934869575225747e-05, - "loss": 2.3706, - "step": 321870 - }, - { - "epoch": 0.56, - "learning_rate": 2.193399763529892e-05, - "loss": 2.4589, - "step": 321880 - }, - { - "epoch": 0.56, - "learning_rate": 2.193312569537209e-05, - "loss": 2.3172, - "step": 321890 - }, - { - "epoch": 0.56, - "learning_rate": 2.193225375544527e-05, - "loss": 2.4241, - "step": 321900 - }, - { - "epoch": 0.56, - "learning_rate": 2.193138181551844e-05, - "loss": 2.2768, - "step": 321910 - }, - { - "epoch": 0.56, - "learning_rate": 2.1930509875591613e-05, - "loss": 2.3429, - "step": 321920 - }, - { - "epoch": 0.56, - "learning_rate": 2.1929637935664786e-05, - "loss": 2.3827, - "step": 321930 - }, - { - "epoch": 0.56, - "learning_rate": 2.192876599573796e-05, - "loss": 2.3515, - "step": 321940 - }, - { - "epoch": 0.56, - "learning_rate": 2.1927894055811134e-05, - "loss": 2.3933, - "step": 321950 - }, - { - "epoch": 0.56, - "learning_rate": 2.1927022115884304e-05, - "loss": 2.2903, - "step": 321960 - }, - { - "epoch": 0.56, - "learning_rate": 2.1926150175957478e-05, - "loss": 2.3672, - "step": 321970 - }, - { - "epoch": 0.56, - "learning_rate": 2.1925278236030652e-05, - "loss": 2.269, - "step": 321980 - }, - { - "epoch": 0.56, - "learning_rate": 2.1924406296103826e-05, - "loss": 2.2986, - "step": 321990 - }, - { - "epoch": 0.56, - "learning_rate": 2.1923534356176996e-05, - "loss": 2.3769, - "step": 322000 - }, - { - "epoch": 0.56, - "learning_rate": 2.192266241625017e-05, - "loss": 2.2913, - "step": 322010 - }, - { - "epoch": 0.56, - "learning_rate": 2.1921790476323343e-05, - "loss": 2.2951, - "step": 322020 - }, - { - "epoch": 0.56, - "learning_rate": 2.1920918536396517e-05, - "loss": 2.3669, - "step": 322030 - }, - { - "epoch": 0.56, - "learning_rate": 2.192004659646969e-05, - "loss": 2.3538, - "step": 322040 - }, - { - "epoch": 0.56, - "learning_rate": 2.1919174656542865e-05, - "loss": 2.3063, - "step": 322050 - }, - { - "epoch": 0.56, - "learning_rate": 2.191830271661604e-05, - "loss": 2.2845, - "step": 322060 - }, - { - "epoch": 0.56, - "learning_rate": 2.191743077668921e-05, - "loss": 2.3595, - "step": 322070 - }, - { - "epoch": 0.56, - "learning_rate": 2.1916558836762383e-05, - "loss": 2.3284, - "step": 322080 - }, - { - "epoch": 0.56, - "learning_rate": 2.1915686896835556e-05, - "loss": 2.2519, - "step": 322090 - }, - { - "epoch": 0.56, - "learning_rate": 2.191481495690873e-05, - "loss": 2.322, - "step": 322100 - }, - { - "epoch": 0.56, - "learning_rate": 2.1913943016981904e-05, - "loss": 2.3569, - "step": 322110 - }, - { - "epoch": 0.56, - "learning_rate": 2.1913071077055074e-05, - "loss": 2.3706, - "step": 322120 - }, - { - "epoch": 0.56, - "learning_rate": 2.191219913712825e-05, - "loss": 2.3477, - "step": 322130 - }, - { - "epoch": 0.56, - "learning_rate": 2.1911327197201422e-05, - "loss": 2.4115, - "step": 322140 - }, - { - "epoch": 0.56, - "learning_rate": 2.1910455257274596e-05, - "loss": 2.2481, - "step": 322150 - }, - { - "epoch": 0.56, - "learning_rate": 2.1909583317347766e-05, - "loss": 2.3055, - "step": 322160 - }, - { - "epoch": 0.56, - "learning_rate": 2.1908711377420943e-05, - "loss": 2.287, - "step": 322170 - }, - { - "epoch": 0.56, - "learning_rate": 2.1907839437494117e-05, - "loss": 2.2745, - "step": 322180 - }, - { - "epoch": 0.56, - "learning_rate": 2.1906967497567287e-05, - "loss": 2.3452, - "step": 322190 - }, - { - "epoch": 0.56, - "learning_rate": 2.1906095557640465e-05, - "loss": 2.3714, - "step": 322200 - }, - { - "epoch": 0.56, - "learning_rate": 2.1905223617713635e-05, - "loss": 2.2452, - "step": 322210 - }, - { - "epoch": 0.56, - "learning_rate": 2.190435167778681e-05, - "loss": 2.3371, - "step": 322220 - }, - { - "epoch": 0.56, - "learning_rate": 2.190347973785998e-05, - "loss": 2.3569, - "step": 322230 - }, - { - "epoch": 0.56, - "learning_rate": 2.1902607797933156e-05, - "loss": 2.3744, - "step": 322240 - }, - { - "epoch": 0.56, - "learning_rate": 2.1901735858006327e-05, - "loss": 2.2793, - "step": 322250 - }, - { - "epoch": 0.56, - "learning_rate": 2.19008639180795e-05, - "loss": 2.4216, - "step": 322260 - }, - { - "epoch": 0.56, - "learning_rate": 2.1899991978152674e-05, - "loss": 2.4271, - "step": 322270 - }, - { - "epoch": 0.56, - "learning_rate": 2.1899120038225848e-05, - "loss": 2.3549, - "step": 322280 - }, - { - "epoch": 0.56, - "learning_rate": 2.1898248098299022e-05, - "loss": 2.356, - "step": 322290 - }, - { - "epoch": 0.56, - "learning_rate": 2.1897376158372192e-05, - "loss": 2.1577, - "step": 322300 - }, - { - "epoch": 0.56, - "learning_rate": 2.189650421844537e-05, - "loss": 2.3889, - "step": 322310 - }, - { - "epoch": 0.56, - "learning_rate": 2.189563227851854e-05, - "loss": 2.2827, - "step": 322320 - }, - { - "epoch": 0.56, - "learning_rate": 2.1894760338591713e-05, - "loss": 2.382, - "step": 322330 - }, - { - "epoch": 0.56, - "learning_rate": 2.1893888398664887e-05, - "loss": 2.3108, - "step": 322340 - }, - { - "epoch": 0.56, - "learning_rate": 2.189301645873806e-05, - "loss": 2.248, - "step": 322350 - }, - { - "epoch": 0.56, - "learning_rate": 2.1892144518811235e-05, - "loss": 2.3016, - "step": 322360 - }, - { - "epoch": 0.56, - "learning_rate": 2.1891272578884405e-05, - "loss": 2.3592, - "step": 322370 - }, - { - "epoch": 0.56, - "learning_rate": 2.189040063895758e-05, - "loss": 2.2996, - "step": 322380 - }, - { - "epoch": 0.56, - "learning_rate": 2.1889528699030753e-05, - "loss": 2.3736, - "step": 322390 - }, - { - "epoch": 0.56, - "learning_rate": 2.1888656759103926e-05, - "loss": 2.2197, - "step": 322400 - }, - { - "epoch": 0.56, - "learning_rate": 2.1887784819177097e-05, - "loss": 2.3045, - "step": 322410 - }, - { - "epoch": 0.56, - "learning_rate": 2.188691287925027e-05, - "loss": 2.2362, - "step": 322420 - }, - { - "epoch": 0.56, - "learning_rate": 2.1886040939323448e-05, - "loss": 2.3843, - "step": 322430 - }, - { - "epoch": 0.56, - "learning_rate": 2.1885168999396618e-05, - "loss": 2.3769, - "step": 322440 - }, - { - "epoch": 0.56, - "learning_rate": 2.1884297059469792e-05, - "loss": 2.379, - "step": 322450 - }, - { - "epoch": 0.56, - "learning_rate": 2.1883425119542966e-05, - "loss": 2.344, - "step": 322460 - }, - { - "epoch": 0.56, - "learning_rate": 2.188255317961614e-05, - "loss": 2.3288, - "step": 322470 - }, - { - "epoch": 0.56, - "learning_rate": 2.188168123968931e-05, - "loss": 2.475, - "step": 322480 - }, - { - "epoch": 0.56, - "learning_rate": 2.1880809299762484e-05, - "loss": 2.3883, - "step": 322490 - }, - { - "epoch": 0.56, - "learning_rate": 2.1879937359835657e-05, - "loss": 2.3131, - "step": 322500 - }, - { - "epoch": 0.56, - "learning_rate": 2.187906541990883e-05, - "loss": 2.3429, - "step": 322510 - }, - { - "epoch": 0.56, - "learning_rate": 2.1878193479982005e-05, - "loss": 2.4013, - "step": 322520 - }, - { - "epoch": 0.56, - "learning_rate": 2.1877321540055175e-05, - "loss": 2.3209, - "step": 322530 - }, - { - "epoch": 0.56, - "learning_rate": 2.1876449600128352e-05, - "loss": 2.474, - "step": 322540 - }, - { - "epoch": 0.56, - "learning_rate": 2.1875577660201523e-05, - "loss": 2.2728, - "step": 322550 - }, - { - "epoch": 0.56, - "learning_rate": 2.1874705720274697e-05, - "loss": 2.3764, - "step": 322560 - }, - { - "epoch": 0.56, - "learning_rate": 2.187383378034787e-05, - "loss": 2.3059, - "step": 322570 - }, - { - "epoch": 0.56, - "learning_rate": 2.1872961840421044e-05, - "loss": 2.4285, - "step": 322580 - }, - { - "epoch": 0.56, - "learning_rate": 2.1872089900494218e-05, - "loss": 2.3922, - "step": 322590 - }, - { - "epoch": 0.56, - "learning_rate": 2.1871217960567388e-05, - "loss": 2.3152, - "step": 322600 - }, - { - "epoch": 0.56, - "learning_rate": 2.1870346020640565e-05, - "loss": 2.2915, - "step": 322610 - }, - { - "epoch": 0.56, - "learning_rate": 2.1869474080713736e-05, - "loss": 2.3079, - "step": 322620 - }, - { - "epoch": 0.56, - "learning_rate": 2.186860214078691e-05, - "loss": 2.4096, - "step": 322630 - }, - { - "epoch": 0.56, - "learning_rate": 2.186773020086008e-05, - "loss": 2.3548, - "step": 322640 - }, - { - "epoch": 0.56, - "learning_rate": 2.1866858260933257e-05, - "loss": 2.2814, - "step": 322650 - }, - { - "epoch": 0.56, - "learning_rate": 2.186598632100643e-05, - "loss": 2.2786, - "step": 322660 - }, - { - "epoch": 0.56, - "learning_rate": 2.18651143810796e-05, - "loss": 2.3271, - "step": 322670 - }, - { - "epoch": 0.56, - "learning_rate": 2.1864242441152775e-05, - "loss": 2.2722, - "step": 322680 - }, - { - "epoch": 0.56, - "learning_rate": 2.186337050122595e-05, - "loss": 2.4052, - "step": 322690 - }, - { - "epoch": 0.56, - "learning_rate": 2.1862498561299123e-05, - "loss": 2.4173, - "step": 322700 - }, - { - "epoch": 0.56, - "learning_rate": 2.1861626621372293e-05, - "loss": 2.4556, - "step": 322710 - }, - { - "epoch": 0.56, - "learning_rate": 2.186075468144547e-05, - "loss": 2.3867, - "step": 322720 - }, - { - "epoch": 0.56, - "learning_rate": 2.185988274151864e-05, - "loss": 2.3887, - "step": 322730 - }, - { - "epoch": 0.56, - "learning_rate": 2.1859010801591814e-05, - "loss": 2.4299, - "step": 322740 - }, - { - "epoch": 0.56, - "learning_rate": 2.1858138861664988e-05, - "loss": 2.2603, - "step": 322750 - }, - { - "epoch": 0.56, - "learning_rate": 2.1857266921738162e-05, - "loss": 2.2981, - "step": 322760 - }, - { - "epoch": 0.56, - "learning_rate": 2.1856394981811336e-05, - "loss": 2.5019, - "step": 322770 - }, - { - "epoch": 0.56, - "learning_rate": 2.1855523041884506e-05, - "loss": 2.3744, - "step": 322780 - }, - { - "epoch": 0.56, - "learning_rate": 2.185465110195768e-05, - "loss": 2.3171, - "step": 322790 - }, - { - "epoch": 0.56, - "learning_rate": 2.1853779162030853e-05, - "loss": 2.268, - "step": 322800 - }, - { - "epoch": 0.56, - "learning_rate": 2.1852907222104027e-05, - "loss": 2.4127, - "step": 322810 - }, - { - "epoch": 0.56, - "learning_rate": 2.18520352821772e-05, - "loss": 2.3494, - "step": 322820 - }, - { - "epoch": 0.56, - "learning_rate": 2.185116334225037e-05, - "loss": 2.3664, - "step": 322830 - }, - { - "epoch": 0.56, - "learning_rate": 2.185029140232355e-05, - "loss": 2.3906, - "step": 322840 - }, - { - "epoch": 0.56, - "learning_rate": 2.184941946239672e-05, - "loss": 2.4184, - "step": 322850 - }, - { - "epoch": 0.56, - "learning_rate": 2.1848547522469893e-05, - "loss": 2.3993, - "step": 322860 - }, - { - "epoch": 0.56, - "learning_rate": 2.1847675582543066e-05, - "loss": 2.3118, - "step": 322870 - }, - { - "epoch": 0.56, - "learning_rate": 2.184680364261624e-05, - "loss": 2.3401, - "step": 322880 - }, - { - "epoch": 0.56, - "learning_rate": 2.184593170268941e-05, - "loss": 2.4143, - "step": 322890 - }, - { - "epoch": 0.56, - "learning_rate": 2.1845059762762584e-05, - "loss": 2.3244, - "step": 322900 - }, - { - "epoch": 0.56, - "learning_rate": 2.184418782283576e-05, - "loss": 2.2556, - "step": 322910 - }, - { - "epoch": 0.56, - "learning_rate": 2.1843315882908932e-05, - "loss": 2.4289, - "step": 322920 - }, - { - "epoch": 0.56, - "learning_rate": 2.1842443942982106e-05, - "loss": 2.3631, - "step": 322930 - }, - { - "epoch": 0.56, - "learning_rate": 2.1841572003055276e-05, - "loss": 2.3868, - "step": 322940 - }, - { - "epoch": 0.56, - "learning_rate": 2.1840700063128453e-05, - "loss": 2.2177, - "step": 322950 - }, - { - "epoch": 0.56, - "learning_rate": 2.1839828123201624e-05, - "loss": 2.4083, - "step": 322960 - }, - { - "epoch": 0.56, - "learning_rate": 2.1838956183274797e-05, - "loss": 2.3973, - "step": 322970 - }, - { - "epoch": 0.56, - "learning_rate": 2.183808424334797e-05, - "loss": 2.3968, - "step": 322980 - }, - { - "epoch": 0.56, - "learning_rate": 2.1837212303421145e-05, - "loss": 2.3966, - "step": 322990 - }, - { - "epoch": 0.56, - "learning_rate": 2.183634036349432e-05, - "loss": 2.1521, - "step": 323000 - }, - { - "epoch": 0.56, - "learning_rate": 2.183546842356749e-05, - "loss": 2.293, - "step": 323010 - }, - { - "epoch": 0.56, - "learning_rate": 2.1834596483640666e-05, - "loss": 2.365, - "step": 323020 - }, - { - "epoch": 0.56, - "learning_rate": 2.1833724543713837e-05, - "loss": 2.3218, - "step": 323030 - }, - { - "epoch": 0.56, - "learning_rate": 2.183285260378701e-05, - "loss": 2.3536, - "step": 323040 - }, - { - "epoch": 0.56, - "learning_rate": 2.1831980663860184e-05, - "loss": 2.3527, - "step": 323050 - }, - { - "epoch": 0.56, - "learning_rate": 2.1831108723933358e-05, - "loss": 2.3366, - "step": 323060 - }, - { - "epoch": 0.56, - "learning_rate": 2.1830236784006532e-05, - "loss": 2.3599, - "step": 323070 - }, - { - "epoch": 0.56, - "learning_rate": 2.1829364844079702e-05, - "loss": 2.3121, - "step": 323080 - }, - { - "epoch": 0.56, - "learning_rate": 2.1828492904152876e-05, - "loss": 2.3471, - "step": 323090 - }, - { - "epoch": 0.56, - "learning_rate": 2.182762096422605e-05, - "loss": 2.302, - "step": 323100 - }, - { - "epoch": 0.56, - "learning_rate": 2.1826749024299223e-05, - "loss": 2.3995, - "step": 323110 - }, - { - "epoch": 0.56, - "learning_rate": 2.1825877084372394e-05, - "loss": 2.3042, - "step": 323120 - }, - { - "epoch": 0.56, - "learning_rate": 2.182500514444557e-05, - "loss": 2.4492, - "step": 323130 - }, - { - "epoch": 0.56, - "learning_rate": 2.182413320451874e-05, - "loss": 2.3296, - "step": 323140 - }, - { - "epoch": 0.56, - "learning_rate": 2.1823261264591915e-05, - "loss": 2.3594, - "step": 323150 - }, - { - "epoch": 0.56, - "learning_rate": 2.182238932466509e-05, - "loss": 2.3172, - "step": 323160 - }, - { - "epoch": 0.56, - "learning_rate": 2.1821517384738263e-05, - "loss": 2.3962, - "step": 323170 - }, - { - "epoch": 0.56, - "learning_rate": 2.1820645444811436e-05, - "loss": 2.3268, - "step": 323180 - }, - { - "epoch": 0.56, - "learning_rate": 2.1819773504884607e-05, - "loss": 2.3174, - "step": 323190 - }, - { - "epoch": 0.56, - "learning_rate": 2.181890156495778e-05, - "loss": 2.2225, - "step": 323200 - }, - { - "epoch": 0.56, - "learning_rate": 2.1818029625030954e-05, - "loss": 2.3102, - "step": 323210 - }, - { - "epoch": 0.56, - "learning_rate": 2.1817157685104128e-05, - "loss": 2.3743, - "step": 323220 - }, - { - "epoch": 0.56, - "learning_rate": 2.1816285745177302e-05, - "loss": 2.3855, - "step": 323230 - }, - { - "epoch": 0.56, - "learning_rate": 2.1815413805250476e-05, - "loss": 2.32, - "step": 323240 - }, - { - "epoch": 0.56, - "learning_rate": 2.181454186532365e-05, - "loss": 2.3448, - "step": 323250 - }, - { - "epoch": 0.56, - "learning_rate": 2.181366992539682e-05, - "loss": 2.3667, - "step": 323260 - }, - { - "epoch": 0.56, - "learning_rate": 2.1812797985469994e-05, - "loss": 2.3675, - "step": 323270 - }, - { - "epoch": 0.56, - "learning_rate": 2.1811926045543167e-05, - "loss": 2.331, - "step": 323280 - }, - { - "epoch": 0.56, - "learning_rate": 2.181105410561634e-05, - "loss": 2.3712, - "step": 323290 - }, - { - "epoch": 0.56, - "learning_rate": 2.1810182165689515e-05, - "loss": 2.3333, - "step": 323300 - }, - { - "epoch": 0.56, - "learning_rate": 2.1809310225762685e-05, - "loss": 2.2524, - "step": 323310 - }, - { - "epoch": 0.56, - "learning_rate": 2.1808438285835862e-05, - "loss": 2.3064, - "step": 323320 - }, - { - "epoch": 0.56, - "learning_rate": 2.1807566345909033e-05, - "loss": 2.3077, - "step": 323330 - }, - { - "epoch": 0.56, - "learning_rate": 2.1806694405982207e-05, - "loss": 2.3643, - "step": 323340 - }, - { - "epoch": 0.56, - "learning_rate": 2.1805822466055377e-05, - "loss": 2.4481, - "step": 323350 - }, - { - "epoch": 0.56, - "learning_rate": 2.1804950526128554e-05, - "loss": 2.3148, - "step": 323360 - }, - { - "epoch": 0.56, - "learning_rate": 2.1804078586201724e-05, - "loss": 2.2958, - "step": 323370 - }, - { - "epoch": 0.56, - "learning_rate": 2.1803206646274898e-05, - "loss": 2.4328, - "step": 323380 - }, - { - "epoch": 0.56, - "learning_rate": 2.1802334706348075e-05, - "loss": 2.3577, - "step": 323390 - }, - { - "epoch": 0.56, - "learning_rate": 2.1801462766421246e-05, - "loss": 2.3483, - "step": 323400 - }, - { - "epoch": 0.56, - "learning_rate": 2.180059082649442e-05, - "loss": 2.2729, - "step": 323410 - }, - { - "epoch": 0.56, - "learning_rate": 2.179971888656759e-05, - "loss": 2.2716, - "step": 323420 - }, - { - "epoch": 0.56, - "learning_rate": 2.1798846946640767e-05, - "loss": 2.278, - "step": 323430 - }, - { - "epoch": 0.56, - "learning_rate": 2.1797975006713937e-05, - "loss": 2.4747, - "step": 323440 - }, - { - "epoch": 0.56, - "learning_rate": 2.179710306678711e-05, - "loss": 2.3499, - "step": 323450 - }, - { - "epoch": 0.56, - "learning_rate": 2.1796231126860285e-05, - "loss": 2.3181, - "step": 323460 - }, - { - "epoch": 0.56, - "learning_rate": 2.179535918693346e-05, - "loss": 2.3954, - "step": 323470 - }, - { - "epoch": 0.56, - "learning_rate": 2.1794487247006633e-05, - "loss": 2.2611, - "step": 323480 - }, - { - "epoch": 0.56, - "learning_rate": 2.1793615307079803e-05, - "loss": 2.3054, - "step": 323490 - }, - { - "epoch": 0.56, - "learning_rate": 2.179274336715298e-05, - "loss": 2.299, - "step": 323500 - }, - { - "epoch": 0.56, - "learning_rate": 2.179187142722615e-05, - "loss": 2.3663, - "step": 323510 - }, - { - "epoch": 0.56, - "learning_rate": 2.1790999487299324e-05, - "loss": 2.2273, - "step": 323520 - }, - { - "epoch": 0.56, - "learning_rate": 2.1790127547372498e-05, - "loss": 2.3146, - "step": 323530 - }, - { - "epoch": 0.56, - "learning_rate": 2.1789255607445672e-05, - "loss": 2.2908, - "step": 323540 - }, - { - "epoch": 0.56, - "learning_rate": 2.1788383667518846e-05, - "loss": 2.3464, - "step": 323550 - }, - { - "epoch": 0.56, - "learning_rate": 2.1787511727592016e-05, - "loss": 2.3571, - "step": 323560 - }, - { - "epoch": 0.56, - "learning_rate": 2.178663978766519e-05, - "loss": 2.3218, - "step": 323570 - }, - { - "epoch": 0.56, - "learning_rate": 2.1785767847738363e-05, - "loss": 2.4122, - "step": 323580 - }, - { - "epoch": 0.56, - "learning_rate": 2.1784895907811537e-05, - "loss": 2.4264, - "step": 323590 - }, - { - "epoch": 0.56, - "learning_rate": 2.1784023967884708e-05, - "loss": 2.2904, - "step": 323600 - }, - { - "epoch": 0.56, - "learning_rate": 2.178315202795788e-05, - "loss": 2.3645, - "step": 323610 - }, - { - "epoch": 0.56, - "learning_rate": 2.1782280088031055e-05, - "loss": 2.3752, - "step": 323620 - }, - { - "epoch": 0.56, - "learning_rate": 2.178140814810423e-05, - "loss": 2.3916, - "step": 323630 - }, - { - "epoch": 0.56, - "learning_rate": 2.1780536208177403e-05, - "loss": 2.2, - "step": 323640 - }, - { - "epoch": 0.56, - "learning_rate": 2.1779664268250576e-05, - "loss": 2.2393, - "step": 323650 - }, - { - "epoch": 0.56, - "learning_rate": 2.177879232832375e-05, - "loss": 2.3722, - "step": 323660 - }, - { - "epoch": 0.56, - "learning_rate": 2.177792038839692e-05, - "loss": 2.2746, - "step": 323670 - }, - { - "epoch": 0.56, - "learning_rate": 2.1777048448470094e-05, - "loss": 2.3891, - "step": 323680 - }, - { - "epoch": 0.56, - "learning_rate": 2.1776176508543268e-05, - "loss": 2.3025, - "step": 323690 - }, - { - "epoch": 0.56, - "learning_rate": 2.1775304568616442e-05, - "loss": 2.3342, - "step": 323700 - }, - { - "epoch": 0.56, - "learning_rate": 2.1774432628689616e-05, - "loss": 2.3353, - "step": 323710 - }, - { - "epoch": 0.56, - "learning_rate": 2.1773560688762786e-05, - "loss": 2.3393, - "step": 323720 - }, - { - "epoch": 0.56, - "learning_rate": 2.1772688748835963e-05, - "loss": 2.2925, - "step": 323730 - }, - { - "epoch": 0.56, - "learning_rate": 2.1771816808909134e-05, - "loss": 2.2444, - "step": 323740 - }, - { - "epoch": 0.56, - "learning_rate": 2.1770944868982307e-05, - "loss": 2.5031, - "step": 323750 - }, - { - "epoch": 0.56, - "learning_rate": 2.1770072929055478e-05, - "loss": 2.3171, - "step": 323760 - }, - { - "epoch": 0.56, - "learning_rate": 2.1769200989128655e-05, - "loss": 2.3432, - "step": 323770 - }, - { - "epoch": 0.56, - "learning_rate": 2.176832904920183e-05, - "loss": 2.2618, - "step": 323780 - }, - { - "epoch": 0.56, - "learning_rate": 2.1767457109275e-05, - "loss": 2.3705, - "step": 323790 - }, - { - "epoch": 0.56, - "learning_rate": 2.1766585169348176e-05, - "loss": 2.2998, - "step": 323800 - }, - { - "epoch": 0.56, - "learning_rate": 2.1765713229421347e-05, - "loss": 2.4165, - "step": 323810 - }, - { - "epoch": 0.56, - "learning_rate": 2.176484128949452e-05, - "loss": 2.3463, - "step": 323820 - }, - { - "epoch": 0.56, - "learning_rate": 2.176396934956769e-05, - "loss": 2.4572, - "step": 323830 - }, - { - "epoch": 0.56, - "learning_rate": 2.1763097409640868e-05, - "loss": 2.1615, - "step": 323840 - }, - { - "epoch": 0.56, - "learning_rate": 2.176222546971404e-05, - "loss": 2.2716, - "step": 323850 - }, - { - "epoch": 0.56, - "learning_rate": 2.1761353529787212e-05, - "loss": 2.3645, - "step": 323860 - }, - { - "epoch": 0.56, - "learning_rate": 2.1760481589860386e-05, - "loss": 2.4038, - "step": 323870 - }, - { - "epoch": 0.56, - "learning_rate": 2.175960964993356e-05, - "loss": 2.2059, - "step": 323880 - }, - { - "epoch": 0.56, - "learning_rate": 2.1758737710006733e-05, - "loss": 2.3659, - "step": 323890 - }, - { - "epoch": 0.56, - "learning_rate": 2.1757865770079904e-05, - "loss": 2.3279, - "step": 323900 - }, - { - "epoch": 0.56, - "learning_rate": 2.175699383015308e-05, - "loss": 2.328, - "step": 323910 - }, - { - "epoch": 0.56, - "learning_rate": 2.175612189022625e-05, - "loss": 2.3479, - "step": 323920 - }, - { - "epoch": 0.56, - "learning_rate": 2.1755249950299425e-05, - "loss": 2.3345, - "step": 323930 - }, - { - "epoch": 0.56, - "learning_rate": 2.17543780103726e-05, - "loss": 2.3089, - "step": 323940 - }, - { - "epoch": 0.56, - "learning_rate": 2.1753506070445773e-05, - "loss": 2.3647, - "step": 323950 - }, - { - "epoch": 0.56, - "learning_rate": 2.1752634130518946e-05, - "loss": 2.3164, - "step": 323960 - }, - { - "epoch": 0.56, - "learning_rate": 2.1751762190592117e-05, - "loss": 2.3977, - "step": 323970 - }, - { - "epoch": 0.56, - "learning_rate": 2.175089025066529e-05, - "loss": 2.2806, - "step": 323980 - }, - { - "epoch": 0.56, - "learning_rate": 2.1750018310738464e-05, - "loss": 2.3459, - "step": 323990 - }, - { - "epoch": 0.57, - "learning_rate": 2.1749146370811638e-05, - "loss": 2.3291, - "step": 324000 - }, - { - "epoch": 0.57, - "learning_rate": 2.1748274430884812e-05, - "loss": 2.2928, - "step": 324010 - }, - { - "epoch": 0.57, - "learning_rate": 2.1747402490957982e-05, - "loss": 2.3442, - "step": 324020 - }, - { - "epoch": 0.57, - "learning_rate": 2.174653055103116e-05, - "loss": 2.3405, - "step": 324030 - }, - { - "epoch": 0.57, - "learning_rate": 2.174565861110433e-05, - "loss": 2.4095, - "step": 324040 - }, - { - "epoch": 0.57, - "learning_rate": 2.1744786671177504e-05, - "loss": 2.3156, - "step": 324050 - }, - { - "epoch": 0.57, - "learning_rate": 2.1743914731250677e-05, - "loss": 2.3552, - "step": 324060 - }, - { - "epoch": 0.57, - "learning_rate": 2.174304279132385e-05, - "loss": 2.3214, - "step": 324070 - }, - { - "epoch": 0.57, - "learning_rate": 2.174217085139702e-05, - "loss": 2.3239, - "step": 324080 - }, - { - "epoch": 0.57, - "learning_rate": 2.1741298911470195e-05, - "loss": 2.2569, - "step": 324090 - }, - { - "epoch": 0.57, - "learning_rate": 2.174042697154337e-05, - "loss": 2.3726, - "step": 324100 - }, - { - "epoch": 0.57, - "learning_rate": 2.1739555031616543e-05, - "loss": 2.2854, - "step": 324110 - }, - { - "epoch": 0.57, - "learning_rate": 2.1738683091689717e-05, - "loss": 2.2577, - "step": 324120 - }, - { - "epoch": 0.57, - "learning_rate": 2.1737811151762887e-05, - "loss": 2.3584, - "step": 324130 - }, - { - "epoch": 0.57, - "learning_rate": 2.1736939211836064e-05, - "loss": 2.4694, - "step": 324140 - }, - { - "epoch": 0.57, - "learning_rate": 2.1736067271909234e-05, - "loss": 2.2618, - "step": 324150 - }, - { - "epoch": 0.57, - "learning_rate": 2.1735195331982408e-05, - "loss": 2.2758, - "step": 324160 - }, - { - "epoch": 0.57, - "learning_rate": 2.1734323392055582e-05, - "loss": 2.2685, - "step": 324170 - }, - { - "epoch": 0.57, - "learning_rate": 2.1733451452128756e-05, - "loss": 2.3522, - "step": 324180 - }, - { - "epoch": 0.57, - "learning_rate": 2.173257951220193e-05, - "loss": 2.3359, - "step": 324190 - }, - { - "epoch": 0.57, - "learning_rate": 2.17317075722751e-05, - "loss": 2.4001, - "step": 324200 - }, - { - "epoch": 0.57, - "learning_rate": 2.1730835632348277e-05, - "loss": 2.3169, - "step": 324210 - }, - { - "epoch": 0.57, - "learning_rate": 2.1729963692421447e-05, - "loss": 2.3137, - "step": 324220 - }, - { - "epoch": 0.57, - "learning_rate": 2.172909175249462e-05, - "loss": 2.3458, - "step": 324230 - }, - { - "epoch": 0.57, - "learning_rate": 2.172821981256779e-05, - "loss": 2.4613, - "step": 324240 - }, - { - "epoch": 0.57, - "learning_rate": 2.172734787264097e-05, - "loss": 2.3482, - "step": 324250 - }, - { - "epoch": 0.57, - "learning_rate": 2.1726475932714143e-05, - "loss": 2.4159, - "step": 324260 - }, - { - "epoch": 0.57, - "learning_rate": 2.1725603992787313e-05, - "loss": 2.4192, - "step": 324270 - }, - { - "epoch": 0.57, - "learning_rate": 2.1724732052860487e-05, - "loss": 2.2986, - "step": 324280 - }, - { - "epoch": 0.57, - "learning_rate": 2.172386011293366e-05, - "loss": 2.406, - "step": 324290 - }, - { - "epoch": 0.57, - "learning_rate": 2.1722988173006834e-05, - "loss": 2.3291, - "step": 324300 - }, - { - "epoch": 0.57, - "learning_rate": 2.1722116233080005e-05, - "loss": 2.2723, - "step": 324310 - }, - { - "epoch": 0.57, - "learning_rate": 2.1721244293153182e-05, - "loss": 2.3499, - "step": 324320 - }, - { - "epoch": 0.57, - "learning_rate": 2.1720372353226352e-05, - "loss": 2.3657, - "step": 324330 - }, - { - "epoch": 0.57, - "learning_rate": 2.1719500413299526e-05, - "loss": 2.21, - "step": 324340 - }, - { - "epoch": 0.57, - "learning_rate": 2.17186284733727e-05, - "loss": 2.2857, - "step": 324350 - }, - { - "epoch": 0.57, - "learning_rate": 2.1717756533445874e-05, - "loss": 2.312, - "step": 324360 - }, - { - "epoch": 0.57, - "learning_rate": 2.1716884593519047e-05, - "loss": 2.3438, - "step": 324370 - }, - { - "epoch": 0.57, - "learning_rate": 2.1716012653592218e-05, - "loss": 2.3486, - "step": 324380 - }, - { - "epoch": 0.57, - "learning_rate": 2.171514071366539e-05, - "loss": 2.2784, - "step": 324390 - }, - { - "epoch": 0.57, - "learning_rate": 2.1714268773738565e-05, - "loss": 2.3863, - "step": 324400 - }, - { - "epoch": 0.57, - "learning_rate": 2.171339683381174e-05, - "loss": 2.4562, - "step": 324410 - }, - { - "epoch": 0.57, - "learning_rate": 2.1712524893884913e-05, - "loss": 2.42, - "step": 324420 - }, - { - "epoch": 0.57, - "learning_rate": 2.1711652953958087e-05, - "loss": 2.2824, - "step": 324430 - }, - { - "epoch": 0.57, - "learning_rate": 2.171078101403126e-05, - "loss": 2.3439, - "step": 324440 - }, - { - "epoch": 0.57, - "learning_rate": 2.170990907410443e-05, - "loss": 2.3629, - "step": 324450 - }, - { - "epoch": 0.57, - "learning_rate": 2.1709037134177604e-05, - "loss": 2.4285, - "step": 324460 - }, - { - "epoch": 0.57, - "learning_rate": 2.1708165194250778e-05, - "loss": 2.3181, - "step": 324470 - }, - { - "epoch": 0.57, - "learning_rate": 2.1707293254323952e-05, - "loss": 2.3222, - "step": 324480 - }, - { - "epoch": 0.57, - "learning_rate": 2.1706421314397122e-05, - "loss": 2.3361, - "step": 324490 - }, - { - "epoch": 0.57, - "learning_rate": 2.1705549374470296e-05, - "loss": 2.4158, - "step": 324500 - }, - { - "epoch": 0.57, - "learning_rate": 2.1704677434543473e-05, - "loss": 2.3583, - "step": 324510 - }, - { - "epoch": 0.57, - "learning_rate": 2.1703805494616644e-05, - "loss": 2.3139, - "step": 324520 - }, - { - "epoch": 0.57, - "learning_rate": 2.1702933554689817e-05, - "loss": 2.3242, - "step": 324530 - }, - { - "epoch": 0.57, - "learning_rate": 2.1702061614762988e-05, - "loss": 2.3238, - "step": 324540 - }, - { - "epoch": 0.57, - "learning_rate": 2.1701189674836165e-05, - "loss": 2.3436, - "step": 324550 - }, - { - "epoch": 0.57, - "learning_rate": 2.1700317734909335e-05, - "loss": 2.3601, - "step": 324560 - }, - { - "epoch": 0.57, - "learning_rate": 2.169944579498251e-05, - "loss": 2.3334, - "step": 324570 - }, - { - "epoch": 0.57, - "learning_rate": 2.1698573855055683e-05, - "loss": 2.3025, - "step": 324580 - }, - { - "epoch": 0.57, - "learning_rate": 2.1697701915128857e-05, - "loss": 2.3521, - "step": 324590 - }, - { - "epoch": 0.57, - "learning_rate": 2.169682997520203e-05, - "loss": 2.3927, - "step": 324600 - }, - { - "epoch": 0.57, - "learning_rate": 2.16959580352752e-05, - "loss": 2.1775, - "step": 324610 - }, - { - "epoch": 0.57, - "learning_rate": 2.1695086095348378e-05, - "loss": 2.4065, - "step": 324620 - }, - { - "epoch": 0.57, - "learning_rate": 2.169421415542155e-05, - "loss": 2.4272, - "step": 324630 - }, - { - "epoch": 0.57, - "learning_rate": 2.1693342215494722e-05, - "loss": 2.4426, - "step": 324640 - }, - { - "epoch": 0.57, - "learning_rate": 2.1692470275567896e-05, - "loss": 2.3795, - "step": 324650 - }, - { - "epoch": 0.57, - "learning_rate": 2.169159833564107e-05, - "loss": 2.535, - "step": 324660 - }, - { - "epoch": 0.57, - "learning_rate": 2.1690726395714243e-05, - "loss": 2.3735, - "step": 324670 - }, - { - "epoch": 0.57, - "learning_rate": 2.1689854455787414e-05, - "loss": 2.3002, - "step": 324680 - }, - { - "epoch": 0.57, - "learning_rate": 2.1688982515860588e-05, - "loss": 2.3278, - "step": 324690 - }, - { - "epoch": 0.57, - "learning_rate": 2.168811057593376e-05, - "loss": 2.3897, - "step": 324700 - }, - { - "epoch": 0.57, - "learning_rate": 2.1687238636006935e-05, - "loss": 2.3375, - "step": 324710 - }, - { - "epoch": 0.57, - "learning_rate": 2.1686366696080106e-05, - "loss": 2.4145, - "step": 324720 - }, - { - "epoch": 0.57, - "learning_rate": 2.1685494756153283e-05, - "loss": 2.2415, - "step": 324730 - }, - { - "epoch": 0.57, - "learning_rate": 2.1684622816226456e-05, - "loss": 2.1979, - "step": 324740 - }, - { - "epoch": 0.57, - "learning_rate": 2.1683750876299627e-05, - "loss": 2.3504, - "step": 324750 - }, - { - "epoch": 0.57, - "learning_rate": 2.16828789363728e-05, - "loss": 2.5496, - "step": 324760 - }, - { - "epoch": 0.57, - "learning_rate": 2.1682006996445974e-05, - "loss": 2.277, - "step": 324770 - }, - { - "epoch": 0.57, - "learning_rate": 2.1681135056519148e-05, - "loss": 2.251, - "step": 324780 - }, - { - "epoch": 0.57, - "learning_rate": 2.168026311659232e-05, - "loss": 2.3996, - "step": 324790 - }, - { - "epoch": 0.57, - "learning_rate": 2.1679391176665492e-05, - "loss": 2.4412, - "step": 324800 - }, - { - "epoch": 0.57, - "learning_rate": 2.1678519236738666e-05, - "loss": 2.3214, - "step": 324810 - }, - { - "epoch": 0.57, - "learning_rate": 2.167764729681184e-05, - "loss": 2.234, - "step": 324820 - }, - { - "epoch": 0.57, - "learning_rate": 2.1676775356885014e-05, - "loss": 2.3437, - "step": 324830 - }, - { - "epoch": 0.57, - "learning_rate": 2.1675903416958187e-05, - "loss": 2.3327, - "step": 324840 - }, - { - "epoch": 0.57, - "learning_rate": 2.167503147703136e-05, - "loss": 2.303, - "step": 324850 - }, - { - "epoch": 0.57, - "learning_rate": 2.167415953710453e-05, - "loss": 2.3563, - "step": 324860 - }, - { - "epoch": 0.57, - "learning_rate": 2.1673287597177705e-05, - "loss": 2.3669, - "step": 324870 - }, - { - "epoch": 0.57, - "learning_rate": 2.167241565725088e-05, - "loss": 2.2141, - "step": 324880 - }, - { - "epoch": 0.57, - "learning_rate": 2.1671543717324053e-05, - "loss": 2.3145, - "step": 324890 - }, - { - "epoch": 0.57, - "learning_rate": 2.1670671777397227e-05, - "loss": 2.3361, - "step": 324900 - }, - { - "epoch": 0.57, - "learning_rate": 2.1669799837470397e-05, - "loss": 2.348, - "step": 324910 - }, - { - "epoch": 0.57, - "learning_rate": 2.1668927897543574e-05, - "loss": 2.3332, - "step": 324920 - }, - { - "epoch": 0.57, - "learning_rate": 2.1668055957616745e-05, - "loss": 2.3945, - "step": 324930 - }, - { - "epoch": 0.57, - "learning_rate": 2.1667184017689918e-05, - "loss": 2.3782, - "step": 324940 - }, - { - "epoch": 0.57, - "learning_rate": 2.166631207776309e-05, - "loss": 2.3308, - "step": 324950 - }, - { - "epoch": 0.57, - "learning_rate": 2.1665440137836266e-05, - "loss": 2.3711, - "step": 324960 - }, - { - "epoch": 0.57, - "learning_rate": 2.1664568197909436e-05, - "loss": 2.367, - "step": 324970 - }, - { - "epoch": 0.57, - "learning_rate": 2.166369625798261e-05, - "loss": 2.3798, - "step": 324980 - }, - { - "epoch": 0.57, - "learning_rate": 2.1662824318055787e-05, - "loss": 2.3459, - "step": 324990 - }, - { - "epoch": 0.57, - "learning_rate": 2.1661952378128958e-05, - "loss": 2.3554, - "step": 325000 - }, - { - "epoch": 0.57, - "learning_rate": 2.166108043820213e-05, - "loss": 2.398, - "step": 325010 - }, - { - "epoch": 0.57, - "learning_rate": 2.16602084982753e-05, - "loss": 2.2237, - "step": 325020 - }, - { - "epoch": 0.57, - "learning_rate": 2.165933655834848e-05, - "loss": 2.3121, - "step": 325030 - }, - { - "epoch": 0.57, - "learning_rate": 2.165846461842165e-05, - "loss": 2.3307, - "step": 325040 - }, - { - "epoch": 0.57, - "learning_rate": 2.1657592678494823e-05, - "loss": 2.3645, - "step": 325050 - }, - { - "epoch": 0.57, - "learning_rate": 2.1656720738567997e-05, - "loss": 2.3873, - "step": 325060 - }, - { - "epoch": 0.57, - "learning_rate": 2.165584879864117e-05, - "loss": 2.3477, - "step": 325070 - }, - { - "epoch": 0.57, - "learning_rate": 2.1654976858714344e-05, - "loss": 2.2482, - "step": 325080 - }, - { - "epoch": 0.57, - "learning_rate": 2.1654104918787515e-05, - "loss": 2.427, - "step": 325090 - }, - { - "epoch": 0.57, - "learning_rate": 2.1653232978860692e-05, - "loss": 2.3261, - "step": 325100 - }, - { - "epoch": 0.57, - "learning_rate": 2.1652361038933862e-05, - "loss": 2.2743, - "step": 325110 - }, - { - "epoch": 0.57, - "learning_rate": 2.1651489099007036e-05, - "loss": 2.3925, - "step": 325120 - }, - { - "epoch": 0.57, - "learning_rate": 2.165061715908021e-05, - "loss": 2.3315, - "step": 325130 - }, - { - "epoch": 0.57, - "learning_rate": 2.1649745219153384e-05, - "loss": 2.2498, - "step": 325140 - }, - { - "epoch": 0.57, - "learning_rate": 2.1648873279226557e-05, - "loss": 2.3311, - "step": 325150 - }, - { - "epoch": 0.57, - "learning_rate": 2.1648001339299728e-05, - "loss": 2.3887, - "step": 325160 - }, - { - "epoch": 0.57, - "learning_rate": 2.16471293993729e-05, - "loss": 2.3769, - "step": 325170 - }, - { - "epoch": 0.57, - "learning_rate": 2.1646257459446075e-05, - "loss": 2.4127, - "step": 325180 - }, - { - "epoch": 0.57, - "learning_rate": 2.164538551951925e-05, - "loss": 2.4282, - "step": 325190 - }, - { - "epoch": 0.57, - "learning_rate": 2.164451357959242e-05, - "loss": 2.2962, - "step": 325200 - }, - { - "epoch": 0.57, - "learning_rate": 2.1643641639665593e-05, - "loss": 2.3028, - "step": 325210 - }, - { - "epoch": 0.57, - "learning_rate": 2.1642769699738767e-05, - "loss": 2.3608, - "step": 325220 - }, - { - "epoch": 0.57, - "learning_rate": 2.164189775981194e-05, - "loss": 2.2981, - "step": 325230 - }, - { - "epoch": 0.57, - "learning_rate": 2.1641025819885114e-05, - "loss": 2.3271, - "step": 325240 - }, - { - "epoch": 0.57, - "learning_rate": 2.1640153879958288e-05, - "loss": 2.4282, - "step": 325250 - }, - { - "epoch": 0.57, - "learning_rate": 2.1639281940031462e-05, - "loss": 2.3707, - "step": 325260 - }, - { - "epoch": 0.57, - "learning_rate": 2.1638410000104632e-05, - "loss": 2.3439, - "step": 325270 - }, - { - "epoch": 0.57, - "learning_rate": 2.1637538060177806e-05, - "loss": 2.2964, - "step": 325280 - }, - { - "epoch": 0.57, - "learning_rate": 2.163666612025098e-05, - "loss": 2.2897, - "step": 325290 - }, - { - "epoch": 0.57, - "learning_rate": 2.1635794180324154e-05, - "loss": 2.2683, - "step": 325300 - }, - { - "epoch": 0.57, - "learning_rate": 2.1634922240397327e-05, - "loss": 2.4125, - "step": 325310 - }, - { - "epoch": 0.57, - "learning_rate": 2.1634050300470498e-05, - "loss": 2.4071, - "step": 325320 - }, - { - "epoch": 0.57, - "learning_rate": 2.1633178360543675e-05, - "loss": 2.3953, - "step": 325330 - }, - { - "epoch": 0.57, - "learning_rate": 2.1632306420616845e-05, - "loss": 2.3523, - "step": 325340 - }, - { - "epoch": 0.57, - "learning_rate": 2.163143448069002e-05, - "loss": 2.3922, - "step": 325350 - }, - { - "epoch": 0.57, - "learning_rate": 2.1630562540763193e-05, - "loss": 2.2905, - "step": 325360 - }, - { - "epoch": 0.57, - "learning_rate": 2.1629690600836367e-05, - "loss": 2.3148, - "step": 325370 - }, - { - "epoch": 0.57, - "learning_rate": 2.162881866090954e-05, - "loss": 2.3729, - "step": 325380 - }, - { - "epoch": 0.57, - "learning_rate": 2.162794672098271e-05, - "loss": 2.379, - "step": 325390 - }, - { - "epoch": 0.57, - "learning_rate": 2.1627074781055888e-05, - "loss": 2.3793, - "step": 325400 - }, - { - "epoch": 0.57, - "learning_rate": 2.162620284112906e-05, - "loss": 2.3651, - "step": 325410 - }, - { - "epoch": 0.57, - "learning_rate": 2.1625330901202232e-05, - "loss": 2.2779, - "step": 325420 - }, - { - "epoch": 0.57, - "learning_rate": 2.1624458961275403e-05, - "loss": 2.2842, - "step": 325430 - }, - { - "epoch": 0.57, - "learning_rate": 2.162358702134858e-05, - "loss": 2.3994, - "step": 325440 - }, - { - "epoch": 0.57, - "learning_rate": 2.162271508142175e-05, - "loss": 2.3735, - "step": 325450 - }, - { - "epoch": 0.57, - "learning_rate": 2.1621843141494924e-05, - "loss": 2.2903, - "step": 325460 - }, - { - "epoch": 0.57, - "learning_rate": 2.1620971201568098e-05, - "loss": 2.3159, - "step": 325470 - }, - { - "epoch": 0.57, - "learning_rate": 2.162009926164127e-05, - "loss": 2.1918, - "step": 325480 - }, - { - "epoch": 0.57, - "learning_rate": 2.1619227321714445e-05, - "loss": 2.4497, - "step": 325490 - }, - { - "epoch": 0.57, - "learning_rate": 2.1618355381787616e-05, - "loss": 2.3086, - "step": 325500 - }, - { - "epoch": 0.57, - "learning_rate": 2.1617483441860793e-05, - "loss": 2.4627, - "step": 325510 - }, - { - "epoch": 0.57, - "learning_rate": 2.1616611501933963e-05, - "loss": 2.3617, - "step": 325520 - }, - { - "epoch": 0.57, - "learning_rate": 2.1615739562007137e-05, - "loss": 2.3771, - "step": 325530 - }, - { - "epoch": 0.57, - "learning_rate": 2.161486762208031e-05, - "loss": 2.4072, - "step": 325540 - }, - { - "epoch": 0.57, - "learning_rate": 2.1613995682153484e-05, - "loss": 2.3025, - "step": 325550 - }, - { - "epoch": 0.57, - "learning_rate": 2.1613123742226658e-05, - "loss": 2.3435, - "step": 325560 - }, - { - "epoch": 0.57, - "learning_rate": 2.161225180229983e-05, - "loss": 2.4122, - "step": 325570 - }, - { - "epoch": 0.57, - "learning_rate": 2.1611379862373002e-05, - "loss": 2.2751, - "step": 325580 - }, - { - "epoch": 0.57, - "learning_rate": 2.1610507922446176e-05, - "loss": 2.342, - "step": 325590 - }, - { - "epoch": 0.57, - "learning_rate": 2.160963598251935e-05, - "loss": 2.3612, - "step": 325600 - }, - { - "epoch": 0.57, - "learning_rate": 2.1608764042592524e-05, - "loss": 2.3398, - "step": 325610 - }, - { - "epoch": 0.57, - "learning_rate": 2.1607892102665694e-05, - "loss": 2.3732, - "step": 325620 - }, - { - "epoch": 0.57, - "learning_rate": 2.160702016273887e-05, - "loss": 2.3597, - "step": 325630 - }, - { - "epoch": 0.57, - "learning_rate": 2.160614822281204e-05, - "loss": 2.366, - "step": 325640 - }, - { - "epoch": 0.57, - "learning_rate": 2.1605276282885215e-05, - "loss": 2.4004, - "step": 325650 - }, - { - "epoch": 0.57, - "learning_rate": 2.160440434295839e-05, - "loss": 2.4164, - "step": 325660 - }, - { - "epoch": 0.57, - "learning_rate": 2.1603532403031563e-05, - "loss": 2.388, - "step": 325670 - }, - { - "epoch": 0.57, - "learning_rate": 2.1602660463104733e-05, - "loss": 2.3688, - "step": 325680 - }, - { - "epoch": 0.57, - "learning_rate": 2.1601788523177907e-05, - "loss": 2.2449, - "step": 325690 - }, - { - "epoch": 0.57, - "learning_rate": 2.160091658325108e-05, - "loss": 2.3607, - "step": 325700 - }, - { - "epoch": 0.57, - "learning_rate": 2.1600044643324255e-05, - "loss": 2.2932, - "step": 325710 - }, - { - "epoch": 0.57, - "learning_rate": 2.1599172703397428e-05, - "loss": 2.3354, - "step": 325720 - }, - { - "epoch": 0.57, - "learning_rate": 2.15983007634706e-05, - "loss": 2.3635, - "step": 325730 - }, - { - "epoch": 0.57, - "learning_rate": 2.1597428823543776e-05, - "loss": 2.3701, - "step": 325740 - }, - { - "epoch": 0.57, - "learning_rate": 2.1596556883616946e-05, - "loss": 2.2344, - "step": 325750 - }, - { - "epoch": 0.57, - "learning_rate": 2.159568494369012e-05, - "loss": 2.2932, - "step": 325760 - }, - { - "epoch": 0.57, - "learning_rate": 2.1594813003763294e-05, - "loss": 2.2381, - "step": 325770 - }, - { - "epoch": 0.57, - "learning_rate": 2.1593941063836468e-05, - "loss": 2.3297, - "step": 325780 - }, - { - "epoch": 0.57, - "learning_rate": 2.159306912390964e-05, - "loss": 2.3016, - "step": 325790 - }, - { - "epoch": 0.57, - "learning_rate": 2.159219718398281e-05, - "loss": 2.3524, - "step": 325800 - }, - { - "epoch": 0.57, - "learning_rate": 2.159132524405599e-05, - "loss": 2.3665, - "step": 325810 - }, - { - "epoch": 0.57, - "learning_rate": 2.159045330412916e-05, - "loss": 2.4357, - "step": 325820 - }, - { - "epoch": 0.57, - "learning_rate": 2.1589581364202333e-05, - "loss": 2.3144, - "step": 325830 - }, - { - "epoch": 0.57, - "learning_rate": 2.1588709424275503e-05, - "loss": 2.3468, - "step": 325840 - }, - { - "epoch": 0.57, - "learning_rate": 2.158783748434868e-05, - "loss": 2.408, - "step": 325850 - }, - { - "epoch": 0.57, - "learning_rate": 2.1586965544421854e-05, - "loss": 2.3734, - "step": 325860 - }, - { - "epoch": 0.57, - "learning_rate": 2.1586093604495025e-05, - "loss": 2.4074, - "step": 325870 - }, - { - "epoch": 0.57, - "learning_rate": 2.15852216645682e-05, - "loss": 2.477, - "step": 325880 - }, - { - "epoch": 0.57, - "learning_rate": 2.1584349724641372e-05, - "loss": 2.432, - "step": 325890 - }, - { - "epoch": 0.57, - "learning_rate": 2.1583477784714546e-05, - "loss": 2.4178, - "step": 325900 - }, - { - "epoch": 0.57, - "learning_rate": 2.1582605844787716e-05, - "loss": 2.2547, - "step": 325910 - }, - { - "epoch": 0.57, - "learning_rate": 2.1581733904860894e-05, - "loss": 2.3103, - "step": 325920 - }, - { - "epoch": 0.57, - "learning_rate": 2.1580861964934064e-05, - "loss": 2.28, - "step": 325930 - }, - { - "epoch": 0.57, - "learning_rate": 2.1579990025007238e-05, - "loss": 2.2938, - "step": 325940 - }, - { - "epoch": 0.57, - "learning_rate": 2.157911808508041e-05, - "loss": 2.3712, - "step": 325950 - }, - { - "epoch": 0.57, - "learning_rate": 2.1578246145153585e-05, - "loss": 2.3598, - "step": 325960 - }, - { - "epoch": 0.57, - "learning_rate": 2.157737420522676e-05, - "loss": 2.3564, - "step": 325970 - }, - { - "epoch": 0.57, - "learning_rate": 2.157650226529993e-05, - "loss": 2.3423, - "step": 325980 - }, - { - "epoch": 0.57, - "learning_rate": 2.1575630325373103e-05, - "loss": 2.4945, - "step": 325990 - }, - { - "epoch": 0.57, - "learning_rate": 2.1574758385446277e-05, - "loss": 2.3916, - "step": 326000 - }, - { - "epoch": 0.57, - "learning_rate": 2.157388644551945e-05, - "loss": 2.3127, - "step": 326010 - }, - { - "epoch": 0.57, - "learning_rate": 2.1573014505592624e-05, - "loss": 2.3185, - "step": 326020 - }, - { - "epoch": 0.57, - "learning_rate": 2.1572142565665798e-05, - "loss": 2.3427, - "step": 326030 - }, - { - "epoch": 0.57, - "learning_rate": 2.1571270625738972e-05, - "loss": 2.2453, - "step": 326040 - }, - { - "epoch": 0.57, - "learning_rate": 2.1570398685812142e-05, - "loss": 2.2426, - "step": 326050 - }, - { - "epoch": 0.57, - "learning_rate": 2.1569526745885316e-05, - "loss": 2.4844, - "step": 326060 - }, - { - "epoch": 0.57, - "learning_rate": 2.156865480595849e-05, - "loss": 2.2634, - "step": 326070 - }, - { - "epoch": 0.57, - "learning_rate": 2.1567782866031664e-05, - "loss": 2.4328, - "step": 326080 - }, - { - "epoch": 0.57, - "learning_rate": 2.1566910926104837e-05, - "loss": 2.1761, - "step": 326090 - }, - { - "epoch": 0.57, - "learning_rate": 2.1566038986178008e-05, - "loss": 2.2846, - "step": 326100 - }, - { - "epoch": 0.57, - "learning_rate": 2.1565167046251185e-05, - "loss": 2.3706, - "step": 326110 - }, - { - "epoch": 0.57, - "learning_rate": 2.1564295106324355e-05, - "loss": 2.3939, - "step": 326120 - }, - { - "epoch": 0.57, - "learning_rate": 2.156342316639753e-05, - "loss": 2.3386, - "step": 326130 - }, - { - "epoch": 0.57, - "learning_rate": 2.15625512264707e-05, - "loss": 2.2984, - "step": 326140 - }, - { - "epoch": 0.57, - "learning_rate": 2.1561679286543877e-05, - "loss": 2.1456, - "step": 326150 - }, - { - "epoch": 0.57, - "learning_rate": 2.1560807346617047e-05, - "loss": 2.3765, - "step": 326160 - }, - { - "epoch": 0.57, - "learning_rate": 2.155993540669022e-05, - "loss": 2.3181, - "step": 326170 - }, - { - "epoch": 0.57, - "learning_rate": 2.1559063466763395e-05, - "loss": 2.3263, - "step": 326180 - }, - { - "epoch": 0.57, - "learning_rate": 2.155819152683657e-05, - "loss": 2.4416, - "step": 326190 - }, - { - "epoch": 0.57, - "learning_rate": 2.1557319586909742e-05, - "loss": 2.4508, - "step": 326200 - }, - { - "epoch": 0.57, - "learning_rate": 2.1556447646982913e-05, - "loss": 2.3513, - "step": 326210 - }, - { - "epoch": 0.57, - "learning_rate": 2.155557570705609e-05, - "loss": 2.3694, - "step": 326220 - }, - { - "epoch": 0.57, - "learning_rate": 2.155470376712926e-05, - "loss": 2.3011, - "step": 326230 - }, - { - "epoch": 0.57, - "learning_rate": 2.1553831827202434e-05, - "loss": 2.3944, - "step": 326240 - }, - { - "epoch": 0.57, - "learning_rate": 2.1552959887275608e-05, - "loss": 2.4008, - "step": 326250 - }, - { - "epoch": 0.57, - "learning_rate": 2.155208794734878e-05, - "loss": 2.3661, - "step": 326260 - }, - { - "epoch": 0.57, - "learning_rate": 2.1551216007421955e-05, - "loss": 2.3675, - "step": 326270 - }, - { - "epoch": 0.57, - "learning_rate": 2.1550344067495126e-05, - "loss": 2.4674, - "step": 326280 - }, - { - "epoch": 0.57, - "learning_rate": 2.1549472127568303e-05, - "loss": 2.2509, - "step": 326290 - }, - { - "epoch": 0.57, - "learning_rate": 2.1548600187641473e-05, - "loss": 2.3652, - "step": 326300 - }, - { - "epoch": 0.57, - "learning_rate": 2.1547728247714647e-05, - "loss": 2.3591, - "step": 326310 - }, - { - "epoch": 0.57, - "learning_rate": 2.1546856307787817e-05, - "loss": 2.3428, - "step": 326320 - }, - { - "epoch": 0.57, - "learning_rate": 2.1545984367860994e-05, - "loss": 2.3165, - "step": 326330 - }, - { - "epoch": 0.57, - "learning_rate": 2.1545112427934168e-05, - "loss": 2.4802, - "step": 326340 - }, - { - "epoch": 0.57, - "learning_rate": 2.154424048800734e-05, - "loss": 2.3266, - "step": 326350 - }, - { - "epoch": 0.57, - "learning_rate": 2.1543368548080512e-05, - "loss": 2.2585, - "step": 326360 - }, - { - "epoch": 0.57, - "learning_rate": 2.1542496608153686e-05, - "loss": 2.3584, - "step": 326370 - }, - { - "epoch": 0.57, - "learning_rate": 2.154162466822686e-05, - "loss": 2.3771, - "step": 326380 - }, - { - "epoch": 0.57, - "learning_rate": 2.154075272830003e-05, - "loss": 2.2731, - "step": 326390 - }, - { - "epoch": 0.57, - "learning_rate": 2.1539880788373204e-05, - "loss": 2.3346, - "step": 326400 - }, - { - "epoch": 0.57, - "learning_rate": 2.1539008848446378e-05, - "loss": 2.3257, - "step": 326410 - }, - { - "epoch": 0.57, - "learning_rate": 2.153813690851955e-05, - "loss": 2.3472, - "step": 326420 - }, - { - "epoch": 0.57, - "learning_rate": 2.1537264968592725e-05, - "loss": 2.2904, - "step": 326430 - }, - { - "epoch": 0.57, - "learning_rate": 2.15363930286659e-05, - "loss": 2.383, - "step": 326440 - }, - { - "epoch": 0.57, - "learning_rate": 2.1535521088739073e-05, - "loss": 2.2793, - "step": 326450 - }, - { - "epoch": 0.57, - "learning_rate": 2.1534649148812243e-05, - "loss": 2.3121, - "step": 326460 - }, - { - "epoch": 0.57, - "learning_rate": 2.1533777208885417e-05, - "loss": 2.2681, - "step": 326470 - }, - { - "epoch": 0.57, - "learning_rate": 2.153290526895859e-05, - "loss": 2.3793, - "step": 326480 - }, - { - "epoch": 0.57, - "learning_rate": 2.1532033329031765e-05, - "loss": 2.4144, - "step": 326490 - }, - { - "epoch": 0.57, - "learning_rate": 2.1531161389104938e-05, - "loss": 2.2392, - "step": 326500 - }, - { - "epoch": 0.57, - "learning_rate": 2.153028944917811e-05, - "loss": 2.3213, - "step": 326510 - }, - { - "epoch": 0.57, - "learning_rate": 2.1529417509251286e-05, - "loss": 2.3064, - "step": 326520 - }, - { - "epoch": 0.57, - "learning_rate": 2.1528545569324456e-05, - "loss": 2.3038, - "step": 326530 - }, - { - "epoch": 0.57, - "learning_rate": 2.152767362939763e-05, - "loss": 2.3707, - "step": 326540 - }, - { - "epoch": 0.57, - "learning_rate": 2.15268016894708e-05, - "loss": 2.325, - "step": 326550 - }, - { - "epoch": 0.57, - "learning_rate": 2.1525929749543978e-05, - "loss": 2.4135, - "step": 326560 - }, - { - "epoch": 0.57, - "learning_rate": 2.1525057809617148e-05, - "loss": 2.3384, - "step": 326570 - }, - { - "epoch": 0.57, - "learning_rate": 2.152418586969032e-05, - "loss": 2.4399, - "step": 326580 - }, - { - "epoch": 0.57, - "learning_rate": 2.15233139297635e-05, - "loss": 2.3208, - "step": 326590 - }, - { - "epoch": 0.57, - "learning_rate": 2.152244198983667e-05, - "loss": 2.3495, - "step": 326600 - }, - { - "epoch": 0.57, - "learning_rate": 2.1521570049909843e-05, - "loss": 2.3076, - "step": 326610 - }, - { - "epoch": 0.57, - "learning_rate": 2.1520698109983013e-05, - "loss": 2.3659, - "step": 326620 - }, - { - "epoch": 0.57, - "learning_rate": 2.151982617005619e-05, - "loss": 2.3612, - "step": 326630 - }, - { - "epoch": 0.57, - "learning_rate": 2.151895423012936e-05, - "loss": 2.3795, - "step": 326640 - }, - { - "epoch": 0.57, - "learning_rate": 2.1518082290202535e-05, - "loss": 2.4171, - "step": 326650 - }, - { - "epoch": 0.57, - "learning_rate": 2.151721035027571e-05, - "loss": 2.3143, - "step": 326660 - }, - { - "epoch": 0.57, - "learning_rate": 2.1516338410348882e-05, - "loss": 2.4504, - "step": 326670 - }, - { - "epoch": 0.57, - "learning_rate": 2.1515466470422056e-05, - "loss": 2.3162, - "step": 326680 - }, - { - "epoch": 0.57, - "learning_rate": 2.1514594530495226e-05, - "loss": 2.2518, - "step": 326690 - }, - { - "epoch": 0.57, - "learning_rate": 2.1513722590568404e-05, - "loss": 2.2392, - "step": 326700 - }, - { - "epoch": 0.57, - "learning_rate": 2.1512850650641574e-05, - "loss": 2.3268, - "step": 326710 - }, - { - "epoch": 0.57, - "learning_rate": 2.1511978710714748e-05, - "loss": 2.4256, - "step": 326720 - }, - { - "epoch": 0.57, - "learning_rate": 2.151110677078792e-05, - "loss": 2.2929, - "step": 326730 - }, - { - "epoch": 0.57, - "learning_rate": 2.1510234830861095e-05, - "loss": 2.3042, - "step": 326740 - }, - { - "epoch": 0.57, - "learning_rate": 2.150936289093427e-05, - "loss": 2.3999, - "step": 326750 - }, - { - "epoch": 0.57, - "learning_rate": 2.150849095100744e-05, - "loss": 2.3663, - "step": 326760 - }, - { - "epoch": 0.57, - "learning_rate": 2.1507619011080613e-05, - "loss": 2.3489, - "step": 326770 - }, - { - "epoch": 0.57, - "learning_rate": 2.1506747071153787e-05, - "loss": 2.3435, - "step": 326780 - }, - { - "epoch": 0.57, - "learning_rate": 2.150587513122696e-05, - "loss": 2.3479, - "step": 326790 - }, - { - "epoch": 0.57, - "learning_rate": 2.150500319130013e-05, - "loss": 2.3475, - "step": 326800 - }, - { - "epoch": 0.57, - "learning_rate": 2.1504131251373305e-05, - "loss": 2.3838, - "step": 326810 - }, - { - "epoch": 0.57, - "learning_rate": 2.1503259311446482e-05, - "loss": 2.4594, - "step": 326820 - }, - { - "epoch": 0.57, - "learning_rate": 2.1502387371519652e-05, - "loss": 2.3684, - "step": 326830 - }, - { - "epoch": 0.57, - "learning_rate": 2.1501515431592826e-05, - "loss": 2.306, - "step": 326840 - }, - { - "epoch": 0.57, - "learning_rate": 2.1500643491666e-05, - "loss": 2.3087, - "step": 326850 - }, - { - "epoch": 0.57, - "learning_rate": 2.1499771551739174e-05, - "loss": 2.3907, - "step": 326860 - }, - { - "epoch": 0.57, - "learning_rate": 2.1498899611812344e-05, - "loss": 2.2955, - "step": 326870 - }, - { - "epoch": 0.57, - "learning_rate": 2.1498027671885518e-05, - "loss": 2.2617, - "step": 326880 - }, - { - "epoch": 0.57, - "learning_rate": 2.149715573195869e-05, - "loss": 2.3548, - "step": 326890 - }, - { - "epoch": 0.57, - "learning_rate": 2.1496283792031865e-05, - "loss": 2.3454, - "step": 326900 - }, - { - "epoch": 0.57, - "learning_rate": 2.149541185210504e-05, - "loss": 2.3429, - "step": 326910 - }, - { - "epoch": 0.57, - "learning_rate": 2.149453991217821e-05, - "loss": 2.2985, - "step": 326920 - }, - { - "epoch": 0.57, - "learning_rate": 2.1493667972251387e-05, - "loss": 2.2237, - "step": 326930 - }, - { - "epoch": 0.57, - "learning_rate": 2.1492796032324557e-05, - "loss": 2.327, - "step": 326940 - }, - { - "epoch": 0.57, - "learning_rate": 2.149192409239773e-05, - "loss": 2.3252, - "step": 326950 - }, - { - "epoch": 0.57, - "learning_rate": 2.1491052152470905e-05, - "loss": 2.2553, - "step": 326960 - }, - { - "epoch": 0.57, - "learning_rate": 2.149018021254408e-05, - "loss": 2.4013, - "step": 326970 - }, - { - "epoch": 0.57, - "learning_rate": 2.1489308272617252e-05, - "loss": 2.3083, - "step": 326980 - }, - { - "epoch": 0.57, - "learning_rate": 2.1488436332690423e-05, - "loss": 2.3641, - "step": 326990 - }, - { - "epoch": 0.57, - "learning_rate": 2.14875643927636e-05, - "loss": 2.3702, - "step": 327000 - }, - { - "epoch": 0.57, - "learning_rate": 2.148669245283677e-05, - "loss": 2.3475, - "step": 327010 - }, - { - "epoch": 0.57, - "learning_rate": 2.1485820512909944e-05, - "loss": 2.3408, - "step": 327020 - }, - { - "epoch": 0.57, - "learning_rate": 2.1484948572983114e-05, - "loss": 2.3768, - "step": 327030 - }, - { - "epoch": 0.57, - "learning_rate": 2.148407663305629e-05, - "loss": 2.4606, - "step": 327040 - }, - { - "epoch": 0.57, - "learning_rate": 2.1483204693129462e-05, - "loss": 2.463, - "step": 327050 - }, - { - "epoch": 0.57, - "learning_rate": 2.1482332753202636e-05, - "loss": 2.3149, - "step": 327060 - }, - { - "epoch": 0.57, - "learning_rate": 2.148146081327581e-05, - "loss": 2.3492, - "step": 327070 - }, - { - "epoch": 0.57, - "learning_rate": 2.1480588873348983e-05, - "loss": 2.474, - "step": 327080 - }, - { - "epoch": 0.57, - "learning_rate": 2.1479716933422157e-05, - "loss": 2.3645, - "step": 327090 - }, - { - "epoch": 0.57, - "learning_rate": 2.1478844993495327e-05, - "loss": 2.3679, - "step": 327100 - }, - { - "epoch": 0.57, - "learning_rate": 2.1477973053568504e-05, - "loss": 2.3641, - "step": 327110 - }, - { - "epoch": 0.57, - "learning_rate": 2.1477101113641675e-05, - "loss": 2.3958, - "step": 327120 - }, - { - "epoch": 0.57, - "learning_rate": 2.147622917371485e-05, - "loss": 2.453, - "step": 327130 - }, - { - "epoch": 0.57, - "learning_rate": 2.1475357233788022e-05, - "loss": 2.3317, - "step": 327140 - }, - { - "epoch": 0.57, - "learning_rate": 2.1474485293861196e-05, - "loss": 2.2838, - "step": 327150 - }, - { - "epoch": 0.57, - "learning_rate": 2.147361335393437e-05, - "loss": 2.4008, - "step": 327160 - }, - { - "epoch": 0.57, - "learning_rate": 2.147274141400754e-05, - "loss": 2.2806, - "step": 327170 - }, - { - "epoch": 0.57, - "learning_rate": 2.1471869474080714e-05, - "loss": 2.3475, - "step": 327180 - }, - { - "epoch": 0.57, - "learning_rate": 2.1470997534153888e-05, - "loss": 2.3151, - "step": 327190 - }, - { - "epoch": 0.57, - "learning_rate": 2.147012559422706e-05, - "loss": 2.3756, - "step": 327200 - }, - { - "epoch": 0.57, - "learning_rate": 2.1469253654300235e-05, - "loss": 2.4463, - "step": 327210 - }, - { - "epoch": 0.57, - "learning_rate": 2.1468381714373406e-05, - "loss": 2.272, - "step": 327220 - }, - { - "epoch": 0.57, - "learning_rate": 2.1467509774446583e-05, - "loss": 2.4778, - "step": 327230 - }, - { - "epoch": 0.57, - "learning_rate": 2.1466637834519753e-05, - "loss": 2.3386, - "step": 327240 - }, - { - "epoch": 0.57, - "learning_rate": 2.1465765894592927e-05, - "loss": 2.3076, - "step": 327250 - }, - { - "epoch": 0.57, - "learning_rate": 2.14648939546661e-05, - "loss": 2.2943, - "step": 327260 - }, - { - "epoch": 0.57, - "learning_rate": 2.1464022014739275e-05, - "loss": 2.2784, - "step": 327270 - }, - { - "epoch": 0.57, - "learning_rate": 2.1463150074812445e-05, - "loss": 2.2831, - "step": 327280 - }, - { - "epoch": 0.57, - "learning_rate": 2.146227813488562e-05, - "loss": 2.454, - "step": 327290 - }, - { - "epoch": 0.57, - "learning_rate": 2.1461406194958792e-05, - "loss": 2.2842, - "step": 327300 - }, - { - "epoch": 0.57, - "learning_rate": 2.1460534255031966e-05, - "loss": 2.3019, - "step": 327310 - }, - { - "epoch": 0.57, - "learning_rate": 2.145966231510514e-05, - "loss": 2.3023, - "step": 327320 - }, - { - "epoch": 0.57, - "learning_rate": 2.145879037517831e-05, - "loss": 2.3825, - "step": 327330 - }, - { - "epoch": 0.57, - "learning_rate": 2.1457918435251488e-05, - "loss": 2.3717, - "step": 327340 - }, - { - "epoch": 0.57, - "learning_rate": 2.1457046495324658e-05, - "loss": 2.3264, - "step": 327350 - }, - { - "epoch": 0.57, - "learning_rate": 2.145617455539783e-05, - "loss": 2.3209, - "step": 327360 - }, - { - "epoch": 0.57, - "learning_rate": 2.1455302615471005e-05, - "loss": 2.3175, - "step": 327370 - }, - { - "epoch": 0.57, - "learning_rate": 2.145443067554418e-05, - "loss": 2.271, - "step": 327380 - }, - { - "epoch": 0.57, - "learning_rate": 2.1453558735617353e-05, - "loss": 2.3185, - "step": 327390 - }, - { - "epoch": 0.57, - "learning_rate": 2.1452686795690523e-05, - "loss": 2.4233, - "step": 327400 - }, - { - "epoch": 0.57, - "learning_rate": 2.14518148557637e-05, - "loss": 2.2855, - "step": 327410 - }, - { - "epoch": 0.57, - "learning_rate": 2.145094291583687e-05, - "loss": 2.2325, - "step": 327420 - }, - { - "epoch": 0.57, - "learning_rate": 2.1450070975910045e-05, - "loss": 2.4644, - "step": 327430 - }, - { - "epoch": 0.57, - "learning_rate": 2.144919903598322e-05, - "loss": 2.3165, - "step": 327440 - }, - { - "epoch": 0.57, - "learning_rate": 2.1448327096056392e-05, - "loss": 2.3589, - "step": 327450 - }, - { - "epoch": 0.57, - "learning_rate": 2.1447455156129566e-05, - "loss": 2.3508, - "step": 327460 - }, - { - "epoch": 0.57, - "learning_rate": 2.1446583216202736e-05, - "loss": 2.2455, - "step": 327470 - }, - { - "epoch": 0.57, - "learning_rate": 2.144571127627591e-05, - "loss": 2.3703, - "step": 327480 - }, - { - "epoch": 0.57, - "learning_rate": 2.1444839336349084e-05, - "loss": 2.3294, - "step": 327490 - }, - { - "epoch": 0.57, - "learning_rate": 2.1443967396422258e-05, - "loss": 2.4329, - "step": 327500 - }, - { - "epoch": 0.57, - "learning_rate": 2.1443095456495428e-05, - "loss": 2.2805, - "step": 327510 - }, - { - "epoch": 0.57, - "learning_rate": 2.1442223516568605e-05, - "loss": 2.32, - "step": 327520 - }, - { - "epoch": 0.57, - "learning_rate": 2.1441351576641776e-05, - "loss": 2.4105, - "step": 327530 - }, - { - "epoch": 0.57, - "learning_rate": 2.144047963671495e-05, - "loss": 2.2387, - "step": 327540 - }, - { - "epoch": 0.57, - "learning_rate": 2.1439607696788123e-05, - "loss": 2.3219, - "step": 327550 - }, - { - "epoch": 0.57, - "learning_rate": 2.1438735756861297e-05, - "loss": 2.1798, - "step": 327560 - }, - { - "epoch": 0.57, - "learning_rate": 2.143786381693447e-05, - "loss": 2.2723, - "step": 327570 - }, - { - "epoch": 0.57, - "learning_rate": 2.143699187700764e-05, - "loss": 2.4521, - "step": 327580 - }, - { - "epoch": 0.57, - "learning_rate": 2.1436119937080815e-05, - "loss": 2.3545, - "step": 327590 - }, - { - "epoch": 0.57, - "learning_rate": 2.143524799715399e-05, - "loss": 2.3818, - "step": 327600 - }, - { - "epoch": 0.57, - "learning_rate": 2.1434376057227162e-05, - "loss": 2.2901, - "step": 327610 - }, - { - "epoch": 0.57, - "learning_rate": 2.1433504117300336e-05, - "loss": 2.305, - "step": 327620 - }, - { - "epoch": 0.57, - "learning_rate": 2.143263217737351e-05, - "loss": 2.4237, - "step": 327630 - }, - { - "epoch": 0.57, - "learning_rate": 2.1431760237446684e-05, - "loss": 2.5445, - "step": 327640 - }, - { - "epoch": 0.57, - "learning_rate": 2.1430888297519854e-05, - "loss": 2.35, - "step": 327650 - }, - { - "epoch": 0.57, - "learning_rate": 2.1430016357593028e-05, - "loss": 2.4051, - "step": 327660 - }, - { - "epoch": 0.57, - "learning_rate": 2.14291444176662e-05, - "loss": 2.3122, - "step": 327670 - }, - { - "epoch": 0.57, - "learning_rate": 2.1428272477739375e-05, - "loss": 2.35, - "step": 327680 - }, - { - "epoch": 0.57, - "learning_rate": 2.142740053781255e-05, - "loss": 2.4346, - "step": 327690 - }, - { - "epoch": 0.57, - "learning_rate": 2.142652859788572e-05, - "loss": 2.3262, - "step": 327700 - }, - { - "epoch": 0.57, - "learning_rate": 2.1425656657958897e-05, - "loss": 2.3752, - "step": 327710 - }, - { - "epoch": 0.57, - "learning_rate": 2.1424784718032067e-05, - "loss": 2.4151, - "step": 327720 - }, - { - "epoch": 0.57, - "learning_rate": 2.142391277810524e-05, - "loss": 2.2872, - "step": 327730 - }, - { - "epoch": 0.57, - "learning_rate": 2.142304083817841e-05, - "loss": 2.3854, - "step": 327740 - }, - { - "epoch": 0.57, - "learning_rate": 2.142216889825159e-05, - "loss": 2.3676, - "step": 327750 - }, - { - "epoch": 0.57, - "learning_rate": 2.142129695832476e-05, - "loss": 2.3139, - "step": 327760 - }, - { - "epoch": 0.57, - "learning_rate": 2.1420425018397933e-05, - "loss": 2.3384, - "step": 327770 - }, - { - "epoch": 0.57, - "learning_rate": 2.1419553078471106e-05, - "loss": 2.3929, - "step": 327780 - }, - { - "epoch": 0.57, - "learning_rate": 2.141868113854428e-05, - "loss": 2.3269, - "step": 327790 - }, - { - "epoch": 0.57, - "learning_rate": 2.1417809198617454e-05, - "loss": 2.4078, - "step": 327800 - }, - { - "epoch": 0.57, - "learning_rate": 2.1416937258690624e-05, - "loss": 2.3863, - "step": 327810 - }, - { - "epoch": 0.57, - "learning_rate": 2.14160653187638e-05, - "loss": 2.4324, - "step": 327820 - }, - { - "epoch": 0.57, - "learning_rate": 2.1415193378836972e-05, - "loss": 2.4023, - "step": 327830 - }, - { - "epoch": 0.57, - "learning_rate": 2.1414321438910146e-05, - "loss": 2.2086, - "step": 327840 - }, - { - "epoch": 0.57, - "learning_rate": 2.141344949898332e-05, - "loss": 2.3583, - "step": 327850 - }, - { - "epoch": 0.57, - "learning_rate": 2.1412577559056493e-05, - "loss": 2.3224, - "step": 327860 - }, - { - "epoch": 0.57, - "learning_rate": 2.1411705619129667e-05, - "loss": 2.3866, - "step": 327870 - }, - { - "epoch": 0.57, - "learning_rate": 2.1410833679202837e-05, - "loss": 2.3909, - "step": 327880 - }, - { - "epoch": 0.57, - "learning_rate": 2.1409961739276014e-05, - "loss": 2.3816, - "step": 327890 - }, - { - "epoch": 0.57, - "learning_rate": 2.1409089799349185e-05, - "loss": 2.2544, - "step": 327900 - }, - { - "epoch": 0.57, - "learning_rate": 2.140821785942236e-05, - "loss": 2.4825, - "step": 327910 - }, - { - "epoch": 0.57, - "learning_rate": 2.140734591949553e-05, - "loss": 2.3419, - "step": 327920 - }, - { - "epoch": 0.57, - "learning_rate": 2.1406473979568706e-05, - "loss": 2.3872, - "step": 327930 - }, - { - "epoch": 0.57, - "learning_rate": 2.140560203964188e-05, - "loss": 2.3063, - "step": 327940 - }, - { - "epoch": 0.57, - "learning_rate": 2.140473009971505e-05, - "loss": 2.3405, - "step": 327950 - }, - { - "epoch": 0.57, - "learning_rate": 2.1403858159788224e-05, - "loss": 2.3659, - "step": 327960 - }, - { - "epoch": 0.57, - "learning_rate": 2.1402986219861398e-05, - "loss": 2.3508, - "step": 327970 - }, - { - "epoch": 0.57, - "learning_rate": 2.140211427993457e-05, - "loss": 2.3269, - "step": 327980 - }, - { - "epoch": 0.57, - "learning_rate": 2.1401242340007742e-05, - "loss": 2.3684, - "step": 327990 - }, - { - "epoch": 0.57, - "learning_rate": 2.1400370400080916e-05, - "loss": 2.3539, - "step": 328000 - }, - { - "epoch": 0.57, - "learning_rate": 2.139949846015409e-05, - "loss": 2.2274, - "step": 328010 - }, - { - "epoch": 0.57, - "learning_rate": 2.1398626520227263e-05, - "loss": 2.2791, - "step": 328020 - }, - { - "epoch": 0.57, - "learning_rate": 2.1397754580300437e-05, - "loss": 2.3037, - "step": 328030 - }, - { - "epoch": 0.57, - "learning_rate": 2.139688264037361e-05, - "loss": 2.3632, - "step": 328040 - }, - { - "epoch": 0.57, - "learning_rate": 2.1396010700446785e-05, - "loss": 2.3904, - "step": 328050 - }, - { - "epoch": 0.57, - "learning_rate": 2.1395138760519955e-05, - "loss": 2.3803, - "step": 328060 - }, - { - "epoch": 0.57, - "learning_rate": 2.139426682059313e-05, - "loss": 2.3881, - "step": 328070 - }, - { - "epoch": 0.57, - "learning_rate": 2.1393394880666302e-05, - "loss": 2.254, - "step": 328080 - }, - { - "epoch": 0.57, - "learning_rate": 2.1392522940739476e-05, - "loss": 2.2945, - "step": 328090 - }, - { - "epoch": 0.57, - "learning_rate": 2.139165100081265e-05, - "loss": 2.3379, - "step": 328100 - }, - { - "epoch": 0.57, - "learning_rate": 2.139077906088582e-05, - "loss": 2.366, - "step": 328110 - }, - { - "epoch": 0.57, - "learning_rate": 2.1389907120958998e-05, - "loss": 2.3762, - "step": 328120 - }, - { - "epoch": 0.57, - "learning_rate": 2.1389035181032168e-05, - "loss": 2.2291, - "step": 328130 - }, - { - "epoch": 0.57, - "learning_rate": 2.138816324110534e-05, - "loss": 2.3523, - "step": 328140 - }, - { - "epoch": 0.57, - "learning_rate": 2.1387291301178512e-05, - "loss": 2.081, - "step": 328150 - }, - { - "epoch": 0.57, - "learning_rate": 2.138641936125169e-05, - "loss": 2.3711, - "step": 328160 - }, - { - "epoch": 0.57, - "learning_rate": 2.1385547421324863e-05, - "loss": 2.3999, - "step": 328170 - }, - { - "epoch": 0.57, - "learning_rate": 2.1384675481398033e-05, - "loss": 2.2494, - "step": 328180 - }, - { - "epoch": 0.57, - "learning_rate": 2.138380354147121e-05, - "loss": 2.4211, - "step": 328190 - }, - { - "epoch": 0.57, - "learning_rate": 2.138293160154438e-05, - "loss": 2.3655, - "step": 328200 - }, - { - "epoch": 0.57, - "learning_rate": 2.1382059661617555e-05, - "loss": 2.2782, - "step": 328210 - }, - { - "epoch": 0.57, - "learning_rate": 2.1381187721690725e-05, - "loss": 2.3465, - "step": 328220 - }, - { - "epoch": 0.57, - "learning_rate": 2.1380315781763902e-05, - "loss": 2.3429, - "step": 328230 - }, - { - "epoch": 0.57, - "learning_rate": 2.1379443841837073e-05, - "loss": 2.295, - "step": 328240 - }, - { - "epoch": 0.57, - "learning_rate": 2.1378571901910246e-05, - "loss": 2.3057, - "step": 328250 - }, - { - "epoch": 0.57, - "learning_rate": 2.137769996198342e-05, - "loss": 2.2015, - "step": 328260 - }, - { - "epoch": 0.57, - "learning_rate": 2.1376828022056594e-05, - "loss": 2.2464, - "step": 328270 - }, - { - "epoch": 0.57, - "learning_rate": 2.1375956082129768e-05, - "loss": 2.3169, - "step": 328280 - }, - { - "epoch": 0.57, - "learning_rate": 2.1375084142202938e-05, - "loss": 2.4221, - "step": 328290 - }, - { - "epoch": 0.57, - "learning_rate": 2.1374212202276115e-05, - "loss": 2.4354, - "step": 328300 - }, - { - "epoch": 0.57, - "learning_rate": 2.1373340262349286e-05, - "loss": 2.2398, - "step": 328310 - }, - { - "epoch": 0.57, - "learning_rate": 2.137246832242246e-05, - "loss": 2.4312, - "step": 328320 - }, - { - "epoch": 0.57, - "learning_rate": 2.1371596382495633e-05, - "loss": 2.2961, - "step": 328330 - }, - { - "epoch": 0.57, - "learning_rate": 2.1370724442568807e-05, - "loss": 2.2918, - "step": 328340 - }, - { - "epoch": 0.57, - "learning_rate": 2.136985250264198e-05, - "loss": 2.4436, - "step": 328350 - }, - { - "epoch": 0.57, - "learning_rate": 2.136898056271515e-05, - "loss": 2.4402, - "step": 328360 - }, - { - "epoch": 0.57, - "learning_rate": 2.1368108622788325e-05, - "loss": 2.3225, - "step": 328370 - }, - { - "epoch": 0.57, - "learning_rate": 2.13672366828615e-05, - "loss": 2.2788, - "step": 328380 - }, - { - "epoch": 0.57, - "learning_rate": 2.1366364742934672e-05, - "loss": 2.3212, - "step": 328390 - }, - { - "epoch": 0.57, - "learning_rate": 2.1365492803007843e-05, - "loss": 2.3857, - "step": 328400 - }, - { - "epoch": 0.57, - "learning_rate": 2.1364620863081017e-05, - "loss": 2.3924, - "step": 328410 - }, - { - "epoch": 0.57, - "learning_rate": 2.1363748923154194e-05, - "loss": 2.3875, - "step": 328420 - }, - { - "epoch": 0.57, - "learning_rate": 2.1362876983227364e-05, - "loss": 2.3231, - "step": 328430 - }, - { - "epoch": 0.57, - "learning_rate": 2.1362005043300538e-05, - "loss": 2.27, - "step": 328440 - }, - { - "epoch": 0.57, - "learning_rate": 2.136113310337371e-05, - "loss": 2.3472, - "step": 328450 - }, - { - "epoch": 0.57, - "learning_rate": 2.1360261163446885e-05, - "loss": 2.3403, - "step": 328460 - }, - { - "epoch": 0.57, - "learning_rate": 2.1359389223520056e-05, - "loss": 2.4451, - "step": 328470 - }, - { - "epoch": 0.57, - "learning_rate": 2.135851728359323e-05, - "loss": 2.232, - "step": 328480 - }, - { - "epoch": 0.57, - "learning_rate": 2.1357645343666403e-05, - "loss": 2.2502, - "step": 328490 - }, - { - "epoch": 0.57, - "learning_rate": 2.1356773403739577e-05, - "loss": 2.3266, - "step": 328500 - }, - { - "epoch": 0.57, - "learning_rate": 2.135590146381275e-05, - "loss": 2.3468, - "step": 328510 - }, - { - "epoch": 0.57, - "learning_rate": 2.135502952388592e-05, - "loss": 2.1999, - "step": 328520 - }, - { - "epoch": 0.57, - "learning_rate": 2.13541575839591e-05, - "loss": 2.3668, - "step": 328530 - }, - { - "epoch": 0.57, - "learning_rate": 2.135328564403227e-05, - "loss": 2.1818, - "step": 328540 - }, - { - "epoch": 0.57, - "learning_rate": 2.1352413704105443e-05, - "loss": 2.3175, - "step": 328550 - }, - { - "epoch": 0.57, - "learning_rate": 2.1351541764178616e-05, - "loss": 2.2502, - "step": 328560 - }, - { - "epoch": 0.57, - "learning_rate": 2.135066982425179e-05, - "loss": 2.3764, - "step": 328570 - }, - { - "epoch": 0.57, - "learning_rate": 2.1349797884324964e-05, - "loss": 2.2589, - "step": 328580 - }, - { - "epoch": 0.57, - "learning_rate": 2.1348925944398134e-05, - "loss": 2.3606, - "step": 328590 - }, - { - "epoch": 0.57, - "learning_rate": 2.134805400447131e-05, - "loss": 2.2838, - "step": 328600 - }, - { - "epoch": 0.57, - "learning_rate": 2.1347182064544482e-05, - "loss": 2.3272, - "step": 328610 - }, - { - "epoch": 0.57, - "learning_rate": 2.1346310124617656e-05, - "loss": 2.2869, - "step": 328620 - }, - { - "epoch": 0.57, - "learning_rate": 2.1345438184690826e-05, - "loss": 2.2257, - "step": 328630 - }, - { - "epoch": 0.57, - "learning_rate": 2.1344566244764003e-05, - "loss": 2.4818, - "step": 328640 - }, - { - "epoch": 0.57, - "learning_rate": 2.1343694304837173e-05, - "loss": 2.4055, - "step": 328650 - }, - { - "epoch": 0.57, - "learning_rate": 2.1342822364910347e-05, - "loss": 2.4423, - "step": 328660 - }, - { - "epoch": 0.57, - "learning_rate": 2.134195042498352e-05, - "loss": 2.3457, - "step": 328670 - }, - { - "epoch": 0.57, - "learning_rate": 2.1341078485056695e-05, - "loss": 2.3978, - "step": 328680 - }, - { - "epoch": 0.57, - "learning_rate": 2.134020654512987e-05, - "loss": 2.3706, - "step": 328690 - }, - { - "epoch": 0.57, - "learning_rate": 2.133933460520304e-05, - "loss": 2.4158, - "step": 328700 - }, - { - "epoch": 0.57, - "learning_rate": 2.1338462665276216e-05, - "loss": 2.3133, - "step": 328710 - }, - { - "epoch": 0.57, - "learning_rate": 2.1337590725349386e-05, - "loss": 2.1928, - "step": 328720 - }, - { - "epoch": 0.57, - "learning_rate": 2.133671878542256e-05, - "loss": 2.3976, - "step": 328730 - }, - { - "epoch": 0.57, - "learning_rate": 2.1335846845495734e-05, - "loss": 2.345, - "step": 328740 - }, - { - "epoch": 0.57, - "learning_rate": 2.1334974905568908e-05, - "loss": 2.315, - "step": 328750 - }, - { - "epoch": 0.57, - "learning_rate": 2.133410296564208e-05, - "loss": 2.3643, - "step": 328760 - }, - { - "epoch": 0.57, - "learning_rate": 2.1333231025715252e-05, - "loss": 2.3634, - "step": 328770 - }, - { - "epoch": 0.57, - "learning_rate": 2.1332359085788426e-05, - "loss": 2.3367, - "step": 328780 - }, - { - "epoch": 0.57, - "learning_rate": 2.13314871458616e-05, - "loss": 2.3519, - "step": 328790 - }, - { - "epoch": 0.57, - "learning_rate": 2.1330615205934773e-05, - "loss": 2.3727, - "step": 328800 - }, - { - "epoch": 0.57, - "learning_rate": 2.1329743266007947e-05, - "loss": 2.3349, - "step": 328810 - }, - { - "epoch": 0.57, - "learning_rate": 2.132887132608112e-05, - "loss": 2.3909, - "step": 328820 - }, - { - "epoch": 0.57, - "learning_rate": 2.1327999386154295e-05, - "loss": 2.3312, - "step": 328830 - }, - { - "epoch": 0.57, - "learning_rate": 2.1327127446227465e-05, - "loss": 2.4762, - "step": 328840 - }, - { - "epoch": 0.57, - "learning_rate": 2.132625550630064e-05, - "loss": 2.3606, - "step": 328850 - }, - { - "epoch": 0.57, - "learning_rate": 2.1325383566373812e-05, - "loss": 2.4225, - "step": 328860 - }, - { - "epoch": 0.57, - "learning_rate": 2.1324511626446986e-05, - "loss": 2.4058, - "step": 328870 - }, - { - "epoch": 0.57, - "learning_rate": 2.1323639686520157e-05, - "loss": 2.3966, - "step": 328880 - }, - { - "epoch": 0.57, - "learning_rate": 2.132276774659333e-05, - "loss": 2.4173, - "step": 328890 - }, - { - "epoch": 0.57, - "learning_rate": 2.1321895806666508e-05, - "loss": 2.349, - "step": 328900 - }, - { - "epoch": 0.57, - "learning_rate": 2.1321023866739678e-05, - "loss": 2.4596, - "step": 328910 - }, - { - "epoch": 0.57, - "learning_rate": 2.132015192681285e-05, - "loss": 2.3013, - "step": 328920 - }, - { - "epoch": 0.57, - "learning_rate": 2.1319279986886022e-05, - "loss": 2.3932, - "step": 328930 - }, - { - "epoch": 0.57, - "learning_rate": 2.13184080469592e-05, - "loss": 2.2759, - "step": 328940 - }, - { - "epoch": 0.57, - "learning_rate": 2.131753610703237e-05, - "loss": 2.3308, - "step": 328950 - }, - { - "epoch": 0.57, - "learning_rate": 2.1316664167105543e-05, - "loss": 2.4877, - "step": 328960 - }, - { - "epoch": 0.57, - "learning_rate": 2.1315792227178717e-05, - "loss": 2.3771, - "step": 328970 - }, - { - "epoch": 0.57, - "learning_rate": 2.131492028725189e-05, - "loss": 2.2641, - "step": 328980 - }, - { - "epoch": 0.57, - "learning_rate": 2.1314048347325065e-05, - "loss": 2.3867, - "step": 328990 - }, - { - "epoch": 0.57, - "learning_rate": 2.1313176407398235e-05, - "loss": 2.3376, - "step": 329000 - }, - { - "epoch": 0.57, - "learning_rate": 2.1312304467471412e-05, - "loss": 2.4304, - "step": 329010 - }, - { - "epoch": 0.57, - "learning_rate": 2.1311432527544583e-05, - "loss": 2.378, - "step": 329020 - }, - { - "epoch": 0.57, - "learning_rate": 2.1310560587617756e-05, - "loss": 2.325, - "step": 329030 - }, - { - "epoch": 0.57, - "learning_rate": 2.130968864769093e-05, - "loss": 2.3993, - "step": 329040 - }, - { - "epoch": 0.57, - "learning_rate": 2.1308816707764104e-05, - "loss": 2.3161, - "step": 329050 - }, - { - "epoch": 0.57, - "learning_rate": 2.1307944767837278e-05, - "loss": 2.3042, - "step": 329060 - }, - { - "epoch": 0.57, - "learning_rate": 2.1307072827910448e-05, - "loss": 2.3846, - "step": 329070 - }, - { - "epoch": 0.57, - "learning_rate": 2.1306200887983622e-05, - "loss": 2.3439, - "step": 329080 - }, - { - "epoch": 0.57, - "learning_rate": 2.1305328948056796e-05, - "loss": 2.3712, - "step": 329090 - }, - { - "epoch": 0.57, - "learning_rate": 2.130445700812997e-05, - "loss": 2.1971, - "step": 329100 - }, - { - "epoch": 0.57, - "learning_rate": 2.130358506820314e-05, - "loss": 2.4055, - "step": 329110 - }, - { - "epoch": 0.57, - "learning_rate": 2.1302713128276317e-05, - "loss": 2.3831, - "step": 329120 - }, - { - "epoch": 0.57, - "learning_rate": 2.1301841188349487e-05, - "loss": 2.3508, - "step": 329130 - }, - { - "epoch": 0.57, - "learning_rate": 2.130096924842266e-05, - "loss": 2.3286, - "step": 329140 - }, - { - "epoch": 0.57, - "learning_rate": 2.1300097308495835e-05, - "loss": 2.4273, - "step": 329150 - }, - { - "epoch": 0.57, - "learning_rate": 2.129922536856901e-05, - "loss": 2.3222, - "step": 329160 - }, - { - "epoch": 0.57, - "learning_rate": 2.1298353428642182e-05, - "loss": 2.3167, - "step": 329170 - }, - { - "epoch": 0.57, - "learning_rate": 2.1297481488715353e-05, - "loss": 2.3656, - "step": 329180 - }, - { - "epoch": 0.57, - "learning_rate": 2.1296609548788527e-05, - "loss": 2.38, - "step": 329190 - }, - { - "epoch": 0.57, - "learning_rate": 2.12957376088617e-05, - "loss": 2.3599, - "step": 329200 - }, - { - "epoch": 0.57, - "learning_rate": 2.1294865668934874e-05, - "loss": 2.4016, - "step": 329210 - }, - { - "epoch": 0.57, - "learning_rate": 2.1293993729008048e-05, - "loss": 2.2686, - "step": 329220 - }, - { - "epoch": 0.57, - "learning_rate": 2.129312178908122e-05, - "loss": 2.4104, - "step": 329230 - }, - { - "epoch": 0.57, - "learning_rate": 2.1292249849154395e-05, - "loss": 2.3262, - "step": 329240 - }, - { - "epoch": 0.57, - "learning_rate": 2.1291377909227566e-05, - "loss": 2.3009, - "step": 329250 - }, - { - "epoch": 0.57, - "learning_rate": 2.129050596930074e-05, - "loss": 2.2622, - "step": 329260 - }, - { - "epoch": 0.57, - "learning_rate": 2.1289634029373913e-05, - "loss": 2.3216, - "step": 329270 - }, - { - "epoch": 0.57, - "learning_rate": 2.1288762089447087e-05, - "loss": 2.3128, - "step": 329280 - }, - { - "epoch": 0.57, - "learning_rate": 2.128789014952026e-05, - "loss": 2.3718, - "step": 329290 - }, - { - "epoch": 0.57, - "learning_rate": 2.128701820959343e-05, - "loss": 2.3608, - "step": 329300 - }, - { - "epoch": 0.57, - "learning_rate": 2.128614626966661e-05, - "loss": 2.2428, - "step": 329310 - }, - { - "epoch": 0.57, - "learning_rate": 2.128527432973978e-05, - "loss": 2.3497, - "step": 329320 - }, - { - "epoch": 0.57, - "learning_rate": 2.1284402389812953e-05, - "loss": 2.298, - "step": 329330 - }, - { - "epoch": 0.57, - "learning_rate": 2.1283530449886123e-05, - "loss": 2.4022, - "step": 329340 - }, - { - "epoch": 0.57, - "learning_rate": 2.12826585099593e-05, - "loss": 2.2927, - "step": 329350 - }, - { - "epoch": 0.57, - "learning_rate": 2.128178657003247e-05, - "loss": 2.2517, - "step": 329360 - }, - { - "epoch": 0.57, - "learning_rate": 2.1280914630105644e-05, - "loss": 2.356, - "step": 329370 - }, - { - "epoch": 0.57, - "learning_rate": 2.1280042690178818e-05, - "loss": 2.3369, - "step": 329380 - }, - { - "epoch": 0.57, - "learning_rate": 2.1279170750251992e-05, - "loss": 2.2344, - "step": 329390 - }, - { - "epoch": 0.57, - "learning_rate": 2.1278298810325166e-05, - "loss": 2.2487, - "step": 329400 - }, - { - "epoch": 0.57, - "learning_rate": 2.1277426870398336e-05, - "loss": 2.3097, - "step": 329410 - }, - { - "epoch": 0.57, - "learning_rate": 2.1276554930471513e-05, - "loss": 2.3492, - "step": 329420 - }, - { - "epoch": 0.57, - "learning_rate": 2.1275682990544683e-05, - "loss": 2.3838, - "step": 329430 - }, - { - "epoch": 0.57, - "learning_rate": 2.1274811050617857e-05, - "loss": 2.3083, - "step": 329440 - }, - { - "epoch": 0.57, - "learning_rate": 2.127393911069103e-05, - "loss": 2.2925, - "step": 329450 - }, - { - "epoch": 0.57, - "learning_rate": 2.1273067170764205e-05, - "loss": 2.3671, - "step": 329460 - }, - { - "epoch": 0.57, - "learning_rate": 2.127219523083738e-05, - "loss": 2.3193, - "step": 329470 - }, - { - "epoch": 0.57, - "learning_rate": 2.127132329091055e-05, - "loss": 2.3383, - "step": 329480 - }, - { - "epoch": 0.57, - "learning_rate": 2.1270451350983726e-05, - "loss": 2.2417, - "step": 329490 - }, - { - "epoch": 0.57, - "learning_rate": 2.1269579411056896e-05, - "loss": 2.255, - "step": 329500 - }, - { - "epoch": 0.57, - "learning_rate": 2.126870747113007e-05, - "loss": 2.2875, - "step": 329510 - }, - { - "epoch": 0.57, - "learning_rate": 2.1267835531203244e-05, - "loss": 2.4277, - "step": 329520 - }, - { - "epoch": 0.57, - "learning_rate": 2.1266963591276418e-05, - "loss": 2.4092, - "step": 329530 - }, - { - "epoch": 0.57, - "learning_rate": 2.126609165134959e-05, - "loss": 2.2331, - "step": 329540 - }, - { - "epoch": 0.57, - "learning_rate": 2.1265219711422762e-05, - "loss": 2.3071, - "step": 329550 - }, - { - "epoch": 0.57, - "learning_rate": 2.1264347771495936e-05, - "loss": 2.3641, - "step": 329560 - }, - { - "epoch": 0.57, - "learning_rate": 2.126347583156911e-05, - "loss": 2.3398, - "step": 329570 - }, - { - "epoch": 0.57, - "learning_rate": 2.1262603891642283e-05, - "loss": 2.297, - "step": 329580 - }, - { - "epoch": 0.57, - "learning_rate": 2.1261731951715454e-05, - "loss": 2.4432, - "step": 329590 - }, - { - "epoch": 0.57, - "learning_rate": 2.1260860011788627e-05, - "loss": 2.3338, - "step": 329600 - }, - { - "epoch": 0.57, - "learning_rate": 2.12599880718618e-05, - "loss": 2.4203, - "step": 329610 - }, - { - "epoch": 0.57, - "learning_rate": 2.1259116131934975e-05, - "loss": 2.3264, - "step": 329620 - }, - { - "epoch": 0.57, - "learning_rate": 2.125824419200815e-05, - "loss": 2.3684, - "step": 329630 - }, - { - "epoch": 0.57, - "learning_rate": 2.1257372252081322e-05, - "loss": 2.3326, - "step": 329640 - }, - { - "epoch": 0.57, - "learning_rate": 2.1256500312154496e-05, - "loss": 2.3373, - "step": 329650 - }, - { - "epoch": 0.57, - "learning_rate": 2.1255628372227667e-05, - "loss": 2.441, - "step": 329660 - }, - { - "epoch": 0.57, - "learning_rate": 2.125475643230084e-05, - "loss": 2.2139, - "step": 329670 - }, - { - "epoch": 0.57, - "learning_rate": 2.1253884492374014e-05, - "loss": 2.2938, - "step": 329680 - }, - { - "epoch": 0.57, - "learning_rate": 2.1253012552447188e-05, - "loss": 2.2921, - "step": 329690 - }, - { - "epoch": 0.57, - "learning_rate": 2.1252140612520362e-05, - "loss": 2.4018, - "step": 329700 - }, - { - "epoch": 0.57, - "learning_rate": 2.1251268672593532e-05, - "loss": 2.2944, - "step": 329710 - }, - { - "epoch": 0.57, - "learning_rate": 2.125039673266671e-05, - "loss": 2.3032, - "step": 329720 - }, - { - "epoch": 0.58, - "learning_rate": 2.124952479273988e-05, - "loss": 2.2442, - "step": 329730 - }, - { - "epoch": 0.58, - "learning_rate": 2.1248652852813053e-05, - "loss": 2.3446, - "step": 329740 - }, - { - "epoch": 0.58, - "learning_rate": 2.1247780912886227e-05, - "loss": 2.2293, - "step": 329750 - }, - { - "epoch": 0.58, - "learning_rate": 2.12469089729594e-05, - "loss": 2.3335, - "step": 329760 - }, - { - "epoch": 0.58, - "learning_rate": 2.1246037033032575e-05, - "loss": 2.273, - "step": 329770 - }, - { - "epoch": 0.58, - "learning_rate": 2.1245165093105745e-05, - "loss": 2.3094, - "step": 329780 - }, - { - "epoch": 0.58, - "learning_rate": 2.1244293153178922e-05, - "loss": 2.3919, - "step": 329790 - }, - { - "epoch": 0.58, - "learning_rate": 2.1243421213252093e-05, - "loss": 2.3365, - "step": 329800 - }, - { - "epoch": 0.58, - "learning_rate": 2.1242549273325266e-05, - "loss": 2.3275, - "step": 329810 - }, - { - "epoch": 0.58, - "learning_rate": 2.1241677333398437e-05, - "loss": 2.3214, - "step": 329820 - }, - { - "epoch": 0.58, - "learning_rate": 2.1240805393471614e-05, - "loss": 2.3668, - "step": 329830 - }, - { - "epoch": 0.58, - "learning_rate": 2.1239933453544784e-05, - "loss": 2.3831, - "step": 329840 - }, - { - "epoch": 0.58, - "learning_rate": 2.1239061513617958e-05, - "loss": 2.2958, - "step": 329850 - }, - { - "epoch": 0.58, - "learning_rate": 2.1238189573691132e-05, - "loss": 2.2502, - "step": 329860 - }, - { - "epoch": 0.58, - "learning_rate": 2.1237317633764306e-05, - "loss": 2.2139, - "step": 329870 - }, - { - "epoch": 0.58, - "learning_rate": 2.123644569383748e-05, - "loss": 2.2611, - "step": 329880 - }, - { - "epoch": 0.58, - "learning_rate": 2.123557375391065e-05, - "loss": 2.4451, - "step": 329890 - }, - { - "epoch": 0.58, - "learning_rate": 2.1234701813983827e-05, - "loss": 2.3835, - "step": 329900 - }, - { - "epoch": 0.58, - "learning_rate": 2.1233829874056997e-05, - "loss": 2.3874, - "step": 329910 - }, - { - "epoch": 0.58, - "learning_rate": 2.123295793413017e-05, - "loss": 2.3782, - "step": 329920 - }, - { - "epoch": 0.58, - "learning_rate": 2.1232085994203345e-05, - "loss": 2.2801, - "step": 329930 - }, - { - "epoch": 0.58, - "learning_rate": 2.123121405427652e-05, - "loss": 2.2719, - "step": 329940 - }, - { - "epoch": 0.58, - "learning_rate": 2.1230342114349692e-05, - "loss": 2.2854, - "step": 329950 - }, - { - "epoch": 0.58, - "learning_rate": 2.1229470174422863e-05, - "loss": 2.3691, - "step": 329960 - }, - { - "epoch": 0.58, - "learning_rate": 2.1228598234496037e-05, - "loss": 2.2255, - "step": 329970 - }, - { - "epoch": 0.58, - "learning_rate": 2.122772629456921e-05, - "loss": 2.3106, - "step": 329980 - }, - { - "epoch": 0.58, - "learning_rate": 2.1226854354642384e-05, - "loss": 2.2297, - "step": 329990 - }, - { - "epoch": 0.58, - "learning_rate": 2.1225982414715554e-05, - "loss": 2.3703, - "step": 330000 - }, - { - "epoch": 0.58, - "learning_rate": 2.1225110474788728e-05, - "loss": 2.338, - "step": 330010 - }, - { - "epoch": 0.58, - "learning_rate": 2.1224238534861905e-05, - "loss": 2.3234, - "step": 330020 - }, - { - "epoch": 0.58, - "learning_rate": 2.1223366594935076e-05, - "loss": 2.4078, - "step": 330030 - }, - { - "epoch": 0.58, - "learning_rate": 2.122249465500825e-05, - "loss": 2.3127, - "step": 330040 - }, - { - "epoch": 0.58, - "learning_rate": 2.1221622715081423e-05, - "loss": 2.2959, - "step": 330050 - }, - { - "epoch": 0.58, - "learning_rate": 2.1220750775154597e-05, - "loss": 2.3038, - "step": 330060 - }, - { - "epoch": 0.58, - "learning_rate": 2.1219878835227767e-05, - "loss": 2.2859, - "step": 330070 - }, - { - "epoch": 0.58, - "learning_rate": 2.121900689530094e-05, - "loss": 2.4298, - "step": 330080 - }, - { - "epoch": 0.58, - "learning_rate": 2.1218134955374115e-05, - "loss": 2.3114, - "step": 330090 - }, - { - "epoch": 0.58, - "learning_rate": 2.121726301544729e-05, - "loss": 2.4369, - "step": 330100 - }, - { - "epoch": 0.58, - "learning_rate": 2.1216391075520463e-05, - "loss": 2.3844, - "step": 330110 - }, - { - "epoch": 0.58, - "learning_rate": 2.1215519135593633e-05, - "loss": 2.2079, - "step": 330120 - }, - { - "epoch": 0.58, - "learning_rate": 2.121464719566681e-05, - "loss": 2.3452, - "step": 330130 - }, - { - "epoch": 0.58, - "learning_rate": 2.121377525573998e-05, - "loss": 2.3779, - "step": 330140 - }, - { - "epoch": 0.58, - "learning_rate": 2.1212903315813154e-05, - "loss": 2.3438, - "step": 330150 - }, - { - "epoch": 0.58, - "learning_rate": 2.1212031375886328e-05, - "loss": 2.345, - "step": 330160 - }, - { - "epoch": 0.58, - "learning_rate": 2.1211159435959502e-05, - "loss": 2.4659, - "step": 330170 - }, - { - "epoch": 0.58, - "learning_rate": 2.1210287496032676e-05, - "loss": 2.3256, - "step": 330180 - }, - { - "epoch": 0.58, - "learning_rate": 2.1209415556105846e-05, - "loss": 2.3762, - "step": 330190 - }, - { - "epoch": 0.58, - "learning_rate": 2.1208543616179023e-05, - "loss": 2.2225, - "step": 330200 - }, - { - "epoch": 0.58, - "learning_rate": 2.1207671676252193e-05, - "loss": 2.4192, - "step": 330210 - }, - { - "epoch": 0.58, - "learning_rate": 2.1206799736325367e-05, - "loss": 2.2714, - "step": 330220 - }, - { - "epoch": 0.58, - "learning_rate": 2.1205927796398538e-05, - "loss": 2.1806, - "step": 330230 - }, - { - "epoch": 0.58, - "learning_rate": 2.1205055856471715e-05, - "loss": 2.4105, - "step": 330240 - }, - { - "epoch": 0.58, - "learning_rate": 2.120418391654489e-05, - "loss": 2.4349, - "step": 330250 - }, - { - "epoch": 0.58, - "learning_rate": 2.120331197661806e-05, - "loss": 2.2821, - "step": 330260 - }, - { - "epoch": 0.58, - "learning_rate": 2.1202440036691233e-05, - "loss": 2.3755, - "step": 330270 - }, - { - "epoch": 0.58, - "learning_rate": 2.1201568096764406e-05, - "loss": 2.268, - "step": 330280 - }, - { - "epoch": 0.58, - "learning_rate": 2.120069615683758e-05, - "loss": 2.4506, - "step": 330290 - }, - { - "epoch": 0.58, - "learning_rate": 2.119982421691075e-05, - "loss": 2.3692, - "step": 330300 - }, - { - "epoch": 0.58, - "learning_rate": 2.1198952276983928e-05, - "loss": 2.3737, - "step": 330310 - }, - { - "epoch": 0.58, - "learning_rate": 2.1198080337057098e-05, - "loss": 2.3647, - "step": 330320 - }, - { - "epoch": 0.58, - "learning_rate": 2.1197208397130272e-05, - "loss": 2.3994, - "step": 330330 - }, - { - "epoch": 0.58, - "learning_rate": 2.1196336457203446e-05, - "loss": 2.4788, - "step": 330340 - }, - { - "epoch": 0.58, - "learning_rate": 2.119546451727662e-05, - "loss": 2.3283, - "step": 330350 - }, - { - "epoch": 0.58, - "learning_rate": 2.1194592577349793e-05, - "loss": 2.4376, - "step": 330360 - }, - { - "epoch": 0.58, - "learning_rate": 2.1193720637422964e-05, - "loss": 2.2191, - "step": 330370 - }, - { - "epoch": 0.58, - "learning_rate": 2.1192848697496137e-05, - "loss": 2.4535, - "step": 330380 - }, - { - "epoch": 0.58, - "learning_rate": 2.119197675756931e-05, - "loss": 2.4245, - "step": 330390 - }, - { - "epoch": 0.58, - "learning_rate": 2.1191104817642485e-05, - "loss": 2.1765, - "step": 330400 - }, - { - "epoch": 0.58, - "learning_rate": 2.119023287771566e-05, - "loss": 2.3386, - "step": 330410 - }, - { - "epoch": 0.58, - "learning_rate": 2.1189360937788832e-05, - "loss": 2.3799, - "step": 330420 - }, - { - "epoch": 0.58, - "learning_rate": 2.1188488997862006e-05, - "loss": 2.3849, - "step": 330430 - }, - { - "epoch": 0.58, - "learning_rate": 2.1187617057935177e-05, - "loss": 2.3692, - "step": 330440 - }, - { - "epoch": 0.58, - "learning_rate": 2.118674511800835e-05, - "loss": 2.3738, - "step": 330450 - }, - { - "epoch": 0.58, - "learning_rate": 2.1185873178081524e-05, - "loss": 2.3412, - "step": 330460 - }, - { - "epoch": 0.58, - "learning_rate": 2.1185001238154698e-05, - "loss": 2.3559, - "step": 330470 - }, - { - "epoch": 0.58, - "learning_rate": 2.118412929822787e-05, - "loss": 2.3487, - "step": 330480 - }, - { - "epoch": 0.58, - "learning_rate": 2.1183257358301042e-05, - "loss": 2.4105, - "step": 330490 - }, - { - "epoch": 0.58, - "learning_rate": 2.118238541837422e-05, - "loss": 2.2681, - "step": 330500 - }, - { - "epoch": 0.58, - "learning_rate": 2.118151347844739e-05, - "loss": 2.4421, - "step": 330510 - }, - { - "epoch": 0.58, - "learning_rate": 2.1180641538520563e-05, - "loss": 2.2799, - "step": 330520 - }, - { - "epoch": 0.58, - "learning_rate": 2.1179769598593734e-05, - "loss": 2.3308, - "step": 330530 - }, - { - "epoch": 0.58, - "learning_rate": 2.117889765866691e-05, - "loss": 2.2923, - "step": 330540 - }, - { - "epoch": 0.58, - "learning_rate": 2.117802571874008e-05, - "loss": 2.3017, - "step": 330550 - }, - { - "epoch": 0.58, - "learning_rate": 2.1177153778813255e-05, - "loss": 2.3151, - "step": 330560 - }, - { - "epoch": 0.58, - "learning_rate": 2.117628183888643e-05, - "loss": 2.2553, - "step": 330570 - }, - { - "epoch": 0.58, - "learning_rate": 2.1175409898959603e-05, - "loss": 2.33, - "step": 330580 - }, - { - "epoch": 0.58, - "learning_rate": 2.1174537959032776e-05, - "loss": 2.3635, - "step": 330590 - }, - { - "epoch": 0.58, - "learning_rate": 2.1173666019105947e-05, - "loss": 2.3473, - "step": 330600 - }, - { - "epoch": 0.58, - "learning_rate": 2.1172794079179124e-05, - "loss": 2.2836, - "step": 330610 - }, - { - "epoch": 0.58, - "learning_rate": 2.1171922139252294e-05, - "loss": 2.3135, - "step": 330620 - }, - { - "epoch": 0.58, - "learning_rate": 2.1171050199325468e-05, - "loss": 2.3021, - "step": 330630 - }, - { - "epoch": 0.58, - "learning_rate": 2.1170178259398642e-05, - "loss": 2.2311, - "step": 330640 - }, - { - "epoch": 0.58, - "learning_rate": 2.1169306319471816e-05, - "loss": 2.2157, - "step": 330650 - }, - { - "epoch": 0.58, - "learning_rate": 2.116843437954499e-05, - "loss": 2.3393, - "step": 330660 - }, - { - "epoch": 0.58, - "learning_rate": 2.116756243961816e-05, - "loss": 2.3514, - "step": 330670 - }, - { - "epoch": 0.58, - "learning_rate": 2.1166690499691337e-05, - "loss": 2.301, - "step": 330680 - }, - { - "epoch": 0.58, - "learning_rate": 2.1165818559764507e-05, - "loss": 2.3681, - "step": 330690 - }, - { - "epoch": 0.58, - "learning_rate": 2.116494661983768e-05, - "loss": 2.3856, - "step": 330700 - }, - { - "epoch": 0.58, - "learning_rate": 2.116407467991085e-05, - "loss": 2.3727, - "step": 330710 - }, - { - "epoch": 0.58, - "learning_rate": 2.116320273998403e-05, - "loss": 2.3496, - "step": 330720 - }, - { - "epoch": 0.58, - "learning_rate": 2.11623308000572e-05, - "loss": 2.2649, - "step": 330730 - }, - { - "epoch": 0.58, - "learning_rate": 2.1161458860130373e-05, - "loss": 2.2897, - "step": 330740 - }, - { - "epoch": 0.58, - "learning_rate": 2.1160586920203547e-05, - "loss": 2.2983, - "step": 330750 - }, - { - "epoch": 0.58, - "learning_rate": 2.115971498027672e-05, - "loss": 2.2989, - "step": 330760 - }, - { - "epoch": 0.58, - "learning_rate": 2.1158843040349894e-05, - "loss": 2.3604, - "step": 330770 - }, - { - "epoch": 0.58, - "learning_rate": 2.1157971100423064e-05, - "loss": 2.3172, - "step": 330780 - }, - { - "epoch": 0.58, - "learning_rate": 2.1157099160496238e-05, - "loss": 2.2811, - "step": 330790 - }, - { - "epoch": 0.58, - "learning_rate": 2.1156227220569412e-05, - "loss": 2.3564, - "step": 330800 - }, - { - "epoch": 0.58, - "learning_rate": 2.1155355280642586e-05, - "loss": 2.254, - "step": 330810 - }, - { - "epoch": 0.58, - "learning_rate": 2.115448334071576e-05, - "loss": 2.3179, - "step": 330820 - }, - { - "epoch": 0.58, - "learning_rate": 2.1153611400788933e-05, - "loss": 2.2982, - "step": 330830 - }, - { - "epoch": 0.58, - "learning_rate": 2.1152739460862107e-05, - "loss": 2.3741, - "step": 330840 - }, - { - "epoch": 0.58, - "learning_rate": 2.1151867520935277e-05, - "loss": 2.3414, - "step": 330850 - }, - { - "epoch": 0.58, - "learning_rate": 2.115099558100845e-05, - "loss": 2.3453, - "step": 330860 - }, - { - "epoch": 0.58, - "learning_rate": 2.1150123641081625e-05, - "loss": 2.2692, - "step": 330870 - }, - { - "epoch": 0.58, - "learning_rate": 2.11492517011548e-05, - "loss": 2.2181, - "step": 330880 - }, - { - "epoch": 0.58, - "learning_rate": 2.1148379761227973e-05, - "loss": 2.2586, - "step": 330890 - }, - { - "epoch": 0.58, - "learning_rate": 2.1147507821301143e-05, - "loss": 2.2053, - "step": 330900 - }, - { - "epoch": 0.58, - "learning_rate": 2.114663588137432e-05, - "loss": 2.3327, - "step": 330910 - }, - { - "epoch": 0.58, - "learning_rate": 2.114576394144749e-05, - "loss": 2.3602, - "step": 330920 - }, - { - "epoch": 0.58, - "learning_rate": 2.1144892001520664e-05, - "loss": 2.382, - "step": 330930 - }, - { - "epoch": 0.58, - "learning_rate": 2.1144020061593835e-05, - "loss": 2.3213, - "step": 330940 - }, - { - "epoch": 0.58, - "learning_rate": 2.1143148121667012e-05, - "loss": 2.2978, - "step": 330950 - }, - { - "epoch": 0.58, - "learning_rate": 2.1142276181740182e-05, - "loss": 2.3414, - "step": 330960 - }, - { - "epoch": 0.58, - "learning_rate": 2.1141404241813356e-05, - "loss": 2.2844, - "step": 330970 - }, - { - "epoch": 0.58, - "learning_rate": 2.1140532301886533e-05, - "loss": 2.455, - "step": 330980 - }, - { - "epoch": 0.58, - "learning_rate": 2.1139660361959703e-05, - "loss": 2.3152, - "step": 330990 - }, - { - "epoch": 0.58, - "learning_rate": 2.1138788422032877e-05, - "loss": 2.3032, - "step": 331000 - }, - { - "epoch": 0.58, - "learning_rate": 2.1137916482106048e-05, - "loss": 2.3552, - "step": 331010 - }, - { - "epoch": 0.58, - "learning_rate": 2.1137044542179225e-05, - "loss": 2.4063, - "step": 331020 - }, - { - "epoch": 0.58, - "learning_rate": 2.1136172602252395e-05, - "loss": 2.3659, - "step": 331030 - }, - { - "epoch": 0.58, - "learning_rate": 2.113530066232557e-05, - "loss": 2.227, - "step": 331040 - }, - { - "epoch": 0.58, - "learning_rate": 2.1134428722398743e-05, - "loss": 2.302, - "step": 331050 - }, - { - "epoch": 0.58, - "learning_rate": 2.1133556782471916e-05, - "loss": 2.3517, - "step": 331060 - }, - { - "epoch": 0.58, - "learning_rate": 2.113268484254509e-05, - "loss": 2.3203, - "step": 331070 - }, - { - "epoch": 0.58, - "learning_rate": 2.113181290261826e-05, - "loss": 2.3711, - "step": 331080 - }, - { - "epoch": 0.58, - "learning_rate": 2.1130940962691438e-05, - "loss": 2.2157, - "step": 331090 - }, - { - "epoch": 0.58, - "learning_rate": 2.1130069022764608e-05, - "loss": 2.2404, - "step": 331100 - }, - { - "epoch": 0.58, - "learning_rate": 2.1129197082837782e-05, - "loss": 2.3604, - "step": 331110 - }, - { - "epoch": 0.58, - "learning_rate": 2.1128325142910956e-05, - "loss": 2.3019, - "step": 331120 - }, - { - "epoch": 0.58, - "learning_rate": 2.112745320298413e-05, - "loss": 2.3707, - "step": 331130 - }, - { - "epoch": 0.58, - "learning_rate": 2.1126581263057303e-05, - "loss": 2.3981, - "step": 331140 - }, - { - "epoch": 0.58, - "learning_rate": 2.1125709323130474e-05, - "loss": 2.3076, - "step": 331150 - }, - { - "epoch": 0.58, - "learning_rate": 2.1124837383203647e-05, - "loss": 2.3339, - "step": 331160 - }, - { - "epoch": 0.58, - "learning_rate": 2.112396544327682e-05, - "loss": 2.3551, - "step": 331170 - }, - { - "epoch": 0.58, - "learning_rate": 2.1123093503349995e-05, - "loss": 2.3067, - "step": 331180 - }, - { - "epoch": 0.58, - "learning_rate": 2.1122221563423165e-05, - "loss": 2.3079, - "step": 331190 - }, - { - "epoch": 0.58, - "learning_rate": 2.112134962349634e-05, - "loss": 2.3334, - "step": 331200 - }, - { - "epoch": 0.58, - "learning_rate": 2.1120477683569513e-05, - "loss": 2.4573, - "step": 331210 - }, - { - "epoch": 0.58, - "learning_rate": 2.1119605743642687e-05, - "loss": 2.29, - "step": 331220 - }, - { - "epoch": 0.58, - "learning_rate": 2.111873380371586e-05, - "loss": 2.2826, - "step": 331230 - }, - { - "epoch": 0.58, - "learning_rate": 2.1117861863789034e-05, - "loss": 2.3899, - "step": 331240 - }, - { - "epoch": 0.58, - "learning_rate": 2.1116989923862208e-05, - "loss": 2.3194, - "step": 331250 - }, - { - "epoch": 0.58, - "learning_rate": 2.111611798393538e-05, - "loss": 2.3761, - "step": 331260 - }, - { - "epoch": 0.58, - "learning_rate": 2.1115246044008552e-05, - "loss": 2.3072, - "step": 331270 - }, - { - "epoch": 0.58, - "learning_rate": 2.1114374104081726e-05, - "loss": 2.404, - "step": 331280 - }, - { - "epoch": 0.58, - "learning_rate": 2.11135021641549e-05, - "loss": 2.3082, - "step": 331290 - }, - { - "epoch": 0.58, - "learning_rate": 2.1112630224228073e-05, - "loss": 2.4075, - "step": 331300 - }, - { - "epoch": 0.58, - "learning_rate": 2.1111758284301244e-05, - "loss": 2.284, - "step": 331310 - }, - { - "epoch": 0.58, - "learning_rate": 2.111088634437442e-05, - "loss": 2.4308, - "step": 331320 - }, - { - "epoch": 0.58, - "learning_rate": 2.111001440444759e-05, - "loss": 2.3421, - "step": 331330 - }, - { - "epoch": 0.58, - "learning_rate": 2.1109142464520765e-05, - "loss": 2.2159, - "step": 331340 - }, - { - "epoch": 0.58, - "learning_rate": 2.110827052459394e-05, - "loss": 2.2826, - "step": 331350 - }, - { - "epoch": 0.58, - "learning_rate": 2.1107398584667113e-05, - "loss": 2.4458, - "step": 331360 - }, - { - "epoch": 0.58, - "learning_rate": 2.1106526644740286e-05, - "loss": 2.261, - "step": 331370 - }, - { - "epoch": 0.58, - "learning_rate": 2.1105654704813457e-05, - "loss": 2.2384, - "step": 331380 - }, - { - "epoch": 0.58, - "learning_rate": 2.1104782764886634e-05, - "loss": 2.4135, - "step": 331390 - }, - { - "epoch": 0.58, - "learning_rate": 2.1103910824959804e-05, - "loss": 2.3057, - "step": 331400 - }, - { - "epoch": 0.58, - "learning_rate": 2.1103038885032978e-05, - "loss": 2.2864, - "step": 331410 - }, - { - "epoch": 0.58, - "learning_rate": 2.110216694510615e-05, - "loss": 2.2138, - "step": 331420 - }, - { - "epoch": 0.58, - "learning_rate": 2.1101295005179326e-05, - "loss": 2.4212, - "step": 331430 - }, - { - "epoch": 0.58, - "learning_rate": 2.1100423065252496e-05, - "loss": 2.3146, - "step": 331440 - }, - { - "epoch": 0.58, - "learning_rate": 2.109955112532567e-05, - "loss": 2.3094, - "step": 331450 - }, - { - "epoch": 0.58, - "learning_rate": 2.1098679185398844e-05, - "loss": 2.3242, - "step": 331460 - }, - { - "epoch": 0.58, - "learning_rate": 2.1097807245472017e-05, - "loss": 2.4165, - "step": 331470 - }, - { - "epoch": 0.58, - "learning_rate": 2.109693530554519e-05, - "loss": 2.2859, - "step": 331480 - }, - { - "epoch": 0.58, - "learning_rate": 2.109606336561836e-05, - "loss": 2.2615, - "step": 331490 - }, - { - "epoch": 0.58, - "learning_rate": 2.109519142569154e-05, - "loss": 2.4834, - "step": 331500 - }, - { - "epoch": 0.58, - "learning_rate": 2.109431948576471e-05, - "loss": 2.3469, - "step": 331510 - }, - { - "epoch": 0.58, - "learning_rate": 2.1093447545837883e-05, - "loss": 2.2846, - "step": 331520 - }, - { - "epoch": 0.58, - "learning_rate": 2.1092575605911057e-05, - "loss": 2.3392, - "step": 331530 - }, - { - "epoch": 0.58, - "learning_rate": 2.109170366598423e-05, - "loss": 2.2899, - "step": 331540 - }, - { - "epoch": 0.58, - "learning_rate": 2.1090831726057404e-05, - "loss": 2.2635, - "step": 331550 - }, - { - "epoch": 0.58, - "learning_rate": 2.1089959786130574e-05, - "loss": 2.2825, - "step": 331560 - }, - { - "epoch": 0.58, - "learning_rate": 2.1089087846203748e-05, - "loss": 2.4102, - "step": 331570 - }, - { - "epoch": 0.58, - "learning_rate": 2.1088215906276922e-05, - "loss": 2.3355, - "step": 331580 - }, - { - "epoch": 0.58, - "learning_rate": 2.1087343966350096e-05, - "loss": 2.426, - "step": 331590 - }, - { - "epoch": 0.58, - "learning_rate": 2.108647202642327e-05, - "loss": 2.3151, - "step": 331600 - }, - { - "epoch": 0.58, - "learning_rate": 2.108560008649644e-05, - "loss": 2.3628, - "step": 331610 - }, - { - "epoch": 0.58, - "learning_rate": 2.1084728146569617e-05, - "loss": 2.374, - "step": 331620 - }, - { - "epoch": 0.58, - "learning_rate": 2.1083856206642787e-05, - "loss": 2.3608, - "step": 331630 - }, - { - "epoch": 0.58, - "learning_rate": 2.108298426671596e-05, - "loss": 2.2921, - "step": 331640 - }, - { - "epoch": 0.58, - "learning_rate": 2.1082112326789135e-05, - "loss": 2.333, - "step": 331650 - }, - { - "epoch": 0.58, - "learning_rate": 2.108124038686231e-05, - "loss": 2.3861, - "step": 331660 - }, - { - "epoch": 0.58, - "learning_rate": 2.108036844693548e-05, - "loss": 2.2493, - "step": 331670 - }, - { - "epoch": 0.58, - "learning_rate": 2.1079496507008653e-05, - "loss": 2.3895, - "step": 331680 - }, - { - "epoch": 0.58, - "learning_rate": 2.1078624567081827e-05, - "loss": 2.4576, - "step": 331690 - }, - { - "epoch": 0.58, - "learning_rate": 2.1077752627155e-05, - "loss": 2.2758, - "step": 331700 - }, - { - "epoch": 0.58, - "learning_rate": 2.1076880687228174e-05, - "loss": 2.2788, - "step": 331710 - }, - { - "epoch": 0.58, - "learning_rate": 2.1076008747301345e-05, - "loss": 2.2826, - "step": 331720 - }, - { - "epoch": 0.58, - "learning_rate": 2.1075136807374522e-05, - "loss": 2.2985, - "step": 331730 - }, - { - "epoch": 0.58, - "learning_rate": 2.1074264867447692e-05, - "loss": 2.271, - "step": 331740 - }, - { - "epoch": 0.58, - "learning_rate": 2.1073392927520866e-05, - "loss": 2.2985, - "step": 331750 - }, - { - "epoch": 0.58, - "learning_rate": 2.107252098759404e-05, - "loss": 2.2391, - "step": 331760 - }, - { - "epoch": 0.58, - "learning_rate": 2.1071649047667213e-05, - "loss": 2.3479, - "step": 331770 - }, - { - "epoch": 0.58, - "learning_rate": 2.1070777107740387e-05, - "loss": 2.2975, - "step": 331780 - }, - { - "epoch": 0.58, - "learning_rate": 2.1069905167813558e-05, - "loss": 2.2835, - "step": 331790 - }, - { - "epoch": 0.58, - "learning_rate": 2.1069033227886735e-05, - "loss": 2.3767, - "step": 331800 - }, - { - "epoch": 0.58, - "learning_rate": 2.1068161287959905e-05, - "loss": 2.4244, - "step": 331810 - }, - { - "epoch": 0.58, - "learning_rate": 2.106728934803308e-05, - "loss": 2.3304, - "step": 331820 - }, - { - "epoch": 0.58, - "learning_rate": 2.106641740810625e-05, - "loss": 2.2724, - "step": 331830 - }, - { - "epoch": 0.58, - "learning_rate": 2.1065545468179426e-05, - "loss": 2.3446, - "step": 331840 - }, - { - "epoch": 0.58, - "learning_rate": 2.10646735282526e-05, - "loss": 2.2556, - "step": 331850 - }, - { - "epoch": 0.58, - "learning_rate": 2.106380158832577e-05, - "loss": 2.371, - "step": 331860 - }, - { - "epoch": 0.58, - "learning_rate": 2.1062929648398944e-05, - "loss": 2.2427, - "step": 331870 - }, - { - "epoch": 0.58, - "learning_rate": 2.1062057708472118e-05, - "loss": 2.2679, - "step": 331880 - }, - { - "epoch": 0.58, - "learning_rate": 2.1061185768545292e-05, - "loss": 2.3364, - "step": 331890 - }, - { - "epoch": 0.58, - "learning_rate": 2.1060313828618462e-05, - "loss": 2.2652, - "step": 331900 - }, - { - "epoch": 0.58, - "learning_rate": 2.105944188869164e-05, - "loss": 2.3388, - "step": 331910 - }, - { - "epoch": 0.58, - "learning_rate": 2.105856994876481e-05, - "loss": 2.437, - "step": 331920 - }, - { - "epoch": 0.58, - "learning_rate": 2.1057698008837984e-05, - "loss": 2.3925, - "step": 331930 - }, - { - "epoch": 0.58, - "learning_rate": 2.1056826068911157e-05, - "loss": 2.2451, - "step": 331940 - }, - { - "epoch": 0.58, - "learning_rate": 2.105595412898433e-05, - "loss": 2.4141, - "step": 331950 - }, - { - "epoch": 0.58, - "learning_rate": 2.1055082189057505e-05, - "loss": 2.4586, - "step": 331960 - }, - { - "epoch": 0.58, - "learning_rate": 2.1054210249130675e-05, - "loss": 2.4166, - "step": 331970 - }, - { - "epoch": 0.58, - "learning_rate": 2.105333830920385e-05, - "loss": 2.285, - "step": 331980 - }, - { - "epoch": 0.58, - "learning_rate": 2.1052466369277023e-05, - "loss": 2.4062, - "step": 331990 - }, - { - "epoch": 0.58, - "learning_rate": 2.1051594429350197e-05, - "loss": 2.3515, - "step": 332000 - }, - { - "epoch": 0.58, - "learning_rate": 2.105072248942337e-05, - "loss": 2.3034, - "step": 332010 - }, - { - "epoch": 0.58, - "learning_rate": 2.1049850549496544e-05, - "loss": 2.3782, - "step": 332020 - }, - { - "epoch": 0.58, - "learning_rate": 2.1048978609569718e-05, - "loss": 2.3573, - "step": 332030 - }, - { - "epoch": 0.58, - "learning_rate": 2.104810666964289e-05, - "loss": 2.2841, - "step": 332040 - }, - { - "epoch": 0.58, - "learning_rate": 2.1047234729716062e-05, - "loss": 2.3776, - "step": 332050 - }, - { - "epoch": 0.58, - "learning_rate": 2.1046362789789236e-05, - "loss": 2.3405, - "step": 332060 - }, - { - "epoch": 0.58, - "learning_rate": 2.104549084986241e-05, - "loss": 2.1603, - "step": 332070 - }, - { - "epoch": 0.58, - "learning_rate": 2.104461890993558e-05, - "loss": 2.2864, - "step": 332080 - }, - { - "epoch": 0.58, - "learning_rate": 2.1043746970008754e-05, - "loss": 2.3613, - "step": 332090 - }, - { - "epoch": 0.58, - "learning_rate": 2.104287503008193e-05, - "loss": 2.2777, - "step": 332100 - }, - { - "epoch": 0.58, - "learning_rate": 2.10420030901551e-05, - "loss": 2.3224, - "step": 332110 - }, - { - "epoch": 0.58, - "learning_rate": 2.1041131150228275e-05, - "loss": 2.3017, - "step": 332120 - }, - { - "epoch": 0.58, - "learning_rate": 2.1040259210301445e-05, - "loss": 2.4039, - "step": 332130 - }, - { - "epoch": 0.58, - "learning_rate": 2.1039387270374623e-05, - "loss": 2.4262, - "step": 332140 - }, - { - "epoch": 0.58, - "learning_rate": 2.1038515330447793e-05, - "loss": 2.3055, - "step": 332150 - }, - { - "epoch": 0.58, - "learning_rate": 2.1037643390520967e-05, - "loss": 2.2311, - "step": 332160 - }, - { - "epoch": 0.58, - "learning_rate": 2.103677145059414e-05, - "loss": 2.3658, - "step": 332170 - }, - { - "epoch": 0.58, - "learning_rate": 2.1035899510667314e-05, - "loss": 2.3691, - "step": 332180 - }, - { - "epoch": 0.58, - "learning_rate": 2.1035027570740488e-05, - "loss": 2.3646, - "step": 332190 - }, - { - "epoch": 0.58, - "learning_rate": 2.103415563081366e-05, - "loss": 2.395, - "step": 332200 - }, - { - "epoch": 0.58, - "learning_rate": 2.1033283690886836e-05, - "loss": 2.4215, - "step": 332210 - }, - { - "epoch": 0.58, - "learning_rate": 2.1032411750960006e-05, - "loss": 2.3719, - "step": 332220 - }, - { - "epoch": 0.58, - "learning_rate": 2.103153981103318e-05, - "loss": 2.3922, - "step": 332230 - }, - { - "epoch": 0.58, - "learning_rate": 2.1030667871106354e-05, - "loss": 2.315, - "step": 332240 - }, - { - "epoch": 0.58, - "learning_rate": 2.1029795931179527e-05, - "loss": 2.3156, - "step": 332250 - }, - { - "epoch": 0.58, - "learning_rate": 2.10289239912527e-05, - "loss": 2.3289, - "step": 332260 - }, - { - "epoch": 0.58, - "learning_rate": 2.102805205132587e-05, - "loss": 2.3193, - "step": 332270 - }, - { - "epoch": 0.58, - "learning_rate": 2.102718011139905e-05, - "loss": 2.3812, - "step": 332280 - }, - { - "epoch": 0.58, - "learning_rate": 2.102630817147222e-05, - "loss": 2.2654, - "step": 332290 - }, - { - "epoch": 0.58, - "learning_rate": 2.1025436231545393e-05, - "loss": 2.3175, - "step": 332300 - }, - { - "epoch": 0.58, - "learning_rate": 2.1024564291618563e-05, - "loss": 2.4188, - "step": 332310 - }, - { - "epoch": 0.58, - "learning_rate": 2.102369235169174e-05, - "loss": 2.3565, - "step": 332320 - }, - { - "epoch": 0.58, - "learning_rate": 2.1022820411764914e-05, - "loss": 2.3777, - "step": 332330 - }, - { - "epoch": 0.58, - "learning_rate": 2.1021948471838084e-05, - "loss": 2.2389, - "step": 332340 - }, - { - "epoch": 0.58, - "learning_rate": 2.1021076531911258e-05, - "loss": 2.3938, - "step": 332350 - }, - { - "epoch": 0.58, - "learning_rate": 2.1020204591984432e-05, - "loss": 2.3265, - "step": 332360 - }, - { - "epoch": 0.58, - "learning_rate": 2.1019332652057606e-05, - "loss": 2.3629, - "step": 332370 - }, - { - "epoch": 0.58, - "learning_rate": 2.1018460712130776e-05, - "loss": 2.3906, - "step": 332380 - }, - { - "epoch": 0.58, - "learning_rate": 2.101758877220395e-05, - "loss": 2.4485, - "step": 332390 - }, - { - "epoch": 0.58, - "learning_rate": 2.1016716832277124e-05, - "loss": 2.2912, - "step": 332400 - }, - { - "epoch": 0.58, - "learning_rate": 2.1015844892350297e-05, - "loss": 2.2923, - "step": 332410 - }, - { - "epoch": 0.58, - "learning_rate": 2.101497295242347e-05, - "loss": 2.4041, - "step": 332420 - }, - { - "epoch": 0.58, - "learning_rate": 2.1014101012496645e-05, - "loss": 2.3409, - "step": 332430 - }, - { - "epoch": 0.58, - "learning_rate": 2.101322907256982e-05, - "loss": 2.249, - "step": 332440 - }, - { - "epoch": 0.58, - "learning_rate": 2.101235713264299e-05, - "loss": 2.3955, - "step": 332450 - }, - { - "epoch": 0.58, - "learning_rate": 2.1011485192716163e-05, - "loss": 2.2388, - "step": 332460 - }, - { - "epoch": 0.58, - "learning_rate": 2.1010613252789337e-05, - "loss": 2.3177, - "step": 332470 - }, - { - "epoch": 0.58, - "learning_rate": 2.100974131286251e-05, - "loss": 2.3138, - "step": 332480 - }, - { - "epoch": 0.58, - "learning_rate": 2.1008869372935684e-05, - "loss": 2.3136, - "step": 332490 - }, - { - "epoch": 0.58, - "learning_rate": 2.1007997433008855e-05, - "loss": 2.3532, - "step": 332500 - }, - { - "epoch": 0.58, - "learning_rate": 2.1007125493082032e-05, - "loss": 2.3281, - "step": 332510 - }, - { - "epoch": 0.58, - "learning_rate": 2.1006253553155202e-05, - "loss": 2.347, - "step": 332520 - }, - { - "epoch": 0.58, - "learning_rate": 2.1005381613228376e-05, - "loss": 2.251, - "step": 332530 - }, - { - "epoch": 0.58, - "learning_rate": 2.1004509673301546e-05, - "loss": 2.4278, - "step": 332540 - }, - { - "epoch": 0.58, - "learning_rate": 2.1003637733374723e-05, - "loss": 2.2274, - "step": 332550 - }, - { - "epoch": 0.58, - "learning_rate": 2.1002765793447894e-05, - "loss": 2.309, - "step": 332560 - }, - { - "epoch": 0.58, - "learning_rate": 2.1001893853521068e-05, - "loss": 2.3586, - "step": 332570 - }, - { - "epoch": 0.58, - "learning_rate": 2.1001021913594245e-05, - "loss": 2.2519, - "step": 332580 - }, - { - "epoch": 0.58, - "learning_rate": 2.1000149973667415e-05, - "loss": 2.31, - "step": 332590 - }, - { - "epoch": 0.58, - "learning_rate": 2.099927803374059e-05, - "loss": 2.3282, - "step": 332600 - }, - { - "epoch": 0.58, - "learning_rate": 2.099840609381376e-05, - "loss": 2.3775, - "step": 332610 - }, - { - "epoch": 0.58, - "learning_rate": 2.0997534153886936e-05, - "loss": 2.3458, - "step": 332620 - }, - { - "epoch": 0.58, - "learning_rate": 2.0996662213960107e-05, - "loss": 2.4899, - "step": 332630 - }, - { - "epoch": 0.58, - "learning_rate": 2.099579027403328e-05, - "loss": 2.3935, - "step": 332640 - }, - { - "epoch": 0.58, - "learning_rate": 2.0994918334106454e-05, - "loss": 2.338, - "step": 332650 - }, - { - "epoch": 0.58, - "learning_rate": 2.0994046394179628e-05, - "loss": 2.2941, - "step": 332660 - }, - { - "epoch": 0.58, - "learning_rate": 2.0993174454252802e-05, - "loss": 2.2671, - "step": 332670 - }, - { - "epoch": 0.58, - "learning_rate": 2.0992302514325972e-05, - "loss": 2.3903, - "step": 332680 - }, - { - "epoch": 0.58, - "learning_rate": 2.099143057439915e-05, - "loss": 2.2412, - "step": 332690 - }, - { - "epoch": 0.58, - "learning_rate": 2.099055863447232e-05, - "loss": 2.3846, - "step": 332700 - }, - { - "epoch": 0.58, - "learning_rate": 2.0989686694545494e-05, - "loss": 2.3578, - "step": 332710 - }, - { - "epoch": 0.58, - "learning_rate": 2.0988814754618667e-05, - "loss": 2.3972, - "step": 332720 - }, - { - "epoch": 0.58, - "learning_rate": 2.098794281469184e-05, - "loss": 2.2864, - "step": 332730 - }, - { - "epoch": 0.58, - "learning_rate": 2.0987070874765015e-05, - "loss": 2.3322, - "step": 332740 - }, - { - "epoch": 0.58, - "learning_rate": 2.0986198934838185e-05, - "loss": 2.3444, - "step": 332750 - }, - { - "epoch": 0.58, - "learning_rate": 2.098532699491136e-05, - "loss": 2.2796, - "step": 332760 - }, - { - "epoch": 0.58, - "learning_rate": 2.0984455054984533e-05, - "loss": 2.3497, - "step": 332770 - }, - { - "epoch": 0.58, - "learning_rate": 2.0983583115057707e-05, - "loss": 2.3297, - "step": 332780 - }, - { - "epoch": 0.58, - "learning_rate": 2.0982711175130877e-05, - "loss": 2.3763, - "step": 332790 - }, - { - "epoch": 0.58, - "learning_rate": 2.098183923520405e-05, - "loss": 2.3271, - "step": 332800 - }, - { - "epoch": 0.58, - "learning_rate": 2.0980967295277225e-05, - "loss": 2.2655, - "step": 332810 - }, - { - "epoch": 0.58, - "learning_rate": 2.09800953553504e-05, - "loss": 2.2209, - "step": 332820 - }, - { - "epoch": 0.58, - "learning_rate": 2.0979223415423572e-05, - "loss": 2.362, - "step": 332830 - }, - { - "epoch": 0.58, - "learning_rate": 2.0978351475496746e-05, - "loss": 2.253, - "step": 332840 - }, - { - "epoch": 0.58, - "learning_rate": 2.097747953556992e-05, - "loss": 2.3625, - "step": 332850 - }, - { - "epoch": 0.58, - "learning_rate": 2.097660759564309e-05, - "loss": 2.2809, - "step": 332860 - }, - { - "epoch": 0.58, - "learning_rate": 2.0975735655716264e-05, - "loss": 2.3391, - "step": 332870 - }, - { - "epoch": 0.58, - "learning_rate": 2.0974863715789438e-05, - "loss": 2.3176, - "step": 332880 - }, - { - "epoch": 0.58, - "learning_rate": 2.097399177586261e-05, - "loss": 2.304, - "step": 332890 - }, - { - "epoch": 0.58, - "learning_rate": 2.0973119835935785e-05, - "loss": 2.3482, - "step": 332900 - }, - { - "epoch": 0.58, - "learning_rate": 2.0972247896008955e-05, - "loss": 2.3385, - "step": 332910 - }, - { - "epoch": 0.58, - "learning_rate": 2.0971375956082133e-05, - "loss": 2.4194, - "step": 332920 - }, - { - "epoch": 0.58, - "learning_rate": 2.0970504016155303e-05, - "loss": 2.2658, - "step": 332930 - }, - { - "epoch": 0.58, - "learning_rate": 2.0969632076228477e-05, - "loss": 2.3248, - "step": 332940 - }, - { - "epoch": 0.58, - "learning_rate": 2.096876013630165e-05, - "loss": 2.4774, - "step": 332950 - }, - { - "epoch": 0.58, - "learning_rate": 2.0967888196374824e-05, - "loss": 2.3209, - "step": 332960 - }, - { - "epoch": 0.58, - "learning_rate": 2.0967016256447998e-05, - "loss": 2.3741, - "step": 332970 - }, - { - "epoch": 0.58, - "learning_rate": 2.096614431652117e-05, - "loss": 2.3559, - "step": 332980 - }, - { - "epoch": 0.58, - "learning_rate": 2.0965272376594346e-05, - "loss": 2.3577, - "step": 332990 - }, - { - "epoch": 0.58, - "learning_rate": 2.0964400436667516e-05, - "loss": 2.4038, - "step": 333000 - }, - { - "epoch": 0.58, - "learning_rate": 2.096352849674069e-05, - "loss": 2.4093, - "step": 333010 - }, - { - "epoch": 0.58, - "learning_rate": 2.096265655681386e-05, - "loss": 2.3801, - "step": 333020 - }, - { - "epoch": 0.58, - "learning_rate": 2.0961784616887037e-05, - "loss": 2.4384, - "step": 333030 - }, - { - "epoch": 0.58, - "learning_rate": 2.0960912676960208e-05, - "loss": 2.1224, - "step": 333040 - }, - { - "epoch": 0.58, - "learning_rate": 2.096004073703338e-05, - "loss": 2.3105, - "step": 333050 - }, - { - "epoch": 0.58, - "learning_rate": 2.0959168797106555e-05, - "loss": 2.3545, - "step": 333060 - }, - { - "epoch": 0.58, - "learning_rate": 2.095829685717973e-05, - "loss": 2.2249, - "step": 333070 - }, - { - "epoch": 0.58, - "learning_rate": 2.0957424917252903e-05, - "loss": 2.3651, - "step": 333080 - }, - { - "epoch": 0.58, - "learning_rate": 2.0956552977326073e-05, - "loss": 2.2603, - "step": 333090 - }, - { - "epoch": 0.58, - "learning_rate": 2.095568103739925e-05, - "loss": 2.2548, - "step": 333100 - }, - { - "epoch": 0.58, - "learning_rate": 2.095480909747242e-05, - "loss": 2.3563, - "step": 333110 - }, - { - "epoch": 0.58, - "learning_rate": 2.0953937157545594e-05, - "loss": 2.2813, - "step": 333120 - }, - { - "epoch": 0.58, - "learning_rate": 2.0953065217618768e-05, - "loss": 2.2987, - "step": 333130 - }, - { - "epoch": 0.58, - "learning_rate": 2.0952193277691942e-05, - "loss": 2.3156, - "step": 333140 - }, - { - "epoch": 0.58, - "learning_rate": 2.0951321337765116e-05, - "loss": 2.2948, - "step": 333150 - }, - { - "epoch": 0.58, - "learning_rate": 2.0950449397838286e-05, - "loss": 2.3406, - "step": 333160 - }, - { - "epoch": 0.58, - "learning_rate": 2.094957745791146e-05, - "loss": 2.379, - "step": 333170 - }, - { - "epoch": 0.58, - "learning_rate": 2.0948705517984634e-05, - "loss": 2.3093, - "step": 333180 - }, - { - "epoch": 0.58, - "learning_rate": 2.0947833578057807e-05, - "loss": 2.302, - "step": 333190 - }, - { - "epoch": 0.58, - "learning_rate": 2.094696163813098e-05, - "loss": 2.3785, - "step": 333200 - }, - { - "epoch": 0.58, - "learning_rate": 2.0946089698204155e-05, - "loss": 2.3221, - "step": 333210 - }, - { - "epoch": 0.58, - "learning_rate": 2.094521775827733e-05, - "loss": 2.2867, - "step": 333220 - }, - { - "epoch": 0.58, - "learning_rate": 2.09443458183505e-05, - "loss": 2.3409, - "step": 333230 - }, - { - "epoch": 0.58, - "learning_rate": 2.0943473878423673e-05, - "loss": 2.3665, - "step": 333240 - }, - { - "epoch": 0.58, - "learning_rate": 2.0942601938496847e-05, - "loss": 2.3541, - "step": 333250 - }, - { - "epoch": 0.58, - "learning_rate": 2.094172999857002e-05, - "loss": 2.3214, - "step": 333260 - }, - { - "epoch": 0.58, - "learning_rate": 2.094085805864319e-05, - "loss": 2.2546, - "step": 333270 - }, - { - "epoch": 0.58, - "learning_rate": 2.0939986118716365e-05, - "loss": 2.3087, - "step": 333280 - }, - { - "epoch": 0.58, - "learning_rate": 2.093911417878954e-05, - "loss": 2.2347, - "step": 333290 - }, - { - "epoch": 0.58, - "learning_rate": 2.0938242238862712e-05, - "loss": 2.3037, - "step": 333300 - }, - { - "epoch": 0.58, - "learning_rate": 2.0937370298935886e-05, - "loss": 2.2373, - "step": 333310 - }, - { - "epoch": 0.58, - "learning_rate": 2.0936498359009056e-05, - "loss": 2.3279, - "step": 333320 - }, - { - "epoch": 0.58, - "learning_rate": 2.0935626419082234e-05, - "loss": 2.4537, - "step": 333330 - }, - { - "epoch": 0.58, - "learning_rate": 2.0934754479155404e-05, - "loss": 2.4537, - "step": 333340 - }, - { - "epoch": 0.58, - "learning_rate": 2.0933882539228578e-05, - "loss": 2.3025, - "step": 333350 - }, - { - "epoch": 0.58, - "learning_rate": 2.093301059930175e-05, - "loss": 2.3957, - "step": 333360 - }, - { - "epoch": 0.58, - "learning_rate": 2.0932138659374925e-05, - "loss": 2.3143, - "step": 333370 - }, - { - "epoch": 0.58, - "learning_rate": 2.09312667194481e-05, - "loss": 2.3033, - "step": 333380 - }, - { - "epoch": 0.58, - "learning_rate": 2.093039477952127e-05, - "loss": 2.3338, - "step": 333390 - }, - { - "epoch": 0.58, - "learning_rate": 2.0929522839594447e-05, - "loss": 2.4436, - "step": 333400 - }, - { - "epoch": 0.58, - "learning_rate": 2.0928650899667617e-05, - "loss": 2.3172, - "step": 333410 - }, - { - "epoch": 0.58, - "learning_rate": 2.092777895974079e-05, - "loss": 2.3115, - "step": 333420 - }, - { - "epoch": 0.58, - "learning_rate": 2.0926907019813964e-05, - "loss": 2.3784, - "step": 333430 - }, - { - "epoch": 0.58, - "learning_rate": 2.0926035079887138e-05, - "loss": 2.2896, - "step": 333440 - }, - { - "epoch": 0.58, - "learning_rate": 2.0925163139960312e-05, - "loss": 2.3138, - "step": 333450 - }, - { - "epoch": 0.58, - "learning_rate": 2.0924291200033482e-05, - "loss": 2.3278, - "step": 333460 - }, - { - "epoch": 0.58, - "learning_rate": 2.0923419260106656e-05, - "loss": 2.2977, - "step": 333470 - }, - { - "epoch": 0.58, - "learning_rate": 2.092254732017983e-05, - "loss": 2.3084, - "step": 333480 - }, - { - "epoch": 0.58, - "learning_rate": 2.0921675380253004e-05, - "loss": 2.3614, - "step": 333490 - }, - { - "epoch": 0.58, - "learning_rate": 2.0920803440326174e-05, - "loss": 2.2933, - "step": 333500 - }, - { - "epoch": 0.58, - "learning_rate": 2.091993150039935e-05, - "loss": 2.3163, - "step": 333510 - }, - { - "epoch": 0.58, - "learning_rate": 2.091905956047252e-05, - "loss": 2.3961, - "step": 333520 - }, - { - "epoch": 0.58, - "learning_rate": 2.0918187620545695e-05, - "loss": 2.3437, - "step": 333530 - }, - { - "epoch": 0.58, - "learning_rate": 2.091731568061887e-05, - "loss": 2.2885, - "step": 333540 - }, - { - "epoch": 0.58, - "learning_rate": 2.0916443740692043e-05, - "loss": 2.303, - "step": 333550 - }, - { - "epoch": 0.58, - "learning_rate": 2.0915571800765217e-05, - "loss": 2.3501, - "step": 333560 - }, - { - "epoch": 0.58, - "learning_rate": 2.0914699860838387e-05, - "loss": 2.3509, - "step": 333570 - }, - { - "epoch": 0.58, - "learning_rate": 2.091382792091156e-05, - "loss": 2.3157, - "step": 333580 - }, - { - "epoch": 0.58, - "learning_rate": 2.0912955980984735e-05, - "loss": 2.2078, - "step": 333590 - }, - { - "epoch": 0.58, - "learning_rate": 2.091208404105791e-05, - "loss": 2.3417, - "step": 333600 - }, - { - "epoch": 0.58, - "learning_rate": 2.0911212101131082e-05, - "loss": 2.3321, - "step": 333610 - }, - { - "epoch": 0.58, - "learning_rate": 2.0910340161204256e-05, - "loss": 2.4379, - "step": 333620 - }, - { - "epoch": 0.58, - "learning_rate": 2.090946822127743e-05, - "loss": 2.4691, - "step": 333630 - }, - { - "epoch": 0.58, - "learning_rate": 2.09085962813506e-05, - "loss": 2.2801, - "step": 333640 - }, - { - "epoch": 0.58, - "learning_rate": 2.0907724341423774e-05, - "loss": 2.1598, - "step": 333650 - }, - { - "epoch": 0.58, - "learning_rate": 2.0906852401496948e-05, - "loss": 2.3032, - "step": 333660 - }, - { - "epoch": 0.58, - "learning_rate": 2.090598046157012e-05, - "loss": 2.2803, - "step": 333670 - }, - { - "epoch": 0.58, - "learning_rate": 2.0905108521643295e-05, - "loss": 2.4337, - "step": 333680 - }, - { - "epoch": 0.58, - "learning_rate": 2.0904236581716466e-05, - "loss": 2.3405, - "step": 333690 - }, - { - "epoch": 0.58, - "learning_rate": 2.0903364641789643e-05, - "loss": 2.296, - "step": 333700 - }, - { - "epoch": 0.58, - "learning_rate": 2.0902492701862813e-05, - "loss": 2.3279, - "step": 333710 - }, - { - "epoch": 0.58, - "learning_rate": 2.0901620761935987e-05, - "loss": 2.3639, - "step": 333720 - }, - { - "epoch": 0.58, - "learning_rate": 2.0900748822009157e-05, - "loss": 2.2857, - "step": 333730 - }, - { - "epoch": 0.58, - "learning_rate": 2.0899876882082334e-05, - "loss": 2.2393, - "step": 333740 - }, - { - "epoch": 0.58, - "learning_rate": 2.0899004942155505e-05, - "loss": 2.3367, - "step": 333750 - }, - { - "epoch": 0.58, - "learning_rate": 2.089813300222868e-05, - "loss": 2.2362, - "step": 333760 - }, - { - "epoch": 0.58, - "learning_rate": 2.0897261062301852e-05, - "loss": 2.2315, - "step": 333770 - }, - { - "epoch": 0.58, - "learning_rate": 2.0896389122375026e-05, - "loss": 2.208, - "step": 333780 - }, - { - "epoch": 0.58, - "learning_rate": 2.08955171824482e-05, - "loss": 2.3756, - "step": 333790 - }, - { - "epoch": 0.58, - "learning_rate": 2.089464524252137e-05, - "loss": 2.2584, - "step": 333800 - }, - { - "epoch": 0.58, - "learning_rate": 2.0893773302594547e-05, - "loss": 2.347, - "step": 333810 - }, - { - "epoch": 0.58, - "learning_rate": 2.0892901362667718e-05, - "loss": 2.3091, - "step": 333820 - }, - { - "epoch": 0.58, - "learning_rate": 2.089202942274089e-05, - "loss": 2.214, - "step": 333830 - }, - { - "epoch": 0.58, - "learning_rate": 2.0891157482814065e-05, - "loss": 2.3701, - "step": 333840 - }, - { - "epoch": 0.58, - "learning_rate": 2.089028554288724e-05, - "loss": 2.3266, - "step": 333850 - }, - { - "epoch": 0.58, - "learning_rate": 2.0889413602960413e-05, - "loss": 2.3315, - "step": 333860 - }, - { - "epoch": 0.58, - "learning_rate": 2.0888541663033583e-05, - "loss": 2.311, - "step": 333870 - }, - { - "epoch": 0.58, - "learning_rate": 2.088766972310676e-05, - "loss": 2.3568, - "step": 333880 - }, - { - "epoch": 0.58, - "learning_rate": 2.088679778317993e-05, - "loss": 2.3191, - "step": 333890 - }, - { - "epoch": 0.58, - "learning_rate": 2.0885925843253105e-05, - "loss": 2.3148, - "step": 333900 - }, - { - "epoch": 0.58, - "learning_rate": 2.0885053903326275e-05, - "loss": 2.3337, - "step": 333910 - }, - { - "epoch": 0.58, - "learning_rate": 2.0884181963399452e-05, - "loss": 2.3942, - "step": 333920 - }, - { - "epoch": 0.58, - "learning_rate": 2.0883310023472626e-05, - "loss": 2.3463, - "step": 333930 - }, - { - "epoch": 0.58, - "learning_rate": 2.0882438083545796e-05, - "loss": 2.2327, - "step": 333940 - }, - { - "epoch": 0.58, - "learning_rate": 2.088156614361897e-05, - "loss": 2.3772, - "step": 333950 - }, - { - "epoch": 0.58, - "learning_rate": 2.0880694203692144e-05, - "loss": 2.306, - "step": 333960 - }, - { - "epoch": 0.58, - "learning_rate": 2.0879822263765318e-05, - "loss": 2.3154, - "step": 333970 - }, - { - "epoch": 0.58, - "learning_rate": 2.0878950323838488e-05, - "loss": 2.293, - "step": 333980 - }, - { - "epoch": 0.58, - "learning_rate": 2.087807838391166e-05, - "loss": 2.3141, - "step": 333990 - }, - { - "epoch": 0.58, - "learning_rate": 2.0877206443984835e-05, - "loss": 2.3507, - "step": 334000 - }, - { - "epoch": 0.58, - "learning_rate": 2.087633450405801e-05, - "loss": 2.2521, - "step": 334010 - }, - { - "epoch": 0.58, - "learning_rate": 2.0875462564131183e-05, - "loss": 2.4041, - "step": 334020 - }, - { - "epoch": 0.58, - "learning_rate": 2.0874590624204357e-05, - "loss": 2.2315, - "step": 334030 - }, - { - "epoch": 0.58, - "learning_rate": 2.087371868427753e-05, - "loss": 2.4264, - "step": 334040 - }, - { - "epoch": 0.58, - "learning_rate": 2.08728467443507e-05, - "loss": 2.2739, - "step": 334050 - }, - { - "epoch": 0.58, - "learning_rate": 2.0871974804423875e-05, - "loss": 2.2439, - "step": 334060 - }, - { - "epoch": 0.58, - "learning_rate": 2.087110286449705e-05, - "loss": 2.4256, - "step": 334070 - }, - { - "epoch": 0.58, - "learning_rate": 2.0870230924570222e-05, - "loss": 2.4389, - "step": 334080 - }, - { - "epoch": 0.58, - "learning_rate": 2.0869358984643396e-05, - "loss": 2.3198, - "step": 334090 - }, - { - "epoch": 0.58, - "learning_rate": 2.0868487044716566e-05, - "loss": 2.3355, - "step": 334100 - }, - { - "epoch": 0.58, - "learning_rate": 2.0867615104789744e-05, - "loss": 2.4243, - "step": 334110 - }, - { - "epoch": 0.58, - "learning_rate": 2.0866743164862914e-05, - "loss": 2.3594, - "step": 334120 - }, - { - "epoch": 0.58, - "learning_rate": 2.0865871224936088e-05, - "loss": 2.2278, - "step": 334130 - }, - { - "epoch": 0.58, - "learning_rate": 2.086499928500926e-05, - "loss": 2.2839, - "step": 334140 - }, - { - "epoch": 0.58, - "learning_rate": 2.0864127345082435e-05, - "loss": 2.379, - "step": 334150 - }, - { - "epoch": 0.58, - "learning_rate": 2.086325540515561e-05, - "loss": 2.4181, - "step": 334160 - }, - { - "epoch": 0.58, - "learning_rate": 2.086238346522878e-05, - "loss": 2.3612, - "step": 334170 - }, - { - "epoch": 0.58, - "learning_rate": 2.0861511525301957e-05, - "loss": 2.2494, - "step": 334180 - }, - { - "epoch": 0.58, - "learning_rate": 2.0860639585375127e-05, - "loss": 2.3163, - "step": 334190 - }, - { - "epoch": 0.58, - "learning_rate": 2.08597676454483e-05, - "loss": 2.3904, - "step": 334200 - }, - { - "epoch": 0.58, - "learning_rate": 2.085889570552147e-05, - "loss": 2.2972, - "step": 334210 - }, - { - "epoch": 0.58, - "learning_rate": 2.0858023765594648e-05, - "loss": 2.412, - "step": 334220 - }, - { - "epoch": 0.58, - "learning_rate": 2.085715182566782e-05, - "loss": 2.4625, - "step": 334230 - }, - { - "epoch": 0.58, - "learning_rate": 2.0856279885740992e-05, - "loss": 2.3629, - "step": 334240 - }, - { - "epoch": 0.58, - "learning_rate": 2.0855407945814166e-05, - "loss": 2.3118, - "step": 334250 - }, - { - "epoch": 0.58, - "learning_rate": 2.085453600588734e-05, - "loss": 2.2731, - "step": 334260 - }, - { - "epoch": 0.58, - "learning_rate": 2.0853664065960514e-05, - "loss": 2.299, - "step": 334270 - }, - { - "epoch": 0.58, - "learning_rate": 2.0852792126033684e-05, - "loss": 2.351, - "step": 334280 - }, - { - "epoch": 0.58, - "learning_rate": 2.085192018610686e-05, - "loss": 2.3262, - "step": 334290 - }, - { - "epoch": 0.58, - "learning_rate": 2.085104824618003e-05, - "loss": 2.32, - "step": 334300 - }, - { - "epoch": 0.58, - "learning_rate": 2.0850176306253205e-05, - "loss": 2.1992, - "step": 334310 - }, - { - "epoch": 0.58, - "learning_rate": 2.084930436632638e-05, - "loss": 2.337, - "step": 334320 - }, - { - "epoch": 0.58, - "learning_rate": 2.0848432426399553e-05, - "loss": 2.2603, - "step": 334330 - }, - { - "epoch": 0.58, - "learning_rate": 2.0847560486472727e-05, - "loss": 2.3826, - "step": 334340 - }, - { - "epoch": 0.58, - "learning_rate": 2.0846688546545897e-05, - "loss": 2.2297, - "step": 334350 - }, - { - "epoch": 0.58, - "learning_rate": 2.084581660661907e-05, - "loss": 2.2893, - "step": 334360 - }, - { - "epoch": 0.58, - "learning_rate": 2.0844944666692245e-05, - "loss": 2.4059, - "step": 334370 - }, - { - "epoch": 0.58, - "learning_rate": 2.084407272676542e-05, - "loss": 2.2102, - "step": 334380 - }, - { - "epoch": 0.58, - "learning_rate": 2.084320078683859e-05, - "loss": 2.2999, - "step": 334390 - }, - { - "epoch": 0.58, - "learning_rate": 2.0842328846911763e-05, - "loss": 2.1898, - "step": 334400 - }, - { - "epoch": 0.58, - "learning_rate": 2.084145690698494e-05, - "loss": 2.2384, - "step": 334410 - }, - { - "epoch": 0.58, - "learning_rate": 2.084058496705811e-05, - "loss": 2.3271, - "step": 334420 - }, - { - "epoch": 0.58, - "learning_rate": 2.0839713027131284e-05, - "loss": 2.279, - "step": 334430 - }, - { - "epoch": 0.58, - "learning_rate": 2.0838841087204458e-05, - "loss": 2.2065, - "step": 334440 - }, - { - "epoch": 0.58, - "learning_rate": 2.083796914727763e-05, - "loss": 2.4428, - "step": 334450 - }, - { - "epoch": 0.58, - "learning_rate": 2.0837097207350802e-05, - "loss": 2.3192, - "step": 334460 - }, - { - "epoch": 0.58, - "learning_rate": 2.0836225267423976e-05, - "loss": 2.3101, - "step": 334470 - }, - { - "epoch": 0.58, - "learning_rate": 2.083535332749715e-05, - "loss": 2.3376, - "step": 334480 - }, - { - "epoch": 0.58, - "learning_rate": 2.0834481387570323e-05, - "loss": 2.3738, - "step": 334490 - }, - { - "epoch": 0.58, - "learning_rate": 2.0833609447643497e-05, - "loss": 2.3364, - "step": 334500 - }, - { - "epoch": 0.58, - "learning_rate": 2.0832737507716667e-05, - "loss": 2.4187, - "step": 334510 - }, - { - "epoch": 0.58, - "learning_rate": 2.0831865567789844e-05, - "loss": 2.3209, - "step": 334520 - }, - { - "epoch": 0.58, - "learning_rate": 2.0830993627863015e-05, - "loss": 2.4048, - "step": 334530 - }, - { - "epoch": 0.58, - "learning_rate": 2.083012168793619e-05, - "loss": 2.3419, - "step": 334540 - }, - { - "epoch": 0.58, - "learning_rate": 2.0829249748009362e-05, - "loss": 2.3729, - "step": 334550 - }, - { - "epoch": 0.58, - "learning_rate": 2.0828377808082536e-05, - "loss": 2.3592, - "step": 334560 - }, - { - "epoch": 0.58, - "learning_rate": 2.082750586815571e-05, - "loss": 2.2149, - "step": 334570 - }, - { - "epoch": 0.58, - "learning_rate": 2.082663392822888e-05, - "loss": 2.4603, - "step": 334580 - }, - { - "epoch": 0.58, - "learning_rate": 2.0825761988302057e-05, - "loss": 2.3539, - "step": 334590 - }, - { - "epoch": 0.58, - "learning_rate": 2.0824890048375228e-05, - "loss": 2.2936, - "step": 334600 - }, - { - "epoch": 0.58, - "learning_rate": 2.08240181084484e-05, - "loss": 2.3485, - "step": 334610 - }, - { - "epoch": 0.58, - "learning_rate": 2.0823146168521572e-05, - "loss": 2.3267, - "step": 334620 - }, - { - "epoch": 0.58, - "learning_rate": 2.082227422859475e-05, - "loss": 2.3017, - "step": 334630 - }, - { - "epoch": 0.58, - "learning_rate": 2.082140228866792e-05, - "loss": 2.4247, - "step": 334640 - }, - { - "epoch": 0.58, - "learning_rate": 2.0820530348741093e-05, - "loss": 2.2992, - "step": 334650 - }, - { - "epoch": 0.58, - "learning_rate": 2.0819658408814267e-05, - "loss": 2.351, - "step": 334660 - }, - { - "epoch": 0.58, - "learning_rate": 2.081878646888744e-05, - "loss": 2.3601, - "step": 334670 - }, - { - "epoch": 0.58, - "learning_rate": 2.0817914528960615e-05, - "loss": 2.3474, - "step": 334680 - }, - { - "epoch": 0.58, - "learning_rate": 2.0817042589033785e-05, - "loss": 2.371, - "step": 334690 - }, - { - "epoch": 0.58, - "learning_rate": 2.0816170649106962e-05, - "loss": 2.3246, - "step": 334700 - }, - { - "epoch": 0.58, - "learning_rate": 2.0815298709180132e-05, - "loss": 2.3957, - "step": 334710 - }, - { - "epoch": 0.58, - "learning_rate": 2.0814426769253306e-05, - "loss": 2.2845, - "step": 334720 - }, - { - "epoch": 0.58, - "learning_rate": 2.081355482932648e-05, - "loss": 2.2759, - "step": 334730 - }, - { - "epoch": 0.58, - "learning_rate": 2.0812682889399654e-05, - "loss": 2.303, - "step": 334740 - }, - { - "epoch": 0.58, - "learning_rate": 2.0811810949472828e-05, - "loss": 2.2845, - "step": 334750 - }, - { - "epoch": 0.58, - "learning_rate": 2.0810939009545998e-05, - "loss": 2.4192, - "step": 334760 - }, - { - "epoch": 0.58, - "learning_rate": 2.081006706961917e-05, - "loss": 2.3347, - "step": 334770 - }, - { - "epoch": 0.58, - "learning_rate": 2.0809195129692345e-05, - "loss": 2.3345, - "step": 334780 - }, - { - "epoch": 0.58, - "learning_rate": 2.080832318976552e-05, - "loss": 2.2909, - "step": 334790 - }, - { - "epoch": 0.58, - "learning_rate": 2.0807451249838693e-05, - "loss": 2.3448, - "step": 334800 - }, - { - "epoch": 0.58, - "learning_rate": 2.0806579309911867e-05, - "loss": 2.3763, - "step": 334810 - }, - { - "epoch": 0.58, - "learning_rate": 2.080570736998504e-05, - "loss": 2.2592, - "step": 334820 - }, - { - "epoch": 0.58, - "learning_rate": 2.080483543005821e-05, - "loss": 2.3448, - "step": 334830 - }, - { - "epoch": 0.58, - "learning_rate": 2.0803963490131385e-05, - "loss": 2.1708, - "step": 334840 - }, - { - "epoch": 0.58, - "learning_rate": 2.080309155020456e-05, - "loss": 2.2902, - "step": 334850 - }, - { - "epoch": 0.58, - "learning_rate": 2.0802219610277732e-05, - "loss": 2.3207, - "step": 334860 - }, - { - "epoch": 0.58, - "learning_rate": 2.0801347670350903e-05, - "loss": 2.3918, - "step": 334870 - }, - { - "epoch": 0.58, - "learning_rate": 2.0800475730424076e-05, - "loss": 2.3468, - "step": 334880 - }, - { - "epoch": 0.58, - "learning_rate": 2.0799603790497254e-05, - "loss": 2.2199, - "step": 334890 - }, - { - "epoch": 0.58, - "learning_rate": 2.0798731850570424e-05, - "loss": 2.3629, - "step": 334900 - }, - { - "epoch": 0.58, - "learning_rate": 2.0797859910643598e-05, - "loss": 2.2944, - "step": 334910 - }, - { - "epoch": 0.58, - "learning_rate": 2.0796987970716768e-05, - "loss": 2.2509, - "step": 334920 - }, - { - "epoch": 0.58, - "learning_rate": 2.0796116030789945e-05, - "loss": 2.3374, - "step": 334930 - }, - { - "epoch": 0.58, - "learning_rate": 2.0795244090863116e-05, - "loss": 2.3429, - "step": 334940 - }, - { - "epoch": 0.58, - "learning_rate": 2.079437215093629e-05, - "loss": 2.4328, - "step": 334950 - }, - { - "epoch": 0.58, - "learning_rate": 2.0793500211009463e-05, - "loss": 2.3492, - "step": 334960 - }, - { - "epoch": 0.58, - "learning_rate": 2.0792628271082637e-05, - "loss": 2.3207, - "step": 334970 - }, - { - "epoch": 0.58, - "learning_rate": 2.079175633115581e-05, - "loss": 2.3817, - "step": 334980 - }, - { - "epoch": 0.58, - "learning_rate": 2.079088439122898e-05, - "loss": 2.3086, - "step": 334990 - }, - { - "epoch": 0.58, - "learning_rate": 2.0790012451302158e-05, - "loss": 2.3872, - "step": 335000 - }, - { - "epoch": 0.58, - "learning_rate": 2.078914051137533e-05, - "loss": 2.2607, - "step": 335010 - }, - { - "epoch": 0.58, - "learning_rate": 2.0788268571448502e-05, - "loss": 2.4312, - "step": 335020 - }, - { - "epoch": 0.58, - "learning_rate": 2.0787396631521676e-05, - "loss": 2.2673, - "step": 335030 - }, - { - "epoch": 0.58, - "learning_rate": 2.078652469159485e-05, - "loss": 2.3064, - "step": 335040 - }, - { - "epoch": 0.58, - "learning_rate": 2.0785652751668024e-05, - "loss": 2.4369, - "step": 335050 - }, - { - "epoch": 0.58, - "learning_rate": 2.0784780811741194e-05, - "loss": 2.4757, - "step": 335060 - }, - { - "epoch": 0.58, - "learning_rate": 2.078390887181437e-05, - "loss": 2.3024, - "step": 335070 - }, - { - "epoch": 0.58, - "learning_rate": 2.078303693188754e-05, - "loss": 2.3128, - "step": 335080 - }, - { - "epoch": 0.58, - "learning_rate": 2.0782164991960715e-05, - "loss": 2.3463, - "step": 335090 - }, - { - "epoch": 0.58, - "learning_rate": 2.0781293052033886e-05, - "loss": 2.3516, - "step": 335100 - }, - { - "epoch": 0.58, - "learning_rate": 2.0780421112107063e-05, - "loss": 2.3399, - "step": 335110 - }, - { - "epoch": 0.58, - "learning_rate": 2.0779549172180233e-05, - "loss": 2.319, - "step": 335120 - }, - { - "epoch": 0.58, - "learning_rate": 2.0778677232253407e-05, - "loss": 2.3536, - "step": 335130 - }, - { - "epoch": 0.58, - "learning_rate": 2.077780529232658e-05, - "loss": 2.3927, - "step": 335140 - }, - { - "epoch": 0.58, - "learning_rate": 2.0776933352399755e-05, - "loss": 2.3876, - "step": 335150 - }, - { - "epoch": 0.58, - "learning_rate": 2.077606141247293e-05, - "loss": 2.3012, - "step": 335160 - }, - { - "epoch": 0.58, - "learning_rate": 2.07751894725461e-05, - "loss": 2.2235, - "step": 335170 - }, - { - "epoch": 0.58, - "learning_rate": 2.0774317532619273e-05, - "loss": 2.3498, - "step": 335180 - }, - { - "epoch": 0.58, - "learning_rate": 2.0773445592692446e-05, - "loss": 2.2996, - "step": 335190 - }, - { - "epoch": 0.58, - "learning_rate": 2.077257365276562e-05, - "loss": 2.4026, - "step": 335200 - }, - { - "epoch": 0.58, - "learning_rate": 2.0771701712838794e-05, - "loss": 2.3166, - "step": 335210 - }, - { - "epoch": 0.58, - "learning_rate": 2.0770829772911968e-05, - "loss": 2.301, - "step": 335220 - }, - { - "epoch": 0.58, - "learning_rate": 2.076995783298514e-05, - "loss": 2.3005, - "step": 335230 - }, - { - "epoch": 0.58, - "learning_rate": 2.0769085893058312e-05, - "loss": 2.4258, - "step": 335240 - }, - { - "epoch": 0.58, - "learning_rate": 2.0768213953131486e-05, - "loss": 2.2285, - "step": 335250 - }, - { - "epoch": 0.58, - "learning_rate": 2.076734201320466e-05, - "loss": 2.3316, - "step": 335260 - }, - { - "epoch": 0.58, - "learning_rate": 2.0766470073277833e-05, - "loss": 2.3859, - "step": 335270 - }, - { - "epoch": 0.58, - "learning_rate": 2.0765598133351007e-05, - "loss": 2.4325, - "step": 335280 - }, - { - "epoch": 0.58, - "learning_rate": 2.0764726193424177e-05, - "loss": 2.3072, - "step": 335290 - }, - { - "epoch": 0.58, - "learning_rate": 2.0763854253497354e-05, - "loss": 2.2772, - "step": 335300 - }, - { - "epoch": 0.58, - "learning_rate": 2.0762982313570525e-05, - "loss": 2.343, - "step": 335310 - }, - { - "epoch": 0.58, - "learning_rate": 2.07621103736437e-05, - "loss": 2.4244, - "step": 335320 - }, - { - "epoch": 0.58, - "learning_rate": 2.076123843371687e-05, - "loss": 2.3023, - "step": 335330 - }, - { - "epoch": 0.58, - "learning_rate": 2.0760366493790046e-05, - "loss": 2.2626, - "step": 335340 - }, - { - "epoch": 0.58, - "learning_rate": 2.0759494553863216e-05, - "loss": 2.3619, - "step": 335350 - }, - { - "epoch": 0.58, - "learning_rate": 2.075862261393639e-05, - "loss": 2.3963, - "step": 335360 - }, - { - "epoch": 0.58, - "learning_rate": 2.0757750674009564e-05, - "loss": 2.366, - "step": 335370 - }, - { - "epoch": 0.58, - "learning_rate": 2.0756878734082738e-05, - "loss": 2.3343, - "step": 335380 - }, - { - "epoch": 0.58, - "learning_rate": 2.075600679415591e-05, - "loss": 2.4781, - "step": 335390 - }, - { - "epoch": 0.58, - "learning_rate": 2.0755134854229082e-05, - "loss": 2.3679, - "step": 335400 - }, - { - "epoch": 0.58, - "learning_rate": 2.075426291430226e-05, - "loss": 2.3357, - "step": 335410 - }, - { - "epoch": 0.58, - "learning_rate": 2.075339097437543e-05, - "loss": 2.2023, - "step": 335420 - }, - { - "epoch": 0.58, - "learning_rate": 2.0752519034448603e-05, - "loss": 2.4257, - "step": 335430 - }, - { - "epoch": 0.58, - "learning_rate": 2.0751647094521777e-05, - "loss": 2.2535, - "step": 335440 - }, - { - "epoch": 0.58, - "learning_rate": 2.075077515459495e-05, - "loss": 2.374, - "step": 335450 - }, - { - "epoch": 0.59, - "learning_rate": 2.0749903214668125e-05, - "loss": 2.3577, - "step": 335460 - }, - { - "epoch": 0.59, - "learning_rate": 2.0749031274741295e-05, - "loss": 2.3867, - "step": 335470 - }, - { - "epoch": 0.59, - "learning_rate": 2.0748159334814472e-05, - "loss": 2.348, - "step": 335480 - }, - { - "epoch": 0.59, - "learning_rate": 2.0747287394887642e-05, - "loss": 2.4506, - "step": 335490 - }, - { - "epoch": 0.59, - "learning_rate": 2.0746415454960816e-05, - "loss": 2.2948, - "step": 335500 - }, - { - "epoch": 0.59, - "learning_rate": 2.074554351503399e-05, - "loss": 2.3799, - "step": 335510 - }, - { - "epoch": 0.59, - "learning_rate": 2.0744671575107164e-05, - "loss": 2.4495, - "step": 335520 - }, - { - "epoch": 0.59, - "learning_rate": 2.0743799635180338e-05, - "loss": 2.2764, - "step": 335530 - }, - { - "epoch": 0.59, - "learning_rate": 2.0742927695253508e-05, - "loss": 2.3828, - "step": 335540 - }, - { - "epoch": 0.59, - "learning_rate": 2.074205575532668e-05, - "loss": 2.3029, - "step": 335550 - }, - { - "epoch": 0.59, - "learning_rate": 2.0741183815399855e-05, - "loss": 2.4462, - "step": 335560 - }, - { - "epoch": 0.59, - "learning_rate": 2.074031187547303e-05, - "loss": 2.3669, - "step": 335570 - }, - { - "epoch": 0.59, - "learning_rate": 2.07394399355462e-05, - "loss": 2.3032, - "step": 335580 - }, - { - "epoch": 0.59, - "learning_rate": 2.0738567995619373e-05, - "loss": 2.2916, - "step": 335590 - }, - { - "epoch": 0.59, - "learning_rate": 2.0737696055692547e-05, - "loss": 2.4487, - "step": 335600 - }, - { - "epoch": 0.59, - "learning_rate": 2.073682411576572e-05, - "loss": 2.2746, - "step": 335610 - }, - { - "epoch": 0.59, - "learning_rate": 2.0735952175838895e-05, - "loss": 2.4127, - "step": 335620 - }, - { - "epoch": 0.59, - "learning_rate": 2.073508023591207e-05, - "loss": 2.2715, - "step": 335630 - }, - { - "epoch": 0.59, - "learning_rate": 2.0734208295985242e-05, - "loss": 2.2083, - "step": 335640 - }, - { - "epoch": 0.59, - "learning_rate": 2.0733336356058413e-05, - "loss": 2.3645, - "step": 335650 - }, - { - "epoch": 0.59, - "learning_rate": 2.0732464416131586e-05, - "loss": 2.5133, - "step": 335660 - }, - { - "epoch": 0.59, - "learning_rate": 2.073159247620476e-05, - "loss": 2.4126, - "step": 335670 - }, - { - "epoch": 0.59, - "learning_rate": 2.0730720536277934e-05, - "loss": 2.343, - "step": 335680 - }, - { - "epoch": 0.59, - "learning_rate": 2.0729848596351108e-05, - "loss": 2.3379, - "step": 335690 - }, - { - "epoch": 0.59, - "learning_rate": 2.0728976656424278e-05, - "loss": 2.384, - "step": 335700 - }, - { - "epoch": 0.59, - "learning_rate": 2.0728104716497455e-05, - "loss": 2.4826, - "step": 335710 - }, - { - "epoch": 0.59, - "learning_rate": 2.0727232776570626e-05, - "loss": 2.2203, - "step": 335720 - }, - { - "epoch": 0.59, - "learning_rate": 2.07263608366438e-05, - "loss": 2.4299, - "step": 335730 - }, - { - "epoch": 0.59, - "learning_rate": 2.0725488896716973e-05, - "loss": 2.3813, - "step": 335740 - }, - { - "epoch": 0.59, - "learning_rate": 2.0724616956790147e-05, - "loss": 2.2575, - "step": 335750 - }, - { - "epoch": 0.59, - "learning_rate": 2.072374501686332e-05, - "loss": 2.3208, - "step": 335760 - }, - { - "epoch": 0.59, - "learning_rate": 2.072287307693649e-05, - "loss": 2.4052, - "step": 335770 - }, - { - "epoch": 0.59, - "learning_rate": 2.0722001137009668e-05, - "loss": 2.3823, - "step": 335780 - }, - { - "epoch": 0.59, - "learning_rate": 2.072112919708284e-05, - "loss": 2.3302, - "step": 335790 - }, - { - "epoch": 0.59, - "learning_rate": 2.0720257257156012e-05, - "loss": 2.3747, - "step": 335800 - }, - { - "epoch": 0.59, - "learning_rate": 2.0719385317229183e-05, - "loss": 2.1454, - "step": 335810 - }, - { - "epoch": 0.59, - "learning_rate": 2.071851337730236e-05, - "loss": 2.2089, - "step": 335820 - }, - { - "epoch": 0.59, - "learning_rate": 2.071764143737553e-05, - "loss": 2.3209, - "step": 335830 - }, - { - "epoch": 0.59, - "learning_rate": 2.0716769497448704e-05, - "loss": 2.312, - "step": 335840 - }, - { - "epoch": 0.59, - "learning_rate": 2.0715897557521878e-05, - "loss": 2.2569, - "step": 335850 - }, - { - "epoch": 0.59, - "learning_rate": 2.071502561759505e-05, - "loss": 2.2446, - "step": 335860 - }, - { - "epoch": 0.59, - "learning_rate": 2.0714153677668225e-05, - "loss": 2.4188, - "step": 335870 - }, - { - "epoch": 0.59, - "learning_rate": 2.0713281737741396e-05, - "loss": 2.274, - "step": 335880 - }, - { - "epoch": 0.59, - "learning_rate": 2.0712409797814573e-05, - "loss": 2.3587, - "step": 335890 - }, - { - "epoch": 0.59, - "learning_rate": 2.0711537857887743e-05, - "loss": 2.4021, - "step": 335900 - }, - { - "epoch": 0.59, - "learning_rate": 2.0710665917960917e-05, - "loss": 2.3406, - "step": 335910 - }, - { - "epoch": 0.59, - "learning_rate": 2.070979397803409e-05, - "loss": 2.328, - "step": 335920 - }, - { - "epoch": 0.59, - "learning_rate": 2.0708922038107265e-05, - "loss": 2.3039, - "step": 335930 - }, - { - "epoch": 0.59, - "learning_rate": 2.070805009818044e-05, - "loss": 2.3327, - "step": 335940 - }, - { - "epoch": 0.59, - "learning_rate": 2.070717815825361e-05, - "loss": 2.2726, - "step": 335950 - }, - { - "epoch": 0.59, - "learning_rate": 2.0706306218326783e-05, - "loss": 2.2221, - "step": 335960 - }, - { - "epoch": 0.59, - "learning_rate": 2.0705434278399956e-05, - "loss": 2.3098, - "step": 335970 - }, - { - "epoch": 0.59, - "learning_rate": 2.070456233847313e-05, - "loss": 2.3903, - "step": 335980 - }, - { - "epoch": 0.59, - "learning_rate": 2.07036903985463e-05, - "loss": 2.2562, - "step": 335990 - }, - { - "epoch": 0.59, - "learning_rate": 2.0702818458619478e-05, - "loss": 2.285, - "step": 336000 - }, - { - "epoch": 0.59, - "learning_rate": 2.070194651869265e-05, - "loss": 2.3275, - "step": 336010 - }, - { - "epoch": 0.59, - "learning_rate": 2.0701074578765822e-05, - "loss": 2.3549, - "step": 336020 - }, - { - "epoch": 0.59, - "learning_rate": 2.0700202638838996e-05, - "loss": 2.33, - "step": 336030 - }, - { - "epoch": 0.59, - "learning_rate": 2.069933069891217e-05, - "loss": 2.2892, - "step": 336040 - }, - { - "epoch": 0.59, - "learning_rate": 2.0698458758985343e-05, - "loss": 2.3973, - "step": 336050 - }, - { - "epoch": 0.59, - "learning_rate": 2.0697586819058513e-05, - "loss": 2.3359, - "step": 336060 - }, - { - "epoch": 0.59, - "learning_rate": 2.0696714879131687e-05, - "loss": 2.3729, - "step": 336070 - }, - { - "epoch": 0.59, - "learning_rate": 2.069584293920486e-05, - "loss": 2.3096, - "step": 336080 - }, - { - "epoch": 0.59, - "learning_rate": 2.0694970999278035e-05, - "loss": 2.2917, - "step": 336090 - }, - { - "epoch": 0.59, - "learning_rate": 2.069409905935121e-05, - "loss": 2.3664, - "step": 336100 - }, - { - "epoch": 0.59, - "learning_rate": 2.069322711942438e-05, - "loss": 2.3047, - "step": 336110 - }, - { - "epoch": 0.59, - "learning_rate": 2.0692355179497556e-05, - "loss": 2.2458, - "step": 336120 - }, - { - "epoch": 0.59, - "learning_rate": 2.0691483239570726e-05, - "loss": 2.246, - "step": 336130 - }, - { - "epoch": 0.59, - "learning_rate": 2.06906112996439e-05, - "loss": 2.2462, - "step": 336140 - }, - { - "epoch": 0.59, - "learning_rate": 2.0689739359717074e-05, - "loss": 2.2707, - "step": 336150 - }, - { - "epoch": 0.59, - "learning_rate": 2.0688867419790248e-05, - "loss": 2.3644, - "step": 336160 - }, - { - "epoch": 0.59, - "learning_rate": 2.068799547986342e-05, - "loss": 2.3219, - "step": 336170 - }, - { - "epoch": 0.59, - "learning_rate": 2.0687123539936592e-05, - "loss": 2.2721, - "step": 336180 - }, - { - "epoch": 0.59, - "learning_rate": 2.068625160000977e-05, - "loss": 2.478, - "step": 336190 - }, - { - "epoch": 0.59, - "learning_rate": 2.068537966008294e-05, - "loss": 2.3561, - "step": 336200 - }, - { - "epoch": 0.59, - "learning_rate": 2.0684507720156113e-05, - "loss": 2.3587, - "step": 336210 - }, - { - "epoch": 0.59, - "learning_rate": 2.0683635780229284e-05, - "loss": 2.3655, - "step": 336220 - }, - { - "epoch": 0.59, - "learning_rate": 2.068276384030246e-05, - "loss": 2.3361, - "step": 336230 - }, - { - "epoch": 0.59, - "learning_rate": 2.0681891900375635e-05, - "loss": 2.3005, - "step": 336240 - }, - { - "epoch": 0.59, - "learning_rate": 2.0681019960448805e-05, - "loss": 2.392, - "step": 336250 - }, - { - "epoch": 0.59, - "learning_rate": 2.068014802052198e-05, - "loss": 2.3332, - "step": 336260 - }, - { - "epoch": 0.59, - "learning_rate": 2.0679276080595152e-05, - "loss": 2.3854, - "step": 336270 - }, - { - "epoch": 0.59, - "learning_rate": 2.0678404140668326e-05, - "loss": 2.3912, - "step": 336280 - }, - { - "epoch": 0.59, - "learning_rate": 2.0677532200741497e-05, - "loss": 2.3918, - "step": 336290 - }, - { - "epoch": 0.59, - "learning_rate": 2.0676660260814674e-05, - "loss": 2.3691, - "step": 336300 - }, - { - "epoch": 0.59, - "learning_rate": 2.0675788320887844e-05, - "loss": 2.3311, - "step": 336310 - }, - { - "epoch": 0.59, - "learning_rate": 2.0674916380961018e-05, - "loss": 2.2325, - "step": 336320 - }, - { - "epoch": 0.59, - "learning_rate": 2.067404444103419e-05, - "loss": 2.4171, - "step": 336330 - }, - { - "epoch": 0.59, - "learning_rate": 2.0673172501107365e-05, - "loss": 2.2711, - "step": 336340 - }, - { - "epoch": 0.59, - "learning_rate": 2.067230056118054e-05, - "loss": 2.2987, - "step": 336350 - }, - { - "epoch": 0.59, - "learning_rate": 2.067142862125371e-05, - "loss": 2.3483, - "step": 336360 - }, - { - "epoch": 0.59, - "learning_rate": 2.0670556681326883e-05, - "loss": 2.2702, - "step": 336370 - }, - { - "epoch": 0.59, - "learning_rate": 2.0669684741400057e-05, - "loss": 2.3487, - "step": 336380 - }, - { - "epoch": 0.59, - "learning_rate": 2.066881280147323e-05, - "loss": 2.3668, - "step": 336390 - }, - { - "epoch": 0.59, - "learning_rate": 2.0667940861546405e-05, - "loss": 2.3, - "step": 336400 - }, - { - "epoch": 0.59, - "learning_rate": 2.066706892161958e-05, - "loss": 2.3559, - "step": 336410 - }, - { - "epoch": 0.59, - "learning_rate": 2.0666196981692752e-05, - "loss": 2.2485, - "step": 336420 - }, - { - "epoch": 0.59, - "learning_rate": 2.0665325041765923e-05, - "loss": 2.3504, - "step": 336430 - }, - { - "epoch": 0.59, - "learning_rate": 2.0664453101839096e-05, - "loss": 2.2661, - "step": 336440 - }, - { - "epoch": 0.59, - "learning_rate": 2.066358116191227e-05, - "loss": 2.2942, - "step": 336450 - }, - { - "epoch": 0.59, - "learning_rate": 2.0662709221985444e-05, - "loss": 2.3675, - "step": 336460 - }, - { - "epoch": 0.59, - "learning_rate": 2.0661837282058614e-05, - "loss": 2.3895, - "step": 336470 - }, - { - "epoch": 0.59, - "learning_rate": 2.0660965342131788e-05, - "loss": 2.2963, - "step": 336480 - }, - { - "epoch": 0.59, - "learning_rate": 2.0660093402204965e-05, - "loss": 2.2954, - "step": 336490 - }, - { - "epoch": 0.59, - "learning_rate": 2.0659221462278136e-05, - "loss": 2.3414, - "step": 336500 - }, - { - "epoch": 0.59, - "learning_rate": 2.065834952235131e-05, - "loss": 2.3208, - "step": 336510 - }, - { - "epoch": 0.59, - "learning_rate": 2.065747758242448e-05, - "loss": 2.3371, - "step": 336520 - }, - { - "epoch": 0.59, - "learning_rate": 2.0656605642497657e-05, - "loss": 2.2729, - "step": 336530 - }, - { - "epoch": 0.59, - "learning_rate": 2.0655733702570827e-05, - "loss": 2.3574, - "step": 336540 - }, - { - "epoch": 0.59, - "learning_rate": 2.0654861762644e-05, - "loss": 2.3453, - "step": 336550 - }, - { - "epoch": 0.59, - "learning_rate": 2.0653989822717175e-05, - "loss": 2.3284, - "step": 336560 - }, - { - "epoch": 0.59, - "learning_rate": 2.065311788279035e-05, - "loss": 2.2426, - "step": 336570 - }, - { - "epoch": 0.59, - "learning_rate": 2.0652245942863522e-05, - "loss": 2.288, - "step": 336580 - }, - { - "epoch": 0.59, - "learning_rate": 2.0651374002936693e-05, - "loss": 2.3182, - "step": 336590 - }, - { - "epoch": 0.59, - "learning_rate": 2.065050206300987e-05, - "loss": 2.3341, - "step": 336600 - }, - { - "epoch": 0.59, - "learning_rate": 2.064963012308304e-05, - "loss": 2.2939, - "step": 336610 - }, - { - "epoch": 0.59, - "learning_rate": 2.0648758183156214e-05, - "loss": 2.2639, - "step": 336620 - }, - { - "epoch": 0.59, - "learning_rate": 2.0647886243229388e-05, - "loss": 2.3278, - "step": 336630 - }, - { - "epoch": 0.59, - "learning_rate": 2.064701430330256e-05, - "loss": 2.2063, - "step": 336640 - }, - { - "epoch": 0.59, - "learning_rate": 2.0646142363375735e-05, - "loss": 2.312, - "step": 336650 - }, - { - "epoch": 0.59, - "learning_rate": 2.0645270423448906e-05, - "loss": 2.3383, - "step": 336660 - }, - { - "epoch": 0.59, - "learning_rate": 2.0644398483522083e-05, - "loss": 2.3101, - "step": 336670 - }, - { - "epoch": 0.59, - "learning_rate": 2.0643526543595253e-05, - "loss": 2.3627, - "step": 336680 - }, - { - "epoch": 0.59, - "learning_rate": 2.0642654603668427e-05, - "loss": 2.3509, - "step": 336690 - }, - { - "epoch": 0.59, - "learning_rate": 2.0641782663741597e-05, - "loss": 2.338, - "step": 336700 - }, - { - "epoch": 0.59, - "learning_rate": 2.0640910723814775e-05, - "loss": 2.2813, - "step": 336710 - }, - { - "epoch": 0.59, - "learning_rate": 2.0640038783887945e-05, - "loss": 2.2847, - "step": 336720 - }, - { - "epoch": 0.59, - "learning_rate": 2.063916684396112e-05, - "loss": 2.384, - "step": 336730 - }, - { - "epoch": 0.59, - "learning_rate": 2.0638294904034293e-05, - "loss": 2.3851, - "step": 336740 - }, - { - "epoch": 0.59, - "learning_rate": 2.0637422964107466e-05, - "loss": 2.3719, - "step": 336750 - }, - { - "epoch": 0.59, - "learning_rate": 2.063655102418064e-05, - "loss": 2.4496, - "step": 336760 - }, - { - "epoch": 0.59, - "learning_rate": 2.063567908425381e-05, - "loss": 2.3137, - "step": 336770 - }, - { - "epoch": 0.59, - "learning_rate": 2.0634807144326984e-05, - "loss": 2.2099, - "step": 336780 - }, - { - "epoch": 0.59, - "learning_rate": 2.0633935204400158e-05, - "loss": 2.4212, - "step": 336790 - }, - { - "epoch": 0.59, - "learning_rate": 2.0633063264473332e-05, - "loss": 2.3354, - "step": 336800 - }, - { - "epoch": 0.59, - "learning_rate": 2.0632191324546506e-05, - "loss": 2.3506, - "step": 336810 - }, - { - "epoch": 0.59, - "learning_rate": 2.063131938461968e-05, - "loss": 2.475, - "step": 336820 - }, - { - "epoch": 0.59, - "learning_rate": 2.0630447444692853e-05, - "loss": 2.3702, - "step": 336830 - }, - { - "epoch": 0.59, - "learning_rate": 2.0629575504766023e-05, - "loss": 2.3434, - "step": 336840 - }, - { - "epoch": 0.59, - "learning_rate": 2.0628703564839197e-05, - "loss": 2.4181, - "step": 336850 - }, - { - "epoch": 0.59, - "learning_rate": 2.062783162491237e-05, - "loss": 2.2173, - "step": 336860 - }, - { - "epoch": 0.59, - "learning_rate": 2.0626959684985545e-05, - "loss": 2.2848, - "step": 336870 - }, - { - "epoch": 0.59, - "learning_rate": 2.062608774505872e-05, - "loss": 2.2973, - "step": 336880 - }, - { - "epoch": 0.59, - "learning_rate": 2.062521580513189e-05, - "loss": 2.398, - "step": 336890 - }, - { - "epoch": 0.59, - "learning_rate": 2.0624343865205066e-05, - "loss": 2.2426, - "step": 336900 - }, - { - "epoch": 0.59, - "learning_rate": 2.0623471925278236e-05, - "loss": 2.4089, - "step": 336910 - }, - { - "epoch": 0.59, - "learning_rate": 2.062259998535141e-05, - "loss": 2.3535, - "step": 336920 - }, - { - "epoch": 0.59, - "learning_rate": 2.062172804542458e-05, - "loss": 2.3016, - "step": 336930 - }, - { - "epoch": 0.59, - "learning_rate": 2.0620856105497758e-05, - "loss": 2.3801, - "step": 336940 - }, - { - "epoch": 0.59, - "learning_rate": 2.0619984165570928e-05, - "loss": 2.3618, - "step": 336950 - }, - { - "epoch": 0.59, - "learning_rate": 2.0619112225644102e-05, - "loss": 2.4325, - "step": 336960 - }, - { - "epoch": 0.59, - "learning_rate": 2.061824028571728e-05, - "loss": 2.3608, - "step": 336970 - }, - { - "epoch": 0.59, - "learning_rate": 2.061736834579045e-05, - "loss": 2.3454, - "step": 336980 - }, - { - "epoch": 0.59, - "learning_rate": 2.0616496405863623e-05, - "loss": 2.5388, - "step": 336990 - }, - { - "epoch": 0.59, - "learning_rate": 2.0615624465936794e-05, - "loss": 2.2774, - "step": 337000 - }, - { - "epoch": 0.59, - "learning_rate": 2.061475252600997e-05, - "loss": 2.3326, - "step": 337010 - }, - { - "epoch": 0.59, - "learning_rate": 2.061388058608314e-05, - "loss": 2.2196, - "step": 337020 - }, - { - "epoch": 0.59, - "learning_rate": 2.0613008646156315e-05, - "loss": 2.2216, - "step": 337030 - }, - { - "epoch": 0.59, - "learning_rate": 2.061213670622949e-05, - "loss": 2.4363, - "step": 337040 - }, - { - "epoch": 0.59, - "learning_rate": 2.0611264766302662e-05, - "loss": 2.3805, - "step": 337050 - }, - { - "epoch": 0.59, - "learning_rate": 2.0610392826375836e-05, - "loss": 2.1664, - "step": 337060 - }, - { - "epoch": 0.59, - "learning_rate": 2.0609520886449007e-05, - "loss": 2.3097, - "step": 337070 - }, - { - "epoch": 0.59, - "learning_rate": 2.0608648946522184e-05, - "loss": 2.3323, - "step": 337080 - }, - { - "epoch": 0.59, - "learning_rate": 2.0607777006595354e-05, - "loss": 2.2812, - "step": 337090 - }, - { - "epoch": 0.59, - "learning_rate": 2.0606905066668528e-05, - "loss": 2.3378, - "step": 337100 - }, - { - "epoch": 0.59, - "learning_rate": 2.06060331267417e-05, - "loss": 2.3914, - "step": 337110 - }, - { - "epoch": 0.59, - "learning_rate": 2.0605161186814875e-05, - "loss": 2.2508, - "step": 337120 - }, - { - "epoch": 0.59, - "learning_rate": 2.060428924688805e-05, - "loss": 2.4147, - "step": 337130 - }, - { - "epoch": 0.59, - "learning_rate": 2.060341730696122e-05, - "loss": 2.1675, - "step": 337140 - }, - { - "epoch": 0.59, - "learning_rate": 2.0602545367034393e-05, - "loss": 2.2828, - "step": 337150 - }, - { - "epoch": 0.59, - "learning_rate": 2.0601673427107567e-05, - "loss": 2.3492, - "step": 337160 - }, - { - "epoch": 0.59, - "learning_rate": 2.060080148718074e-05, - "loss": 2.3558, - "step": 337170 - }, - { - "epoch": 0.59, - "learning_rate": 2.059992954725391e-05, - "loss": 2.3009, - "step": 337180 - }, - { - "epoch": 0.59, - "learning_rate": 2.0599057607327085e-05, - "loss": 2.2031, - "step": 337190 - }, - { - "epoch": 0.59, - "learning_rate": 2.059818566740026e-05, - "loss": 2.2927, - "step": 337200 - }, - { - "epoch": 0.59, - "learning_rate": 2.0597313727473433e-05, - "loss": 2.3941, - "step": 337210 - }, - { - "epoch": 0.59, - "learning_rate": 2.0596441787546606e-05, - "loss": 2.3459, - "step": 337220 - }, - { - "epoch": 0.59, - "learning_rate": 2.059556984761978e-05, - "loss": 2.2863, - "step": 337230 - }, - { - "epoch": 0.59, - "learning_rate": 2.0594697907692954e-05, - "loss": 2.3058, - "step": 337240 - }, - { - "epoch": 0.59, - "learning_rate": 2.0593825967766124e-05, - "loss": 2.3676, - "step": 337250 - }, - { - "epoch": 0.59, - "learning_rate": 2.0592954027839298e-05, - "loss": 2.3301, - "step": 337260 - }, - { - "epoch": 0.59, - "learning_rate": 2.0592082087912472e-05, - "loss": 2.2507, - "step": 337270 - }, - { - "epoch": 0.59, - "learning_rate": 2.0591210147985646e-05, - "loss": 2.3575, - "step": 337280 - }, - { - "epoch": 0.59, - "learning_rate": 2.059033820805882e-05, - "loss": 2.2905, - "step": 337290 - }, - { - "epoch": 0.59, - "learning_rate": 2.058946626813199e-05, - "loss": 2.3005, - "step": 337300 - }, - { - "epoch": 0.59, - "learning_rate": 2.0588594328205167e-05, - "loss": 2.3497, - "step": 337310 - }, - { - "epoch": 0.59, - "learning_rate": 2.0587722388278337e-05, - "loss": 2.4457, - "step": 337320 - }, - { - "epoch": 0.59, - "learning_rate": 2.058685044835151e-05, - "loss": 2.2952, - "step": 337330 - }, - { - "epoch": 0.59, - "learning_rate": 2.0585978508424685e-05, - "loss": 2.4518, - "step": 337340 - }, - { - "epoch": 0.59, - "learning_rate": 2.058510656849786e-05, - "loss": 2.3612, - "step": 337350 - }, - { - "epoch": 0.59, - "learning_rate": 2.0584234628571032e-05, - "loss": 2.3498, - "step": 337360 - }, - { - "epoch": 0.59, - "learning_rate": 2.0583362688644203e-05, - "loss": 2.2937, - "step": 337370 - }, - { - "epoch": 0.59, - "learning_rate": 2.058249074871738e-05, - "loss": 2.3464, - "step": 337380 - }, - { - "epoch": 0.59, - "learning_rate": 2.058161880879055e-05, - "loss": 2.3577, - "step": 337390 - }, - { - "epoch": 0.59, - "learning_rate": 2.0580746868863724e-05, - "loss": 2.4046, - "step": 337400 - }, - { - "epoch": 0.59, - "learning_rate": 2.0579874928936894e-05, - "loss": 2.4094, - "step": 337410 - }, - { - "epoch": 0.59, - "learning_rate": 2.057900298901007e-05, - "loss": 2.1753, - "step": 337420 - }, - { - "epoch": 0.59, - "learning_rate": 2.0578131049083242e-05, - "loss": 2.3331, - "step": 337430 - }, - { - "epoch": 0.59, - "learning_rate": 2.0577259109156416e-05, - "loss": 2.3079, - "step": 337440 - }, - { - "epoch": 0.59, - "learning_rate": 2.057638716922959e-05, - "loss": 2.3377, - "step": 337450 - }, - { - "epoch": 0.59, - "learning_rate": 2.0575515229302763e-05, - "loss": 2.3931, - "step": 337460 - }, - { - "epoch": 0.59, - "learning_rate": 2.0574643289375937e-05, - "loss": 2.2818, - "step": 337470 - }, - { - "epoch": 0.59, - "learning_rate": 2.0573771349449107e-05, - "loss": 2.2985, - "step": 337480 - }, - { - "epoch": 0.59, - "learning_rate": 2.0572899409522285e-05, - "loss": 2.2765, - "step": 337490 - }, - { - "epoch": 0.59, - "learning_rate": 2.0572027469595455e-05, - "loss": 2.2953, - "step": 337500 - }, - { - "epoch": 0.59, - "learning_rate": 2.057115552966863e-05, - "loss": 2.2476, - "step": 337510 - }, - { - "epoch": 0.59, - "learning_rate": 2.0570283589741803e-05, - "loss": 2.4119, - "step": 337520 - }, - { - "epoch": 0.59, - "learning_rate": 2.0569411649814976e-05, - "loss": 2.2611, - "step": 337530 - }, - { - "epoch": 0.59, - "learning_rate": 2.056853970988815e-05, - "loss": 2.4205, - "step": 337540 - }, - { - "epoch": 0.59, - "learning_rate": 2.056766776996132e-05, - "loss": 2.3137, - "step": 337550 - }, - { - "epoch": 0.59, - "learning_rate": 2.0566795830034494e-05, - "loss": 2.4246, - "step": 337560 - }, - { - "epoch": 0.59, - "learning_rate": 2.0565923890107668e-05, - "loss": 2.3443, - "step": 337570 - }, - { - "epoch": 0.59, - "learning_rate": 2.0565051950180842e-05, - "loss": 2.2561, - "step": 337580 - }, - { - "epoch": 0.59, - "learning_rate": 2.0564180010254016e-05, - "loss": 2.4313, - "step": 337590 - }, - { - "epoch": 0.59, - "learning_rate": 2.056330807032719e-05, - "loss": 2.4016, - "step": 337600 - }, - { - "epoch": 0.59, - "learning_rate": 2.0562436130400363e-05, - "loss": 2.3139, - "step": 337610 - }, - { - "epoch": 0.59, - "learning_rate": 2.0561564190473533e-05, - "loss": 2.1904, - "step": 337620 - }, - { - "epoch": 0.59, - "learning_rate": 2.0560692250546707e-05, - "loss": 2.3532, - "step": 337630 - }, - { - "epoch": 0.59, - "learning_rate": 2.055982031061988e-05, - "loss": 2.3578, - "step": 337640 - }, - { - "epoch": 0.59, - "learning_rate": 2.0558948370693055e-05, - "loss": 2.3194, - "step": 337650 - }, - { - "epoch": 0.59, - "learning_rate": 2.0558076430766225e-05, - "loss": 2.3152, - "step": 337660 - }, - { - "epoch": 0.59, - "learning_rate": 2.05572044908394e-05, - "loss": 2.4305, - "step": 337670 - }, - { - "epoch": 0.59, - "learning_rate": 2.0556332550912573e-05, - "loss": 2.4211, - "step": 337680 - }, - { - "epoch": 0.59, - "learning_rate": 2.0555460610985746e-05, - "loss": 2.3238, - "step": 337690 - }, - { - "epoch": 0.59, - "learning_rate": 2.055458867105892e-05, - "loss": 2.3169, - "step": 337700 - }, - { - "epoch": 0.59, - "learning_rate": 2.055371673113209e-05, - "loss": 2.3608, - "step": 337710 - }, - { - "epoch": 0.59, - "learning_rate": 2.0552844791205268e-05, - "loss": 2.4697, - "step": 337720 - }, - { - "epoch": 0.59, - "learning_rate": 2.0551972851278438e-05, - "loss": 2.217, - "step": 337730 - }, - { - "epoch": 0.59, - "learning_rate": 2.0551100911351612e-05, - "loss": 2.2556, - "step": 337740 - }, - { - "epoch": 0.59, - "learning_rate": 2.0550228971424786e-05, - "loss": 2.4138, - "step": 337750 - }, - { - "epoch": 0.59, - "learning_rate": 2.054935703149796e-05, - "loss": 2.3777, - "step": 337760 - }, - { - "epoch": 0.59, - "learning_rate": 2.0548485091571133e-05, - "loss": 2.4012, - "step": 337770 - }, - { - "epoch": 0.59, - "learning_rate": 2.0547613151644304e-05, - "loss": 2.3352, - "step": 337780 - }, - { - "epoch": 0.59, - "learning_rate": 2.054674121171748e-05, - "loss": 2.4596, - "step": 337790 - }, - { - "epoch": 0.59, - "learning_rate": 2.054586927179065e-05, - "loss": 2.4, - "step": 337800 - }, - { - "epoch": 0.59, - "learning_rate": 2.0544997331863825e-05, - "loss": 2.2689, - "step": 337810 - }, - { - "epoch": 0.59, - "learning_rate": 2.0544125391936995e-05, - "loss": 2.3449, - "step": 337820 - }, - { - "epoch": 0.59, - "learning_rate": 2.0543253452010172e-05, - "loss": 2.3583, - "step": 337830 - }, - { - "epoch": 0.59, - "learning_rate": 2.0542381512083346e-05, - "loss": 2.2992, - "step": 337840 - }, - { - "epoch": 0.59, - "learning_rate": 2.0541509572156517e-05, - "loss": 2.3472, - "step": 337850 - }, - { - "epoch": 0.59, - "learning_rate": 2.054063763222969e-05, - "loss": 2.395, - "step": 337860 - }, - { - "epoch": 0.59, - "learning_rate": 2.0539765692302864e-05, - "loss": 2.4164, - "step": 337870 - }, - { - "epoch": 0.59, - "learning_rate": 2.0538893752376038e-05, - "loss": 2.2504, - "step": 337880 - }, - { - "epoch": 0.59, - "learning_rate": 2.053802181244921e-05, - "loss": 2.2435, - "step": 337890 - }, - { - "epoch": 0.59, - "learning_rate": 2.0537149872522385e-05, - "loss": 2.4411, - "step": 337900 - }, - { - "epoch": 0.59, - "learning_rate": 2.0536277932595556e-05, - "loss": 2.4384, - "step": 337910 - }, - { - "epoch": 0.59, - "learning_rate": 2.053540599266873e-05, - "loss": 2.3965, - "step": 337920 - }, - { - "epoch": 0.59, - "learning_rate": 2.0534534052741903e-05, - "loss": 2.3504, - "step": 337930 - }, - { - "epoch": 0.59, - "learning_rate": 2.0533662112815077e-05, - "loss": 2.2414, - "step": 337940 - }, - { - "epoch": 0.59, - "learning_rate": 2.053279017288825e-05, - "loss": 2.3138, - "step": 337950 - }, - { - "epoch": 0.59, - "learning_rate": 2.053191823296142e-05, - "loss": 2.4171, - "step": 337960 - }, - { - "epoch": 0.59, - "learning_rate": 2.0531046293034595e-05, - "loss": 2.2983, - "step": 337970 - }, - { - "epoch": 0.59, - "learning_rate": 2.053017435310777e-05, - "loss": 2.2992, - "step": 337980 - }, - { - "epoch": 0.59, - "learning_rate": 2.0529302413180943e-05, - "loss": 2.35, - "step": 337990 - }, - { - "epoch": 0.59, - "learning_rate": 2.0528430473254116e-05, - "loss": 2.2002, - "step": 338000 - }, - { - "epoch": 0.59, - "learning_rate": 2.052755853332729e-05, - "loss": 2.3626, - "step": 338010 - }, - { - "epoch": 0.59, - "learning_rate": 2.0526686593400464e-05, - "loss": 2.2958, - "step": 338020 - }, - { - "epoch": 0.59, - "learning_rate": 2.0525814653473634e-05, - "loss": 2.4495, - "step": 338030 - }, - { - "epoch": 0.59, - "learning_rate": 2.0524942713546808e-05, - "loss": 2.3654, - "step": 338040 - }, - { - "epoch": 0.59, - "learning_rate": 2.0524070773619982e-05, - "loss": 2.3641, - "step": 338050 - }, - { - "epoch": 0.59, - "learning_rate": 2.0523198833693156e-05, - "loss": 2.2557, - "step": 338060 - }, - { - "epoch": 0.59, - "learning_rate": 2.0522326893766326e-05, - "loss": 2.3026, - "step": 338070 - }, - { - "epoch": 0.59, - "learning_rate": 2.05214549538395e-05, - "loss": 2.4836, - "step": 338080 - }, - { - "epoch": 0.59, - "learning_rate": 2.0520583013912677e-05, - "loss": 2.3843, - "step": 338090 - }, - { - "epoch": 0.59, - "learning_rate": 2.0519711073985847e-05, - "loss": 2.3269, - "step": 338100 - }, - { - "epoch": 0.59, - "learning_rate": 2.051883913405902e-05, - "loss": 2.2906, - "step": 338110 - }, - { - "epoch": 0.59, - "learning_rate": 2.051796719413219e-05, - "loss": 2.1633, - "step": 338120 - }, - { - "epoch": 0.59, - "learning_rate": 2.051709525420537e-05, - "loss": 2.3889, - "step": 338130 - }, - { - "epoch": 0.59, - "learning_rate": 2.051622331427854e-05, - "loss": 2.3214, - "step": 338140 - }, - { - "epoch": 0.59, - "learning_rate": 2.0515351374351713e-05, - "loss": 2.3289, - "step": 338150 - }, - { - "epoch": 0.59, - "learning_rate": 2.0514479434424887e-05, - "loss": 2.3302, - "step": 338160 - }, - { - "epoch": 0.59, - "learning_rate": 2.051360749449806e-05, - "loss": 2.3735, - "step": 338170 - }, - { - "epoch": 0.59, - "learning_rate": 2.0512735554571234e-05, - "loss": 2.2317, - "step": 338180 - }, - { - "epoch": 0.59, - "learning_rate": 2.0511863614644404e-05, - "loss": 2.4349, - "step": 338190 - }, - { - "epoch": 0.59, - "learning_rate": 2.051099167471758e-05, - "loss": 2.3051, - "step": 338200 - }, - { - "epoch": 0.59, - "learning_rate": 2.0510119734790752e-05, - "loss": 2.323, - "step": 338210 - }, - { - "epoch": 0.59, - "learning_rate": 2.0509247794863926e-05, - "loss": 2.3556, - "step": 338220 - }, - { - "epoch": 0.59, - "learning_rate": 2.05083758549371e-05, - "loss": 2.2918, - "step": 338230 - }, - { - "epoch": 0.59, - "learning_rate": 2.0507503915010273e-05, - "loss": 2.2994, - "step": 338240 - }, - { - "epoch": 0.59, - "learning_rate": 2.0506631975083447e-05, - "loss": 2.3722, - "step": 338250 - }, - { - "epoch": 0.59, - "learning_rate": 2.0505760035156617e-05, - "loss": 2.2436, - "step": 338260 - }, - { - "epoch": 0.59, - "learning_rate": 2.0504888095229795e-05, - "loss": 2.2651, - "step": 338270 - }, - { - "epoch": 0.59, - "learning_rate": 2.0504016155302965e-05, - "loss": 2.4471, - "step": 338280 - }, - { - "epoch": 0.59, - "learning_rate": 2.050314421537614e-05, - "loss": 2.3166, - "step": 338290 - }, - { - "epoch": 0.59, - "learning_rate": 2.050227227544931e-05, - "loss": 2.3708, - "step": 338300 - }, - { - "epoch": 0.59, - "learning_rate": 2.0501400335522486e-05, - "loss": 2.3614, - "step": 338310 - }, - { - "epoch": 0.59, - "learning_rate": 2.050052839559566e-05, - "loss": 2.287, - "step": 338320 - }, - { - "epoch": 0.59, - "learning_rate": 2.049965645566883e-05, - "loss": 2.2947, - "step": 338330 - }, - { - "epoch": 0.59, - "learning_rate": 2.0498784515742004e-05, - "loss": 2.3284, - "step": 338340 - }, - { - "epoch": 0.59, - "learning_rate": 2.0497912575815178e-05, - "loss": 2.3281, - "step": 338350 - }, - { - "epoch": 0.59, - "learning_rate": 2.0497040635888352e-05, - "loss": 2.3298, - "step": 338360 - }, - { - "epoch": 0.59, - "learning_rate": 2.0496168695961522e-05, - "loss": 2.3346, - "step": 338370 - }, - { - "epoch": 0.59, - "learning_rate": 2.0495296756034696e-05, - "loss": 2.3433, - "step": 338380 - }, - { - "epoch": 0.59, - "learning_rate": 2.049442481610787e-05, - "loss": 2.3973, - "step": 338390 - }, - { - "epoch": 0.59, - "learning_rate": 2.0493552876181043e-05, - "loss": 2.4238, - "step": 338400 - }, - { - "epoch": 0.59, - "learning_rate": 2.0492680936254217e-05, - "loss": 2.4015, - "step": 338410 - }, - { - "epoch": 0.59, - "learning_rate": 2.049180899632739e-05, - "loss": 2.2166, - "step": 338420 - }, - { - "epoch": 0.59, - "learning_rate": 2.0490937056400565e-05, - "loss": 2.3735, - "step": 338430 - }, - { - "epoch": 0.59, - "learning_rate": 2.0490065116473735e-05, - "loss": 2.3294, - "step": 338440 - }, - { - "epoch": 0.59, - "learning_rate": 2.048919317654691e-05, - "loss": 2.4274, - "step": 338450 - }, - { - "epoch": 0.59, - "learning_rate": 2.0488321236620083e-05, - "loss": 2.3142, - "step": 338460 - }, - { - "epoch": 0.59, - "learning_rate": 2.0487449296693256e-05, - "loss": 2.3487, - "step": 338470 - }, - { - "epoch": 0.59, - "learning_rate": 2.048657735676643e-05, - "loss": 2.4014, - "step": 338480 - }, - { - "epoch": 0.59, - "learning_rate": 2.04857054168396e-05, - "loss": 2.2979, - "step": 338490 - }, - { - "epoch": 0.59, - "learning_rate": 2.0484833476912778e-05, - "loss": 2.2724, - "step": 338500 - }, - { - "epoch": 0.59, - "learning_rate": 2.0483961536985948e-05, - "loss": 2.4308, - "step": 338510 - }, - { - "epoch": 0.59, - "learning_rate": 2.0483089597059122e-05, - "loss": 2.2926, - "step": 338520 - }, - { - "epoch": 0.59, - "learning_rate": 2.0482217657132296e-05, - "loss": 2.2096, - "step": 338530 - }, - { - "epoch": 0.59, - "learning_rate": 2.048134571720547e-05, - "loss": 2.2815, - "step": 338540 - }, - { - "epoch": 0.59, - "learning_rate": 2.048047377727864e-05, - "loss": 2.2617, - "step": 338550 - }, - { - "epoch": 0.59, - "learning_rate": 2.0479601837351814e-05, - "loss": 2.3567, - "step": 338560 - }, - { - "epoch": 0.59, - "learning_rate": 2.047872989742499e-05, - "loss": 2.3002, - "step": 338570 - }, - { - "epoch": 0.59, - "learning_rate": 2.047785795749816e-05, - "loss": 2.1965, - "step": 338580 - }, - { - "epoch": 0.59, - "learning_rate": 2.0476986017571335e-05, - "loss": 2.4156, - "step": 338590 - }, - { - "epoch": 0.59, - "learning_rate": 2.0476114077644505e-05, - "loss": 2.3433, - "step": 338600 - }, - { - "epoch": 0.59, - "learning_rate": 2.0475242137717682e-05, - "loss": 2.2955, - "step": 338610 - }, - { - "epoch": 0.59, - "learning_rate": 2.0474370197790853e-05, - "loss": 2.3147, - "step": 338620 - }, - { - "epoch": 0.59, - "learning_rate": 2.0473498257864027e-05, - "loss": 2.3357, - "step": 338630 - }, - { - "epoch": 0.59, - "learning_rate": 2.04726263179372e-05, - "loss": 2.3461, - "step": 338640 - }, - { - "epoch": 0.59, - "learning_rate": 2.0471754378010374e-05, - "loss": 2.4198, - "step": 338650 - }, - { - "epoch": 0.59, - "learning_rate": 2.0470882438083548e-05, - "loss": 2.3024, - "step": 338660 - }, - { - "epoch": 0.59, - "learning_rate": 2.047001049815672e-05, - "loss": 2.3236, - "step": 338670 - }, - { - "epoch": 0.59, - "learning_rate": 2.0469138558229895e-05, - "loss": 2.3758, - "step": 338680 - }, - { - "epoch": 0.59, - "learning_rate": 2.0468266618303066e-05, - "loss": 2.2963, - "step": 338690 - }, - { - "epoch": 0.59, - "learning_rate": 2.046739467837624e-05, - "loss": 2.4858, - "step": 338700 - }, - { - "epoch": 0.59, - "learning_rate": 2.0466522738449413e-05, - "loss": 2.3701, - "step": 338710 - }, - { - "epoch": 0.59, - "learning_rate": 2.0465650798522587e-05, - "loss": 2.3371, - "step": 338720 - }, - { - "epoch": 0.59, - "learning_rate": 2.046477885859576e-05, - "loss": 2.4031, - "step": 338730 - }, - { - "epoch": 0.59, - "learning_rate": 2.046390691866893e-05, - "loss": 2.2036, - "step": 338740 - }, - { - "epoch": 0.59, - "learning_rate": 2.0463034978742105e-05, - "loss": 2.3745, - "step": 338750 - }, - { - "epoch": 0.59, - "learning_rate": 2.046216303881528e-05, - "loss": 2.3086, - "step": 338760 - }, - { - "epoch": 0.59, - "learning_rate": 2.0461291098888453e-05, - "loss": 2.3761, - "step": 338770 - }, - { - "epoch": 0.59, - "learning_rate": 2.0460419158961623e-05, - "loss": 2.3703, - "step": 338780 - }, - { - "epoch": 0.59, - "learning_rate": 2.0459547219034797e-05, - "loss": 2.3941, - "step": 338790 - }, - { - "epoch": 0.59, - "learning_rate": 2.045867527910797e-05, - "loss": 2.3806, - "step": 338800 - }, - { - "epoch": 0.59, - "learning_rate": 2.0457803339181144e-05, - "loss": 2.3734, - "step": 338810 - }, - { - "epoch": 0.59, - "learning_rate": 2.0456931399254318e-05, - "loss": 2.4272, - "step": 338820 - }, - { - "epoch": 0.59, - "learning_rate": 2.0456059459327492e-05, - "loss": 2.3833, - "step": 338830 - }, - { - "epoch": 0.59, - "learning_rate": 2.0455187519400666e-05, - "loss": 2.2965, - "step": 338840 - }, - { - "epoch": 0.59, - "learning_rate": 2.0454315579473836e-05, - "loss": 2.2901, - "step": 338850 - }, - { - "epoch": 0.59, - "learning_rate": 2.045344363954701e-05, - "loss": 2.3508, - "step": 338860 - }, - { - "epoch": 0.59, - "learning_rate": 2.0452571699620184e-05, - "loss": 2.2939, - "step": 338870 - }, - { - "epoch": 0.59, - "learning_rate": 2.0451699759693357e-05, - "loss": 2.2642, - "step": 338880 - }, - { - "epoch": 0.59, - "learning_rate": 2.045082781976653e-05, - "loss": 2.415, - "step": 338890 - }, - { - "epoch": 0.59, - "learning_rate": 2.04499558798397e-05, - "loss": 2.4415, - "step": 338900 - }, - { - "epoch": 0.59, - "learning_rate": 2.044908393991288e-05, - "loss": 2.3275, - "step": 338910 - }, - { - "epoch": 0.59, - "learning_rate": 2.044821199998605e-05, - "loss": 2.44, - "step": 338920 - }, - { - "epoch": 0.59, - "learning_rate": 2.0447340060059223e-05, - "loss": 2.2695, - "step": 338930 - }, - { - "epoch": 0.59, - "learning_rate": 2.0446468120132397e-05, - "loss": 2.31, - "step": 338940 - }, - { - "epoch": 0.59, - "learning_rate": 2.044559618020557e-05, - "loss": 2.2762, - "step": 338950 - }, - { - "epoch": 0.59, - "learning_rate": 2.0444724240278744e-05, - "loss": 2.2724, - "step": 338960 - }, - { - "epoch": 0.59, - "learning_rate": 2.0443852300351914e-05, - "loss": 2.213, - "step": 338970 - }, - { - "epoch": 0.59, - "learning_rate": 2.044298036042509e-05, - "loss": 2.3357, - "step": 338980 - }, - { - "epoch": 0.59, - "learning_rate": 2.0442108420498262e-05, - "loss": 2.3008, - "step": 338990 - }, - { - "epoch": 0.59, - "learning_rate": 2.0441236480571436e-05, - "loss": 2.3261, - "step": 339000 - }, - { - "epoch": 0.59, - "learning_rate": 2.0440364540644606e-05, - "loss": 2.3434, - "step": 339010 - }, - { - "epoch": 0.59, - "learning_rate": 2.0439492600717783e-05, - "loss": 2.3712, - "step": 339020 - }, - { - "epoch": 0.59, - "learning_rate": 2.0438620660790954e-05, - "loss": 2.3729, - "step": 339030 - }, - { - "epoch": 0.59, - "learning_rate": 2.0437748720864127e-05, - "loss": 2.256, - "step": 339040 - }, - { - "epoch": 0.59, - "learning_rate": 2.04368767809373e-05, - "loss": 2.3348, - "step": 339050 - }, - { - "epoch": 0.59, - "learning_rate": 2.0436004841010475e-05, - "loss": 2.2632, - "step": 339060 - }, - { - "epoch": 0.59, - "learning_rate": 2.043513290108365e-05, - "loss": 2.3108, - "step": 339070 - }, - { - "epoch": 0.59, - "learning_rate": 2.043426096115682e-05, - "loss": 2.3164, - "step": 339080 - }, - { - "epoch": 0.59, - "learning_rate": 2.0433389021229996e-05, - "loss": 2.2914, - "step": 339090 - }, - { - "epoch": 0.59, - "learning_rate": 2.0432517081303167e-05, - "loss": 2.3507, - "step": 339100 - }, - { - "epoch": 0.59, - "learning_rate": 2.043164514137634e-05, - "loss": 2.3544, - "step": 339110 - }, - { - "epoch": 0.59, - "learning_rate": 2.0430773201449514e-05, - "loss": 2.4576, - "step": 339120 - }, - { - "epoch": 0.59, - "learning_rate": 2.0429901261522688e-05, - "loss": 2.4279, - "step": 339130 - }, - { - "epoch": 0.59, - "learning_rate": 2.0429029321595862e-05, - "loss": 2.3724, - "step": 339140 - }, - { - "epoch": 0.59, - "learning_rate": 2.0428157381669032e-05, - "loss": 2.2057, - "step": 339150 - }, - { - "epoch": 0.59, - "learning_rate": 2.0427285441742206e-05, - "loss": 2.3318, - "step": 339160 - }, - { - "epoch": 0.59, - "learning_rate": 2.042641350181538e-05, - "loss": 2.2895, - "step": 339170 - }, - { - "epoch": 0.59, - "learning_rate": 2.0425541561888553e-05, - "loss": 2.2591, - "step": 339180 - }, - { - "epoch": 0.59, - "learning_rate": 2.0424669621961727e-05, - "loss": 2.2749, - "step": 339190 - }, - { - "epoch": 0.59, - "learning_rate": 2.04237976820349e-05, - "loss": 2.2973, - "step": 339200 - }, - { - "epoch": 0.59, - "learning_rate": 2.0422925742108075e-05, - "loss": 2.3241, - "step": 339210 - }, - { - "epoch": 0.59, - "learning_rate": 2.0422053802181245e-05, - "loss": 2.3587, - "step": 339220 - }, - { - "epoch": 0.59, - "learning_rate": 2.042118186225442e-05, - "loss": 2.2497, - "step": 339230 - }, - { - "epoch": 0.59, - "learning_rate": 2.0420309922327593e-05, - "loss": 2.4041, - "step": 339240 - }, - { - "epoch": 0.59, - "learning_rate": 2.0419437982400766e-05, - "loss": 2.3722, - "step": 339250 - }, - { - "epoch": 0.59, - "learning_rate": 2.0418566042473937e-05, - "loss": 2.3612, - "step": 339260 - }, - { - "epoch": 0.59, - "learning_rate": 2.041769410254711e-05, - "loss": 2.3076, - "step": 339270 - }, - { - "epoch": 0.59, - "learning_rate": 2.0416822162620284e-05, - "loss": 2.3588, - "step": 339280 - }, - { - "epoch": 0.59, - "learning_rate": 2.0415950222693458e-05, - "loss": 2.2479, - "step": 339290 - }, - { - "epoch": 0.59, - "learning_rate": 2.0415078282766632e-05, - "loss": 2.3164, - "step": 339300 - }, - { - "epoch": 0.59, - "learning_rate": 2.0414206342839802e-05, - "loss": 2.2951, - "step": 339310 - }, - { - "epoch": 0.59, - "learning_rate": 2.041333440291298e-05, - "loss": 2.3763, - "step": 339320 - }, - { - "epoch": 0.59, - "learning_rate": 2.041246246298615e-05, - "loss": 2.234, - "step": 339330 - }, - { - "epoch": 0.59, - "learning_rate": 2.0411590523059324e-05, - "loss": 2.4055, - "step": 339340 - }, - { - "epoch": 0.59, - "learning_rate": 2.0410718583132497e-05, - "loss": 2.3094, - "step": 339350 - }, - { - "epoch": 0.59, - "learning_rate": 2.040984664320567e-05, - "loss": 2.2468, - "step": 339360 - }, - { - "epoch": 0.59, - "learning_rate": 2.0408974703278845e-05, - "loss": 2.3615, - "step": 339370 - }, - { - "epoch": 0.59, - "learning_rate": 2.0408102763352015e-05, - "loss": 2.2735, - "step": 339380 - }, - { - "epoch": 0.59, - "learning_rate": 2.0407230823425192e-05, - "loss": 2.2967, - "step": 339390 - }, - { - "epoch": 0.59, - "learning_rate": 2.0406358883498363e-05, - "loss": 2.3387, - "step": 339400 - }, - { - "epoch": 0.59, - "learning_rate": 2.0405486943571537e-05, - "loss": 2.3157, - "step": 339410 - }, - { - "epoch": 0.59, - "learning_rate": 2.0404615003644707e-05, - "loss": 2.3679, - "step": 339420 - }, - { - "epoch": 0.59, - "learning_rate": 2.0403743063717884e-05, - "loss": 2.2553, - "step": 339430 - }, - { - "epoch": 0.59, - "learning_rate": 2.0402871123791058e-05, - "loss": 2.4064, - "step": 339440 - }, - { - "epoch": 0.59, - "learning_rate": 2.040199918386423e-05, - "loss": 2.2975, - "step": 339450 - }, - { - "epoch": 0.59, - "learning_rate": 2.0401127243937405e-05, - "loss": 2.1787, - "step": 339460 - }, - { - "epoch": 0.59, - "learning_rate": 2.0400255304010576e-05, - "loss": 2.3414, - "step": 339470 - }, - { - "epoch": 0.59, - "learning_rate": 2.039938336408375e-05, - "loss": 2.3802, - "step": 339480 - }, - { - "epoch": 0.59, - "learning_rate": 2.039851142415692e-05, - "loss": 2.3936, - "step": 339490 - }, - { - "epoch": 0.59, - "learning_rate": 2.0397639484230097e-05, - "loss": 2.3279, - "step": 339500 - }, - { - "epoch": 0.59, - "learning_rate": 2.0396767544303268e-05, - "loss": 2.3667, - "step": 339510 - }, - { - "epoch": 0.59, - "learning_rate": 2.039589560437644e-05, - "loss": 2.3414, - "step": 339520 - }, - { - "epoch": 0.59, - "learning_rate": 2.0395023664449615e-05, - "loss": 2.2646, - "step": 339530 - }, - { - "epoch": 0.59, - "learning_rate": 2.039415172452279e-05, - "loss": 2.3582, - "step": 339540 - }, - { - "epoch": 0.59, - "learning_rate": 2.0393279784595963e-05, - "loss": 2.2752, - "step": 339550 - }, - { - "epoch": 0.59, - "learning_rate": 2.0392407844669133e-05, - "loss": 2.2626, - "step": 339560 - }, - { - "epoch": 0.59, - "learning_rate": 2.0391535904742307e-05, - "loss": 2.391, - "step": 339570 - }, - { - "epoch": 0.59, - "learning_rate": 2.039066396481548e-05, - "loss": 2.3213, - "step": 339580 - }, - { - "epoch": 0.59, - "learning_rate": 2.0389792024888654e-05, - "loss": 2.3387, - "step": 339590 - }, - { - "epoch": 0.59, - "learning_rate": 2.0388920084961828e-05, - "loss": 2.3302, - "step": 339600 - }, - { - "epoch": 0.59, - "learning_rate": 2.0388048145035002e-05, - "loss": 2.3337, - "step": 339610 - }, - { - "epoch": 0.59, - "learning_rate": 2.0387176205108176e-05, - "loss": 2.2835, - "step": 339620 - }, - { - "epoch": 0.59, - "learning_rate": 2.0386304265181346e-05, - "loss": 2.1967, - "step": 339630 - }, - { - "epoch": 0.59, - "learning_rate": 2.038543232525452e-05, - "loss": 2.2777, - "step": 339640 - }, - { - "epoch": 0.59, - "learning_rate": 2.0384560385327694e-05, - "loss": 2.2413, - "step": 339650 - }, - { - "epoch": 0.59, - "learning_rate": 2.0383688445400867e-05, - "loss": 2.3268, - "step": 339660 - }, - { - "epoch": 0.59, - "learning_rate": 2.038281650547404e-05, - "loss": 2.3581, - "step": 339670 - }, - { - "epoch": 0.59, - "learning_rate": 2.038194456554721e-05, - "loss": 2.2764, - "step": 339680 - }, - { - "epoch": 0.59, - "learning_rate": 2.038107262562039e-05, - "loss": 2.2702, - "step": 339690 - }, - { - "epoch": 0.59, - "learning_rate": 2.038020068569356e-05, - "loss": 2.4018, - "step": 339700 - }, - { - "epoch": 0.59, - "learning_rate": 2.0379328745766733e-05, - "loss": 2.5041, - "step": 339710 - }, - { - "epoch": 0.59, - "learning_rate": 2.0378456805839903e-05, - "loss": 2.3337, - "step": 339720 - }, - { - "epoch": 0.59, - "learning_rate": 2.037758486591308e-05, - "loss": 2.352, - "step": 339730 - }, - { - "epoch": 0.59, - "learning_rate": 2.037671292598625e-05, - "loss": 2.3072, - "step": 339740 - }, - { - "epoch": 0.59, - "learning_rate": 2.0375840986059424e-05, - "loss": 2.3939, - "step": 339750 - }, - { - "epoch": 0.59, - "learning_rate": 2.0374969046132598e-05, - "loss": 2.437, - "step": 339760 - }, - { - "epoch": 0.59, - "learning_rate": 2.0374097106205772e-05, - "loss": 2.1852, - "step": 339770 - }, - { - "epoch": 0.59, - "learning_rate": 2.0373225166278946e-05, - "loss": 2.332, - "step": 339780 - }, - { - "epoch": 0.59, - "learning_rate": 2.0372353226352116e-05, - "loss": 2.4255, - "step": 339790 - }, - { - "epoch": 0.59, - "learning_rate": 2.0371481286425293e-05, - "loss": 2.2389, - "step": 339800 - }, - { - "epoch": 0.59, - "learning_rate": 2.0370609346498464e-05, - "loss": 2.3441, - "step": 339810 - }, - { - "epoch": 0.59, - "learning_rate": 2.0369737406571637e-05, - "loss": 2.3938, - "step": 339820 - }, - { - "epoch": 0.59, - "learning_rate": 2.036886546664481e-05, - "loss": 2.2237, - "step": 339830 - }, - { - "epoch": 0.59, - "learning_rate": 2.0367993526717985e-05, - "loss": 2.4547, - "step": 339840 - }, - { - "epoch": 0.59, - "learning_rate": 2.036712158679116e-05, - "loss": 2.2844, - "step": 339850 - }, - { - "epoch": 0.59, - "learning_rate": 2.036624964686433e-05, - "loss": 2.3893, - "step": 339860 - }, - { - "epoch": 0.59, - "learning_rate": 2.0365377706937506e-05, - "loss": 2.3341, - "step": 339870 - }, - { - "epoch": 0.59, - "learning_rate": 2.0364505767010677e-05, - "loss": 2.2876, - "step": 339880 - }, - { - "epoch": 0.59, - "learning_rate": 2.036363382708385e-05, - "loss": 2.4237, - "step": 339890 - }, - { - "epoch": 0.59, - "learning_rate": 2.036276188715702e-05, - "loss": 2.3294, - "step": 339900 - }, - { - "epoch": 0.59, - "learning_rate": 2.0361889947230198e-05, - "loss": 2.3996, - "step": 339910 - }, - { - "epoch": 0.59, - "learning_rate": 2.0361018007303372e-05, - "loss": 2.3233, - "step": 339920 - }, - { - "epoch": 0.59, - "learning_rate": 2.0360146067376542e-05, - "loss": 2.3802, - "step": 339930 - }, - { - "epoch": 0.59, - "learning_rate": 2.0359274127449716e-05, - "loss": 2.3315, - "step": 339940 - }, - { - "epoch": 0.59, - "learning_rate": 2.035840218752289e-05, - "loss": 2.4106, - "step": 339950 - }, - { - "epoch": 0.59, - "learning_rate": 2.0357530247596063e-05, - "loss": 2.3374, - "step": 339960 - }, - { - "epoch": 0.59, - "learning_rate": 2.0356658307669234e-05, - "loss": 2.3202, - "step": 339970 - }, - { - "epoch": 0.59, - "learning_rate": 2.0355786367742408e-05, - "loss": 2.3638, - "step": 339980 - }, - { - "epoch": 0.59, - "learning_rate": 2.035491442781558e-05, - "loss": 2.33, - "step": 339990 - }, - { - "epoch": 0.59, - "learning_rate": 2.0354042487888755e-05, - "loss": 2.226, - "step": 340000 - }, - { - "epoch": 0.59, - "learning_rate": 2.035317054796193e-05, - "loss": 2.2696, - "step": 340010 - }, - { - "epoch": 0.59, - "learning_rate": 2.0352298608035103e-05, - "loss": 2.3564, - "step": 340020 - }, - { - "epoch": 0.59, - "learning_rate": 2.0351426668108276e-05, - "loss": 2.3542, - "step": 340030 - }, - { - "epoch": 0.59, - "learning_rate": 2.0350554728181447e-05, - "loss": 2.312, - "step": 340040 - }, - { - "epoch": 0.59, - "learning_rate": 2.034968278825462e-05, - "loss": 2.4018, - "step": 340050 - }, - { - "epoch": 0.59, - "learning_rate": 2.0348810848327794e-05, - "loss": 2.3373, - "step": 340060 - }, - { - "epoch": 0.59, - "learning_rate": 2.0347938908400968e-05, - "loss": 2.3603, - "step": 340070 - }, - { - "epoch": 0.59, - "learning_rate": 2.0347066968474142e-05, - "loss": 2.3865, - "step": 340080 - }, - { - "epoch": 0.59, - "learning_rate": 2.0346195028547312e-05, - "loss": 2.3306, - "step": 340090 - }, - { - "epoch": 0.59, - "learning_rate": 2.034532308862049e-05, - "loss": 2.3649, - "step": 340100 - }, - { - "epoch": 0.59, - "learning_rate": 2.034445114869366e-05, - "loss": 2.3298, - "step": 340110 - }, - { - "epoch": 0.59, - "learning_rate": 2.0343579208766834e-05, - "loss": 2.3441, - "step": 340120 - }, - { - "epoch": 0.59, - "learning_rate": 2.0342707268840007e-05, - "loss": 2.3679, - "step": 340130 - }, - { - "epoch": 0.59, - "learning_rate": 2.034183532891318e-05, - "loss": 2.3158, - "step": 340140 - }, - { - "epoch": 0.59, - "learning_rate": 2.034096338898635e-05, - "loss": 2.3952, - "step": 340150 - }, - { - "epoch": 0.59, - "learning_rate": 2.0340091449059525e-05, - "loss": 2.3664, - "step": 340160 - }, - { - "epoch": 0.59, - "learning_rate": 2.0339219509132702e-05, - "loss": 2.3641, - "step": 340170 - }, - { - "epoch": 0.59, - "learning_rate": 2.0338347569205873e-05, - "loss": 2.4024, - "step": 340180 - }, - { - "epoch": 0.59, - "learning_rate": 2.0337475629279047e-05, - "loss": 2.2719, - "step": 340190 - }, - { - "epoch": 0.59, - "learning_rate": 2.0336603689352217e-05, - "loss": 2.3343, - "step": 340200 - }, - { - "epoch": 0.59, - "learning_rate": 2.0335731749425394e-05, - "loss": 2.2099, - "step": 340210 - }, - { - "epoch": 0.59, - "learning_rate": 2.0334859809498565e-05, - "loss": 2.3492, - "step": 340220 - }, - { - "epoch": 0.59, - "learning_rate": 2.033398786957174e-05, - "loss": 2.346, - "step": 340230 - }, - { - "epoch": 0.59, - "learning_rate": 2.0333115929644912e-05, - "loss": 2.4019, - "step": 340240 - }, - { - "epoch": 0.59, - "learning_rate": 2.0332243989718086e-05, - "loss": 2.3093, - "step": 340250 - }, - { - "epoch": 0.59, - "learning_rate": 2.033137204979126e-05, - "loss": 2.3151, - "step": 340260 - }, - { - "epoch": 0.59, - "learning_rate": 2.033050010986443e-05, - "loss": 2.4479, - "step": 340270 - }, - { - "epoch": 0.59, - "learning_rate": 2.0329628169937607e-05, - "loss": 2.3687, - "step": 340280 - }, - { - "epoch": 0.59, - "learning_rate": 2.0328756230010778e-05, - "loss": 2.3479, - "step": 340290 - }, - { - "epoch": 0.59, - "learning_rate": 2.032788429008395e-05, - "loss": 2.3746, - "step": 340300 - }, - { - "epoch": 0.59, - "learning_rate": 2.0327012350157125e-05, - "loss": 2.3154, - "step": 340310 - }, - { - "epoch": 0.59, - "learning_rate": 2.03261404102303e-05, - "loss": 2.4012, - "step": 340320 - }, - { - "epoch": 0.59, - "learning_rate": 2.0325268470303473e-05, - "loss": 2.3542, - "step": 340330 - }, - { - "epoch": 0.59, - "learning_rate": 2.0324396530376643e-05, - "loss": 2.2898, - "step": 340340 - }, - { - "epoch": 0.59, - "learning_rate": 2.0323524590449817e-05, - "loss": 2.3583, - "step": 340350 - }, - { - "epoch": 0.59, - "learning_rate": 2.032265265052299e-05, - "loss": 2.4033, - "step": 340360 - }, - { - "epoch": 0.59, - "learning_rate": 2.0321780710596164e-05, - "loss": 2.4297, - "step": 340370 - }, - { - "epoch": 0.59, - "learning_rate": 2.0320908770669335e-05, - "loss": 2.2352, - "step": 340380 - }, - { - "epoch": 0.59, - "learning_rate": 2.0320036830742512e-05, - "loss": 2.381, - "step": 340390 - }, - { - "epoch": 0.59, - "learning_rate": 2.0319164890815686e-05, - "loss": 2.3732, - "step": 340400 - }, - { - "epoch": 0.59, - "learning_rate": 2.0318292950888856e-05, - "loss": 2.3483, - "step": 340410 - }, - { - "epoch": 0.59, - "learning_rate": 2.031742101096203e-05, - "loss": 2.3245, - "step": 340420 - }, - { - "epoch": 0.59, - "learning_rate": 2.0316549071035204e-05, - "loss": 2.4802, - "step": 340430 - }, - { - "epoch": 0.59, - "learning_rate": 2.0315677131108377e-05, - "loss": 2.3697, - "step": 340440 - }, - { - "epoch": 0.59, - "learning_rate": 2.0314805191181548e-05, - "loss": 2.2758, - "step": 340450 - }, - { - "epoch": 0.59, - "learning_rate": 2.031393325125472e-05, - "loss": 2.3291, - "step": 340460 - }, - { - "epoch": 0.59, - "learning_rate": 2.0313061311327895e-05, - "loss": 2.2362, - "step": 340470 - }, - { - "epoch": 0.59, - "learning_rate": 2.031218937140107e-05, - "loss": 2.39, - "step": 340480 - }, - { - "epoch": 0.59, - "learning_rate": 2.0311317431474243e-05, - "loss": 2.2683, - "step": 340490 - }, - { - "epoch": 0.59, - "learning_rate": 2.0310445491547413e-05, - "loss": 2.3664, - "step": 340500 - }, - { - "epoch": 0.59, - "learning_rate": 2.030957355162059e-05, - "loss": 2.3911, - "step": 340510 - }, - { - "epoch": 0.59, - "learning_rate": 2.030870161169376e-05, - "loss": 2.2157, - "step": 340520 - }, - { - "epoch": 0.59, - "learning_rate": 2.0307829671766934e-05, - "loss": 2.4022, - "step": 340530 - }, - { - "epoch": 0.59, - "learning_rate": 2.0306957731840108e-05, - "loss": 2.2833, - "step": 340540 - }, - { - "epoch": 0.59, - "learning_rate": 2.0306085791913282e-05, - "loss": 2.3323, - "step": 340550 - }, - { - "epoch": 0.59, - "learning_rate": 2.0305213851986456e-05, - "loss": 2.2676, - "step": 340560 - }, - { - "epoch": 0.59, - "learning_rate": 2.0304341912059626e-05, - "loss": 2.3743, - "step": 340570 - }, - { - "epoch": 0.59, - "learning_rate": 2.0303469972132803e-05, - "loss": 2.3049, - "step": 340580 - }, - { - "epoch": 0.59, - "learning_rate": 2.0302598032205974e-05, - "loss": 2.3102, - "step": 340590 - }, - { - "epoch": 0.59, - "learning_rate": 2.0301726092279147e-05, - "loss": 2.4176, - "step": 340600 - }, - { - "epoch": 0.59, - "learning_rate": 2.0300854152352318e-05, - "loss": 2.4024, - "step": 340610 - }, - { - "epoch": 0.59, - "learning_rate": 2.0299982212425495e-05, - "loss": 2.4224, - "step": 340620 - }, - { - "epoch": 0.59, - "learning_rate": 2.0299110272498665e-05, - "loss": 2.46, - "step": 340630 - }, - { - "epoch": 0.59, - "learning_rate": 2.029823833257184e-05, - "loss": 2.3574, - "step": 340640 - }, - { - "epoch": 0.59, - "learning_rate": 2.0297366392645013e-05, - "loss": 2.1638, - "step": 340650 - }, - { - "epoch": 0.59, - "learning_rate": 2.0296494452718187e-05, - "loss": 2.1449, - "step": 340660 - }, - { - "epoch": 0.59, - "learning_rate": 2.029562251279136e-05, - "loss": 2.3072, - "step": 340670 - }, - { - "epoch": 0.59, - "learning_rate": 2.029475057286453e-05, - "loss": 2.2714, - "step": 340680 - }, - { - "epoch": 0.59, - "learning_rate": 2.0293878632937708e-05, - "loss": 2.3977, - "step": 340690 - }, - { - "epoch": 0.59, - "learning_rate": 2.029300669301088e-05, - "loss": 2.2088, - "step": 340700 - }, - { - "epoch": 0.59, - "learning_rate": 2.0292134753084052e-05, - "loss": 2.376, - "step": 340710 - }, - { - "epoch": 0.59, - "learning_rate": 2.0291262813157226e-05, - "loss": 2.2381, - "step": 340720 - }, - { - "epoch": 0.59, - "learning_rate": 2.02903908732304e-05, - "loss": 2.329, - "step": 340730 - }, - { - "epoch": 0.59, - "learning_rate": 2.0289518933303573e-05, - "loss": 2.3243, - "step": 340740 - }, - { - "epoch": 0.59, - "learning_rate": 2.0288646993376744e-05, - "loss": 2.3403, - "step": 340750 - }, - { - "epoch": 0.59, - "learning_rate": 2.0287775053449918e-05, - "loss": 2.409, - "step": 340760 - }, - { - "epoch": 0.59, - "learning_rate": 2.028690311352309e-05, - "loss": 2.3717, - "step": 340770 - }, - { - "epoch": 0.59, - "learning_rate": 2.0286031173596265e-05, - "loss": 2.4473, - "step": 340780 - }, - { - "epoch": 0.59, - "learning_rate": 2.028515923366944e-05, - "loss": 2.281, - "step": 340790 - }, - { - "epoch": 0.59, - "learning_rate": 2.0284287293742613e-05, - "loss": 2.3212, - "step": 340800 - }, - { - "epoch": 0.59, - "learning_rate": 2.0283415353815786e-05, - "loss": 2.3251, - "step": 340810 - }, - { - "epoch": 0.59, - "learning_rate": 2.0282543413888957e-05, - "loss": 2.2641, - "step": 340820 - }, - { - "epoch": 0.59, - "learning_rate": 2.028167147396213e-05, - "loss": 2.3501, - "step": 340830 - }, - { - "epoch": 0.59, - "learning_rate": 2.0280799534035304e-05, - "loss": 2.3269, - "step": 340840 - }, - { - "epoch": 0.59, - "learning_rate": 2.0279927594108478e-05, - "loss": 2.2934, - "step": 340850 - }, - { - "epoch": 0.59, - "learning_rate": 2.027905565418165e-05, - "loss": 2.3227, - "step": 340860 - }, - { - "epoch": 0.59, - "learning_rate": 2.0278183714254822e-05, - "loss": 2.2563, - "step": 340870 - }, - { - "epoch": 0.59, - "learning_rate": 2.0277311774327996e-05, - "loss": 2.4297, - "step": 340880 - }, - { - "epoch": 0.59, - "learning_rate": 2.027643983440117e-05, - "loss": 2.3938, - "step": 340890 - }, - { - "epoch": 0.59, - "learning_rate": 2.0275567894474344e-05, - "loss": 2.3356, - "step": 340900 - }, - { - "epoch": 0.59, - "learning_rate": 2.0274695954547514e-05, - "loss": 2.2166, - "step": 340910 - }, - { - "epoch": 0.59, - "learning_rate": 2.027382401462069e-05, - "loss": 2.3034, - "step": 340920 - }, - { - "epoch": 0.59, - "learning_rate": 2.027295207469386e-05, - "loss": 2.4524, - "step": 340930 - }, - { - "epoch": 0.59, - "learning_rate": 2.0272080134767035e-05, - "loss": 2.1824, - "step": 340940 - }, - { - "epoch": 0.59, - "learning_rate": 2.027120819484021e-05, - "loss": 2.3341, - "step": 340950 - }, - { - "epoch": 0.59, - "learning_rate": 2.0270336254913383e-05, - "loss": 2.3364, - "step": 340960 - }, - { - "epoch": 0.59, - "learning_rate": 2.0269464314986557e-05, - "loss": 2.3534, - "step": 340970 - }, - { - "epoch": 0.59, - "learning_rate": 2.0268592375059727e-05, - "loss": 2.2773, - "step": 340980 - }, - { - "epoch": 0.59, - "learning_rate": 2.0267720435132904e-05, - "loss": 2.3409, - "step": 340990 - }, - { - "epoch": 0.59, - "learning_rate": 2.0266848495206075e-05, - "loss": 2.4168, - "step": 341000 - }, - { - "epoch": 0.59, - "learning_rate": 2.026597655527925e-05, - "loss": 2.2662, - "step": 341010 - }, - { - "epoch": 0.59, - "learning_rate": 2.0265104615352422e-05, - "loss": 2.2911, - "step": 341020 - }, - { - "epoch": 0.59, - "learning_rate": 2.0264232675425596e-05, - "loss": 2.3844, - "step": 341030 - }, - { - "epoch": 0.59, - "learning_rate": 2.026336073549877e-05, - "loss": 2.3672, - "step": 341040 - }, - { - "epoch": 0.59, - "learning_rate": 2.026248879557194e-05, - "loss": 2.2314, - "step": 341050 - }, - { - "epoch": 0.59, - "learning_rate": 2.0261616855645117e-05, - "loss": 2.2959, - "step": 341060 - }, - { - "epoch": 0.59, - "learning_rate": 2.0260744915718288e-05, - "loss": 2.4241, - "step": 341070 - }, - { - "epoch": 0.59, - "learning_rate": 2.025987297579146e-05, - "loss": 2.2399, - "step": 341080 - }, - { - "epoch": 0.59, - "learning_rate": 2.0259001035864632e-05, - "loss": 2.2942, - "step": 341090 - }, - { - "epoch": 0.59, - "learning_rate": 2.025812909593781e-05, - "loss": 2.354, - "step": 341100 - }, - { - "epoch": 0.59, - "learning_rate": 2.025725715601098e-05, - "loss": 2.362, - "step": 341110 - }, - { - "epoch": 0.59, - "learning_rate": 2.0256385216084153e-05, - "loss": 2.4763, - "step": 341120 - }, - { - "epoch": 0.59, - "learning_rate": 2.0255513276157327e-05, - "loss": 2.3644, - "step": 341130 - }, - { - "epoch": 0.59, - "learning_rate": 2.02546413362305e-05, - "loss": 2.3196, - "step": 341140 - }, - { - "epoch": 0.59, - "learning_rate": 2.0253769396303674e-05, - "loss": 2.2732, - "step": 341150 - }, - { - "epoch": 0.59, - "learning_rate": 2.0252897456376845e-05, - "loss": 2.4085, - "step": 341160 - }, - { - "epoch": 0.59, - "learning_rate": 2.025202551645002e-05, - "loss": 2.3187, - "step": 341170 - }, - { - "epoch": 0.59, - "learning_rate": 2.0251153576523192e-05, - "loss": 2.4741, - "step": 341180 - }, - { - "epoch": 0.59, - "learning_rate": 2.0250281636596366e-05, - "loss": 2.3462, - "step": 341190 - }, - { - "epoch": 0.6, - "learning_rate": 2.024940969666954e-05, - "loss": 2.3962, - "step": 341200 - }, - { - "epoch": 0.6, - "learning_rate": 2.0248537756742714e-05, - "loss": 2.2428, - "step": 341210 - }, - { - "epoch": 0.6, - "learning_rate": 2.0247665816815887e-05, - "loss": 2.3064, - "step": 341220 - }, - { - "epoch": 0.6, - "learning_rate": 2.0246793876889058e-05, - "loss": 2.3295, - "step": 341230 - }, - { - "epoch": 0.6, - "learning_rate": 2.024592193696223e-05, - "loss": 2.3817, - "step": 341240 - }, - { - "epoch": 0.6, - "learning_rate": 2.0245049997035405e-05, - "loss": 2.2351, - "step": 341250 - }, - { - "epoch": 0.6, - "learning_rate": 2.024417805710858e-05, - "loss": 2.4373, - "step": 341260 - }, - { - "epoch": 0.6, - "learning_rate": 2.0243306117181753e-05, - "loss": 2.419, - "step": 341270 - }, - { - "epoch": 0.6, - "learning_rate": 2.0242434177254923e-05, - "loss": 2.3316, - "step": 341280 - }, - { - "epoch": 0.6, - "learning_rate": 2.02415622373281e-05, - "loss": 2.3897, - "step": 341290 - }, - { - "epoch": 0.6, - "learning_rate": 2.024069029740127e-05, - "loss": 2.2845, - "step": 341300 - }, - { - "epoch": 0.6, - "learning_rate": 2.0239818357474444e-05, - "loss": 2.2769, - "step": 341310 - }, - { - "epoch": 0.6, - "learning_rate": 2.0238946417547615e-05, - "loss": 2.2532, - "step": 341320 - }, - { - "epoch": 0.6, - "learning_rate": 2.0238074477620792e-05, - "loss": 2.3457, - "step": 341330 - }, - { - "epoch": 0.6, - "learning_rate": 2.0237202537693962e-05, - "loss": 2.3121, - "step": 341340 - }, - { - "epoch": 0.6, - "learning_rate": 2.0236330597767136e-05, - "loss": 2.3389, - "step": 341350 - }, - { - "epoch": 0.6, - "learning_rate": 2.023545865784031e-05, - "loss": 2.2323, - "step": 341360 - }, - { - "epoch": 0.6, - "learning_rate": 2.0234586717913484e-05, - "loss": 2.4013, - "step": 341370 - }, - { - "epoch": 0.6, - "learning_rate": 2.0233714777986657e-05, - "loss": 2.362, - "step": 341380 - }, - { - "epoch": 0.6, - "learning_rate": 2.0232842838059828e-05, - "loss": 2.4031, - "step": 341390 - }, - { - "epoch": 0.6, - "learning_rate": 2.0231970898133005e-05, - "loss": 2.4226, - "step": 341400 - }, - { - "epoch": 0.6, - "learning_rate": 2.0231098958206175e-05, - "loss": 2.4111, - "step": 341410 - }, - { - "epoch": 0.6, - "learning_rate": 2.023022701827935e-05, - "loss": 2.3214, - "step": 341420 - }, - { - "epoch": 0.6, - "learning_rate": 2.0229355078352523e-05, - "loss": 2.3117, - "step": 341430 - }, - { - "epoch": 0.6, - "learning_rate": 2.0228483138425697e-05, - "loss": 2.3681, - "step": 341440 - }, - { - "epoch": 0.6, - "learning_rate": 2.022761119849887e-05, - "loss": 2.3072, - "step": 341450 - }, - { - "epoch": 0.6, - "learning_rate": 2.022673925857204e-05, - "loss": 2.3864, - "step": 341460 - }, - { - "epoch": 0.6, - "learning_rate": 2.0225867318645218e-05, - "loss": 2.4446, - "step": 341470 - }, - { - "epoch": 0.6, - "learning_rate": 2.022499537871839e-05, - "loss": 2.3723, - "step": 341480 - }, - { - "epoch": 0.6, - "learning_rate": 2.0224123438791562e-05, - "loss": 2.2936, - "step": 341490 - }, - { - "epoch": 0.6, - "learning_rate": 2.0223251498864733e-05, - "loss": 2.367, - "step": 341500 - }, - { - "epoch": 0.6, - "learning_rate": 2.022237955893791e-05, - "loss": 2.4904, - "step": 341510 - }, - { - "epoch": 0.6, - "learning_rate": 2.0221507619011083e-05, - "loss": 2.4098, - "step": 341520 - }, - { - "epoch": 0.6, - "learning_rate": 2.0220635679084254e-05, - "loss": 2.2596, - "step": 341530 - }, - { - "epoch": 0.6, - "learning_rate": 2.0219763739157428e-05, - "loss": 2.3812, - "step": 341540 - }, - { - "epoch": 0.6, - "learning_rate": 2.02188917992306e-05, - "loss": 2.2104, - "step": 341550 - }, - { - "epoch": 0.6, - "learning_rate": 2.0218019859303775e-05, - "loss": 2.4331, - "step": 341560 - }, - { - "epoch": 0.6, - "learning_rate": 2.0217147919376946e-05, - "loss": 2.2506, - "step": 341570 - }, - { - "epoch": 0.6, - "learning_rate": 2.021627597945012e-05, - "loss": 2.1874, - "step": 341580 - }, - { - "epoch": 0.6, - "learning_rate": 2.0215404039523293e-05, - "loss": 2.4036, - "step": 341590 - }, - { - "epoch": 0.6, - "learning_rate": 2.0214532099596467e-05, - "loss": 2.3196, - "step": 341600 - }, - { - "epoch": 0.6, - "learning_rate": 2.021366015966964e-05, - "loss": 2.3365, - "step": 341610 - }, - { - "epoch": 0.6, - "learning_rate": 2.0212788219742814e-05, - "loss": 2.2703, - "step": 341620 - }, - { - "epoch": 0.6, - "learning_rate": 2.0211916279815988e-05, - "loss": 2.3809, - "step": 341630 - }, - { - "epoch": 0.6, - "learning_rate": 2.021104433988916e-05, - "loss": 2.2975, - "step": 341640 - }, - { - "epoch": 0.6, - "learning_rate": 2.0210172399962332e-05, - "loss": 2.339, - "step": 341650 - }, - { - "epoch": 0.6, - "learning_rate": 2.0209300460035506e-05, - "loss": 2.2633, - "step": 341660 - }, - { - "epoch": 0.6, - "learning_rate": 2.020842852010868e-05, - "loss": 2.4616, - "step": 341670 - }, - { - "epoch": 0.6, - "learning_rate": 2.0207556580181854e-05, - "loss": 2.3123, - "step": 341680 - }, - { - "epoch": 0.6, - "learning_rate": 2.0206684640255024e-05, - "loss": 2.2788, - "step": 341690 - }, - { - "epoch": 0.6, - "learning_rate": 2.02058127003282e-05, - "loss": 2.3903, - "step": 341700 - }, - { - "epoch": 0.6, - "learning_rate": 2.020494076040137e-05, - "loss": 2.2938, - "step": 341710 - }, - { - "epoch": 0.6, - "learning_rate": 2.0204068820474545e-05, - "loss": 2.3046, - "step": 341720 - }, - { - "epoch": 0.6, - "learning_rate": 2.020319688054772e-05, - "loss": 2.4048, - "step": 341730 - }, - { - "epoch": 0.6, - "learning_rate": 2.0202324940620893e-05, - "loss": 2.2989, - "step": 341740 - }, - { - "epoch": 0.6, - "learning_rate": 2.0201453000694067e-05, - "loss": 2.3019, - "step": 341750 - }, - { - "epoch": 0.6, - "learning_rate": 2.0200581060767237e-05, - "loss": 2.4324, - "step": 341760 - }, - { - "epoch": 0.6, - "learning_rate": 2.0199709120840414e-05, - "loss": 2.331, - "step": 341770 - }, - { - "epoch": 0.6, - "learning_rate": 2.0198837180913585e-05, - "loss": 2.364, - "step": 341780 - }, - { - "epoch": 0.6, - "learning_rate": 2.019796524098676e-05, - "loss": 2.2464, - "step": 341790 - }, - { - "epoch": 0.6, - "learning_rate": 2.019709330105993e-05, - "loss": 2.453, - "step": 341800 - }, - { - "epoch": 0.6, - "learning_rate": 2.0196221361133106e-05, - "loss": 2.15, - "step": 341810 - }, - { - "epoch": 0.6, - "learning_rate": 2.0195349421206276e-05, - "loss": 2.4129, - "step": 341820 - }, - { - "epoch": 0.6, - "learning_rate": 2.019447748127945e-05, - "loss": 2.4066, - "step": 341830 - }, - { - "epoch": 0.6, - "learning_rate": 2.0193605541352624e-05, - "loss": 2.3199, - "step": 341840 - }, - { - "epoch": 0.6, - "learning_rate": 2.0192733601425798e-05, - "loss": 2.3768, - "step": 341850 - }, - { - "epoch": 0.6, - "learning_rate": 2.019186166149897e-05, - "loss": 2.4509, - "step": 341860 - }, - { - "epoch": 0.6, - "learning_rate": 2.0190989721572142e-05, - "loss": 2.3836, - "step": 341870 - }, - { - "epoch": 0.6, - "learning_rate": 2.019011778164532e-05, - "loss": 2.3596, - "step": 341880 - }, - { - "epoch": 0.6, - "learning_rate": 2.018924584171849e-05, - "loss": 2.4171, - "step": 341890 - }, - { - "epoch": 0.6, - "learning_rate": 2.0188373901791663e-05, - "loss": 2.3508, - "step": 341900 - }, - { - "epoch": 0.6, - "learning_rate": 2.0187501961864837e-05, - "loss": 2.363, - "step": 341910 - }, - { - "epoch": 0.6, - "learning_rate": 2.018663002193801e-05, - "loss": 2.3006, - "step": 341920 - }, - { - "epoch": 0.6, - "learning_rate": 2.0185758082011184e-05, - "loss": 2.2818, - "step": 341930 - }, - { - "epoch": 0.6, - "learning_rate": 2.0184886142084355e-05, - "loss": 2.3261, - "step": 341940 - }, - { - "epoch": 0.6, - "learning_rate": 2.018401420215753e-05, - "loss": 2.2891, - "step": 341950 - }, - { - "epoch": 0.6, - "learning_rate": 2.0183142262230702e-05, - "loss": 2.2543, - "step": 341960 - }, - { - "epoch": 0.6, - "learning_rate": 2.0182270322303876e-05, - "loss": 2.3567, - "step": 341970 - }, - { - "epoch": 0.6, - "learning_rate": 2.0181398382377046e-05, - "loss": 2.3505, - "step": 341980 - }, - { - "epoch": 0.6, - "learning_rate": 2.0180526442450224e-05, - "loss": 2.4119, - "step": 341990 - }, - { - "epoch": 0.6, - "learning_rate": 2.0179654502523397e-05, - "loss": 2.285, - "step": 342000 - }, - { - "epoch": 0.6, - "learning_rate": 2.0178782562596568e-05, - "loss": 2.4141, - "step": 342010 - }, - { - "epoch": 0.6, - "learning_rate": 2.017791062266974e-05, - "loss": 2.4262, - "step": 342020 - }, - { - "epoch": 0.6, - "learning_rate": 2.0177038682742915e-05, - "loss": 2.2708, - "step": 342030 - }, - { - "epoch": 0.6, - "learning_rate": 2.017616674281609e-05, - "loss": 2.2642, - "step": 342040 - }, - { - "epoch": 0.6, - "learning_rate": 2.017529480288926e-05, - "loss": 2.3878, - "step": 342050 - }, - { - "epoch": 0.6, - "learning_rate": 2.0174422862962433e-05, - "loss": 2.3642, - "step": 342060 - }, - { - "epoch": 0.6, - "learning_rate": 2.0173550923035607e-05, - "loss": 2.4486, - "step": 342070 - }, - { - "epoch": 0.6, - "learning_rate": 2.017267898310878e-05, - "loss": 2.3096, - "step": 342080 - }, - { - "epoch": 0.6, - "learning_rate": 2.0171807043181954e-05, - "loss": 2.3251, - "step": 342090 - }, - { - "epoch": 0.6, - "learning_rate": 2.0170935103255125e-05, - "loss": 2.2763, - "step": 342100 - }, - { - "epoch": 0.6, - "learning_rate": 2.0170063163328302e-05, - "loss": 2.3938, - "step": 342110 - }, - { - "epoch": 0.6, - "learning_rate": 2.0169191223401472e-05, - "loss": 2.3371, - "step": 342120 - }, - { - "epoch": 0.6, - "learning_rate": 2.0168319283474646e-05, - "loss": 2.2956, - "step": 342130 - }, - { - "epoch": 0.6, - "learning_rate": 2.016744734354782e-05, - "loss": 2.3498, - "step": 342140 - }, - { - "epoch": 0.6, - "learning_rate": 2.0166575403620994e-05, - "loss": 2.2867, - "step": 342150 - }, - { - "epoch": 0.6, - "learning_rate": 2.0165703463694168e-05, - "loss": 2.4461, - "step": 342160 - }, - { - "epoch": 0.6, - "learning_rate": 2.0164831523767338e-05, - "loss": 2.3365, - "step": 342170 - }, - { - "epoch": 0.6, - "learning_rate": 2.0163959583840515e-05, - "loss": 2.1946, - "step": 342180 - }, - { - "epoch": 0.6, - "learning_rate": 2.0163087643913685e-05, - "loss": 2.274, - "step": 342190 - }, - { - "epoch": 0.6, - "learning_rate": 2.016221570398686e-05, - "loss": 2.3539, - "step": 342200 - }, - { - "epoch": 0.6, - "learning_rate": 2.016134376406003e-05, - "loss": 2.2947, - "step": 342210 - }, - { - "epoch": 0.6, - "learning_rate": 2.0160471824133207e-05, - "loss": 2.3915, - "step": 342220 - }, - { - "epoch": 0.6, - "learning_rate": 2.0159599884206377e-05, - "loss": 2.3783, - "step": 342230 - }, - { - "epoch": 0.6, - "learning_rate": 2.015872794427955e-05, - "loss": 2.3846, - "step": 342240 - }, - { - "epoch": 0.6, - "learning_rate": 2.0157856004352725e-05, - "loss": 2.2895, - "step": 342250 - }, - { - "epoch": 0.6, - "learning_rate": 2.01569840644259e-05, - "loss": 2.4236, - "step": 342260 - }, - { - "epoch": 0.6, - "learning_rate": 2.0156112124499072e-05, - "loss": 2.2792, - "step": 342270 - }, - { - "epoch": 0.6, - "learning_rate": 2.0155240184572243e-05, - "loss": 2.3271, - "step": 342280 - }, - { - "epoch": 0.6, - "learning_rate": 2.015436824464542e-05, - "loss": 2.3608, - "step": 342290 - }, - { - "epoch": 0.6, - "learning_rate": 2.015349630471859e-05, - "loss": 2.2926, - "step": 342300 - }, - { - "epoch": 0.6, - "learning_rate": 2.0152624364791764e-05, - "loss": 2.2997, - "step": 342310 - }, - { - "epoch": 0.6, - "learning_rate": 2.0151752424864938e-05, - "loss": 2.3187, - "step": 342320 - }, - { - "epoch": 0.6, - "learning_rate": 2.015088048493811e-05, - "loss": 2.3137, - "step": 342330 - }, - { - "epoch": 0.6, - "learning_rate": 2.0150008545011285e-05, - "loss": 2.3463, - "step": 342340 - }, - { - "epoch": 0.6, - "learning_rate": 2.0149136605084456e-05, - "loss": 2.2562, - "step": 342350 - }, - { - "epoch": 0.6, - "learning_rate": 2.014826466515763e-05, - "loss": 2.3086, - "step": 342360 - }, - { - "epoch": 0.6, - "learning_rate": 2.0147392725230803e-05, - "loss": 2.3224, - "step": 342370 - }, - { - "epoch": 0.6, - "learning_rate": 2.0146520785303977e-05, - "loss": 2.4098, - "step": 342380 - }, - { - "epoch": 0.6, - "learning_rate": 2.014564884537715e-05, - "loss": 2.2975, - "step": 342390 - }, - { - "epoch": 0.6, - "learning_rate": 2.0144776905450324e-05, - "loss": 2.2376, - "step": 342400 - }, - { - "epoch": 0.6, - "learning_rate": 2.0143904965523498e-05, - "loss": 2.3993, - "step": 342410 - }, - { - "epoch": 0.6, - "learning_rate": 2.014303302559667e-05, - "loss": 2.3279, - "step": 342420 - }, - { - "epoch": 0.6, - "learning_rate": 2.0142161085669842e-05, - "loss": 2.3601, - "step": 342430 - }, - { - "epoch": 0.6, - "learning_rate": 2.0141289145743016e-05, - "loss": 2.2915, - "step": 342440 - }, - { - "epoch": 0.6, - "learning_rate": 2.014041720581619e-05, - "loss": 2.3503, - "step": 342450 - }, - { - "epoch": 0.6, - "learning_rate": 2.013954526588936e-05, - "loss": 2.2395, - "step": 342460 - }, - { - "epoch": 0.6, - "learning_rate": 2.0138673325962534e-05, - "loss": 2.3125, - "step": 342470 - }, - { - "epoch": 0.6, - "learning_rate": 2.013780138603571e-05, - "loss": 2.353, - "step": 342480 - }, - { - "epoch": 0.6, - "learning_rate": 2.013692944610888e-05, - "loss": 2.3042, - "step": 342490 - }, - { - "epoch": 0.6, - "learning_rate": 2.0136057506182055e-05, - "loss": 2.294, - "step": 342500 - }, - { - "epoch": 0.6, - "learning_rate": 2.0135185566255226e-05, - "loss": 2.3391, - "step": 342510 - }, - { - "epoch": 0.6, - "learning_rate": 2.0134313626328403e-05, - "loss": 2.3149, - "step": 342520 - }, - { - "epoch": 0.6, - "learning_rate": 2.0133441686401573e-05, - "loss": 2.3181, - "step": 342530 - }, - { - "epoch": 0.6, - "learning_rate": 2.0132569746474747e-05, - "loss": 2.2821, - "step": 342540 - }, - { - "epoch": 0.6, - "learning_rate": 2.013169780654792e-05, - "loss": 2.4205, - "step": 342550 - }, - { - "epoch": 0.6, - "learning_rate": 2.0130825866621095e-05, - "loss": 2.3553, - "step": 342560 - }, - { - "epoch": 0.6, - "learning_rate": 2.012995392669427e-05, - "loss": 2.1639, - "step": 342570 - }, - { - "epoch": 0.6, - "learning_rate": 2.012908198676744e-05, - "loss": 2.2975, - "step": 342580 - }, - { - "epoch": 0.6, - "learning_rate": 2.0128210046840616e-05, - "loss": 2.3976, - "step": 342590 - }, - { - "epoch": 0.6, - "learning_rate": 2.0127338106913786e-05, - "loss": 2.3746, - "step": 342600 - }, - { - "epoch": 0.6, - "learning_rate": 2.012646616698696e-05, - "loss": 2.4175, - "step": 342610 - }, - { - "epoch": 0.6, - "learning_rate": 2.0125594227060134e-05, - "loss": 2.2743, - "step": 342620 - }, - { - "epoch": 0.6, - "learning_rate": 2.0124722287133308e-05, - "loss": 2.3048, - "step": 342630 - }, - { - "epoch": 0.6, - "learning_rate": 2.012385034720648e-05, - "loss": 2.3266, - "step": 342640 - }, - { - "epoch": 0.6, - "learning_rate": 2.0122978407279652e-05, - "loss": 2.3572, - "step": 342650 - }, - { - "epoch": 0.6, - "learning_rate": 2.012210646735283e-05, - "loss": 2.4742, - "step": 342660 - }, - { - "epoch": 0.6, - "learning_rate": 2.0121234527426e-05, - "loss": 2.2968, - "step": 342670 - }, - { - "epoch": 0.6, - "learning_rate": 2.0120362587499173e-05, - "loss": 2.2431, - "step": 342680 - }, - { - "epoch": 0.6, - "learning_rate": 2.0119490647572343e-05, - "loss": 2.4659, - "step": 342690 - }, - { - "epoch": 0.6, - "learning_rate": 2.011861870764552e-05, - "loss": 2.4039, - "step": 342700 - }, - { - "epoch": 0.6, - "learning_rate": 2.011774676771869e-05, - "loss": 2.2555, - "step": 342710 - }, - { - "epoch": 0.6, - "learning_rate": 2.0116874827791865e-05, - "loss": 2.4472, - "step": 342720 - }, - { - "epoch": 0.6, - "learning_rate": 2.011600288786504e-05, - "loss": 2.373, - "step": 342730 - }, - { - "epoch": 0.6, - "learning_rate": 2.0115130947938212e-05, - "loss": 2.3874, - "step": 342740 - }, - { - "epoch": 0.6, - "learning_rate": 2.0114259008011386e-05, - "loss": 2.1955, - "step": 342750 - }, - { - "epoch": 0.6, - "learning_rate": 2.0113387068084556e-05, - "loss": 2.2682, - "step": 342760 - }, - { - "epoch": 0.6, - "learning_rate": 2.011251512815773e-05, - "loss": 2.3188, - "step": 342770 - }, - { - "epoch": 0.6, - "learning_rate": 2.0111643188230904e-05, - "loss": 2.4105, - "step": 342780 - }, - { - "epoch": 0.6, - "learning_rate": 2.0110771248304078e-05, - "loss": 2.2887, - "step": 342790 - }, - { - "epoch": 0.6, - "learning_rate": 2.010989930837725e-05, - "loss": 2.2043, - "step": 342800 - }, - { - "epoch": 0.6, - "learning_rate": 2.0109027368450425e-05, - "loss": 2.354, - "step": 342810 - }, - { - "epoch": 0.6, - "learning_rate": 2.01081554285236e-05, - "loss": 2.4025, - "step": 342820 - }, - { - "epoch": 0.6, - "learning_rate": 2.010728348859677e-05, - "loss": 2.3237, - "step": 342830 - }, - { - "epoch": 0.6, - "learning_rate": 2.0106411548669943e-05, - "loss": 2.2479, - "step": 342840 - }, - { - "epoch": 0.6, - "learning_rate": 2.0105539608743117e-05, - "loss": 2.2897, - "step": 342850 - }, - { - "epoch": 0.6, - "learning_rate": 2.010466766881629e-05, - "loss": 2.4056, - "step": 342860 - }, - { - "epoch": 0.6, - "learning_rate": 2.0103795728889465e-05, - "loss": 2.3878, - "step": 342870 - }, - { - "epoch": 0.6, - "learning_rate": 2.0102923788962635e-05, - "loss": 2.4018, - "step": 342880 - }, - { - "epoch": 0.6, - "learning_rate": 2.0102051849035812e-05, - "loss": 2.4445, - "step": 342890 - }, - { - "epoch": 0.6, - "learning_rate": 2.0101179909108982e-05, - "loss": 2.266, - "step": 342900 - }, - { - "epoch": 0.6, - "learning_rate": 2.0100307969182156e-05, - "loss": 2.3186, - "step": 342910 - }, - { - "epoch": 0.6, - "learning_rate": 2.009943602925533e-05, - "loss": 2.2662, - "step": 342920 - }, - { - "epoch": 0.6, - "learning_rate": 2.0098564089328504e-05, - "loss": 2.4012, - "step": 342930 - }, - { - "epoch": 0.6, - "learning_rate": 2.0097692149401674e-05, - "loss": 2.2771, - "step": 342940 - }, - { - "epoch": 0.6, - "learning_rate": 2.0096820209474848e-05, - "loss": 2.5058, - "step": 342950 - }, - { - "epoch": 0.6, - "learning_rate": 2.009594826954802e-05, - "loss": 2.3043, - "step": 342960 - }, - { - "epoch": 0.6, - "learning_rate": 2.0095076329621195e-05, - "loss": 2.3272, - "step": 342970 - }, - { - "epoch": 0.6, - "learning_rate": 2.009420438969437e-05, - "loss": 2.2796, - "step": 342980 - }, - { - "epoch": 0.6, - "learning_rate": 2.009333244976754e-05, - "loss": 2.2553, - "step": 342990 - }, - { - "epoch": 0.6, - "learning_rate": 2.0092460509840717e-05, - "loss": 2.3804, - "step": 343000 - }, - { - "epoch": 0.6, - "learning_rate": 2.0091588569913887e-05, - "loss": 2.2877, - "step": 343010 - }, - { - "epoch": 0.6, - "learning_rate": 2.009071662998706e-05, - "loss": 2.3787, - "step": 343020 - }, - { - "epoch": 0.6, - "learning_rate": 2.0089844690060235e-05, - "loss": 2.3367, - "step": 343030 - }, - { - "epoch": 0.6, - "learning_rate": 2.008897275013341e-05, - "loss": 2.3874, - "step": 343040 - }, - { - "epoch": 0.6, - "learning_rate": 2.0088100810206582e-05, - "loss": 2.2729, - "step": 343050 - }, - { - "epoch": 0.6, - "learning_rate": 2.0087228870279753e-05, - "loss": 2.3187, - "step": 343060 - }, - { - "epoch": 0.6, - "learning_rate": 2.008635693035293e-05, - "loss": 2.2713, - "step": 343070 - }, - { - "epoch": 0.6, - "learning_rate": 2.00854849904261e-05, - "loss": 2.4274, - "step": 343080 - }, - { - "epoch": 0.6, - "learning_rate": 2.0084613050499274e-05, - "loss": 2.2517, - "step": 343090 - }, - { - "epoch": 0.6, - "learning_rate": 2.0083741110572448e-05, - "loss": 2.2646, - "step": 343100 - }, - { - "epoch": 0.6, - "learning_rate": 2.008286917064562e-05, - "loss": 2.2316, - "step": 343110 - }, - { - "epoch": 0.6, - "learning_rate": 2.0081997230718795e-05, - "loss": 2.2589, - "step": 343120 - }, - { - "epoch": 0.6, - "learning_rate": 2.0081125290791966e-05, - "loss": 2.2833, - "step": 343130 - }, - { - "epoch": 0.6, - "learning_rate": 2.008025335086514e-05, - "loss": 2.247, - "step": 343140 - }, - { - "epoch": 0.6, - "learning_rate": 2.0079381410938313e-05, - "loss": 2.381, - "step": 343150 - }, - { - "epoch": 0.6, - "learning_rate": 2.0078509471011487e-05, - "loss": 2.4367, - "step": 343160 - }, - { - "epoch": 0.6, - "learning_rate": 2.0077637531084657e-05, - "loss": 2.4037, - "step": 343170 - }, - { - "epoch": 0.6, - "learning_rate": 2.007676559115783e-05, - "loss": 2.2529, - "step": 343180 - }, - { - "epoch": 0.6, - "learning_rate": 2.0075893651231005e-05, - "loss": 2.3439, - "step": 343190 - }, - { - "epoch": 0.6, - "learning_rate": 2.007502171130418e-05, - "loss": 2.2854, - "step": 343200 - }, - { - "epoch": 0.6, - "learning_rate": 2.0074149771377352e-05, - "loss": 2.4401, - "step": 343210 - }, - { - "epoch": 0.6, - "learning_rate": 2.0073277831450526e-05, - "loss": 2.3239, - "step": 343220 - }, - { - "epoch": 0.6, - "learning_rate": 2.00724058915237e-05, - "loss": 2.3151, - "step": 343230 - }, - { - "epoch": 0.6, - "learning_rate": 2.007153395159687e-05, - "loss": 2.2901, - "step": 343240 - }, - { - "epoch": 0.6, - "learning_rate": 2.0070662011670044e-05, - "loss": 2.3912, - "step": 343250 - }, - { - "epoch": 0.6, - "learning_rate": 2.0069790071743218e-05, - "loss": 2.3642, - "step": 343260 - }, - { - "epoch": 0.6, - "learning_rate": 2.006891813181639e-05, - "loss": 2.3912, - "step": 343270 - }, - { - "epoch": 0.6, - "learning_rate": 2.0068046191889565e-05, - "loss": 2.3578, - "step": 343280 - }, - { - "epoch": 0.6, - "learning_rate": 2.0067174251962736e-05, - "loss": 2.295, - "step": 343290 - }, - { - "epoch": 0.6, - "learning_rate": 2.0066302312035913e-05, - "loss": 2.3181, - "step": 343300 - }, - { - "epoch": 0.6, - "learning_rate": 2.0065430372109083e-05, - "loss": 2.3716, - "step": 343310 - }, - { - "epoch": 0.6, - "learning_rate": 2.0064558432182257e-05, - "loss": 2.44, - "step": 343320 - }, - { - "epoch": 0.6, - "learning_rate": 2.006368649225543e-05, - "loss": 2.4053, - "step": 343330 - }, - { - "epoch": 0.6, - "learning_rate": 2.0062814552328605e-05, - "loss": 2.347, - "step": 343340 - }, - { - "epoch": 0.6, - "learning_rate": 2.006194261240178e-05, - "loss": 2.2775, - "step": 343350 - }, - { - "epoch": 0.6, - "learning_rate": 2.006107067247495e-05, - "loss": 2.254, - "step": 343360 - }, - { - "epoch": 0.6, - "learning_rate": 2.0060198732548126e-05, - "loss": 2.2812, - "step": 343370 - }, - { - "epoch": 0.6, - "learning_rate": 2.0059326792621296e-05, - "loss": 2.2749, - "step": 343380 - }, - { - "epoch": 0.6, - "learning_rate": 2.005845485269447e-05, - "loss": 2.3787, - "step": 343390 - }, - { - "epoch": 0.6, - "learning_rate": 2.005758291276764e-05, - "loss": 2.3895, - "step": 343400 - }, - { - "epoch": 0.6, - "learning_rate": 2.0056710972840818e-05, - "loss": 2.3474, - "step": 343410 - }, - { - "epoch": 0.6, - "learning_rate": 2.0055839032913988e-05, - "loss": 2.2279, - "step": 343420 - }, - { - "epoch": 0.6, - "learning_rate": 2.0054967092987162e-05, - "loss": 2.329, - "step": 343430 - }, - { - "epoch": 0.6, - "learning_rate": 2.0054095153060336e-05, - "loss": 2.3811, - "step": 343440 - }, - { - "epoch": 0.6, - "learning_rate": 2.005322321313351e-05, - "loss": 2.2899, - "step": 343450 - }, - { - "epoch": 0.6, - "learning_rate": 2.0052351273206683e-05, - "loss": 2.3068, - "step": 343460 - }, - { - "epoch": 0.6, - "learning_rate": 2.0051479333279853e-05, - "loss": 2.3113, - "step": 343470 - }, - { - "epoch": 0.6, - "learning_rate": 2.005060739335303e-05, - "loss": 2.4507, - "step": 343480 - }, - { - "epoch": 0.6, - "learning_rate": 2.00497354534262e-05, - "loss": 2.3234, - "step": 343490 - }, - { - "epoch": 0.6, - "learning_rate": 2.0048863513499375e-05, - "loss": 2.2999, - "step": 343500 - }, - { - "epoch": 0.6, - "learning_rate": 2.004799157357255e-05, - "loss": 2.2687, - "step": 343510 - }, - { - "epoch": 0.6, - "learning_rate": 2.0047119633645722e-05, - "loss": 2.429, - "step": 343520 - }, - { - "epoch": 0.6, - "learning_rate": 2.0046247693718896e-05, - "loss": 2.3207, - "step": 343530 - }, - { - "epoch": 0.6, - "learning_rate": 2.0045375753792066e-05, - "loss": 2.4138, - "step": 343540 - }, - { - "epoch": 0.6, - "learning_rate": 2.004450381386524e-05, - "loss": 2.2146, - "step": 343550 - }, - { - "epoch": 0.6, - "learning_rate": 2.0043631873938414e-05, - "loss": 2.39, - "step": 343560 - }, - { - "epoch": 0.6, - "learning_rate": 2.0042759934011588e-05, - "loss": 2.254, - "step": 343570 - }, - { - "epoch": 0.6, - "learning_rate": 2.0041887994084758e-05, - "loss": 2.2674, - "step": 343580 - }, - { - "epoch": 0.6, - "learning_rate": 2.0041016054157935e-05, - "loss": 2.2599, - "step": 343590 - }, - { - "epoch": 0.6, - "learning_rate": 2.004014411423111e-05, - "loss": 2.2571, - "step": 343600 - }, - { - "epoch": 0.6, - "learning_rate": 2.003927217430428e-05, - "loss": 2.3184, - "step": 343610 - }, - { - "epoch": 0.6, - "learning_rate": 2.0038400234377453e-05, - "loss": 2.4391, - "step": 343620 - }, - { - "epoch": 0.6, - "learning_rate": 2.0037528294450627e-05, - "loss": 2.3896, - "step": 343630 - }, - { - "epoch": 0.6, - "learning_rate": 2.00366563545238e-05, - "loss": 2.3646, - "step": 343640 - }, - { - "epoch": 0.6, - "learning_rate": 2.003578441459697e-05, - "loss": 2.3757, - "step": 343650 - }, - { - "epoch": 0.6, - "learning_rate": 2.0034912474670145e-05, - "loss": 2.2369, - "step": 343660 - }, - { - "epoch": 0.6, - "learning_rate": 2.003404053474332e-05, - "loss": 2.3398, - "step": 343670 - }, - { - "epoch": 0.6, - "learning_rate": 2.0033168594816492e-05, - "loss": 2.3956, - "step": 343680 - }, - { - "epoch": 0.6, - "learning_rate": 2.0032296654889666e-05, - "loss": 2.2408, - "step": 343690 - }, - { - "epoch": 0.6, - "learning_rate": 2.0031424714962837e-05, - "loss": 2.2298, - "step": 343700 - }, - { - "epoch": 0.6, - "learning_rate": 2.0030552775036014e-05, - "loss": 2.2659, - "step": 343710 - }, - { - "epoch": 0.6, - "learning_rate": 2.0029680835109184e-05, - "loss": 2.3391, - "step": 343720 - }, - { - "epoch": 0.6, - "learning_rate": 2.0028808895182358e-05, - "loss": 2.3367, - "step": 343730 - }, - { - "epoch": 0.6, - "learning_rate": 2.002793695525553e-05, - "loss": 2.3085, - "step": 343740 - }, - { - "epoch": 0.6, - "learning_rate": 2.0027065015328705e-05, - "loss": 2.3237, - "step": 343750 - }, - { - "epoch": 0.6, - "learning_rate": 2.002619307540188e-05, - "loss": 2.2756, - "step": 343760 - }, - { - "epoch": 0.6, - "learning_rate": 2.002532113547505e-05, - "loss": 2.3863, - "step": 343770 - }, - { - "epoch": 0.6, - "learning_rate": 2.0024449195548227e-05, - "loss": 2.2377, - "step": 343780 - }, - { - "epoch": 0.6, - "learning_rate": 2.0023577255621397e-05, - "loss": 2.4038, - "step": 343790 - }, - { - "epoch": 0.6, - "learning_rate": 2.002270531569457e-05, - "loss": 2.3944, - "step": 343800 - }, - { - "epoch": 0.6, - "learning_rate": 2.002183337576774e-05, - "loss": 2.2655, - "step": 343810 - }, - { - "epoch": 0.6, - "learning_rate": 2.002096143584092e-05, - "loss": 2.1941, - "step": 343820 - }, - { - "epoch": 0.6, - "learning_rate": 2.0020089495914092e-05, - "loss": 2.3272, - "step": 343830 - }, - { - "epoch": 0.6, - "learning_rate": 2.0019217555987263e-05, - "loss": 2.2535, - "step": 343840 - }, - { - "epoch": 0.6, - "learning_rate": 2.001834561606044e-05, - "loss": 2.304, - "step": 343850 - }, - { - "epoch": 0.6, - "learning_rate": 2.001747367613361e-05, - "loss": 2.3538, - "step": 343860 - }, - { - "epoch": 0.6, - "learning_rate": 2.0016601736206784e-05, - "loss": 2.2538, - "step": 343870 - }, - { - "epoch": 0.6, - "learning_rate": 2.0015729796279954e-05, - "loss": 2.2407, - "step": 343880 - }, - { - "epoch": 0.6, - "learning_rate": 2.001485785635313e-05, - "loss": 2.2129, - "step": 343890 - }, - { - "epoch": 0.6, - "learning_rate": 2.0013985916426302e-05, - "loss": 2.3497, - "step": 343900 - }, - { - "epoch": 0.6, - "learning_rate": 2.0013113976499476e-05, - "loss": 2.433, - "step": 343910 - }, - { - "epoch": 0.6, - "learning_rate": 2.001224203657265e-05, - "loss": 2.3011, - "step": 343920 - }, - { - "epoch": 0.6, - "learning_rate": 2.0011370096645823e-05, - "loss": 2.2722, - "step": 343930 - }, - { - "epoch": 0.6, - "learning_rate": 2.0010498156718997e-05, - "loss": 2.3689, - "step": 343940 - }, - { - "epoch": 0.6, - "learning_rate": 2.0009626216792167e-05, - "loss": 2.3368, - "step": 343950 - }, - { - "epoch": 0.6, - "learning_rate": 2.000875427686534e-05, - "loss": 2.3711, - "step": 343960 - }, - { - "epoch": 0.6, - "learning_rate": 2.0007882336938515e-05, - "loss": 2.379, - "step": 343970 - }, - { - "epoch": 0.6, - "learning_rate": 2.000701039701169e-05, - "loss": 2.3641, - "step": 343980 - }, - { - "epoch": 0.6, - "learning_rate": 2.0006138457084862e-05, - "loss": 2.3239, - "step": 343990 - }, - { - "epoch": 0.6, - "learning_rate": 2.0005266517158036e-05, - "loss": 2.2927, - "step": 344000 - }, - { - "epoch": 0.6, - "learning_rate": 2.000439457723121e-05, - "loss": 2.4385, - "step": 344010 - }, - { - "epoch": 0.6, - "learning_rate": 2.000352263730438e-05, - "loss": 2.4148, - "step": 344020 - }, - { - "epoch": 0.6, - "learning_rate": 2.0002650697377554e-05, - "loss": 2.2551, - "step": 344030 - }, - { - "epoch": 0.6, - "learning_rate": 2.0001778757450728e-05, - "loss": 2.3722, - "step": 344040 - }, - { - "epoch": 0.6, - "learning_rate": 2.00009068175239e-05, - "loss": 2.4626, - "step": 344050 - }, - { - "epoch": 0.6, - "learning_rate": 2.0000034877597072e-05, - "loss": 2.3122, - "step": 344060 - }, - { - "epoch": 0.6, - "learning_rate": 1.9999162937670246e-05, - "loss": 2.3392, - "step": 344070 - }, - { - "epoch": 0.6, - "learning_rate": 1.9998290997743423e-05, - "loss": 2.3582, - "step": 344080 - }, - { - "epoch": 0.6, - "learning_rate": 1.9997419057816593e-05, - "loss": 2.3369, - "step": 344090 - }, - { - "epoch": 0.6, - "learning_rate": 1.9996547117889767e-05, - "loss": 2.4265, - "step": 344100 - }, - { - "epoch": 0.6, - "learning_rate": 1.9995675177962937e-05, - "loss": 2.317, - "step": 344110 - }, - { - "epoch": 0.6, - "learning_rate": 1.9994803238036115e-05, - "loss": 2.2944, - "step": 344120 - }, - { - "epoch": 0.6, - "learning_rate": 1.9993931298109285e-05, - "loss": 2.3278, - "step": 344130 - }, - { - "epoch": 0.6, - "learning_rate": 1.999305935818246e-05, - "loss": 2.2587, - "step": 344140 - }, - { - "epoch": 0.6, - "learning_rate": 1.9992187418255633e-05, - "loss": 2.4103, - "step": 344150 - }, - { - "epoch": 0.6, - "learning_rate": 1.9991315478328806e-05, - "loss": 2.4173, - "step": 344160 - }, - { - "epoch": 0.6, - "learning_rate": 1.999044353840198e-05, - "loss": 2.3098, - "step": 344170 - }, - { - "epoch": 0.6, - "learning_rate": 1.998957159847515e-05, - "loss": 2.3136, - "step": 344180 - }, - { - "epoch": 0.6, - "learning_rate": 1.9988699658548328e-05, - "loss": 2.3789, - "step": 344190 - }, - { - "epoch": 0.6, - "learning_rate": 1.9987827718621498e-05, - "loss": 2.3386, - "step": 344200 - }, - { - "epoch": 0.6, - "learning_rate": 1.9986955778694672e-05, - "loss": 2.2411, - "step": 344210 - }, - { - "epoch": 0.6, - "learning_rate": 1.9986083838767846e-05, - "loss": 2.3405, - "step": 344220 - }, - { - "epoch": 0.6, - "learning_rate": 1.998521189884102e-05, - "loss": 2.4213, - "step": 344230 - }, - { - "epoch": 0.6, - "learning_rate": 1.9984339958914193e-05, - "loss": 2.2516, - "step": 344240 - }, - { - "epoch": 0.6, - "learning_rate": 1.9983468018987363e-05, - "loss": 2.3386, - "step": 344250 - }, - { - "epoch": 0.6, - "learning_rate": 1.998259607906054e-05, - "loss": 2.2585, - "step": 344260 - }, - { - "epoch": 0.6, - "learning_rate": 1.998172413913371e-05, - "loss": 2.2863, - "step": 344270 - }, - { - "epoch": 0.6, - "learning_rate": 1.9980852199206885e-05, - "loss": 2.4447, - "step": 344280 - }, - { - "epoch": 0.6, - "learning_rate": 1.9979980259280055e-05, - "loss": 2.2669, - "step": 344290 - }, - { - "epoch": 0.6, - "learning_rate": 1.9979108319353232e-05, - "loss": 2.329, - "step": 344300 - }, - { - "epoch": 0.6, - "learning_rate": 1.9978236379426403e-05, - "loss": 2.2927, - "step": 344310 - }, - { - "epoch": 0.6, - "learning_rate": 1.9977364439499576e-05, - "loss": 2.4112, - "step": 344320 - }, - { - "epoch": 0.6, - "learning_rate": 1.997649249957275e-05, - "loss": 2.4204, - "step": 344330 - }, - { - "epoch": 0.6, - "learning_rate": 1.9975620559645924e-05, - "loss": 2.4236, - "step": 344340 - }, - { - "epoch": 0.6, - "learning_rate": 1.9974748619719098e-05, - "loss": 2.3648, - "step": 344350 - }, - { - "epoch": 0.6, - "learning_rate": 1.9973876679792268e-05, - "loss": 2.3168, - "step": 344360 - }, - { - "epoch": 0.6, - "learning_rate": 1.9973004739865442e-05, - "loss": 2.1646, - "step": 344370 - }, - { - "epoch": 0.6, - "learning_rate": 1.9972132799938616e-05, - "loss": 2.4149, - "step": 344380 - }, - { - "epoch": 0.6, - "learning_rate": 1.997126086001179e-05, - "loss": 2.2952, - "step": 344390 - }, - { - "epoch": 0.6, - "learning_rate": 1.9970388920084963e-05, - "loss": 2.4156, - "step": 344400 - }, - { - "epoch": 0.6, - "learning_rate": 1.9969516980158137e-05, - "loss": 2.375, - "step": 344410 - }, - { - "epoch": 0.6, - "learning_rate": 1.996864504023131e-05, - "loss": 2.3324, - "step": 344420 - }, - { - "epoch": 0.6, - "learning_rate": 1.996777310030448e-05, - "loss": 2.2556, - "step": 344430 - }, - { - "epoch": 0.6, - "learning_rate": 1.9966901160377655e-05, - "loss": 2.2859, - "step": 344440 - }, - { - "epoch": 0.6, - "learning_rate": 1.996602922045083e-05, - "loss": 2.3925, - "step": 344450 - }, - { - "epoch": 0.6, - "learning_rate": 1.9965157280524002e-05, - "loss": 2.2517, - "step": 344460 - }, - { - "epoch": 0.6, - "learning_rate": 1.9964285340597176e-05, - "loss": 2.3853, - "step": 344470 - }, - { - "epoch": 0.6, - "learning_rate": 1.9963413400670347e-05, - "loss": 2.3613, - "step": 344480 - }, - { - "epoch": 0.6, - "learning_rate": 1.9962541460743524e-05, - "loss": 2.5729, - "step": 344490 - }, - { - "epoch": 0.6, - "learning_rate": 1.9961669520816694e-05, - "loss": 2.3846, - "step": 344500 - }, - { - "epoch": 0.6, - "learning_rate": 1.9960797580889868e-05, - "loss": 2.257, - "step": 344510 - }, - { - "epoch": 0.6, - "learning_rate": 1.995992564096304e-05, - "loss": 2.3763, - "step": 344520 - }, - { - "epoch": 0.6, - "learning_rate": 1.9959053701036215e-05, - "loss": 2.3438, - "step": 344530 - }, - { - "epoch": 0.6, - "learning_rate": 1.9958181761109386e-05, - "loss": 2.302, - "step": 344540 - }, - { - "epoch": 0.6, - "learning_rate": 1.995730982118256e-05, - "loss": 2.3483, - "step": 344550 - }, - { - "epoch": 0.6, - "learning_rate": 1.9956437881255737e-05, - "loss": 2.3227, - "step": 344560 - }, - { - "epoch": 0.6, - "learning_rate": 1.9955565941328907e-05, - "loss": 2.3424, - "step": 344570 - }, - { - "epoch": 0.6, - "learning_rate": 1.995469400140208e-05, - "loss": 2.3546, - "step": 344580 - }, - { - "epoch": 0.6, - "learning_rate": 1.995382206147525e-05, - "loss": 2.3271, - "step": 344590 - }, - { - "epoch": 0.6, - "learning_rate": 1.995295012154843e-05, - "loss": 2.3659, - "step": 344600 - }, - { - "epoch": 0.6, - "learning_rate": 1.99520781816216e-05, - "loss": 2.2466, - "step": 344610 - }, - { - "epoch": 0.6, - "learning_rate": 1.9951206241694773e-05, - "loss": 2.2745, - "step": 344620 - }, - { - "epoch": 0.6, - "learning_rate": 1.9950334301767946e-05, - "loss": 2.3244, - "step": 344630 - }, - { - "epoch": 0.6, - "learning_rate": 1.994946236184112e-05, - "loss": 2.3536, - "step": 344640 - }, - { - "epoch": 0.6, - "learning_rate": 1.9948590421914294e-05, - "loss": 2.2948, - "step": 344650 - }, - { - "epoch": 0.6, - "learning_rate": 1.9947718481987464e-05, - "loss": 2.419, - "step": 344660 - }, - { - "epoch": 0.6, - "learning_rate": 1.994684654206064e-05, - "loss": 2.3499, - "step": 344670 - }, - { - "epoch": 0.6, - "learning_rate": 1.9945974602133812e-05, - "loss": 2.332, - "step": 344680 - }, - { - "epoch": 0.6, - "learning_rate": 1.9945102662206986e-05, - "loss": 2.2027, - "step": 344690 - }, - { - "epoch": 0.6, - "learning_rate": 1.994423072228016e-05, - "loss": 2.2927, - "step": 344700 - }, - { - "epoch": 0.6, - "learning_rate": 1.9943358782353333e-05, - "loss": 2.2606, - "step": 344710 - }, - { - "epoch": 0.6, - "learning_rate": 1.9942486842426507e-05, - "loss": 2.1753, - "step": 344720 - }, - { - "epoch": 0.6, - "learning_rate": 1.9941614902499677e-05, - "loss": 2.3006, - "step": 344730 - }, - { - "epoch": 0.6, - "learning_rate": 1.994074296257285e-05, - "loss": 2.3293, - "step": 344740 - }, - { - "epoch": 0.6, - "learning_rate": 1.9939871022646025e-05, - "loss": 2.3565, - "step": 344750 - }, - { - "epoch": 0.6, - "learning_rate": 1.99389990827192e-05, - "loss": 2.2583, - "step": 344760 - }, - { - "epoch": 0.6, - "learning_rate": 1.993812714279237e-05, - "loss": 2.3013, - "step": 344770 - }, - { - "epoch": 0.6, - "learning_rate": 1.9937255202865546e-05, - "loss": 2.3568, - "step": 344780 - }, - { - "epoch": 0.6, - "learning_rate": 1.9936383262938717e-05, - "loss": 2.3378, - "step": 344790 - }, - { - "epoch": 0.6, - "learning_rate": 1.993551132301189e-05, - "loss": 2.4567, - "step": 344800 - }, - { - "epoch": 0.6, - "learning_rate": 1.9934639383085064e-05, - "loss": 2.3154, - "step": 344810 - }, - { - "epoch": 0.6, - "learning_rate": 1.9933767443158238e-05, - "loss": 2.3467, - "step": 344820 - }, - { - "epoch": 0.6, - "learning_rate": 1.993289550323141e-05, - "loss": 2.2186, - "step": 344830 - }, - { - "epoch": 0.6, - "learning_rate": 1.9932023563304582e-05, - "loss": 2.2557, - "step": 344840 - }, - { - "epoch": 0.6, - "learning_rate": 1.9931151623377756e-05, - "loss": 2.4095, - "step": 344850 - }, - { - "epoch": 0.6, - "learning_rate": 1.993027968345093e-05, - "loss": 2.3587, - "step": 344860 - }, - { - "epoch": 0.6, - "learning_rate": 1.9929407743524103e-05, - "loss": 2.2901, - "step": 344870 - }, - { - "epoch": 0.6, - "learning_rate": 1.9928535803597277e-05, - "loss": 2.2152, - "step": 344880 - }, - { - "epoch": 0.6, - "learning_rate": 1.9927663863670447e-05, - "loss": 2.3479, - "step": 344890 - }, - { - "epoch": 0.6, - "learning_rate": 1.9926791923743625e-05, - "loss": 2.2769, - "step": 344900 - }, - { - "epoch": 0.6, - "learning_rate": 1.9925919983816795e-05, - "loss": 2.3829, - "step": 344910 - }, - { - "epoch": 0.6, - "learning_rate": 1.992504804388997e-05, - "loss": 2.4816, - "step": 344920 - }, - { - "epoch": 0.6, - "learning_rate": 1.9924176103963143e-05, - "loss": 2.2979, - "step": 344930 - }, - { - "epoch": 0.6, - "learning_rate": 1.9923304164036316e-05, - "loss": 2.3456, - "step": 344940 - }, - { - "epoch": 0.6, - "learning_rate": 1.992243222410949e-05, - "loss": 2.2483, - "step": 344950 - }, - { - "epoch": 0.6, - "learning_rate": 1.992156028418266e-05, - "loss": 2.3699, - "step": 344960 - }, - { - "epoch": 0.6, - "learning_rate": 1.9920688344255838e-05, - "loss": 2.3935, - "step": 344970 - }, - { - "epoch": 0.6, - "learning_rate": 1.9919816404329008e-05, - "loss": 2.3107, - "step": 344980 - }, - { - "epoch": 0.6, - "learning_rate": 1.9918944464402182e-05, - "loss": 2.3673, - "step": 344990 - }, - { - "epoch": 0.6, - "learning_rate": 1.9918072524475352e-05, - "loss": 2.3251, - "step": 345000 - }, - { - "epoch": 0.6, - "learning_rate": 1.991720058454853e-05, - "loss": 2.3729, - "step": 345010 - }, - { - "epoch": 0.6, - "learning_rate": 1.99163286446217e-05, - "loss": 2.3712, - "step": 345020 - }, - { - "epoch": 0.6, - "learning_rate": 1.9915456704694873e-05, - "loss": 2.2759, - "step": 345030 - }, - { - "epoch": 0.6, - "learning_rate": 1.9914584764768047e-05, - "loss": 2.3497, - "step": 345040 - }, - { - "epoch": 0.6, - "learning_rate": 1.991371282484122e-05, - "loss": 2.3191, - "step": 345050 - }, - { - "epoch": 0.6, - "learning_rate": 1.9912840884914395e-05, - "loss": 2.3711, - "step": 345060 - }, - { - "epoch": 0.6, - "learning_rate": 1.9911968944987565e-05, - "loss": 2.2549, - "step": 345070 - }, - { - "epoch": 0.6, - "learning_rate": 1.9911097005060742e-05, - "loss": 2.3878, - "step": 345080 - }, - { - "epoch": 0.6, - "learning_rate": 1.9910225065133913e-05, - "loss": 2.3586, - "step": 345090 - }, - { - "epoch": 0.6, - "learning_rate": 1.9909353125207086e-05, - "loss": 2.3682, - "step": 345100 - }, - { - "epoch": 0.6, - "learning_rate": 1.990848118528026e-05, - "loss": 2.3796, - "step": 345110 - }, - { - "epoch": 0.6, - "learning_rate": 1.9907609245353434e-05, - "loss": 2.3, - "step": 345120 - }, - { - "epoch": 0.6, - "learning_rate": 1.9906737305426608e-05, - "loss": 2.2874, - "step": 345130 - }, - { - "epoch": 0.6, - "learning_rate": 1.9905865365499778e-05, - "loss": 2.3221, - "step": 345140 - }, - { - "epoch": 0.6, - "learning_rate": 1.9904993425572952e-05, - "loss": 2.3494, - "step": 345150 - }, - { - "epoch": 0.6, - "learning_rate": 1.9904121485646126e-05, - "loss": 2.2688, - "step": 345160 - }, - { - "epoch": 0.6, - "learning_rate": 1.99032495457193e-05, - "loss": 2.4109, - "step": 345170 - }, - { - "epoch": 0.6, - "learning_rate": 1.9902377605792473e-05, - "loss": 2.246, - "step": 345180 - }, - { - "epoch": 0.6, - "learning_rate": 1.9901505665865647e-05, - "loss": 2.3192, - "step": 345190 - }, - { - "epoch": 0.6, - "learning_rate": 1.990063372593882e-05, - "loss": 2.2877, - "step": 345200 - }, - { - "epoch": 0.6, - "learning_rate": 1.989976178601199e-05, - "loss": 2.323, - "step": 345210 - }, - { - "epoch": 0.6, - "learning_rate": 1.9898889846085165e-05, - "loss": 2.4049, - "step": 345220 - }, - { - "epoch": 0.6, - "learning_rate": 1.989801790615834e-05, - "loss": 2.363, - "step": 345230 - }, - { - "epoch": 0.6, - "learning_rate": 1.9897145966231512e-05, - "loss": 2.4095, - "step": 345240 - }, - { - "epoch": 0.6, - "learning_rate": 1.9896274026304683e-05, - "loss": 2.3882, - "step": 345250 - }, - { - "epoch": 0.6, - "learning_rate": 1.9895402086377857e-05, - "loss": 2.2454, - "step": 345260 - }, - { - "epoch": 0.6, - "learning_rate": 1.989453014645103e-05, - "loss": 2.309, - "step": 345270 - }, - { - "epoch": 0.6, - "learning_rate": 1.9893658206524204e-05, - "loss": 2.3518, - "step": 345280 - }, - { - "epoch": 0.6, - "learning_rate": 1.9892786266597378e-05, - "loss": 2.3246, - "step": 345290 - }, - { - "epoch": 0.6, - "learning_rate": 1.9891914326670548e-05, - "loss": 2.3884, - "step": 345300 - }, - { - "epoch": 0.6, - "learning_rate": 1.9891042386743725e-05, - "loss": 2.321, - "step": 345310 - }, - { - "epoch": 0.6, - "learning_rate": 1.9890170446816896e-05, - "loss": 2.3993, - "step": 345320 - }, - { - "epoch": 0.6, - "learning_rate": 1.988929850689007e-05, - "loss": 2.382, - "step": 345330 - }, - { - "epoch": 0.6, - "learning_rate": 1.9888426566963243e-05, - "loss": 2.3398, - "step": 345340 - }, - { - "epoch": 0.6, - "learning_rate": 1.9887554627036417e-05, - "loss": 2.3081, - "step": 345350 - }, - { - "epoch": 0.6, - "learning_rate": 1.988668268710959e-05, - "loss": 2.3151, - "step": 345360 - }, - { - "epoch": 0.6, - "learning_rate": 1.988581074718276e-05, - "loss": 2.4319, - "step": 345370 - }, - { - "epoch": 0.6, - "learning_rate": 1.988493880725594e-05, - "loss": 2.3954, - "step": 345380 - }, - { - "epoch": 0.6, - "learning_rate": 1.988406686732911e-05, - "loss": 2.3205, - "step": 345390 - }, - { - "epoch": 0.6, - "learning_rate": 1.9883194927402283e-05, - "loss": 2.319, - "step": 345400 - }, - { - "epoch": 0.6, - "learning_rate": 1.9882322987475453e-05, - "loss": 2.373, - "step": 345410 - }, - { - "epoch": 0.6, - "learning_rate": 1.988145104754863e-05, - "loss": 2.284, - "step": 345420 - }, - { - "epoch": 0.6, - "learning_rate": 1.9880579107621804e-05, - "loss": 2.3005, - "step": 345430 - }, - { - "epoch": 0.6, - "learning_rate": 1.9879707167694974e-05, - "loss": 2.295, - "step": 345440 - }, - { - "epoch": 0.6, - "learning_rate": 1.987883522776815e-05, - "loss": 2.2089, - "step": 345450 - }, - { - "epoch": 0.6, - "learning_rate": 1.9877963287841322e-05, - "loss": 2.3445, - "step": 345460 - }, - { - "epoch": 0.6, - "learning_rate": 1.9877091347914496e-05, - "loss": 2.309, - "step": 345470 - }, - { - "epoch": 0.6, - "learning_rate": 1.9876219407987666e-05, - "loss": 2.3322, - "step": 345480 - }, - { - "epoch": 0.6, - "learning_rate": 1.9875347468060843e-05, - "loss": 2.3232, - "step": 345490 - }, - { - "epoch": 0.6, - "learning_rate": 1.9874475528134014e-05, - "loss": 2.3262, - "step": 345500 - }, - { - "epoch": 0.6, - "learning_rate": 1.9873603588207187e-05, - "loss": 2.3877, - "step": 345510 - }, - { - "epoch": 0.6, - "learning_rate": 1.987273164828036e-05, - "loss": 2.3491, - "step": 345520 - }, - { - "epoch": 0.6, - "learning_rate": 1.9871859708353535e-05, - "loss": 2.2937, - "step": 345530 - }, - { - "epoch": 0.6, - "learning_rate": 1.987098776842671e-05, - "loss": 2.4053, - "step": 345540 - }, - { - "epoch": 0.6, - "learning_rate": 1.987011582849988e-05, - "loss": 2.2379, - "step": 345550 - }, - { - "epoch": 0.6, - "learning_rate": 1.9869243888573053e-05, - "loss": 2.3566, - "step": 345560 - }, - { - "epoch": 0.6, - "learning_rate": 1.9868371948646227e-05, - "loss": 2.4208, - "step": 345570 - }, - { - "epoch": 0.6, - "learning_rate": 1.98675000087194e-05, - "loss": 2.3083, - "step": 345580 - }, - { - "epoch": 0.6, - "learning_rate": 1.9866628068792574e-05, - "loss": 2.4203, - "step": 345590 - }, - { - "epoch": 0.6, - "learning_rate": 1.9865756128865748e-05, - "loss": 2.2595, - "step": 345600 - }, - { - "epoch": 0.6, - "learning_rate": 1.986488418893892e-05, - "loss": 2.266, - "step": 345610 - }, - { - "epoch": 0.6, - "learning_rate": 1.9864012249012092e-05, - "loss": 2.3753, - "step": 345620 - }, - { - "epoch": 0.6, - "learning_rate": 1.9863140309085266e-05, - "loss": 2.3999, - "step": 345630 - }, - { - "epoch": 0.6, - "learning_rate": 1.986226836915844e-05, - "loss": 2.3362, - "step": 345640 - }, - { - "epoch": 0.6, - "learning_rate": 1.9861396429231613e-05, - "loss": 2.2632, - "step": 345650 - }, - { - "epoch": 0.6, - "learning_rate": 1.9860524489304787e-05, - "loss": 2.3033, - "step": 345660 - }, - { - "epoch": 0.6, - "learning_rate": 1.9859652549377957e-05, - "loss": 2.4042, - "step": 345670 - }, - { - "epoch": 0.6, - "learning_rate": 1.9858780609451135e-05, - "loss": 2.2984, - "step": 345680 - }, - { - "epoch": 0.6, - "learning_rate": 1.9857908669524305e-05, - "loss": 2.4133, - "step": 345690 - }, - { - "epoch": 0.6, - "learning_rate": 1.985703672959748e-05, - "loss": 2.2195, - "step": 345700 - }, - { - "epoch": 0.6, - "learning_rate": 1.9856164789670653e-05, - "loss": 2.3369, - "step": 345710 - }, - { - "epoch": 0.6, - "learning_rate": 1.9855292849743826e-05, - "loss": 2.3068, - "step": 345720 - }, - { - "epoch": 0.6, - "learning_rate": 1.9854420909816997e-05, - "loss": 2.2945, - "step": 345730 - }, - { - "epoch": 0.6, - "learning_rate": 1.985354896989017e-05, - "loss": 2.3755, - "step": 345740 - }, - { - "epoch": 0.6, - "learning_rate": 1.9852677029963344e-05, - "loss": 2.238, - "step": 345750 - }, - { - "epoch": 0.6, - "learning_rate": 1.9851805090036518e-05, - "loss": 2.3775, - "step": 345760 - }, - { - "epoch": 0.6, - "learning_rate": 1.9850933150109692e-05, - "loss": 2.3858, - "step": 345770 - }, - { - "epoch": 0.6, - "learning_rate": 1.9850061210182862e-05, - "loss": 2.2876, - "step": 345780 - }, - { - "epoch": 0.6, - "learning_rate": 1.984918927025604e-05, - "loss": 2.4157, - "step": 345790 - }, - { - "epoch": 0.6, - "learning_rate": 1.984831733032921e-05, - "loss": 2.4465, - "step": 345800 - }, - { - "epoch": 0.6, - "learning_rate": 1.9847445390402383e-05, - "loss": 2.404, - "step": 345810 - }, - { - "epoch": 0.6, - "learning_rate": 1.9846573450475557e-05, - "loss": 2.2842, - "step": 345820 - }, - { - "epoch": 0.6, - "learning_rate": 1.984570151054873e-05, - "loss": 2.4134, - "step": 345830 - }, - { - "epoch": 0.6, - "learning_rate": 1.9844829570621905e-05, - "loss": 2.4017, - "step": 345840 - }, - { - "epoch": 0.6, - "learning_rate": 1.9843957630695075e-05, - "loss": 2.3132, - "step": 345850 - }, - { - "epoch": 0.6, - "learning_rate": 1.9843085690768252e-05, - "loss": 2.3906, - "step": 345860 - }, - { - "epoch": 0.6, - "learning_rate": 1.9842213750841423e-05, - "loss": 2.3513, - "step": 345870 - }, - { - "epoch": 0.6, - "learning_rate": 1.9841341810914596e-05, - "loss": 2.322, - "step": 345880 - }, - { - "epoch": 0.6, - "learning_rate": 1.9840469870987767e-05, - "loss": 2.4202, - "step": 345890 - }, - { - "epoch": 0.6, - "learning_rate": 1.9839597931060944e-05, - "loss": 2.366, - "step": 345900 - }, - { - "epoch": 0.6, - "learning_rate": 1.9838725991134118e-05, - "loss": 2.3909, - "step": 345910 - }, - { - "epoch": 0.6, - "learning_rate": 1.9837854051207288e-05, - "loss": 2.2991, - "step": 345920 - }, - { - "epoch": 0.6, - "learning_rate": 1.9836982111280462e-05, - "loss": 2.2661, - "step": 345930 - }, - { - "epoch": 0.6, - "learning_rate": 1.9836110171353636e-05, - "loss": 2.3354, - "step": 345940 - }, - { - "epoch": 0.6, - "learning_rate": 1.983523823142681e-05, - "loss": 2.2128, - "step": 345950 - }, - { - "epoch": 0.6, - "learning_rate": 1.983436629149998e-05, - "loss": 2.3179, - "step": 345960 - }, - { - "epoch": 0.6, - "learning_rate": 1.9833494351573154e-05, - "loss": 2.402, - "step": 345970 - }, - { - "epoch": 0.6, - "learning_rate": 1.9832622411646327e-05, - "loss": 2.2653, - "step": 345980 - }, - { - "epoch": 0.6, - "learning_rate": 1.98317504717195e-05, - "loss": 2.365, - "step": 345990 - }, - { - "epoch": 0.6, - "learning_rate": 1.9830878531792675e-05, - "loss": 2.3498, - "step": 346000 - }, - { - "epoch": 0.6, - "learning_rate": 1.983000659186585e-05, - "loss": 2.3211, - "step": 346010 - }, - { - "epoch": 0.6, - "learning_rate": 1.9829134651939022e-05, - "loss": 2.1962, - "step": 346020 - }, - { - "epoch": 0.6, - "learning_rate": 1.9828262712012193e-05, - "loss": 2.3663, - "step": 346030 - }, - { - "epoch": 0.6, - "learning_rate": 1.9827390772085367e-05, - "loss": 2.3567, - "step": 346040 - }, - { - "epoch": 0.6, - "learning_rate": 1.982651883215854e-05, - "loss": 2.4552, - "step": 346050 - }, - { - "epoch": 0.6, - "learning_rate": 1.9825646892231714e-05, - "loss": 2.3565, - "step": 346060 - }, - { - "epoch": 0.6, - "learning_rate": 1.9824774952304888e-05, - "loss": 2.3555, - "step": 346070 - }, - { - "epoch": 0.6, - "learning_rate": 1.9823903012378058e-05, - "loss": 2.217, - "step": 346080 - }, - { - "epoch": 0.6, - "learning_rate": 1.9823031072451235e-05, - "loss": 2.329, - "step": 346090 - }, - { - "epoch": 0.6, - "learning_rate": 1.9822159132524406e-05, - "loss": 2.3105, - "step": 346100 - }, - { - "epoch": 0.6, - "learning_rate": 1.982128719259758e-05, - "loss": 2.3658, - "step": 346110 - }, - { - "epoch": 0.6, - "learning_rate": 1.9820415252670753e-05, - "loss": 2.4063, - "step": 346120 - }, - { - "epoch": 0.6, - "learning_rate": 1.9819543312743927e-05, - "loss": 2.2907, - "step": 346130 - }, - { - "epoch": 0.6, - "learning_rate": 1.9818671372817098e-05, - "loss": 2.3145, - "step": 346140 - }, - { - "epoch": 0.6, - "learning_rate": 1.981779943289027e-05, - "loss": 2.367, - "step": 346150 - }, - { - "epoch": 0.6, - "learning_rate": 1.981692749296345e-05, - "loss": 2.4411, - "step": 346160 - }, - { - "epoch": 0.6, - "learning_rate": 1.981605555303662e-05, - "loss": 2.3556, - "step": 346170 - }, - { - "epoch": 0.6, - "learning_rate": 1.9815183613109793e-05, - "loss": 2.3575, - "step": 346180 - }, - { - "epoch": 0.6, - "learning_rate": 1.9814311673182963e-05, - "loss": 2.2792, - "step": 346190 - }, - { - "epoch": 0.6, - "learning_rate": 1.981343973325614e-05, - "loss": 2.4118, - "step": 346200 - }, - { - "epoch": 0.6, - "learning_rate": 1.981256779332931e-05, - "loss": 2.2964, - "step": 346210 - }, - { - "epoch": 0.6, - "learning_rate": 1.9811695853402484e-05, - "loss": 2.3778, - "step": 346220 - }, - { - "epoch": 0.6, - "learning_rate": 1.9810823913475658e-05, - "loss": 2.3689, - "step": 346230 - }, - { - "epoch": 0.6, - "learning_rate": 1.9809951973548832e-05, - "loss": 2.4007, - "step": 346240 - }, - { - "epoch": 0.6, - "learning_rate": 1.9809080033622006e-05, - "loss": 2.4159, - "step": 346250 - }, - { - "epoch": 0.6, - "learning_rate": 1.9808208093695176e-05, - "loss": 2.3522, - "step": 346260 - }, - { - "epoch": 0.6, - "learning_rate": 1.9807336153768353e-05, - "loss": 2.2156, - "step": 346270 - }, - { - "epoch": 0.6, - "learning_rate": 1.9806464213841524e-05, - "loss": 2.459, - "step": 346280 - }, - { - "epoch": 0.6, - "learning_rate": 1.9805592273914697e-05, - "loss": 2.2132, - "step": 346290 - }, - { - "epoch": 0.6, - "learning_rate": 1.980472033398787e-05, - "loss": 2.3219, - "step": 346300 - }, - { - "epoch": 0.6, - "learning_rate": 1.9803848394061045e-05, - "loss": 2.4217, - "step": 346310 - }, - { - "epoch": 0.6, - "learning_rate": 1.980297645413422e-05, - "loss": 2.2231, - "step": 346320 - }, - { - "epoch": 0.6, - "learning_rate": 1.980210451420739e-05, - "loss": 2.3108, - "step": 346330 - }, - { - "epoch": 0.6, - "learning_rate": 1.9801232574280563e-05, - "loss": 2.3381, - "step": 346340 - }, - { - "epoch": 0.6, - "learning_rate": 1.9800360634353737e-05, - "loss": 2.3581, - "step": 346350 - }, - { - "epoch": 0.6, - "learning_rate": 1.979948869442691e-05, - "loss": 2.2898, - "step": 346360 - }, - { - "epoch": 0.6, - "learning_rate": 1.979861675450008e-05, - "loss": 2.2533, - "step": 346370 - }, - { - "epoch": 0.6, - "learning_rate": 1.9797744814573258e-05, - "loss": 2.2698, - "step": 346380 - }, - { - "epoch": 0.6, - "learning_rate": 1.979687287464643e-05, - "loss": 2.315, - "step": 346390 - }, - { - "epoch": 0.6, - "learning_rate": 1.9796000934719602e-05, - "loss": 2.268, - "step": 346400 - }, - { - "epoch": 0.6, - "learning_rate": 1.9795128994792776e-05, - "loss": 2.2339, - "step": 346410 - }, - { - "epoch": 0.6, - "learning_rate": 1.979425705486595e-05, - "loss": 2.3464, - "step": 346420 - }, - { - "epoch": 0.6, - "learning_rate": 1.9793385114939123e-05, - "loss": 2.2631, - "step": 346430 - }, - { - "epoch": 0.6, - "learning_rate": 1.9792513175012294e-05, - "loss": 2.3938, - "step": 346440 - }, - { - "epoch": 0.6, - "learning_rate": 1.9791641235085467e-05, - "loss": 2.2795, - "step": 346450 - }, - { - "epoch": 0.6, - "learning_rate": 1.979076929515864e-05, - "loss": 2.3253, - "step": 346460 - }, - { - "epoch": 0.6, - "learning_rate": 1.9789897355231815e-05, - "loss": 2.3058, - "step": 346470 - }, - { - "epoch": 0.6, - "learning_rate": 1.978902541530499e-05, - "loss": 2.2443, - "step": 346480 - }, - { - "epoch": 0.6, - "learning_rate": 1.978815347537816e-05, - "loss": 2.3242, - "step": 346490 - }, - { - "epoch": 0.6, - "learning_rate": 1.9787281535451336e-05, - "loss": 2.4017, - "step": 346500 - }, - { - "epoch": 0.6, - "learning_rate": 1.9786409595524507e-05, - "loss": 2.3075, - "step": 346510 - }, - { - "epoch": 0.6, - "learning_rate": 1.978553765559768e-05, - "loss": 2.2732, - "step": 346520 - }, - { - "epoch": 0.6, - "learning_rate": 1.9784665715670854e-05, - "loss": 2.3599, - "step": 346530 - }, - { - "epoch": 0.6, - "learning_rate": 1.9783793775744028e-05, - "loss": 2.37, - "step": 346540 - }, - { - "epoch": 0.6, - "learning_rate": 1.9782921835817202e-05, - "loss": 2.4323, - "step": 346550 - }, - { - "epoch": 0.6, - "learning_rate": 1.9782049895890372e-05, - "loss": 2.3594, - "step": 346560 - }, - { - "epoch": 0.6, - "learning_rate": 1.978117795596355e-05, - "loss": 2.3462, - "step": 346570 - }, - { - "epoch": 0.6, - "learning_rate": 1.978030601603672e-05, - "loss": 2.3734, - "step": 346580 - }, - { - "epoch": 0.6, - "learning_rate": 1.9779434076109893e-05, - "loss": 2.2952, - "step": 346590 - }, - { - "epoch": 0.6, - "learning_rate": 1.9778562136183064e-05, - "loss": 2.3508, - "step": 346600 - }, - { - "epoch": 0.6, - "learning_rate": 1.977769019625624e-05, - "loss": 2.2997, - "step": 346610 - }, - { - "epoch": 0.6, - "learning_rate": 1.977681825632941e-05, - "loss": 2.1928, - "step": 346620 - }, - { - "epoch": 0.6, - "learning_rate": 1.9775946316402585e-05, - "loss": 2.3917, - "step": 346630 - }, - { - "epoch": 0.6, - "learning_rate": 1.977507437647576e-05, - "loss": 2.3242, - "step": 346640 - }, - { - "epoch": 0.6, - "learning_rate": 1.9774202436548933e-05, - "loss": 2.2709, - "step": 346650 - }, - { - "epoch": 0.6, - "learning_rate": 1.9773330496622106e-05, - "loss": 2.5074, - "step": 346660 - }, - { - "epoch": 0.6, - "learning_rate": 1.9772458556695277e-05, - "loss": 2.3776, - "step": 346670 - }, - { - "epoch": 0.6, - "learning_rate": 1.9771586616768454e-05, - "loss": 2.331, - "step": 346680 - }, - { - "epoch": 0.6, - "learning_rate": 1.9770714676841624e-05, - "loss": 2.3771, - "step": 346690 - }, - { - "epoch": 0.6, - "learning_rate": 1.9769842736914798e-05, - "loss": 2.3062, - "step": 346700 - }, - { - "epoch": 0.6, - "learning_rate": 1.9768970796987972e-05, - "loss": 2.3647, - "step": 346710 - }, - { - "epoch": 0.6, - "learning_rate": 1.9768098857061146e-05, - "loss": 2.3285, - "step": 346720 - }, - { - "epoch": 0.6, - "learning_rate": 1.976722691713432e-05, - "loss": 2.3026, - "step": 346730 - }, - { - "epoch": 0.6, - "learning_rate": 1.976635497720749e-05, - "loss": 2.383, - "step": 346740 - }, - { - "epoch": 0.6, - "learning_rate": 1.9765483037280664e-05, - "loss": 2.3266, - "step": 346750 - }, - { - "epoch": 0.6, - "learning_rate": 1.9764611097353837e-05, - "loss": 2.3471, - "step": 346760 - }, - { - "epoch": 0.6, - "learning_rate": 1.976373915742701e-05, - "loss": 2.3499, - "step": 346770 - }, - { - "epoch": 0.6, - "learning_rate": 1.9762867217500185e-05, - "loss": 2.3402, - "step": 346780 - }, - { - "epoch": 0.6, - "learning_rate": 1.976199527757336e-05, - "loss": 2.2301, - "step": 346790 - }, - { - "epoch": 0.6, - "learning_rate": 1.9761123337646532e-05, - "loss": 2.3383, - "step": 346800 - }, - { - "epoch": 0.6, - "learning_rate": 1.9760251397719703e-05, - "loss": 2.2863, - "step": 346810 - }, - { - "epoch": 0.6, - "learning_rate": 1.9759379457792877e-05, - "loss": 2.4041, - "step": 346820 - }, - { - "epoch": 0.6, - "learning_rate": 1.975850751786605e-05, - "loss": 2.2899, - "step": 346830 - }, - { - "epoch": 0.6, - "learning_rate": 1.9757635577939224e-05, - "loss": 2.3247, - "step": 346840 - }, - { - "epoch": 0.6, - "learning_rate": 1.9756763638012395e-05, - "loss": 2.3256, - "step": 346850 - }, - { - "epoch": 0.6, - "learning_rate": 1.975589169808557e-05, - "loss": 2.3809, - "step": 346860 - }, - { - "epoch": 0.6, - "learning_rate": 1.9755019758158742e-05, - "loss": 2.3043, - "step": 346870 - }, - { - "epoch": 0.6, - "learning_rate": 1.9754147818231916e-05, - "loss": 2.3306, - "step": 346880 - }, - { - "epoch": 0.6, - "learning_rate": 1.975327587830509e-05, - "loss": 2.2431, - "step": 346890 - }, - { - "epoch": 0.6, - "learning_rate": 1.975240393837826e-05, - "loss": 2.259, - "step": 346900 - }, - { - "epoch": 0.6, - "learning_rate": 1.9751531998451437e-05, - "loss": 2.4287, - "step": 346910 - }, - { - "epoch": 0.6, - "learning_rate": 1.9750660058524608e-05, - "loss": 2.3478, - "step": 346920 - }, - { - "epoch": 0.61, - "learning_rate": 1.974978811859778e-05, - "loss": 2.4424, - "step": 346930 - }, - { - "epoch": 0.61, - "learning_rate": 1.9748916178670955e-05, - "loss": 2.2437, - "step": 346940 - }, - { - "epoch": 0.61, - "learning_rate": 1.974804423874413e-05, - "loss": 2.3451, - "step": 346950 - }, - { - "epoch": 0.61, - "learning_rate": 1.9747172298817303e-05, - "loss": 2.304, - "step": 346960 - }, - { - "epoch": 0.61, - "learning_rate": 1.9746300358890473e-05, - "loss": 2.364, - "step": 346970 - }, - { - "epoch": 0.61, - "learning_rate": 1.974542841896365e-05, - "loss": 2.2997, - "step": 346980 - }, - { - "epoch": 0.61, - "learning_rate": 1.974455647903682e-05, - "loss": 2.3394, - "step": 346990 - }, - { - "epoch": 0.61, - "learning_rate": 1.9743684539109994e-05, - "loss": 2.2296, - "step": 347000 - }, - { - "epoch": 0.61, - "learning_rate": 1.9742812599183168e-05, - "loss": 2.2746, - "step": 347010 - }, - { - "epoch": 0.61, - "learning_rate": 1.9741940659256342e-05, - "loss": 2.3046, - "step": 347020 - }, - { - "epoch": 0.61, - "learning_rate": 1.9741068719329516e-05, - "loss": 2.2803, - "step": 347030 - }, - { - "epoch": 0.61, - "learning_rate": 1.9740196779402686e-05, - "loss": 2.333, - "step": 347040 - }, - { - "epoch": 0.61, - "learning_rate": 1.9739324839475863e-05, - "loss": 2.3762, - "step": 347050 - }, - { - "epoch": 0.61, - "learning_rate": 1.9738452899549034e-05, - "loss": 2.3486, - "step": 347060 - }, - { - "epoch": 0.61, - "learning_rate": 1.9737580959622207e-05, - "loss": 2.3907, - "step": 347070 - }, - { - "epoch": 0.61, - "learning_rate": 1.9736709019695378e-05, - "loss": 2.4936, - "step": 347080 - }, - { - "epoch": 0.61, - "learning_rate": 1.9735837079768555e-05, - "loss": 2.2571, - "step": 347090 - }, - { - "epoch": 0.61, - "learning_rate": 1.9734965139841725e-05, - "loss": 2.325, - "step": 347100 - }, - { - "epoch": 0.61, - "learning_rate": 1.97340931999149e-05, - "loss": 2.329, - "step": 347110 - }, - { - "epoch": 0.61, - "learning_rate": 1.9733221259988073e-05, - "loss": 2.3561, - "step": 347120 - }, - { - "epoch": 0.61, - "learning_rate": 1.9732349320061247e-05, - "loss": 2.3763, - "step": 347130 - }, - { - "epoch": 0.61, - "learning_rate": 1.973147738013442e-05, - "loss": 2.3397, - "step": 347140 - }, - { - "epoch": 0.61, - "learning_rate": 1.973060544020759e-05, - "loss": 2.4157, - "step": 347150 - }, - { - "epoch": 0.61, - "learning_rate": 1.9729733500280764e-05, - "loss": 2.2658, - "step": 347160 - }, - { - "epoch": 0.61, - "learning_rate": 1.9728861560353938e-05, - "loss": 2.2611, - "step": 347170 - }, - { - "epoch": 0.61, - "learning_rate": 1.9727989620427112e-05, - "loss": 2.4498, - "step": 347180 - }, - { - "epoch": 0.61, - "learning_rate": 1.9727117680500286e-05, - "loss": 2.3077, - "step": 347190 - }, - { - "epoch": 0.61, - "learning_rate": 1.972624574057346e-05, - "loss": 2.4089, - "step": 347200 - }, - { - "epoch": 0.61, - "learning_rate": 1.9725373800646633e-05, - "loss": 2.4173, - "step": 347210 - }, - { - "epoch": 0.61, - "learning_rate": 1.9724501860719804e-05, - "loss": 2.2889, - "step": 347220 - }, - { - "epoch": 0.61, - "learning_rate": 1.9723629920792977e-05, - "loss": 2.3736, - "step": 347230 - }, - { - "epoch": 0.61, - "learning_rate": 1.972275798086615e-05, - "loss": 2.3065, - "step": 347240 - }, - { - "epoch": 0.61, - "learning_rate": 1.9721886040939325e-05, - "loss": 2.3988, - "step": 347250 - }, - { - "epoch": 0.61, - "learning_rate": 1.97210141010125e-05, - "loss": 2.2959, - "step": 347260 - }, - { - "epoch": 0.61, - "learning_rate": 1.972014216108567e-05, - "loss": 2.3583, - "step": 347270 - }, - { - "epoch": 0.61, - "learning_rate": 1.9719270221158846e-05, - "loss": 2.3816, - "step": 347280 - }, - { - "epoch": 0.61, - "learning_rate": 1.9718398281232017e-05, - "loss": 2.3017, - "step": 347290 - }, - { - "epoch": 0.61, - "learning_rate": 1.971752634130519e-05, - "loss": 2.4102, - "step": 347300 - }, - { - "epoch": 0.61, - "learning_rate": 1.9716654401378364e-05, - "loss": 2.4661, - "step": 347310 - }, - { - "epoch": 0.61, - "learning_rate": 1.9715782461451538e-05, - "loss": 2.4305, - "step": 347320 - }, - { - "epoch": 0.61, - "learning_rate": 1.971491052152471e-05, - "loss": 2.3561, - "step": 347330 - }, - { - "epoch": 0.61, - "learning_rate": 1.9714038581597882e-05, - "loss": 2.3199, - "step": 347340 - }, - { - "epoch": 0.61, - "learning_rate": 1.9713166641671056e-05, - "loss": 2.3184, - "step": 347350 - }, - { - "epoch": 0.61, - "learning_rate": 1.971229470174423e-05, - "loss": 2.3298, - "step": 347360 - }, - { - "epoch": 0.61, - "learning_rate": 1.9711422761817403e-05, - "loss": 2.3372, - "step": 347370 - }, - { - "epoch": 0.61, - "learning_rate": 1.9710550821890574e-05, - "loss": 2.3951, - "step": 347380 - }, - { - "epoch": 0.61, - "learning_rate": 1.970967888196375e-05, - "loss": 2.4728, - "step": 347390 - }, - { - "epoch": 0.61, - "learning_rate": 1.970880694203692e-05, - "loss": 2.3577, - "step": 347400 - }, - { - "epoch": 0.61, - "learning_rate": 1.9707935002110095e-05, - "loss": 2.364, - "step": 347410 - }, - { - "epoch": 0.61, - "learning_rate": 1.970706306218327e-05, - "loss": 2.3819, - "step": 347420 - }, - { - "epoch": 0.61, - "learning_rate": 1.9706191122256443e-05, - "loss": 2.4356, - "step": 347430 - }, - { - "epoch": 0.61, - "learning_rate": 1.9705319182329616e-05, - "loss": 2.2606, - "step": 347440 - }, - { - "epoch": 0.61, - "learning_rate": 1.9704447242402787e-05, - "loss": 2.4045, - "step": 347450 - }, - { - "epoch": 0.61, - "learning_rate": 1.9703575302475964e-05, - "loss": 2.1837, - "step": 347460 - }, - { - "epoch": 0.61, - "learning_rate": 1.9702703362549134e-05, - "loss": 2.3232, - "step": 347470 - }, - { - "epoch": 0.61, - "learning_rate": 1.9701831422622308e-05, - "loss": 2.3849, - "step": 347480 - }, - { - "epoch": 0.61, - "learning_rate": 1.970095948269548e-05, - "loss": 2.2244, - "step": 347490 - }, - { - "epoch": 0.61, - "learning_rate": 1.9700087542768656e-05, - "loss": 2.2754, - "step": 347500 - }, - { - "epoch": 0.61, - "learning_rate": 1.969921560284183e-05, - "loss": 2.392, - "step": 347510 - }, - { - "epoch": 0.61, - "learning_rate": 1.9698343662915e-05, - "loss": 2.337, - "step": 347520 - }, - { - "epoch": 0.61, - "learning_rate": 1.9697471722988174e-05, - "loss": 2.3556, - "step": 347530 - }, - { - "epoch": 0.61, - "learning_rate": 1.9696599783061347e-05, - "loss": 2.3984, - "step": 347540 - }, - { - "epoch": 0.61, - "learning_rate": 1.969572784313452e-05, - "loss": 2.3359, - "step": 347550 - }, - { - "epoch": 0.61, - "learning_rate": 1.969485590320769e-05, - "loss": 2.3319, - "step": 347560 - }, - { - "epoch": 0.61, - "learning_rate": 1.9693983963280865e-05, - "loss": 2.3353, - "step": 347570 - }, - { - "epoch": 0.61, - "learning_rate": 1.969311202335404e-05, - "loss": 2.3517, - "step": 347580 - }, - { - "epoch": 0.61, - "learning_rate": 1.9692240083427213e-05, - "loss": 2.1911, - "step": 347590 - }, - { - "epoch": 0.61, - "learning_rate": 1.9691368143500387e-05, - "loss": 2.3837, - "step": 347600 - }, - { - "epoch": 0.61, - "learning_rate": 1.969049620357356e-05, - "loss": 2.226, - "step": 347610 - }, - { - "epoch": 0.61, - "learning_rate": 1.9689624263646734e-05, - "loss": 2.3167, - "step": 347620 - }, - { - "epoch": 0.61, - "learning_rate": 1.9688752323719905e-05, - "loss": 2.3305, - "step": 347630 - }, - { - "epoch": 0.61, - "learning_rate": 1.968788038379308e-05, - "loss": 2.4007, - "step": 347640 - }, - { - "epoch": 0.61, - "learning_rate": 1.9687008443866252e-05, - "loss": 2.3188, - "step": 347650 - }, - { - "epoch": 0.61, - "learning_rate": 1.9686136503939426e-05, - "loss": 2.3441, - "step": 347660 - }, - { - "epoch": 0.61, - "learning_rate": 1.96852645640126e-05, - "loss": 2.3455, - "step": 347670 - }, - { - "epoch": 0.61, - "learning_rate": 1.968439262408577e-05, - "loss": 2.4199, - "step": 347680 - }, - { - "epoch": 0.61, - "learning_rate": 1.9683520684158947e-05, - "loss": 2.287, - "step": 347690 - }, - { - "epoch": 0.61, - "learning_rate": 1.9682648744232118e-05, - "loss": 2.3009, - "step": 347700 - }, - { - "epoch": 0.61, - "learning_rate": 1.968177680430529e-05, - "loss": 2.2039, - "step": 347710 - }, - { - "epoch": 0.61, - "learning_rate": 1.9680904864378465e-05, - "loss": 2.3455, - "step": 347720 - }, - { - "epoch": 0.61, - "learning_rate": 1.968003292445164e-05, - "loss": 2.3128, - "step": 347730 - }, - { - "epoch": 0.61, - "learning_rate": 1.9679160984524813e-05, - "loss": 2.244, - "step": 347740 - }, - { - "epoch": 0.61, - "learning_rate": 1.9678289044597983e-05, - "loss": 2.4144, - "step": 347750 - }, - { - "epoch": 0.61, - "learning_rate": 1.967741710467116e-05, - "loss": 2.2185, - "step": 347760 - }, - { - "epoch": 0.61, - "learning_rate": 1.967654516474433e-05, - "loss": 2.3596, - "step": 347770 - }, - { - "epoch": 0.61, - "learning_rate": 1.9675673224817504e-05, - "loss": 2.2852, - "step": 347780 - }, - { - "epoch": 0.61, - "learning_rate": 1.9674801284890675e-05, - "loss": 2.2967, - "step": 347790 - }, - { - "epoch": 0.61, - "learning_rate": 1.9673929344963852e-05, - "loss": 2.4546, - "step": 347800 - }, - { - "epoch": 0.61, - "learning_rate": 1.9673057405037022e-05, - "loss": 2.2723, - "step": 347810 - }, - { - "epoch": 0.61, - "learning_rate": 1.9672185465110196e-05, - "loss": 2.3837, - "step": 347820 - }, - { - "epoch": 0.61, - "learning_rate": 1.967131352518337e-05, - "loss": 2.2945, - "step": 347830 - }, - { - "epoch": 0.61, - "learning_rate": 1.9670441585256544e-05, - "loss": 2.2507, - "step": 347840 - }, - { - "epoch": 0.61, - "learning_rate": 1.9669569645329717e-05, - "loss": 2.3858, - "step": 347850 - }, - { - "epoch": 0.61, - "learning_rate": 1.9668697705402888e-05, - "loss": 2.4893, - "step": 347860 - }, - { - "epoch": 0.61, - "learning_rate": 1.9667825765476065e-05, - "loss": 2.2585, - "step": 347870 - }, - { - "epoch": 0.61, - "learning_rate": 1.9666953825549235e-05, - "loss": 2.456, - "step": 347880 - }, - { - "epoch": 0.61, - "learning_rate": 1.966608188562241e-05, - "loss": 2.3968, - "step": 347890 - }, - { - "epoch": 0.61, - "learning_rate": 1.9665209945695583e-05, - "loss": 2.2927, - "step": 347900 - }, - { - "epoch": 0.61, - "learning_rate": 1.9664338005768757e-05, - "loss": 2.1929, - "step": 347910 - }, - { - "epoch": 0.61, - "learning_rate": 1.966346606584193e-05, - "loss": 2.3806, - "step": 347920 - }, - { - "epoch": 0.61, - "learning_rate": 1.96625941259151e-05, - "loss": 2.3464, - "step": 347930 - }, - { - "epoch": 0.61, - "learning_rate": 1.9661722185988274e-05, - "loss": 2.2692, - "step": 347940 - }, - { - "epoch": 0.61, - "learning_rate": 1.9660850246061448e-05, - "loss": 2.2956, - "step": 347950 - }, - { - "epoch": 0.61, - "learning_rate": 1.9659978306134622e-05, - "loss": 2.3268, - "step": 347960 - }, - { - "epoch": 0.61, - "learning_rate": 1.9659106366207792e-05, - "loss": 2.3439, - "step": 347970 - }, - { - "epoch": 0.61, - "learning_rate": 1.965823442628097e-05, - "loss": 2.1618, - "step": 347980 - }, - { - "epoch": 0.61, - "learning_rate": 1.9657362486354143e-05, - "loss": 2.3664, - "step": 347990 - }, - { - "epoch": 0.61, - "learning_rate": 1.9656490546427314e-05, - "loss": 2.4143, - "step": 348000 - }, - { - "epoch": 0.61, - "learning_rate": 1.9655618606500487e-05, - "loss": 2.3302, - "step": 348010 - }, - { - "epoch": 0.61, - "learning_rate": 1.965474666657366e-05, - "loss": 2.512, - "step": 348020 - }, - { - "epoch": 0.61, - "learning_rate": 1.9653874726646835e-05, - "loss": 2.2961, - "step": 348030 - }, - { - "epoch": 0.61, - "learning_rate": 1.9653002786720005e-05, - "loss": 2.33, - "step": 348040 - }, - { - "epoch": 0.61, - "learning_rate": 1.965213084679318e-05, - "loss": 2.2621, - "step": 348050 - }, - { - "epoch": 0.61, - "learning_rate": 1.9651258906866353e-05, - "loss": 2.2926, - "step": 348060 - }, - { - "epoch": 0.61, - "learning_rate": 1.9650386966939527e-05, - "loss": 2.3802, - "step": 348070 - }, - { - "epoch": 0.61, - "learning_rate": 1.96495150270127e-05, - "loss": 2.273, - "step": 348080 - }, - { - "epoch": 0.61, - "learning_rate": 1.964864308708587e-05, - "loss": 2.3563, - "step": 348090 - }, - { - "epoch": 0.61, - "learning_rate": 1.9647771147159048e-05, - "loss": 2.2456, - "step": 348100 - }, - { - "epoch": 0.61, - "learning_rate": 1.964689920723222e-05, - "loss": 2.2786, - "step": 348110 - }, - { - "epoch": 0.61, - "learning_rate": 1.9646027267305392e-05, - "loss": 2.2797, - "step": 348120 - }, - { - "epoch": 0.61, - "learning_rate": 1.9645155327378566e-05, - "loss": 2.2882, - "step": 348130 - }, - { - "epoch": 0.61, - "learning_rate": 1.964428338745174e-05, - "loss": 2.276, - "step": 348140 - }, - { - "epoch": 0.61, - "learning_rate": 1.9643411447524913e-05, - "loss": 2.2919, - "step": 348150 - }, - { - "epoch": 0.61, - "learning_rate": 1.9642539507598084e-05, - "loss": 2.3483, - "step": 348160 - }, - { - "epoch": 0.61, - "learning_rate": 1.964166756767126e-05, - "loss": 2.3386, - "step": 348170 - }, - { - "epoch": 0.61, - "learning_rate": 1.964079562774443e-05, - "loss": 2.3258, - "step": 348180 - }, - { - "epoch": 0.61, - "learning_rate": 1.9639923687817605e-05, - "loss": 2.4302, - "step": 348190 - }, - { - "epoch": 0.61, - "learning_rate": 1.9639051747890776e-05, - "loss": 2.3778, - "step": 348200 - }, - { - "epoch": 0.61, - "learning_rate": 1.9638179807963953e-05, - "loss": 2.349, - "step": 348210 - }, - { - "epoch": 0.61, - "learning_rate": 1.9637307868037123e-05, - "loss": 2.3031, - "step": 348220 - }, - { - "epoch": 0.61, - "learning_rate": 1.9636435928110297e-05, - "loss": 2.3195, - "step": 348230 - }, - { - "epoch": 0.61, - "learning_rate": 1.9635563988183474e-05, - "loss": 2.2754, - "step": 348240 - }, - { - "epoch": 0.61, - "learning_rate": 1.9634692048256644e-05, - "loss": 2.4747, - "step": 348250 - }, - { - "epoch": 0.61, - "learning_rate": 1.9633820108329818e-05, - "loss": 2.3255, - "step": 348260 - }, - { - "epoch": 0.61, - "learning_rate": 1.963294816840299e-05, - "loss": 2.2432, - "step": 348270 - }, - { - "epoch": 0.61, - "learning_rate": 1.9632076228476166e-05, - "loss": 2.3818, - "step": 348280 - }, - { - "epoch": 0.61, - "learning_rate": 1.9631204288549336e-05, - "loss": 2.3913, - "step": 348290 - }, - { - "epoch": 0.61, - "learning_rate": 1.963033234862251e-05, - "loss": 2.2866, - "step": 348300 - }, - { - "epoch": 0.61, - "learning_rate": 1.9629460408695684e-05, - "loss": 2.4056, - "step": 348310 - }, - { - "epoch": 0.61, - "learning_rate": 1.9628588468768857e-05, - "loss": 2.3573, - "step": 348320 - }, - { - "epoch": 0.61, - "learning_rate": 1.962771652884203e-05, - "loss": 2.411, - "step": 348330 - }, - { - "epoch": 0.61, - "learning_rate": 1.96268445889152e-05, - "loss": 2.287, - "step": 348340 - }, - { - "epoch": 0.61, - "learning_rate": 1.9625972648988375e-05, - "loss": 2.3791, - "step": 348350 - }, - { - "epoch": 0.61, - "learning_rate": 1.962510070906155e-05, - "loss": 2.3293, - "step": 348360 - }, - { - "epoch": 0.61, - "learning_rate": 1.9624228769134723e-05, - "loss": 2.2737, - "step": 348370 - }, - { - "epoch": 0.61, - "learning_rate": 1.9623356829207897e-05, - "loss": 2.2892, - "step": 348380 - }, - { - "epoch": 0.61, - "learning_rate": 1.962248488928107e-05, - "loss": 2.2752, - "step": 348390 - }, - { - "epoch": 0.61, - "learning_rate": 1.9621612949354244e-05, - "loss": 2.3726, - "step": 348400 - }, - { - "epoch": 0.61, - "learning_rate": 1.9620741009427415e-05, - "loss": 2.4426, - "step": 348410 - }, - { - "epoch": 0.61, - "learning_rate": 1.961986906950059e-05, - "loss": 2.355, - "step": 348420 - }, - { - "epoch": 0.61, - "learning_rate": 1.9618997129573762e-05, - "loss": 2.3019, - "step": 348430 - }, - { - "epoch": 0.61, - "learning_rate": 1.9618125189646936e-05, - "loss": 2.4275, - "step": 348440 - }, - { - "epoch": 0.61, - "learning_rate": 1.9617253249720106e-05, - "loss": 2.3699, - "step": 348450 - }, - { - "epoch": 0.61, - "learning_rate": 1.961638130979328e-05, - "loss": 2.4124, - "step": 348460 - }, - { - "epoch": 0.61, - "learning_rate": 1.9615509369866457e-05, - "loss": 2.2578, - "step": 348470 - }, - { - "epoch": 0.61, - "learning_rate": 1.9614637429939628e-05, - "loss": 2.2281, - "step": 348480 - }, - { - "epoch": 0.61, - "learning_rate": 1.96137654900128e-05, - "loss": 2.4282, - "step": 348490 - }, - { - "epoch": 0.61, - "learning_rate": 1.9612893550085972e-05, - "loss": 2.2972, - "step": 348500 - }, - { - "epoch": 0.61, - "learning_rate": 1.961202161015915e-05, - "loss": 2.272, - "step": 348510 - }, - { - "epoch": 0.61, - "learning_rate": 1.961114967023232e-05, - "loss": 2.322, - "step": 348520 - }, - { - "epoch": 0.61, - "learning_rate": 1.9610277730305493e-05, - "loss": 2.309, - "step": 348530 - }, - { - "epoch": 0.61, - "learning_rate": 1.9609405790378667e-05, - "loss": 2.4263, - "step": 348540 - }, - { - "epoch": 0.61, - "learning_rate": 1.960853385045184e-05, - "loss": 2.2665, - "step": 348550 - }, - { - "epoch": 0.61, - "learning_rate": 1.9607661910525014e-05, - "loss": 2.2775, - "step": 348560 - }, - { - "epoch": 0.61, - "learning_rate": 1.9606789970598185e-05, - "loss": 2.4037, - "step": 348570 - }, - { - "epoch": 0.61, - "learning_rate": 1.9605918030671362e-05, - "loss": 2.2849, - "step": 348580 - }, - { - "epoch": 0.61, - "learning_rate": 1.9605046090744532e-05, - "loss": 2.1749, - "step": 348590 - }, - { - "epoch": 0.61, - "learning_rate": 1.9604174150817706e-05, - "loss": 2.2824, - "step": 348600 - }, - { - "epoch": 0.61, - "learning_rate": 1.960330221089088e-05, - "loss": 2.2996, - "step": 348610 - }, - { - "epoch": 0.61, - "learning_rate": 1.9602430270964054e-05, - "loss": 2.3621, - "step": 348620 - }, - { - "epoch": 0.61, - "learning_rate": 1.9601558331037227e-05, - "loss": 2.3527, - "step": 348630 - }, - { - "epoch": 0.61, - "learning_rate": 1.9600686391110398e-05, - "loss": 2.37, - "step": 348640 - }, - { - "epoch": 0.61, - "learning_rate": 1.9599814451183575e-05, - "loss": 2.3497, - "step": 348650 - }, - { - "epoch": 0.61, - "learning_rate": 1.9598942511256745e-05, - "loss": 2.3799, - "step": 348660 - }, - { - "epoch": 0.61, - "learning_rate": 1.959807057132992e-05, - "loss": 2.4079, - "step": 348670 - }, - { - "epoch": 0.61, - "learning_rate": 1.959719863140309e-05, - "loss": 2.2183, - "step": 348680 - }, - { - "epoch": 0.61, - "learning_rate": 1.9596326691476267e-05, - "loss": 2.327, - "step": 348690 - }, - { - "epoch": 0.61, - "learning_rate": 1.9595454751549437e-05, - "loss": 2.3553, - "step": 348700 - }, - { - "epoch": 0.61, - "learning_rate": 1.959458281162261e-05, - "loss": 2.327, - "step": 348710 - }, - { - "epoch": 0.61, - "learning_rate": 1.9593710871695784e-05, - "loss": 2.3447, - "step": 348720 - }, - { - "epoch": 0.61, - "learning_rate": 1.9592838931768958e-05, - "loss": 2.3492, - "step": 348730 - }, - { - "epoch": 0.61, - "learning_rate": 1.9591966991842132e-05, - "loss": 2.4688, - "step": 348740 - }, - { - "epoch": 0.61, - "learning_rate": 1.9591095051915302e-05, - "loss": 2.3513, - "step": 348750 - }, - { - "epoch": 0.61, - "learning_rate": 1.9590223111988476e-05, - "loss": 2.3032, - "step": 348760 - }, - { - "epoch": 0.61, - "learning_rate": 1.958935117206165e-05, - "loss": 2.2229, - "step": 348770 - }, - { - "epoch": 0.61, - "learning_rate": 1.9588479232134824e-05, - "loss": 2.2768, - "step": 348780 - }, - { - "epoch": 0.61, - "learning_rate": 1.9587607292207997e-05, - "loss": 2.3722, - "step": 348790 - }, - { - "epoch": 0.61, - "learning_rate": 1.958673535228117e-05, - "loss": 2.3316, - "step": 348800 - }, - { - "epoch": 0.61, - "learning_rate": 1.9585863412354345e-05, - "loss": 2.3506, - "step": 348810 - }, - { - "epoch": 0.61, - "learning_rate": 1.9584991472427515e-05, - "loss": 2.4009, - "step": 348820 - }, - { - "epoch": 0.61, - "learning_rate": 1.958411953250069e-05, - "loss": 2.0419, - "step": 348830 - }, - { - "epoch": 0.61, - "learning_rate": 1.9583247592573863e-05, - "loss": 2.3824, - "step": 348840 - }, - { - "epoch": 0.61, - "learning_rate": 1.9582375652647037e-05, - "loss": 2.3764, - "step": 348850 - }, - { - "epoch": 0.61, - "learning_rate": 1.958150371272021e-05, - "loss": 2.3366, - "step": 348860 - }, - { - "epoch": 0.61, - "learning_rate": 1.958063177279338e-05, - "loss": 2.3342, - "step": 348870 - }, - { - "epoch": 0.61, - "learning_rate": 1.9579759832866558e-05, - "loss": 2.325, - "step": 348880 - }, - { - "epoch": 0.61, - "learning_rate": 1.957888789293973e-05, - "loss": 2.216, - "step": 348890 - }, - { - "epoch": 0.61, - "learning_rate": 1.9578015953012902e-05, - "loss": 2.2386, - "step": 348900 - }, - { - "epoch": 0.61, - "learning_rate": 1.9577144013086076e-05, - "loss": 2.2859, - "step": 348910 - }, - { - "epoch": 0.61, - "learning_rate": 1.957627207315925e-05, - "loss": 2.2315, - "step": 348920 - }, - { - "epoch": 0.61, - "learning_rate": 1.957540013323242e-05, - "loss": 2.3445, - "step": 348930 - }, - { - "epoch": 0.61, - "learning_rate": 1.9574528193305594e-05, - "loss": 2.2692, - "step": 348940 - }, - { - "epoch": 0.61, - "learning_rate": 1.9573656253378768e-05, - "loss": 2.3105, - "step": 348950 - }, - { - "epoch": 0.61, - "learning_rate": 1.957278431345194e-05, - "loss": 2.2728, - "step": 348960 - }, - { - "epoch": 0.61, - "learning_rate": 1.9571912373525115e-05, - "loss": 2.2129, - "step": 348970 - }, - { - "epoch": 0.61, - "learning_rate": 1.9571040433598286e-05, - "loss": 2.3371, - "step": 348980 - }, - { - "epoch": 0.61, - "learning_rate": 1.9570168493671463e-05, - "loss": 2.2979, - "step": 348990 - }, - { - "epoch": 0.61, - "learning_rate": 1.9569296553744633e-05, - "loss": 2.2564, - "step": 349000 - }, - { - "epoch": 0.61, - "learning_rate": 1.9568424613817807e-05, - "loss": 2.3352, - "step": 349010 - }, - { - "epoch": 0.61, - "learning_rate": 1.956755267389098e-05, - "loss": 2.4582, - "step": 349020 - }, - { - "epoch": 0.61, - "learning_rate": 1.9566680733964154e-05, - "loss": 2.2205, - "step": 349030 - }, - { - "epoch": 0.61, - "learning_rate": 1.9565808794037328e-05, - "loss": 2.3509, - "step": 349040 - }, - { - "epoch": 0.61, - "learning_rate": 1.95649368541105e-05, - "loss": 2.3805, - "step": 349050 - }, - { - "epoch": 0.61, - "learning_rate": 1.9564064914183676e-05, - "loss": 2.4035, - "step": 349060 - }, - { - "epoch": 0.61, - "learning_rate": 1.9563192974256846e-05, - "loss": 2.269, - "step": 349070 - }, - { - "epoch": 0.61, - "learning_rate": 1.956232103433002e-05, - "loss": 2.3075, - "step": 349080 - }, - { - "epoch": 0.61, - "learning_rate": 1.9561449094403194e-05, - "loss": 2.303, - "step": 349090 - }, - { - "epoch": 0.61, - "learning_rate": 1.9560577154476367e-05, - "loss": 2.3936, - "step": 349100 - }, - { - "epoch": 0.61, - "learning_rate": 1.955970521454954e-05, - "loss": 2.3648, - "step": 349110 - }, - { - "epoch": 0.61, - "learning_rate": 1.955883327462271e-05, - "loss": 2.3141, - "step": 349120 - }, - { - "epoch": 0.61, - "learning_rate": 1.9557961334695885e-05, - "loss": 2.3761, - "step": 349130 - }, - { - "epoch": 0.61, - "learning_rate": 1.955708939476906e-05, - "loss": 2.3388, - "step": 349140 - }, - { - "epoch": 0.61, - "learning_rate": 1.9556217454842233e-05, - "loss": 2.3792, - "step": 349150 - }, - { - "epoch": 0.61, - "learning_rate": 1.9555345514915403e-05, - "loss": 2.2915, - "step": 349160 - }, - { - "epoch": 0.61, - "learning_rate": 1.955447357498858e-05, - "loss": 2.4534, - "step": 349170 - }, - { - "epoch": 0.61, - "learning_rate": 1.955360163506175e-05, - "loss": 2.3321, - "step": 349180 - }, - { - "epoch": 0.61, - "learning_rate": 1.9552729695134925e-05, - "loss": 2.3133, - "step": 349190 - }, - { - "epoch": 0.61, - "learning_rate": 1.95518577552081e-05, - "loss": 2.3149, - "step": 349200 - }, - { - "epoch": 0.61, - "learning_rate": 1.9550985815281272e-05, - "loss": 2.3567, - "step": 349210 - }, - { - "epoch": 0.61, - "learning_rate": 1.9550113875354446e-05, - "loss": 2.4076, - "step": 349220 - }, - { - "epoch": 0.61, - "learning_rate": 1.9549241935427616e-05, - "loss": 2.4255, - "step": 349230 - }, - { - "epoch": 0.61, - "learning_rate": 1.954836999550079e-05, - "loss": 2.3211, - "step": 349240 - }, - { - "epoch": 0.61, - "learning_rate": 1.9547498055573964e-05, - "loss": 2.313, - "step": 349250 - }, - { - "epoch": 0.61, - "learning_rate": 1.9546626115647138e-05, - "loss": 2.3468, - "step": 349260 - }, - { - "epoch": 0.61, - "learning_rate": 1.954575417572031e-05, - "loss": 2.2666, - "step": 349270 - }, - { - "epoch": 0.61, - "learning_rate": 1.9544882235793482e-05, - "loss": 2.3386, - "step": 349280 - }, - { - "epoch": 0.61, - "learning_rate": 1.954401029586666e-05, - "loss": 2.3637, - "step": 349290 - }, - { - "epoch": 0.61, - "learning_rate": 1.954313835593983e-05, - "loss": 2.2094, - "step": 349300 - }, - { - "epoch": 0.61, - "learning_rate": 1.9542266416013003e-05, - "loss": 2.4036, - "step": 349310 - }, - { - "epoch": 0.61, - "learning_rate": 1.9541394476086177e-05, - "loss": 2.291, - "step": 349320 - }, - { - "epoch": 0.61, - "learning_rate": 1.954052253615935e-05, - "loss": 2.2336, - "step": 349330 - }, - { - "epoch": 0.61, - "learning_rate": 1.9539650596232524e-05, - "loss": 2.3563, - "step": 349340 - }, - { - "epoch": 0.61, - "learning_rate": 1.9538778656305695e-05, - "loss": 2.2398, - "step": 349350 - }, - { - "epoch": 0.61, - "learning_rate": 1.9537906716378872e-05, - "loss": 2.3627, - "step": 349360 - }, - { - "epoch": 0.61, - "learning_rate": 1.9537034776452042e-05, - "loss": 2.4278, - "step": 349370 - }, - { - "epoch": 0.61, - "learning_rate": 1.9536162836525216e-05, - "loss": 2.3921, - "step": 349380 - }, - { - "epoch": 0.61, - "learning_rate": 1.9535290896598386e-05, - "loss": 2.4734, - "step": 349390 - }, - { - "epoch": 0.61, - "learning_rate": 1.9534418956671564e-05, - "loss": 2.3355, - "step": 349400 - }, - { - "epoch": 0.61, - "learning_rate": 1.9533547016744734e-05, - "loss": 2.3774, - "step": 349410 - }, - { - "epoch": 0.61, - "learning_rate": 1.9532675076817908e-05, - "loss": 2.3457, - "step": 349420 - }, - { - "epoch": 0.61, - "learning_rate": 1.953180313689108e-05, - "loss": 2.3699, - "step": 349430 - }, - { - "epoch": 0.61, - "learning_rate": 1.9530931196964255e-05, - "loss": 2.3234, - "step": 349440 - }, - { - "epoch": 0.61, - "learning_rate": 1.953005925703743e-05, - "loss": 2.3493, - "step": 349450 - }, - { - "epoch": 0.61, - "learning_rate": 1.95291873171106e-05, - "loss": 2.199, - "step": 349460 - }, - { - "epoch": 0.61, - "learning_rate": 1.9528315377183777e-05, - "loss": 2.324, - "step": 349470 - }, - { - "epoch": 0.61, - "learning_rate": 1.9527443437256947e-05, - "loss": 2.164, - "step": 349480 - }, - { - "epoch": 0.61, - "learning_rate": 1.952657149733012e-05, - "loss": 2.2705, - "step": 349490 - }, - { - "epoch": 0.61, - "learning_rate": 1.9525699557403294e-05, - "loss": 2.3047, - "step": 349500 - }, - { - "epoch": 0.61, - "learning_rate": 1.9524827617476468e-05, - "loss": 2.3124, - "step": 349510 - }, - { - "epoch": 0.61, - "learning_rate": 1.9523955677549642e-05, - "loss": 2.3952, - "step": 349520 - }, - { - "epoch": 0.61, - "learning_rate": 1.9523083737622812e-05, - "loss": 2.2955, - "step": 349530 - }, - { - "epoch": 0.61, - "learning_rate": 1.9522211797695986e-05, - "loss": 2.4372, - "step": 349540 - }, - { - "epoch": 0.61, - "learning_rate": 1.952133985776916e-05, - "loss": 2.3494, - "step": 349550 - }, - { - "epoch": 0.61, - "learning_rate": 1.9520467917842334e-05, - "loss": 2.3329, - "step": 349560 - }, - { - "epoch": 0.61, - "learning_rate": 1.9519595977915504e-05, - "loss": 2.419, - "step": 349570 - }, - { - "epoch": 0.61, - "learning_rate": 1.951872403798868e-05, - "loss": 2.3673, - "step": 349580 - }, - { - "epoch": 0.61, - "learning_rate": 1.9517852098061855e-05, - "loss": 2.1396, - "step": 349590 - }, - { - "epoch": 0.61, - "learning_rate": 1.9516980158135025e-05, - "loss": 2.3331, - "step": 349600 - }, - { - "epoch": 0.61, - "learning_rate": 1.95161082182082e-05, - "loss": 2.3822, - "step": 349610 - }, - { - "epoch": 0.61, - "learning_rate": 1.9515236278281373e-05, - "loss": 2.251, - "step": 349620 - }, - { - "epoch": 0.61, - "learning_rate": 1.9514364338354547e-05, - "loss": 2.318, - "step": 349630 - }, - { - "epoch": 0.61, - "learning_rate": 1.9513492398427717e-05, - "loss": 2.3445, - "step": 349640 - }, - { - "epoch": 0.61, - "learning_rate": 1.951262045850089e-05, - "loss": 2.2983, - "step": 349650 - }, - { - "epoch": 0.61, - "learning_rate": 1.9511748518574065e-05, - "loss": 2.4103, - "step": 349660 - }, - { - "epoch": 0.61, - "learning_rate": 1.951087657864724e-05, - "loss": 2.3641, - "step": 349670 - }, - { - "epoch": 0.61, - "learning_rate": 1.9510004638720412e-05, - "loss": 2.2944, - "step": 349680 - }, - { - "epoch": 0.61, - "learning_rate": 1.9509132698793583e-05, - "loss": 2.3306, - "step": 349690 - }, - { - "epoch": 0.61, - "learning_rate": 1.950826075886676e-05, - "loss": 2.3027, - "step": 349700 - }, - { - "epoch": 0.61, - "learning_rate": 1.950738881893993e-05, - "loss": 2.466, - "step": 349710 - }, - { - "epoch": 0.61, - "learning_rate": 1.9506516879013104e-05, - "loss": 2.2951, - "step": 349720 - }, - { - "epoch": 0.61, - "learning_rate": 1.9505644939086278e-05, - "loss": 2.304, - "step": 349730 - }, - { - "epoch": 0.61, - "learning_rate": 1.950477299915945e-05, - "loss": 2.3558, - "step": 349740 - }, - { - "epoch": 0.61, - "learning_rate": 1.9503901059232625e-05, - "loss": 2.2496, - "step": 349750 - }, - { - "epoch": 0.61, - "learning_rate": 1.9503029119305796e-05, - "loss": 2.3607, - "step": 349760 - }, - { - "epoch": 0.61, - "learning_rate": 1.9502157179378973e-05, - "loss": 2.3063, - "step": 349770 - }, - { - "epoch": 0.61, - "learning_rate": 1.9501285239452143e-05, - "loss": 2.2634, - "step": 349780 - }, - { - "epoch": 0.61, - "learning_rate": 1.9500413299525317e-05, - "loss": 2.3102, - "step": 349790 - }, - { - "epoch": 0.61, - "learning_rate": 1.9499541359598487e-05, - "loss": 2.3108, - "step": 349800 - }, - { - "epoch": 0.61, - "learning_rate": 1.9498669419671664e-05, - "loss": 2.4283, - "step": 349810 - }, - { - "epoch": 0.61, - "learning_rate": 1.9497797479744838e-05, - "loss": 2.4004, - "step": 349820 - }, - { - "epoch": 0.61, - "learning_rate": 1.949692553981801e-05, - "loss": 2.3697, - "step": 349830 - }, - { - "epoch": 0.61, - "learning_rate": 1.9496053599891186e-05, - "loss": 2.3559, - "step": 349840 - }, - { - "epoch": 0.61, - "learning_rate": 1.9495181659964356e-05, - "loss": 2.3386, - "step": 349850 - }, - { - "epoch": 0.61, - "learning_rate": 1.949430972003753e-05, - "loss": 2.2405, - "step": 349860 - }, - { - "epoch": 0.61, - "learning_rate": 1.94934377801107e-05, - "loss": 2.3326, - "step": 349870 - }, - { - "epoch": 0.61, - "learning_rate": 1.9492565840183877e-05, - "loss": 2.2626, - "step": 349880 - }, - { - "epoch": 0.61, - "learning_rate": 1.9491693900257048e-05, - "loss": 2.377, - "step": 349890 - }, - { - "epoch": 0.61, - "learning_rate": 1.949082196033022e-05, - "loss": 2.3445, - "step": 349900 - }, - { - "epoch": 0.61, - "learning_rate": 1.9489950020403395e-05, - "loss": 2.3623, - "step": 349910 - }, - { - "epoch": 0.61, - "learning_rate": 1.948907808047657e-05, - "loss": 2.3185, - "step": 349920 - }, - { - "epoch": 0.61, - "learning_rate": 1.9488206140549743e-05, - "loss": 2.288, - "step": 349930 - }, - { - "epoch": 0.61, - "learning_rate": 1.9487334200622913e-05, - "loss": 2.3298, - "step": 349940 - }, - { - "epoch": 0.61, - "learning_rate": 1.9486462260696087e-05, - "loss": 2.3724, - "step": 349950 - }, - { - "epoch": 0.61, - "learning_rate": 1.948559032076926e-05, - "loss": 2.4181, - "step": 349960 - }, - { - "epoch": 0.61, - "learning_rate": 1.9484718380842435e-05, - "loss": 2.292, - "step": 349970 - }, - { - "epoch": 0.61, - "learning_rate": 1.948384644091561e-05, - "loss": 2.3761, - "step": 349980 - }, - { - "epoch": 0.61, - "learning_rate": 1.9482974500988782e-05, - "loss": 2.4397, - "step": 349990 - }, - { - "epoch": 0.61, - "learning_rate": 1.9482102561061956e-05, - "loss": 2.2869, - "step": 350000 - }, - { - "epoch": 0.61, - "learning_rate": 1.9481230621135126e-05, - "loss": 2.3066, - "step": 350010 - }, - { - "epoch": 0.61, - "learning_rate": 1.94803586812083e-05, - "loss": 2.2536, - "step": 350020 - }, - { - "epoch": 0.61, - "learning_rate": 1.9479486741281474e-05, - "loss": 2.2964, - "step": 350030 - }, - { - "epoch": 0.61, - "learning_rate": 1.9478614801354648e-05, - "loss": 2.3702, - "step": 350040 - }, - { - "epoch": 0.61, - "learning_rate": 1.9477742861427818e-05, - "loss": 2.3325, - "step": 350050 - }, - { - "epoch": 0.61, - "learning_rate": 1.9476870921500992e-05, - "loss": 2.2463, - "step": 350060 - }, - { - "epoch": 0.61, - "learning_rate": 1.947599898157417e-05, - "loss": 2.3833, - "step": 350070 - }, - { - "epoch": 0.61, - "learning_rate": 1.947512704164734e-05, - "loss": 2.3213, - "step": 350080 - }, - { - "epoch": 0.61, - "learning_rate": 1.9474255101720513e-05, - "loss": 2.3684, - "step": 350090 - }, - { - "epoch": 0.61, - "learning_rate": 1.9473383161793687e-05, - "loss": 2.2684, - "step": 350100 - }, - { - "epoch": 0.61, - "learning_rate": 1.947251122186686e-05, - "loss": 2.2435, - "step": 350110 - }, - { - "epoch": 0.61, - "learning_rate": 1.947163928194003e-05, - "loss": 2.2816, - "step": 350120 - }, - { - "epoch": 0.61, - "learning_rate": 1.9470767342013205e-05, - "loss": 2.3061, - "step": 350130 - }, - { - "epoch": 0.61, - "learning_rate": 1.946989540208638e-05, - "loss": 2.3099, - "step": 350140 - }, - { - "epoch": 0.61, - "learning_rate": 1.9469023462159552e-05, - "loss": 2.279, - "step": 350150 - }, - { - "epoch": 0.61, - "learning_rate": 1.9468151522232726e-05, - "loss": 2.2579, - "step": 350160 - }, - { - "epoch": 0.61, - "learning_rate": 1.9467279582305896e-05, - "loss": 2.1981, - "step": 350170 - }, - { - "epoch": 0.61, - "learning_rate": 1.9466407642379074e-05, - "loss": 2.3007, - "step": 350180 - }, - { - "epoch": 0.61, - "learning_rate": 1.9465535702452244e-05, - "loss": 2.315, - "step": 350190 - }, - { - "epoch": 0.61, - "learning_rate": 1.9464663762525418e-05, - "loss": 2.3292, - "step": 350200 - }, - { - "epoch": 0.61, - "learning_rate": 1.946379182259859e-05, - "loss": 2.3366, - "step": 350210 - }, - { - "epoch": 0.61, - "learning_rate": 1.9462919882671765e-05, - "loss": 2.2502, - "step": 350220 - }, - { - "epoch": 0.61, - "learning_rate": 1.946204794274494e-05, - "loss": 2.3167, - "step": 350230 - }, - { - "epoch": 0.61, - "learning_rate": 1.946117600281811e-05, - "loss": 2.2639, - "step": 350240 - }, - { - "epoch": 0.61, - "learning_rate": 1.9460304062891287e-05, - "loss": 2.1478, - "step": 350250 - }, - { - "epoch": 0.61, - "learning_rate": 1.9459432122964457e-05, - "loss": 2.4136, - "step": 350260 - }, - { - "epoch": 0.61, - "learning_rate": 1.945856018303763e-05, - "loss": 2.2898, - "step": 350270 - }, - { - "epoch": 0.61, - "learning_rate": 1.94576882431108e-05, - "loss": 2.2185, - "step": 350280 - }, - { - "epoch": 0.61, - "learning_rate": 1.9456816303183978e-05, - "loss": 2.2606, - "step": 350290 - }, - { - "epoch": 0.61, - "learning_rate": 1.945594436325715e-05, - "loss": 2.2317, - "step": 350300 - }, - { - "epoch": 0.61, - "learning_rate": 1.9455072423330322e-05, - "loss": 2.3401, - "step": 350310 - }, - { - "epoch": 0.61, - "learning_rate": 1.9454200483403496e-05, - "loss": 2.2712, - "step": 350320 - }, - { - "epoch": 0.61, - "learning_rate": 1.945332854347667e-05, - "loss": 2.2536, - "step": 350330 - }, - { - "epoch": 0.61, - "learning_rate": 1.9452456603549844e-05, - "loss": 2.2444, - "step": 350340 - }, - { - "epoch": 0.61, - "learning_rate": 1.9451584663623014e-05, - "loss": 2.4018, - "step": 350350 - }, - { - "epoch": 0.61, - "learning_rate": 1.9450712723696188e-05, - "loss": 2.4143, - "step": 350360 - }, - { - "epoch": 0.61, - "learning_rate": 1.944984078376936e-05, - "loss": 2.3022, - "step": 350370 - }, - { - "epoch": 0.61, - "learning_rate": 1.9448968843842535e-05, - "loss": 2.3292, - "step": 350380 - }, - { - "epoch": 0.61, - "learning_rate": 1.944809690391571e-05, - "loss": 2.3109, - "step": 350390 - }, - { - "epoch": 0.61, - "learning_rate": 1.9447224963988883e-05, - "loss": 2.384, - "step": 350400 - }, - { - "epoch": 0.61, - "learning_rate": 1.9446353024062057e-05, - "loss": 2.2911, - "step": 350410 - }, - { - "epoch": 0.61, - "learning_rate": 1.9445481084135227e-05, - "loss": 2.4595, - "step": 350420 - }, - { - "epoch": 0.61, - "learning_rate": 1.94446091442084e-05, - "loss": 2.2783, - "step": 350430 - }, - { - "epoch": 0.61, - "learning_rate": 1.9443737204281575e-05, - "loss": 2.3116, - "step": 350440 - }, - { - "epoch": 0.61, - "learning_rate": 1.944286526435475e-05, - "loss": 2.2664, - "step": 350450 - }, - { - "epoch": 0.61, - "learning_rate": 1.9441993324427922e-05, - "loss": 2.3772, - "step": 350460 - }, - { - "epoch": 0.61, - "learning_rate": 1.9441121384501093e-05, - "loss": 2.2903, - "step": 350470 - }, - { - "epoch": 0.61, - "learning_rate": 1.944024944457427e-05, - "loss": 2.3432, - "step": 350480 - }, - { - "epoch": 0.61, - "learning_rate": 1.943937750464744e-05, - "loss": 2.355, - "step": 350490 - }, - { - "epoch": 0.61, - "learning_rate": 1.9438505564720614e-05, - "loss": 2.2968, - "step": 350500 - }, - { - "epoch": 0.61, - "learning_rate": 1.9437633624793788e-05, - "loss": 2.3936, - "step": 350510 - }, - { - "epoch": 0.61, - "learning_rate": 1.943676168486696e-05, - "loss": 2.3697, - "step": 350520 - }, - { - "epoch": 0.61, - "learning_rate": 1.9435889744940132e-05, - "loss": 2.2605, - "step": 350530 - }, - { - "epoch": 0.61, - "learning_rate": 1.9435017805013306e-05, - "loss": 2.3863, - "step": 350540 - }, - { - "epoch": 0.61, - "learning_rate": 1.9434145865086483e-05, - "loss": 2.3672, - "step": 350550 - }, - { - "epoch": 0.61, - "learning_rate": 1.9433273925159653e-05, - "loss": 2.3713, - "step": 350560 - }, - { - "epoch": 0.61, - "learning_rate": 1.9432401985232827e-05, - "loss": 2.2939, - "step": 350570 - }, - { - "epoch": 0.61, - "learning_rate": 1.9431530045305997e-05, - "loss": 2.4678, - "step": 350580 - }, - { - "epoch": 0.61, - "learning_rate": 1.9430658105379174e-05, - "loss": 2.3789, - "step": 350590 - }, - { - "epoch": 0.61, - "learning_rate": 1.9429786165452345e-05, - "loss": 2.443, - "step": 350600 - }, - { - "epoch": 0.61, - "learning_rate": 1.942891422552552e-05, - "loss": 2.3315, - "step": 350610 - }, - { - "epoch": 0.61, - "learning_rate": 1.9428042285598692e-05, - "loss": 2.277, - "step": 350620 - }, - { - "epoch": 0.61, - "learning_rate": 1.9427170345671866e-05, - "loss": 2.4399, - "step": 350630 - }, - { - "epoch": 0.61, - "learning_rate": 1.942629840574504e-05, - "loss": 2.3914, - "step": 350640 - }, - { - "epoch": 0.61, - "learning_rate": 1.942542646581821e-05, - "loss": 2.3621, - "step": 350650 - }, - { - "epoch": 0.61, - "learning_rate": 1.9424554525891387e-05, - "loss": 2.3896, - "step": 350660 - }, - { - "epoch": 0.61, - "learning_rate": 1.9423682585964558e-05, - "loss": 2.3994, - "step": 350670 - }, - { - "epoch": 0.61, - "learning_rate": 1.942281064603773e-05, - "loss": 2.4933, - "step": 350680 - }, - { - "epoch": 0.61, - "learning_rate": 1.9421938706110905e-05, - "loss": 2.3857, - "step": 350690 - }, - { - "epoch": 0.61, - "learning_rate": 1.942106676618408e-05, - "loss": 2.3293, - "step": 350700 - }, - { - "epoch": 0.61, - "learning_rate": 1.9420194826257253e-05, - "loss": 2.3531, - "step": 350710 - }, - { - "epoch": 0.61, - "learning_rate": 1.9419322886330423e-05, - "loss": 2.2928, - "step": 350720 - }, - { - "epoch": 0.61, - "learning_rate": 1.9418450946403597e-05, - "loss": 2.2813, - "step": 350730 - }, - { - "epoch": 0.61, - "learning_rate": 1.941757900647677e-05, - "loss": 2.4508, - "step": 350740 - }, - { - "epoch": 0.61, - "learning_rate": 1.9416707066549945e-05, - "loss": 2.4032, - "step": 350750 - }, - { - "epoch": 0.61, - "learning_rate": 1.9415835126623115e-05, - "loss": 2.1607, - "step": 350760 - }, - { - "epoch": 0.61, - "learning_rate": 1.9414963186696292e-05, - "loss": 2.4208, - "step": 350770 - }, - { - "epoch": 0.61, - "learning_rate": 1.9414091246769462e-05, - "loss": 2.2934, - "step": 350780 - }, - { - "epoch": 0.61, - "learning_rate": 1.9413219306842636e-05, - "loss": 2.4268, - "step": 350790 - }, - { - "epoch": 0.61, - "learning_rate": 1.941234736691581e-05, - "loss": 2.3817, - "step": 350800 - }, - { - "epoch": 0.61, - "learning_rate": 1.9411475426988984e-05, - "loss": 2.2679, - "step": 350810 - }, - { - "epoch": 0.61, - "learning_rate": 1.9410603487062158e-05, - "loss": 2.3931, - "step": 350820 - }, - { - "epoch": 0.61, - "learning_rate": 1.9409731547135328e-05, - "loss": 2.3632, - "step": 350830 - }, - { - "epoch": 0.61, - "learning_rate": 1.9408859607208502e-05, - "loss": 2.2648, - "step": 350840 - }, - { - "epoch": 0.61, - "learning_rate": 1.9407987667281675e-05, - "loss": 2.3967, - "step": 350850 - }, - { - "epoch": 0.61, - "learning_rate": 1.940711572735485e-05, - "loss": 2.3237, - "step": 350860 - }, - { - "epoch": 0.61, - "learning_rate": 1.9406243787428023e-05, - "loss": 2.3493, - "step": 350870 - }, - { - "epoch": 0.61, - "learning_rate": 1.9405371847501193e-05, - "loss": 2.3353, - "step": 350880 - }, - { - "epoch": 0.61, - "learning_rate": 1.940449990757437e-05, - "loss": 2.3569, - "step": 350890 - }, - { - "epoch": 0.61, - "learning_rate": 1.940362796764754e-05, - "loss": 2.2781, - "step": 350900 - }, - { - "epoch": 0.61, - "learning_rate": 1.9402756027720715e-05, - "loss": 2.3941, - "step": 350910 - }, - { - "epoch": 0.61, - "learning_rate": 1.940188408779389e-05, - "loss": 2.3126, - "step": 350920 - }, - { - "epoch": 0.61, - "learning_rate": 1.9401012147867062e-05, - "loss": 2.3621, - "step": 350930 - }, - { - "epoch": 0.61, - "learning_rate": 1.9400140207940236e-05, - "loss": 2.2582, - "step": 350940 - }, - { - "epoch": 0.61, - "learning_rate": 1.9399268268013406e-05, - "loss": 2.3525, - "step": 350950 - }, - { - "epoch": 0.61, - "learning_rate": 1.9398396328086584e-05, - "loss": 2.1914, - "step": 350960 - }, - { - "epoch": 0.61, - "learning_rate": 1.9397524388159754e-05, - "loss": 2.3354, - "step": 350970 - }, - { - "epoch": 0.61, - "learning_rate": 1.9396652448232928e-05, - "loss": 2.2848, - "step": 350980 - }, - { - "epoch": 0.61, - "learning_rate": 1.9395780508306098e-05, - "loss": 2.3851, - "step": 350990 - }, - { - "epoch": 0.61, - "learning_rate": 1.9394908568379275e-05, - "loss": 2.3634, - "step": 351000 - }, - { - "epoch": 0.61, - "learning_rate": 1.9394036628452446e-05, - "loss": 2.1852, - "step": 351010 - }, - { - "epoch": 0.61, - "learning_rate": 1.939316468852562e-05, - "loss": 2.2594, - "step": 351020 - }, - { - "epoch": 0.61, - "learning_rate": 1.9392292748598793e-05, - "loss": 2.3555, - "step": 351030 - }, - { - "epoch": 0.61, - "learning_rate": 1.9391420808671967e-05, - "loss": 2.2483, - "step": 351040 - }, - { - "epoch": 0.61, - "learning_rate": 1.939054886874514e-05, - "loss": 2.4466, - "step": 351050 - }, - { - "epoch": 0.61, - "learning_rate": 1.938967692881831e-05, - "loss": 2.311, - "step": 351060 - }, - { - "epoch": 0.61, - "learning_rate": 1.9388804988891488e-05, - "loss": 2.2989, - "step": 351070 - }, - { - "epoch": 0.61, - "learning_rate": 1.938793304896466e-05, - "loss": 2.3503, - "step": 351080 - }, - { - "epoch": 0.61, - "learning_rate": 1.9387061109037832e-05, - "loss": 2.3594, - "step": 351090 - }, - { - "epoch": 0.61, - "learning_rate": 1.9386189169111006e-05, - "loss": 2.1794, - "step": 351100 - }, - { - "epoch": 0.61, - "learning_rate": 1.938531722918418e-05, - "loss": 2.3606, - "step": 351110 - }, - { - "epoch": 0.61, - "learning_rate": 1.9384445289257354e-05, - "loss": 2.3213, - "step": 351120 - }, - { - "epoch": 0.61, - "learning_rate": 1.9383573349330524e-05, - "loss": 2.3079, - "step": 351130 - }, - { - "epoch": 0.61, - "learning_rate": 1.9382701409403698e-05, - "loss": 2.3715, - "step": 351140 - }, - { - "epoch": 0.61, - "learning_rate": 1.938182946947687e-05, - "loss": 2.3533, - "step": 351150 - }, - { - "epoch": 0.61, - "learning_rate": 1.9380957529550045e-05, - "loss": 2.3097, - "step": 351160 - }, - { - "epoch": 0.61, - "learning_rate": 1.938008558962322e-05, - "loss": 2.308, - "step": 351170 - }, - { - "epoch": 0.61, - "learning_rate": 1.9379213649696393e-05, - "loss": 2.4096, - "step": 351180 - }, - { - "epoch": 0.61, - "learning_rate": 1.9378341709769567e-05, - "loss": 2.4192, - "step": 351190 - }, - { - "epoch": 0.61, - "learning_rate": 1.9377469769842737e-05, - "loss": 2.2383, - "step": 351200 - }, - { - "epoch": 0.61, - "learning_rate": 1.937659782991591e-05, - "loss": 2.2369, - "step": 351210 - }, - { - "epoch": 0.61, - "learning_rate": 1.9375725889989085e-05, - "loss": 2.2109, - "step": 351220 - }, - { - "epoch": 0.61, - "learning_rate": 1.937485395006226e-05, - "loss": 2.3387, - "step": 351230 - }, - { - "epoch": 0.61, - "learning_rate": 1.937398201013543e-05, - "loss": 2.312, - "step": 351240 - }, - { - "epoch": 0.61, - "learning_rate": 1.9373110070208603e-05, - "loss": 2.3065, - "step": 351250 - }, - { - "epoch": 0.61, - "learning_rate": 1.9372238130281776e-05, - "loss": 2.5074, - "step": 351260 - }, - { - "epoch": 0.61, - "learning_rate": 1.937136619035495e-05, - "loss": 2.3855, - "step": 351270 - }, - { - "epoch": 0.61, - "learning_rate": 1.9370494250428124e-05, - "loss": 2.2574, - "step": 351280 - }, - { - "epoch": 0.61, - "learning_rate": 1.9369622310501294e-05, - "loss": 2.2938, - "step": 351290 - }, - { - "epoch": 0.61, - "learning_rate": 1.936875037057447e-05, - "loss": 2.3534, - "step": 351300 - }, - { - "epoch": 0.61, - "learning_rate": 1.9367878430647642e-05, - "loss": 2.2647, - "step": 351310 - }, - { - "epoch": 0.61, - "learning_rate": 1.9367006490720816e-05, - "loss": 2.2329, - "step": 351320 - }, - { - "epoch": 0.61, - "learning_rate": 1.936613455079399e-05, - "loss": 2.3117, - "step": 351330 - }, - { - "epoch": 0.61, - "learning_rate": 1.9365262610867163e-05, - "loss": 2.3391, - "step": 351340 - }, - { - "epoch": 0.61, - "learning_rate": 1.9364390670940337e-05, - "loss": 2.2818, - "step": 351350 - }, - { - "epoch": 0.61, - "learning_rate": 1.9363518731013507e-05, - "loss": 2.3501, - "step": 351360 - }, - { - "epoch": 0.61, - "learning_rate": 1.9362646791086684e-05, - "loss": 2.3468, - "step": 351370 - }, - { - "epoch": 0.61, - "learning_rate": 1.9361774851159855e-05, - "loss": 2.3496, - "step": 351380 - }, - { - "epoch": 0.61, - "learning_rate": 1.936090291123303e-05, - "loss": 2.2662, - "step": 351390 - }, - { - "epoch": 0.61, - "learning_rate": 1.93600309713062e-05, - "loss": 2.3161, - "step": 351400 - }, - { - "epoch": 0.61, - "learning_rate": 1.9359159031379376e-05, - "loss": 2.2694, - "step": 351410 - }, - { - "epoch": 0.61, - "learning_rate": 1.935828709145255e-05, - "loss": 2.3888, - "step": 351420 - }, - { - "epoch": 0.61, - "learning_rate": 1.935741515152572e-05, - "loss": 2.4068, - "step": 351430 - }, - { - "epoch": 0.61, - "learning_rate": 1.9356543211598897e-05, - "loss": 2.2384, - "step": 351440 - }, - { - "epoch": 0.61, - "learning_rate": 1.9355671271672068e-05, - "loss": 2.319, - "step": 351450 - }, - { - "epoch": 0.61, - "learning_rate": 1.935479933174524e-05, - "loss": 2.1383, - "step": 351460 - }, - { - "epoch": 0.61, - "learning_rate": 1.9353927391818412e-05, - "loss": 2.3237, - "step": 351470 - }, - { - "epoch": 0.61, - "learning_rate": 1.935305545189159e-05, - "loss": 2.3531, - "step": 351480 - }, - { - "epoch": 0.61, - "learning_rate": 1.935218351196476e-05, - "loss": 2.4745, - "step": 351490 - }, - { - "epoch": 0.61, - "learning_rate": 1.9351311572037933e-05, - "loss": 2.3462, - "step": 351500 - }, - { - "epoch": 0.61, - "learning_rate": 1.9350439632111107e-05, - "loss": 2.3345, - "step": 351510 - }, - { - "epoch": 0.61, - "learning_rate": 1.934956769218428e-05, - "loss": 2.1794, - "step": 351520 - }, - { - "epoch": 0.61, - "learning_rate": 1.9348695752257455e-05, - "loss": 2.3027, - "step": 351530 - }, - { - "epoch": 0.61, - "learning_rate": 1.9347823812330625e-05, - "loss": 2.3702, - "step": 351540 - }, - { - "epoch": 0.61, - "learning_rate": 1.93469518724038e-05, - "loss": 2.4399, - "step": 351550 - }, - { - "epoch": 0.61, - "learning_rate": 1.9346079932476973e-05, - "loss": 2.3612, - "step": 351560 - }, - { - "epoch": 0.61, - "learning_rate": 1.9345207992550146e-05, - "loss": 2.2329, - "step": 351570 - }, - { - "epoch": 0.61, - "learning_rate": 1.934433605262332e-05, - "loss": 2.3537, - "step": 351580 - }, - { - "epoch": 0.61, - "learning_rate": 1.9343464112696494e-05, - "loss": 2.2603, - "step": 351590 - }, - { - "epoch": 0.61, - "learning_rate": 1.9342592172769668e-05, - "loss": 2.338, - "step": 351600 - }, - { - "epoch": 0.61, - "learning_rate": 1.9341720232842838e-05, - "loss": 2.3767, - "step": 351610 - }, - { - "epoch": 0.61, - "learning_rate": 1.9340848292916012e-05, - "loss": 2.1545, - "step": 351620 - }, - { - "epoch": 0.61, - "learning_rate": 1.9339976352989186e-05, - "loss": 2.4031, - "step": 351630 - }, - { - "epoch": 0.61, - "learning_rate": 1.933910441306236e-05, - "loss": 2.5121, - "step": 351640 - }, - { - "epoch": 0.61, - "learning_rate": 1.933823247313553e-05, - "loss": 2.3664, - "step": 351650 - }, - { - "epoch": 0.61, - "learning_rate": 1.9337360533208703e-05, - "loss": 2.243, - "step": 351660 - }, - { - "epoch": 0.61, - "learning_rate": 1.933648859328188e-05, - "loss": 2.2896, - "step": 351670 - }, - { - "epoch": 0.61, - "learning_rate": 1.933561665335505e-05, - "loss": 2.3792, - "step": 351680 - }, - { - "epoch": 0.61, - "learning_rate": 1.9334744713428225e-05, - "loss": 2.1943, - "step": 351690 - }, - { - "epoch": 0.61, - "learning_rate": 1.93338727735014e-05, - "loss": 2.4077, - "step": 351700 - }, - { - "epoch": 0.61, - "learning_rate": 1.9333000833574572e-05, - "loss": 2.186, - "step": 351710 - }, - { - "epoch": 0.61, - "learning_rate": 1.9332128893647743e-05, - "loss": 2.2958, - "step": 351720 - }, - { - "epoch": 0.61, - "learning_rate": 1.9331256953720916e-05, - "loss": 2.3836, - "step": 351730 - }, - { - "epoch": 0.61, - "learning_rate": 1.933038501379409e-05, - "loss": 2.2563, - "step": 351740 - }, - { - "epoch": 0.61, - "learning_rate": 1.9329513073867264e-05, - "loss": 2.3357, - "step": 351750 - }, - { - "epoch": 0.61, - "learning_rate": 1.9328641133940438e-05, - "loss": 2.3468, - "step": 351760 - }, - { - "epoch": 0.61, - "learning_rate": 1.9327769194013608e-05, - "loss": 2.36, - "step": 351770 - }, - { - "epoch": 0.61, - "learning_rate": 1.9326897254086785e-05, - "loss": 2.3806, - "step": 351780 - }, - { - "epoch": 0.61, - "learning_rate": 1.9326025314159956e-05, - "loss": 2.3949, - "step": 351790 - }, - { - "epoch": 0.61, - "learning_rate": 1.932515337423313e-05, - "loss": 2.3161, - "step": 351800 - }, - { - "epoch": 0.61, - "learning_rate": 1.9324281434306303e-05, - "loss": 2.3753, - "step": 351810 - }, - { - "epoch": 0.61, - "learning_rate": 1.9323409494379477e-05, - "loss": 2.4087, - "step": 351820 - }, - { - "epoch": 0.61, - "learning_rate": 1.932253755445265e-05, - "loss": 2.4001, - "step": 351830 - }, - { - "epoch": 0.61, - "learning_rate": 1.932166561452582e-05, - "loss": 2.3471, - "step": 351840 - }, - { - "epoch": 0.61, - "learning_rate": 1.9320793674598998e-05, - "loss": 2.3621, - "step": 351850 - }, - { - "epoch": 0.61, - "learning_rate": 1.931992173467217e-05, - "loss": 2.2435, - "step": 351860 - }, - { - "epoch": 0.61, - "learning_rate": 1.9319049794745342e-05, - "loss": 2.3931, - "step": 351870 - }, - { - "epoch": 0.61, - "learning_rate": 1.9318177854818513e-05, - "loss": 2.339, - "step": 351880 - }, - { - "epoch": 0.61, - "learning_rate": 1.931730591489169e-05, - "loss": 2.2032, - "step": 351890 - }, - { - "epoch": 0.61, - "learning_rate": 1.9316433974964864e-05, - "loss": 2.4309, - "step": 351900 - }, - { - "epoch": 0.61, - "learning_rate": 1.9315562035038034e-05, - "loss": 2.3995, - "step": 351910 - }, - { - "epoch": 0.61, - "learning_rate": 1.9314690095111208e-05, - "loss": 2.5287, - "step": 351920 - }, - { - "epoch": 0.61, - "learning_rate": 1.931381815518438e-05, - "loss": 2.3346, - "step": 351930 - }, - { - "epoch": 0.61, - "learning_rate": 1.9312946215257555e-05, - "loss": 2.31, - "step": 351940 - }, - { - "epoch": 0.61, - "learning_rate": 1.9312074275330726e-05, - "loss": 2.2544, - "step": 351950 - }, - { - "epoch": 0.61, - "learning_rate": 1.93112023354039e-05, - "loss": 2.2731, - "step": 351960 - }, - { - "epoch": 0.61, - "learning_rate": 1.9310330395477073e-05, - "loss": 2.309, - "step": 351970 - }, - { - "epoch": 0.61, - "learning_rate": 1.9309458455550247e-05, - "loss": 2.2533, - "step": 351980 - }, - { - "epoch": 0.61, - "learning_rate": 1.930858651562342e-05, - "loss": 2.3054, - "step": 351990 - }, - { - "epoch": 0.61, - "learning_rate": 1.9307714575696595e-05, - "loss": 2.3289, - "step": 352000 - }, - { - "epoch": 0.61, - "learning_rate": 1.930684263576977e-05, - "loss": 2.3502, - "step": 352010 - }, - { - "epoch": 0.61, - "learning_rate": 1.930597069584294e-05, - "loss": 2.2713, - "step": 352020 - }, - { - "epoch": 0.61, - "learning_rate": 1.9305098755916113e-05, - "loss": 2.2883, - "step": 352030 - }, - { - "epoch": 0.61, - "learning_rate": 1.9304226815989286e-05, - "loss": 2.3939, - "step": 352040 - }, - { - "epoch": 0.61, - "learning_rate": 1.930335487606246e-05, - "loss": 2.3443, - "step": 352050 - }, - { - "epoch": 0.61, - "learning_rate": 1.9302482936135634e-05, - "loss": 2.3718, - "step": 352060 - }, - { - "epoch": 0.61, - "learning_rate": 1.9301610996208804e-05, - "loss": 2.2931, - "step": 352070 - }, - { - "epoch": 0.61, - "learning_rate": 1.930073905628198e-05, - "loss": 2.3151, - "step": 352080 - }, - { - "epoch": 0.61, - "learning_rate": 1.9299867116355152e-05, - "loss": 2.3586, - "step": 352090 - }, - { - "epoch": 0.61, - "learning_rate": 1.9298995176428326e-05, - "loss": 2.1977, - "step": 352100 - }, - { - "epoch": 0.61, - "learning_rate": 1.92981232365015e-05, - "loss": 2.3279, - "step": 352110 - }, - { - "epoch": 0.61, - "learning_rate": 1.9297251296574673e-05, - "loss": 2.3613, - "step": 352120 - }, - { - "epoch": 0.61, - "learning_rate": 1.9296379356647844e-05, - "loss": 2.2524, - "step": 352130 - }, - { - "epoch": 0.61, - "learning_rate": 1.9295507416721017e-05, - "loss": 2.2632, - "step": 352140 - }, - { - "epoch": 0.61, - "learning_rate": 1.9294635476794194e-05, - "loss": 2.3043, - "step": 352150 - }, - { - "epoch": 0.61, - "learning_rate": 1.9293763536867365e-05, - "loss": 2.4222, - "step": 352160 - }, - { - "epoch": 0.61, - "learning_rate": 1.929289159694054e-05, - "loss": 2.3303, - "step": 352170 - }, - { - "epoch": 0.61, - "learning_rate": 1.929201965701371e-05, - "loss": 2.3124, - "step": 352180 - }, - { - "epoch": 0.61, - "learning_rate": 1.9291147717086886e-05, - "loss": 2.2757, - "step": 352190 - }, - { - "epoch": 0.61, - "learning_rate": 1.9290275777160057e-05, - "loss": 2.2246, - "step": 352200 - }, - { - "epoch": 0.61, - "learning_rate": 1.928940383723323e-05, - "loss": 2.3697, - "step": 352210 - }, - { - "epoch": 0.61, - "learning_rate": 1.9288531897306404e-05, - "loss": 2.2523, - "step": 352220 - }, - { - "epoch": 0.61, - "learning_rate": 1.9287659957379578e-05, - "loss": 2.2326, - "step": 352230 - }, - { - "epoch": 0.61, - "learning_rate": 1.928678801745275e-05, - "loss": 2.3909, - "step": 352240 - }, - { - "epoch": 0.61, - "learning_rate": 1.9285916077525922e-05, - "loss": 2.3627, - "step": 352250 - }, - { - "epoch": 0.61, - "learning_rate": 1.92850441375991e-05, - "loss": 2.2352, - "step": 352260 - }, - { - "epoch": 0.61, - "learning_rate": 1.928417219767227e-05, - "loss": 2.3287, - "step": 352270 - }, - { - "epoch": 0.61, - "learning_rate": 1.9283300257745443e-05, - "loss": 2.3373, - "step": 352280 - }, - { - "epoch": 0.61, - "learning_rate": 1.9282428317818617e-05, - "loss": 2.2982, - "step": 352290 - }, - { - "epoch": 0.61, - "learning_rate": 1.928155637789179e-05, - "loss": 2.3906, - "step": 352300 - }, - { - "epoch": 0.61, - "learning_rate": 1.9280684437964965e-05, - "loss": 2.3978, - "step": 352310 - }, - { - "epoch": 0.61, - "learning_rate": 1.9279812498038135e-05, - "loss": 2.31, - "step": 352320 - }, - { - "epoch": 0.61, - "learning_rate": 1.927894055811131e-05, - "loss": 2.3508, - "step": 352330 - }, - { - "epoch": 0.61, - "learning_rate": 1.9278068618184483e-05, - "loss": 2.3715, - "step": 352340 - }, - { - "epoch": 0.61, - "learning_rate": 1.9277196678257656e-05, - "loss": 2.3579, - "step": 352350 - }, - { - "epoch": 0.61, - "learning_rate": 1.9276324738330827e-05, - "loss": 2.213, - "step": 352360 - }, - { - "epoch": 0.61, - "learning_rate": 1.9275452798404004e-05, - "loss": 2.3481, - "step": 352370 - }, - { - "epoch": 0.61, - "learning_rate": 1.9274580858477174e-05, - "loss": 2.3682, - "step": 352380 - }, - { - "epoch": 0.61, - "learning_rate": 1.9273708918550348e-05, - "loss": 2.2858, - "step": 352390 - }, - { - "epoch": 0.61, - "learning_rate": 1.9272836978623522e-05, - "loss": 2.2761, - "step": 352400 - }, - { - "epoch": 0.61, - "learning_rate": 1.9271965038696696e-05, - "loss": 2.449, - "step": 352410 - }, - { - "epoch": 0.61, - "learning_rate": 1.927109309876987e-05, - "loss": 2.3858, - "step": 352420 - }, - { - "epoch": 0.61, - "learning_rate": 1.927022115884304e-05, - "loss": 2.3359, - "step": 352430 - }, - { - "epoch": 0.61, - "learning_rate": 1.9269349218916213e-05, - "loss": 2.3807, - "step": 352440 - }, - { - "epoch": 0.61, - "learning_rate": 1.9268477278989387e-05, - "loss": 2.3303, - "step": 352450 - }, - { - "epoch": 0.61, - "learning_rate": 1.926760533906256e-05, - "loss": 2.3351, - "step": 352460 - }, - { - "epoch": 0.61, - "learning_rate": 1.9266733399135735e-05, - "loss": 2.3722, - "step": 352470 - }, - { - "epoch": 0.61, - "learning_rate": 1.9265861459208905e-05, - "loss": 2.3598, - "step": 352480 - }, - { - "epoch": 0.61, - "learning_rate": 1.9264989519282082e-05, - "loss": 2.3633, - "step": 352490 - }, - { - "epoch": 0.61, - "learning_rate": 1.9264117579355253e-05, - "loss": 2.3121, - "step": 352500 - }, - { - "epoch": 0.61, - "learning_rate": 1.9263245639428426e-05, - "loss": 2.2985, - "step": 352510 - }, - { - "epoch": 0.61, - "learning_rate": 1.92623736995016e-05, - "loss": 2.3765, - "step": 352520 - }, - { - "epoch": 0.61, - "learning_rate": 1.9261501759574774e-05, - "loss": 2.3647, - "step": 352530 - }, - { - "epoch": 0.61, - "learning_rate": 1.9260629819647948e-05, - "loss": 2.3487, - "step": 352540 - }, - { - "epoch": 0.61, - "learning_rate": 1.9259757879721118e-05, - "loss": 2.2997, - "step": 352550 - }, - { - "epoch": 0.61, - "learning_rate": 1.9258885939794295e-05, - "loss": 2.3264, - "step": 352560 - }, - { - "epoch": 0.61, - "learning_rate": 1.9258013999867466e-05, - "loss": 2.2198, - "step": 352570 - }, - { - "epoch": 0.61, - "learning_rate": 1.925714205994064e-05, - "loss": 2.3388, - "step": 352580 - }, - { - "epoch": 0.61, - "learning_rate": 1.925627012001381e-05, - "loss": 2.3546, - "step": 352590 - }, - { - "epoch": 0.61, - "learning_rate": 1.9255398180086987e-05, - "loss": 2.4553, - "step": 352600 - }, - { - "epoch": 0.61, - "learning_rate": 1.9254526240160157e-05, - "loss": 2.2963, - "step": 352610 - }, - { - "epoch": 0.61, - "learning_rate": 1.925365430023333e-05, - "loss": 2.2756, - "step": 352620 - }, - { - "epoch": 0.61, - "learning_rate": 1.9252782360306508e-05, - "loss": 2.1609, - "step": 352630 - }, - { - "epoch": 0.61, - "learning_rate": 1.925191042037968e-05, - "loss": 2.3627, - "step": 352640 - }, - { - "epoch": 0.61, - "learning_rate": 1.9251038480452852e-05, - "loss": 2.3473, - "step": 352650 - }, - { - "epoch": 0.61, - "learning_rate": 1.9250166540526023e-05, - "loss": 2.3646, - "step": 352660 - }, - { - "epoch": 0.62, - "learning_rate": 1.92492946005992e-05, - "loss": 2.3062, - "step": 352670 - }, - { - "epoch": 0.62, - "learning_rate": 1.924842266067237e-05, - "loss": 2.3411, - "step": 352680 - }, - { - "epoch": 0.62, - "learning_rate": 1.9247550720745544e-05, - "loss": 2.2752, - "step": 352690 - }, - { - "epoch": 0.62, - "learning_rate": 1.9246678780818718e-05, - "loss": 2.4229, - "step": 352700 - }, - { - "epoch": 0.62, - "learning_rate": 1.924580684089189e-05, - "loss": 2.3005, - "step": 352710 - }, - { - "epoch": 0.62, - "learning_rate": 1.9244934900965065e-05, - "loss": 2.3177, - "step": 352720 - }, - { - "epoch": 0.62, - "learning_rate": 1.9244062961038236e-05, - "loss": 2.349, - "step": 352730 - }, - { - "epoch": 0.62, - "learning_rate": 1.924319102111141e-05, - "loss": 2.4152, - "step": 352740 - }, - { - "epoch": 0.62, - "learning_rate": 1.9242319081184583e-05, - "loss": 2.2336, - "step": 352750 - }, - { - "epoch": 0.62, - "learning_rate": 1.9241447141257757e-05, - "loss": 2.2835, - "step": 352760 - }, - { - "epoch": 0.62, - "learning_rate": 1.924057520133093e-05, - "loss": 2.3763, - "step": 352770 - }, - { - "epoch": 0.62, - "learning_rate": 1.9239703261404105e-05, - "loss": 2.3355, - "step": 352780 - }, - { - "epoch": 0.62, - "learning_rate": 1.923883132147728e-05, - "loss": 2.3411, - "step": 352790 - }, - { - "epoch": 0.62, - "learning_rate": 1.923795938155045e-05, - "loss": 2.4064, - "step": 352800 - }, - { - "epoch": 0.62, - "learning_rate": 1.9237087441623623e-05, - "loss": 2.2678, - "step": 352810 - }, - { - "epoch": 0.62, - "learning_rate": 1.9236215501696796e-05, - "loss": 2.3946, - "step": 352820 - }, - { - "epoch": 0.62, - "learning_rate": 1.923534356176997e-05, - "loss": 2.3436, - "step": 352830 - }, - { - "epoch": 0.62, - "learning_rate": 1.923447162184314e-05, - "loss": 2.3496, - "step": 352840 - }, - { - "epoch": 0.62, - "learning_rate": 1.9233599681916314e-05, - "loss": 2.4113, - "step": 352850 - }, - { - "epoch": 0.62, - "learning_rate": 1.9232727741989488e-05, - "loss": 2.3536, - "step": 352860 - }, - { - "epoch": 0.62, - "learning_rate": 1.9231855802062662e-05, - "loss": 2.3412, - "step": 352870 - }, - { - "epoch": 0.62, - "learning_rate": 1.9230983862135836e-05, - "loss": 2.2557, - "step": 352880 - }, - { - "epoch": 0.62, - "learning_rate": 1.9230111922209006e-05, - "loss": 2.3198, - "step": 352890 - }, - { - "epoch": 0.62, - "learning_rate": 1.9229239982282183e-05, - "loss": 2.3592, - "step": 352900 - }, - { - "epoch": 0.62, - "learning_rate": 1.9228368042355354e-05, - "loss": 2.3016, - "step": 352910 - }, - { - "epoch": 0.62, - "learning_rate": 1.9227496102428527e-05, - "loss": 2.1598, - "step": 352920 - }, - { - "epoch": 0.62, - "learning_rate": 1.92266241625017e-05, - "loss": 2.2319, - "step": 352930 - }, - { - "epoch": 0.62, - "learning_rate": 1.9225752222574875e-05, - "loss": 2.3399, - "step": 352940 - }, - { - "epoch": 0.62, - "learning_rate": 1.922488028264805e-05, - "loss": 2.334, - "step": 352950 - }, - { - "epoch": 0.62, - "learning_rate": 1.922400834272122e-05, - "loss": 2.2906, - "step": 352960 - }, - { - "epoch": 0.62, - "learning_rate": 1.9223136402794396e-05, - "loss": 2.3146, - "step": 352970 - }, - { - "epoch": 0.62, - "learning_rate": 1.9222264462867567e-05, - "loss": 2.3183, - "step": 352980 - }, - { - "epoch": 0.62, - "learning_rate": 1.922139252294074e-05, - "loss": 2.2603, - "step": 352990 - }, - { - "epoch": 0.62, - "learning_rate": 1.922052058301391e-05, - "loss": 2.3446, - "step": 353000 - }, - { - "epoch": 0.62, - "learning_rate": 1.9219648643087088e-05, - "loss": 2.2515, - "step": 353010 - }, - { - "epoch": 0.62, - "learning_rate": 1.921877670316026e-05, - "loss": 2.2003, - "step": 353020 - }, - { - "epoch": 0.62, - "learning_rate": 1.9217904763233432e-05, - "loss": 2.2488, - "step": 353030 - }, - { - "epoch": 0.62, - "learning_rate": 1.921703282330661e-05, - "loss": 2.303, - "step": 353040 - }, - { - "epoch": 0.62, - "learning_rate": 1.921616088337978e-05, - "loss": 2.4693, - "step": 353050 - }, - { - "epoch": 0.62, - "learning_rate": 1.9215288943452953e-05, - "loss": 2.3871, - "step": 353060 - }, - { - "epoch": 0.62, - "learning_rate": 1.9214417003526124e-05, - "loss": 2.42, - "step": 353070 - }, - { - "epoch": 0.62, - "learning_rate": 1.92135450635993e-05, - "loss": 2.336, - "step": 353080 - }, - { - "epoch": 0.62, - "learning_rate": 1.921267312367247e-05, - "loss": 2.398, - "step": 353090 - }, - { - "epoch": 0.62, - "learning_rate": 1.9211801183745645e-05, - "loss": 2.4564, - "step": 353100 - }, - { - "epoch": 0.62, - "learning_rate": 1.921092924381882e-05, - "loss": 2.2654, - "step": 353110 - }, - { - "epoch": 0.62, - "learning_rate": 1.9210057303891993e-05, - "loss": 2.2311, - "step": 353120 - }, - { - "epoch": 0.62, - "learning_rate": 1.9209185363965166e-05, - "loss": 2.279, - "step": 353130 - }, - { - "epoch": 0.62, - "learning_rate": 1.9208313424038337e-05, - "loss": 2.2708, - "step": 353140 - }, - { - "epoch": 0.62, - "learning_rate": 1.920744148411151e-05, - "loss": 2.3183, - "step": 353150 - }, - { - "epoch": 0.62, - "learning_rate": 1.9206569544184684e-05, - "loss": 2.3354, - "step": 353160 - }, - { - "epoch": 0.62, - "learning_rate": 1.9205697604257858e-05, - "loss": 2.3809, - "step": 353170 - }, - { - "epoch": 0.62, - "learning_rate": 1.9204825664331032e-05, - "loss": 2.3224, - "step": 353180 - }, - { - "epoch": 0.62, - "learning_rate": 1.9203953724404206e-05, - "loss": 2.4346, - "step": 353190 - }, - { - "epoch": 0.62, - "learning_rate": 1.920308178447738e-05, - "loss": 2.3689, - "step": 353200 - }, - { - "epoch": 0.62, - "learning_rate": 1.920220984455055e-05, - "loss": 2.3053, - "step": 353210 - }, - { - "epoch": 0.62, - "learning_rate": 1.9201337904623723e-05, - "loss": 2.4265, - "step": 353220 - }, - { - "epoch": 0.62, - "learning_rate": 1.9200465964696897e-05, - "loss": 2.3443, - "step": 353230 - }, - { - "epoch": 0.62, - "learning_rate": 1.919959402477007e-05, - "loss": 2.3631, - "step": 353240 - }, - { - "epoch": 0.62, - "learning_rate": 1.9198722084843245e-05, - "loss": 2.1993, - "step": 353250 - }, - { - "epoch": 0.62, - "learning_rate": 1.9197850144916415e-05, - "loss": 2.2754, - "step": 353260 - }, - { - "epoch": 0.62, - "learning_rate": 1.9196978204989592e-05, - "loss": 2.276, - "step": 353270 - }, - { - "epoch": 0.62, - "learning_rate": 1.9196106265062763e-05, - "loss": 2.2699, - "step": 353280 - }, - { - "epoch": 0.62, - "learning_rate": 1.9195234325135936e-05, - "loss": 2.3672, - "step": 353290 - }, - { - "epoch": 0.62, - "learning_rate": 1.919436238520911e-05, - "loss": 2.2578, - "step": 353300 - }, - { - "epoch": 0.62, - "learning_rate": 1.9193490445282284e-05, - "loss": 2.4329, - "step": 353310 - }, - { - "epoch": 0.62, - "learning_rate": 1.9192618505355454e-05, - "loss": 2.3269, - "step": 353320 - }, - { - "epoch": 0.62, - "learning_rate": 1.9191746565428628e-05, - "loss": 2.2033, - "step": 353330 - }, - { - "epoch": 0.62, - "learning_rate": 1.9190874625501802e-05, - "loss": 2.3143, - "step": 353340 - }, - { - "epoch": 0.62, - "learning_rate": 1.9190002685574976e-05, - "loss": 2.2766, - "step": 353350 - }, - { - "epoch": 0.62, - "learning_rate": 1.918913074564815e-05, - "loss": 2.3377, - "step": 353360 - }, - { - "epoch": 0.62, - "learning_rate": 1.918825880572132e-05, - "loss": 2.3634, - "step": 353370 - }, - { - "epoch": 0.62, - "learning_rate": 1.9187386865794497e-05, - "loss": 2.345, - "step": 353380 - }, - { - "epoch": 0.62, - "learning_rate": 1.9186514925867667e-05, - "loss": 2.5013, - "step": 353390 - }, - { - "epoch": 0.62, - "learning_rate": 1.918564298594084e-05, - "loss": 2.3151, - "step": 353400 - }, - { - "epoch": 0.62, - "learning_rate": 1.9184771046014015e-05, - "loss": 2.2945, - "step": 353410 - }, - { - "epoch": 0.62, - "learning_rate": 1.918389910608719e-05, - "loss": 2.3246, - "step": 353420 - }, - { - "epoch": 0.62, - "learning_rate": 1.9183027166160362e-05, - "loss": 2.3089, - "step": 353430 - }, - { - "epoch": 0.62, - "learning_rate": 1.9182155226233533e-05, - "loss": 2.3661, - "step": 353440 - }, - { - "epoch": 0.62, - "learning_rate": 1.918128328630671e-05, - "loss": 2.2494, - "step": 353450 - }, - { - "epoch": 0.62, - "learning_rate": 1.918041134637988e-05, - "loss": 2.2646, - "step": 353460 - }, - { - "epoch": 0.62, - "learning_rate": 1.9179539406453054e-05, - "loss": 2.3082, - "step": 353470 - }, - { - "epoch": 0.62, - "learning_rate": 1.9178667466526225e-05, - "loss": 2.225, - "step": 353480 - }, - { - "epoch": 0.62, - "learning_rate": 1.91777955265994e-05, - "loss": 2.4318, - "step": 353490 - }, - { - "epoch": 0.62, - "learning_rate": 1.9176923586672575e-05, - "loss": 2.5269, - "step": 353500 - }, - { - "epoch": 0.62, - "learning_rate": 1.9176051646745746e-05, - "loss": 2.3051, - "step": 353510 - }, - { - "epoch": 0.62, - "learning_rate": 1.917517970681892e-05, - "loss": 2.3012, - "step": 353520 - }, - { - "epoch": 0.62, - "learning_rate": 1.9174307766892093e-05, - "loss": 2.3697, - "step": 353530 - }, - { - "epoch": 0.62, - "learning_rate": 1.9173435826965267e-05, - "loss": 2.2762, - "step": 353540 - }, - { - "epoch": 0.62, - "learning_rate": 1.9172563887038438e-05, - "loss": 2.2653, - "step": 353550 - }, - { - "epoch": 0.62, - "learning_rate": 1.9171691947111615e-05, - "loss": 2.2208, - "step": 353560 - }, - { - "epoch": 0.62, - "learning_rate": 1.9170820007184785e-05, - "loss": 2.224, - "step": 353570 - }, - { - "epoch": 0.62, - "learning_rate": 1.916994806725796e-05, - "loss": 2.4121, - "step": 353580 - }, - { - "epoch": 0.62, - "learning_rate": 1.9169076127331133e-05, - "loss": 2.3555, - "step": 353590 - }, - { - "epoch": 0.62, - "learning_rate": 1.9168204187404306e-05, - "loss": 2.3225, - "step": 353600 - }, - { - "epoch": 0.62, - "learning_rate": 1.916733224747748e-05, - "loss": 2.2641, - "step": 353610 - }, - { - "epoch": 0.62, - "learning_rate": 1.916646030755065e-05, - "loss": 2.3468, - "step": 353620 - }, - { - "epoch": 0.62, - "learning_rate": 1.9165588367623824e-05, - "loss": 2.3447, - "step": 353630 - }, - { - "epoch": 0.62, - "learning_rate": 1.9164716427696998e-05, - "loss": 2.3827, - "step": 353640 - }, - { - "epoch": 0.62, - "learning_rate": 1.9163844487770172e-05, - "loss": 2.2022, - "step": 353650 - }, - { - "epoch": 0.62, - "learning_rate": 1.9162972547843346e-05, - "loss": 2.3921, - "step": 353660 - }, - { - "epoch": 0.62, - "learning_rate": 1.9162100607916516e-05, - "loss": 2.3854, - "step": 353670 - }, - { - "epoch": 0.62, - "learning_rate": 1.9161228667989693e-05, - "loss": 2.3662, - "step": 353680 - }, - { - "epoch": 0.62, - "learning_rate": 1.9160356728062864e-05, - "loss": 2.3832, - "step": 353690 - }, - { - "epoch": 0.62, - "learning_rate": 1.9159484788136037e-05, - "loss": 2.288, - "step": 353700 - }, - { - "epoch": 0.62, - "learning_rate": 1.915861284820921e-05, - "loss": 2.3707, - "step": 353710 - }, - { - "epoch": 0.62, - "learning_rate": 1.9157740908282385e-05, - "loss": 2.4449, - "step": 353720 - }, - { - "epoch": 0.62, - "learning_rate": 1.9156868968355555e-05, - "loss": 2.2656, - "step": 353730 - }, - { - "epoch": 0.62, - "learning_rate": 1.915599702842873e-05, - "loss": 2.3816, - "step": 353740 - }, - { - "epoch": 0.62, - "learning_rate": 1.9155125088501906e-05, - "loss": 2.3126, - "step": 353750 - }, - { - "epoch": 0.62, - "learning_rate": 1.9154253148575077e-05, - "loss": 2.3158, - "step": 353760 - }, - { - "epoch": 0.62, - "learning_rate": 1.915338120864825e-05, - "loss": 2.2625, - "step": 353770 - }, - { - "epoch": 0.62, - "learning_rate": 1.915250926872142e-05, - "loss": 2.4002, - "step": 353780 - }, - { - "epoch": 0.62, - "learning_rate": 1.9151637328794598e-05, - "loss": 2.3731, - "step": 353790 - }, - { - "epoch": 0.62, - "learning_rate": 1.9150765388867768e-05, - "loss": 2.329, - "step": 353800 - }, - { - "epoch": 0.62, - "learning_rate": 1.9149893448940942e-05, - "loss": 2.3219, - "step": 353810 - }, - { - "epoch": 0.62, - "learning_rate": 1.9149021509014116e-05, - "loss": 2.368, - "step": 353820 - }, - { - "epoch": 0.62, - "learning_rate": 1.914814956908729e-05, - "loss": 2.3451, - "step": 353830 - }, - { - "epoch": 0.62, - "learning_rate": 1.9147277629160463e-05, - "loss": 2.2592, - "step": 353840 - }, - { - "epoch": 0.62, - "learning_rate": 1.9146405689233634e-05, - "loss": 2.3334, - "step": 353850 - }, - { - "epoch": 0.62, - "learning_rate": 1.914553374930681e-05, - "loss": 2.3908, - "step": 353860 - }, - { - "epoch": 0.62, - "learning_rate": 1.914466180937998e-05, - "loss": 2.4113, - "step": 353870 - }, - { - "epoch": 0.62, - "learning_rate": 1.9143789869453155e-05, - "loss": 2.3422, - "step": 353880 - }, - { - "epoch": 0.62, - "learning_rate": 1.914291792952633e-05, - "loss": 2.3907, - "step": 353890 - }, - { - "epoch": 0.62, - "learning_rate": 1.9142045989599503e-05, - "loss": 2.3747, - "step": 353900 - }, - { - "epoch": 0.62, - "learning_rate": 1.9141174049672676e-05, - "loss": 2.3505, - "step": 353910 - }, - { - "epoch": 0.62, - "learning_rate": 1.9140302109745847e-05, - "loss": 2.3849, - "step": 353920 - }, - { - "epoch": 0.62, - "learning_rate": 1.913943016981902e-05, - "loss": 2.3676, - "step": 353930 - }, - { - "epoch": 0.62, - "learning_rate": 1.9138558229892194e-05, - "loss": 2.3656, - "step": 353940 - }, - { - "epoch": 0.62, - "learning_rate": 1.9137686289965368e-05, - "loss": 2.2841, - "step": 353950 - }, - { - "epoch": 0.62, - "learning_rate": 1.913681435003854e-05, - "loss": 2.1853, - "step": 353960 - }, - { - "epoch": 0.62, - "learning_rate": 1.9135942410111716e-05, - "loss": 2.3183, - "step": 353970 - }, - { - "epoch": 0.62, - "learning_rate": 1.913507047018489e-05, - "loss": 2.2989, - "step": 353980 - }, - { - "epoch": 0.62, - "learning_rate": 1.913419853025806e-05, - "loss": 2.3171, - "step": 353990 - }, - { - "epoch": 0.62, - "learning_rate": 1.9133326590331233e-05, - "loss": 2.3766, - "step": 354000 - }, - { - "epoch": 0.62, - "learning_rate": 1.9132454650404407e-05, - "loss": 2.4828, - "step": 354010 - }, - { - "epoch": 0.62, - "learning_rate": 1.913158271047758e-05, - "loss": 2.3612, - "step": 354020 - }, - { - "epoch": 0.62, - "learning_rate": 1.913071077055075e-05, - "loss": 2.3321, - "step": 354030 - }, - { - "epoch": 0.62, - "learning_rate": 1.9129838830623925e-05, - "loss": 2.3099, - "step": 354040 - }, - { - "epoch": 0.62, - "learning_rate": 1.91289668906971e-05, - "loss": 2.4082, - "step": 354050 - }, - { - "epoch": 0.62, - "learning_rate": 1.9128094950770273e-05, - "loss": 2.1822, - "step": 354060 - }, - { - "epoch": 0.62, - "learning_rate": 1.9127223010843446e-05, - "loss": 2.2898, - "step": 354070 - }, - { - "epoch": 0.62, - "learning_rate": 1.9126351070916617e-05, - "loss": 2.386, - "step": 354080 - }, - { - "epoch": 0.62, - "learning_rate": 1.9125479130989794e-05, - "loss": 2.3076, - "step": 354090 - }, - { - "epoch": 0.62, - "learning_rate": 1.9124607191062964e-05, - "loss": 2.4046, - "step": 354100 - }, - { - "epoch": 0.62, - "learning_rate": 1.9123735251136138e-05, - "loss": 2.2114, - "step": 354110 - }, - { - "epoch": 0.62, - "learning_rate": 1.9122863311209312e-05, - "loss": 2.3992, - "step": 354120 - }, - { - "epoch": 0.62, - "learning_rate": 1.9121991371282486e-05, - "loss": 2.2635, - "step": 354130 - }, - { - "epoch": 0.62, - "learning_rate": 1.912111943135566e-05, - "loss": 2.3602, - "step": 354140 - }, - { - "epoch": 0.62, - "learning_rate": 1.912024749142883e-05, - "loss": 2.3757, - "step": 354150 - }, - { - "epoch": 0.62, - "learning_rate": 1.9119375551502007e-05, - "loss": 2.3524, - "step": 354160 - }, - { - "epoch": 0.62, - "learning_rate": 1.9118503611575177e-05, - "loss": 2.3117, - "step": 354170 - }, - { - "epoch": 0.62, - "learning_rate": 1.911763167164835e-05, - "loss": 2.3155, - "step": 354180 - }, - { - "epoch": 0.62, - "learning_rate": 1.911675973172152e-05, - "loss": 2.3, - "step": 354190 - }, - { - "epoch": 0.62, - "learning_rate": 1.91158877917947e-05, - "loss": 2.2535, - "step": 354200 - }, - { - "epoch": 0.62, - "learning_rate": 1.911501585186787e-05, - "loss": 2.309, - "step": 354210 - }, - { - "epoch": 0.62, - "learning_rate": 1.9114143911941043e-05, - "loss": 2.3784, - "step": 354220 - }, - { - "epoch": 0.62, - "learning_rate": 1.911327197201422e-05, - "loss": 2.2237, - "step": 354230 - }, - { - "epoch": 0.62, - "learning_rate": 1.911240003208739e-05, - "loss": 2.3269, - "step": 354240 - }, - { - "epoch": 0.62, - "learning_rate": 1.9111528092160564e-05, - "loss": 2.3262, - "step": 354250 - }, - { - "epoch": 0.62, - "learning_rate": 1.9110656152233735e-05, - "loss": 2.2644, - "step": 354260 - }, - { - "epoch": 0.62, - "learning_rate": 1.910978421230691e-05, - "loss": 2.3884, - "step": 354270 - }, - { - "epoch": 0.62, - "learning_rate": 1.9108912272380082e-05, - "loss": 2.2694, - "step": 354280 - }, - { - "epoch": 0.62, - "learning_rate": 1.9108040332453256e-05, - "loss": 2.4462, - "step": 354290 - }, - { - "epoch": 0.62, - "learning_rate": 1.910716839252643e-05, - "loss": 2.3721, - "step": 354300 - }, - { - "epoch": 0.62, - "learning_rate": 1.9106296452599603e-05, - "loss": 2.3488, - "step": 354310 - }, - { - "epoch": 0.62, - "learning_rate": 1.9105424512672777e-05, - "loss": 2.3403, - "step": 354320 - }, - { - "epoch": 0.62, - "learning_rate": 1.9104552572745948e-05, - "loss": 2.3967, - "step": 354330 - }, - { - "epoch": 0.62, - "learning_rate": 1.910368063281912e-05, - "loss": 2.4312, - "step": 354340 - }, - { - "epoch": 0.62, - "learning_rate": 1.9102808692892295e-05, - "loss": 2.3752, - "step": 354350 - }, - { - "epoch": 0.62, - "learning_rate": 1.910193675296547e-05, - "loss": 2.3046, - "step": 354360 - }, - { - "epoch": 0.62, - "learning_rate": 1.9101064813038643e-05, - "loss": 2.3323, - "step": 354370 - }, - { - "epoch": 0.62, - "learning_rate": 1.9100192873111816e-05, - "loss": 2.4438, - "step": 354380 - }, - { - "epoch": 0.62, - "learning_rate": 1.909932093318499e-05, - "loss": 2.283, - "step": 354390 - }, - { - "epoch": 0.62, - "learning_rate": 1.909844899325816e-05, - "loss": 2.4127, - "step": 354400 - }, - { - "epoch": 0.62, - "learning_rate": 1.9097577053331334e-05, - "loss": 2.3397, - "step": 354410 - }, - { - "epoch": 0.62, - "learning_rate": 1.9096705113404508e-05, - "loss": 2.3509, - "step": 354420 - }, - { - "epoch": 0.62, - "learning_rate": 1.9095833173477682e-05, - "loss": 2.1679, - "step": 354430 - }, - { - "epoch": 0.62, - "learning_rate": 1.9094961233550852e-05, - "loss": 2.2485, - "step": 354440 - }, - { - "epoch": 0.62, - "learning_rate": 1.9094089293624026e-05, - "loss": 2.3417, - "step": 354450 - }, - { - "epoch": 0.62, - "learning_rate": 1.90932173536972e-05, - "loss": 2.2627, - "step": 354460 - }, - { - "epoch": 0.62, - "learning_rate": 1.9092345413770374e-05, - "loss": 2.3511, - "step": 354470 - }, - { - "epoch": 0.62, - "learning_rate": 1.9091473473843547e-05, - "loss": 2.28, - "step": 354480 - }, - { - "epoch": 0.62, - "learning_rate": 1.909060153391672e-05, - "loss": 2.4491, - "step": 354490 - }, - { - "epoch": 0.62, - "learning_rate": 1.9089729593989895e-05, - "loss": 2.4492, - "step": 354500 - }, - { - "epoch": 0.62, - "learning_rate": 1.9088857654063065e-05, - "loss": 2.2463, - "step": 354510 - }, - { - "epoch": 0.62, - "learning_rate": 1.908798571413624e-05, - "loss": 2.2342, - "step": 354520 - }, - { - "epoch": 0.62, - "learning_rate": 1.9087113774209413e-05, - "loss": 2.2161, - "step": 354530 - }, - { - "epoch": 0.62, - "learning_rate": 1.9086241834282587e-05, - "loss": 2.3297, - "step": 354540 - }, - { - "epoch": 0.62, - "learning_rate": 1.908536989435576e-05, - "loss": 2.3889, - "step": 354550 - }, - { - "epoch": 0.62, - "learning_rate": 1.908449795442893e-05, - "loss": 2.3452, - "step": 354560 - }, - { - "epoch": 0.62, - "learning_rate": 1.9083626014502108e-05, - "loss": 2.3038, - "step": 354570 - }, - { - "epoch": 0.62, - "learning_rate": 1.9082754074575278e-05, - "loss": 2.2697, - "step": 354580 - }, - { - "epoch": 0.62, - "learning_rate": 1.9081882134648452e-05, - "loss": 2.2248, - "step": 354590 - }, - { - "epoch": 0.62, - "learning_rate": 1.9081010194721626e-05, - "loss": 2.212, - "step": 354600 - }, - { - "epoch": 0.62, - "learning_rate": 1.90801382547948e-05, - "loss": 2.4037, - "step": 354610 - }, - { - "epoch": 0.62, - "learning_rate": 1.9079266314867973e-05, - "loss": 2.3444, - "step": 354620 - }, - { - "epoch": 0.62, - "learning_rate": 1.9078394374941144e-05, - "loss": 2.3921, - "step": 354630 - }, - { - "epoch": 0.62, - "learning_rate": 1.907752243501432e-05, - "loss": 2.4174, - "step": 354640 - }, - { - "epoch": 0.62, - "learning_rate": 1.907665049508749e-05, - "loss": 2.2107, - "step": 354650 - }, - { - "epoch": 0.62, - "learning_rate": 1.9075778555160665e-05, - "loss": 2.2698, - "step": 354660 - }, - { - "epoch": 0.62, - "learning_rate": 1.9074906615233835e-05, - "loss": 2.3613, - "step": 354670 - }, - { - "epoch": 0.62, - "learning_rate": 1.9074034675307013e-05, - "loss": 2.3771, - "step": 354680 - }, - { - "epoch": 0.62, - "learning_rate": 1.9073162735380183e-05, - "loss": 2.3813, - "step": 354690 - }, - { - "epoch": 0.62, - "learning_rate": 1.9072290795453357e-05, - "loss": 2.2953, - "step": 354700 - }, - { - "epoch": 0.62, - "learning_rate": 1.907141885552653e-05, - "loss": 2.261, - "step": 354710 - }, - { - "epoch": 0.62, - "learning_rate": 1.9070546915599704e-05, - "loss": 2.3188, - "step": 354720 - }, - { - "epoch": 0.62, - "learning_rate": 1.9069674975672878e-05, - "loss": 2.3335, - "step": 354730 - }, - { - "epoch": 0.62, - "learning_rate": 1.906880303574605e-05, - "loss": 2.3903, - "step": 354740 - }, - { - "epoch": 0.62, - "learning_rate": 1.9067931095819222e-05, - "loss": 2.3928, - "step": 354750 - }, - { - "epoch": 0.62, - "learning_rate": 1.9067059155892396e-05, - "loss": 2.2841, - "step": 354760 - }, - { - "epoch": 0.62, - "learning_rate": 1.906618721596557e-05, - "loss": 2.405, - "step": 354770 - }, - { - "epoch": 0.62, - "learning_rate": 1.9065315276038743e-05, - "loss": 2.3709, - "step": 354780 - }, - { - "epoch": 0.62, - "learning_rate": 1.9064443336111917e-05, - "loss": 2.4336, - "step": 354790 - }, - { - "epoch": 0.62, - "learning_rate": 1.906357139618509e-05, - "loss": 2.3109, - "step": 354800 - }, - { - "epoch": 0.62, - "learning_rate": 1.906269945625826e-05, - "loss": 2.2109, - "step": 354810 - }, - { - "epoch": 0.62, - "learning_rate": 1.9061827516331435e-05, - "loss": 2.251, - "step": 354820 - }, - { - "epoch": 0.62, - "learning_rate": 1.906095557640461e-05, - "loss": 2.4301, - "step": 354830 - }, - { - "epoch": 0.62, - "learning_rate": 1.9060083636477783e-05, - "loss": 2.3077, - "step": 354840 - }, - { - "epoch": 0.62, - "learning_rate": 1.9059211696550956e-05, - "loss": 2.338, - "step": 354850 - }, - { - "epoch": 0.62, - "learning_rate": 1.9058339756624127e-05, - "loss": 2.3101, - "step": 354860 - }, - { - "epoch": 0.62, - "learning_rate": 1.9057467816697304e-05, - "loss": 2.3564, - "step": 354870 - }, - { - "epoch": 0.62, - "learning_rate": 1.9056595876770474e-05, - "loss": 2.3457, - "step": 354880 - }, - { - "epoch": 0.62, - "learning_rate": 1.9055723936843648e-05, - "loss": 2.2535, - "step": 354890 - }, - { - "epoch": 0.62, - "learning_rate": 1.9054851996916822e-05, - "loss": 2.4144, - "step": 354900 - }, - { - "epoch": 0.62, - "learning_rate": 1.9053980056989996e-05, - "loss": 2.4078, - "step": 354910 - }, - { - "epoch": 0.62, - "learning_rate": 1.9053108117063166e-05, - "loss": 2.3171, - "step": 354920 - }, - { - "epoch": 0.62, - "learning_rate": 1.905223617713634e-05, - "loss": 2.3465, - "step": 354930 - }, - { - "epoch": 0.62, - "learning_rate": 1.9051364237209514e-05, - "loss": 2.1954, - "step": 354940 - }, - { - "epoch": 0.62, - "learning_rate": 1.9050492297282687e-05, - "loss": 2.2595, - "step": 354950 - }, - { - "epoch": 0.62, - "learning_rate": 1.904962035735586e-05, - "loss": 2.3364, - "step": 354960 - }, - { - "epoch": 0.62, - "learning_rate": 1.904874841742903e-05, - "loss": 2.3002, - "step": 354970 - }, - { - "epoch": 0.62, - "learning_rate": 1.904787647750221e-05, - "loss": 2.2735, - "step": 354980 - }, - { - "epoch": 0.62, - "learning_rate": 1.904700453757538e-05, - "loss": 2.2518, - "step": 354990 - }, - { - "epoch": 0.62, - "learning_rate": 1.9046132597648553e-05, - "loss": 2.3581, - "step": 355000 - }, - { - "epoch": 0.62, - "learning_rate": 1.9045260657721727e-05, - "loss": 2.4076, - "step": 355010 - }, - { - "epoch": 0.62, - "learning_rate": 1.90443887177949e-05, - "loss": 2.3834, - "step": 355020 - }, - { - "epoch": 0.62, - "learning_rate": 1.9043516777868074e-05, - "loss": 2.4343, - "step": 355030 - }, - { - "epoch": 0.62, - "learning_rate": 1.9042644837941245e-05, - "loss": 2.1516, - "step": 355040 - }, - { - "epoch": 0.62, - "learning_rate": 1.904177289801442e-05, - "loss": 2.4127, - "step": 355050 - }, - { - "epoch": 0.62, - "learning_rate": 1.9040900958087592e-05, - "loss": 2.3384, - "step": 355060 - }, - { - "epoch": 0.62, - "learning_rate": 1.9040029018160766e-05, - "loss": 2.2323, - "step": 355070 - }, - { - "epoch": 0.62, - "learning_rate": 1.9039157078233936e-05, - "loss": 2.2788, - "step": 355080 - }, - { - "epoch": 0.62, - "learning_rate": 1.9038285138307113e-05, - "loss": 2.3994, - "step": 355090 - }, - { - "epoch": 0.62, - "learning_rate": 1.9037413198380287e-05, - "loss": 2.2839, - "step": 355100 - }, - { - "epoch": 0.62, - "learning_rate": 1.9036541258453458e-05, - "loss": 2.2376, - "step": 355110 - }, - { - "epoch": 0.62, - "learning_rate": 1.903566931852663e-05, - "loss": 2.3419, - "step": 355120 - }, - { - "epoch": 0.62, - "learning_rate": 1.9034797378599805e-05, - "loss": 2.33, - "step": 355130 - }, - { - "epoch": 0.62, - "learning_rate": 1.903392543867298e-05, - "loss": 2.219, - "step": 355140 - }, - { - "epoch": 0.62, - "learning_rate": 1.903305349874615e-05, - "loss": 2.3125, - "step": 355150 - }, - { - "epoch": 0.62, - "learning_rate": 1.9032181558819326e-05, - "loss": 2.3388, - "step": 355160 - }, - { - "epoch": 0.62, - "learning_rate": 1.9031309618892497e-05, - "loss": 2.2958, - "step": 355170 - }, - { - "epoch": 0.62, - "learning_rate": 1.903043767896567e-05, - "loss": 2.2924, - "step": 355180 - }, - { - "epoch": 0.62, - "learning_rate": 1.9029565739038844e-05, - "loss": 2.3403, - "step": 355190 - }, - { - "epoch": 0.62, - "learning_rate": 1.9028693799112018e-05, - "loss": 2.2199, - "step": 355200 - }, - { - "epoch": 0.62, - "learning_rate": 1.9027821859185192e-05, - "loss": 2.376, - "step": 355210 - }, - { - "epoch": 0.62, - "learning_rate": 1.9026949919258362e-05, - "loss": 2.2129, - "step": 355220 - }, - { - "epoch": 0.62, - "learning_rate": 1.9026077979331536e-05, - "loss": 2.2406, - "step": 355230 - }, - { - "epoch": 0.62, - "learning_rate": 1.902520603940471e-05, - "loss": 2.2892, - "step": 355240 - }, - { - "epoch": 0.62, - "learning_rate": 1.9024334099477884e-05, - "loss": 2.249, - "step": 355250 - }, - { - "epoch": 0.62, - "learning_rate": 1.9023462159551057e-05, - "loss": 2.3679, - "step": 355260 - }, - { - "epoch": 0.62, - "learning_rate": 1.9022590219624228e-05, - "loss": 2.3768, - "step": 355270 - }, - { - "epoch": 0.62, - "learning_rate": 1.9021718279697405e-05, - "loss": 2.4152, - "step": 355280 - }, - { - "epoch": 0.62, - "learning_rate": 1.9020846339770575e-05, - "loss": 2.3602, - "step": 355290 - }, - { - "epoch": 0.62, - "learning_rate": 1.901997439984375e-05, - "loss": 2.341, - "step": 355300 - }, - { - "epoch": 0.62, - "learning_rate": 1.9019102459916923e-05, - "loss": 2.3147, - "step": 355310 - }, - { - "epoch": 0.62, - "learning_rate": 1.9018230519990097e-05, - "loss": 2.3692, - "step": 355320 - }, - { - "epoch": 0.62, - "learning_rate": 1.901735858006327e-05, - "loss": 2.2406, - "step": 355330 - }, - { - "epoch": 0.62, - "learning_rate": 1.901648664013644e-05, - "loss": 2.3642, - "step": 355340 - }, - { - "epoch": 0.62, - "learning_rate": 1.9015614700209618e-05, - "loss": 2.3261, - "step": 355350 - }, - { - "epoch": 0.62, - "learning_rate": 1.9014742760282788e-05, - "loss": 2.3799, - "step": 355360 - }, - { - "epoch": 0.62, - "learning_rate": 1.9013870820355962e-05, - "loss": 2.295, - "step": 355370 - }, - { - "epoch": 0.62, - "learning_rate": 1.9012998880429132e-05, - "loss": 2.3274, - "step": 355380 - }, - { - "epoch": 0.62, - "learning_rate": 1.901212694050231e-05, - "loss": 2.2983, - "step": 355390 - }, - { - "epoch": 0.62, - "learning_rate": 1.901125500057548e-05, - "loss": 2.3331, - "step": 355400 - }, - { - "epoch": 0.62, - "learning_rate": 1.9010383060648654e-05, - "loss": 2.4162, - "step": 355410 - }, - { - "epoch": 0.62, - "learning_rate": 1.9009511120721827e-05, - "loss": 2.2132, - "step": 355420 - }, - { - "epoch": 0.62, - "learning_rate": 1.9008639180795e-05, - "loss": 2.3849, - "step": 355430 - }, - { - "epoch": 0.62, - "learning_rate": 1.9007767240868175e-05, - "loss": 2.2956, - "step": 355440 - }, - { - "epoch": 0.62, - "learning_rate": 1.9006895300941345e-05, - "loss": 2.3828, - "step": 355450 - }, - { - "epoch": 0.62, - "learning_rate": 1.9006023361014523e-05, - "loss": 2.3925, - "step": 355460 - }, - { - "epoch": 0.62, - "learning_rate": 1.9005151421087693e-05, - "loss": 2.2183, - "step": 355470 - }, - { - "epoch": 0.62, - "learning_rate": 1.9004279481160867e-05, - "loss": 2.2605, - "step": 355480 - }, - { - "epoch": 0.62, - "learning_rate": 1.900340754123404e-05, - "loss": 2.3754, - "step": 355490 - }, - { - "epoch": 0.62, - "learning_rate": 1.9002535601307214e-05, - "loss": 2.4308, - "step": 355500 - }, - { - "epoch": 0.62, - "learning_rate": 1.9001663661380388e-05, - "loss": 2.1994, - "step": 355510 - }, - { - "epoch": 0.62, - "learning_rate": 1.900079172145356e-05, - "loss": 2.3904, - "step": 355520 - }, - { - "epoch": 0.62, - "learning_rate": 1.8999919781526732e-05, - "loss": 2.2106, - "step": 355530 - }, - { - "epoch": 0.62, - "learning_rate": 1.8999047841599906e-05, - "loss": 2.4207, - "step": 355540 - }, - { - "epoch": 0.62, - "learning_rate": 1.899817590167308e-05, - "loss": 2.3091, - "step": 355550 - }, - { - "epoch": 0.62, - "learning_rate": 1.899730396174625e-05, - "loss": 2.2972, - "step": 355560 - }, - { - "epoch": 0.62, - "learning_rate": 1.8996432021819427e-05, - "loss": 2.2926, - "step": 355570 - }, - { - "epoch": 0.62, - "learning_rate": 1.89955600818926e-05, - "loss": 2.3798, - "step": 355580 - }, - { - "epoch": 0.62, - "learning_rate": 1.899468814196577e-05, - "loss": 2.2745, - "step": 355590 - }, - { - "epoch": 0.62, - "learning_rate": 1.8993816202038945e-05, - "loss": 2.2569, - "step": 355600 - }, - { - "epoch": 0.62, - "learning_rate": 1.899294426211212e-05, - "loss": 2.3995, - "step": 355610 - }, - { - "epoch": 0.62, - "learning_rate": 1.8992072322185293e-05, - "loss": 2.2954, - "step": 355620 - }, - { - "epoch": 0.62, - "learning_rate": 1.8991200382258463e-05, - "loss": 2.3473, - "step": 355630 - }, - { - "epoch": 0.62, - "learning_rate": 1.8990328442331637e-05, - "loss": 2.3251, - "step": 355640 - }, - { - "epoch": 0.62, - "learning_rate": 1.898945650240481e-05, - "loss": 2.3648, - "step": 355650 - }, - { - "epoch": 0.62, - "learning_rate": 1.8988584562477984e-05, - "loss": 2.2786, - "step": 355660 - }, - { - "epoch": 0.62, - "learning_rate": 1.8987712622551158e-05, - "loss": 2.2241, - "step": 355670 - }, - { - "epoch": 0.62, - "learning_rate": 1.898684068262433e-05, - "loss": 2.3936, - "step": 355680 - }, - { - "epoch": 0.62, - "learning_rate": 1.8985968742697506e-05, - "loss": 2.2385, - "step": 355690 - }, - { - "epoch": 0.62, - "learning_rate": 1.8985096802770676e-05, - "loss": 2.3769, - "step": 355700 - }, - { - "epoch": 0.62, - "learning_rate": 1.898422486284385e-05, - "loss": 2.369, - "step": 355710 - }, - { - "epoch": 0.62, - "learning_rate": 1.8983352922917024e-05, - "loss": 2.3555, - "step": 355720 - }, - { - "epoch": 0.62, - "learning_rate": 1.8982480982990197e-05, - "loss": 2.3335, - "step": 355730 - }, - { - "epoch": 0.62, - "learning_rate": 1.898160904306337e-05, - "loss": 2.3344, - "step": 355740 - }, - { - "epoch": 0.62, - "learning_rate": 1.898073710313654e-05, - "loss": 2.3169, - "step": 355750 - }, - { - "epoch": 0.62, - "learning_rate": 1.897986516320972e-05, - "loss": 2.3315, - "step": 355760 - }, - { - "epoch": 0.62, - "learning_rate": 1.897899322328289e-05, - "loss": 2.3356, - "step": 355770 - }, - { - "epoch": 0.62, - "learning_rate": 1.8978121283356063e-05, - "loss": 2.2778, - "step": 355780 - }, - { - "epoch": 0.62, - "learning_rate": 1.8977249343429233e-05, - "loss": 2.3119, - "step": 355790 - }, - { - "epoch": 0.62, - "learning_rate": 1.897637740350241e-05, - "loss": 2.3712, - "step": 355800 - }, - { - "epoch": 0.62, - "learning_rate": 1.897550546357558e-05, - "loss": 2.4084, - "step": 355810 - }, - { - "epoch": 0.62, - "learning_rate": 1.8974633523648755e-05, - "loss": 2.2802, - "step": 355820 - }, - { - "epoch": 0.62, - "learning_rate": 1.8973761583721932e-05, - "loss": 2.2729, - "step": 355830 - }, - { - "epoch": 0.62, - "learning_rate": 1.8972889643795102e-05, - "loss": 2.3629, - "step": 355840 - }, - { - "epoch": 0.62, - "learning_rate": 1.8972017703868276e-05, - "loss": 2.4029, - "step": 355850 - }, - { - "epoch": 0.62, - "learning_rate": 1.8971145763941446e-05, - "loss": 2.4025, - "step": 355860 - }, - { - "epoch": 0.62, - "learning_rate": 1.8970273824014623e-05, - "loss": 2.3074, - "step": 355870 - }, - { - "epoch": 0.62, - "learning_rate": 1.8969401884087794e-05, - "loss": 2.302, - "step": 355880 - }, - { - "epoch": 0.62, - "learning_rate": 1.8968529944160968e-05, - "loss": 2.2653, - "step": 355890 - }, - { - "epoch": 0.62, - "learning_rate": 1.896765800423414e-05, - "loss": 2.3767, - "step": 355900 - }, - { - "epoch": 0.62, - "learning_rate": 1.8966786064307315e-05, - "loss": 2.37, - "step": 355910 - }, - { - "epoch": 0.62, - "learning_rate": 1.896591412438049e-05, - "loss": 2.2612, - "step": 355920 - }, - { - "epoch": 0.62, - "learning_rate": 1.896504218445366e-05, - "loss": 2.3536, - "step": 355930 - }, - { - "epoch": 0.62, - "learning_rate": 1.8964170244526833e-05, - "loss": 2.2484, - "step": 355940 - }, - { - "epoch": 0.62, - "learning_rate": 1.8963298304600007e-05, - "loss": 2.4279, - "step": 355950 - }, - { - "epoch": 0.62, - "learning_rate": 1.896242636467318e-05, - "loss": 2.3137, - "step": 355960 - }, - { - "epoch": 0.62, - "learning_rate": 1.8961554424746354e-05, - "loss": 2.3399, - "step": 355970 - }, - { - "epoch": 0.62, - "learning_rate": 1.8960682484819528e-05, - "loss": 2.2973, - "step": 355980 - }, - { - "epoch": 0.62, - "learning_rate": 1.8959810544892702e-05, - "loss": 2.3255, - "step": 355990 - }, - { - "epoch": 0.62, - "learning_rate": 1.8958938604965872e-05, - "loss": 2.4456, - "step": 356000 - }, - { - "epoch": 0.62, - "learning_rate": 1.8958066665039046e-05, - "loss": 2.3713, - "step": 356010 - }, - { - "epoch": 0.62, - "learning_rate": 1.895719472511222e-05, - "loss": 2.2909, - "step": 356020 - }, - { - "epoch": 0.62, - "learning_rate": 1.8956322785185394e-05, - "loss": 2.2822, - "step": 356030 - }, - { - "epoch": 0.62, - "learning_rate": 1.8955450845258564e-05, - "loss": 2.3634, - "step": 356040 - }, - { - "epoch": 0.62, - "learning_rate": 1.8954578905331738e-05, - "loss": 2.3487, - "step": 356050 - }, - { - "epoch": 0.62, - "learning_rate": 1.8953706965404915e-05, - "loss": 2.3828, - "step": 356060 - }, - { - "epoch": 0.62, - "learning_rate": 1.8952835025478085e-05, - "loss": 2.2664, - "step": 356070 - }, - { - "epoch": 0.62, - "learning_rate": 1.895196308555126e-05, - "loss": 2.272, - "step": 356080 - }, - { - "epoch": 0.62, - "learning_rate": 1.8951091145624433e-05, - "loss": 2.291, - "step": 356090 - }, - { - "epoch": 0.62, - "learning_rate": 1.8950219205697607e-05, - "loss": 2.3184, - "step": 356100 - }, - { - "epoch": 0.62, - "learning_rate": 1.8949347265770777e-05, - "loss": 2.3427, - "step": 356110 - }, - { - "epoch": 0.62, - "learning_rate": 1.894847532584395e-05, - "loss": 2.2781, - "step": 356120 - }, - { - "epoch": 0.62, - "learning_rate": 1.8947603385917124e-05, - "loss": 2.3425, - "step": 356130 - }, - { - "epoch": 0.62, - "learning_rate": 1.8946731445990298e-05, - "loss": 2.29, - "step": 356140 - }, - { - "epoch": 0.62, - "learning_rate": 1.8945859506063472e-05, - "loss": 2.2962, - "step": 356150 - }, - { - "epoch": 0.62, - "learning_rate": 1.8944987566136642e-05, - "loss": 2.351, - "step": 356160 - }, - { - "epoch": 0.62, - "learning_rate": 1.894411562620982e-05, - "loss": 2.3372, - "step": 356170 - }, - { - "epoch": 0.62, - "learning_rate": 1.894324368628299e-05, - "loss": 2.2306, - "step": 356180 - }, - { - "epoch": 0.62, - "learning_rate": 1.8942371746356164e-05, - "loss": 2.3605, - "step": 356190 - }, - { - "epoch": 0.62, - "learning_rate": 1.8941499806429337e-05, - "loss": 2.292, - "step": 356200 - }, - { - "epoch": 0.62, - "learning_rate": 1.894062786650251e-05, - "loss": 2.3302, - "step": 356210 - }, - { - "epoch": 0.62, - "learning_rate": 1.8939755926575685e-05, - "loss": 2.2932, - "step": 356220 - }, - { - "epoch": 0.62, - "learning_rate": 1.8938883986648855e-05, - "loss": 2.2445, - "step": 356230 - }, - { - "epoch": 0.62, - "learning_rate": 1.8938012046722033e-05, - "loss": 2.3265, - "step": 356240 - }, - { - "epoch": 0.62, - "learning_rate": 1.8937140106795203e-05, - "loss": 2.2305, - "step": 356250 - }, - { - "epoch": 0.62, - "learning_rate": 1.8936268166868377e-05, - "loss": 2.4182, - "step": 356260 - }, - { - "epoch": 0.62, - "learning_rate": 1.8935396226941547e-05, - "loss": 2.3275, - "step": 356270 - }, - { - "epoch": 0.62, - "learning_rate": 1.8934524287014724e-05, - "loss": 2.3173, - "step": 356280 - }, - { - "epoch": 0.62, - "learning_rate": 1.8933652347087895e-05, - "loss": 2.3298, - "step": 356290 - }, - { - "epoch": 0.62, - "learning_rate": 1.893278040716107e-05, - "loss": 2.3564, - "step": 356300 - }, - { - "epoch": 0.62, - "learning_rate": 1.8931908467234242e-05, - "loss": 2.3315, - "step": 356310 - }, - { - "epoch": 0.62, - "learning_rate": 1.8931036527307416e-05, - "loss": 2.295, - "step": 356320 - }, - { - "epoch": 0.62, - "learning_rate": 1.893016458738059e-05, - "loss": 2.2873, - "step": 356330 - }, - { - "epoch": 0.62, - "learning_rate": 1.892929264745376e-05, - "loss": 2.3073, - "step": 356340 - }, - { - "epoch": 0.62, - "learning_rate": 1.8928420707526934e-05, - "loss": 2.2943, - "step": 356350 - }, - { - "epoch": 0.62, - "learning_rate": 1.8927548767600108e-05, - "loss": 2.3209, - "step": 356360 - }, - { - "epoch": 0.62, - "learning_rate": 1.892667682767328e-05, - "loss": 2.4581, - "step": 356370 - }, - { - "epoch": 0.62, - "learning_rate": 1.8925804887746455e-05, - "loss": 2.2646, - "step": 356380 - }, - { - "epoch": 0.62, - "learning_rate": 1.892493294781963e-05, - "loss": 2.4391, - "step": 356390 - }, - { - "epoch": 0.62, - "learning_rate": 1.8924061007892803e-05, - "loss": 2.3664, - "step": 356400 - }, - { - "epoch": 0.62, - "learning_rate": 1.8923189067965973e-05, - "loss": 2.2986, - "step": 356410 - }, - { - "epoch": 0.62, - "learning_rate": 1.8922317128039147e-05, - "loss": 2.2916, - "step": 356420 - }, - { - "epoch": 0.62, - "learning_rate": 1.892144518811232e-05, - "loss": 2.2781, - "step": 356430 - }, - { - "epoch": 0.62, - "learning_rate": 1.8920573248185494e-05, - "loss": 2.4411, - "step": 356440 - }, - { - "epoch": 0.62, - "learning_rate": 1.8919701308258668e-05, - "loss": 2.3222, - "step": 356450 - }, - { - "epoch": 0.62, - "learning_rate": 1.891882936833184e-05, - "loss": 2.3792, - "step": 356460 - }, - { - "epoch": 0.62, - "learning_rate": 1.8917957428405016e-05, - "loss": 2.2679, - "step": 356470 - }, - { - "epoch": 0.62, - "learning_rate": 1.8917085488478186e-05, - "loss": 2.3436, - "step": 356480 - }, - { - "epoch": 0.62, - "learning_rate": 1.891621354855136e-05, - "loss": 2.3273, - "step": 356490 - }, - { - "epoch": 0.62, - "learning_rate": 1.8915341608624534e-05, - "loss": 2.2842, - "step": 356500 - }, - { - "epoch": 0.62, - "learning_rate": 1.8914469668697707e-05, - "loss": 2.2644, - "step": 356510 - }, - { - "epoch": 0.62, - "learning_rate": 1.8913597728770878e-05, - "loss": 2.3222, - "step": 356520 - }, - { - "epoch": 0.62, - "learning_rate": 1.891272578884405e-05, - "loss": 2.3846, - "step": 356530 - }, - { - "epoch": 0.62, - "learning_rate": 1.8911853848917225e-05, - "loss": 2.298, - "step": 356540 - }, - { - "epoch": 0.62, - "learning_rate": 1.89109819089904e-05, - "loss": 2.2379, - "step": 356550 - }, - { - "epoch": 0.62, - "learning_rate": 1.8910109969063573e-05, - "loss": 2.3168, - "step": 356560 - }, - { - "epoch": 0.62, - "learning_rate": 1.8909238029136743e-05, - "loss": 2.3204, - "step": 356570 - }, - { - "epoch": 0.62, - "learning_rate": 1.890836608920992e-05, - "loss": 2.3687, - "step": 356580 - }, - { - "epoch": 0.62, - "learning_rate": 1.890749414928309e-05, - "loss": 2.2869, - "step": 356590 - }, - { - "epoch": 0.62, - "learning_rate": 1.8906622209356265e-05, - "loss": 2.3444, - "step": 356600 - }, - { - "epoch": 0.62, - "learning_rate": 1.890575026942944e-05, - "loss": 2.3335, - "step": 356610 - }, - { - "epoch": 0.62, - "learning_rate": 1.8904878329502612e-05, - "loss": 2.3575, - "step": 356620 - }, - { - "epoch": 0.62, - "learning_rate": 1.8904006389575786e-05, - "loss": 2.3868, - "step": 356630 - }, - { - "epoch": 0.62, - "learning_rate": 1.8903134449648956e-05, - "loss": 2.3724, - "step": 356640 - }, - { - "epoch": 0.62, - "learning_rate": 1.8902262509722133e-05, - "loss": 2.4142, - "step": 356650 - }, - { - "epoch": 0.62, - "learning_rate": 1.8901390569795304e-05, - "loss": 2.3533, - "step": 356660 - }, - { - "epoch": 0.62, - "learning_rate": 1.8900518629868478e-05, - "loss": 2.3666, - "step": 356670 - }, - { - "epoch": 0.62, - "learning_rate": 1.889964668994165e-05, - "loss": 2.2513, - "step": 356680 - }, - { - "epoch": 0.62, - "learning_rate": 1.8898774750014825e-05, - "loss": 2.3596, - "step": 356690 - }, - { - "epoch": 0.62, - "learning_rate": 1.8897902810088e-05, - "loss": 2.2842, - "step": 356700 - }, - { - "epoch": 0.62, - "learning_rate": 1.889703087016117e-05, - "loss": 2.3803, - "step": 356710 - }, - { - "epoch": 0.62, - "learning_rate": 1.8896158930234343e-05, - "loss": 2.2624, - "step": 356720 - }, - { - "epoch": 0.62, - "learning_rate": 1.8895286990307517e-05, - "loss": 2.2183, - "step": 356730 - }, - { - "epoch": 0.62, - "learning_rate": 1.889441505038069e-05, - "loss": 2.3214, - "step": 356740 - }, - { - "epoch": 0.62, - "learning_rate": 1.889354311045386e-05, - "loss": 2.3432, - "step": 356750 - }, - { - "epoch": 0.62, - "learning_rate": 1.8892671170527038e-05, - "loss": 2.4232, - "step": 356760 - }, - { - "epoch": 0.62, - "learning_rate": 1.889179923060021e-05, - "loss": 2.3673, - "step": 356770 - }, - { - "epoch": 0.62, - "learning_rate": 1.8890927290673382e-05, - "loss": 2.2613, - "step": 356780 - }, - { - "epoch": 0.62, - "learning_rate": 1.8890055350746556e-05, - "loss": 2.4343, - "step": 356790 - }, - { - "epoch": 0.62, - "learning_rate": 1.888918341081973e-05, - "loss": 2.4297, - "step": 356800 - }, - { - "epoch": 0.62, - "learning_rate": 1.8888311470892904e-05, - "loss": 2.3657, - "step": 356810 - }, - { - "epoch": 0.62, - "learning_rate": 1.8887439530966074e-05, - "loss": 2.2492, - "step": 356820 - }, - { - "epoch": 0.62, - "learning_rate": 1.8886567591039248e-05, - "loss": 2.4387, - "step": 356830 - }, - { - "epoch": 0.62, - "learning_rate": 1.888569565111242e-05, - "loss": 2.2978, - "step": 356840 - }, - { - "epoch": 0.62, - "learning_rate": 1.8884823711185595e-05, - "loss": 2.3477, - "step": 356850 - }, - { - "epoch": 0.62, - "learning_rate": 1.888395177125877e-05, - "loss": 2.4384, - "step": 356860 - }, - { - "epoch": 0.62, - "learning_rate": 1.888307983133194e-05, - "loss": 2.3278, - "step": 356870 - }, - { - "epoch": 0.62, - "learning_rate": 1.8882207891405117e-05, - "loss": 2.379, - "step": 356880 - }, - { - "epoch": 0.62, - "learning_rate": 1.8881335951478287e-05, - "loss": 2.4146, - "step": 356890 - }, - { - "epoch": 0.62, - "learning_rate": 1.888046401155146e-05, - "loss": 2.3258, - "step": 356900 - }, - { - "epoch": 0.62, - "learning_rate": 1.8879592071624634e-05, - "loss": 2.4013, - "step": 356910 - }, - { - "epoch": 0.62, - "learning_rate": 1.8878720131697808e-05, - "loss": 2.3681, - "step": 356920 - }, - { - "epoch": 0.62, - "learning_rate": 1.8877848191770982e-05, - "loss": 2.4141, - "step": 356930 - }, - { - "epoch": 0.62, - "learning_rate": 1.8876976251844152e-05, - "loss": 2.3257, - "step": 356940 - }, - { - "epoch": 0.62, - "learning_rate": 1.887610431191733e-05, - "loss": 2.3211, - "step": 356950 - }, - { - "epoch": 0.62, - "learning_rate": 1.88752323719905e-05, - "loss": 2.2529, - "step": 356960 - }, - { - "epoch": 0.62, - "learning_rate": 1.8874360432063674e-05, - "loss": 2.3409, - "step": 356970 - }, - { - "epoch": 0.62, - "learning_rate": 1.8873488492136844e-05, - "loss": 2.244, - "step": 356980 - }, - { - "epoch": 0.62, - "learning_rate": 1.887261655221002e-05, - "loss": 2.2589, - "step": 356990 - }, - { - "epoch": 0.62, - "learning_rate": 1.887174461228319e-05, - "loss": 2.2835, - "step": 357000 - }, - { - "epoch": 0.62, - "learning_rate": 1.8870872672356365e-05, - "loss": 2.42, - "step": 357010 - }, - { - "epoch": 0.62, - "learning_rate": 1.887000073242954e-05, - "loss": 2.3533, - "step": 357020 - }, - { - "epoch": 0.62, - "learning_rate": 1.8869128792502713e-05, - "loss": 2.3023, - "step": 357030 - }, - { - "epoch": 0.62, - "learning_rate": 1.8868256852575887e-05, - "loss": 2.2609, - "step": 357040 - }, - { - "epoch": 0.62, - "learning_rate": 1.8867384912649057e-05, - "loss": 2.3023, - "step": 357050 - }, - { - "epoch": 0.62, - "learning_rate": 1.8866512972722234e-05, - "loss": 2.3084, - "step": 357060 - }, - { - "epoch": 0.62, - "learning_rate": 1.8865641032795405e-05, - "loss": 2.4131, - "step": 357070 - }, - { - "epoch": 0.62, - "learning_rate": 1.886476909286858e-05, - "loss": 2.3842, - "step": 357080 - }, - { - "epoch": 0.62, - "learning_rate": 1.8863897152941752e-05, - "loss": 2.4207, - "step": 357090 - }, - { - "epoch": 0.62, - "learning_rate": 1.8863025213014926e-05, - "loss": 2.3816, - "step": 357100 - }, - { - "epoch": 0.62, - "learning_rate": 1.88621532730881e-05, - "loss": 2.3296, - "step": 357110 - }, - { - "epoch": 0.62, - "learning_rate": 1.886128133316127e-05, - "loss": 2.3944, - "step": 357120 - }, - { - "epoch": 0.62, - "learning_rate": 1.8860409393234444e-05, - "loss": 2.2914, - "step": 357130 - }, - { - "epoch": 0.62, - "learning_rate": 1.8859537453307618e-05, - "loss": 2.2479, - "step": 357140 - }, - { - "epoch": 0.62, - "learning_rate": 1.885866551338079e-05, - "loss": 2.3173, - "step": 357150 - }, - { - "epoch": 0.62, - "learning_rate": 1.8857793573453962e-05, - "loss": 2.3015, - "step": 357160 - }, - { - "epoch": 0.62, - "learning_rate": 1.885692163352714e-05, - "loss": 2.3053, - "step": 357170 - }, - { - "epoch": 0.62, - "learning_rate": 1.8856049693600313e-05, - "loss": 2.2867, - "step": 357180 - }, - { - "epoch": 0.62, - "learning_rate": 1.8855177753673483e-05, - "loss": 2.3839, - "step": 357190 - }, - { - "epoch": 0.62, - "learning_rate": 1.8854305813746657e-05, - "loss": 2.2292, - "step": 357200 - }, - { - "epoch": 0.62, - "learning_rate": 1.885343387381983e-05, - "loss": 2.239, - "step": 357210 - }, - { - "epoch": 0.62, - "learning_rate": 1.8852561933893004e-05, - "loss": 2.2211, - "step": 357220 - }, - { - "epoch": 0.62, - "learning_rate": 1.8851689993966175e-05, - "loss": 2.4452, - "step": 357230 - }, - { - "epoch": 0.62, - "learning_rate": 1.885081805403935e-05, - "loss": 2.2723, - "step": 357240 - }, - { - "epoch": 0.62, - "learning_rate": 1.8849946114112522e-05, - "loss": 2.2954, - "step": 357250 - }, - { - "epoch": 0.62, - "learning_rate": 1.8849074174185696e-05, - "loss": 2.3629, - "step": 357260 - }, - { - "epoch": 0.62, - "learning_rate": 1.884820223425887e-05, - "loss": 2.2766, - "step": 357270 - }, - { - "epoch": 0.62, - "learning_rate": 1.884733029433204e-05, - "loss": 2.3016, - "step": 357280 - }, - { - "epoch": 0.62, - "learning_rate": 1.8846458354405217e-05, - "loss": 2.2859, - "step": 357290 - }, - { - "epoch": 0.62, - "learning_rate": 1.8845586414478388e-05, - "loss": 2.2904, - "step": 357300 - }, - { - "epoch": 0.62, - "learning_rate": 1.884471447455156e-05, - "loss": 2.33, - "step": 357310 - }, - { - "epoch": 0.62, - "learning_rate": 1.8843842534624735e-05, - "loss": 2.3368, - "step": 357320 - }, - { - "epoch": 0.62, - "learning_rate": 1.884297059469791e-05, - "loss": 2.3611, - "step": 357330 - }, - { - "epoch": 0.62, - "learning_rate": 1.8842098654771083e-05, - "loss": 2.2721, - "step": 357340 - }, - { - "epoch": 0.62, - "learning_rate": 1.8841226714844253e-05, - "loss": 2.3709, - "step": 357350 - }, - { - "epoch": 0.62, - "learning_rate": 1.884035477491743e-05, - "loss": 2.4549, - "step": 357360 - }, - { - "epoch": 0.62, - "learning_rate": 1.88394828349906e-05, - "loss": 2.2903, - "step": 357370 - }, - { - "epoch": 0.62, - "learning_rate": 1.8838610895063775e-05, - "loss": 2.2842, - "step": 357380 - }, - { - "epoch": 0.62, - "learning_rate": 1.8837738955136945e-05, - "loss": 2.3938, - "step": 357390 - }, - { - "epoch": 0.62, - "learning_rate": 1.8836867015210122e-05, - "loss": 2.3038, - "step": 357400 - }, - { - "epoch": 0.62, - "learning_rate": 1.8835995075283296e-05, - "loss": 2.244, - "step": 357410 - }, - { - "epoch": 0.62, - "learning_rate": 1.8835123135356466e-05, - "loss": 2.3486, - "step": 357420 - }, - { - "epoch": 0.62, - "learning_rate": 1.8834251195429643e-05, - "loss": 2.4367, - "step": 357430 - }, - { - "epoch": 0.62, - "learning_rate": 1.8833379255502814e-05, - "loss": 2.315, - "step": 357440 - }, - { - "epoch": 0.62, - "learning_rate": 1.8832507315575988e-05, - "loss": 2.2748, - "step": 357450 - }, - { - "epoch": 0.62, - "learning_rate": 1.8831635375649158e-05, - "loss": 2.3412, - "step": 357460 - }, - { - "epoch": 0.62, - "learning_rate": 1.8830763435722335e-05, - "loss": 2.2601, - "step": 357470 - }, - { - "epoch": 0.62, - "learning_rate": 1.8829891495795505e-05, - "loss": 2.3776, - "step": 357480 - }, - { - "epoch": 0.62, - "learning_rate": 1.882901955586868e-05, - "loss": 2.1596, - "step": 357490 - }, - { - "epoch": 0.62, - "learning_rate": 1.8828147615941853e-05, - "loss": 2.2536, - "step": 357500 - }, - { - "epoch": 0.62, - "learning_rate": 1.8827275676015027e-05, - "loss": 2.2292, - "step": 357510 - }, - { - "epoch": 0.62, - "learning_rate": 1.88264037360882e-05, - "loss": 2.3426, - "step": 357520 - }, - { - "epoch": 0.62, - "learning_rate": 1.882553179616137e-05, - "loss": 2.1771, - "step": 357530 - }, - { - "epoch": 0.62, - "learning_rate": 1.8824659856234545e-05, - "loss": 2.4109, - "step": 357540 - }, - { - "epoch": 0.62, - "learning_rate": 1.882378791630772e-05, - "loss": 2.2637, - "step": 357550 - }, - { - "epoch": 0.62, - "learning_rate": 1.8822915976380892e-05, - "loss": 2.3279, - "step": 357560 - }, - { - "epoch": 0.62, - "learning_rate": 1.8822044036454066e-05, - "loss": 2.4886, - "step": 357570 - }, - { - "epoch": 0.62, - "learning_rate": 1.882117209652724e-05, - "loss": 2.2749, - "step": 357580 - }, - { - "epoch": 0.62, - "learning_rate": 1.8820300156600414e-05, - "loss": 2.3402, - "step": 357590 - }, - { - "epoch": 0.62, - "learning_rate": 1.8819428216673584e-05, - "loss": 2.3482, - "step": 357600 - }, - { - "epoch": 0.62, - "learning_rate": 1.8818556276746758e-05, - "loss": 2.3285, - "step": 357610 - }, - { - "epoch": 0.62, - "learning_rate": 1.881768433681993e-05, - "loss": 2.3246, - "step": 357620 - }, - { - "epoch": 0.62, - "learning_rate": 1.8816812396893105e-05, - "loss": 2.3891, - "step": 357630 - }, - { - "epoch": 0.62, - "learning_rate": 1.8815940456966276e-05, - "loss": 2.2494, - "step": 357640 - }, - { - "epoch": 0.62, - "learning_rate": 1.881506851703945e-05, - "loss": 2.2967, - "step": 357650 - }, - { - "epoch": 0.62, - "learning_rate": 1.8814196577112627e-05, - "loss": 2.3517, - "step": 357660 - }, - { - "epoch": 0.62, - "learning_rate": 1.8813324637185797e-05, - "loss": 2.346, - "step": 357670 - }, - { - "epoch": 0.62, - "learning_rate": 1.881245269725897e-05, - "loss": 2.2734, - "step": 357680 - }, - { - "epoch": 0.62, - "learning_rate": 1.8811580757332144e-05, - "loss": 2.275, - "step": 357690 - }, - { - "epoch": 0.62, - "learning_rate": 1.8810708817405318e-05, - "loss": 2.3966, - "step": 357700 - }, - { - "epoch": 0.62, - "learning_rate": 1.880983687747849e-05, - "loss": 2.2174, - "step": 357710 - }, - { - "epoch": 0.62, - "learning_rate": 1.8808964937551662e-05, - "loss": 2.2751, - "step": 357720 - }, - { - "epoch": 0.62, - "learning_rate": 1.8808092997624836e-05, - "loss": 2.1238, - "step": 357730 - }, - { - "epoch": 0.62, - "learning_rate": 1.880722105769801e-05, - "loss": 2.419, - "step": 357740 - }, - { - "epoch": 0.62, - "learning_rate": 1.8806349117771184e-05, - "loss": 2.4245, - "step": 357750 - }, - { - "epoch": 0.62, - "learning_rate": 1.8805477177844354e-05, - "loss": 2.3665, - "step": 357760 - }, - { - "epoch": 0.62, - "learning_rate": 1.880460523791753e-05, - "loss": 2.3478, - "step": 357770 - }, - { - "epoch": 0.62, - "learning_rate": 1.88037332979907e-05, - "loss": 2.3016, - "step": 357780 - }, - { - "epoch": 0.62, - "learning_rate": 1.8802861358063875e-05, - "loss": 2.3211, - "step": 357790 - }, - { - "epoch": 0.62, - "learning_rate": 1.880198941813705e-05, - "loss": 2.3782, - "step": 357800 - }, - { - "epoch": 0.62, - "learning_rate": 1.8801117478210223e-05, - "loss": 2.4556, - "step": 357810 - }, - { - "epoch": 0.62, - "learning_rate": 1.8800245538283397e-05, - "loss": 2.3891, - "step": 357820 - }, - { - "epoch": 0.62, - "learning_rate": 1.8799373598356567e-05, - "loss": 2.2876, - "step": 357830 - }, - { - "epoch": 0.62, - "learning_rate": 1.8798501658429744e-05, - "loss": 2.4269, - "step": 357840 - }, - { - "epoch": 0.62, - "learning_rate": 1.8797629718502915e-05, - "loss": 2.389, - "step": 357850 - }, - { - "epoch": 0.62, - "learning_rate": 1.879675777857609e-05, - "loss": 2.2032, - "step": 357860 - }, - { - "epoch": 0.62, - "learning_rate": 1.879588583864926e-05, - "loss": 2.3393, - "step": 357870 - }, - { - "epoch": 0.62, - "learning_rate": 1.8795013898722436e-05, - "loss": 2.3608, - "step": 357880 - }, - { - "epoch": 0.62, - "learning_rate": 1.8794141958795606e-05, - "loss": 2.4567, - "step": 357890 - }, - { - "epoch": 0.62, - "learning_rate": 1.879327001886878e-05, - "loss": 2.298, - "step": 357900 - }, - { - "epoch": 0.62, - "learning_rate": 1.8792398078941954e-05, - "loss": 2.2986, - "step": 357910 - }, - { - "epoch": 0.62, - "learning_rate": 1.8791526139015128e-05, - "loss": 2.2639, - "step": 357920 - }, - { - "epoch": 0.62, - "learning_rate": 1.87906541990883e-05, - "loss": 2.2596, - "step": 357930 - }, - { - "epoch": 0.62, - "learning_rate": 1.8789782259161472e-05, - "loss": 2.2381, - "step": 357940 - }, - { - "epoch": 0.62, - "learning_rate": 1.878891031923465e-05, - "loss": 2.273, - "step": 357950 - }, - { - "epoch": 0.62, - "learning_rate": 1.878803837930782e-05, - "loss": 2.2738, - "step": 357960 - }, - { - "epoch": 0.62, - "learning_rate": 1.8787166439380993e-05, - "loss": 2.3813, - "step": 357970 - }, - { - "epoch": 0.62, - "learning_rate": 1.8786294499454167e-05, - "loss": 2.3407, - "step": 357980 - }, - { - "epoch": 0.62, - "learning_rate": 1.878542255952734e-05, - "loss": 2.3659, - "step": 357990 - }, - { - "epoch": 0.62, - "learning_rate": 1.8784550619600514e-05, - "loss": 2.3094, - "step": 358000 - }, - { - "epoch": 0.62, - "learning_rate": 1.8783678679673685e-05, - "loss": 2.3836, - "step": 358010 - }, - { - "epoch": 0.62, - "learning_rate": 1.878280673974686e-05, - "loss": 2.3122, - "step": 358020 - }, - { - "epoch": 0.62, - "learning_rate": 1.8781934799820032e-05, - "loss": 2.3104, - "step": 358030 - }, - { - "epoch": 0.62, - "learning_rate": 1.8781062859893206e-05, - "loss": 2.4044, - "step": 358040 - }, - { - "epoch": 0.62, - "learning_rate": 1.878019091996638e-05, - "loss": 2.3289, - "step": 358050 - }, - { - "epoch": 0.62, - "learning_rate": 1.877931898003955e-05, - "loss": 2.3406, - "step": 358060 - }, - { - "epoch": 0.62, - "learning_rate": 1.8778447040112727e-05, - "loss": 2.2568, - "step": 358070 - }, - { - "epoch": 0.62, - "learning_rate": 1.8777575100185898e-05, - "loss": 2.3536, - "step": 358080 - }, - { - "epoch": 0.62, - "learning_rate": 1.877670316025907e-05, - "loss": 2.2192, - "step": 358090 - }, - { - "epoch": 0.62, - "learning_rate": 1.8775831220332245e-05, - "loss": 2.3717, - "step": 358100 - }, - { - "epoch": 0.62, - "learning_rate": 1.877495928040542e-05, - "loss": 2.3312, - "step": 358110 - }, - { - "epoch": 0.62, - "learning_rate": 1.877408734047859e-05, - "loss": 2.2982, - "step": 358120 - }, - { - "epoch": 0.62, - "learning_rate": 1.8773215400551763e-05, - "loss": 2.4005, - "step": 358130 - }, - { - "epoch": 0.62, - "learning_rate": 1.877234346062494e-05, - "loss": 2.3646, - "step": 358140 - }, - { - "epoch": 0.62, - "learning_rate": 1.877147152069811e-05, - "loss": 2.2479, - "step": 358150 - }, - { - "epoch": 0.62, - "learning_rate": 1.8770599580771285e-05, - "loss": 2.3106, - "step": 358160 - }, - { - "epoch": 0.62, - "learning_rate": 1.8769727640844455e-05, - "loss": 2.2372, - "step": 358170 - }, - { - "epoch": 0.62, - "learning_rate": 1.8768855700917632e-05, - "loss": 2.3273, - "step": 358180 - }, - { - "epoch": 0.62, - "learning_rate": 1.8767983760990802e-05, - "loss": 2.2882, - "step": 358190 - }, - { - "epoch": 0.62, - "learning_rate": 1.8767111821063976e-05, - "loss": 2.4046, - "step": 358200 - }, - { - "epoch": 0.62, - "learning_rate": 1.876623988113715e-05, - "loss": 2.3089, - "step": 358210 - }, - { - "epoch": 0.62, - "learning_rate": 1.8765367941210324e-05, - "loss": 2.3903, - "step": 358220 - }, - { - "epoch": 0.62, - "learning_rate": 1.8764496001283498e-05, - "loss": 2.2897, - "step": 358230 - }, - { - "epoch": 0.62, - "learning_rate": 1.8763624061356668e-05, - "loss": 2.3841, - "step": 358240 - }, - { - "epoch": 0.62, - "learning_rate": 1.8762752121429845e-05, - "loss": 2.3597, - "step": 358250 - }, - { - "epoch": 0.62, - "learning_rate": 1.8761880181503015e-05, - "loss": 2.2177, - "step": 358260 - }, - { - "epoch": 0.62, - "learning_rate": 1.876100824157619e-05, - "loss": 2.4074, - "step": 358270 - }, - { - "epoch": 0.62, - "learning_rate": 1.8760136301649363e-05, - "loss": 2.4473, - "step": 358280 - }, - { - "epoch": 0.62, - "learning_rate": 1.8759264361722537e-05, - "loss": 2.3493, - "step": 358290 - }, - { - "epoch": 0.62, - "learning_rate": 1.875839242179571e-05, - "loss": 2.2754, - "step": 358300 - }, - { - "epoch": 0.62, - "learning_rate": 1.875752048186888e-05, - "loss": 2.3765, - "step": 358310 - }, - { - "epoch": 0.62, - "learning_rate": 1.8756648541942055e-05, - "loss": 2.2649, - "step": 358320 - }, - { - "epoch": 0.62, - "learning_rate": 1.875577660201523e-05, - "loss": 2.363, - "step": 358330 - }, - { - "epoch": 0.62, - "learning_rate": 1.8754904662088402e-05, - "loss": 2.2633, - "step": 358340 - }, - { - "epoch": 0.62, - "learning_rate": 1.8754032722161573e-05, - "loss": 2.3136, - "step": 358350 - }, - { - "epoch": 0.62, - "learning_rate": 1.875316078223475e-05, - "loss": 2.2087, - "step": 358360 - }, - { - "epoch": 0.62, - "learning_rate": 1.875228884230792e-05, - "loss": 2.3397, - "step": 358370 - }, - { - "epoch": 0.62, - "learning_rate": 1.8751416902381094e-05, - "loss": 2.2177, - "step": 358380 - }, - { - "epoch": 0.62, - "learning_rate": 1.8750544962454268e-05, - "loss": 2.3647, - "step": 358390 - }, - { - "epoch": 0.63, - "learning_rate": 1.874967302252744e-05, - "loss": 2.3245, - "step": 358400 - }, - { - "epoch": 0.63, - "learning_rate": 1.8748801082600615e-05, - "loss": 2.4044, - "step": 358410 - }, - { - "epoch": 0.63, - "learning_rate": 1.8747929142673786e-05, - "loss": 2.4123, - "step": 358420 - }, - { - "epoch": 0.63, - "learning_rate": 1.874705720274696e-05, - "loss": 2.3928, - "step": 358430 - }, - { - "epoch": 0.63, - "learning_rate": 1.8746185262820133e-05, - "loss": 2.2162, - "step": 358440 - }, - { - "epoch": 0.63, - "learning_rate": 1.8745313322893307e-05, - "loss": 2.26, - "step": 358450 - }, - { - "epoch": 0.63, - "learning_rate": 1.874444138296648e-05, - "loss": 2.3233, - "step": 358460 - }, - { - "epoch": 0.63, - "learning_rate": 1.874356944303965e-05, - "loss": 2.349, - "step": 358470 - }, - { - "epoch": 0.63, - "learning_rate": 1.8742697503112828e-05, - "loss": 2.3334, - "step": 358480 - }, - { - "epoch": 0.63, - "learning_rate": 1.8741825563186e-05, - "loss": 2.3606, - "step": 358490 - }, - { - "epoch": 0.63, - "learning_rate": 1.8740953623259172e-05, - "loss": 2.375, - "step": 358500 - }, - { - "epoch": 0.63, - "learning_rate": 1.8740081683332346e-05, - "loss": 2.2859, - "step": 358510 - }, - { - "epoch": 0.63, - "learning_rate": 1.873920974340552e-05, - "loss": 2.3198, - "step": 358520 - }, - { - "epoch": 0.63, - "learning_rate": 1.8738337803478694e-05, - "loss": 2.3127, - "step": 358530 - }, - { - "epoch": 0.63, - "learning_rate": 1.8737465863551864e-05, - "loss": 2.4314, - "step": 358540 - }, - { - "epoch": 0.63, - "learning_rate": 1.873659392362504e-05, - "loss": 2.3237, - "step": 358550 - }, - { - "epoch": 0.63, - "learning_rate": 1.873572198369821e-05, - "loss": 2.3599, - "step": 358560 - }, - { - "epoch": 0.63, - "learning_rate": 1.8734850043771385e-05, - "loss": 2.2954, - "step": 358570 - }, - { - "epoch": 0.63, - "learning_rate": 1.8733978103844556e-05, - "loss": 2.2484, - "step": 358580 - }, - { - "epoch": 0.63, - "learning_rate": 1.8733106163917733e-05, - "loss": 2.3265, - "step": 358590 - }, - { - "epoch": 0.63, - "learning_rate": 1.8732234223990903e-05, - "loss": 2.2142, - "step": 358600 - }, - { - "epoch": 0.63, - "learning_rate": 1.8731362284064077e-05, - "loss": 2.3286, - "step": 358610 - }, - { - "epoch": 0.63, - "learning_rate": 1.8730490344137254e-05, - "loss": 2.4028, - "step": 358620 - }, - { - "epoch": 0.63, - "learning_rate": 1.8729618404210425e-05, - "loss": 2.2722, - "step": 358630 - }, - { - "epoch": 0.63, - "learning_rate": 1.87287464642836e-05, - "loss": 2.2914, - "step": 358640 - }, - { - "epoch": 0.63, - "learning_rate": 1.872787452435677e-05, - "loss": 2.3324, - "step": 358650 - }, - { - "epoch": 0.63, - "learning_rate": 1.8727002584429946e-05, - "loss": 2.3589, - "step": 358660 - }, - { - "epoch": 0.63, - "learning_rate": 1.8726130644503116e-05, - "loss": 2.3272, - "step": 358670 - }, - { - "epoch": 0.63, - "learning_rate": 1.872525870457629e-05, - "loss": 2.2798, - "step": 358680 - }, - { - "epoch": 0.63, - "learning_rate": 1.8724386764649464e-05, - "loss": 2.3121, - "step": 358690 - }, - { - "epoch": 0.63, - "learning_rate": 1.8723514824722638e-05, - "loss": 2.3859, - "step": 358700 - }, - { - "epoch": 0.63, - "learning_rate": 1.872264288479581e-05, - "loss": 2.1834, - "step": 358710 - }, - { - "epoch": 0.63, - "learning_rate": 1.8721770944868982e-05, - "loss": 2.4517, - "step": 358720 - }, - { - "epoch": 0.63, - "learning_rate": 1.8720899004942156e-05, - "loss": 2.3427, - "step": 358730 - }, - { - "epoch": 0.63, - "learning_rate": 1.872002706501533e-05, - "loss": 2.3583, - "step": 358740 - }, - { - "epoch": 0.63, - "learning_rate": 1.8719155125088503e-05, - "loss": 2.3255, - "step": 358750 - }, - { - "epoch": 0.63, - "learning_rate": 1.8718283185161677e-05, - "loss": 2.2382, - "step": 358760 - }, - { - "epoch": 0.63, - "learning_rate": 1.871741124523485e-05, - "loss": 2.2967, - "step": 358770 - }, - { - "epoch": 0.63, - "learning_rate": 1.8716539305308024e-05, - "loss": 2.3961, - "step": 358780 - }, - { - "epoch": 0.63, - "learning_rate": 1.8715667365381195e-05, - "loss": 2.3348, - "step": 358790 - }, - { - "epoch": 0.63, - "learning_rate": 1.871479542545437e-05, - "loss": 2.3484, - "step": 358800 - }, - { - "epoch": 0.63, - "learning_rate": 1.8713923485527542e-05, - "loss": 2.2435, - "step": 358810 - }, - { - "epoch": 0.63, - "learning_rate": 1.8713051545600716e-05, - "loss": 2.2959, - "step": 358820 - }, - { - "epoch": 0.63, - "learning_rate": 1.8712179605673886e-05, - "loss": 2.3668, - "step": 358830 - }, - { - "epoch": 0.63, - "learning_rate": 1.871130766574706e-05, - "loss": 2.3754, - "step": 358840 - }, - { - "epoch": 0.63, - "learning_rate": 1.8710435725820234e-05, - "loss": 2.3233, - "step": 358850 - }, - { - "epoch": 0.63, - "learning_rate": 1.8709563785893408e-05, - "loss": 2.3475, - "step": 358860 - }, - { - "epoch": 0.63, - "learning_rate": 1.870869184596658e-05, - "loss": 2.1582, - "step": 358870 - }, - { - "epoch": 0.63, - "learning_rate": 1.8707819906039755e-05, - "loss": 2.3534, - "step": 358880 - }, - { - "epoch": 0.63, - "learning_rate": 1.870694796611293e-05, - "loss": 2.3415, - "step": 358890 - }, - { - "epoch": 0.63, - "learning_rate": 1.87060760261861e-05, - "loss": 2.3605, - "step": 358900 - }, - { - "epoch": 0.63, - "learning_rate": 1.8705204086259273e-05, - "loss": 2.2862, - "step": 358910 - }, - { - "epoch": 0.63, - "learning_rate": 1.8704332146332447e-05, - "loss": 2.3182, - "step": 358920 - }, - { - "epoch": 0.63, - "learning_rate": 1.870346020640562e-05, - "loss": 2.3187, - "step": 358930 - }, - { - "epoch": 0.63, - "learning_rate": 1.8702588266478795e-05, - "loss": 2.2725, - "step": 358940 - }, - { - "epoch": 0.63, - "learning_rate": 1.8701716326551965e-05, - "loss": 2.3321, - "step": 358950 - }, - { - "epoch": 0.63, - "learning_rate": 1.8700844386625142e-05, - "loss": 2.2254, - "step": 358960 - }, - { - "epoch": 0.63, - "learning_rate": 1.8699972446698312e-05, - "loss": 2.3909, - "step": 358970 - }, - { - "epoch": 0.63, - "learning_rate": 1.8699100506771486e-05, - "loss": 2.3918, - "step": 358980 - }, - { - "epoch": 0.63, - "learning_rate": 1.8698228566844657e-05, - "loss": 2.2291, - "step": 358990 - }, - { - "epoch": 0.63, - "learning_rate": 1.8697356626917834e-05, - "loss": 2.3377, - "step": 359000 - }, - { - "epoch": 0.63, - "learning_rate": 1.8696484686991008e-05, - "loss": 2.3056, - "step": 359010 - }, - { - "epoch": 0.63, - "learning_rate": 1.8695612747064178e-05, - "loss": 2.3638, - "step": 359020 - }, - { - "epoch": 0.63, - "learning_rate": 1.8694740807137355e-05, - "loss": 2.4012, - "step": 359030 - }, - { - "epoch": 0.63, - "learning_rate": 1.8693868867210525e-05, - "loss": 2.3321, - "step": 359040 - }, - { - "epoch": 0.63, - "learning_rate": 1.86929969272837e-05, - "loss": 2.3501, - "step": 359050 - }, - { - "epoch": 0.63, - "learning_rate": 1.869212498735687e-05, - "loss": 2.3701, - "step": 359060 - }, - { - "epoch": 0.63, - "learning_rate": 1.8691253047430047e-05, - "loss": 2.2844, - "step": 359070 - }, - { - "epoch": 0.63, - "learning_rate": 1.8690381107503217e-05, - "loss": 2.2729, - "step": 359080 - }, - { - "epoch": 0.63, - "learning_rate": 1.868950916757639e-05, - "loss": 2.3677, - "step": 359090 - }, - { - "epoch": 0.63, - "learning_rate": 1.8688637227649565e-05, - "loss": 2.3185, - "step": 359100 - }, - { - "epoch": 0.63, - "learning_rate": 1.868776528772274e-05, - "loss": 2.3237, - "step": 359110 - }, - { - "epoch": 0.63, - "learning_rate": 1.8686893347795912e-05, - "loss": 2.1986, - "step": 359120 - }, - { - "epoch": 0.63, - "learning_rate": 1.8686021407869083e-05, - "loss": 2.3544, - "step": 359130 - }, - { - "epoch": 0.63, - "learning_rate": 1.8685149467942256e-05, - "loss": 2.3469, - "step": 359140 - }, - { - "epoch": 0.63, - "learning_rate": 1.868427752801543e-05, - "loss": 2.2607, - "step": 359150 - }, - { - "epoch": 0.63, - "learning_rate": 1.8683405588088604e-05, - "loss": 2.3729, - "step": 359160 - }, - { - "epoch": 0.63, - "learning_rate": 1.8682533648161778e-05, - "loss": 2.342, - "step": 359170 - }, - { - "epoch": 0.63, - "learning_rate": 1.868166170823495e-05, - "loss": 2.3696, - "step": 359180 - }, - { - "epoch": 0.63, - "learning_rate": 1.8680789768308125e-05, - "loss": 2.2784, - "step": 359190 - }, - { - "epoch": 0.63, - "learning_rate": 1.8679917828381296e-05, - "loss": 2.3106, - "step": 359200 - }, - { - "epoch": 0.63, - "learning_rate": 1.867904588845447e-05, - "loss": 2.3327, - "step": 359210 - }, - { - "epoch": 0.63, - "learning_rate": 1.8678173948527643e-05, - "loss": 2.261, - "step": 359220 - }, - { - "epoch": 0.63, - "learning_rate": 1.8677302008600817e-05, - "loss": 2.1892, - "step": 359230 - }, - { - "epoch": 0.63, - "learning_rate": 1.867643006867399e-05, - "loss": 2.3241, - "step": 359240 - }, - { - "epoch": 0.63, - "learning_rate": 1.867555812874716e-05, - "loss": 2.2214, - "step": 359250 - }, - { - "epoch": 0.63, - "learning_rate": 1.8674686188820338e-05, - "loss": 2.2059, - "step": 359260 - }, - { - "epoch": 0.63, - "learning_rate": 1.867381424889351e-05, - "loss": 2.3417, - "step": 359270 - }, - { - "epoch": 0.63, - "learning_rate": 1.8672942308966682e-05, - "loss": 2.2739, - "step": 359280 - }, - { - "epoch": 0.63, - "learning_rate": 1.8672070369039856e-05, - "loss": 2.3435, - "step": 359290 - }, - { - "epoch": 0.63, - "learning_rate": 1.867119842911303e-05, - "loss": 2.3945, - "step": 359300 - }, - { - "epoch": 0.63, - "learning_rate": 1.86703264891862e-05, - "loss": 2.4295, - "step": 359310 - }, - { - "epoch": 0.63, - "learning_rate": 1.8669454549259374e-05, - "loss": 2.3564, - "step": 359320 - }, - { - "epoch": 0.63, - "learning_rate": 1.8668582609332548e-05, - "loss": 2.3998, - "step": 359330 - }, - { - "epoch": 0.63, - "learning_rate": 1.866771066940572e-05, - "loss": 2.3034, - "step": 359340 - }, - { - "epoch": 0.63, - "learning_rate": 1.8666838729478895e-05, - "loss": 2.3517, - "step": 359350 - }, - { - "epoch": 0.63, - "learning_rate": 1.8665966789552066e-05, - "loss": 2.3221, - "step": 359360 - }, - { - "epoch": 0.63, - "learning_rate": 1.8665094849625243e-05, - "loss": 2.3625, - "step": 359370 - }, - { - "epoch": 0.63, - "learning_rate": 1.8664222909698413e-05, - "loss": 2.4176, - "step": 359380 - }, - { - "epoch": 0.63, - "learning_rate": 1.8663350969771587e-05, - "loss": 2.2456, - "step": 359390 - }, - { - "epoch": 0.63, - "learning_rate": 1.866247902984476e-05, - "loss": 2.4152, - "step": 359400 - }, - { - "epoch": 0.63, - "learning_rate": 1.8661607089917935e-05, - "loss": 2.3181, - "step": 359410 - }, - { - "epoch": 0.63, - "learning_rate": 1.866073514999111e-05, - "loss": 2.3255, - "step": 359420 - }, - { - "epoch": 0.63, - "learning_rate": 1.865986321006428e-05, - "loss": 2.2602, - "step": 359430 - }, - { - "epoch": 0.63, - "learning_rate": 1.8658991270137456e-05, - "loss": 2.3051, - "step": 359440 - }, - { - "epoch": 0.63, - "learning_rate": 1.8658119330210626e-05, - "loss": 2.2182, - "step": 359450 - }, - { - "epoch": 0.63, - "learning_rate": 1.86572473902838e-05, - "loss": 2.3996, - "step": 359460 - }, - { - "epoch": 0.63, - "learning_rate": 1.865637545035697e-05, - "loss": 2.2939, - "step": 359470 - }, - { - "epoch": 0.63, - "learning_rate": 1.8655503510430148e-05, - "loss": 2.3595, - "step": 359480 - }, - { - "epoch": 0.63, - "learning_rate": 1.865463157050332e-05, - "loss": 2.2625, - "step": 359490 - }, - { - "epoch": 0.63, - "learning_rate": 1.8653759630576492e-05, - "loss": 2.375, - "step": 359500 - }, - { - "epoch": 0.63, - "learning_rate": 1.8652887690649666e-05, - "loss": 2.3997, - "step": 359510 - }, - { - "epoch": 0.63, - "learning_rate": 1.865201575072284e-05, - "loss": 2.4011, - "step": 359520 - }, - { - "epoch": 0.63, - "learning_rate": 1.8651143810796013e-05, - "loss": 2.3425, - "step": 359530 - }, - { - "epoch": 0.63, - "learning_rate": 1.8650271870869183e-05, - "loss": 2.3847, - "step": 359540 - }, - { - "epoch": 0.63, - "learning_rate": 1.864939993094236e-05, - "loss": 2.3446, - "step": 359550 - }, - { - "epoch": 0.63, - "learning_rate": 1.864852799101553e-05, - "loss": 2.2814, - "step": 359560 - }, - { - "epoch": 0.63, - "learning_rate": 1.8647656051088705e-05, - "loss": 2.3724, - "step": 359570 - }, - { - "epoch": 0.63, - "learning_rate": 1.864678411116188e-05, - "loss": 2.306, - "step": 359580 - }, - { - "epoch": 0.63, - "learning_rate": 1.8645912171235052e-05, - "loss": 2.2665, - "step": 359590 - }, - { - "epoch": 0.63, - "learning_rate": 1.8645040231308226e-05, - "loss": 2.3301, - "step": 359600 - }, - { - "epoch": 0.63, - "learning_rate": 1.8644168291381396e-05, - "loss": 2.319, - "step": 359610 - }, - { - "epoch": 0.63, - "learning_rate": 1.864329635145457e-05, - "loss": 2.3053, - "step": 359620 - }, - { - "epoch": 0.63, - "learning_rate": 1.8642424411527744e-05, - "loss": 2.2944, - "step": 359630 - }, - { - "epoch": 0.63, - "learning_rate": 1.8641552471600918e-05, - "loss": 2.3189, - "step": 359640 - }, - { - "epoch": 0.63, - "learning_rate": 1.864068053167409e-05, - "loss": 2.3437, - "step": 359650 - }, - { - "epoch": 0.63, - "learning_rate": 1.8639808591747262e-05, - "loss": 2.2602, - "step": 359660 - }, - { - "epoch": 0.63, - "learning_rate": 1.863893665182044e-05, - "loss": 2.3275, - "step": 359670 - }, - { - "epoch": 0.63, - "learning_rate": 1.863806471189361e-05, - "loss": 2.3471, - "step": 359680 - }, - { - "epoch": 0.63, - "learning_rate": 1.8637192771966783e-05, - "loss": 2.2516, - "step": 359690 - }, - { - "epoch": 0.63, - "learning_rate": 1.8636320832039957e-05, - "loss": 2.4334, - "step": 359700 - }, - { - "epoch": 0.63, - "learning_rate": 1.863544889211313e-05, - "loss": 2.2997, - "step": 359710 - }, - { - "epoch": 0.63, - "learning_rate": 1.86345769521863e-05, - "loss": 2.3031, - "step": 359720 - }, - { - "epoch": 0.63, - "learning_rate": 1.8633705012259475e-05, - "loss": 2.2232, - "step": 359730 - }, - { - "epoch": 0.63, - "learning_rate": 1.8632833072332652e-05, - "loss": 2.3528, - "step": 359740 - }, - { - "epoch": 0.63, - "learning_rate": 1.8631961132405822e-05, - "loss": 2.3817, - "step": 359750 - }, - { - "epoch": 0.63, - "learning_rate": 1.8631089192478996e-05, - "loss": 2.315, - "step": 359760 - }, - { - "epoch": 0.63, - "learning_rate": 1.8630217252552167e-05, - "loss": 2.2895, - "step": 359770 - }, - { - "epoch": 0.63, - "learning_rate": 1.8629345312625344e-05, - "loss": 2.3053, - "step": 359780 - }, - { - "epoch": 0.63, - "learning_rate": 1.8628473372698514e-05, - "loss": 2.2577, - "step": 359790 - }, - { - "epoch": 0.63, - "learning_rate": 1.8627601432771688e-05, - "loss": 2.3411, - "step": 359800 - }, - { - "epoch": 0.63, - "learning_rate": 1.8626729492844862e-05, - "loss": 2.3119, - "step": 359810 - }, - { - "epoch": 0.63, - "learning_rate": 1.8625857552918035e-05, - "loss": 2.3855, - "step": 359820 - }, - { - "epoch": 0.63, - "learning_rate": 1.862498561299121e-05, - "loss": 2.3624, - "step": 359830 - }, - { - "epoch": 0.63, - "learning_rate": 1.862411367306438e-05, - "loss": 2.3367, - "step": 359840 - }, - { - "epoch": 0.63, - "learning_rate": 1.8623241733137557e-05, - "loss": 2.2404, - "step": 359850 - }, - { - "epoch": 0.63, - "learning_rate": 1.8622369793210727e-05, - "loss": 2.3829, - "step": 359860 - }, - { - "epoch": 0.63, - "learning_rate": 1.86214978532839e-05, - "loss": 2.2968, - "step": 359870 - }, - { - "epoch": 0.63, - "learning_rate": 1.8620625913357075e-05, - "loss": 2.3606, - "step": 359880 - }, - { - "epoch": 0.63, - "learning_rate": 1.861975397343025e-05, - "loss": 2.3589, - "step": 359890 - }, - { - "epoch": 0.63, - "learning_rate": 1.8618882033503422e-05, - "loss": 2.3698, - "step": 359900 - }, - { - "epoch": 0.63, - "learning_rate": 1.8618010093576593e-05, - "loss": 2.2979, - "step": 359910 - }, - { - "epoch": 0.63, - "learning_rate": 1.8617138153649766e-05, - "loss": 2.2671, - "step": 359920 - }, - { - "epoch": 0.63, - "learning_rate": 1.861626621372294e-05, - "loss": 2.1954, - "step": 359930 - }, - { - "epoch": 0.63, - "learning_rate": 1.8615394273796114e-05, - "loss": 2.3208, - "step": 359940 - }, - { - "epoch": 0.63, - "learning_rate": 1.8614522333869284e-05, - "loss": 2.2864, - "step": 359950 - }, - { - "epoch": 0.63, - "learning_rate": 1.861365039394246e-05, - "loss": 2.3194, - "step": 359960 - }, - { - "epoch": 0.63, - "learning_rate": 1.8612778454015635e-05, - "loss": 2.2356, - "step": 359970 - }, - { - "epoch": 0.63, - "learning_rate": 1.8611906514088806e-05, - "loss": 2.4041, - "step": 359980 - }, - { - "epoch": 0.63, - "learning_rate": 1.861103457416198e-05, - "loss": 2.3567, - "step": 359990 - }, - { - "epoch": 0.63, - "learning_rate": 1.8610162634235153e-05, - "loss": 2.3732, - "step": 360000 - }, - { - "epoch": 0.63, - "learning_rate": 1.8609290694308327e-05, - "loss": 2.288, - "step": 360010 - }, - { - "epoch": 0.63, - "learning_rate": 1.8608418754381497e-05, - "loss": 2.3511, - "step": 360020 - }, - { - "epoch": 0.63, - "learning_rate": 1.860754681445467e-05, - "loss": 2.3299, - "step": 360030 - }, - { - "epoch": 0.63, - "learning_rate": 1.8606674874527845e-05, - "loss": 2.3115, - "step": 360040 - }, - { - "epoch": 0.63, - "learning_rate": 1.860580293460102e-05, - "loss": 2.2577, - "step": 360050 - }, - { - "epoch": 0.63, - "learning_rate": 1.8604930994674192e-05, - "loss": 2.4564, - "step": 360060 - }, - { - "epoch": 0.63, - "learning_rate": 1.8604059054747363e-05, - "loss": 2.33, - "step": 360070 - }, - { - "epoch": 0.63, - "learning_rate": 1.860318711482054e-05, - "loss": 2.283, - "step": 360080 - }, - { - "epoch": 0.63, - "learning_rate": 1.860231517489371e-05, - "loss": 2.3601, - "step": 360090 - }, - { - "epoch": 0.63, - "learning_rate": 1.8601443234966884e-05, - "loss": 2.3077, - "step": 360100 - }, - { - "epoch": 0.63, - "learning_rate": 1.8600571295040058e-05, - "loss": 2.3001, - "step": 360110 - }, - { - "epoch": 0.63, - "learning_rate": 1.859969935511323e-05, - "loss": 2.2787, - "step": 360120 - }, - { - "epoch": 0.63, - "learning_rate": 1.8598827415186405e-05, - "loss": 2.4189, - "step": 360130 - }, - { - "epoch": 0.63, - "learning_rate": 1.8597955475259576e-05, - "loss": 2.392, - "step": 360140 - }, - { - "epoch": 0.63, - "learning_rate": 1.8597083535332753e-05, - "loss": 2.2584, - "step": 360150 - }, - { - "epoch": 0.63, - "learning_rate": 1.8596211595405923e-05, - "loss": 2.2234, - "step": 360160 - }, - { - "epoch": 0.63, - "learning_rate": 1.8595339655479097e-05, - "loss": 2.3709, - "step": 360170 - }, - { - "epoch": 0.63, - "learning_rate": 1.8594467715552267e-05, - "loss": 2.3995, - "step": 360180 - }, - { - "epoch": 0.63, - "learning_rate": 1.8593595775625445e-05, - "loss": 2.4375, - "step": 360190 - }, - { - "epoch": 0.63, - "learning_rate": 1.8592723835698615e-05, - "loss": 2.42, - "step": 360200 - }, - { - "epoch": 0.63, - "learning_rate": 1.859185189577179e-05, - "loss": 2.2037, - "step": 360210 - }, - { - "epoch": 0.63, - "learning_rate": 1.8590979955844966e-05, - "loss": 2.3427, - "step": 360220 - }, - { - "epoch": 0.63, - "learning_rate": 1.8590108015918136e-05, - "loss": 2.2992, - "step": 360230 - }, - { - "epoch": 0.63, - "learning_rate": 1.858923607599131e-05, - "loss": 2.2579, - "step": 360240 - }, - { - "epoch": 0.63, - "learning_rate": 1.858836413606448e-05, - "loss": 2.3106, - "step": 360250 - }, - { - "epoch": 0.63, - "learning_rate": 1.8587492196137658e-05, - "loss": 2.3462, - "step": 360260 - }, - { - "epoch": 0.63, - "learning_rate": 1.8586620256210828e-05, - "loss": 2.1572, - "step": 360270 - }, - { - "epoch": 0.63, - "learning_rate": 1.8585748316284002e-05, - "loss": 2.3359, - "step": 360280 - }, - { - "epoch": 0.63, - "learning_rate": 1.8584876376357176e-05, - "loss": 2.34, - "step": 360290 - }, - { - "epoch": 0.63, - "learning_rate": 1.858400443643035e-05, - "loss": 2.3627, - "step": 360300 - }, - { - "epoch": 0.63, - "learning_rate": 1.8583132496503523e-05, - "loss": 2.3947, - "step": 360310 - }, - { - "epoch": 0.63, - "learning_rate": 1.8582260556576694e-05, - "loss": 2.3286, - "step": 360320 - }, - { - "epoch": 0.63, - "learning_rate": 1.8581388616649867e-05, - "loss": 2.2761, - "step": 360330 - }, - { - "epoch": 0.63, - "learning_rate": 1.858051667672304e-05, - "loss": 2.3497, - "step": 360340 - }, - { - "epoch": 0.63, - "learning_rate": 1.8579644736796215e-05, - "loss": 2.3138, - "step": 360350 - }, - { - "epoch": 0.63, - "learning_rate": 1.857877279686939e-05, - "loss": 2.29, - "step": 360360 - }, - { - "epoch": 0.63, - "learning_rate": 1.8577900856942562e-05, - "loss": 2.3254, - "step": 360370 - }, - { - "epoch": 0.63, - "learning_rate": 1.8577028917015736e-05, - "loss": 2.3712, - "step": 360380 - }, - { - "epoch": 0.63, - "learning_rate": 1.8576156977088907e-05, - "loss": 2.3404, - "step": 360390 - }, - { - "epoch": 0.63, - "learning_rate": 1.857528503716208e-05, - "loss": 2.3092, - "step": 360400 - }, - { - "epoch": 0.63, - "learning_rate": 1.8574413097235254e-05, - "loss": 2.346, - "step": 360410 - }, - { - "epoch": 0.63, - "learning_rate": 1.8573541157308428e-05, - "loss": 2.2189, - "step": 360420 - }, - { - "epoch": 0.63, - "learning_rate": 1.8572669217381598e-05, - "loss": 2.2769, - "step": 360430 - }, - { - "epoch": 0.63, - "learning_rate": 1.8571797277454772e-05, - "loss": 2.4136, - "step": 360440 - }, - { - "epoch": 0.63, - "learning_rate": 1.8570925337527946e-05, - "loss": 2.2848, - "step": 360450 - }, - { - "epoch": 0.63, - "learning_rate": 1.857005339760112e-05, - "loss": 2.2392, - "step": 360460 - }, - { - "epoch": 0.63, - "learning_rate": 1.8569181457674293e-05, - "loss": 2.3603, - "step": 360470 - }, - { - "epoch": 0.63, - "learning_rate": 1.8568309517747467e-05, - "loss": 2.2571, - "step": 360480 - }, - { - "epoch": 0.63, - "learning_rate": 1.856743757782064e-05, - "loss": 2.2838, - "step": 360490 - }, - { - "epoch": 0.63, - "learning_rate": 1.856656563789381e-05, - "loss": 2.3356, - "step": 360500 - }, - { - "epoch": 0.63, - "learning_rate": 1.8565693697966985e-05, - "loss": 2.286, - "step": 360510 - }, - { - "epoch": 0.63, - "learning_rate": 1.856482175804016e-05, - "loss": 2.2508, - "step": 360520 - }, - { - "epoch": 0.63, - "learning_rate": 1.8563949818113333e-05, - "loss": 2.3924, - "step": 360530 - }, - { - "epoch": 0.63, - "learning_rate": 1.8563077878186506e-05, - "loss": 2.2964, - "step": 360540 - }, - { - "epoch": 0.63, - "learning_rate": 1.8562205938259677e-05, - "loss": 2.2557, - "step": 360550 - }, - { - "epoch": 0.63, - "learning_rate": 1.8561333998332854e-05, - "loss": 2.2888, - "step": 360560 - }, - { - "epoch": 0.63, - "learning_rate": 1.8560462058406024e-05, - "loss": 2.3677, - "step": 360570 - }, - { - "epoch": 0.63, - "learning_rate": 1.8559590118479198e-05, - "loss": 2.3288, - "step": 360580 - }, - { - "epoch": 0.63, - "learning_rate": 1.8558718178552372e-05, - "loss": 2.3065, - "step": 360590 - }, - { - "epoch": 0.63, - "learning_rate": 1.8557846238625546e-05, - "loss": 2.4114, - "step": 360600 - }, - { - "epoch": 0.63, - "learning_rate": 1.855697429869872e-05, - "loss": 2.3153, - "step": 360610 - }, - { - "epoch": 0.63, - "learning_rate": 1.855610235877189e-05, - "loss": 2.1661, - "step": 360620 - }, - { - "epoch": 0.63, - "learning_rate": 1.8555230418845067e-05, - "loss": 2.286, - "step": 360630 - }, - { - "epoch": 0.63, - "learning_rate": 1.8554358478918237e-05, - "loss": 2.3571, - "step": 360640 - }, - { - "epoch": 0.63, - "learning_rate": 1.855348653899141e-05, - "loss": 2.3746, - "step": 360650 - }, - { - "epoch": 0.63, - "learning_rate": 1.855261459906458e-05, - "loss": 2.3288, - "step": 360660 - }, - { - "epoch": 0.63, - "learning_rate": 1.855174265913776e-05, - "loss": 2.2811, - "step": 360670 - }, - { - "epoch": 0.63, - "learning_rate": 1.855087071921093e-05, - "loss": 2.3046, - "step": 360680 - }, - { - "epoch": 0.63, - "learning_rate": 1.8549998779284103e-05, - "loss": 2.2881, - "step": 360690 - }, - { - "epoch": 0.63, - "learning_rate": 1.8549126839357276e-05, - "loss": 2.2409, - "step": 360700 - }, - { - "epoch": 0.63, - "learning_rate": 1.854825489943045e-05, - "loss": 2.2205, - "step": 360710 - }, - { - "epoch": 0.63, - "learning_rate": 1.8547382959503624e-05, - "loss": 2.2289, - "step": 360720 - }, - { - "epoch": 0.63, - "learning_rate": 1.8546511019576794e-05, - "loss": 2.3535, - "step": 360730 - }, - { - "epoch": 0.63, - "learning_rate": 1.8545639079649968e-05, - "loss": 2.3324, - "step": 360740 - }, - { - "epoch": 0.63, - "learning_rate": 1.8544767139723142e-05, - "loss": 2.2906, - "step": 360750 - }, - { - "epoch": 0.63, - "learning_rate": 1.8543895199796316e-05, - "loss": 2.3539, - "step": 360760 - }, - { - "epoch": 0.63, - "learning_rate": 1.854302325986949e-05, - "loss": 2.1847, - "step": 360770 - }, - { - "epoch": 0.63, - "learning_rate": 1.8542151319942663e-05, - "loss": 2.2755, - "step": 360780 - }, - { - "epoch": 0.63, - "learning_rate": 1.8541279380015837e-05, - "loss": 2.3457, - "step": 360790 - }, - { - "epoch": 0.63, - "learning_rate": 1.8540407440089007e-05, - "loss": 2.3691, - "step": 360800 - }, - { - "epoch": 0.63, - "learning_rate": 1.853953550016218e-05, - "loss": 2.3274, - "step": 360810 - }, - { - "epoch": 0.63, - "learning_rate": 1.8538663560235355e-05, - "loss": 2.3283, - "step": 360820 - }, - { - "epoch": 0.63, - "learning_rate": 1.853779162030853e-05, - "loss": 2.2455, - "step": 360830 - }, - { - "epoch": 0.63, - "learning_rate": 1.8536919680381702e-05, - "loss": 2.366, - "step": 360840 - }, - { - "epoch": 0.63, - "learning_rate": 1.8536047740454873e-05, - "loss": 2.3236, - "step": 360850 - }, - { - "epoch": 0.63, - "learning_rate": 1.853517580052805e-05, - "loss": 2.2706, - "step": 360860 - }, - { - "epoch": 0.63, - "learning_rate": 1.853430386060122e-05, - "loss": 2.2441, - "step": 360870 - }, - { - "epoch": 0.63, - "learning_rate": 1.8533431920674394e-05, - "loss": 2.3922, - "step": 360880 - }, - { - "epoch": 0.63, - "learning_rate": 1.8532559980747568e-05, - "loss": 2.2907, - "step": 360890 - }, - { - "epoch": 0.63, - "learning_rate": 1.853168804082074e-05, - "loss": 2.3204, - "step": 360900 - }, - { - "epoch": 0.63, - "learning_rate": 1.8530816100893912e-05, - "loss": 2.3452, - "step": 360910 - }, - { - "epoch": 0.63, - "learning_rate": 1.8529944160967086e-05, - "loss": 2.2749, - "step": 360920 - }, - { - "epoch": 0.63, - "learning_rate": 1.852907222104026e-05, - "loss": 2.3858, - "step": 360930 - }, - { - "epoch": 0.63, - "learning_rate": 1.8528200281113433e-05, - "loss": 2.2931, - "step": 360940 - }, - { - "epoch": 0.63, - "learning_rate": 1.8527328341186607e-05, - "loss": 2.3081, - "step": 360950 - }, - { - "epoch": 0.63, - "learning_rate": 1.8526456401259778e-05, - "loss": 2.4349, - "step": 360960 - }, - { - "epoch": 0.63, - "learning_rate": 1.8525584461332955e-05, - "loss": 2.2887, - "step": 360970 - }, - { - "epoch": 0.63, - "learning_rate": 1.8524712521406125e-05, - "loss": 2.3103, - "step": 360980 - }, - { - "epoch": 0.63, - "learning_rate": 1.85238405814793e-05, - "loss": 2.1988, - "step": 360990 - }, - { - "epoch": 0.63, - "learning_rate": 1.8522968641552473e-05, - "loss": 2.2717, - "step": 361000 - }, - { - "epoch": 0.63, - "learning_rate": 1.8522096701625646e-05, - "loss": 2.2511, - "step": 361010 - }, - { - "epoch": 0.63, - "learning_rate": 1.852122476169882e-05, - "loss": 2.3657, - "step": 361020 - }, - { - "epoch": 0.63, - "learning_rate": 1.852035282177199e-05, - "loss": 2.4178, - "step": 361030 - }, - { - "epoch": 0.63, - "learning_rate": 1.8519480881845168e-05, - "loss": 2.3081, - "step": 361040 - }, - { - "epoch": 0.63, - "learning_rate": 1.8518608941918338e-05, - "loss": 2.3095, - "step": 361050 - }, - { - "epoch": 0.63, - "learning_rate": 1.8517737001991512e-05, - "loss": 2.2493, - "step": 361060 - }, - { - "epoch": 0.63, - "learning_rate": 1.8516865062064682e-05, - "loss": 2.3023, - "step": 361070 - }, - { - "epoch": 0.63, - "learning_rate": 1.851599312213786e-05, - "loss": 2.4155, - "step": 361080 - }, - { - "epoch": 0.63, - "learning_rate": 1.8515121182211033e-05, - "loss": 2.2709, - "step": 361090 - }, - { - "epoch": 0.63, - "learning_rate": 1.8514249242284204e-05, - "loss": 2.464, - "step": 361100 - }, - { - "epoch": 0.63, - "learning_rate": 1.8513377302357377e-05, - "loss": 2.2663, - "step": 361110 - }, - { - "epoch": 0.63, - "learning_rate": 1.851250536243055e-05, - "loss": 2.2881, - "step": 361120 - }, - { - "epoch": 0.63, - "learning_rate": 1.8511633422503725e-05, - "loss": 2.3069, - "step": 361130 - }, - { - "epoch": 0.63, - "learning_rate": 1.8510761482576895e-05, - "loss": 2.2969, - "step": 361140 - }, - { - "epoch": 0.63, - "learning_rate": 1.8509889542650072e-05, - "loss": 2.347, - "step": 361150 - }, - { - "epoch": 0.63, - "learning_rate": 1.8509017602723243e-05, - "loss": 2.2506, - "step": 361160 - }, - { - "epoch": 0.63, - "learning_rate": 1.8508145662796417e-05, - "loss": 2.2809, - "step": 361170 - }, - { - "epoch": 0.63, - "learning_rate": 1.850727372286959e-05, - "loss": 2.3252, - "step": 361180 - }, - { - "epoch": 0.63, - "learning_rate": 1.8506401782942764e-05, - "loss": 2.292, - "step": 361190 - }, - { - "epoch": 0.63, - "learning_rate": 1.8505529843015938e-05, - "loss": 2.4414, - "step": 361200 - }, - { - "epoch": 0.63, - "learning_rate": 1.8504657903089108e-05, - "loss": 2.229, - "step": 361210 - }, - { - "epoch": 0.63, - "learning_rate": 1.8503785963162282e-05, - "loss": 2.3169, - "step": 361220 - }, - { - "epoch": 0.63, - "learning_rate": 1.8502914023235456e-05, - "loss": 2.3462, - "step": 361230 - }, - { - "epoch": 0.63, - "learning_rate": 1.850204208330863e-05, - "loss": 2.1588, - "step": 361240 - }, - { - "epoch": 0.63, - "learning_rate": 1.8501170143381803e-05, - "loss": 2.3438, - "step": 361250 - }, - { - "epoch": 0.63, - "learning_rate": 1.8500298203454974e-05, - "loss": 2.3765, - "step": 361260 - }, - { - "epoch": 0.63, - "learning_rate": 1.849942626352815e-05, - "loss": 2.3038, - "step": 361270 - }, - { - "epoch": 0.63, - "learning_rate": 1.849855432360132e-05, - "loss": 2.3187, - "step": 361280 - }, - { - "epoch": 0.63, - "learning_rate": 1.8497682383674495e-05, - "loss": 2.3048, - "step": 361290 - }, - { - "epoch": 0.63, - "learning_rate": 1.849681044374767e-05, - "loss": 2.4213, - "step": 361300 - }, - { - "epoch": 0.63, - "learning_rate": 1.8495938503820843e-05, - "loss": 2.3012, - "step": 361310 - }, - { - "epoch": 0.63, - "learning_rate": 1.8495066563894016e-05, - "loss": 2.4008, - "step": 361320 - }, - { - "epoch": 0.63, - "learning_rate": 1.8494194623967187e-05, - "loss": 2.3819, - "step": 361330 - }, - { - "epoch": 0.63, - "learning_rate": 1.8493322684040364e-05, - "loss": 2.3264, - "step": 361340 - }, - { - "epoch": 0.63, - "learning_rate": 1.8492450744113534e-05, - "loss": 2.3574, - "step": 361350 - }, - { - "epoch": 0.63, - "learning_rate": 1.8491578804186708e-05, - "loss": 2.2984, - "step": 361360 - }, - { - "epoch": 0.63, - "learning_rate": 1.849070686425988e-05, - "loss": 2.3348, - "step": 361370 - }, - { - "epoch": 0.63, - "learning_rate": 1.8489834924333056e-05, - "loss": 2.348, - "step": 361380 - }, - { - "epoch": 0.63, - "learning_rate": 1.8488962984406226e-05, - "loss": 2.3978, - "step": 361390 - }, - { - "epoch": 0.63, - "learning_rate": 1.84880910444794e-05, - "loss": 2.3527, - "step": 361400 - }, - { - "epoch": 0.63, - "learning_rate": 1.8487219104552573e-05, - "loss": 2.3589, - "step": 361410 - }, - { - "epoch": 0.63, - "learning_rate": 1.8486347164625747e-05, - "loss": 2.3695, - "step": 361420 - }, - { - "epoch": 0.63, - "learning_rate": 1.848547522469892e-05, - "loss": 2.2988, - "step": 361430 - }, - { - "epoch": 0.63, - "learning_rate": 1.848460328477209e-05, - "loss": 2.374, - "step": 361440 - }, - { - "epoch": 0.63, - "learning_rate": 1.848373134484527e-05, - "loss": 2.2941, - "step": 361450 - }, - { - "epoch": 0.63, - "learning_rate": 1.848285940491844e-05, - "loss": 2.2719, - "step": 361460 - }, - { - "epoch": 0.63, - "learning_rate": 1.8481987464991613e-05, - "loss": 2.2661, - "step": 361470 - }, - { - "epoch": 0.63, - "learning_rate": 1.8481115525064786e-05, - "loss": 2.3959, - "step": 361480 - }, - { - "epoch": 0.63, - "learning_rate": 1.848024358513796e-05, - "loss": 2.1818, - "step": 361490 - }, - { - "epoch": 0.63, - "learning_rate": 1.8479371645211134e-05, - "loss": 2.3334, - "step": 361500 - }, - { - "epoch": 0.63, - "learning_rate": 1.8478499705284304e-05, - "loss": 2.3807, - "step": 361510 - }, - { - "epoch": 0.63, - "learning_rate": 1.8477627765357478e-05, - "loss": 2.256, - "step": 361520 - }, - { - "epoch": 0.63, - "learning_rate": 1.8476755825430652e-05, - "loss": 2.413, - "step": 361530 - }, - { - "epoch": 0.63, - "learning_rate": 1.8475883885503826e-05, - "loss": 2.309, - "step": 361540 - }, - { - "epoch": 0.63, - "learning_rate": 1.8475011945576996e-05, - "loss": 2.2885, - "step": 361550 - }, - { - "epoch": 0.63, - "learning_rate": 1.8474140005650173e-05, - "loss": 2.2779, - "step": 361560 - }, - { - "epoch": 0.63, - "learning_rate": 1.8473268065723347e-05, - "loss": 2.2148, - "step": 361570 - }, - { - "epoch": 0.63, - "learning_rate": 1.8472396125796517e-05, - "loss": 2.3665, - "step": 361580 - }, - { - "epoch": 0.63, - "learning_rate": 1.847152418586969e-05, - "loss": 2.3712, - "step": 361590 - }, - { - "epoch": 0.63, - "learning_rate": 1.8470652245942865e-05, - "loss": 2.2866, - "step": 361600 - }, - { - "epoch": 0.63, - "learning_rate": 1.846978030601604e-05, - "loss": 2.3562, - "step": 361610 - }, - { - "epoch": 0.63, - "learning_rate": 1.846890836608921e-05, - "loss": 2.3832, - "step": 361620 - }, - { - "epoch": 0.63, - "learning_rate": 1.8468036426162383e-05, - "loss": 2.3077, - "step": 361630 - }, - { - "epoch": 0.63, - "learning_rate": 1.8467164486235557e-05, - "loss": 2.2947, - "step": 361640 - }, - { - "epoch": 0.63, - "learning_rate": 1.846629254630873e-05, - "loss": 2.3049, - "step": 361650 - }, - { - "epoch": 0.63, - "learning_rate": 1.8465420606381904e-05, - "loss": 2.3427, - "step": 361660 - }, - { - "epoch": 0.63, - "learning_rate": 1.8464548666455075e-05, - "loss": 2.3639, - "step": 361670 - }, - { - "epoch": 0.63, - "learning_rate": 1.846367672652825e-05, - "loss": 2.2975, - "step": 361680 - }, - { - "epoch": 0.63, - "learning_rate": 1.8462804786601422e-05, - "loss": 2.3418, - "step": 361690 - }, - { - "epoch": 0.63, - "learning_rate": 1.8461932846674596e-05, - "loss": 2.3347, - "step": 361700 - }, - { - "epoch": 0.63, - "learning_rate": 1.846106090674777e-05, - "loss": 2.3171, - "step": 361710 - }, - { - "epoch": 0.63, - "learning_rate": 1.8460188966820943e-05, - "loss": 2.2863, - "step": 361720 - }, - { - "epoch": 0.63, - "learning_rate": 1.8459317026894117e-05, - "loss": 2.3751, - "step": 361730 - }, - { - "epoch": 0.63, - "learning_rate": 1.8458445086967288e-05, - "loss": 2.3661, - "step": 361740 - }, - { - "epoch": 0.63, - "learning_rate": 1.8457573147040465e-05, - "loss": 2.3832, - "step": 361750 - }, - { - "epoch": 0.63, - "learning_rate": 1.8456701207113635e-05, - "loss": 2.345, - "step": 361760 - }, - { - "epoch": 0.63, - "learning_rate": 1.845582926718681e-05, - "loss": 2.3231, - "step": 361770 - }, - { - "epoch": 0.63, - "learning_rate": 1.845495732725998e-05, - "loss": 2.3407, - "step": 361780 - }, - { - "epoch": 0.63, - "learning_rate": 1.8454085387333156e-05, - "loss": 2.3608, - "step": 361790 - }, - { - "epoch": 0.63, - "learning_rate": 1.8453213447406327e-05, - "loss": 2.3469, - "step": 361800 - }, - { - "epoch": 0.63, - "learning_rate": 1.84523415074795e-05, - "loss": 2.2818, - "step": 361810 - }, - { - "epoch": 0.63, - "learning_rate": 1.8451469567552678e-05, - "loss": 2.3559, - "step": 361820 - }, - { - "epoch": 0.63, - "learning_rate": 1.8450597627625848e-05, - "loss": 2.307, - "step": 361830 - }, - { - "epoch": 0.63, - "learning_rate": 1.8449725687699022e-05, - "loss": 2.3975, - "step": 361840 - }, - { - "epoch": 0.63, - "learning_rate": 1.8448853747772192e-05, - "loss": 2.3443, - "step": 361850 - }, - { - "epoch": 0.63, - "learning_rate": 1.844798180784537e-05, - "loss": 2.4522, - "step": 361860 - }, - { - "epoch": 0.63, - "learning_rate": 1.844710986791854e-05, - "loss": 2.2418, - "step": 361870 - }, - { - "epoch": 0.63, - "learning_rate": 1.8446237927991714e-05, - "loss": 2.3127, - "step": 361880 - }, - { - "epoch": 0.63, - "learning_rate": 1.8445365988064887e-05, - "loss": 2.3262, - "step": 361890 - }, - { - "epoch": 0.63, - "learning_rate": 1.844449404813806e-05, - "loss": 2.4218, - "step": 361900 - }, - { - "epoch": 0.63, - "learning_rate": 1.8443622108211235e-05, - "loss": 2.3423, - "step": 361910 - }, - { - "epoch": 0.63, - "learning_rate": 1.8442750168284405e-05, - "loss": 2.2733, - "step": 361920 - }, - { - "epoch": 0.63, - "learning_rate": 1.844187822835758e-05, - "loss": 2.3319, - "step": 361930 - }, - { - "epoch": 0.63, - "learning_rate": 1.8441006288430753e-05, - "loss": 2.3034, - "step": 361940 - }, - { - "epoch": 0.63, - "learning_rate": 1.8440134348503927e-05, - "loss": 2.2386, - "step": 361950 - }, - { - "epoch": 0.63, - "learning_rate": 1.84392624085771e-05, - "loss": 2.3755, - "step": 361960 - }, - { - "epoch": 0.63, - "learning_rate": 1.8438390468650274e-05, - "loss": 2.3366, - "step": 361970 - }, - { - "epoch": 0.63, - "learning_rate": 1.8437518528723448e-05, - "loss": 2.3444, - "step": 361980 - }, - { - "epoch": 0.63, - "learning_rate": 1.8436646588796618e-05, - "loss": 2.2518, - "step": 361990 - }, - { - "epoch": 0.63, - "learning_rate": 1.8435774648869792e-05, - "loss": 2.2812, - "step": 362000 - }, - { - "epoch": 0.63, - "learning_rate": 1.8434902708942966e-05, - "loss": 2.475, - "step": 362010 - }, - { - "epoch": 0.63, - "learning_rate": 1.843403076901614e-05, - "loss": 2.3884, - "step": 362020 - }, - { - "epoch": 0.63, - "learning_rate": 1.843315882908931e-05, - "loss": 2.3722, - "step": 362030 - }, - { - "epoch": 0.63, - "learning_rate": 1.8432286889162484e-05, - "loss": 2.341, - "step": 362040 - }, - { - "epoch": 0.63, - "learning_rate": 1.843141494923566e-05, - "loss": 2.3463, - "step": 362050 - }, - { - "epoch": 0.63, - "learning_rate": 1.843054300930883e-05, - "loss": 2.3512, - "step": 362060 - }, - { - "epoch": 0.63, - "learning_rate": 1.8429671069382005e-05, - "loss": 2.337, - "step": 362070 - }, - { - "epoch": 0.63, - "learning_rate": 1.842879912945518e-05, - "loss": 2.2999, - "step": 362080 - }, - { - "epoch": 0.63, - "learning_rate": 1.8427927189528353e-05, - "loss": 2.4729, - "step": 362090 - }, - { - "epoch": 0.63, - "learning_rate": 1.8427055249601523e-05, - "loss": 2.2979, - "step": 362100 - }, - { - "epoch": 0.63, - "learning_rate": 1.8426183309674697e-05, - "loss": 2.3759, - "step": 362110 - }, - { - "epoch": 0.63, - "learning_rate": 1.842531136974787e-05, - "loss": 2.4013, - "step": 362120 - }, - { - "epoch": 0.63, - "learning_rate": 1.8424439429821044e-05, - "loss": 2.2556, - "step": 362130 - }, - { - "epoch": 0.63, - "learning_rate": 1.8423567489894218e-05, - "loss": 2.436, - "step": 362140 - }, - { - "epoch": 0.63, - "learning_rate": 1.842269554996739e-05, - "loss": 2.39, - "step": 362150 - }, - { - "epoch": 0.63, - "learning_rate": 1.8421823610040566e-05, - "loss": 2.2751, - "step": 362160 - }, - { - "epoch": 0.63, - "learning_rate": 1.8420951670113736e-05, - "loss": 2.374, - "step": 362170 - }, - { - "epoch": 0.63, - "learning_rate": 1.842007973018691e-05, - "loss": 2.3209, - "step": 362180 - }, - { - "epoch": 0.63, - "learning_rate": 1.8419207790260083e-05, - "loss": 2.3542, - "step": 362190 - }, - { - "epoch": 0.63, - "learning_rate": 1.8418335850333257e-05, - "loss": 2.2894, - "step": 362200 - }, - { - "epoch": 0.63, - "learning_rate": 1.841746391040643e-05, - "loss": 2.3352, - "step": 362210 - }, - { - "epoch": 0.63, - "learning_rate": 1.84165919704796e-05, - "loss": 2.3838, - "step": 362220 - }, - { - "epoch": 0.63, - "learning_rate": 1.841572003055278e-05, - "loss": 2.3561, - "step": 362230 - }, - { - "epoch": 0.63, - "learning_rate": 1.841484809062595e-05, - "loss": 2.3292, - "step": 362240 - }, - { - "epoch": 0.63, - "learning_rate": 1.8413976150699123e-05, - "loss": 2.3576, - "step": 362250 - }, - { - "epoch": 0.63, - "learning_rate": 1.8413104210772293e-05, - "loss": 2.3898, - "step": 362260 - }, - { - "epoch": 0.63, - "learning_rate": 1.841223227084547e-05, - "loss": 2.2975, - "step": 362270 - }, - { - "epoch": 0.63, - "learning_rate": 1.841136033091864e-05, - "loss": 2.2989, - "step": 362280 - }, - { - "epoch": 0.63, - "learning_rate": 1.8410488390991814e-05, - "loss": 2.4415, - "step": 362290 - }, - { - "epoch": 0.63, - "learning_rate": 1.8409616451064988e-05, - "loss": 2.3472, - "step": 362300 - }, - { - "epoch": 0.63, - "learning_rate": 1.8408744511138162e-05, - "loss": 2.4003, - "step": 362310 - }, - { - "epoch": 0.63, - "learning_rate": 1.8407872571211336e-05, - "loss": 2.4506, - "step": 362320 - }, - { - "epoch": 0.63, - "learning_rate": 1.8407000631284506e-05, - "loss": 2.2518, - "step": 362330 - }, - { - "epoch": 0.63, - "learning_rate": 1.8406128691357683e-05, - "loss": 2.3446, - "step": 362340 - }, - { - "epoch": 0.63, - "learning_rate": 1.8405256751430854e-05, - "loss": 2.3936, - "step": 362350 - }, - { - "epoch": 0.63, - "learning_rate": 1.8404384811504027e-05, - "loss": 2.1847, - "step": 362360 - }, - { - "epoch": 0.63, - "learning_rate": 1.84035128715772e-05, - "loss": 2.3369, - "step": 362370 - }, - { - "epoch": 0.63, - "learning_rate": 1.8402640931650375e-05, - "loss": 2.2943, - "step": 362380 - }, - { - "epoch": 0.63, - "learning_rate": 1.840176899172355e-05, - "loss": 2.3666, - "step": 362390 - }, - { - "epoch": 0.63, - "learning_rate": 1.840089705179672e-05, - "loss": 2.2852, - "step": 362400 - }, - { - "epoch": 0.63, - "learning_rate": 1.8400025111869893e-05, - "loss": 2.3782, - "step": 362410 - }, - { - "epoch": 0.63, - "learning_rate": 1.8399153171943067e-05, - "loss": 2.2461, - "step": 362420 - }, - { - "epoch": 0.63, - "learning_rate": 1.839828123201624e-05, - "loss": 2.2125, - "step": 362430 - }, - { - "epoch": 0.63, - "learning_rate": 1.8397409292089414e-05, - "loss": 2.2789, - "step": 362440 - }, - { - "epoch": 0.63, - "learning_rate": 1.8396537352162585e-05, - "loss": 2.3167, - "step": 362450 - }, - { - "epoch": 0.63, - "learning_rate": 1.839566541223576e-05, - "loss": 2.239, - "step": 362460 - }, - { - "epoch": 0.63, - "learning_rate": 1.8394793472308932e-05, - "loss": 2.3318, - "step": 362470 - }, - { - "epoch": 0.63, - "learning_rate": 1.8393921532382106e-05, - "loss": 2.3444, - "step": 362480 - }, - { - "epoch": 0.63, - "learning_rate": 1.839304959245528e-05, - "loss": 2.3545, - "step": 362490 - }, - { - "epoch": 0.63, - "learning_rate": 1.8392177652528453e-05, - "loss": 2.2901, - "step": 362500 - }, - { - "epoch": 0.63, - "learning_rate": 1.8391305712601624e-05, - "loss": 2.2948, - "step": 362510 - }, - { - "epoch": 0.63, - "learning_rate": 1.8390433772674798e-05, - "loss": 2.2451, - "step": 362520 - }, - { - "epoch": 0.63, - "learning_rate": 1.838956183274797e-05, - "loss": 2.3153, - "step": 362530 - }, - { - "epoch": 0.63, - "learning_rate": 1.8388689892821145e-05, - "loss": 2.3389, - "step": 362540 - }, - { - "epoch": 0.63, - "learning_rate": 1.838781795289432e-05, - "loss": 2.2955, - "step": 362550 - }, - { - "epoch": 0.63, - "learning_rate": 1.838694601296749e-05, - "loss": 2.3483, - "step": 362560 - }, - { - "epoch": 0.63, - "learning_rate": 1.8386074073040666e-05, - "loss": 2.3644, - "step": 362570 - }, - { - "epoch": 0.63, - "learning_rate": 1.8385202133113837e-05, - "loss": 2.352, - "step": 362580 - }, - { - "epoch": 0.63, - "learning_rate": 1.838433019318701e-05, - "loss": 2.2643, - "step": 362590 - }, - { - "epoch": 0.63, - "learning_rate": 1.8383458253260184e-05, - "loss": 2.3986, - "step": 362600 - }, - { - "epoch": 0.63, - "learning_rate": 1.8382586313333358e-05, - "loss": 2.3314, - "step": 362610 - }, - { - "epoch": 0.63, - "learning_rate": 1.8381714373406532e-05, - "loss": 2.2787, - "step": 362620 - }, - { - "epoch": 0.63, - "learning_rate": 1.8380842433479702e-05, - "loss": 2.1369, - "step": 362630 - }, - { - "epoch": 0.63, - "learning_rate": 1.837997049355288e-05, - "loss": 2.3216, - "step": 362640 - }, - { - "epoch": 0.63, - "learning_rate": 1.837909855362605e-05, - "loss": 2.3882, - "step": 362650 - }, - { - "epoch": 0.63, - "learning_rate": 1.8378226613699224e-05, - "loss": 2.3317, - "step": 362660 - }, - { - "epoch": 0.63, - "learning_rate": 1.8377354673772397e-05, - "loss": 2.2067, - "step": 362670 - }, - { - "epoch": 0.63, - "learning_rate": 1.837648273384557e-05, - "loss": 2.3192, - "step": 362680 - }, - { - "epoch": 0.63, - "learning_rate": 1.8375610793918745e-05, - "loss": 2.3808, - "step": 362690 - }, - { - "epoch": 0.63, - "learning_rate": 1.8374738853991915e-05, - "loss": 2.2739, - "step": 362700 - }, - { - "epoch": 0.63, - "learning_rate": 1.837386691406509e-05, - "loss": 2.344, - "step": 362710 - }, - { - "epoch": 0.63, - "learning_rate": 1.8372994974138263e-05, - "loss": 2.2452, - "step": 362720 - }, - { - "epoch": 0.63, - "learning_rate": 1.8372123034211437e-05, - "loss": 2.3909, - "step": 362730 - }, - { - "epoch": 0.63, - "learning_rate": 1.8371251094284607e-05, - "loss": 2.3464, - "step": 362740 - }, - { - "epoch": 0.63, - "learning_rate": 1.8370379154357784e-05, - "loss": 2.3803, - "step": 362750 - }, - { - "epoch": 0.63, - "learning_rate": 1.8369507214430954e-05, - "loss": 2.3126, - "step": 362760 - }, - { - "epoch": 0.63, - "learning_rate": 1.8368635274504128e-05, - "loss": 2.3878, - "step": 362770 - }, - { - "epoch": 0.63, - "learning_rate": 1.8367763334577302e-05, - "loss": 2.2028, - "step": 362780 - }, - { - "epoch": 0.63, - "learning_rate": 1.8366891394650476e-05, - "loss": 2.3559, - "step": 362790 - }, - { - "epoch": 0.63, - "learning_rate": 1.836601945472365e-05, - "loss": 2.4134, - "step": 362800 - }, - { - "epoch": 0.63, - "learning_rate": 1.836514751479682e-05, - "loss": 2.348, - "step": 362810 - }, - { - "epoch": 0.63, - "learning_rate": 1.8364275574869994e-05, - "loss": 2.2767, - "step": 362820 - }, - { - "epoch": 0.63, - "learning_rate": 1.8363403634943167e-05, - "loss": 2.3503, - "step": 362830 - }, - { - "epoch": 0.63, - "learning_rate": 1.836253169501634e-05, - "loss": 2.2389, - "step": 362840 - }, - { - "epoch": 0.63, - "learning_rate": 1.8361659755089515e-05, - "loss": 2.244, - "step": 362850 - }, - { - "epoch": 0.63, - "learning_rate": 1.8360787815162685e-05, - "loss": 2.2318, - "step": 362860 - }, - { - "epoch": 0.63, - "learning_rate": 1.8359915875235863e-05, - "loss": 2.3474, - "step": 362870 - }, - { - "epoch": 0.63, - "learning_rate": 1.8359043935309033e-05, - "loss": 2.3259, - "step": 362880 - }, - { - "epoch": 0.63, - "learning_rate": 1.8358171995382207e-05, - "loss": 2.2732, - "step": 362890 - }, - { - "epoch": 0.63, - "learning_rate": 1.835730005545538e-05, - "loss": 2.3559, - "step": 362900 - }, - { - "epoch": 0.63, - "learning_rate": 1.8356428115528554e-05, - "loss": 2.1897, - "step": 362910 - }, - { - "epoch": 0.63, - "learning_rate": 1.8355556175601728e-05, - "loss": 2.4102, - "step": 362920 - }, - { - "epoch": 0.63, - "learning_rate": 1.83546842356749e-05, - "loss": 2.2931, - "step": 362930 - }, - { - "epoch": 0.63, - "learning_rate": 1.8353812295748076e-05, - "loss": 2.516, - "step": 362940 - }, - { - "epoch": 0.63, - "learning_rate": 1.8352940355821246e-05, - "loss": 2.301, - "step": 362950 - }, - { - "epoch": 0.63, - "learning_rate": 1.835206841589442e-05, - "loss": 2.4497, - "step": 362960 - }, - { - "epoch": 0.63, - "learning_rate": 1.835119647596759e-05, - "loss": 2.3997, - "step": 362970 - }, - { - "epoch": 0.63, - "learning_rate": 1.8350324536040767e-05, - "loss": 2.3569, - "step": 362980 - }, - { - "epoch": 0.63, - "learning_rate": 1.8349452596113938e-05, - "loss": 2.322, - "step": 362990 - }, - { - "epoch": 0.63, - "learning_rate": 1.834858065618711e-05, - "loss": 2.2911, - "step": 363000 - }, - { - "epoch": 0.63, - "learning_rate": 1.8347708716260285e-05, - "loss": 2.4045, - "step": 363010 - }, - { - "epoch": 0.63, - "learning_rate": 1.834683677633346e-05, - "loss": 2.2449, - "step": 363020 - }, - { - "epoch": 0.63, - "learning_rate": 1.8345964836406633e-05, - "loss": 2.3566, - "step": 363030 - }, - { - "epoch": 0.63, - "learning_rate": 1.8345092896479803e-05, - "loss": 2.3384, - "step": 363040 - }, - { - "epoch": 0.63, - "learning_rate": 1.834422095655298e-05, - "loss": 2.2829, - "step": 363050 - }, - { - "epoch": 0.63, - "learning_rate": 1.834334901662615e-05, - "loss": 2.3699, - "step": 363060 - }, - { - "epoch": 0.63, - "learning_rate": 1.8342477076699324e-05, - "loss": 2.3466, - "step": 363070 - }, - { - "epoch": 0.63, - "learning_rate": 1.8341605136772498e-05, - "loss": 2.3861, - "step": 363080 - }, - { - "epoch": 0.63, - "learning_rate": 1.8340733196845672e-05, - "loss": 2.294, - "step": 363090 - }, - { - "epoch": 0.63, - "learning_rate": 1.8339861256918846e-05, - "loss": 2.2751, - "step": 363100 - }, - { - "epoch": 0.63, - "learning_rate": 1.8338989316992016e-05, - "loss": 2.2994, - "step": 363110 - }, - { - "epoch": 0.63, - "learning_rate": 1.833811737706519e-05, - "loss": 2.2483, - "step": 363120 - }, - { - "epoch": 0.63, - "learning_rate": 1.8337245437138364e-05, - "loss": 2.3436, - "step": 363130 - }, - { - "epoch": 0.63, - "learning_rate": 1.8336373497211537e-05, - "loss": 2.4314, - "step": 363140 - }, - { - "epoch": 0.63, - "learning_rate": 1.8335501557284708e-05, - "loss": 2.3045, - "step": 363150 - }, - { - "epoch": 0.63, - "learning_rate": 1.8334629617357885e-05, - "loss": 2.4326, - "step": 363160 - }, - { - "epoch": 0.63, - "learning_rate": 1.833375767743106e-05, - "loss": 2.2938, - "step": 363170 - }, - { - "epoch": 0.63, - "learning_rate": 1.833288573750423e-05, - "loss": 2.287, - "step": 363180 - }, - { - "epoch": 0.63, - "learning_rate": 1.8332013797577403e-05, - "loss": 2.2727, - "step": 363190 - }, - { - "epoch": 0.63, - "learning_rate": 1.8331141857650577e-05, - "loss": 2.1824, - "step": 363200 - }, - { - "epoch": 0.63, - "learning_rate": 1.833026991772375e-05, - "loss": 2.3568, - "step": 363210 - }, - { - "epoch": 0.63, - "learning_rate": 1.832939797779692e-05, - "loss": 2.3095, - "step": 363220 - }, - { - "epoch": 0.63, - "learning_rate": 1.8328526037870095e-05, - "loss": 2.3564, - "step": 363230 - }, - { - "epoch": 0.63, - "learning_rate": 1.8327654097943268e-05, - "loss": 2.3835, - "step": 363240 - }, - { - "epoch": 0.63, - "learning_rate": 1.8326782158016442e-05, - "loss": 2.3905, - "step": 363250 - }, - { - "epoch": 0.63, - "learning_rate": 1.8325910218089616e-05, - "loss": 2.3704, - "step": 363260 - }, - { - "epoch": 0.63, - "learning_rate": 1.832503827816279e-05, - "loss": 2.3259, - "step": 363270 - }, - { - "epoch": 0.63, - "learning_rate": 1.8324166338235963e-05, - "loss": 2.3024, - "step": 363280 - }, - { - "epoch": 0.63, - "learning_rate": 1.8323294398309134e-05, - "loss": 2.2366, - "step": 363290 - }, - { - "epoch": 0.63, - "learning_rate": 1.8322422458382308e-05, - "loss": 2.2365, - "step": 363300 - }, - { - "epoch": 0.63, - "learning_rate": 1.832155051845548e-05, - "loss": 2.4501, - "step": 363310 - }, - { - "epoch": 0.63, - "learning_rate": 1.8320678578528655e-05, - "loss": 2.2054, - "step": 363320 - }, - { - "epoch": 0.63, - "learning_rate": 1.831980663860183e-05, - "loss": 2.371, - "step": 363330 - }, - { - "epoch": 0.63, - "learning_rate": 1.8318934698675e-05, - "loss": 2.2317, - "step": 363340 - }, - { - "epoch": 0.63, - "learning_rate": 1.8318062758748176e-05, - "loss": 2.371, - "step": 363350 - }, - { - "epoch": 0.63, - "learning_rate": 1.8317190818821347e-05, - "loss": 2.3532, - "step": 363360 - }, - { - "epoch": 0.63, - "learning_rate": 1.831631887889452e-05, - "loss": 2.2312, - "step": 363370 - }, - { - "epoch": 0.63, - "learning_rate": 1.831544693896769e-05, - "loss": 2.3283, - "step": 363380 - }, - { - "epoch": 0.63, - "learning_rate": 1.8314574999040868e-05, - "loss": 2.2321, - "step": 363390 - }, - { - "epoch": 0.63, - "learning_rate": 1.8313703059114042e-05, - "loss": 2.3447, - "step": 363400 - }, - { - "epoch": 0.63, - "learning_rate": 1.8312831119187212e-05, - "loss": 2.2785, - "step": 363410 - }, - { - "epoch": 0.63, - "learning_rate": 1.831195917926039e-05, - "loss": 2.4025, - "step": 363420 - }, - { - "epoch": 0.63, - "learning_rate": 1.831108723933356e-05, - "loss": 2.3223, - "step": 363430 - }, - { - "epoch": 0.63, - "learning_rate": 1.8310215299406734e-05, - "loss": 2.3351, - "step": 363440 - }, - { - "epoch": 0.63, - "learning_rate": 1.8309343359479904e-05, - "loss": 2.2572, - "step": 363450 - }, - { - "epoch": 0.63, - "learning_rate": 1.830847141955308e-05, - "loss": 2.3675, - "step": 363460 - }, - { - "epoch": 0.63, - "learning_rate": 1.830759947962625e-05, - "loss": 2.3752, - "step": 363470 - }, - { - "epoch": 0.63, - "learning_rate": 1.8306727539699425e-05, - "loss": 2.3946, - "step": 363480 - }, - { - "epoch": 0.63, - "learning_rate": 1.83058555997726e-05, - "loss": 2.3287, - "step": 363490 - }, - { - "epoch": 0.63, - "learning_rate": 1.8304983659845773e-05, - "loss": 2.376, - "step": 363500 - }, - { - "epoch": 0.63, - "learning_rate": 1.8304111719918947e-05, - "loss": 2.3053, - "step": 363510 - }, - { - "epoch": 0.63, - "learning_rate": 1.8303239779992117e-05, - "loss": 2.34, - "step": 363520 - }, - { - "epoch": 0.63, - "learning_rate": 1.830236784006529e-05, - "loss": 2.3543, - "step": 363530 - }, - { - "epoch": 0.63, - "learning_rate": 1.8301495900138464e-05, - "loss": 2.4111, - "step": 363540 - }, - { - "epoch": 0.63, - "learning_rate": 1.8300623960211638e-05, - "loss": 2.2978, - "step": 363550 - }, - { - "epoch": 0.63, - "learning_rate": 1.8299752020284812e-05, - "loss": 2.3233, - "step": 363560 - }, - { - "epoch": 0.63, - "learning_rate": 1.8298880080357986e-05, - "loss": 2.3206, - "step": 363570 - }, - { - "epoch": 0.63, - "learning_rate": 1.829800814043116e-05, - "loss": 2.3594, - "step": 363580 - }, - { - "epoch": 0.63, - "learning_rate": 1.829713620050433e-05, - "loss": 2.3115, - "step": 363590 - }, - { - "epoch": 0.63, - "learning_rate": 1.8296264260577504e-05, - "loss": 2.4035, - "step": 363600 - }, - { - "epoch": 0.63, - "learning_rate": 1.8295392320650677e-05, - "loss": 2.3637, - "step": 363610 - }, - { - "epoch": 0.63, - "learning_rate": 1.829452038072385e-05, - "loss": 2.3469, - "step": 363620 - }, - { - "epoch": 0.63, - "learning_rate": 1.829364844079702e-05, - "loss": 2.4554, - "step": 363630 - }, - { - "epoch": 0.63, - "learning_rate": 1.8292776500870195e-05, - "loss": 2.3518, - "step": 363640 - }, - { - "epoch": 0.63, - "learning_rate": 1.8291904560943373e-05, - "loss": 2.3506, - "step": 363650 - }, - { - "epoch": 0.63, - "learning_rate": 1.8291032621016543e-05, - "loss": 2.3324, - "step": 363660 - }, - { - "epoch": 0.63, - "learning_rate": 1.8290160681089717e-05, - "loss": 2.3305, - "step": 363670 - }, - { - "epoch": 0.63, - "learning_rate": 1.828928874116289e-05, - "loss": 2.5168, - "step": 363680 - }, - { - "epoch": 0.63, - "learning_rate": 1.8288416801236064e-05, - "loss": 2.355, - "step": 363690 - }, - { - "epoch": 0.63, - "learning_rate": 1.8287544861309235e-05, - "loss": 2.37, - "step": 363700 - }, - { - "epoch": 0.63, - "learning_rate": 1.828667292138241e-05, - "loss": 2.2828, - "step": 363710 - }, - { - "epoch": 0.63, - "learning_rate": 1.8285800981455582e-05, - "loss": 2.3839, - "step": 363720 - }, - { - "epoch": 0.63, - "learning_rate": 1.8284929041528756e-05, - "loss": 2.2915, - "step": 363730 - }, - { - "epoch": 0.63, - "learning_rate": 1.828405710160193e-05, - "loss": 2.2886, - "step": 363740 - }, - { - "epoch": 0.63, - "learning_rate": 1.82831851616751e-05, - "loss": 2.3123, - "step": 363750 - }, - { - "epoch": 0.63, - "learning_rate": 1.8282313221748277e-05, - "loss": 2.3696, - "step": 363760 - }, - { - "epoch": 0.63, - "learning_rate": 1.8281441281821448e-05, - "loss": 2.4275, - "step": 363770 - }, - { - "epoch": 0.63, - "learning_rate": 1.828056934189462e-05, - "loss": 2.222, - "step": 363780 - }, - { - "epoch": 0.63, - "learning_rate": 1.8279697401967795e-05, - "loss": 2.3662, - "step": 363790 - }, - { - "epoch": 0.63, - "learning_rate": 1.827882546204097e-05, - "loss": 2.3833, - "step": 363800 - }, - { - "epoch": 0.63, - "learning_rate": 1.8277953522114143e-05, - "loss": 2.5125, - "step": 363810 - }, - { - "epoch": 0.63, - "learning_rate": 1.8277081582187313e-05, - "loss": 2.3399, - "step": 363820 - }, - { - "epoch": 0.63, - "learning_rate": 1.827620964226049e-05, - "loss": 2.2916, - "step": 363830 - }, - { - "epoch": 0.63, - "learning_rate": 1.827533770233366e-05, - "loss": 2.4504, - "step": 363840 - }, - { - "epoch": 0.63, - "learning_rate": 1.8274465762406834e-05, - "loss": 2.255, - "step": 363850 - }, - { - "epoch": 0.63, - "learning_rate": 1.8273593822480005e-05, - "loss": 2.2991, - "step": 363860 - }, - { - "epoch": 0.63, - "learning_rate": 1.8272721882553182e-05, - "loss": 2.3093, - "step": 363870 - }, - { - "epoch": 0.63, - "learning_rate": 1.8271849942626352e-05, - "loss": 2.2988, - "step": 363880 - }, - { - "epoch": 0.63, - "learning_rate": 1.8270978002699526e-05, - "loss": 2.2733, - "step": 363890 - }, - { - "epoch": 0.63, - "learning_rate": 1.82701060627727e-05, - "loss": 2.2278, - "step": 363900 - }, - { - "epoch": 0.63, - "learning_rate": 1.8269234122845874e-05, - "loss": 2.2722, - "step": 363910 - }, - { - "epoch": 0.63, - "learning_rate": 1.8268362182919047e-05, - "loss": 2.3292, - "step": 363920 - }, - { - "epoch": 0.63, - "learning_rate": 1.8267490242992218e-05, - "loss": 2.3608, - "step": 363930 - }, - { - "epoch": 0.63, - "learning_rate": 1.8266618303065395e-05, - "loss": 2.3281, - "step": 363940 - }, - { - "epoch": 0.63, - "learning_rate": 1.8265746363138565e-05, - "loss": 2.3579, - "step": 363950 - }, - { - "epoch": 0.63, - "learning_rate": 1.826487442321174e-05, - "loss": 2.3801, - "step": 363960 - }, - { - "epoch": 0.63, - "learning_rate": 1.8264002483284913e-05, - "loss": 2.373, - "step": 363970 - }, - { - "epoch": 0.63, - "learning_rate": 1.8263130543358087e-05, - "loss": 2.3094, - "step": 363980 - }, - { - "epoch": 0.63, - "learning_rate": 1.826225860343126e-05, - "loss": 2.3824, - "step": 363990 - }, - { - "epoch": 0.63, - "learning_rate": 1.826138666350443e-05, - "loss": 2.2528, - "step": 364000 - }, - { - "epoch": 0.63, - "learning_rate": 1.8260514723577605e-05, - "loss": 2.3227, - "step": 364010 - }, - { - "epoch": 0.63, - "learning_rate": 1.8259642783650778e-05, - "loss": 2.3468, - "step": 364020 - }, - { - "epoch": 0.63, - "learning_rate": 1.8258770843723952e-05, - "loss": 2.4083, - "step": 364030 - }, - { - "epoch": 0.63, - "learning_rate": 1.8257898903797126e-05, - "loss": 2.3193, - "step": 364040 - }, - { - "epoch": 0.63, - "learning_rate": 1.8257026963870296e-05, - "loss": 2.2975, - "step": 364050 - }, - { - "epoch": 0.63, - "learning_rate": 1.8256155023943473e-05, - "loss": 2.3813, - "step": 364060 - }, - { - "epoch": 0.63, - "learning_rate": 1.8255283084016644e-05, - "loss": 2.3657, - "step": 364070 - }, - { - "epoch": 0.63, - "learning_rate": 1.8254411144089818e-05, - "loss": 2.3212, - "step": 364080 - }, - { - "epoch": 0.63, - "learning_rate": 1.825353920416299e-05, - "loss": 2.2754, - "step": 364090 - }, - { - "epoch": 0.63, - "learning_rate": 1.8252667264236165e-05, - "loss": 2.3801, - "step": 364100 - }, - { - "epoch": 0.63, - "learning_rate": 1.8251795324309335e-05, - "loss": 2.2545, - "step": 364110 - }, - { - "epoch": 0.63, - "learning_rate": 1.825092338438251e-05, - "loss": 2.3241, - "step": 364120 - }, - { - "epoch": 0.63, - "learning_rate": 1.8250051444455686e-05, - "loss": 2.3435, - "step": 364130 - }, - { - "epoch": 0.64, - "learning_rate": 1.8249179504528857e-05, - "loss": 2.3407, - "step": 364140 - }, - { - "epoch": 0.64, - "learning_rate": 1.824830756460203e-05, - "loss": 2.3138, - "step": 364150 - }, - { - "epoch": 0.64, - "learning_rate": 1.82474356246752e-05, - "loss": 2.2713, - "step": 364160 - }, - { - "epoch": 0.64, - "learning_rate": 1.8246563684748378e-05, - "loss": 2.2934, - "step": 364170 - }, - { - "epoch": 0.64, - "learning_rate": 1.824569174482155e-05, - "loss": 2.1927, - "step": 364180 - }, - { - "epoch": 0.64, - "learning_rate": 1.8244819804894722e-05, - "loss": 2.3016, - "step": 364190 - }, - { - "epoch": 0.64, - "learning_rate": 1.8243947864967896e-05, - "loss": 2.2639, - "step": 364200 - }, - { - "epoch": 0.64, - "learning_rate": 1.824307592504107e-05, - "loss": 2.297, - "step": 364210 - }, - { - "epoch": 0.64, - "learning_rate": 1.8242203985114244e-05, - "loss": 2.3051, - "step": 364220 - }, - { - "epoch": 0.64, - "learning_rate": 1.8241332045187414e-05, - "loss": 2.3162, - "step": 364230 - }, - { - "epoch": 0.64, - "learning_rate": 1.824046010526059e-05, - "loss": 2.2759, - "step": 364240 - }, - { - "epoch": 0.64, - "learning_rate": 1.823958816533376e-05, - "loss": 2.2967, - "step": 364250 - }, - { - "epoch": 0.64, - "learning_rate": 1.8238716225406935e-05, - "loss": 2.1801, - "step": 364260 - }, - { - "epoch": 0.64, - "learning_rate": 1.823784428548011e-05, - "loss": 2.3135, - "step": 364270 - }, - { - "epoch": 0.64, - "learning_rate": 1.8236972345553283e-05, - "loss": 2.341, - "step": 364280 - }, - { - "epoch": 0.64, - "learning_rate": 1.8236100405626457e-05, - "loss": 2.2946, - "step": 364290 - }, - { - "epoch": 0.64, - "learning_rate": 1.8235228465699627e-05, - "loss": 2.2877, - "step": 364300 - }, - { - "epoch": 0.64, - "learning_rate": 1.82343565257728e-05, - "loss": 2.4199, - "step": 364310 - }, - { - "epoch": 0.64, - "learning_rate": 1.8233484585845974e-05, - "loss": 2.3001, - "step": 364320 - }, - { - "epoch": 0.64, - "learning_rate": 1.8232612645919148e-05, - "loss": 2.2729, - "step": 364330 - }, - { - "epoch": 0.64, - "learning_rate": 1.823174070599232e-05, - "loss": 2.2408, - "step": 364340 - }, - { - "epoch": 0.64, - "learning_rate": 1.8230868766065496e-05, - "loss": 2.3648, - "step": 364350 - }, - { - "epoch": 0.64, - "learning_rate": 1.8229996826138666e-05, - "loss": 2.3252, - "step": 364360 - }, - { - "epoch": 0.64, - "learning_rate": 1.822912488621184e-05, - "loss": 2.3134, - "step": 364370 - }, - { - "epoch": 0.64, - "learning_rate": 1.8228252946285014e-05, - "loss": 2.2363, - "step": 364380 - }, - { - "epoch": 0.64, - "learning_rate": 1.8227381006358187e-05, - "loss": 2.4006, - "step": 364390 - }, - { - "epoch": 0.64, - "learning_rate": 1.822650906643136e-05, - "loss": 2.2096, - "step": 364400 - }, - { - "epoch": 0.64, - "learning_rate": 1.822563712650453e-05, - "loss": 2.4477, - "step": 364410 - }, - { - "epoch": 0.64, - "learning_rate": 1.8224765186577705e-05, - "loss": 2.3947, - "step": 364420 - }, - { - "epoch": 0.64, - "learning_rate": 1.822389324665088e-05, - "loss": 2.3234, - "step": 364430 - }, - { - "epoch": 0.64, - "learning_rate": 1.8223021306724053e-05, - "loss": 2.2953, - "step": 364440 - }, - { - "epoch": 0.64, - "learning_rate": 1.8222149366797227e-05, - "loss": 2.3255, - "step": 364450 - }, - { - "epoch": 0.64, - "learning_rate": 1.8221277426870397e-05, - "loss": 2.2307, - "step": 364460 - }, - { - "epoch": 0.64, - "learning_rate": 1.8220405486943574e-05, - "loss": 2.3489, - "step": 364470 - }, - { - "epoch": 0.64, - "learning_rate": 1.8219533547016745e-05, - "loss": 2.3096, - "step": 364480 - }, - { - "epoch": 0.64, - "learning_rate": 1.821866160708992e-05, - "loss": 2.3205, - "step": 364490 - }, - { - "epoch": 0.64, - "learning_rate": 1.8217789667163092e-05, - "loss": 2.3753, - "step": 364500 - }, - { - "epoch": 0.64, - "learning_rate": 1.8216917727236266e-05, - "loss": 2.3458, - "step": 364510 - }, - { - "epoch": 0.64, - "learning_rate": 1.821604578730944e-05, - "loss": 2.3418, - "step": 364520 - }, - { - "epoch": 0.64, - "learning_rate": 1.821517384738261e-05, - "loss": 2.1469, - "step": 364530 - }, - { - "epoch": 0.64, - "learning_rate": 1.8214301907455787e-05, - "loss": 2.2734, - "step": 364540 - }, - { - "epoch": 0.64, - "learning_rate": 1.8213429967528958e-05, - "loss": 2.4429, - "step": 364550 - }, - { - "epoch": 0.64, - "learning_rate": 1.821255802760213e-05, - "loss": 2.4409, - "step": 364560 - }, - { - "epoch": 0.64, - "learning_rate": 1.8211686087675302e-05, - "loss": 2.3156, - "step": 364570 - }, - { - "epoch": 0.64, - "learning_rate": 1.821081414774848e-05, - "loss": 2.357, - "step": 364580 - }, - { - "epoch": 0.64, - "learning_rate": 1.820994220782165e-05, - "loss": 2.323, - "step": 364590 - }, - { - "epoch": 0.64, - "learning_rate": 1.8209070267894823e-05, - "loss": 2.2813, - "step": 364600 - }, - { - "epoch": 0.64, - "learning_rate": 1.8208198327967997e-05, - "loss": 2.3322, - "step": 364610 - }, - { - "epoch": 0.64, - "learning_rate": 1.820732638804117e-05, - "loss": 2.2938, - "step": 364620 - }, - { - "epoch": 0.64, - "learning_rate": 1.8206454448114344e-05, - "loss": 2.275, - "step": 364630 - }, - { - "epoch": 0.64, - "learning_rate": 1.8205582508187515e-05, - "loss": 2.3858, - "step": 364640 - }, - { - "epoch": 0.64, - "learning_rate": 1.8204710568260692e-05, - "loss": 2.2759, - "step": 364650 - }, - { - "epoch": 0.64, - "learning_rate": 1.8203838628333862e-05, - "loss": 2.3633, - "step": 364660 - }, - { - "epoch": 0.64, - "learning_rate": 1.8202966688407036e-05, - "loss": 2.1981, - "step": 364670 - }, - { - "epoch": 0.64, - "learning_rate": 1.820209474848021e-05, - "loss": 2.3377, - "step": 364680 - }, - { - "epoch": 0.64, - "learning_rate": 1.8201222808553384e-05, - "loss": 2.3744, - "step": 364690 - }, - { - "epoch": 0.64, - "learning_rate": 1.8200350868626557e-05, - "loss": 2.2666, - "step": 364700 - }, - { - "epoch": 0.64, - "learning_rate": 1.8199478928699728e-05, - "loss": 2.2875, - "step": 364710 - }, - { - "epoch": 0.64, - "learning_rate": 1.81986069887729e-05, - "loss": 2.3435, - "step": 364720 - }, - { - "epoch": 0.64, - "learning_rate": 1.8197735048846075e-05, - "loss": 2.327, - "step": 364730 - }, - { - "epoch": 0.64, - "learning_rate": 1.819686310891925e-05, - "loss": 2.3991, - "step": 364740 - }, - { - "epoch": 0.64, - "learning_rate": 1.8195991168992423e-05, - "loss": 2.3667, - "step": 364750 - }, - { - "epoch": 0.64, - "learning_rate": 1.8195119229065597e-05, - "loss": 2.2182, - "step": 364760 - }, - { - "epoch": 0.64, - "learning_rate": 1.819424728913877e-05, - "loss": 2.312, - "step": 364770 - }, - { - "epoch": 0.64, - "learning_rate": 1.819337534921194e-05, - "loss": 2.3867, - "step": 364780 - }, - { - "epoch": 0.64, - "learning_rate": 1.8192503409285115e-05, - "loss": 2.355, - "step": 364790 - }, - { - "epoch": 0.64, - "learning_rate": 1.819163146935829e-05, - "loss": 2.2799, - "step": 364800 - }, - { - "epoch": 0.64, - "learning_rate": 1.8190759529431462e-05, - "loss": 2.1998, - "step": 364810 - }, - { - "epoch": 0.64, - "learning_rate": 1.8189887589504632e-05, - "loss": 2.3861, - "step": 364820 - }, - { - "epoch": 0.64, - "learning_rate": 1.8189015649577806e-05, - "loss": 2.3634, - "step": 364830 - }, - { - "epoch": 0.64, - "learning_rate": 1.818814370965098e-05, - "loss": 2.2827, - "step": 364840 - }, - { - "epoch": 0.64, - "learning_rate": 1.8187271769724154e-05, - "loss": 2.3099, - "step": 364850 - }, - { - "epoch": 0.64, - "learning_rate": 1.8186399829797328e-05, - "loss": 2.2527, - "step": 364860 - }, - { - "epoch": 0.64, - "learning_rate": 1.81855278898705e-05, - "loss": 2.3219, - "step": 364870 - }, - { - "epoch": 0.64, - "learning_rate": 1.8184655949943675e-05, - "loss": 2.3424, - "step": 364880 - }, - { - "epoch": 0.64, - "learning_rate": 1.8183784010016845e-05, - "loss": 2.3601, - "step": 364890 - }, - { - "epoch": 0.64, - "learning_rate": 1.818291207009002e-05, - "loss": 2.2019, - "step": 364900 - }, - { - "epoch": 0.64, - "learning_rate": 1.8182040130163193e-05, - "loss": 2.2618, - "step": 364910 - }, - { - "epoch": 0.64, - "learning_rate": 1.8181168190236367e-05, - "loss": 2.3455, - "step": 364920 - }, - { - "epoch": 0.64, - "learning_rate": 1.818029625030954e-05, - "loss": 2.2322, - "step": 364930 - }, - { - "epoch": 0.64, - "learning_rate": 1.817942431038271e-05, - "loss": 2.3264, - "step": 364940 - }, - { - "epoch": 0.64, - "learning_rate": 1.8178552370455888e-05, - "loss": 2.1749, - "step": 364950 - }, - { - "epoch": 0.64, - "learning_rate": 1.817768043052906e-05, - "loss": 2.2802, - "step": 364960 - }, - { - "epoch": 0.64, - "learning_rate": 1.8176808490602232e-05, - "loss": 2.1598, - "step": 364970 - }, - { - "epoch": 0.64, - "learning_rate": 1.8175936550675403e-05, - "loss": 2.2529, - "step": 364980 - }, - { - "epoch": 0.64, - "learning_rate": 1.817506461074858e-05, - "loss": 2.2416, - "step": 364990 - }, - { - "epoch": 0.64, - "learning_rate": 1.8174192670821754e-05, - "loss": 2.3488, - "step": 365000 - }, - { - "epoch": 0.64, - "learning_rate": 1.8173320730894924e-05, - "loss": 2.334, - "step": 365010 - }, - { - "epoch": 0.64, - "learning_rate": 1.81724487909681e-05, - "loss": 2.4309, - "step": 365020 - }, - { - "epoch": 0.64, - "learning_rate": 1.817157685104127e-05, - "loss": 2.211, - "step": 365030 - }, - { - "epoch": 0.64, - "learning_rate": 1.8170704911114445e-05, - "loss": 2.2794, - "step": 365040 - }, - { - "epoch": 0.64, - "learning_rate": 1.8169832971187616e-05, - "loss": 2.2431, - "step": 365050 - }, - { - "epoch": 0.64, - "learning_rate": 1.8168961031260793e-05, - "loss": 2.3766, - "step": 365060 - }, - { - "epoch": 0.64, - "learning_rate": 1.8168089091333963e-05, - "loss": 2.306, - "step": 365070 - }, - { - "epoch": 0.64, - "learning_rate": 1.8167217151407137e-05, - "loss": 2.3155, - "step": 365080 - }, - { - "epoch": 0.64, - "learning_rate": 1.816634521148031e-05, - "loss": 2.358, - "step": 365090 - }, - { - "epoch": 0.64, - "learning_rate": 1.8165473271553484e-05, - "loss": 2.2592, - "step": 365100 - }, - { - "epoch": 0.64, - "learning_rate": 1.8164601331626658e-05, - "loss": 2.4451, - "step": 365110 - }, - { - "epoch": 0.64, - "learning_rate": 1.816372939169983e-05, - "loss": 2.247, - "step": 365120 - }, - { - "epoch": 0.64, - "learning_rate": 1.8162857451773002e-05, - "loss": 2.375, - "step": 365130 - }, - { - "epoch": 0.64, - "learning_rate": 1.8161985511846176e-05, - "loss": 2.2855, - "step": 365140 - }, - { - "epoch": 0.64, - "learning_rate": 1.816111357191935e-05, - "loss": 2.2778, - "step": 365150 - }, - { - "epoch": 0.64, - "learning_rate": 1.8160241631992524e-05, - "loss": 2.3418, - "step": 365160 - }, - { - "epoch": 0.64, - "learning_rate": 1.8159369692065697e-05, - "loss": 2.3203, - "step": 365170 - }, - { - "epoch": 0.64, - "learning_rate": 1.815849775213887e-05, - "loss": 2.3179, - "step": 365180 - }, - { - "epoch": 0.64, - "learning_rate": 1.815762581221204e-05, - "loss": 2.2526, - "step": 365190 - }, - { - "epoch": 0.64, - "learning_rate": 1.8156753872285215e-05, - "loss": 2.3804, - "step": 365200 - }, - { - "epoch": 0.64, - "learning_rate": 1.815588193235839e-05, - "loss": 2.2074, - "step": 365210 - }, - { - "epoch": 0.64, - "learning_rate": 1.8155009992431563e-05, - "loss": 2.3762, - "step": 365220 - }, - { - "epoch": 0.64, - "learning_rate": 1.8154138052504733e-05, - "loss": 2.408, - "step": 365230 - }, - { - "epoch": 0.64, - "learning_rate": 1.8153266112577907e-05, - "loss": 2.3609, - "step": 365240 - }, - { - "epoch": 0.64, - "learning_rate": 1.8152394172651084e-05, - "loss": 2.3435, - "step": 365250 - }, - { - "epoch": 0.64, - "learning_rate": 1.8151522232724255e-05, - "loss": 2.3621, - "step": 365260 - }, - { - "epoch": 0.64, - "learning_rate": 1.815065029279743e-05, - "loss": 2.3359, - "step": 365270 - }, - { - "epoch": 0.64, - "learning_rate": 1.8149778352870602e-05, - "loss": 2.1998, - "step": 365280 - }, - { - "epoch": 0.64, - "learning_rate": 1.8148906412943776e-05, - "loss": 2.3272, - "step": 365290 - }, - { - "epoch": 0.64, - "learning_rate": 1.8148034473016946e-05, - "loss": 2.3719, - "step": 365300 - }, - { - "epoch": 0.64, - "learning_rate": 1.814716253309012e-05, - "loss": 2.3375, - "step": 365310 - }, - { - "epoch": 0.64, - "learning_rate": 1.8146290593163294e-05, - "loss": 2.42, - "step": 365320 - }, - { - "epoch": 0.64, - "learning_rate": 1.8145418653236468e-05, - "loss": 2.3294, - "step": 365330 - }, - { - "epoch": 0.64, - "learning_rate": 1.814454671330964e-05, - "loss": 2.3689, - "step": 365340 - }, - { - "epoch": 0.64, - "learning_rate": 1.8143674773382812e-05, - "loss": 2.2013, - "step": 365350 - }, - { - "epoch": 0.64, - "learning_rate": 1.814280283345599e-05, - "loss": 2.3836, - "step": 365360 - }, - { - "epoch": 0.64, - "learning_rate": 1.814193089352916e-05, - "loss": 2.324, - "step": 365370 - }, - { - "epoch": 0.64, - "learning_rate": 1.8141058953602333e-05, - "loss": 2.2682, - "step": 365380 - }, - { - "epoch": 0.64, - "learning_rate": 1.8140187013675507e-05, - "loss": 2.367, - "step": 365390 - }, - { - "epoch": 0.64, - "learning_rate": 1.813931507374868e-05, - "loss": 2.3515, - "step": 365400 - }, - { - "epoch": 0.64, - "learning_rate": 1.8138443133821854e-05, - "loss": 2.226, - "step": 365410 - }, - { - "epoch": 0.64, - "learning_rate": 1.8137571193895025e-05, - "loss": 2.3157, - "step": 365420 - }, - { - "epoch": 0.64, - "learning_rate": 1.8136699253968202e-05, - "loss": 2.3486, - "step": 365430 - }, - { - "epoch": 0.64, - "learning_rate": 1.8135827314041372e-05, - "loss": 2.354, - "step": 365440 - }, - { - "epoch": 0.64, - "learning_rate": 1.8134955374114546e-05, - "loss": 2.3805, - "step": 365450 - }, - { - "epoch": 0.64, - "learning_rate": 1.8134083434187716e-05, - "loss": 2.3854, - "step": 365460 - }, - { - "epoch": 0.64, - "learning_rate": 1.8133211494260894e-05, - "loss": 2.3555, - "step": 365470 - }, - { - "epoch": 0.64, - "learning_rate": 1.8132339554334067e-05, - "loss": 2.2931, - "step": 365480 - }, - { - "epoch": 0.64, - "learning_rate": 1.8131467614407238e-05, - "loss": 2.5155, - "step": 365490 - }, - { - "epoch": 0.64, - "learning_rate": 1.813059567448041e-05, - "loss": 2.2672, - "step": 365500 - }, - { - "epoch": 0.64, - "learning_rate": 1.8129723734553585e-05, - "loss": 2.4609, - "step": 365510 - }, - { - "epoch": 0.64, - "learning_rate": 1.812885179462676e-05, - "loss": 2.2929, - "step": 365520 - }, - { - "epoch": 0.64, - "learning_rate": 1.812797985469993e-05, - "loss": 2.3108, - "step": 365530 - }, - { - "epoch": 0.64, - "learning_rate": 1.8127107914773107e-05, - "loss": 2.2786, - "step": 365540 - }, - { - "epoch": 0.64, - "learning_rate": 1.8126235974846277e-05, - "loss": 2.4305, - "step": 365550 - }, - { - "epoch": 0.64, - "learning_rate": 1.812536403491945e-05, - "loss": 2.2135, - "step": 365560 - }, - { - "epoch": 0.64, - "learning_rate": 1.8124492094992625e-05, - "loss": 2.3245, - "step": 365570 - }, - { - "epoch": 0.64, - "learning_rate": 1.81236201550658e-05, - "loss": 2.2409, - "step": 365580 - }, - { - "epoch": 0.64, - "learning_rate": 1.8122748215138972e-05, - "loss": 2.3919, - "step": 365590 - }, - { - "epoch": 0.64, - "learning_rate": 1.8121876275212142e-05, - "loss": 2.2739, - "step": 365600 - }, - { - "epoch": 0.64, - "learning_rate": 1.8121004335285316e-05, - "loss": 2.3931, - "step": 365610 - }, - { - "epoch": 0.64, - "learning_rate": 1.812013239535849e-05, - "loss": 2.2801, - "step": 365620 - }, - { - "epoch": 0.64, - "learning_rate": 1.8119260455431664e-05, - "loss": 2.3051, - "step": 365630 - }, - { - "epoch": 0.64, - "learning_rate": 1.8118388515504838e-05, - "loss": 2.2404, - "step": 365640 - }, - { - "epoch": 0.64, - "learning_rate": 1.8117516575578008e-05, - "loss": 2.2554, - "step": 365650 - }, - { - "epoch": 0.64, - "learning_rate": 1.8116644635651185e-05, - "loss": 2.167, - "step": 365660 - }, - { - "epoch": 0.64, - "learning_rate": 1.8115772695724355e-05, - "loss": 2.2468, - "step": 365670 - }, - { - "epoch": 0.64, - "learning_rate": 1.811490075579753e-05, - "loss": 2.2517, - "step": 365680 - }, - { - "epoch": 0.64, - "learning_rate": 1.8114028815870703e-05, - "loss": 2.3684, - "step": 365690 - }, - { - "epoch": 0.64, - "learning_rate": 1.8113156875943877e-05, - "loss": 2.3554, - "step": 365700 - }, - { - "epoch": 0.64, - "learning_rate": 1.8112284936017047e-05, - "loss": 2.3183, - "step": 365710 - }, - { - "epoch": 0.64, - "learning_rate": 1.811141299609022e-05, - "loss": 2.315, - "step": 365720 - }, - { - "epoch": 0.64, - "learning_rate": 1.8110541056163398e-05, - "loss": 2.297, - "step": 365730 - }, - { - "epoch": 0.64, - "learning_rate": 1.810966911623657e-05, - "loss": 2.3822, - "step": 365740 - }, - { - "epoch": 0.64, - "learning_rate": 1.8108797176309742e-05, - "loss": 2.4429, - "step": 365750 - }, - { - "epoch": 0.64, - "learning_rate": 1.8107925236382913e-05, - "loss": 2.2189, - "step": 365760 - }, - { - "epoch": 0.64, - "learning_rate": 1.810705329645609e-05, - "loss": 2.3305, - "step": 365770 - }, - { - "epoch": 0.64, - "learning_rate": 1.810618135652926e-05, - "loss": 2.3011, - "step": 365780 - }, - { - "epoch": 0.64, - "learning_rate": 1.8105309416602434e-05, - "loss": 2.3394, - "step": 365790 - }, - { - "epoch": 0.64, - "learning_rate": 1.8104437476675608e-05, - "loss": 2.272, - "step": 365800 - }, - { - "epoch": 0.64, - "learning_rate": 1.810356553674878e-05, - "loss": 2.2718, - "step": 365810 - }, - { - "epoch": 0.64, - "learning_rate": 1.8102693596821955e-05, - "loss": 2.2438, - "step": 365820 - }, - { - "epoch": 0.64, - "learning_rate": 1.8101821656895126e-05, - "loss": 2.2762, - "step": 365830 - }, - { - "epoch": 0.64, - "learning_rate": 1.8100949716968303e-05, - "loss": 2.2704, - "step": 365840 - }, - { - "epoch": 0.64, - "learning_rate": 1.8100077777041473e-05, - "loss": 2.3083, - "step": 365850 - }, - { - "epoch": 0.64, - "learning_rate": 1.8099205837114647e-05, - "loss": 2.3868, - "step": 365860 - }, - { - "epoch": 0.64, - "learning_rate": 1.809833389718782e-05, - "loss": 2.1597, - "step": 365870 - }, - { - "epoch": 0.64, - "learning_rate": 1.8097461957260994e-05, - "loss": 2.3584, - "step": 365880 - }, - { - "epoch": 0.64, - "learning_rate": 1.8096590017334168e-05, - "loss": 2.2935, - "step": 365890 - }, - { - "epoch": 0.64, - "learning_rate": 1.809571807740734e-05, - "loss": 2.3426, - "step": 365900 - }, - { - "epoch": 0.64, - "learning_rate": 1.8094846137480512e-05, - "loss": 2.4063, - "step": 365910 - }, - { - "epoch": 0.64, - "learning_rate": 1.8093974197553686e-05, - "loss": 2.2775, - "step": 365920 - }, - { - "epoch": 0.64, - "learning_rate": 1.809310225762686e-05, - "loss": 2.3403, - "step": 365930 - }, - { - "epoch": 0.64, - "learning_rate": 1.809223031770003e-05, - "loss": 2.3854, - "step": 365940 - }, - { - "epoch": 0.64, - "learning_rate": 1.8091358377773207e-05, - "loss": 2.2881, - "step": 365950 - }, - { - "epoch": 0.64, - "learning_rate": 1.8090486437846378e-05, - "loss": 2.3447, - "step": 365960 - }, - { - "epoch": 0.64, - "learning_rate": 1.808961449791955e-05, - "loss": 2.3196, - "step": 365970 - }, - { - "epoch": 0.64, - "learning_rate": 1.8088742557992725e-05, - "loss": 2.3801, - "step": 365980 - }, - { - "epoch": 0.64, - "learning_rate": 1.80878706180659e-05, - "loss": 2.3133, - "step": 365990 - }, - { - "epoch": 0.64, - "learning_rate": 1.8086998678139073e-05, - "loss": 2.3152, - "step": 366000 - }, - { - "epoch": 0.64, - "learning_rate": 1.8086126738212243e-05, - "loss": 2.2818, - "step": 366010 - }, - { - "epoch": 0.64, - "learning_rate": 1.8085254798285417e-05, - "loss": 2.2855, - "step": 366020 - }, - { - "epoch": 0.64, - "learning_rate": 1.808438285835859e-05, - "loss": 2.4015, - "step": 366030 - }, - { - "epoch": 0.64, - "learning_rate": 1.8083510918431765e-05, - "loss": 2.3098, - "step": 366040 - }, - { - "epoch": 0.64, - "learning_rate": 1.808263897850494e-05, - "loss": 2.366, - "step": 366050 - }, - { - "epoch": 0.64, - "learning_rate": 1.808176703857811e-05, - "loss": 2.3207, - "step": 366060 - }, - { - "epoch": 0.64, - "learning_rate": 1.8080895098651286e-05, - "loss": 2.4126, - "step": 366070 - }, - { - "epoch": 0.64, - "learning_rate": 1.8080023158724456e-05, - "loss": 2.3586, - "step": 366080 - }, - { - "epoch": 0.64, - "learning_rate": 1.807915121879763e-05, - "loss": 2.2742, - "step": 366090 - }, - { - "epoch": 0.64, - "learning_rate": 1.8078279278870804e-05, - "loss": 2.2679, - "step": 366100 - }, - { - "epoch": 0.64, - "learning_rate": 1.8077407338943978e-05, - "loss": 2.3185, - "step": 366110 - }, - { - "epoch": 0.64, - "learning_rate": 1.807653539901715e-05, - "loss": 2.243, - "step": 366120 - }, - { - "epoch": 0.64, - "learning_rate": 1.8075663459090322e-05, - "loss": 2.2526, - "step": 366130 - }, - { - "epoch": 0.64, - "learning_rate": 1.80747915191635e-05, - "loss": 2.368, - "step": 366140 - }, - { - "epoch": 0.64, - "learning_rate": 1.807391957923667e-05, - "loss": 2.3412, - "step": 366150 - }, - { - "epoch": 0.64, - "learning_rate": 1.8073047639309843e-05, - "loss": 2.4722, - "step": 366160 - }, - { - "epoch": 0.64, - "learning_rate": 1.8072175699383013e-05, - "loss": 2.2742, - "step": 366170 - }, - { - "epoch": 0.64, - "learning_rate": 1.807130375945619e-05, - "loss": 2.3399, - "step": 366180 - }, - { - "epoch": 0.64, - "learning_rate": 1.807043181952936e-05, - "loss": 2.1444, - "step": 366190 - }, - { - "epoch": 0.64, - "learning_rate": 1.8069559879602535e-05, - "loss": 2.3074, - "step": 366200 - }, - { - "epoch": 0.64, - "learning_rate": 1.8068687939675712e-05, - "loss": 2.33, - "step": 366210 - }, - { - "epoch": 0.64, - "learning_rate": 1.8067815999748882e-05, - "loss": 2.2563, - "step": 366220 - }, - { - "epoch": 0.64, - "learning_rate": 1.8066944059822056e-05, - "loss": 2.2633, - "step": 366230 - }, - { - "epoch": 0.64, - "learning_rate": 1.8066072119895226e-05, - "loss": 2.3339, - "step": 366240 - }, - { - "epoch": 0.64, - "learning_rate": 1.8065200179968404e-05, - "loss": 2.2759, - "step": 366250 - }, - { - "epoch": 0.64, - "learning_rate": 1.8064328240041574e-05, - "loss": 2.3839, - "step": 366260 - }, - { - "epoch": 0.64, - "learning_rate": 1.8063456300114748e-05, - "loss": 2.3094, - "step": 366270 - }, - { - "epoch": 0.64, - "learning_rate": 1.806258436018792e-05, - "loss": 2.3467, - "step": 366280 - }, - { - "epoch": 0.64, - "learning_rate": 1.8061712420261095e-05, - "loss": 2.221, - "step": 366290 - }, - { - "epoch": 0.64, - "learning_rate": 1.806084048033427e-05, - "loss": 2.3069, - "step": 366300 - }, - { - "epoch": 0.64, - "learning_rate": 1.805996854040744e-05, - "loss": 2.3046, - "step": 366310 - }, - { - "epoch": 0.64, - "learning_rate": 1.8059096600480613e-05, - "loss": 2.4411, - "step": 366320 - }, - { - "epoch": 0.64, - "learning_rate": 1.8058224660553787e-05, - "loss": 2.2848, - "step": 366330 - }, - { - "epoch": 0.64, - "learning_rate": 1.805735272062696e-05, - "loss": 2.3552, - "step": 366340 - }, - { - "epoch": 0.64, - "learning_rate": 1.8056480780700135e-05, - "loss": 2.3911, - "step": 366350 - }, - { - "epoch": 0.64, - "learning_rate": 1.805560884077331e-05, - "loss": 2.2975, - "step": 366360 - }, - { - "epoch": 0.64, - "learning_rate": 1.8054736900846482e-05, - "loss": 2.3226, - "step": 366370 - }, - { - "epoch": 0.64, - "learning_rate": 1.8053864960919652e-05, - "loss": 2.3752, - "step": 366380 - }, - { - "epoch": 0.64, - "learning_rate": 1.8052993020992826e-05, - "loss": 2.2751, - "step": 366390 - }, - { - "epoch": 0.64, - "learning_rate": 1.8052121081066e-05, - "loss": 2.247, - "step": 366400 - }, - { - "epoch": 0.64, - "learning_rate": 1.8051249141139174e-05, - "loss": 2.3006, - "step": 366410 - }, - { - "epoch": 0.64, - "learning_rate": 1.8050377201212344e-05, - "loss": 2.2676, - "step": 366420 - }, - { - "epoch": 0.64, - "learning_rate": 1.8049505261285518e-05, - "loss": 2.2878, - "step": 366430 - }, - { - "epoch": 0.64, - "learning_rate": 1.8048633321358692e-05, - "loss": 2.2327, - "step": 366440 - }, - { - "epoch": 0.64, - "learning_rate": 1.8047761381431865e-05, - "loss": 2.3243, - "step": 366450 - }, - { - "epoch": 0.64, - "learning_rate": 1.804688944150504e-05, - "loss": 2.2575, - "step": 366460 - }, - { - "epoch": 0.64, - "learning_rate": 1.8046017501578213e-05, - "loss": 2.3724, - "step": 366470 - }, - { - "epoch": 0.64, - "learning_rate": 1.8045145561651387e-05, - "loss": 2.3156, - "step": 366480 - }, - { - "epoch": 0.64, - "learning_rate": 1.8044273621724557e-05, - "loss": 2.2972, - "step": 366490 - }, - { - "epoch": 0.64, - "learning_rate": 1.804340168179773e-05, - "loss": 2.3457, - "step": 366500 - }, - { - "epoch": 0.64, - "learning_rate": 1.8042529741870905e-05, - "loss": 2.3348, - "step": 366510 - }, - { - "epoch": 0.64, - "learning_rate": 1.804165780194408e-05, - "loss": 2.2909, - "step": 366520 - }, - { - "epoch": 0.64, - "learning_rate": 1.8040785862017252e-05, - "loss": 2.3104, - "step": 366530 - }, - { - "epoch": 0.64, - "learning_rate": 1.8039913922090423e-05, - "loss": 2.3939, - "step": 366540 - }, - { - "epoch": 0.64, - "learning_rate": 1.80390419821636e-05, - "loss": 2.3492, - "step": 366550 - }, - { - "epoch": 0.64, - "learning_rate": 1.803817004223677e-05, - "loss": 2.4067, - "step": 366560 - }, - { - "epoch": 0.64, - "learning_rate": 1.8037298102309944e-05, - "loss": 2.2796, - "step": 366570 - }, - { - "epoch": 0.64, - "learning_rate": 1.8036426162383114e-05, - "loss": 2.2979, - "step": 366580 - }, - { - "epoch": 0.64, - "learning_rate": 1.803555422245629e-05, - "loss": 2.4105, - "step": 366590 - }, - { - "epoch": 0.64, - "learning_rate": 1.8034682282529465e-05, - "loss": 2.3129, - "step": 366600 - }, - { - "epoch": 0.64, - "learning_rate": 1.8033810342602636e-05, - "loss": 2.3748, - "step": 366610 - }, - { - "epoch": 0.64, - "learning_rate": 1.8032938402675813e-05, - "loss": 2.2936, - "step": 366620 - }, - { - "epoch": 0.64, - "learning_rate": 1.8032066462748983e-05, - "loss": 2.3588, - "step": 366630 - }, - { - "epoch": 0.64, - "learning_rate": 1.8031194522822157e-05, - "loss": 2.2269, - "step": 366640 - }, - { - "epoch": 0.64, - "learning_rate": 1.8030322582895327e-05, - "loss": 2.252, - "step": 366650 - }, - { - "epoch": 0.64, - "learning_rate": 1.8029450642968504e-05, - "loss": 2.3524, - "step": 366660 - }, - { - "epoch": 0.64, - "learning_rate": 1.8028578703041675e-05, - "loss": 2.4, - "step": 366670 - }, - { - "epoch": 0.64, - "learning_rate": 1.802770676311485e-05, - "loss": 2.2691, - "step": 366680 - }, - { - "epoch": 0.64, - "learning_rate": 1.8026834823188022e-05, - "loss": 2.3402, - "step": 366690 - }, - { - "epoch": 0.64, - "learning_rate": 1.8025962883261196e-05, - "loss": 2.2516, - "step": 366700 - }, - { - "epoch": 0.64, - "learning_rate": 1.802509094333437e-05, - "loss": 2.3277, - "step": 366710 - }, - { - "epoch": 0.64, - "learning_rate": 1.802421900340754e-05, - "loss": 2.313, - "step": 366720 - }, - { - "epoch": 0.64, - "learning_rate": 1.8023347063480717e-05, - "loss": 2.2978, - "step": 366730 - }, - { - "epoch": 0.64, - "learning_rate": 1.8022475123553888e-05, - "loss": 2.2247, - "step": 366740 - }, - { - "epoch": 0.64, - "learning_rate": 1.802160318362706e-05, - "loss": 2.3042, - "step": 366750 - }, - { - "epoch": 0.64, - "learning_rate": 1.8020731243700235e-05, - "loss": 2.2642, - "step": 366760 - }, - { - "epoch": 0.64, - "learning_rate": 1.801985930377341e-05, - "loss": 2.249, - "step": 366770 - }, - { - "epoch": 0.64, - "learning_rate": 1.8018987363846583e-05, - "loss": 2.3493, - "step": 366780 - }, - { - "epoch": 0.64, - "learning_rate": 1.8018115423919753e-05, - "loss": 2.3282, - "step": 366790 - }, - { - "epoch": 0.64, - "learning_rate": 1.8017243483992927e-05, - "loss": 2.403, - "step": 366800 - }, - { - "epoch": 0.64, - "learning_rate": 1.80163715440661e-05, - "loss": 2.259, - "step": 366810 - }, - { - "epoch": 0.64, - "learning_rate": 1.8015499604139275e-05, - "loss": 2.3331, - "step": 366820 - }, - { - "epoch": 0.64, - "learning_rate": 1.801462766421245e-05, - "loss": 2.3919, - "step": 366830 - }, - { - "epoch": 0.64, - "learning_rate": 1.801375572428562e-05, - "loss": 2.3615, - "step": 366840 - }, - { - "epoch": 0.64, - "learning_rate": 1.8012883784358796e-05, - "loss": 2.2782, - "step": 366850 - }, - { - "epoch": 0.64, - "learning_rate": 1.8012011844431966e-05, - "loss": 2.2357, - "step": 366860 - }, - { - "epoch": 0.64, - "learning_rate": 1.801113990450514e-05, - "loss": 2.3851, - "step": 366870 - }, - { - "epoch": 0.64, - "learning_rate": 1.8010267964578314e-05, - "loss": 2.2684, - "step": 366880 - }, - { - "epoch": 0.64, - "learning_rate": 1.8009396024651488e-05, - "loss": 2.3203, - "step": 366890 - }, - { - "epoch": 0.64, - "learning_rate": 1.8008524084724658e-05, - "loss": 2.3701, - "step": 366900 - }, - { - "epoch": 0.64, - "learning_rate": 1.8007652144797832e-05, - "loss": 2.2405, - "step": 366910 - }, - { - "epoch": 0.64, - "learning_rate": 1.8006780204871006e-05, - "loss": 2.3398, - "step": 366920 - }, - { - "epoch": 0.64, - "learning_rate": 1.800590826494418e-05, - "loss": 2.299, - "step": 366930 - }, - { - "epoch": 0.64, - "learning_rate": 1.8005036325017353e-05, - "loss": 2.3422, - "step": 366940 - }, - { - "epoch": 0.64, - "learning_rate": 1.8004164385090523e-05, - "loss": 2.2719, - "step": 366950 - }, - { - "epoch": 0.64, - "learning_rate": 1.80032924451637e-05, - "loss": 2.306, - "step": 366960 - }, - { - "epoch": 0.64, - "learning_rate": 1.800242050523687e-05, - "loss": 2.3691, - "step": 366970 - }, - { - "epoch": 0.64, - "learning_rate": 1.8001548565310045e-05, - "loss": 2.3415, - "step": 366980 - }, - { - "epoch": 0.64, - "learning_rate": 1.800067662538322e-05, - "loss": 2.3881, - "step": 366990 - }, - { - "epoch": 0.64, - "learning_rate": 1.7999804685456392e-05, - "loss": 2.272, - "step": 367000 - }, - { - "epoch": 0.64, - "learning_rate": 1.7998932745529566e-05, - "loss": 2.3458, - "step": 367010 - }, - { - "epoch": 0.64, - "learning_rate": 1.7998060805602736e-05, - "loss": 2.3743, - "step": 367020 - }, - { - "epoch": 0.64, - "learning_rate": 1.7997188865675914e-05, - "loss": 2.2767, - "step": 367030 - }, - { - "epoch": 0.64, - "learning_rate": 1.7996316925749084e-05, - "loss": 2.3521, - "step": 367040 - }, - { - "epoch": 0.64, - "learning_rate": 1.7995444985822258e-05, - "loss": 2.362, - "step": 367050 - }, - { - "epoch": 0.64, - "learning_rate": 1.7994573045895428e-05, - "loss": 2.4004, - "step": 367060 - }, - { - "epoch": 0.64, - "learning_rate": 1.7993701105968605e-05, - "loss": 2.254, - "step": 367070 - }, - { - "epoch": 0.64, - "learning_rate": 1.799282916604178e-05, - "loss": 2.3756, - "step": 367080 - }, - { - "epoch": 0.64, - "learning_rate": 1.799195722611495e-05, - "loss": 2.2689, - "step": 367090 - }, - { - "epoch": 0.64, - "learning_rate": 1.7991085286188123e-05, - "loss": 2.3543, - "step": 367100 - }, - { - "epoch": 0.64, - "learning_rate": 1.7990213346261297e-05, - "loss": 2.3548, - "step": 367110 - }, - { - "epoch": 0.64, - "learning_rate": 1.798934140633447e-05, - "loss": 2.1875, - "step": 367120 - }, - { - "epoch": 0.64, - "learning_rate": 1.798846946640764e-05, - "loss": 2.257, - "step": 367130 - }, - { - "epoch": 0.64, - "learning_rate": 1.798759752648082e-05, - "loss": 2.2737, - "step": 367140 - }, - { - "epoch": 0.64, - "learning_rate": 1.798672558655399e-05, - "loss": 2.3268, - "step": 367150 - }, - { - "epoch": 0.64, - "learning_rate": 1.7985853646627162e-05, - "loss": 2.2289, - "step": 367160 - }, - { - "epoch": 0.64, - "learning_rate": 1.7984981706700336e-05, - "loss": 2.3061, - "step": 367170 - }, - { - "epoch": 0.64, - "learning_rate": 1.798410976677351e-05, - "loss": 2.29, - "step": 367180 - }, - { - "epoch": 0.64, - "learning_rate": 1.7983237826846684e-05, - "loss": 2.2574, - "step": 367190 - }, - { - "epoch": 0.64, - "learning_rate": 1.7982365886919854e-05, - "loss": 2.3941, - "step": 367200 - }, - { - "epoch": 0.64, - "learning_rate": 1.7981493946993028e-05, - "loss": 2.3758, - "step": 367210 - }, - { - "epoch": 0.64, - "learning_rate": 1.7980622007066202e-05, - "loss": 2.2931, - "step": 367220 - }, - { - "epoch": 0.64, - "learning_rate": 1.7979750067139375e-05, - "loss": 2.3633, - "step": 367230 - }, - { - "epoch": 0.64, - "learning_rate": 1.797887812721255e-05, - "loss": 2.287, - "step": 367240 - }, - { - "epoch": 0.64, - "learning_rate": 1.797800618728572e-05, - "loss": 2.3715, - "step": 367250 - }, - { - "epoch": 0.64, - "learning_rate": 1.7977134247358897e-05, - "loss": 2.3147, - "step": 367260 - }, - { - "epoch": 0.64, - "learning_rate": 1.7976262307432067e-05, - "loss": 2.2337, - "step": 367270 - }, - { - "epoch": 0.64, - "learning_rate": 1.797539036750524e-05, - "loss": 2.3572, - "step": 367280 - }, - { - "epoch": 0.64, - "learning_rate": 1.7974518427578415e-05, - "loss": 2.2335, - "step": 367290 - }, - { - "epoch": 0.64, - "learning_rate": 1.797364648765159e-05, - "loss": 2.358, - "step": 367300 - }, - { - "epoch": 0.64, - "learning_rate": 1.797277454772476e-05, - "loss": 2.3659, - "step": 367310 - }, - { - "epoch": 0.64, - "learning_rate": 1.7971902607797933e-05, - "loss": 2.3677, - "step": 367320 - }, - { - "epoch": 0.64, - "learning_rate": 1.797103066787111e-05, - "loss": 2.2867, - "step": 367330 - }, - { - "epoch": 0.64, - "learning_rate": 1.797015872794428e-05, - "loss": 2.3042, - "step": 367340 - }, - { - "epoch": 0.64, - "learning_rate": 1.7969286788017454e-05, - "loss": 2.1841, - "step": 367350 - }, - { - "epoch": 0.64, - "learning_rate": 1.7968414848090624e-05, - "loss": 2.1709, - "step": 367360 - }, - { - "epoch": 0.64, - "learning_rate": 1.79675429081638e-05, - "loss": 2.4265, - "step": 367370 - }, - { - "epoch": 0.64, - "learning_rate": 1.7966670968236972e-05, - "loss": 2.279, - "step": 367380 - }, - { - "epoch": 0.64, - "learning_rate": 1.7965799028310146e-05, - "loss": 2.3271, - "step": 367390 - }, - { - "epoch": 0.64, - "learning_rate": 1.796492708838332e-05, - "loss": 2.3749, - "step": 367400 - }, - { - "epoch": 0.64, - "learning_rate": 1.7964055148456493e-05, - "loss": 2.3127, - "step": 367410 - }, - { - "epoch": 0.64, - "learning_rate": 1.7963183208529667e-05, - "loss": 2.168, - "step": 367420 - }, - { - "epoch": 0.64, - "learning_rate": 1.7962311268602837e-05, - "loss": 2.4241, - "step": 367430 - }, - { - "epoch": 0.64, - "learning_rate": 1.7961439328676014e-05, - "loss": 2.369, - "step": 367440 - }, - { - "epoch": 0.64, - "learning_rate": 1.7960567388749185e-05, - "loss": 2.3671, - "step": 367450 - }, - { - "epoch": 0.64, - "learning_rate": 1.795969544882236e-05, - "loss": 2.353, - "step": 367460 - }, - { - "epoch": 0.64, - "learning_rate": 1.7958823508895532e-05, - "loss": 2.229, - "step": 367470 - }, - { - "epoch": 0.64, - "learning_rate": 1.7957951568968706e-05, - "loss": 2.4086, - "step": 367480 - }, - { - "epoch": 0.64, - "learning_rate": 1.795707962904188e-05, - "loss": 2.2235, - "step": 367490 - }, - { - "epoch": 0.64, - "learning_rate": 1.795620768911505e-05, - "loss": 2.257, - "step": 367500 - }, - { - "epoch": 0.64, - "learning_rate": 1.7955335749188224e-05, - "loss": 2.253, - "step": 367510 - }, - { - "epoch": 0.64, - "learning_rate": 1.7954463809261398e-05, - "loss": 2.3455, - "step": 367520 - }, - { - "epoch": 0.64, - "learning_rate": 1.795359186933457e-05, - "loss": 2.2418, - "step": 367530 - }, - { - "epoch": 0.64, - "learning_rate": 1.7952719929407742e-05, - "loss": 2.3326, - "step": 367540 - }, - { - "epoch": 0.64, - "learning_rate": 1.795184798948092e-05, - "loss": 2.3227, - "step": 367550 - }, - { - "epoch": 0.64, - "learning_rate": 1.7950976049554093e-05, - "loss": 2.4294, - "step": 367560 - }, - { - "epoch": 0.64, - "learning_rate": 1.7950104109627263e-05, - "loss": 2.262, - "step": 367570 - }, - { - "epoch": 0.64, - "learning_rate": 1.7949232169700437e-05, - "loss": 2.2688, - "step": 367580 - }, - { - "epoch": 0.64, - "learning_rate": 1.794836022977361e-05, - "loss": 2.3297, - "step": 367590 - }, - { - "epoch": 0.64, - "learning_rate": 1.7947488289846785e-05, - "loss": 2.3365, - "step": 367600 - }, - { - "epoch": 0.64, - "learning_rate": 1.7946616349919955e-05, - "loss": 2.2786, - "step": 367610 - }, - { - "epoch": 0.64, - "learning_rate": 1.794574440999313e-05, - "loss": 2.3415, - "step": 367620 - }, - { - "epoch": 0.64, - "learning_rate": 1.7944872470066303e-05, - "loss": 2.3366, - "step": 367630 - }, - { - "epoch": 0.64, - "learning_rate": 1.7944000530139476e-05, - "loss": 2.3095, - "step": 367640 - }, - { - "epoch": 0.64, - "learning_rate": 1.794312859021265e-05, - "loss": 2.3437, - "step": 367650 - }, - { - "epoch": 0.64, - "learning_rate": 1.7942256650285824e-05, - "loss": 2.3398, - "step": 367660 - }, - { - "epoch": 0.64, - "learning_rate": 1.7941384710358998e-05, - "loss": 2.3077, - "step": 367670 - }, - { - "epoch": 0.64, - "learning_rate": 1.7940512770432168e-05, - "loss": 2.3164, - "step": 367680 - }, - { - "epoch": 0.64, - "learning_rate": 1.7939640830505342e-05, - "loss": 2.286, - "step": 367690 - }, - { - "epoch": 0.64, - "learning_rate": 1.7938768890578516e-05, - "loss": 2.3361, - "step": 367700 - }, - { - "epoch": 0.64, - "learning_rate": 1.793789695065169e-05, - "loss": 2.346, - "step": 367710 - }, - { - "epoch": 0.64, - "learning_rate": 1.7937025010724863e-05, - "loss": 2.286, - "step": 367720 - }, - { - "epoch": 0.64, - "learning_rate": 1.7936153070798033e-05, - "loss": 2.3006, - "step": 367730 - }, - { - "epoch": 0.64, - "learning_rate": 1.793528113087121e-05, - "loss": 2.3208, - "step": 367740 - }, - { - "epoch": 0.64, - "learning_rate": 1.793440919094438e-05, - "loss": 2.2563, - "step": 367750 - }, - { - "epoch": 0.64, - "learning_rate": 1.7933537251017555e-05, - "loss": 2.3289, - "step": 367760 - }, - { - "epoch": 0.64, - "learning_rate": 1.7932665311090725e-05, - "loss": 2.3873, - "step": 367770 - }, - { - "epoch": 0.64, - "learning_rate": 1.7931793371163902e-05, - "loss": 2.3812, - "step": 367780 - }, - { - "epoch": 0.64, - "learning_rate": 1.7930921431237073e-05, - "loss": 2.1399, - "step": 367790 - }, - { - "epoch": 0.64, - "learning_rate": 1.7930049491310246e-05, - "loss": 2.3676, - "step": 367800 - }, - { - "epoch": 0.64, - "learning_rate": 1.7929177551383424e-05, - "loss": 2.3703, - "step": 367810 - }, - { - "epoch": 0.64, - "learning_rate": 1.7928305611456594e-05, - "loss": 2.2461, - "step": 367820 - }, - { - "epoch": 0.64, - "learning_rate": 1.7927433671529768e-05, - "loss": 2.4244, - "step": 367830 - }, - { - "epoch": 0.64, - "learning_rate": 1.7926561731602938e-05, - "loss": 2.3608, - "step": 367840 - }, - { - "epoch": 0.64, - "learning_rate": 1.7925689791676115e-05, - "loss": 2.1651, - "step": 367850 - }, - { - "epoch": 0.64, - "learning_rate": 1.7924817851749286e-05, - "loss": 2.1991, - "step": 367860 - }, - { - "epoch": 0.64, - "learning_rate": 1.792394591182246e-05, - "loss": 2.3632, - "step": 367870 - }, - { - "epoch": 0.64, - "learning_rate": 1.7923073971895633e-05, - "loss": 2.3254, - "step": 367880 - }, - { - "epoch": 0.64, - "learning_rate": 1.7922202031968807e-05, - "loss": 2.3457, - "step": 367890 - }, - { - "epoch": 0.64, - "learning_rate": 1.792133009204198e-05, - "loss": 2.456, - "step": 367900 - }, - { - "epoch": 0.64, - "learning_rate": 1.792045815211515e-05, - "loss": 2.3348, - "step": 367910 - }, - { - "epoch": 0.64, - "learning_rate": 1.7919586212188325e-05, - "loss": 2.2944, - "step": 367920 - }, - { - "epoch": 0.64, - "learning_rate": 1.79187142722615e-05, - "loss": 2.3344, - "step": 367930 - }, - { - "epoch": 0.64, - "learning_rate": 1.7917842332334672e-05, - "loss": 2.3258, - "step": 367940 - }, - { - "epoch": 0.64, - "learning_rate": 1.7916970392407846e-05, - "loss": 2.3802, - "step": 367950 - }, - { - "epoch": 0.64, - "learning_rate": 1.791609845248102e-05, - "loss": 2.3447, - "step": 367960 - }, - { - "epoch": 0.64, - "learning_rate": 1.7915226512554194e-05, - "loss": 2.42, - "step": 367970 - }, - { - "epoch": 0.64, - "learning_rate": 1.7914354572627364e-05, - "loss": 2.3699, - "step": 367980 - }, - { - "epoch": 0.64, - "learning_rate": 1.7913482632700538e-05, - "loss": 2.3382, - "step": 367990 - }, - { - "epoch": 0.64, - "learning_rate": 1.7912610692773712e-05, - "loss": 2.3039, - "step": 368000 - }, - { - "epoch": 0.64, - "learning_rate": 1.7911738752846885e-05, - "loss": 2.3909, - "step": 368010 - }, - { - "epoch": 0.64, - "learning_rate": 1.7910866812920056e-05, - "loss": 2.2862, - "step": 368020 - }, - { - "epoch": 0.64, - "learning_rate": 1.790999487299323e-05, - "loss": 2.312, - "step": 368030 - }, - { - "epoch": 0.64, - "learning_rate": 1.7909122933066403e-05, - "loss": 2.3084, - "step": 368040 - }, - { - "epoch": 0.64, - "learning_rate": 1.7908250993139577e-05, - "loss": 2.3159, - "step": 368050 - }, - { - "epoch": 0.64, - "learning_rate": 1.790737905321275e-05, - "loss": 2.3951, - "step": 368060 - }, - { - "epoch": 0.64, - "learning_rate": 1.7906507113285925e-05, - "loss": 2.2927, - "step": 368070 - }, - { - "epoch": 0.64, - "learning_rate": 1.79056351733591e-05, - "loss": 2.2806, - "step": 368080 - }, - { - "epoch": 0.64, - "learning_rate": 1.790476323343227e-05, - "loss": 2.2613, - "step": 368090 - }, - { - "epoch": 0.64, - "learning_rate": 1.7903891293505443e-05, - "loss": 2.378, - "step": 368100 - }, - { - "epoch": 0.64, - "learning_rate": 1.7903019353578616e-05, - "loss": 2.1855, - "step": 368110 - }, - { - "epoch": 0.64, - "learning_rate": 1.790214741365179e-05, - "loss": 2.3562, - "step": 368120 - }, - { - "epoch": 0.64, - "learning_rate": 1.7901275473724964e-05, - "loss": 2.235, - "step": 368130 - }, - { - "epoch": 0.64, - "learning_rate": 1.7900403533798134e-05, - "loss": 2.2346, - "step": 368140 - }, - { - "epoch": 0.64, - "learning_rate": 1.789953159387131e-05, - "loss": 2.325, - "step": 368150 - }, - { - "epoch": 0.64, - "learning_rate": 1.7898659653944482e-05, - "loss": 2.3711, - "step": 368160 - }, - { - "epoch": 0.64, - "learning_rate": 1.7897787714017656e-05, - "loss": 2.3881, - "step": 368170 - }, - { - "epoch": 0.64, - "learning_rate": 1.789691577409083e-05, - "loss": 2.3227, - "step": 368180 - }, - { - "epoch": 0.64, - "learning_rate": 1.7896043834164003e-05, - "loss": 2.3164, - "step": 368190 - }, - { - "epoch": 0.64, - "learning_rate": 1.7895171894237177e-05, - "loss": 2.2621, - "step": 368200 - }, - { - "epoch": 0.64, - "learning_rate": 1.7894299954310347e-05, - "loss": 2.3882, - "step": 368210 - }, - { - "epoch": 0.64, - "learning_rate": 1.7893428014383524e-05, - "loss": 2.4207, - "step": 368220 - }, - { - "epoch": 0.64, - "learning_rate": 1.7892556074456695e-05, - "loss": 2.3441, - "step": 368230 - }, - { - "epoch": 0.64, - "learning_rate": 1.789168413452987e-05, - "loss": 2.2926, - "step": 368240 - }, - { - "epoch": 0.64, - "learning_rate": 1.789081219460304e-05, - "loss": 2.2808, - "step": 368250 - }, - { - "epoch": 0.64, - "learning_rate": 1.7889940254676216e-05, - "loss": 2.3045, - "step": 368260 - }, - { - "epoch": 0.64, - "learning_rate": 1.7889068314749387e-05, - "loss": 2.2529, - "step": 368270 - }, - { - "epoch": 0.64, - "learning_rate": 1.788819637482256e-05, - "loss": 2.2644, - "step": 368280 - }, - { - "epoch": 0.64, - "learning_rate": 1.7887324434895734e-05, - "loss": 2.4422, - "step": 368290 - }, - { - "epoch": 0.64, - "learning_rate": 1.7886452494968908e-05, - "loss": 2.2784, - "step": 368300 - }, - { - "epoch": 0.64, - "learning_rate": 1.788558055504208e-05, - "loss": 2.36, - "step": 368310 - }, - { - "epoch": 0.64, - "learning_rate": 1.7884708615115252e-05, - "loss": 2.332, - "step": 368320 - }, - { - "epoch": 0.64, - "learning_rate": 1.788383667518843e-05, - "loss": 2.3854, - "step": 368330 - }, - { - "epoch": 0.64, - "learning_rate": 1.78829647352616e-05, - "loss": 2.3409, - "step": 368340 - }, - { - "epoch": 0.64, - "learning_rate": 1.7882092795334773e-05, - "loss": 2.2649, - "step": 368350 - }, - { - "epoch": 0.64, - "learning_rate": 1.7881220855407947e-05, - "loss": 2.2047, - "step": 368360 - }, - { - "epoch": 0.64, - "learning_rate": 1.788034891548112e-05, - "loss": 2.318, - "step": 368370 - }, - { - "epoch": 0.64, - "learning_rate": 1.7879476975554295e-05, - "loss": 2.4245, - "step": 368380 - }, - { - "epoch": 0.64, - "learning_rate": 1.7878605035627465e-05, - "loss": 2.3921, - "step": 368390 - }, - { - "epoch": 0.64, - "learning_rate": 1.787773309570064e-05, - "loss": 2.3492, - "step": 368400 - }, - { - "epoch": 0.64, - "learning_rate": 1.7876861155773813e-05, - "loss": 2.211, - "step": 368410 - }, - { - "epoch": 0.64, - "learning_rate": 1.7875989215846986e-05, - "loss": 2.2346, - "step": 368420 - }, - { - "epoch": 0.64, - "learning_rate": 1.787511727592016e-05, - "loss": 2.4325, - "step": 368430 - }, - { - "epoch": 0.64, - "learning_rate": 1.787424533599333e-05, - "loss": 2.264, - "step": 368440 - }, - { - "epoch": 0.64, - "learning_rate": 1.7873373396066508e-05, - "loss": 2.2759, - "step": 368450 - }, - { - "epoch": 0.64, - "learning_rate": 1.7872501456139678e-05, - "loss": 2.3691, - "step": 368460 - }, - { - "epoch": 0.64, - "learning_rate": 1.7871629516212852e-05, - "loss": 2.3228, - "step": 368470 - }, - { - "epoch": 0.64, - "learning_rate": 1.7870757576286026e-05, - "loss": 2.3104, - "step": 368480 - }, - { - "epoch": 0.64, - "learning_rate": 1.78698856363592e-05, - "loss": 2.2349, - "step": 368490 - }, - { - "epoch": 0.64, - "learning_rate": 1.786901369643237e-05, - "loss": 2.3386, - "step": 368500 - }, - { - "epoch": 0.64, - "learning_rate": 1.7868141756505543e-05, - "loss": 2.2408, - "step": 368510 - }, - { - "epoch": 0.64, - "learning_rate": 1.7867269816578717e-05, - "loss": 2.2836, - "step": 368520 - }, - { - "epoch": 0.64, - "learning_rate": 1.786639787665189e-05, - "loss": 2.3632, - "step": 368530 - }, - { - "epoch": 0.64, - "learning_rate": 1.7865525936725065e-05, - "loss": 2.3333, - "step": 368540 - }, - { - "epoch": 0.64, - "learning_rate": 1.7864653996798235e-05, - "loss": 2.2414, - "step": 368550 - }, - { - "epoch": 0.64, - "learning_rate": 1.7863782056871412e-05, - "loss": 2.2204, - "step": 368560 - }, - { - "epoch": 0.64, - "learning_rate": 1.7862910116944583e-05, - "loss": 2.322, - "step": 368570 - }, - { - "epoch": 0.64, - "learning_rate": 1.7862038177017756e-05, - "loss": 2.2235, - "step": 368580 - }, - { - "epoch": 0.64, - "learning_rate": 1.786116623709093e-05, - "loss": 2.3417, - "step": 368590 - }, - { - "epoch": 0.64, - "learning_rate": 1.7860294297164104e-05, - "loss": 2.2092, - "step": 368600 - }, - { - "epoch": 0.64, - "learning_rate": 1.7859422357237278e-05, - "loss": 2.2998, - "step": 368610 - }, - { - "epoch": 0.64, - "learning_rate": 1.7858550417310448e-05, - "loss": 2.2887, - "step": 368620 - }, - { - "epoch": 0.64, - "learning_rate": 1.7857678477383625e-05, - "loss": 2.4211, - "step": 368630 - }, - { - "epoch": 0.64, - "learning_rate": 1.7856806537456796e-05, - "loss": 2.3275, - "step": 368640 - }, - { - "epoch": 0.64, - "learning_rate": 1.785593459752997e-05, - "loss": 2.3667, - "step": 368650 - }, - { - "epoch": 0.64, - "learning_rate": 1.785506265760314e-05, - "loss": 2.2972, - "step": 368660 - }, - { - "epoch": 0.64, - "learning_rate": 1.7854190717676317e-05, - "loss": 2.3442, - "step": 368670 - }, - { - "epoch": 0.64, - "learning_rate": 1.785331877774949e-05, - "loss": 2.3916, - "step": 368680 - }, - { - "epoch": 0.64, - "learning_rate": 1.785244683782266e-05, - "loss": 2.3442, - "step": 368690 - }, - { - "epoch": 0.64, - "learning_rate": 1.7851574897895835e-05, - "loss": 2.3497, - "step": 368700 - }, - { - "epoch": 0.64, - "learning_rate": 1.785070295796901e-05, - "loss": 2.2394, - "step": 368710 - }, - { - "epoch": 0.64, - "learning_rate": 1.7849831018042182e-05, - "loss": 2.3626, - "step": 368720 - }, - { - "epoch": 0.64, - "learning_rate": 1.7848959078115353e-05, - "loss": 2.3445, - "step": 368730 - }, - { - "epoch": 0.64, - "learning_rate": 1.784808713818853e-05, - "loss": 2.3113, - "step": 368740 - }, - { - "epoch": 0.64, - "learning_rate": 1.78472151982617e-05, - "loss": 2.3132, - "step": 368750 - }, - { - "epoch": 0.64, - "learning_rate": 1.7846343258334874e-05, - "loss": 2.3148, - "step": 368760 - }, - { - "epoch": 0.64, - "learning_rate": 1.7845471318408048e-05, - "loss": 2.402, - "step": 368770 - }, - { - "epoch": 0.64, - "learning_rate": 1.7844599378481222e-05, - "loss": 2.369, - "step": 368780 - }, - { - "epoch": 0.64, - "learning_rate": 1.7843727438554395e-05, - "loss": 2.2295, - "step": 368790 - }, - { - "epoch": 0.64, - "learning_rate": 1.7842855498627566e-05, - "loss": 2.3758, - "step": 368800 - }, - { - "epoch": 0.64, - "learning_rate": 1.784198355870074e-05, - "loss": 2.2951, - "step": 368810 - }, - { - "epoch": 0.64, - "learning_rate": 1.7841111618773913e-05, - "loss": 2.4163, - "step": 368820 - }, - { - "epoch": 0.64, - "learning_rate": 1.7840239678847087e-05, - "loss": 2.2301, - "step": 368830 - }, - { - "epoch": 0.64, - "learning_rate": 1.783936773892026e-05, - "loss": 2.1994, - "step": 368840 - }, - { - "epoch": 0.64, - "learning_rate": 1.783849579899343e-05, - "loss": 2.3791, - "step": 368850 - }, - { - "epoch": 0.64, - "learning_rate": 1.783762385906661e-05, - "loss": 2.3319, - "step": 368860 - }, - { - "epoch": 0.64, - "learning_rate": 1.783675191913978e-05, - "loss": 2.3782, - "step": 368870 - }, - { - "epoch": 0.64, - "learning_rate": 1.7835879979212953e-05, - "loss": 2.3813, - "step": 368880 - }, - { - "epoch": 0.64, - "learning_rate": 1.7835008039286126e-05, - "loss": 2.3615, - "step": 368890 - }, - { - "epoch": 0.64, - "learning_rate": 1.78341360993593e-05, - "loss": 2.4141, - "step": 368900 - }, - { - "epoch": 0.64, - "learning_rate": 1.7833264159432474e-05, - "loss": 2.3158, - "step": 368910 - }, - { - "epoch": 0.64, - "learning_rate": 1.7832392219505644e-05, - "loss": 2.4034, - "step": 368920 - }, - { - "epoch": 0.64, - "learning_rate": 1.783152027957882e-05, - "loss": 2.3277, - "step": 368930 - }, - { - "epoch": 0.64, - "learning_rate": 1.7830648339651992e-05, - "loss": 2.4612, - "step": 368940 - }, - { - "epoch": 0.64, - "learning_rate": 1.7829776399725166e-05, - "loss": 2.4041, - "step": 368950 - }, - { - "epoch": 0.64, - "learning_rate": 1.7828904459798336e-05, - "loss": 2.3308, - "step": 368960 - }, - { - "epoch": 0.64, - "learning_rate": 1.7828032519871513e-05, - "loss": 2.363, - "step": 368970 - }, - { - "epoch": 0.64, - "learning_rate": 1.7827160579944684e-05, - "loss": 2.3721, - "step": 368980 - }, - { - "epoch": 0.64, - "learning_rate": 1.7826288640017857e-05, - "loss": 2.3667, - "step": 368990 - }, - { - "epoch": 0.64, - "learning_rate": 1.782541670009103e-05, - "loss": 2.4719, - "step": 369000 - }, - { - "epoch": 0.64, - "learning_rate": 1.7824544760164205e-05, - "loss": 2.36, - "step": 369010 - }, - { - "epoch": 0.64, - "learning_rate": 1.782367282023738e-05, - "loss": 2.4146, - "step": 369020 - }, - { - "epoch": 0.64, - "learning_rate": 1.782280088031055e-05, - "loss": 2.3774, - "step": 369030 - }, - { - "epoch": 0.64, - "learning_rate": 1.7821928940383726e-05, - "loss": 2.4443, - "step": 369040 - }, - { - "epoch": 0.64, - "learning_rate": 1.7821057000456897e-05, - "loss": 2.326, - "step": 369050 - }, - { - "epoch": 0.64, - "learning_rate": 1.782018506053007e-05, - "loss": 2.2697, - "step": 369060 - }, - { - "epoch": 0.64, - "learning_rate": 1.7819313120603244e-05, - "loss": 2.4126, - "step": 369070 - }, - { - "epoch": 0.64, - "learning_rate": 1.7818441180676418e-05, - "loss": 2.2164, - "step": 369080 - }, - { - "epoch": 0.64, - "learning_rate": 1.781756924074959e-05, - "loss": 2.2859, - "step": 369090 - }, - { - "epoch": 0.64, - "learning_rate": 1.7816697300822762e-05, - "loss": 2.3145, - "step": 369100 - }, - { - "epoch": 0.64, - "learning_rate": 1.7815825360895936e-05, - "loss": 2.3207, - "step": 369110 - }, - { - "epoch": 0.64, - "learning_rate": 1.781495342096911e-05, - "loss": 2.4036, - "step": 369120 - }, - { - "epoch": 0.64, - "learning_rate": 1.7814081481042283e-05, - "loss": 2.3486, - "step": 369130 - }, - { - "epoch": 0.64, - "learning_rate": 1.7813209541115454e-05, - "loss": 2.2428, - "step": 369140 - }, - { - "epoch": 0.64, - "learning_rate": 1.781233760118863e-05, - "loss": 2.2797, - "step": 369150 - }, - { - "epoch": 0.64, - "learning_rate": 1.7811465661261805e-05, - "loss": 2.2507, - "step": 369160 - }, - { - "epoch": 0.64, - "learning_rate": 1.7810593721334975e-05, - "loss": 2.2805, - "step": 369170 - }, - { - "epoch": 0.64, - "learning_rate": 1.780972178140815e-05, - "loss": 2.2444, - "step": 369180 - }, - { - "epoch": 0.64, - "learning_rate": 1.7808849841481323e-05, - "loss": 2.1706, - "step": 369190 - }, - { - "epoch": 0.64, - "learning_rate": 1.7807977901554496e-05, - "loss": 2.2623, - "step": 369200 - }, - { - "epoch": 0.64, - "learning_rate": 1.7807105961627667e-05, - "loss": 2.1896, - "step": 369210 - }, - { - "epoch": 0.64, - "learning_rate": 1.780623402170084e-05, - "loss": 2.3336, - "step": 369220 - }, - { - "epoch": 0.64, - "learning_rate": 1.7805362081774014e-05, - "loss": 2.2889, - "step": 369230 - }, - { - "epoch": 0.64, - "learning_rate": 1.7804490141847188e-05, - "loss": 2.3541, - "step": 369240 - }, - { - "epoch": 0.64, - "learning_rate": 1.7803618201920362e-05, - "loss": 2.2982, - "step": 369250 - }, - { - "epoch": 0.64, - "learning_rate": 1.7802746261993536e-05, - "loss": 2.2622, - "step": 369260 - }, - { - "epoch": 0.64, - "learning_rate": 1.780187432206671e-05, - "loss": 2.2707, - "step": 369270 - }, - { - "epoch": 0.64, - "learning_rate": 1.780100238213988e-05, - "loss": 2.3084, - "step": 369280 - }, - { - "epoch": 0.64, - "learning_rate": 1.7800130442213054e-05, - "loss": 2.4211, - "step": 369290 - }, - { - "epoch": 0.64, - "learning_rate": 1.7799258502286227e-05, - "loss": 2.2738, - "step": 369300 - }, - { - "epoch": 0.64, - "learning_rate": 1.77983865623594e-05, - "loss": 2.385, - "step": 369310 - }, - { - "epoch": 0.64, - "learning_rate": 1.7797514622432575e-05, - "loss": 2.2564, - "step": 369320 - }, - { - "epoch": 0.64, - "learning_rate": 1.7796642682505745e-05, - "loss": 2.3884, - "step": 369330 - }, - { - "epoch": 0.64, - "learning_rate": 1.7795770742578922e-05, - "loss": 2.2844, - "step": 369340 - }, - { - "epoch": 0.64, - "learning_rate": 1.7794898802652093e-05, - "loss": 2.3888, - "step": 369350 - }, - { - "epoch": 0.64, - "learning_rate": 1.7794026862725267e-05, - "loss": 2.3435, - "step": 369360 - }, - { - "epoch": 0.64, - "learning_rate": 1.7793154922798437e-05, - "loss": 2.3638, - "step": 369370 - }, - { - "epoch": 0.64, - "learning_rate": 1.7792282982871614e-05, - "loss": 2.3414, - "step": 369380 - }, - { - "epoch": 0.64, - "learning_rate": 1.7791411042944784e-05, - "loss": 2.2875, - "step": 369390 - }, - { - "epoch": 0.64, - "learning_rate": 1.7790539103017958e-05, - "loss": 2.3827, - "step": 369400 - }, - { - "epoch": 0.64, - "learning_rate": 1.7789667163091135e-05, - "loss": 2.3168, - "step": 369410 - }, - { - "epoch": 0.64, - "learning_rate": 1.7788795223164306e-05, - "loss": 2.2211, - "step": 369420 - }, - { - "epoch": 0.64, - "learning_rate": 1.778792328323748e-05, - "loss": 2.3653, - "step": 369430 - }, - { - "epoch": 0.64, - "learning_rate": 1.778705134331065e-05, - "loss": 2.2435, - "step": 369440 - }, - { - "epoch": 0.64, - "learning_rate": 1.7786179403383827e-05, - "loss": 2.3074, - "step": 369450 - }, - { - "epoch": 0.64, - "learning_rate": 1.7785307463456997e-05, - "loss": 2.2124, - "step": 369460 - }, - { - "epoch": 0.64, - "learning_rate": 1.778443552353017e-05, - "loss": 2.2884, - "step": 369470 - }, - { - "epoch": 0.64, - "learning_rate": 1.7783563583603345e-05, - "loss": 2.347, - "step": 369480 - }, - { - "epoch": 0.64, - "learning_rate": 1.778269164367652e-05, - "loss": 2.2763, - "step": 369490 - }, - { - "epoch": 0.64, - "learning_rate": 1.7781819703749693e-05, - "loss": 2.3867, - "step": 369500 - }, - { - "epoch": 0.64, - "learning_rate": 1.7780947763822863e-05, - "loss": 2.3154, - "step": 369510 - }, - { - "epoch": 0.64, - "learning_rate": 1.778007582389604e-05, - "loss": 2.3286, - "step": 369520 - }, - { - "epoch": 0.64, - "learning_rate": 1.777920388396921e-05, - "loss": 2.2546, - "step": 369530 - }, - { - "epoch": 0.64, - "learning_rate": 1.7778331944042384e-05, - "loss": 2.2882, - "step": 369540 - }, - { - "epoch": 0.64, - "learning_rate": 1.7777460004115558e-05, - "loss": 2.3391, - "step": 369550 - }, - { - "epoch": 0.64, - "learning_rate": 1.7776588064188732e-05, - "loss": 2.2383, - "step": 369560 - }, - { - "epoch": 0.64, - "learning_rate": 1.7775716124261906e-05, - "loss": 2.3395, - "step": 369570 - }, - { - "epoch": 0.64, - "learning_rate": 1.7774844184335076e-05, - "loss": 2.2882, - "step": 369580 - }, - { - "epoch": 0.64, - "learning_rate": 1.777397224440825e-05, - "loss": 2.4327, - "step": 369590 - }, - { - "epoch": 0.64, - "learning_rate": 1.7773100304481423e-05, - "loss": 2.3689, - "step": 369600 - }, - { - "epoch": 0.64, - "learning_rate": 1.7772228364554597e-05, - "loss": 2.3834, - "step": 369610 - }, - { - "epoch": 0.64, - "learning_rate": 1.7771356424627768e-05, - "loss": 2.2051, - "step": 369620 - }, - { - "epoch": 0.64, - "learning_rate": 1.777048448470094e-05, - "loss": 2.2881, - "step": 369630 - }, - { - "epoch": 0.64, - "learning_rate": 1.776961254477412e-05, - "loss": 2.3591, - "step": 369640 - }, - { - "epoch": 0.64, - "learning_rate": 1.776874060484729e-05, - "loss": 2.3073, - "step": 369650 - }, - { - "epoch": 0.64, - "learning_rate": 1.7767868664920463e-05, - "loss": 2.2239, - "step": 369660 - }, - { - "epoch": 0.64, - "learning_rate": 1.7766996724993636e-05, - "loss": 2.2545, - "step": 369670 - }, - { - "epoch": 0.64, - "learning_rate": 1.776612478506681e-05, - "loss": 2.3264, - "step": 369680 - }, - { - "epoch": 0.64, - "learning_rate": 1.776525284513998e-05, - "loss": 2.3352, - "step": 369690 - }, - { - "epoch": 0.64, - "learning_rate": 1.7764380905213154e-05, - "loss": 2.2401, - "step": 369700 - }, - { - "epoch": 0.64, - "learning_rate": 1.7763508965286328e-05, - "loss": 2.2319, - "step": 369710 - }, - { - "epoch": 0.64, - "learning_rate": 1.7762637025359502e-05, - "loss": 2.2851, - "step": 369720 - }, - { - "epoch": 0.64, - "learning_rate": 1.7761765085432676e-05, - "loss": 2.2507, - "step": 369730 - }, - { - "epoch": 0.64, - "learning_rate": 1.7760893145505846e-05, - "loss": 2.3865, - "step": 369740 - }, - { - "epoch": 0.64, - "learning_rate": 1.7760021205579023e-05, - "loss": 2.2771, - "step": 369750 - }, - { - "epoch": 0.64, - "learning_rate": 1.7759149265652194e-05, - "loss": 2.3587, - "step": 369760 - }, - { - "epoch": 0.64, - "learning_rate": 1.7758277325725367e-05, - "loss": 2.2979, - "step": 369770 - }, - { - "epoch": 0.64, - "learning_rate": 1.775740538579854e-05, - "loss": 2.2304, - "step": 369780 - }, - { - "epoch": 0.64, - "learning_rate": 1.7756533445871715e-05, - "loss": 2.3358, - "step": 369790 - }, - { - "epoch": 0.64, - "learning_rate": 1.775566150594489e-05, - "loss": 2.2538, - "step": 369800 - }, - { - "epoch": 0.64, - "learning_rate": 1.775478956601806e-05, - "loss": 2.3843, - "step": 369810 - }, - { - "epoch": 0.64, - "learning_rate": 1.7753917626091236e-05, - "loss": 2.4124, - "step": 369820 - }, - { - "epoch": 0.64, - "learning_rate": 1.7753045686164407e-05, - "loss": 2.2591, - "step": 369830 - }, - { - "epoch": 0.64, - "learning_rate": 1.775217374623758e-05, - "loss": 2.4166, - "step": 369840 - }, - { - "epoch": 0.64, - "learning_rate": 1.775130180631075e-05, - "loss": 2.3105, - "step": 369850 - }, - { - "epoch": 0.64, - "learning_rate": 1.7750429866383928e-05, - "loss": 2.3787, - "step": 369860 - }, - { - "epoch": 0.65, - "learning_rate": 1.7749557926457098e-05, - "loss": 2.2947, - "step": 369870 - }, - { - "epoch": 0.65, - "learning_rate": 1.7748685986530272e-05, - "loss": 2.3224, - "step": 369880 - }, - { - "epoch": 0.65, - "learning_rate": 1.7747814046603446e-05, - "loss": 2.4279, - "step": 369890 - }, - { - "epoch": 0.65, - "learning_rate": 1.774694210667662e-05, - "loss": 2.329, - "step": 369900 - }, - { - "epoch": 0.65, - "learning_rate": 1.7746070166749793e-05, - "loss": 2.2247, - "step": 369910 - }, - { - "epoch": 0.65, - "learning_rate": 1.7745198226822964e-05, - "loss": 2.3777, - "step": 369920 - }, - { - "epoch": 0.65, - "learning_rate": 1.774432628689614e-05, - "loss": 2.3755, - "step": 369930 - }, - { - "epoch": 0.65, - "learning_rate": 1.774345434696931e-05, - "loss": 2.2608, - "step": 369940 - }, - { - "epoch": 0.65, - "learning_rate": 1.7742582407042485e-05, - "loss": 2.3021, - "step": 369950 - }, - { - "epoch": 0.65, - "learning_rate": 1.774171046711566e-05, - "loss": 2.2289, - "step": 369960 - }, - { - "epoch": 0.65, - "learning_rate": 1.7740838527188833e-05, - "loss": 2.2099, - "step": 369970 - }, - { - "epoch": 0.65, - "learning_rate": 1.7739966587262006e-05, - "loss": 2.26, - "step": 369980 - }, - { - "epoch": 0.65, - "learning_rate": 1.7739094647335177e-05, - "loss": 2.274, - "step": 369990 - }, - { - "epoch": 0.65, - "learning_rate": 1.773822270740835e-05, - "loss": 2.3244, - "step": 370000 - }, - { - "epoch": 0.65, - "learning_rate": 1.7737350767481524e-05, - "loss": 2.2632, - "step": 370010 - }, - { - "epoch": 0.65, - "learning_rate": 1.7736478827554698e-05, - "loss": 2.3939, - "step": 370020 - }, - { - "epoch": 0.65, - "learning_rate": 1.7735606887627872e-05, - "loss": 2.3382, - "step": 370030 - }, - { - "epoch": 0.65, - "learning_rate": 1.7734734947701042e-05, - "loss": 2.3621, - "step": 370040 - }, - { - "epoch": 0.65, - "learning_rate": 1.773386300777422e-05, - "loss": 2.2565, - "step": 370050 - }, - { - "epoch": 0.65, - "learning_rate": 1.773299106784739e-05, - "loss": 2.4254, - "step": 370060 - }, - { - "epoch": 0.65, - "learning_rate": 1.7732119127920564e-05, - "loss": 2.311, - "step": 370070 - }, - { - "epoch": 0.65, - "learning_rate": 1.7731247187993737e-05, - "loss": 2.2329, - "step": 370080 - }, - { - "epoch": 0.65, - "learning_rate": 1.773037524806691e-05, - "loss": 2.4797, - "step": 370090 - }, - { - "epoch": 0.65, - "learning_rate": 1.772950330814008e-05, - "loss": 2.3116, - "step": 370100 - }, - { - "epoch": 0.65, - "learning_rate": 1.7728631368213255e-05, - "loss": 2.3503, - "step": 370110 - }, - { - "epoch": 0.65, - "learning_rate": 1.772775942828643e-05, - "loss": 2.3393, - "step": 370120 - }, - { - "epoch": 0.65, - "learning_rate": 1.7726887488359603e-05, - "loss": 2.196, - "step": 370130 - }, - { - "epoch": 0.65, - "learning_rate": 1.7726015548432777e-05, - "loss": 2.2822, - "step": 370140 - }, - { - "epoch": 0.65, - "learning_rate": 1.7725143608505947e-05, - "loss": 2.4321, - "step": 370150 - }, - { - "epoch": 0.65, - "learning_rate": 1.7724271668579124e-05, - "loss": 2.3233, - "step": 370160 - }, - { - "epoch": 0.65, - "learning_rate": 1.7723399728652294e-05, - "loss": 2.2055, - "step": 370170 - }, - { - "epoch": 0.65, - "learning_rate": 1.7722527788725468e-05, - "loss": 2.2871, - "step": 370180 - }, - { - "epoch": 0.65, - "learning_rate": 1.7721655848798642e-05, - "loss": 2.4087, - "step": 370190 - }, - { - "epoch": 0.65, - "learning_rate": 1.7720783908871816e-05, - "loss": 2.3625, - "step": 370200 - }, - { - "epoch": 0.65, - "learning_rate": 1.771991196894499e-05, - "loss": 2.4035, - "step": 370210 - }, - { - "epoch": 0.65, - "learning_rate": 1.771904002901816e-05, - "loss": 2.2698, - "step": 370220 - }, - { - "epoch": 0.65, - "learning_rate": 1.7718168089091337e-05, - "loss": 2.388, - "step": 370230 - }, - { - "epoch": 0.65, - "learning_rate": 1.7717296149164507e-05, - "loss": 2.4066, - "step": 370240 - }, - { - "epoch": 0.65, - "learning_rate": 1.771642420923768e-05, - "loss": 2.2796, - "step": 370250 - }, - { - "epoch": 0.65, - "learning_rate": 1.7715552269310855e-05, - "loss": 2.3435, - "step": 370260 - }, - { - "epoch": 0.65, - "learning_rate": 1.771468032938403e-05, - "loss": 2.36, - "step": 370270 - }, - { - "epoch": 0.65, - "learning_rate": 1.7713808389457203e-05, - "loss": 2.3887, - "step": 370280 - }, - { - "epoch": 0.65, - "learning_rate": 1.7712936449530373e-05, - "loss": 2.2423, - "step": 370290 - }, - { - "epoch": 0.65, - "learning_rate": 1.7712064509603547e-05, - "loss": 2.3067, - "step": 370300 - }, - { - "epoch": 0.65, - "learning_rate": 1.771119256967672e-05, - "loss": 2.3575, - "step": 370310 - }, - { - "epoch": 0.65, - "learning_rate": 1.7710320629749894e-05, - "loss": 2.2633, - "step": 370320 - }, - { - "epoch": 0.65, - "learning_rate": 1.7709448689823065e-05, - "loss": 2.4374, - "step": 370330 - }, - { - "epoch": 0.65, - "learning_rate": 1.7708576749896242e-05, - "loss": 2.2198, - "step": 370340 - }, - { - "epoch": 0.65, - "learning_rate": 1.7707704809969412e-05, - "loss": 2.3312, - "step": 370350 - }, - { - "epoch": 0.65, - "learning_rate": 1.7706832870042586e-05, - "loss": 2.2861, - "step": 370360 - }, - { - "epoch": 0.65, - "learning_rate": 1.770596093011576e-05, - "loss": 2.3456, - "step": 370370 - }, - { - "epoch": 0.65, - "learning_rate": 1.7705088990188933e-05, - "loss": 2.2607, - "step": 370380 - }, - { - "epoch": 0.65, - "learning_rate": 1.7704217050262107e-05, - "loss": 2.2255, - "step": 370390 - }, - { - "epoch": 0.65, - "learning_rate": 1.7703345110335278e-05, - "loss": 2.4565, - "step": 370400 - }, - { - "epoch": 0.65, - "learning_rate": 1.770247317040845e-05, - "loss": 2.4806, - "step": 370410 - }, - { - "epoch": 0.65, - "learning_rate": 1.7701601230481625e-05, - "loss": 2.3009, - "step": 370420 - }, - { - "epoch": 0.65, - "learning_rate": 1.77007292905548e-05, - "loss": 2.2122, - "step": 370430 - }, - { - "epoch": 0.65, - "learning_rate": 1.7699857350627973e-05, - "loss": 2.4172, - "step": 370440 - }, - { - "epoch": 0.65, - "learning_rate": 1.7698985410701143e-05, - "loss": 2.2513, - "step": 370450 - }, - { - "epoch": 0.65, - "learning_rate": 1.769811347077432e-05, - "loss": 2.3113, - "step": 370460 - }, - { - "epoch": 0.65, - "learning_rate": 1.769724153084749e-05, - "loss": 2.3123, - "step": 370470 - }, - { - "epoch": 0.65, - "learning_rate": 1.7696369590920664e-05, - "loss": 2.3212, - "step": 370480 - }, - { - "epoch": 0.65, - "learning_rate": 1.7695497650993838e-05, - "loss": 2.2689, - "step": 370490 - }, - { - "epoch": 0.65, - "learning_rate": 1.7694625711067012e-05, - "loss": 2.2172, - "step": 370500 - }, - { - "epoch": 0.65, - "learning_rate": 1.7693753771140186e-05, - "loss": 2.2679, - "step": 370510 - }, - { - "epoch": 0.65, - "learning_rate": 1.7692881831213356e-05, - "loss": 2.3171, - "step": 370520 - }, - { - "epoch": 0.65, - "learning_rate": 1.7692009891286533e-05, - "loss": 2.2862, - "step": 370530 - }, - { - "epoch": 0.65, - "learning_rate": 1.7691137951359704e-05, - "loss": 2.4039, - "step": 370540 - }, - { - "epoch": 0.65, - "learning_rate": 1.7690266011432877e-05, - "loss": 2.2765, - "step": 370550 - }, - { - "epoch": 0.65, - "learning_rate": 1.7689394071506048e-05, - "loss": 2.3129, - "step": 370560 - }, - { - "epoch": 0.65, - "learning_rate": 1.7688522131579225e-05, - "loss": 2.4061, - "step": 370570 - }, - { - "epoch": 0.65, - "learning_rate": 1.7687650191652395e-05, - "loss": 2.1991, - "step": 370580 - }, - { - "epoch": 0.65, - "learning_rate": 1.768677825172557e-05, - "loss": 2.2112, - "step": 370590 - }, - { - "epoch": 0.65, - "learning_rate": 1.7685906311798743e-05, - "loss": 2.3288, - "step": 370600 - }, - { - "epoch": 0.65, - "learning_rate": 1.7685034371871917e-05, - "loss": 2.3209, - "step": 370610 - }, - { - "epoch": 0.65, - "learning_rate": 1.768416243194509e-05, - "loss": 2.3014, - "step": 370620 - }, - { - "epoch": 0.65, - "learning_rate": 1.768329049201826e-05, - "loss": 2.3462, - "step": 370630 - }, - { - "epoch": 0.65, - "learning_rate": 1.7682418552091438e-05, - "loss": 2.3546, - "step": 370640 - }, - { - "epoch": 0.65, - "learning_rate": 1.7681546612164608e-05, - "loss": 2.3164, - "step": 370650 - }, - { - "epoch": 0.65, - "learning_rate": 1.7680674672237782e-05, - "loss": 2.267, - "step": 370660 - }, - { - "epoch": 0.65, - "learning_rate": 1.7679802732310956e-05, - "loss": 2.3593, - "step": 370670 - }, - { - "epoch": 0.65, - "learning_rate": 1.767893079238413e-05, - "loss": 2.2887, - "step": 370680 - }, - { - "epoch": 0.65, - "learning_rate": 1.7678058852457303e-05, - "loss": 2.2009, - "step": 370690 - }, - { - "epoch": 0.65, - "learning_rate": 1.7677186912530474e-05, - "loss": 2.2936, - "step": 370700 - }, - { - "epoch": 0.65, - "learning_rate": 1.7676314972603648e-05, - "loss": 2.3846, - "step": 370710 - }, - { - "epoch": 0.65, - "learning_rate": 1.767544303267682e-05, - "loss": 2.3564, - "step": 370720 - }, - { - "epoch": 0.65, - "learning_rate": 1.7674571092749995e-05, - "loss": 2.3787, - "step": 370730 - }, - { - "epoch": 0.65, - "learning_rate": 1.7673699152823165e-05, - "loss": 2.2604, - "step": 370740 - }, - { - "epoch": 0.65, - "learning_rate": 1.7672827212896343e-05, - "loss": 2.2662, - "step": 370750 - }, - { - "epoch": 0.65, - "learning_rate": 1.7671955272969516e-05, - "loss": 2.3025, - "step": 370760 - }, - { - "epoch": 0.65, - "learning_rate": 1.7671083333042687e-05, - "loss": 2.1967, - "step": 370770 - }, - { - "epoch": 0.65, - "learning_rate": 1.767021139311586e-05, - "loss": 2.3038, - "step": 370780 - }, - { - "epoch": 0.65, - "learning_rate": 1.7669339453189034e-05, - "loss": 2.3484, - "step": 370790 - }, - { - "epoch": 0.65, - "learning_rate": 1.7668467513262208e-05, - "loss": 2.3774, - "step": 370800 - }, - { - "epoch": 0.65, - "learning_rate": 1.766759557333538e-05, - "loss": 2.2763, - "step": 370810 - }, - { - "epoch": 0.65, - "learning_rate": 1.7666723633408552e-05, - "loss": 2.2612, - "step": 370820 - }, - { - "epoch": 0.65, - "learning_rate": 1.7665851693481726e-05, - "loss": 2.3135, - "step": 370830 - }, - { - "epoch": 0.65, - "learning_rate": 1.76649797535549e-05, - "loss": 2.374, - "step": 370840 - }, - { - "epoch": 0.65, - "learning_rate": 1.7664107813628074e-05, - "loss": 2.3194, - "step": 370850 - }, - { - "epoch": 0.65, - "learning_rate": 1.7663235873701247e-05, - "loss": 2.3507, - "step": 370860 - }, - { - "epoch": 0.65, - "learning_rate": 1.766236393377442e-05, - "loss": 2.3134, - "step": 370870 - }, - { - "epoch": 0.65, - "learning_rate": 1.766149199384759e-05, - "loss": 2.3215, - "step": 370880 - }, - { - "epoch": 0.65, - "learning_rate": 1.7660620053920765e-05, - "loss": 2.3635, - "step": 370890 - }, - { - "epoch": 0.65, - "learning_rate": 1.765974811399394e-05, - "loss": 2.242, - "step": 370900 - }, - { - "epoch": 0.65, - "learning_rate": 1.7658876174067113e-05, - "loss": 2.3449, - "step": 370910 - }, - { - "epoch": 0.65, - "learning_rate": 1.7658004234140287e-05, - "loss": 2.3786, - "step": 370920 - }, - { - "epoch": 0.65, - "learning_rate": 1.7657132294213457e-05, - "loss": 2.278, - "step": 370930 - }, - { - "epoch": 0.65, - "learning_rate": 1.7656260354286634e-05, - "loss": 2.3438, - "step": 370940 - }, - { - "epoch": 0.65, - "learning_rate": 1.7655388414359804e-05, - "loss": 2.3442, - "step": 370950 - }, - { - "epoch": 0.65, - "learning_rate": 1.7654516474432978e-05, - "loss": 2.3106, - "step": 370960 - }, - { - "epoch": 0.65, - "learning_rate": 1.765364453450615e-05, - "loss": 2.325, - "step": 370970 - }, - { - "epoch": 0.65, - "learning_rate": 1.7652772594579326e-05, - "loss": 2.3443, - "step": 370980 - }, - { - "epoch": 0.65, - "learning_rate": 1.76519006546525e-05, - "loss": 2.1722, - "step": 370990 - }, - { - "epoch": 0.65, - "learning_rate": 1.765102871472567e-05, - "loss": 2.2283, - "step": 371000 - }, - { - "epoch": 0.65, - "learning_rate": 1.7650156774798847e-05, - "loss": 2.431, - "step": 371010 - }, - { - "epoch": 0.65, - "learning_rate": 1.7649284834872017e-05, - "loss": 2.4093, - "step": 371020 - }, - { - "epoch": 0.65, - "learning_rate": 1.764841289494519e-05, - "loss": 2.3049, - "step": 371030 - }, - { - "epoch": 0.65, - "learning_rate": 1.764754095501836e-05, - "loss": 2.3776, - "step": 371040 - }, - { - "epoch": 0.65, - "learning_rate": 1.764666901509154e-05, - "loss": 2.3385, - "step": 371050 - }, - { - "epoch": 0.65, - "learning_rate": 1.764579707516471e-05, - "loss": 2.3941, - "step": 371060 - }, - { - "epoch": 0.65, - "learning_rate": 1.7644925135237883e-05, - "loss": 2.2083, - "step": 371070 - }, - { - "epoch": 0.65, - "learning_rate": 1.7644053195311057e-05, - "loss": 2.3242, - "step": 371080 - }, - { - "epoch": 0.65, - "learning_rate": 1.764318125538423e-05, - "loss": 2.297, - "step": 371090 - }, - { - "epoch": 0.65, - "learning_rate": 1.7642309315457404e-05, - "loss": 2.3655, - "step": 371100 - }, - { - "epoch": 0.65, - "learning_rate": 1.7641437375530575e-05, - "loss": 2.1917, - "step": 371110 - }, - { - "epoch": 0.65, - "learning_rate": 1.7640565435603752e-05, - "loss": 2.2931, - "step": 371120 - }, - { - "epoch": 0.65, - "learning_rate": 1.7639693495676922e-05, - "loss": 2.3209, - "step": 371130 - }, - { - "epoch": 0.65, - "learning_rate": 1.7638821555750096e-05, - "loss": 2.2303, - "step": 371140 - }, - { - "epoch": 0.65, - "learning_rate": 1.763794961582327e-05, - "loss": 2.2936, - "step": 371150 - }, - { - "epoch": 0.65, - "learning_rate": 1.7637077675896443e-05, - "loss": 2.327, - "step": 371160 - }, - { - "epoch": 0.65, - "learning_rate": 1.7636205735969617e-05, - "loss": 2.2869, - "step": 371170 - }, - { - "epoch": 0.65, - "learning_rate": 1.7635333796042788e-05, - "loss": 2.3378, - "step": 371180 - }, - { - "epoch": 0.65, - "learning_rate": 1.763446185611596e-05, - "loss": 2.4664, - "step": 371190 - }, - { - "epoch": 0.65, - "learning_rate": 1.7633589916189135e-05, - "loss": 2.327, - "step": 371200 - }, - { - "epoch": 0.65, - "learning_rate": 1.763271797626231e-05, - "loss": 2.2822, - "step": 371210 - }, - { - "epoch": 0.65, - "learning_rate": 1.763184603633548e-05, - "loss": 2.2801, - "step": 371220 - }, - { - "epoch": 0.65, - "learning_rate": 1.7630974096408653e-05, - "loss": 2.261, - "step": 371230 - }, - { - "epoch": 0.65, - "learning_rate": 1.763010215648183e-05, - "loss": 2.2964, - "step": 371240 - }, - { - "epoch": 0.65, - "learning_rate": 1.7629230216555e-05, - "loss": 2.2874, - "step": 371250 - }, - { - "epoch": 0.65, - "learning_rate": 1.7628358276628174e-05, - "loss": 2.2124, - "step": 371260 - }, - { - "epoch": 0.65, - "learning_rate": 1.7627486336701348e-05, - "loss": 2.3527, - "step": 371270 - }, - { - "epoch": 0.65, - "learning_rate": 1.7626614396774522e-05, - "loss": 2.5046, - "step": 371280 - }, - { - "epoch": 0.65, - "learning_rate": 1.7625742456847692e-05, - "loss": 2.3006, - "step": 371290 - }, - { - "epoch": 0.65, - "learning_rate": 1.7624870516920866e-05, - "loss": 2.303, - "step": 371300 - }, - { - "epoch": 0.65, - "learning_rate": 1.762399857699404e-05, - "loss": 2.2374, - "step": 371310 - }, - { - "epoch": 0.65, - "learning_rate": 1.7623126637067214e-05, - "loss": 2.3162, - "step": 371320 - }, - { - "epoch": 0.65, - "learning_rate": 1.7622254697140387e-05, - "loss": 2.3567, - "step": 371330 - }, - { - "epoch": 0.65, - "learning_rate": 1.7621382757213558e-05, - "loss": 2.3249, - "step": 371340 - }, - { - "epoch": 0.65, - "learning_rate": 1.7620510817286735e-05, - "loss": 2.3162, - "step": 371350 - }, - { - "epoch": 0.65, - "learning_rate": 1.7619638877359905e-05, - "loss": 2.3289, - "step": 371360 - }, - { - "epoch": 0.65, - "learning_rate": 1.761876693743308e-05, - "loss": 2.3284, - "step": 371370 - }, - { - "epoch": 0.65, - "learning_rate": 1.7617894997506253e-05, - "loss": 2.2324, - "step": 371380 - }, - { - "epoch": 0.65, - "learning_rate": 1.7617023057579427e-05, - "loss": 2.2335, - "step": 371390 - }, - { - "epoch": 0.65, - "learning_rate": 1.76161511176526e-05, - "loss": 2.2398, - "step": 371400 - }, - { - "epoch": 0.65, - "learning_rate": 1.761527917772577e-05, - "loss": 2.3343, - "step": 371410 - }, - { - "epoch": 0.65, - "learning_rate": 1.7614407237798948e-05, - "loss": 2.2295, - "step": 371420 - }, - { - "epoch": 0.65, - "learning_rate": 1.7613535297872118e-05, - "loss": 2.3623, - "step": 371430 - }, - { - "epoch": 0.65, - "learning_rate": 1.7612663357945292e-05, - "loss": 2.305, - "step": 371440 - }, - { - "epoch": 0.65, - "learning_rate": 1.7611791418018462e-05, - "loss": 2.4074, - "step": 371450 - }, - { - "epoch": 0.65, - "learning_rate": 1.761091947809164e-05, - "loss": 2.2019, - "step": 371460 - }, - { - "epoch": 0.65, - "learning_rate": 1.7610047538164813e-05, - "loss": 2.3942, - "step": 371470 - }, - { - "epoch": 0.65, - "learning_rate": 1.7609175598237984e-05, - "loss": 2.3559, - "step": 371480 - }, - { - "epoch": 0.65, - "learning_rate": 1.7608303658311158e-05, - "loss": 2.3557, - "step": 371490 - }, - { - "epoch": 0.65, - "learning_rate": 1.760743171838433e-05, - "loss": 2.4407, - "step": 371500 - }, - { - "epoch": 0.65, - "learning_rate": 1.7606559778457505e-05, - "loss": 2.315, - "step": 371510 - }, - { - "epoch": 0.65, - "learning_rate": 1.7605687838530675e-05, - "loss": 2.3227, - "step": 371520 - }, - { - "epoch": 0.65, - "learning_rate": 1.7604815898603853e-05, - "loss": 2.3339, - "step": 371530 - }, - { - "epoch": 0.65, - "learning_rate": 1.7603943958677023e-05, - "loss": 2.2679, - "step": 371540 - }, - { - "epoch": 0.65, - "learning_rate": 1.7603072018750197e-05, - "loss": 2.2643, - "step": 371550 - }, - { - "epoch": 0.65, - "learning_rate": 1.760220007882337e-05, - "loss": 2.298, - "step": 371560 - }, - { - "epoch": 0.65, - "learning_rate": 1.7601328138896544e-05, - "loss": 2.2919, - "step": 371570 - }, - { - "epoch": 0.65, - "learning_rate": 1.7600456198969718e-05, - "loss": 2.2973, - "step": 371580 - }, - { - "epoch": 0.65, - "learning_rate": 1.759958425904289e-05, - "loss": 2.2101, - "step": 371590 - }, - { - "epoch": 0.65, - "learning_rate": 1.7598712319116062e-05, - "loss": 2.4638, - "step": 371600 - }, - { - "epoch": 0.65, - "learning_rate": 1.7597840379189236e-05, - "loss": 2.3596, - "step": 371610 - }, - { - "epoch": 0.65, - "learning_rate": 1.759696843926241e-05, - "loss": 2.2795, - "step": 371620 - }, - { - "epoch": 0.65, - "learning_rate": 1.7596096499335584e-05, - "loss": 2.3502, - "step": 371630 - }, - { - "epoch": 0.65, - "learning_rate": 1.7595224559408754e-05, - "loss": 2.3543, - "step": 371640 - }, - { - "epoch": 0.65, - "learning_rate": 1.759435261948193e-05, - "loss": 2.3654, - "step": 371650 - }, - { - "epoch": 0.65, - "learning_rate": 1.75934806795551e-05, - "loss": 2.3328, - "step": 371660 - }, - { - "epoch": 0.65, - "learning_rate": 1.7592608739628275e-05, - "loss": 2.2413, - "step": 371670 - }, - { - "epoch": 0.65, - "learning_rate": 1.759173679970145e-05, - "loss": 2.44, - "step": 371680 - }, - { - "epoch": 0.65, - "learning_rate": 1.7590864859774623e-05, - "loss": 2.302, - "step": 371690 - }, - { - "epoch": 0.65, - "learning_rate": 1.7589992919847793e-05, - "loss": 2.2912, - "step": 371700 - }, - { - "epoch": 0.65, - "learning_rate": 1.7589120979920967e-05, - "loss": 2.22, - "step": 371710 - }, - { - "epoch": 0.65, - "learning_rate": 1.7588249039994144e-05, - "loss": 2.3259, - "step": 371720 - }, - { - "epoch": 0.65, - "learning_rate": 1.7587377100067314e-05, - "loss": 2.3416, - "step": 371730 - }, - { - "epoch": 0.65, - "learning_rate": 1.7586505160140488e-05, - "loss": 2.3268, - "step": 371740 - }, - { - "epoch": 0.65, - "learning_rate": 1.758563322021366e-05, - "loss": 2.1969, - "step": 371750 - }, - { - "epoch": 0.65, - "learning_rate": 1.7584761280286836e-05, - "loss": 2.3818, - "step": 371760 - }, - { - "epoch": 0.65, - "learning_rate": 1.7583889340360006e-05, - "loss": 2.3673, - "step": 371770 - }, - { - "epoch": 0.65, - "learning_rate": 1.758301740043318e-05, - "loss": 2.3631, - "step": 371780 - }, - { - "epoch": 0.65, - "learning_rate": 1.7582145460506354e-05, - "loss": 2.1989, - "step": 371790 - }, - { - "epoch": 0.65, - "learning_rate": 1.7581273520579527e-05, - "loss": 2.4348, - "step": 371800 - }, - { - "epoch": 0.65, - "learning_rate": 1.75804015806527e-05, - "loss": 2.3426, - "step": 371810 - }, - { - "epoch": 0.65, - "learning_rate": 1.757952964072587e-05, - "loss": 2.3844, - "step": 371820 - }, - { - "epoch": 0.65, - "learning_rate": 1.757865770079905e-05, - "loss": 2.4072, - "step": 371830 - }, - { - "epoch": 0.65, - "learning_rate": 1.757778576087222e-05, - "loss": 2.2462, - "step": 371840 - }, - { - "epoch": 0.65, - "learning_rate": 1.7576913820945393e-05, - "loss": 2.3043, - "step": 371850 - }, - { - "epoch": 0.65, - "learning_rate": 1.7576041881018567e-05, - "loss": 2.3309, - "step": 371860 - }, - { - "epoch": 0.65, - "learning_rate": 1.757516994109174e-05, - "loss": 2.302, - "step": 371870 - }, - { - "epoch": 0.65, - "learning_rate": 1.7574298001164914e-05, - "loss": 2.2999, - "step": 371880 - }, - { - "epoch": 0.65, - "learning_rate": 1.7573426061238085e-05, - "loss": 2.1417, - "step": 371890 - }, - { - "epoch": 0.65, - "learning_rate": 1.757255412131126e-05, - "loss": 2.3544, - "step": 371900 - }, - { - "epoch": 0.65, - "learning_rate": 1.7571682181384432e-05, - "loss": 2.366, - "step": 371910 - }, - { - "epoch": 0.65, - "learning_rate": 1.7570810241457606e-05, - "loss": 2.2548, - "step": 371920 - }, - { - "epoch": 0.65, - "learning_rate": 1.7569938301530776e-05, - "loss": 2.3589, - "step": 371930 - }, - { - "epoch": 0.65, - "learning_rate": 1.7569066361603953e-05, - "loss": 2.341, - "step": 371940 - }, - { - "epoch": 0.65, - "learning_rate": 1.7568194421677124e-05, - "loss": 2.2189, - "step": 371950 - }, - { - "epoch": 0.65, - "learning_rate": 1.7567322481750298e-05, - "loss": 2.2896, - "step": 371960 - }, - { - "epoch": 0.65, - "learning_rate": 1.756645054182347e-05, - "loss": 2.2614, - "step": 371970 - }, - { - "epoch": 0.65, - "learning_rate": 1.7565578601896645e-05, - "loss": 2.3149, - "step": 371980 - }, - { - "epoch": 0.65, - "learning_rate": 1.756470666196982e-05, - "loss": 2.3862, - "step": 371990 - }, - { - "epoch": 0.65, - "learning_rate": 1.756383472204299e-05, - "loss": 2.4479, - "step": 372000 - }, - { - "epoch": 0.65, - "learning_rate": 1.7562962782116163e-05, - "loss": 2.4254, - "step": 372010 - }, - { - "epoch": 0.65, - "learning_rate": 1.7562090842189337e-05, - "loss": 2.3855, - "step": 372020 - }, - { - "epoch": 0.65, - "learning_rate": 1.756121890226251e-05, - "loss": 2.2567, - "step": 372030 - }, - { - "epoch": 0.65, - "learning_rate": 1.7560346962335684e-05, - "loss": 2.3238, - "step": 372040 - }, - { - "epoch": 0.65, - "learning_rate": 1.7559475022408858e-05, - "loss": 2.3768, - "step": 372050 - }, - { - "epoch": 0.65, - "learning_rate": 1.7558603082482032e-05, - "loss": 2.3478, - "step": 372060 - }, - { - "epoch": 0.65, - "learning_rate": 1.7557731142555202e-05, - "loss": 2.2849, - "step": 372070 - }, - { - "epoch": 0.65, - "learning_rate": 1.7556859202628376e-05, - "loss": 2.2397, - "step": 372080 - }, - { - "epoch": 0.65, - "learning_rate": 1.755598726270155e-05, - "loss": 2.3863, - "step": 372090 - }, - { - "epoch": 0.65, - "learning_rate": 1.7555115322774724e-05, - "loss": 2.3784, - "step": 372100 - }, - { - "epoch": 0.65, - "learning_rate": 1.7554243382847897e-05, - "loss": 2.3065, - "step": 372110 - }, - { - "epoch": 0.65, - "learning_rate": 1.7553371442921068e-05, - "loss": 2.2135, - "step": 372120 - }, - { - "epoch": 0.65, - "learning_rate": 1.7552499502994245e-05, - "loss": 2.3052, - "step": 372130 - }, - { - "epoch": 0.65, - "learning_rate": 1.7551627563067415e-05, - "loss": 2.3721, - "step": 372140 - }, - { - "epoch": 0.65, - "learning_rate": 1.755075562314059e-05, - "loss": 2.2691, - "step": 372150 - }, - { - "epoch": 0.65, - "learning_rate": 1.754988368321376e-05, - "loss": 2.3498, - "step": 372160 - }, - { - "epoch": 0.65, - "learning_rate": 1.7549011743286937e-05, - "loss": 2.3579, - "step": 372170 - }, - { - "epoch": 0.65, - "learning_rate": 1.7548139803360107e-05, - "loss": 2.2975, - "step": 372180 - }, - { - "epoch": 0.65, - "learning_rate": 1.754726786343328e-05, - "loss": 2.3789, - "step": 372190 - }, - { - "epoch": 0.65, - "learning_rate": 1.7546395923506458e-05, - "loss": 2.4001, - "step": 372200 - }, - { - "epoch": 0.65, - "learning_rate": 1.7545523983579628e-05, - "loss": 2.3051, - "step": 372210 - }, - { - "epoch": 0.65, - "learning_rate": 1.7544652043652802e-05, - "loss": 2.3472, - "step": 372220 - }, - { - "epoch": 0.65, - "learning_rate": 1.7543780103725972e-05, - "loss": 2.2406, - "step": 372230 - }, - { - "epoch": 0.65, - "learning_rate": 1.754290816379915e-05, - "loss": 2.2747, - "step": 372240 - }, - { - "epoch": 0.65, - "learning_rate": 1.754203622387232e-05, - "loss": 2.4564, - "step": 372250 - }, - { - "epoch": 0.65, - "learning_rate": 1.7541164283945494e-05, - "loss": 2.2556, - "step": 372260 - }, - { - "epoch": 0.65, - "learning_rate": 1.7540292344018668e-05, - "loss": 2.2518, - "step": 372270 - }, - { - "epoch": 0.65, - "learning_rate": 1.753942040409184e-05, - "loss": 2.316, - "step": 372280 - }, - { - "epoch": 0.65, - "learning_rate": 1.7538548464165015e-05, - "loss": 2.3016, - "step": 372290 - }, - { - "epoch": 0.65, - "learning_rate": 1.7537676524238185e-05, - "loss": 2.2717, - "step": 372300 - }, - { - "epoch": 0.65, - "learning_rate": 1.753680458431136e-05, - "loss": 2.3264, - "step": 372310 - }, - { - "epoch": 0.65, - "learning_rate": 1.7535932644384533e-05, - "loss": 2.3851, - "step": 372320 - }, - { - "epoch": 0.65, - "learning_rate": 1.7535060704457707e-05, - "loss": 2.2758, - "step": 372330 - }, - { - "epoch": 0.65, - "learning_rate": 1.753418876453088e-05, - "loss": 2.3088, - "step": 372340 - }, - { - "epoch": 0.65, - "learning_rate": 1.7533316824604054e-05, - "loss": 2.2786, - "step": 372350 - }, - { - "epoch": 0.65, - "learning_rate": 1.7532444884677228e-05, - "loss": 2.2592, - "step": 372360 - }, - { - "epoch": 0.65, - "learning_rate": 1.75315729447504e-05, - "loss": 2.307, - "step": 372370 - }, - { - "epoch": 0.65, - "learning_rate": 1.7530701004823572e-05, - "loss": 2.2841, - "step": 372380 - }, - { - "epoch": 0.65, - "learning_rate": 1.7529829064896746e-05, - "loss": 2.3202, - "step": 372390 - }, - { - "epoch": 0.65, - "learning_rate": 1.752895712496992e-05, - "loss": 2.3118, - "step": 372400 - }, - { - "epoch": 0.65, - "learning_rate": 1.752808518504309e-05, - "loss": 2.4117, - "step": 372410 - }, - { - "epoch": 0.65, - "learning_rate": 1.7527213245116264e-05, - "loss": 2.2676, - "step": 372420 - }, - { - "epoch": 0.65, - "learning_rate": 1.7526341305189438e-05, - "loss": 2.3092, - "step": 372430 - }, - { - "epoch": 0.65, - "learning_rate": 1.752546936526261e-05, - "loss": 2.206, - "step": 372440 - }, - { - "epoch": 0.65, - "learning_rate": 1.7524597425335785e-05, - "loss": 2.3917, - "step": 372450 - }, - { - "epoch": 0.65, - "learning_rate": 1.752372548540896e-05, - "loss": 2.337, - "step": 372460 - }, - { - "epoch": 0.65, - "learning_rate": 1.7522853545482133e-05, - "loss": 2.2318, - "step": 372470 - }, - { - "epoch": 0.65, - "learning_rate": 1.7521981605555303e-05, - "loss": 2.2777, - "step": 372480 - }, - { - "epoch": 0.65, - "learning_rate": 1.7521109665628477e-05, - "loss": 2.416, - "step": 372490 - }, - { - "epoch": 0.65, - "learning_rate": 1.752023772570165e-05, - "loss": 2.2748, - "step": 372500 - }, - { - "epoch": 0.65, - "learning_rate": 1.7519365785774824e-05, - "loss": 2.2223, - "step": 372510 - }, - { - "epoch": 0.65, - "learning_rate": 1.7518493845847998e-05, - "loss": 2.3051, - "step": 372520 - }, - { - "epoch": 0.65, - "learning_rate": 1.751762190592117e-05, - "loss": 2.3469, - "step": 372530 - }, - { - "epoch": 0.65, - "learning_rate": 1.7516749965994346e-05, - "loss": 2.2605, - "step": 372540 - }, - { - "epoch": 0.65, - "learning_rate": 1.7515878026067516e-05, - "loss": 2.2371, - "step": 372550 - }, - { - "epoch": 0.65, - "learning_rate": 1.751500608614069e-05, - "loss": 2.2077, - "step": 372560 - }, - { - "epoch": 0.65, - "learning_rate": 1.751413414621386e-05, - "loss": 2.2909, - "step": 372570 - }, - { - "epoch": 0.65, - "learning_rate": 1.7513262206287037e-05, - "loss": 2.3106, - "step": 372580 - }, - { - "epoch": 0.65, - "learning_rate": 1.751239026636021e-05, - "loss": 2.2767, - "step": 372590 - }, - { - "epoch": 0.65, - "learning_rate": 1.751151832643338e-05, - "loss": 2.3592, - "step": 372600 - }, - { - "epoch": 0.65, - "learning_rate": 1.751064638650656e-05, - "loss": 2.267, - "step": 372610 - }, - { - "epoch": 0.65, - "learning_rate": 1.750977444657973e-05, - "loss": 2.4342, - "step": 372620 - }, - { - "epoch": 0.65, - "learning_rate": 1.7508902506652903e-05, - "loss": 2.3065, - "step": 372630 - }, - { - "epoch": 0.65, - "learning_rate": 1.7508030566726073e-05, - "loss": 2.3863, - "step": 372640 - }, - { - "epoch": 0.65, - "learning_rate": 1.750715862679925e-05, - "loss": 2.333, - "step": 372650 - }, - { - "epoch": 0.65, - "learning_rate": 1.750628668687242e-05, - "loss": 2.2243, - "step": 372660 - }, - { - "epoch": 0.65, - "learning_rate": 1.7505414746945595e-05, - "loss": 2.2993, - "step": 372670 - }, - { - "epoch": 0.65, - "learning_rate": 1.750454280701877e-05, - "loss": 2.2689, - "step": 372680 - }, - { - "epoch": 0.65, - "learning_rate": 1.7503670867091942e-05, - "loss": 2.2965, - "step": 372690 - }, - { - "epoch": 0.65, - "learning_rate": 1.7502798927165116e-05, - "loss": 2.3676, - "step": 372700 - }, - { - "epoch": 0.65, - "learning_rate": 1.7501926987238286e-05, - "loss": 2.3242, - "step": 372710 - }, - { - "epoch": 0.65, - "learning_rate": 1.7501055047311463e-05, - "loss": 2.3336, - "step": 372720 - }, - { - "epoch": 0.65, - "learning_rate": 1.7500183107384634e-05, - "loss": 2.2547, - "step": 372730 - }, - { - "epoch": 0.65, - "learning_rate": 1.7499311167457808e-05, - "loss": 2.3349, - "step": 372740 - }, - { - "epoch": 0.65, - "learning_rate": 1.749843922753098e-05, - "loss": 2.3466, - "step": 372750 - }, - { - "epoch": 0.65, - "learning_rate": 1.7497567287604155e-05, - "loss": 2.3472, - "step": 372760 - }, - { - "epoch": 0.65, - "learning_rate": 1.749669534767733e-05, - "loss": 2.2814, - "step": 372770 - }, - { - "epoch": 0.65, - "learning_rate": 1.74958234077505e-05, - "loss": 2.1919, - "step": 372780 - }, - { - "epoch": 0.65, - "learning_rate": 1.7494951467823673e-05, - "loss": 2.2973, - "step": 372790 - }, - { - "epoch": 0.65, - "learning_rate": 1.7494079527896847e-05, - "loss": 2.2995, - "step": 372800 - }, - { - "epoch": 0.65, - "learning_rate": 1.749320758797002e-05, - "loss": 2.4064, - "step": 372810 - }, - { - "epoch": 0.65, - "learning_rate": 1.7492335648043194e-05, - "loss": 2.3066, - "step": 372820 - }, - { - "epoch": 0.65, - "learning_rate": 1.7491463708116365e-05, - "loss": 2.2554, - "step": 372830 - }, - { - "epoch": 0.65, - "learning_rate": 1.7490591768189542e-05, - "loss": 2.2835, - "step": 372840 - }, - { - "epoch": 0.65, - "learning_rate": 1.7489719828262712e-05, - "loss": 2.2159, - "step": 372850 - }, - { - "epoch": 0.65, - "learning_rate": 1.7488847888335886e-05, - "loss": 2.2778, - "step": 372860 - }, - { - "epoch": 0.65, - "learning_rate": 1.748797594840906e-05, - "loss": 2.3493, - "step": 372870 - }, - { - "epoch": 0.65, - "learning_rate": 1.7487104008482234e-05, - "loss": 2.3558, - "step": 372880 - }, - { - "epoch": 0.65, - "learning_rate": 1.7486232068555404e-05, - "loss": 2.3521, - "step": 372890 - }, - { - "epoch": 0.65, - "learning_rate": 1.7485360128628578e-05, - "loss": 2.4681, - "step": 372900 - }, - { - "epoch": 0.65, - "learning_rate": 1.748448818870175e-05, - "loss": 2.3534, - "step": 372910 - }, - { - "epoch": 0.65, - "learning_rate": 1.7483616248774925e-05, - "loss": 2.2469, - "step": 372920 - }, - { - "epoch": 0.65, - "learning_rate": 1.74827443088481e-05, - "loss": 2.3529, - "step": 372930 - }, - { - "epoch": 0.65, - "learning_rate": 1.748187236892127e-05, - "loss": 2.4499, - "step": 372940 - }, - { - "epoch": 0.65, - "learning_rate": 1.7481000428994447e-05, - "loss": 2.2027, - "step": 372950 - }, - { - "epoch": 0.65, - "learning_rate": 1.7480128489067617e-05, - "loss": 2.3176, - "step": 372960 - }, - { - "epoch": 0.65, - "learning_rate": 1.747925654914079e-05, - "loss": 2.3257, - "step": 372970 - }, - { - "epoch": 0.65, - "learning_rate": 1.7478384609213965e-05, - "loss": 2.3154, - "step": 372980 - }, - { - "epoch": 0.65, - "learning_rate": 1.7477512669287138e-05, - "loss": 2.3043, - "step": 372990 - }, - { - "epoch": 0.65, - "learning_rate": 1.7476640729360312e-05, - "loss": 2.2656, - "step": 373000 - }, - { - "epoch": 0.65, - "learning_rate": 1.7475768789433482e-05, - "loss": 2.2873, - "step": 373010 - }, - { - "epoch": 0.65, - "learning_rate": 1.747489684950666e-05, - "loss": 2.3961, - "step": 373020 - }, - { - "epoch": 0.65, - "learning_rate": 1.747402490957983e-05, - "loss": 2.3715, - "step": 373030 - }, - { - "epoch": 0.65, - "learning_rate": 1.7473152969653004e-05, - "loss": 2.3923, - "step": 373040 - }, - { - "epoch": 0.65, - "learning_rate": 1.7472281029726174e-05, - "loss": 2.2976, - "step": 373050 - }, - { - "epoch": 0.65, - "learning_rate": 1.747140908979935e-05, - "loss": 2.2999, - "step": 373060 - }, - { - "epoch": 0.65, - "learning_rate": 1.7470537149872525e-05, - "loss": 2.3421, - "step": 373070 - }, - { - "epoch": 0.65, - "learning_rate": 1.7469665209945695e-05, - "loss": 2.315, - "step": 373080 - }, - { - "epoch": 0.65, - "learning_rate": 1.746879327001887e-05, - "loss": 2.2424, - "step": 373090 - }, - { - "epoch": 0.65, - "learning_rate": 1.7467921330092043e-05, - "loss": 2.4253, - "step": 373100 - }, - { - "epoch": 0.65, - "learning_rate": 1.7467049390165217e-05, - "loss": 2.2811, - "step": 373110 - }, - { - "epoch": 0.65, - "learning_rate": 1.7466177450238387e-05, - "loss": 2.3278, - "step": 373120 - }, - { - "epoch": 0.65, - "learning_rate": 1.7465305510311564e-05, - "loss": 2.4897, - "step": 373130 - }, - { - "epoch": 0.65, - "learning_rate": 1.7464433570384735e-05, - "loss": 2.3432, - "step": 373140 - }, - { - "epoch": 0.65, - "learning_rate": 1.746356163045791e-05, - "loss": 2.1801, - "step": 373150 - }, - { - "epoch": 0.65, - "learning_rate": 1.7462689690531082e-05, - "loss": 2.3321, - "step": 373160 - }, - { - "epoch": 0.65, - "learning_rate": 1.7461817750604256e-05, - "loss": 2.2781, - "step": 373170 - }, - { - "epoch": 0.65, - "learning_rate": 1.746094581067743e-05, - "loss": 2.3275, - "step": 373180 - }, - { - "epoch": 0.65, - "learning_rate": 1.74600738707506e-05, - "loss": 2.3598, - "step": 373190 - }, - { - "epoch": 0.65, - "learning_rate": 1.7459201930823774e-05, - "loss": 2.3743, - "step": 373200 - }, - { - "epoch": 0.65, - "learning_rate": 1.7458329990896948e-05, - "loss": 2.3779, - "step": 373210 - }, - { - "epoch": 0.65, - "learning_rate": 1.745745805097012e-05, - "loss": 2.3379, - "step": 373220 - }, - { - "epoch": 0.65, - "learning_rate": 1.7456586111043295e-05, - "loss": 2.3007, - "step": 373230 - }, - { - "epoch": 0.65, - "learning_rate": 1.7455714171116466e-05, - "loss": 2.3621, - "step": 373240 - }, - { - "epoch": 0.65, - "learning_rate": 1.7454842231189643e-05, - "loss": 2.3149, - "step": 373250 - }, - { - "epoch": 0.65, - "learning_rate": 1.7453970291262813e-05, - "loss": 2.318, - "step": 373260 - }, - { - "epoch": 0.65, - "learning_rate": 1.7453098351335987e-05, - "loss": 2.3639, - "step": 373270 - }, - { - "epoch": 0.65, - "learning_rate": 1.745222641140916e-05, - "loss": 2.2292, - "step": 373280 - }, - { - "epoch": 0.65, - "learning_rate": 1.7451354471482334e-05, - "loss": 2.3201, - "step": 373290 - }, - { - "epoch": 0.65, - "learning_rate": 1.7450482531555505e-05, - "loss": 2.3256, - "step": 373300 - }, - { - "epoch": 0.65, - "learning_rate": 1.744961059162868e-05, - "loss": 2.2712, - "step": 373310 - }, - { - "epoch": 0.65, - "learning_rate": 1.7448738651701856e-05, - "loss": 2.3388, - "step": 373320 - }, - { - "epoch": 0.65, - "learning_rate": 1.7447866711775026e-05, - "loss": 2.2446, - "step": 373330 - }, - { - "epoch": 0.65, - "learning_rate": 1.74469947718482e-05, - "loss": 2.3177, - "step": 373340 - }, - { - "epoch": 0.65, - "learning_rate": 1.744612283192137e-05, - "loss": 2.2232, - "step": 373350 - }, - { - "epoch": 0.65, - "learning_rate": 1.7445250891994547e-05, - "loss": 2.3634, - "step": 373360 - }, - { - "epoch": 0.65, - "learning_rate": 1.7444378952067718e-05, - "loss": 2.4204, - "step": 373370 - }, - { - "epoch": 0.65, - "learning_rate": 1.744350701214089e-05, - "loss": 2.3996, - "step": 373380 - }, - { - "epoch": 0.65, - "learning_rate": 1.7442635072214065e-05, - "loss": 2.3631, - "step": 373390 - }, - { - "epoch": 0.65, - "learning_rate": 1.744176313228724e-05, - "loss": 2.2957, - "step": 373400 - }, - { - "epoch": 0.65, - "learning_rate": 1.7440891192360413e-05, - "loss": 2.2455, - "step": 373410 - }, - { - "epoch": 0.65, - "learning_rate": 1.7440019252433583e-05, - "loss": 2.267, - "step": 373420 - }, - { - "epoch": 0.65, - "learning_rate": 1.743914731250676e-05, - "loss": 2.3671, - "step": 373430 - }, - { - "epoch": 0.65, - "learning_rate": 1.743827537257993e-05, - "loss": 2.4207, - "step": 373440 - }, - { - "epoch": 0.65, - "learning_rate": 1.7437403432653105e-05, - "loss": 2.3101, - "step": 373450 - }, - { - "epoch": 0.65, - "learning_rate": 1.743653149272628e-05, - "loss": 2.3518, - "step": 373460 - }, - { - "epoch": 0.65, - "learning_rate": 1.7435659552799452e-05, - "loss": 2.34, - "step": 373470 - }, - { - "epoch": 0.65, - "learning_rate": 1.7434787612872626e-05, - "loss": 2.424, - "step": 373480 - }, - { - "epoch": 0.65, - "learning_rate": 1.7433915672945796e-05, - "loss": 2.3586, - "step": 373490 - }, - { - "epoch": 0.65, - "learning_rate": 1.743304373301897e-05, - "loss": 2.1928, - "step": 373500 - }, - { - "epoch": 0.65, - "learning_rate": 1.7432171793092144e-05, - "loss": 2.4004, - "step": 373510 - }, - { - "epoch": 0.65, - "learning_rate": 1.7431299853165318e-05, - "loss": 2.2558, - "step": 373520 - }, - { - "epoch": 0.65, - "learning_rate": 1.7430427913238488e-05, - "loss": 2.3058, - "step": 373530 - }, - { - "epoch": 0.65, - "learning_rate": 1.7429555973311665e-05, - "loss": 2.4519, - "step": 373540 - }, - { - "epoch": 0.65, - "learning_rate": 1.742868403338484e-05, - "loss": 2.4026, - "step": 373550 - }, - { - "epoch": 0.65, - "learning_rate": 1.742781209345801e-05, - "loss": 2.3349, - "step": 373560 - }, - { - "epoch": 0.65, - "learning_rate": 1.7426940153531183e-05, - "loss": 2.3704, - "step": 373570 - }, - { - "epoch": 0.65, - "learning_rate": 1.7426068213604357e-05, - "loss": 2.392, - "step": 373580 - }, - { - "epoch": 0.65, - "learning_rate": 1.742519627367753e-05, - "loss": 2.3762, - "step": 373590 - }, - { - "epoch": 0.65, - "learning_rate": 1.74243243337507e-05, - "loss": 2.4013, - "step": 373600 - }, - { - "epoch": 0.65, - "learning_rate": 1.7423452393823875e-05, - "loss": 2.3578, - "step": 373610 - }, - { - "epoch": 0.65, - "learning_rate": 1.742258045389705e-05, - "loss": 2.3003, - "step": 373620 - }, - { - "epoch": 0.65, - "learning_rate": 1.7421708513970222e-05, - "loss": 2.2573, - "step": 373630 - }, - { - "epoch": 0.65, - "learning_rate": 1.7420836574043396e-05, - "loss": 2.3049, - "step": 373640 - }, - { - "epoch": 0.65, - "learning_rate": 1.741996463411657e-05, - "loss": 2.2666, - "step": 373650 - }, - { - "epoch": 0.65, - "learning_rate": 1.7419092694189744e-05, - "loss": 2.4651, - "step": 373660 - }, - { - "epoch": 0.65, - "learning_rate": 1.7418220754262914e-05, - "loss": 2.2863, - "step": 373670 - }, - { - "epoch": 0.65, - "learning_rate": 1.7417348814336088e-05, - "loss": 2.2345, - "step": 373680 - }, - { - "epoch": 0.65, - "learning_rate": 1.741647687440926e-05, - "loss": 2.3521, - "step": 373690 - }, - { - "epoch": 0.65, - "learning_rate": 1.7415604934482435e-05, - "loss": 2.3704, - "step": 373700 - }, - { - "epoch": 0.65, - "learning_rate": 1.741473299455561e-05, - "loss": 2.2968, - "step": 373710 - }, - { - "epoch": 0.65, - "learning_rate": 1.741386105462878e-05, - "loss": 2.3135, - "step": 373720 - }, - { - "epoch": 0.65, - "learning_rate": 1.7412989114701957e-05, - "loss": 2.4003, - "step": 373730 - }, - { - "epoch": 0.65, - "learning_rate": 1.7412117174775127e-05, - "loss": 2.2722, - "step": 373740 - }, - { - "epoch": 0.65, - "learning_rate": 1.74112452348483e-05, - "loss": 2.3592, - "step": 373750 - }, - { - "epoch": 0.65, - "learning_rate": 1.741037329492147e-05, - "loss": 2.2797, - "step": 373760 - }, - { - "epoch": 0.65, - "learning_rate": 1.740950135499465e-05, - "loss": 2.3997, - "step": 373770 - }, - { - "epoch": 0.65, - "learning_rate": 1.740862941506782e-05, - "loss": 2.4342, - "step": 373780 - }, - { - "epoch": 0.65, - "learning_rate": 1.7407757475140992e-05, - "loss": 2.3969, - "step": 373790 - }, - { - "epoch": 0.65, - "learning_rate": 1.740688553521417e-05, - "loss": 2.3881, - "step": 373800 - }, - { - "epoch": 0.65, - "learning_rate": 1.740601359528734e-05, - "loss": 2.313, - "step": 373810 - }, - { - "epoch": 0.65, - "learning_rate": 1.7405141655360514e-05, - "loss": 2.3547, - "step": 373820 - }, - { - "epoch": 0.65, - "learning_rate": 1.7404269715433684e-05, - "loss": 2.3012, - "step": 373830 - }, - { - "epoch": 0.65, - "learning_rate": 1.740339777550686e-05, - "loss": 2.2383, - "step": 373840 - }, - { - "epoch": 0.65, - "learning_rate": 1.7402525835580032e-05, - "loss": 2.1674, - "step": 373850 - }, - { - "epoch": 0.65, - "learning_rate": 1.7401653895653205e-05, - "loss": 2.2048, - "step": 373860 - }, - { - "epoch": 0.65, - "learning_rate": 1.740078195572638e-05, - "loss": 2.3003, - "step": 373870 - }, - { - "epoch": 0.65, - "learning_rate": 1.7399910015799553e-05, - "loss": 2.3214, - "step": 373880 - }, - { - "epoch": 0.65, - "learning_rate": 1.7399038075872727e-05, - "loss": 2.3273, - "step": 373890 - }, - { - "epoch": 0.65, - "learning_rate": 1.7398166135945897e-05, - "loss": 2.3571, - "step": 373900 - }, - { - "epoch": 0.65, - "learning_rate": 1.7397294196019074e-05, - "loss": 2.3899, - "step": 373910 - }, - { - "epoch": 0.65, - "learning_rate": 1.7396422256092245e-05, - "loss": 2.3666, - "step": 373920 - }, - { - "epoch": 0.65, - "learning_rate": 1.739555031616542e-05, - "loss": 2.4038, - "step": 373930 - }, - { - "epoch": 0.65, - "learning_rate": 1.7394678376238592e-05, - "loss": 2.4005, - "step": 373940 - }, - { - "epoch": 0.65, - "learning_rate": 1.7393806436311766e-05, - "loss": 2.4216, - "step": 373950 - }, - { - "epoch": 0.65, - "learning_rate": 1.739293449638494e-05, - "loss": 2.3705, - "step": 373960 - }, - { - "epoch": 0.65, - "learning_rate": 1.739206255645811e-05, - "loss": 2.3098, - "step": 373970 - }, - { - "epoch": 0.65, - "learning_rate": 1.7391190616531284e-05, - "loss": 2.3332, - "step": 373980 - }, - { - "epoch": 0.65, - "learning_rate": 1.7390318676604458e-05, - "loss": 2.4013, - "step": 373990 - }, - { - "epoch": 0.65, - "learning_rate": 1.738944673667763e-05, - "loss": 2.41, - "step": 374000 - }, - { - "epoch": 0.65, - "learning_rate": 1.7388574796750802e-05, - "loss": 2.2885, - "step": 374010 - }, - { - "epoch": 0.65, - "learning_rate": 1.7387702856823976e-05, - "loss": 2.2966, - "step": 374020 - }, - { - "epoch": 0.65, - "learning_rate": 1.738683091689715e-05, - "loss": 2.3146, - "step": 374030 - }, - { - "epoch": 0.65, - "learning_rate": 1.7385958976970323e-05, - "loss": 2.3443, - "step": 374040 - }, - { - "epoch": 0.65, - "learning_rate": 1.7385087037043497e-05, - "loss": 2.2406, - "step": 374050 - }, - { - "epoch": 0.65, - "learning_rate": 1.738421509711667e-05, - "loss": 2.2729, - "step": 374060 - }, - { - "epoch": 0.65, - "learning_rate": 1.7383343157189844e-05, - "loss": 2.324, - "step": 374070 - }, - { - "epoch": 0.65, - "learning_rate": 1.7382471217263015e-05, - "loss": 2.1703, - "step": 374080 - }, - { - "epoch": 0.65, - "learning_rate": 1.738159927733619e-05, - "loss": 2.3066, - "step": 374090 - }, - { - "epoch": 0.65, - "learning_rate": 1.7380727337409362e-05, - "loss": 2.4341, - "step": 374100 - }, - { - "epoch": 0.65, - "learning_rate": 1.7379855397482536e-05, - "loss": 2.4535, - "step": 374110 - }, - { - "epoch": 0.65, - "learning_rate": 1.737898345755571e-05, - "loss": 2.2809, - "step": 374120 - }, - { - "epoch": 0.65, - "learning_rate": 1.737811151762888e-05, - "loss": 2.2911, - "step": 374130 - }, - { - "epoch": 0.65, - "learning_rate": 1.7377239577702057e-05, - "loss": 2.3692, - "step": 374140 - }, - { - "epoch": 0.65, - "learning_rate": 1.7376367637775228e-05, - "loss": 2.2563, - "step": 374150 - }, - { - "epoch": 0.65, - "learning_rate": 1.73754956978484e-05, - "loss": 2.2293, - "step": 374160 - }, - { - "epoch": 0.65, - "learning_rate": 1.7374623757921575e-05, - "loss": 2.2924, - "step": 374170 - }, - { - "epoch": 0.65, - "learning_rate": 1.737375181799475e-05, - "loss": 2.3663, - "step": 374180 - }, - { - "epoch": 0.65, - "learning_rate": 1.7372879878067923e-05, - "loss": 2.2274, - "step": 374190 - }, - { - "epoch": 0.65, - "learning_rate": 1.7372007938141093e-05, - "loss": 2.3177, - "step": 374200 - }, - { - "epoch": 0.65, - "learning_rate": 1.737113599821427e-05, - "loss": 2.4265, - "step": 374210 - }, - { - "epoch": 0.65, - "learning_rate": 1.737026405828744e-05, - "loss": 2.2235, - "step": 374220 - }, - { - "epoch": 0.65, - "learning_rate": 1.7369392118360615e-05, - "loss": 2.3965, - "step": 374230 - }, - { - "epoch": 0.65, - "learning_rate": 1.7368520178433785e-05, - "loss": 2.4046, - "step": 374240 - }, - { - "epoch": 0.65, - "learning_rate": 1.7367648238506962e-05, - "loss": 2.2179, - "step": 374250 - }, - { - "epoch": 0.65, - "learning_rate": 1.7366776298580133e-05, - "loss": 2.3943, - "step": 374260 - }, - { - "epoch": 0.65, - "learning_rate": 1.7365904358653306e-05, - "loss": 2.3989, - "step": 374270 - }, - { - "epoch": 0.65, - "learning_rate": 1.736503241872648e-05, - "loss": 2.377, - "step": 374280 - }, - { - "epoch": 0.65, - "learning_rate": 1.7364160478799654e-05, - "loss": 2.2611, - "step": 374290 - }, - { - "epoch": 0.65, - "learning_rate": 1.7363288538872828e-05, - "loss": 2.3294, - "step": 374300 - }, - { - "epoch": 0.65, - "learning_rate": 1.7362416598945998e-05, - "loss": 2.3451, - "step": 374310 - }, - { - "epoch": 0.65, - "learning_rate": 1.7361544659019175e-05, - "loss": 2.2755, - "step": 374320 - }, - { - "epoch": 0.65, - "learning_rate": 1.7360672719092346e-05, - "loss": 2.2364, - "step": 374330 - }, - { - "epoch": 0.65, - "learning_rate": 1.735980077916552e-05, - "loss": 2.1976, - "step": 374340 - }, - { - "epoch": 0.65, - "learning_rate": 1.7358928839238693e-05, - "loss": 2.4126, - "step": 374350 - }, - { - "epoch": 0.65, - "learning_rate": 1.7358056899311867e-05, - "loss": 2.2175, - "step": 374360 - }, - { - "epoch": 0.65, - "learning_rate": 1.735718495938504e-05, - "loss": 2.267, - "step": 374370 - }, - { - "epoch": 0.65, - "learning_rate": 1.735631301945821e-05, - "loss": 2.3936, - "step": 374380 - }, - { - "epoch": 0.65, - "learning_rate": 1.7355441079531385e-05, - "loss": 2.3762, - "step": 374390 - }, - { - "epoch": 0.65, - "learning_rate": 1.735456913960456e-05, - "loss": 2.3761, - "step": 374400 - }, - { - "epoch": 0.65, - "learning_rate": 1.7353697199677732e-05, - "loss": 2.3198, - "step": 374410 - }, - { - "epoch": 0.65, - "learning_rate": 1.7352825259750906e-05, - "loss": 2.3694, - "step": 374420 - }, - { - "epoch": 0.65, - "learning_rate": 1.7351953319824076e-05, - "loss": 2.299, - "step": 374430 - }, - { - "epoch": 0.65, - "learning_rate": 1.7351081379897254e-05, - "loss": 2.3049, - "step": 374440 - }, - { - "epoch": 0.65, - "learning_rate": 1.7350209439970424e-05, - "loss": 2.3566, - "step": 374450 - }, - { - "epoch": 0.65, - "learning_rate": 1.7349337500043598e-05, - "loss": 2.3334, - "step": 374460 - }, - { - "epoch": 0.65, - "learning_rate": 1.734846556011677e-05, - "loss": 2.312, - "step": 374470 - }, - { - "epoch": 0.65, - "learning_rate": 1.7347593620189945e-05, - "loss": 2.3148, - "step": 374480 - }, - { - "epoch": 0.65, - "learning_rate": 1.7346721680263116e-05, - "loss": 2.3428, - "step": 374490 - }, - { - "epoch": 0.65, - "learning_rate": 1.734584974033629e-05, - "loss": 2.3231, - "step": 374500 - }, - { - "epoch": 0.65, - "learning_rate": 1.7344977800409463e-05, - "loss": 2.3114, - "step": 374510 - }, - { - "epoch": 0.65, - "learning_rate": 1.7344105860482637e-05, - "loss": 2.3261, - "step": 374520 - }, - { - "epoch": 0.65, - "learning_rate": 1.734323392055581e-05, - "loss": 2.3153, - "step": 374530 - }, - { - "epoch": 0.65, - "learning_rate": 1.734236198062898e-05, - "loss": 2.3029, - "step": 374540 - }, - { - "epoch": 0.65, - "learning_rate": 1.734149004070216e-05, - "loss": 2.3046, - "step": 374550 - }, - { - "epoch": 0.65, - "learning_rate": 1.734061810077533e-05, - "loss": 2.3822, - "step": 374560 - }, - { - "epoch": 0.65, - "learning_rate": 1.7339746160848502e-05, - "loss": 2.2613, - "step": 374570 - }, - { - "epoch": 0.65, - "learning_rate": 1.7338874220921676e-05, - "loss": 2.3893, - "step": 374580 - }, - { - "epoch": 0.65, - "learning_rate": 1.733800228099485e-05, - "loss": 2.2694, - "step": 374590 - }, - { - "epoch": 0.65, - "learning_rate": 1.7337130341068024e-05, - "loss": 2.3245, - "step": 374600 - }, - { - "epoch": 0.65, - "learning_rate": 1.7336258401141194e-05, - "loss": 2.2862, - "step": 374610 - }, - { - "epoch": 0.65, - "learning_rate": 1.733538646121437e-05, - "loss": 2.2589, - "step": 374620 - }, - { - "epoch": 0.65, - "learning_rate": 1.7334514521287542e-05, - "loss": 2.3161, - "step": 374630 - }, - { - "epoch": 0.65, - "learning_rate": 1.7333642581360715e-05, - "loss": 2.2456, - "step": 374640 - }, - { - "epoch": 0.65, - "learning_rate": 1.7332770641433886e-05, - "loss": 2.3364, - "step": 374650 - }, - { - "epoch": 0.65, - "learning_rate": 1.7331898701507063e-05, - "loss": 2.2508, - "step": 374660 - }, - { - "epoch": 0.65, - "learning_rate": 1.7331026761580237e-05, - "loss": 2.5146, - "step": 374670 - }, - { - "epoch": 0.65, - "learning_rate": 1.7330154821653407e-05, - "loss": 2.3277, - "step": 374680 - }, - { - "epoch": 0.65, - "learning_rate": 1.732928288172658e-05, - "loss": 2.3392, - "step": 374690 - }, - { - "epoch": 0.65, - "learning_rate": 1.7328410941799755e-05, - "loss": 2.3929, - "step": 374700 - }, - { - "epoch": 0.65, - "learning_rate": 1.732753900187293e-05, - "loss": 2.511, - "step": 374710 - }, - { - "epoch": 0.65, - "learning_rate": 1.73266670619461e-05, - "loss": 2.3608, - "step": 374720 - }, - { - "epoch": 0.65, - "learning_rate": 1.7325795122019276e-05, - "loss": 2.2086, - "step": 374730 - }, - { - "epoch": 0.65, - "learning_rate": 1.7324923182092446e-05, - "loss": 2.3095, - "step": 374740 - }, - { - "epoch": 0.65, - "learning_rate": 1.732405124216562e-05, - "loss": 2.248, - "step": 374750 - }, - { - "epoch": 0.65, - "learning_rate": 1.7323179302238794e-05, - "loss": 2.358, - "step": 374760 - }, - { - "epoch": 0.65, - "learning_rate": 1.7322307362311968e-05, - "loss": 2.2984, - "step": 374770 - }, - { - "epoch": 0.65, - "learning_rate": 1.732143542238514e-05, - "loss": 2.3026, - "step": 374780 - }, - { - "epoch": 0.65, - "learning_rate": 1.7320563482458312e-05, - "loss": 2.3117, - "step": 374790 - }, - { - "epoch": 0.65, - "learning_rate": 1.7319691542531486e-05, - "loss": 2.3087, - "step": 374800 - }, - { - "epoch": 0.65, - "learning_rate": 1.731881960260466e-05, - "loss": 2.3497, - "step": 374810 - }, - { - "epoch": 0.65, - "learning_rate": 1.7317947662677833e-05, - "loss": 2.3721, - "step": 374820 - }, - { - "epoch": 0.65, - "learning_rate": 1.7317075722751007e-05, - "loss": 2.3091, - "step": 374830 - }, - { - "epoch": 0.65, - "learning_rate": 1.7316203782824177e-05, - "loss": 2.1705, - "step": 374840 - }, - { - "epoch": 0.65, - "learning_rate": 1.7315331842897354e-05, - "loss": 2.3314, - "step": 374850 - }, - { - "epoch": 0.65, - "learning_rate": 1.7314459902970525e-05, - "loss": 2.3381, - "step": 374860 - }, - { - "epoch": 0.65, - "learning_rate": 1.73135879630437e-05, - "loss": 2.3172, - "step": 374870 - }, - { - "epoch": 0.65, - "learning_rate": 1.7312716023116872e-05, - "loss": 2.3045, - "step": 374880 - }, - { - "epoch": 0.65, - "learning_rate": 1.7311844083190046e-05, - "loss": 2.3178, - "step": 374890 - }, - { - "epoch": 0.65, - "learning_rate": 1.731097214326322e-05, - "loss": 2.2515, - "step": 374900 - }, - { - "epoch": 0.65, - "learning_rate": 1.731010020333639e-05, - "loss": 2.2482, - "step": 374910 - }, - { - "epoch": 0.65, - "learning_rate": 1.7309228263409567e-05, - "loss": 2.305, - "step": 374920 - }, - { - "epoch": 0.65, - "learning_rate": 1.7308356323482738e-05, - "loss": 2.3845, - "step": 374930 - }, - { - "epoch": 0.65, - "learning_rate": 1.730748438355591e-05, - "loss": 2.4019, - "step": 374940 - }, - { - "epoch": 0.65, - "learning_rate": 1.7306612443629082e-05, - "loss": 2.2868, - "step": 374950 - }, - { - "epoch": 0.65, - "learning_rate": 1.730574050370226e-05, - "loss": 2.3032, - "step": 374960 - }, - { - "epoch": 0.65, - "learning_rate": 1.730486856377543e-05, - "loss": 2.386, - "step": 374970 - }, - { - "epoch": 0.65, - "learning_rate": 1.7303996623848603e-05, - "loss": 2.3372, - "step": 374980 - }, - { - "epoch": 0.65, - "learning_rate": 1.7303124683921777e-05, - "loss": 2.3868, - "step": 374990 - }, - { - "epoch": 0.65, - "learning_rate": 1.730225274399495e-05, - "loss": 2.2661, - "step": 375000 - }, - { - "epoch": 0.65, - "learning_rate": 1.7301380804068125e-05, - "loss": 2.3923, - "step": 375010 - }, - { - "epoch": 0.65, - "learning_rate": 1.7300508864141295e-05, - "loss": 2.3158, - "step": 375020 - }, - { - "epoch": 0.65, - "learning_rate": 1.7299636924214472e-05, - "loss": 2.3635, - "step": 375030 - }, - { - "epoch": 0.65, - "learning_rate": 1.7298764984287643e-05, - "loss": 2.2966, - "step": 375040 - }, - { - "epoch": 0.65, - "learning_rate": 1.7297893044360816e-05, - "loss": 2.3397, - "step": 375050 - }, - { - "epoch": 0.65, - "learning_rate": 1.729702110443399e-05, - "loss": 2.3367, - "step": 375060 - }, - { - "epoch": 0.65, - "learning_rate": 1.7296149164507164e-05, - "loss": 2.3709, - "step": 375070 - }, - { - "epoch": 0.65, - "learning_rate": 1.7295277224580338e-05, - "loss": 2.3933, - "step": 375080 - }, - { - "epoch": 0.65, - "learning_rate": 1.7294405284653508e-05, - "loss": 2.3343, - "step": 375090 - }, - { - "epoch": 0.65, - "learning_rate": 1.7293533344726682e-05, - "loss": 2.3145, - "step": 375100 - }, - { - "epoch": 0.65, - "learning_rate": 1.7292661404799856e-05, - "loss": 2.2912, - "step": 375110 - }, - { - "epoch": 0.65, - "learning_rate": 1.729178946487303e-05, - "loss": 2.3528, - "step": 375120 - }, - { - "epoch": 0.65, - "learning_rate": 1.72909175249462e-05, - "loss": 2.2858, - "step": 375130 - }, - { - "epoch": 0.65, - "learning_rate": 1.7290045585019377e-05, - "loss": 2.3195, - "step": 375140 - }, - { - "epoch": 0.65, - "learning_rate": 1.728917364509255e-05, - "loss": 2.375, - "step": 375150 - }, - { - "epoch": 0.65, - "learning_rate": 1.728830170516572e-05, - "loss": 2.406, - "step": 375160 - }, - { - "epoch": 0.65, - "learning_rate": 1.7287429765238895e-05, - "loss": 2.3075, - "step": 375170 - }, - { - "epoch": 0.65, - "learning_rate": 1.728655782531207e-05, - "loss": 2.2648, - "step": 375180 - }, - { - "epoch": 0.65, - "learning_rate": 1.7285685885385242e-05, - "loss": 2.2603, - "step": 375190 - }, - { - "epoch": 0.65, - "learning_rate": 1.7284813945458413e-05, - "loss": 2.271, - "step": 375200 - }, - { - "epoch": 0.65, - "learning_rate": 1.7283942005531586e-05, - "loss": 2.3146, - "step": 375210 - }, - { - "epoch": 0.65, - "learning_rate": 1.728307006560476e-05, - "loss": 2.3687, - "step": 375220 - }, - { - "epoch": 0.65, - "learning_rate": 1.7282198125677934e-05, - "loss": 2.2732, - "step": 375230 - }, - { - "epoch": 0.65, - "learning_rate": 1.7281326185751108e-05, - "loss": 2.438, - "step": 375240 - }, - { - "epoch": 0.65, - "learning_rate": 1.728045424582428e-05, - "loss": 2.2992, - "step": 375250 - }, - { - "epoch": 0.65, - "learning_rate": 1.7279582305897455e-05, - "loss": 2.3415, - "step": 375260 - }, - { - "epoch": 0.65, - "learning_rate": 1.7278710365970626e-05, - "loss": 2.3668, - "step": 375270 - }, - { - "epoch": 0.65, - "learning_rate": 1.72778384260438e-05, - "loss": 2.3799, - "step": 375280 - }, - { - "epoch": 0.65, - "learning_rate": 1.7276966486116973e-05, - "loss": 2.2112, - "step": 375290 - }, - { - "epoch": 0.65, - "learning_rate": 1.7276094546190147e-05, - "loss": 2.2837, - "step": 375300 - }, - { - "epoch": 0.65, - "learning_rate": 1.727522260626332e-05, - "loss": 2.3902, - "step": 375310 - }, - { - "epoch": 0.65, - "learning_rate": 1.727435066633649e-05, - "loss": 2.3204, - "step": 375320 - }, - { - "epoch": 0.65, - "learning_rate": 1.727347872640967e-05, - "loss": 2.2798, - "step": 375330 - }, - { - "epoch": 0.65, - "learning_rate": 1.727260678648284e-05, - "loss": 2.3685, - "step": 375340 - }, - { - "epoch": 0.65, - "learning_rate": 1.7271734846556012e-05, - "loss": 2.2907, - "step": 375350 - }, - { - "epoch": 0.65, - "learning_rate": 1.7270862906629183e-05, - "loss": 2.1992, - "step": 375360 - }, - { - "epoch": 0.65, - "learning_rate": 1.726999096670236e-05, - "loss": 2.2205, - "step": 375370 - }, - { - "epoch": 0.65, - "learning_rate": 1.726911902677553e-05, - "loss": 2.3384, - "step": 375380 - }, - { - "epoch": 0.65, - "learning_rate": 1.7268247086848704e-05, - "loss": 2.3895, - "step": 375390 - }, - { - "epoch": 0.65, - "learning_rate": 1.726737514692188e-05, - "loss": 2.3233, - "step": 375400 - }, - { - "epoch": 0.65, - "learning_rate": 1.7266503206995052e-05, - "loss": 2.2806, - "step": 375410 - }, - { - "epoch": 0.65, - "learning_rate": 1.7265631267068225e-05, - "loss": 2.2383, - "step": 375420 - }, - { - "epoch": 0.65, - "learning_rate": 1.7264759327141396e-05, - "loss": 2.3107, - "step": 375430 - }, - { - "epoch": 0.65, - "learning_rate": 1.7263887387214573e-05, - "loss": 2.304, - "step": 375440 - }, - { - "epoch": 0.65, - "learning_rate": 1.7263015447287743e-05, - "loss": 2.4387, - "step": 375450 - }, - { - "epoch": 0.65, - "learning_rate": 1.7262143507360917e-05, - "loss": 2.3266, - "step": 375460 - }, - { - "epoch": 0.65, - "learning_rate": 1.726127156743409e-05, - "loss": 2.3417, - "step": 375470 - }, - { - "epoch": 0.65, - "learning_rate": 1.7260399627507265e-05, - "loss": 2.2888, - "step": 375480 - }, - { - "epoch": 0.65, - "learning_rate": 1.725952768758044e-05, - "loss": 2.2479, - "step": 375490 - }, - { - "epoch": 0.65, - "learning_rate": 1.725865574765361e-05, - "loss": 2.4127, - "step": 375500 - }, - { - "epoch": 0.65, - "learning_rate": 1.7257783807726786e-05, - "loss": 2.309, - "step": 375510 - }, - { - "epoch": 0.65, - "learning_rate": 1.7256911867799956e-05, - "loss": 2.3385, - "step": 375520 - }, - { - "epoch": 0.65, - "learning_rate": 1.725603992787313e-05, - "loss": 2.3173, - "step": 375530 - }, - { - "epoch": 0.65, - "learning_rate": 1.7255167987946304e-05, - "loss": 2.3823, - "step": 375540 - }, - { - "epoch": 0.65, - "learning_rate": 1.7254296048019478e-05, - "loss": 2.3379, - "step": 375550 - }, - { - "epoch": 0.65, - "learning_rate": 1.725342410809265e-05, - "loss": 2.2879, - "step": 375560 - }, - { - "epoch": 0.65, - "learning_rate": 1.7252552168165822e-05, - "loss": 2.3568, - "step": 375570 - }, - { - "epoch": 0.65, - "learning_rate": 1.7251680228238996e-05, - "loss": 2.4165, - "step": 375580 - }, - { - "epoch": 0.65, - "learning_rate": 1.725080828831217e-05, - "loss": 2.2293, - "step": 375590 - }, - { - "epoch": 0.66, - "learning_rate": 1.7249936348385343e-05, - "loss": 2.2643, - "step": 375600 - }, - { - "epoch": 0.66, - "learning_rate": 1.7249064408458514e-05, - "loss": 2.2292, - "step": 375610 - }, - { - "epoch": 0.66, - "learning_rate": 1.7248192468531687e-05, - "loss": 2.3175, - "step": 375620 - }, - { - "epoch": 0.66, - "learning_rate": 1.7247320528604864e-05, - "loss": 2.4241, - "step": 375630 - }, - { - "epoch": 0.66, - "learning_rate": 1.7246448588678035e-05, - "loss": 2.4184, - "step": 375640 - }, - { - "epoch": 0.66, - "learning_rate": 1.724557664875121e-05, - "loss": 2.2992, - "step": 375650 - }, - { - "epoch": 0.66, - "learning_rate": 1.7244704708824382e-05, - "loss": 2.2606, - "step": 375660 - }, - { - "epoch": 0.66, - "learning_rate": 1.7243832768897556e-05, - "loss": 2.3886, - "step": 375670 - }, - { - "epoch": 0.66, - "learning_rate": 1.7242960828970727e-05, - "loss": 2.3281, - "step": 375680 - }, - { - "epoch": 0.66, - "learning_rate": 1.72420888890439e-05, - "loss": 2.256, - "step": 375690 - }, - { - "epoch": 0.66, - "learning_rate": 1.7241216949117074e-05, - "loss": 2.2784, - "step": 375700 - }, - { - "epoch": 0.66, - "learning_rate": 1.7240345009190248e-05, - "loss": 2.1952, - "step": 375710 - }, - { - "epoch": 0.66, - "learning_rate": 1.723947306926342e-05, - "loss": 2.3177, - "step": 375720 - }, - { - "epoch": 0.66, - "learning_rate": 1.7238601129336592e-05, - "loss": 2.269, - "step": 375730 - }, - { - "epoch": 0.66, - "learning_rate": 1.723772918940977e-05, - "loss": 2.3198, - "step": 375740 - }, - { - "epoch": 0.66, - "learning_rate": 1.723685724948294e-05, - "loss": 2.2882, - "step": 375750 - }, - { - "epoch": 0.66, - "learning_rate": 1.7235985309556113e-05, - "loss": 2.4664, - "step": 375760 - }, - { - "epoch": 0.66, - "learning_rate": 1.7235113369629287e-05, - "loss": 2.2876, - "step": 375770 - }, - { - "epoch": 0.66, - "learning_rate": 1.723424142970246e-05, - "loss": 2.3938, - "step": 375780 - }, - { - "epoch": 0.66, - "learning_rate": 1.7233369489775635e-05, - "loss": 2.3803, - "step": 375790 - }, - { - "epoch": 0.66, - "learning_rate": 1.7232497549848805e-05, - "loss": 2.2911, - "step": 375800 - }, - { - "epoch": 0.66, - "learning_rate": 1.7231625609921982e-05, - "loss": 2.3454, - "step": 375810 - }, - { - "epoch": 0.66, - "learning_rate": 1.7230753669995153e-05, - "loss": 2.3849, - "step": 375820 - }, - { - "epoch": 0.66, - "learning_rate": 1.7229881730068326e-05, - "loss": 2.3189, - "step": 375830 - }, - { - "epoch": 0.66, - "learning_rate": 1.7229009790141497e-05, - "loss": 2.3178, - "step": 375840 - }, - { - "epoch": 0.66, - "learning_rate": 1.7228137850214674e-05, - "loss": 2.39, - "step": 375850 - }, - { - "epoch": 0.66, - "learning_rate": 1.7227265910287844e-05, - "loss": 2.2492, - "step": 375860 - }, - { - "epoch": 0.66, - "learning_rate": 1.7226393970361018e-05, - "loss": 2.2546, - "step": 375870 - }, - { - "epoch": 0.66, - "learning_rate": 1.7225522030434192e-05, - "loss": 2.25, - "step": 375880 - }, - { - "epoch": 0.66, - "learning_rate": 1.7224650090507366e-05, - "loss": 2.3295, - "step": 375890 - }, - { - "epoch": 0.66, - "learning_rate": 1.722377815058054e-05, - "loss": 2.3812, - "step": 375900 - }, - { - "epoch": 0.66, - "learning_rate": 1.722290621065371e-05, - "loss": 2.3599, - "step": 375910 - }, - { - "epoch": 0.66, - "learning_rate": 1.7222034270726887e-05, - "loss": 2.2841, - "step": 375920 - }, - { - "epoch": 0.66, - "learning_rate": 1.7221162330800057e-05, - "loss": 2.3279, - "step": 375930 - }, - { - "epoch": 0.66, - "learning_rate": 1.722029039087323e-05, - "loss": 2.2333, - "step": 375940 - }, - { - "epoch": 0.66, - "learning_rate": 1.7219418450946405e-05, - "loss": 2.3255, - "step": 375950 - }, - { - "epoch": 0.66, - "learning_rate": 1.721854651101958e-05, - "loss": 2.3555, - "step": 375960 - }, - { - "epoch": 0.66, - "learning_rate": 1.7217674571092752e-05, - "loss": 2.2656, - "step": 375970 - }, - { - "epoch": 0.66, - "learning_rate": 1.7216802631165923e-05, - "loss": 2.4115, - "step": 375980 - }, - { - "epoch": 0.66, - "learning_rate": 1.7215930691239096e-05, - "loss": 2.2956, - "step": 375990 - }, - { - "epoch": 0.66, - "learning_rate": 1.721505875131227e-05, - "loss": 2.3194, - "step": 376000 - }, - { - "epoch": 0.66, - "learning_rate": 1.7214186811385444e-05, - "loss": 2.3228, - "step": 376010 - }, - { - "epoch": 0.66, - "learning_rate": 1.7213314871458618e-05, - "loss": 2.4089, - "step": 376020 - }, - { - "epoch": 0.66, - "learning_rate": 1.7212442931531788e-05, - "loss": 2.2939, - "step": 376030 - }, - { - "epoch": 0.66, - "learning_rate": 1.7211570991604965e-05, - "loss": 2.4491, - "step": 376040 - }, - { - "epoch": 0.66, - "learning_rate": 1.7210699051678136e-05, - "loss": 2.3837, - "step": 376050 - }, - { - "epoch": 0.66, - "learning_rate": 1.720982711175131e-05, - "loss": 2.321, - "step": 376060 - }, - { - "epoch": 0.66, - "learning_rate": 1.7208955171824483e-05, - "loss": 2.3258, - "step": 376070 - }, - { - "epoch": 0.66, - "learning_rate": 1.7208083231897657e-05, - "loss": 2.4234, - "step": 376080 - }, - { - "epoch": 0.66, - "learning_rate": 1.7207211291970827e-05, - "loss": 2.2667, - "step": 376090 - }, - { - "epoch": 0.66, - "learning_rate": 1.7206339352044e-05, - "loss": 2.3498, - "step": 376100 - }, - { - "epoch": 0.66, - "learning_rate": 1.7205467412117175e-05, - "loss": 2.3615, - "step": 376110 - }, - { - "epoch": 0.66, - "learning_rate": 1.720459547219035e-05, - "loss": 2.3519, - "step": 376120 - }, - { - "epoch": 0.66, - "learning_rate": 1.7203723532263522e-05, - "loss": 2.2793, - "step": 376130 - }, - { - "epoch": 0.66, - "learning_rate": 1.7202851592336693e-05, - "loss": 2.3378, - "step": 376140 - }, - { - "epoch": 0.66, - "learning_rate": 1.720197965240987e-05, - "loss": 2.4385, - "step": 376150 - }, - { - "epoch": 0.66, - "learning_rate": 1.720110771248304e-05, - "loss": 2.29, - "step": 376160 - }, - { - "epoch": 0.66, - "learning_rate": 1.7200235772556214e-05, - "loss": 2.3251, - "step": 376170 - }, - { - "epoch": 0.66, - "learning_rate": 1.7199363832629388e-05, - "loss": 2.2812, - "step": 376180 - }, - { - "epoch": 0.66, - "learning_rate": 1.7198491892702562e-05, - "loss": 2.3325, - "step": 376190 - }, - { - "epoch": 0.66, - "learning_rate": 1.7197619952775735e-05, - "loss": 2.1982, - "step": 376200 - }, - { - "epoch": 0.66, - "learning_rate": 1.7196748012848906e-05, - "loss": 2.248, - "step": 376210 - }, - { - "epoch": 0.66, - "learning_rate": 1.7195876072922083e-05, - "loss": 2.2284, - "step": 376220 - }, - { - "epoch": 0.66, - "learning_rate": 1.7195004132995253e-05, - "loss": 2.2671, - "step": 376230 - }, - { - "epoch": 0.66, - "learning_rate": 1.7194132193068427e-05, - "loss": 2.3553, - "step": 376240 - }, - { - "epoch": 0.66, - "learning_rate": 1.71932602531416e-05, - "loss": 2.3795, - "step": 376250 - }, - { - "epoch": 0.66, - "learning_rate": 1.7192388313214775e-05, - "loss": 2.2452, - "step": 376260 - }, - { - "epoch": 0.66, - "learning_rate": 1.719151637328795e-05, - "loss": 2.3192, - "step": 376270 - }, - { - "epoch": 0.66, - "learning_rate": 1.719064443336112e-05, - "loss": 2.2991, - "step": 376280 - }, - { - "epoch": 0.66, - "learning_rate": 1.7189772493434293e-05, - "loss": 2.3045, - "step": 376290 - }, - { - "epoch": 0.66, - "learning_rate": 1.7188900553507466e-05, - "loss": 2.3769, - "step": 376300 - }, - { - "epoch": 0.66, - "learning_rate": 1.718802861358064e-05, - "loss": 2.4355, - "step": 376310 - }, - { - "epoch": 0.66, - "learning_rate": 1.718715667365381e-05, - "loss": 2.2772, - "step": 376320 - }, - { - "epoch": 0.66, - "learning_rate": 1.7186284733726988e-05, - "loss": 2.33, - "step": 376330 - }, - { - "epoch": 0.66, - "learning_rate": 1.7185412793800158e-05, - "loss": 2.2936, - "step": 376340 - }, - { - "epoch": 0.66, - "learning_rate": 1.7184540853873332e-05, - "loss": 2.3024, - "step": 376350 - }, - { - "epoch": 0.66, - "learning_rate": 1.7183668913946506e-05, - "loss": 2.3339, - "step": 376360 - }, - { - "epoch": 0.66, - "learning_rate": 1.718279697401968e-05, - "loss": 2.4032, - "step": 376370 - }, - { - "epoch": 0.66, - "learning_rate": 1.7181925034092853e-05, - "loss": 2.2299, - "step": 376380 - }, - { - "epoch": 0.66, - "learning_rate": 1.7181053094166024e-05, - "loss": 2.2654, - "step": 376390 - }, - { - "epoch": 0.66, - "learning_rate": 1.7180181154239197e-05, - "loss": 2.2119, - "step": 376400 - }, - { - "epoch": 0.66, - "learning_rate": 1.717930921431237e-05, - "loss": 2.3239, - "step": 376410 - }, - { - "epoch": 0.66, - "learning_rate": 1.7178437274385545e-05, - "loss": 2.2742, - "step": 376420 - }, - { - "epoch": 0.66, - "learning_rate": 1.717756533445872e-05, - "loss": 2.2986, - "step": 376430 - }, - { - "epoch": 0.66, - "learning_rate": 1.7176693394531892e-05, - "loss": 2.3, - "step": 376440 - }, - { - "epoch": 0.66, - "learning_rate": 1.7175821454605066e-05, - "loss": 2.2809, - "step": 376450 - }, - { - "epoch": 0.66, - "learning_rate": 1.7174949514678237e-05, - "loss": 2.2113, - "step": 376460 - }, - { - "epoch": 0.66, - "learning_rate": 1.717407757475141e-05, - "loss": 2.3567, - "step": 376470 - }, - { - "epoch": 0.66, - "learning_rate": 1.7173205634824584e-05, - "loss": 2.2627, - "step": 376480 - }, - { - "epoch": 0.66, - "learning_rate": 1.7172333694897758e-05, - "loss": 2.2996, - "step": 376490 - }, - { - "epoch": 0.66, - "learning_rate": 1.717146175497093e-05, - "loss": 2.3617, - "step": 376500 - }, - { - "epoch": 0.66, - "learning_rate": 1.7170589815044102e-05, - "loss": 2.3106, - "step": 376510 - }, - { - "epoch": 0.66, - "learning_rate": 1.716971787511728e-05, - "loss": 2.3109, - "step": 376520 - }, - { - "epoch": 0.66, - "learning_rate": 1.716884593519045e-05, - "loss": 2.3088, - "step": 376530 - }, - { - "epoch": 0.66, - "learning_rate": 1.7167973995263623e-05, - "loss": 2.3279, - "step": 376540 - }, - { - "epoch": 0.66, - "learning_rate": 1.7167102055336794e-05, - "loss": 2.3396, - "step": 376550 - }, - { - "epoch": 0.66, - "learning_rate": 1.716623011540997e-05, - "loss": 2.2212, - "step": 376560 - }, - { - "epoch": 0.66, - "learning_rate": 1.716535817548314e-05, - "loss": 2.3122, - "step": 376570 - }, - { - "epoch": 0.66, - "learning_rate": 1.7164486235556315e-05, - "loss": 2.2867, - "step": 376580 - }, - { - "epoch": 0.66, - "learning_rate": 1.716361429562949e-05, - "loss": 2.262, - "step": 376590 - }, - { - "epoch": 0.66, - "learning_rate": 1.7162742355702663e-05, - "loss": 2.4606, - "step": 376600 - }, - { - "epoch": 0.66, - "learning_rate": 1.7161870415775836e-05, - "loss": 2.319, - "step": 376610 - }, - { - "epoch": 0.66, - "learning_rate": 1.7160998475849007e-05, - "loss": 2.3659, - "step": 376620 - }, - { - "epoch": 0.66, - "learning_rate": 1.7160126535922184e-05, - "loss": 2.3698, - "step": 376630 - }, - { - "epoch": 0.66, - "learning_rate": 1.7159254595995354e-05, - "loss": 2.3712, - "step": 376640 - }, - { - "epoch": 0.66, - "learning_rate": 1.7158382656068528e-05, - "loss": 2.3056, - "step": 376650 - }, - { - "epoch": 0.66, - "learning_rate": 1.7157510716141702e-05, - "loss": 2.2843, - "step": 376660 - }, - { - "epoch": 0.66, - "learning_rate": 1.7156638776214876e-05, - "loss": 2.3583, - "step": 376670 - }, - { - "epoch": 0.66, - "learning_rate": 1.715576683628805e-05, - "loss": 2.3201, - "step": 376680 - }, - { - "epoch": 0.66, - "learning_rate": 1.715489489636122e-05, - "loss": 2.4041, - "step": 376690 - }, - { - "epoch": 0.66, - "learning_rate": 1.7154022956434393e-05, - "loss": 2.3372, - "step": 376700 - }, - { - "epoch": 0.66, - "learning_rate": 1.7153151016507567e-05, - "loss": 2.4112, - "step": 376710 - }, - { - "epoch": 0.66, - "learning_rate": 1.715227907658074e-05, - "loss": 2.2633, - "step": 376720 - }, - { - "epoch": 0.66, - "learning_rate": 1.715140713665391e-05, - "loss": 2.3954, - "step": 376730 - }, - { - "epoch": 0.66, - "learning_rate": 1.715053519672709e-05, - "loss": 2.3131, - "step": 376740 - }, - { - "epoch": 0.66, - "learning_rate": 1.7149663256800262e-05, - "loss": 2.3413, - "step": 376750 - }, - { - "epoch": 0.66, - "learning_rate": 1.7148791316873433e-05, - "loss": 2.2829, - "step": 376760 - }, - { - "epoch": 0.66, - "learning_rate": 1.7147919376946606e-05, - "loss": 2.1798, - "step": 376770 - }, - { - "epoch": 0.66, - "learning_rate": 1.714704743701978e-05, - "loss": 2.2614, - "step": 376780 - }, - { - "epoch": 0.66, - "learning_rate": 1.7146175497092954e-05, - "loss": 2.283, - "step": 376790 - }, - { - "epoch": 0.66, - "learning_rate": 1.7145303557166124e-05, - "loss": 2.2649, - "step": 376800 - }, - { - "epoch": 0.66, - "learning_rate": 1.7144431617239298e-05, - "loss": 2.3022, - "step": 376810 - }, - { - "epoch": 0.66, - "learning_rate": 1.7143559677312472e-05, - "loss": 2.2907, - "step": 376820 - }, - { - "epoch": 0.66, - "learning_rate": 1.7142687737385646e-05, - "loss": 2.3141, - "step": 376830 - }, - { - "epoch": 0.66, - "learning_rate": 1.714181579745882e-05, - "loss": 2.3376, - "step": 376840 - }, - { - "epoch": 0.66, - "learning_rate": 1.7140943857531993e-05, - "loss": 2.418, - "step": 376850 - }, - { - "epoch": 0.66, - "learning_rate": 1.7140071917605167e-05, - "loss": 2.3139, - "step": 376860 - }, - { - "epoch": 0.66, - "learning_rate": 1.7139199977678337e-05, - "loss": 2.2822, - "step": 376870 - }, - { - "epoch": 0.66, - "learning_rate": 1.713832803775151e-05, - "loss": 2.3465, - "step": 376880 - }, - { - "epoch": 0.66, - "learning_rate": 1.7137456097824685e-05, - "loss": 2.274, - "step": 376890 - }, - { - "epoch": 0.66, - "learning_rate": 1.713658415789786e-05, - "loss": 2.3388, - "step": 376900 - }, - { - "epoch": 0.66, - "learning_rate": 1.7135712217971032e-05, - "loss": 2.2683, - "step": 376910 - }, - { - "epoch": 0.66, - "learning_rate": 1.7134840278044203e-05, - "loss": 2.2526, - "step": 376920 - }, - { - "epoch": 0.66, - "learning_rate": 1.713396833811738e-05, - "loss": 2.3153, - "step": 376930 - }, - { - "epoch": 0.66, - "learning_rate": 1.713309639819055e-05, - "loss": 2.3301, - "step": 376940 - }, - { - "epoch": 0.66, - "learning_rate": 1.7132224458263724e-05, - "loss": 2.4038, - "step": 376950 - }, - { - "epoch": 0.66, - "learning_rate": 1.7131352518336895e-05, - "loss": 2.3335, - "step": 376960 - }, - { - "epoch": 0.66, - "learning_rate": 1.7130480578410072e-05, - "loss": 2.3305, - "step": 376970 - }, - { - "epoch": 0.66, - "learning_rate": 1.7129608638483245e-05, - "loss": 2.3115, - "step": 376980 - }, - { - "epoch": 0.66, - "learning_rate": 1.7128736698556416e-05, - "loss": 2.3609, - "step": 376990 - }, - { - "epoch": 0.66, - "learning_rate": 1.7127864758629593e-05, - "loss": 2.2604, - "step": 377000 - }, - { - "epoch": 0.66, - "learning_rate": 1.7126992818702763e-05, - "loss": 2.279, - "step": 377010 - }, - { - "epoch": 0.66, - "learning_rate": 1.7126120878775937e-05, - "loss": 2.3645, - "step": 377020 - }, - { - "epoch": 0.66, - "learning_rate": 1.7125248938849108e-05, - "loss": 2.3025, - "step": 377030 - }, - { - "epoch": 0.66, - "learning_rate": 1.7124376998922285e-05, - "loss": 2.1676, - "step": 377040 - }, - { - "epoch": 0.66, - "learning_rate": 1.7123505058995455e-05, - "loss": 2.3451, - "step": 377050 - }, - { - "epoch": 0.66, - "learning_rate": 1.712263311906863e-05, - "loss": 2.3725, - "step": 377060 - }, - { - "epoch": 0.66, - "learning_rate": 1.7121761179141803e-05, - "loss": 2.2315, - "step": 377070 - }, - { - "epoch": 0.66, - "learning_rate": 1.7120889239214976e-05, - "loss": 2.2598, - "step": 377080 - }, - { - "epoch": 0.66, - "learning_rate": 1.712001729928815e-05, - "loss": 2.2407, - "step": 377090 - }, - { - "epoch": 0.66, - "learning_rate": 1.711914535936132e-05, - "loss": 2.3115, - "step": 377100 - }, - { - "epoch": 0.66, - "learning_rate": 1.7118273419434498e-05, - "loss": 2.3715, - "step": 377110 - }, - { - "epoch": 0.66, - "learning_rate": 1.7117401479507668e-05, - "loss": 2.38, - "step": 377120 - }, - { - "epoch": 0.66, - "learning_rate": 1.7116529539580842e-05, - "loss": 2.392, - "step": 377130 - }, - { - "epoch": 0.66, - "learning_rate": 1.7115657599654016e-05, - "loss": 2.3416, - "step": 377140 - }, - { - "epoch": 0.66, - "learning_rate": 1.711478565972719e-05, - "loss": 2.1535, - "step": 377150 - }, - { - "epoch": 0.66, - "learning_rate": 1.7113913719800363e-05, - "loss": 2.3792, - "step": 377160 - }, - { - "epoch": 0.66, - "learning_rate": 1.7113041779873534e-05, - "loss": 2.2359, - "step": 377170 - }, - { - "epoch": 0.66, - "learning_rate": 1.7112169839946707e-05, - "loss": 2.2679, - "step": 377180 - }, - { - "epoch": 0.66, - "learning_rate": 1.711129790001988e-05, - "loss": 2.3482, - "step": 377190 - }, - { - "epoch": 0.66, - "learning_rate": 1.7110425960093055e-05, - "loss": 2.3144, - "step": 377200 - }, - { - "epoch": 0.66, - "learning_rate": 1.7109554020166225e-05, - "loss": 2.2572, - "step": 377210 - }, - { - "epoch": 0.66, - "learning_rate": 1.71086820802394e-05, - "loss": 2.3864, - "step": 377220 - }, - { - "epoch": 0.66, - "learning_rate": 1.7107810140312576e-05, - "loss": 2.3612, - "step": 377230 - }, - { - "epoch": 0.66, - "learning_rate": 1.7106938200385747e-05, - "loss": 2.3038, - "step": 377240 - }, - { - "epoch": 0.66, - "learning_rate": 1.710606626045892e-05, - "loss": 2.3396, - "step": 377250 - }, - { - "epoch": 0.66, - "learning_rate": 1.7105194320532094e-05, - "loss": 2.2442, - "step": 377260 - }, - { - "epoch": 0.66, - "learning_rate": 1.7104322380605268e-05, - "loss": 2.267, - "step": 377270 - }, - { - "epoch": 0.66, - "learning_rate": 1.7103450440678438e-05, - "loss": 2.4166, - "step": 377280 - }, - { - "epoch": 0.66, - "learning_rate": 1.7102578500751612e-05, - "loss": 2.2742, - "step": 377290 - }, - { - "epoch": 0.66, - "learning_rate": 1.7101706560824786e-05, - "loss": 2.3426, - "step": 377300 - }, - { - "epoch": 0.66, - "learning_rate": 1.710083462089796e-05, - "loss": 2.327, - "step": 377310 - }, - { - "epoch": 0.66, - "learning_rate": 1.7099962680971133e-05, - "loss": 2.3988, - "step": 377320 - }, - { - "epoch": 0.66, - "learning_rate": 1.7099090741044304e-05, - "loss": 2.2704, - "step": 377330 - }, - { - "epoch": 0.66, - "learning_rate": 1.709821880111748e-05, - "loss": 2.3464, - "step": 377340 - }, - { - "epoch": 0.66, - "learning_rate": 1.709734686119065e-05, - "loss": 2.3414, - "step": 377350 - }, - { - "epoch": 0.66, - "learning_rate": 1.7096474921263825e-05, - "loss": 2.3453, - "step": 377360 - }, - { - "epoch": 0.66, - "learning_rate": 1.7095602981337e-05, - "loss": 2.3095, - "step": 377370 - }, - { - "epoch": 0.66, - "learning_rate": 1.7094731041410173e-05, - "loss": 2.3575, - "step": 377380 - }, - { - "epoch": 0.66, - "learning_rate": 1.7093859101483346e-05, - "loss": 2.2285, - "step": 377390 - }, - { - "epoch": 0.66, - "learning_rate": 1.7092987161556517e-05, - "loss": 2.3102, - "step": 377400 - }, - { - "epoch": 0.66, - "learning_rate": 1.7092115221629694e-05, - "loss": 2.3551, - "step": 377410 - }, - { - "epoch": 0.66, - "learning_rate": 1.7091243281702864e-05, - "loss": 2.3226, - "step": 377420 - }, - { - "epoch": 0.66, - "learning_rate": 1.7090371341776038e-05, - "loss": 2.2741, - "step": 377430 - }, - { - "epoch": 0.66, - "learning_rate": 1.708949940184921e-05, - "loss": 2.2649, - "step": 377440 - }, - { - "epoch": 0.66, - "learning_rate": 1.7088627461922386e-05, - "loss": 2.3195, - "step": 377450 - }, - { - "epoch": 0.66, - "learning_rate": 1.7087755521995556e-05, - "loss": 2.3501, - "step": 377460 - }, - { - "epoch": 0.66, - "learning_rate": 1.708688358206873e-05, - "loss": 2.4342, - "step": 377470 - }, - { - "epoch": 0.66, - "learning_rate": 1.7086011642141903e-05, - "loss": 2.3165, - "step": 377480 - }, - { - "epoch": 0.66, - "learning_rate": 1.7085139702215077e-05, - "loss": 2.394, - "step": 377490 - }, - { - "epoch": 0.66, - "learning_rate": 1.708426776228825e-05, - "loss": 2.3717, - "step": 377500 - }, - { - "epoch": 0.66, - "learning_rate": 1.708339582236142e-05, - "loss": 2.4768, - "step": 377510 - }, - { - "epoch": 0.66, - "learning_rate": 1.70825238824346e-05, - "loss": 2.2463, - "step": 377520 - }, - { - "epoch": 0.66, - "learning_rate": 1.708165194250777e-05, - "loss": 2.3012, - "step": 377530 - }, - { - "epoch": 0.66, - "learning_rate": 1.7080780002580943e-05, - "loss": 2.1724, - "step": 377540 - }, - { - "epoch": 0.66, - "learning_rate": 1.7079908062654116e-05, - "loss": 2.4287, - "step": 377550 - }, - { - "epoch": 0.66, - "learning_rate": 1.707903612272729e-05, - "loss": 2.3515, - "step": 377560 - }, - { - "epoch": 0.66, - "learning_rate": 1.7078164182800464e-05, - "loss": 2.3111, - "step": 377570 - }, - { - "epoch": 0.66, - "learning_rate": 1.7077292242873634e-05, - "loss": 2.293, - "step": 377580 - }, - { - "epoch": 0.66, - "learning_rate": 1.7076420302946808e-05, - "loss": 2.3878, - "step": 377590 - }, - { - "epoch": 0.66, - "learning_rate": 1.7075548363019982e-05, - "loss": 2.3848, - "step": 377600 - }, - { - "epoch": 0.66, - "learning_rate": 1.7074676423093156e-05, - "loss": 2.3543, - "step": 377610 - }, - { - "epoch": 0.66, - "learning_rate": 1.707380448316633e-05, - "loss": 2.2992, - "step": 377620 - }, - { - "epoch": 0.66, - "learning_rate": 1.70729325432395e-05, - "loss": 2.3942, - "step": 377630 - }, - { - "epoch": 0.66, - "learning_rate": 1.7072060603312677e-05, - "loss": 2.4457, - "step": 377640 - }, - { - "epoch": 0.66, - "learning_rate": 1.7071188663385847e-05, - "loss": 2.3576, - "step": 377650 - }, - { - "epoch": 0.66, - "learning_rate": 1.707031672345902e-05, - "loss": 2.3072, - "step": 377660 - }, - { - "epoch": 0.66, - "learning_rate": 1.7069444783532195e-05, - "loss": 2.4321, - "step": 377670 - }, - { - "epoch": 0.66, - "learning_rate": 1.706857284360537e-05, - "loss": 2.3622, - "step": 377680 - }, - { - "epoch": 0.66, - "learning_rate": 1.706770090367854e-05, - "loss": 2.2443, - "step": 377690 - }, - { - "epoch": 0.66, - "learning_rate": 1.7066828963751713e-05, - "loss": 2.2599, - "step": 377700 - }, - { - "epoch": 0.66, - "learning_rate": 1.706595702382489e-05, - "loss": 2.3395, - "step": 377710 - }, - { - "epoch": 0.66, - "learning_rate": 1.706508508389806e-05, - "loss": 2.3461, - "step": 377720 - }, - { - "epoch": 0.66, - "learning_rate": 1.7064213143971234e-05, - "loss": 2.2846, - "step": 377730 - }, - { - "epoch": 0.66, - "learning_rate": 1.7063341204044405e-05, - "loss": 2.2761, - "step": 377740 - }, - { - "epoch": 0.66, - "learning_rate": 1.7062469264117582e-05, - "loss": 2.3283, - "step": 377750 - }, - { - "epoch": 0.66, - "learning_rate": 1.7061597324190752e-05, - "loss": 2.3882, - "step": 377760 - }, - { - "epoch": 0.66, - "learning_rate": 1.7060725384263926e-05, - "loss": 2.4112, - "step": 377770 - }, - { - "epoch": 0.66, - "learning_rate": 1.70598534443371e-05, - "loss": 2.1841, - "step": 377780 - }, - { - "epoch": 0.66, - "learning_rate": 1.7058981504410273e-05, - "loss": 2.3539, - "step": 377790 - }, - { - "epoch": 0.66, - "learning_rate": 1.7058109564483447e-05, - "loss": 2.3053, - "step": 377800 - }, - { - "epoch": 0.66, - "learning_rate": 1.7057237624556618e-05, - "loss": 2.3519, - "step": 377810 - }, - { - "epoch": 0.66, - "learning_rate": 1.7056365684629795e-05, - "loss": 2.3156, - "step": 377820 - }, - { - "epoch": 0.66, - "learning_rate": 1.7055493744702965e-05, - "loss": 2.3775, - "step": 377830 - }, - { - "epoch": 0.66, - "learning_rate": 1.705462180477614e-05, - "loss": 2.3189, - "step": 377840 - }, - { - "epoch": 0.66, - "learning_rate": 1.7053749864849313e-05, - "loss": 2.4247, - "step": 377850 - }, - { - "epoch": 0.66, - "learning_rate": 1.7052877924922486e-05, - "loss": 2.315, - "step": 377860 - }, - { - "epoch": 0.66, - "learning_rate": 1.705200598499566e-05, - "loss": 2.3539, - "step": 377870 - }, - { - "epoch": 0.66, - "learning_rate": 1.705113404506883e-05, - "loss": 2.341, - "step": 377880 - }, - { - "epoch": 0.66, - "learning_rate": 1.7050262105142004e-05, - "loss": 2.283, - "step": 377890 - }, - { - "epoch": 0.66, - "learning_rate": 1.7049390165215178e-05, - "loss": 2.2999, - "step": 377900 - }, - { - "epoch": 0.66, - "learning_rate": 1.7048518225288352e-05, - "loss": 2.3354, - "step": 377910 - }, - { - "epoch": 0.66, - "learning_rate": 1.7047646285361522e-05, - "loss": 2.3697, - "step": 377920 - }, - { - "epoch": 0.66, - "learning_rate": 1.70467743454347e-05, - "loss": 2.3228, - "step": 377930 - }, - { - "epoch": 0.66, - "learning_rate": 1.704590240550787e-05, - "loss": 2.4005, - "step": 377940 - }, - { - "epoch": 0.66, - "learning_rate": 1.7045030465581044e-05, - "loss": 2.4584, - "step": 377950 - }, - { - "epoch": 0.66, - "learning_rate": 1.7044158525654217e-05, - "loss": 2.383, - "step": 377960 - }, - { - "epoch": 0.66, - "learning_rate": 1.704328658572739e-05, - "loss": 2.2226, - "step": 377970 - }, - { - "epoch": 0.66, - "learning_rate": 1.7042414645800565e-05, - "loss": 2.3378, - "step": 377980 - }, - { - "epoch": 0.66, - "learning_rate": 1.7041542705873735e-05, - "loss": 2.3098, - "step": 377990 - }, - { - "epoch": 0.66, - "learning_rate": 1.704067076594691e-05, - "loss": 2.3501, - "step": 378000 - }, - { - "epoch": 0.66, - "learning_rate": 1.7039798826020083e-05, - "loss": 2.358, - "step": 378010 - }, - { - "epoch": 0.66, - "learning_rate": 1.7038926886093257e-05, - "loss": 2.3389, - "step": 378020 - }, - { - "epoch": 0.66, - "learning_rate": 1.703805494616643e-05, - "loss": 2.2295, - "step": 378030 - }, - { - "epoch": 0.66, - "learning_rate": 1.7037183006239604e-05, - "loss": 2.2579, - "step": 378040 - }, - { - "epoch": 0.66, - "learning_rate": 1.7036311066312778e-05, - "loss": 2.1863, - "step": 378050 - }, - { - "epoch": 0.66, - "learning_rate": 1.7035439126385948e-05, - "loss": 2.3936, - "step": 378060 - }, - { - "epoch": 0.66, - "learning_rate": 1.7034567186459122e-05, - "loss": 2.2308, - "step": 378070 - }, - { - "epoch": 0.66, - "learning_rate": 1.7033695246532296e-05, - "loss": 2.3567, - "step": 378080 - }, - { - "epoch": 0.66, - "learning_rate": 1.703282330660547e-05, - "loss": 2.2988, - "step": 378090 - }, - { - "epoch": 0.66, - "learning_rate": 1.7031951366678643e-05, - "loss": 2.3501, - "step": 378100 - }, - { - "epoch": 0.66, - "learning_rate": 1.7031079426751814e-05, - "loss": 2.196, - "step": 378110 - }, - { - "epoch": 0.66, - "learning_rate": 1.703020748682499e-05, - "loss": 2.4058, - "step": 378120 - }, - { - "epoch": 0.66, - "learning_rate": 1.702933554689816e-05, - "loss": 2.3401, - "step": 378130 - }, - { - "epoch": 0.66, - "learning_rate": 1.7028463606971335e-05, - "loss": 2.2765, - "step": 378140 - }, - { - "epoch": 0.66, - "learning_rate": 1.7027591667044505e-05, - "loss": 2.2141, - "step": 378150 - }, - { - "epoch": 0.66, - "learning_rate": 1.7026719727117683e-05, - "loss": 2.3435, - "step": 378160 - }, - { - "epoch": 0.66, - "learning_rate": 1.7025847787190853e-05, - "loss": 2.0845, - "step": 378170 - }, - { - "epoch": 0.66, - "learning_rate": 1.7024975847264027e-05, - "loss": 2.272, - "step": 378180 - }, - { - "epoch": 0.66, - "learning_rate": 1.70241039073372e-05, - "loss": 2.2385, - "step": 378190 - }, - { - "epoch": 0.66, - "learning_rate": 1.7023231967410374e-05, - "loss": 2.3478, - "step": 378200 - }, - { - "epoch": 0.66, - "learning_rate": 1.7022360027483548e-05, - "loss": 2.2371, - "step": 378210 - }, - { - "epoch": 0.66, - "learning_rate": 1.702148808755672e-05, - "loss": 2.2299, - "step": 378220 - }, - { - "epoch": 0.66, - "learning_rate": 1.7020616147629896e-05, - "loss": 2.3502, - "step": 378230 - }, - { - "epoch": 0.66, - "learning_rate": 1.7019744207703066e-05, - "loss": 2.2712, - "step": 378240 - }, - { - "epoch": 0.66, - "learning_rate": 1.701887226777624e-05, - "loss": 2.3855, - "step": 378250 - }, - { - "epoch": 0.66, - "learning_rate": 1.7018000327849414e-05, - "loss": 2.2109, - "step": 378260 - }, - { - "epoch": 0.66, - "learning_rate": 1.7017128387922587e-05, - "loss": 2.1532, - "step": 378270 - }, - { - "epoch": 0.66, - "learning_rate": 1.701625644799576e-05, - "loss": 2.2835, - "step": 378280 - }, - { - "epoch": 0.66, - "learning_rate": 1.701538450806893e-05, - "loss": 2.3264, - "step": 378290 - }, - { - "epoch": 0.66, - "learning_rate": 1.701451256814211e-05, - "loss": 2.2487, - "step": 378300 - }, - { - "epoch": 0.66, - "learning_rate": 1.701364062821528e-05, - "loss": 2.3217, - "step": 378310 - }, - { - "epoch": 0.66, - "learning_rate": 1.7012768688288453e-05, - "loss": 2.3613, - "step": 378320 - }, - { - "epoch": 0.66, - "learning_rate": 1.7011896748361627e-05, - "loss": 2.436, - "step": 378330 - }, - { - "epoch": 0.66, - "learning_rate": 1.70110248084348e-05, - "loss": 2.4444, - "step": 378340 - }, - { - "epoch": 0.66, - "learning_rate": 1.7010152868507974e-05, - "loss": 2.337, - "step": 378350 - }, - { - "epoch": 0.66, - "learning_rate": 1.7009280928581144e-05, - "loss": 2.2757, - "step": 378360 - }, - { - "epoch": 0.66, - "learning_rate": 1.7008408988654318e-05, - "loss": 2.3246, - "step": 378370 - }, - { - "epoch": 0.66, - "learning_rate": 1.7007537048727492e-05, - "loss": 2.2979, - "step": 378380 - }, - { - "epoch": 0.66, - "learning_rate": 1.7006665108800666e-05, - "loss": 2.3299, - "step": 378390 - }, - { - "epoch": 0.66, - "learning_rate": 1.7005793168873836e-05, - "loss": 2.3018, - "step": 378400 - }, - { - "epoch": 0.66, - "learning_rate": 1.700492122894701e-05, - "loss": 2.243, - "step": 378410 - }, - { - "epoch": 0.66, - "learning_rate": 1.7004049289020184e-05, - "loss": 2.3251, - "step": 378420 - }, - { - "epoch": 0.66, - "learning_rate": 1.7003177349093357e-05, - "loss": 2.385, - "step": 378430 - }, - { - "epoch": 0.66, - "learning_rate": 1.700230540916653e-05, - "loss": 2.3255, - "step": 378440 - }, - { - "epoch": 0.66, - "learning_rate": 1.7001433469239705e-05, - "loss": 2.3163, - "step": 378450 - }, - { - "epoch": 0.66, - "learning_rate": 1.700056152931288e-05, - "loss": 2.2536, - "step": 378460 - }, - { - "epoch": 0.66, - "learning_rate": 1.699968958938605e-05, - "loss": 2.3505, - "step": 378470 - }, - { - "epoch": 0.66, - "learning_rate": 1.6998817649459223e-05, - "loss": 2.2433, - "step": 378480 - }, - { - "epoch": 0.66, - "learning_rate": 1.6997945709532397e-05, - "loss": 2.2847, - "step": 378490 - }, - { - "epoch": 0.66, - "learning_rate": 1.699707376960557e-05, - "loss": 2.3007, - "step": 378500 - }, - { - "epoch": 0.66, - "learning_rate": 1.6996201829678744e-05, - "loss": 2.2345, - "step": 378510 - }, - { - "epoch": 0.66, - "learning_rate": 1.6995329889751915e-05, - "loss": 2.2071, - "step": 378520 - }, - { - "epoch": 0.66, - "learning_rate": 1.6994457949825092e-05, - "loss": 2.2815, - "step": 378530 - }, - { - "epoch": 0.66, - "learning_rate": 1.6993586009898262e-05, - "loss": 2.381, - "step": 378540 - }, - { - "epoch": 0.66, - "learning_rate": 1.6992714069971436e-05, - "loss": 2.2736, - "step": 378550 - }, - { - "epoch": 0.66, - "learning_rate": 1.6991842130044606e-05, - "loss": 2.3192, - "step": 378560 - }, - { - "epoch": 0.66, - "learning_rate": 1.6990970190117783e-05, - "loss": 2.3101, - "step": 378570 - }, - { - "epoch": 0.66, - "learning_rate": 1.6990098250190957e-05, - "loss": 2.2067, - "step": 378580 - }, - { - "epoch": 0.66, - "learning_rate": 1.6989226310264128e-05, - "loss": 2.3342, - "step": 378590 - }, - { - "epoch": 0.66, - "learning_rate": 1.6988354370337305e-05, - "loss": 2.2857, - "step": 378600 - }, - { - "epoch": 0.66, - "learning_rate": 1.6987482430410475e-05, - "loss": 2.2346, - "step": 378610 - }, - { - "epoch": 0.66, - "learning_rate": 1.698661049048365e-05, - "loss": 2.2118, - "step": 378620 - }, - { - "epoch": 0.66, - "learning_rate": 1.698573855055682e-05, - "loss": 2.2459, - "step": 378630 - }, - { - "epoch": 0.66, - "learning_rate": 1.6984866610629996e-05, - "loss": 2.2423, - "step": 378640 - }, - { - "epoch": 0.66, - "learning_rate": 1.6983994670703167e-05, - "loss": 2.1942, - "step": 378650 - }, - { - "epoch": 0.66, - "learning_rate": 1.698312273077634e-05, - "loss": 2.3597, - "step": 378660 - }, - { - "epoch": 0.66, - "learning_rate": 1.6982250790849514e-05, - "loss": 2.3653, - "step": 378670 - }, - { - "epoch": 0.66, - "learning_rate": 1.6981378850922688e-05, - "loss": 2.3409, - "step": 378680 - }, - { - "epoch": 0.66, - "learning_rate": 1.6980506910995862e-05, - "loss": 2.377, - "step": 378690 - }, - { - "epoch": 0.66, - "learning_rate": 1.6979634971069032e-05, - "loss": 2.3434, - "step": 378700 - }, - { - "epoch": 0.66, - "learning_rate": 1.697876303114221e-05, - "loss": 2.4115, - "step": 378710 - }, - { - "epoch": 0.66, - "learning_rate": 1.697789109121538e-05, - "loss": 2.3286, - "step": 378720 - }, - { - "epoch": 0.66, - "learning_rate": 1.6977019151288554e-05, - "loss": 2.4143, - "step": 378730 - }, - { - "epoch": 0.66, - "learning_rate": 1.6976147211361727e-05, - "loss": 2.3572, - "step": 378740 - }, - { - "epoch": 0.66, - "learning_rate": 1.69752752714349e-05, - "loss": 2.3128, - "step": 378750 - }, - { - "epoch": 0.66, - "learning_rate": 1.6974403331508075e-05, - "loss": 2.3076, - "step": 378760 - }, - { - "epoch": 0.66, - "learning_rate": 1.6973531391581245e-05, - "loss": 2.2322, - "step": 378770 - }, - { - "epoch": 0.66, - "learning_rate": 1.697265945165442e-05, - "loss": 2.2124, - "step": 378780 - }, - { - "epoch": 0.66, - "learning_rate": 1.6971787511727593e-05, - "loss": 2.2525, - "step": 378790 - }, - { - "epoch": 0.66, - "learning_rate": 1.6970915571800767e-05, - "loss": 2.3409, - "step": 378800 - }, - { - "epoch": 0.66, - "learning_rate": 1.6970043631873937e-05, - "loss": 2.2854, - "step": 378810 - }, - { - "epoch": 0.66, - "learning_rate": 1.696917169194711e-05, - "loss": 2.2584, - "step": 378820 - }, - { - "epoch": 0.66, - "learning_rate": 1.6968299752020288e-05, - "loss": 2.3947, - "step": 378830 - }, - { - "epoch": 0.66, - "learning_rate": 1.6967427812093458e-05, - "loss": 2.3206, - "step": 378840 - }, - { - "epoch": 0.66, - "learning_rate": 1.6966555872166632e-05, - "loss": 2.2515, - "step": 378850 - }, - { - "epoch": 0.66, - "learning_rate": 1.6965683932239806e-05, - "loss": 2.3863, - "step": 378860 - }, - { - "epoch": 0.66, - "learning_rate": 1.696481199231298e-05, - "loss": 2.3666, - "step": 378870 - }, - { - "epoch": 0.66, - "learning_rate": 1.696394005238615e-05, - "loss": 2.2851, - "step": 378880 - }, - { - "epoch": 0.66, - "learning_rate": 1.6963068112459324e-05, - "loss": 2.3509, - "step": 378890 - }, - { - "epoch": 0.66, - "learning_rate": 1.6962196172532498e-05, - "loss": 2.304, - "step": 378900 - }, - { - "epoch": 0.66, - "learning_rate": 1.696132423260567e-05, - "loss": 2.2751, - "step": 378910 - }, - { - "epoch": 0.66, - "learning_rate": 1.6960452292678845e-05, - "loss": 2.4239, - "step": 378920 - }, - { - "epoch": 0.66, - "learning_rate": 1.6959580352752015e-05, - "loss": 2.3318, - "step": 378930 - }, - { - "epoch": 0.66, - "learning_rate": 1.6958708412825193e-05, - "loss": 2.4103, - "step": 378940 - }, - { - "epoch": 0.66, - "learning_rate": 1.6957836472898363e-05, - "loss": 2.2837, - "step": 378950 - }, - { - "epoch": 0.66, - "learning_rate": 1.6956964532971537e-05, - "loss": 2.2952, - "step": 378960 - }, - { - "epoch": 0.66, - "learning_rate": 1.695609259304471e-05, - "loss": 2.3179, - "step": 378970 - }, - { - "epoch": 0.66, - "learning_rate": 1.6955220653117884e-05, - "loss": 2.3301, - "step": 378980 - }, - { - "epoch": 0.66, - "learning_rate": 1.6954348713191058e-05, - "loss": 2.3146, - "step": 378990 - }, - { - "epoch": 0.66, - "learning_rate": 1.695347677326423e-05, - "loss": 2.2709, - "step": 379000 - }, - { - "epoch": 0.66, - "learning_rate": 1.6952604833337406e-05, - "loss": 2.3873, - "step": 379010 - }, - { - "epoch": 0.66, - "learning_rate": 1.6951732893410576e-05, - "loss": 2.2461, - "step": 379020 - }, - { - "epoch": 0.66, - "learning_rate": 1.695086095348375e-05, - "loss": 2.2695, - "step": 379030 - }, - { - "epoch": 0.66, - "learning_rate": 1.694998901355692e-05, - "loss": 2.258, - "step": 379040 - }, - { - "epoch": 0.66, - "learning_rate": 1.6949117073630097e-05, - "loss": 2.2391, - "step": 379050 - }, - { - "epoch": 0.66, - "learning_rate": 1.694824513370327e-05, - "loss": 2.3418, - "step": 379060 - }, - { - "epoch": 0.66, - "learning_rate": 1.694737319377644e-05, - "loss": 2.3444, - "step": 379070 - }, - { - "epoch": 0.66, - "learning_rate": 1.6946501253849615e-05, - "loss": 2.3456, - "step": 379080 - }, - { - "epoch": 0.66, - "learning_rate": 1.694562931392279e-05, - "loss": 2.2599, - "step": 379090 - }, - { - "epoch": 0.66, - "learning_rate": 1.6944757373995963e-05, - "loss": 2.3778, - "step": 379100 - }, - { - "epoch": 0.66, - "learning_rate": 1.6943885434069133e-05, - "loss": 2.3186, - "step": 379110 - }, - { - "epoch": 0.66, - "learning_rate": 1.694301349414231e-05, - "loss": 2.3225, - "step": 379120 - }, - { - "epoch": 0.66, - "learning_rate": 1.694214155421548e-05, - "loss": 2.3823, - "step": 379130 - }, - { - "epoch": 0.66, - "learning_rate": 1.6941269614288654e-05, - "loss": 2.4048, - "step": 379140 - }, - { - "epoch": 0.66, - "learning_rate": 1.6940397674361828e-05, - "loss": 2.3883, - "step": 379150 - }, - { - "epoch": 0.66, - "learning_rate": 1.6939525734435002e-05, - "loss": 2.2612, - "step": 379160 - }, - { - "epoch": 0.66, - "learning_rate": 1.6938653794508176e-05, - "loss": 2.2646, - "step": 379170 - }, - { - "epoch": 0.66, - "learning_rate": 1.6937781854581346e-05, - "loss": 2.4043, - "step": 379180 - }, - { - "epoch": 0.66, - "learning_rate": 1.693690991465452e-05, - "loss": 2.398, - "step": 379190 - }, - { - "epoch": 0.66, - "learning_rate": 1.6936037974727694e-05, - "loss": 2.3605, - "step": 379200 - }, - { - "epoch": 0.66, - "learning_rate": 1.6935166034800867e-05, - "loss": 2.3411, - "step": 379210 - }, - { - "epoch": 0.66, - "learning_rate": 1.693429409487404e-05, - "loss": 2.2971, - "step": 379220 - }, - { - "epoch": 0.66, - "learning_rate": 1.6933422154947215e-05, - "loss": 2.3472, - "step": 379230 - }, - { - "epoch": 0.66, - "learning_rate": 1.693255021502039e-05, - "loss": 2.2476, - "step": 379240 - }, - { - "epoch": 0.66, - "learning_rate": 1.693167827509356e-05, - "loss": 2.2115, - "step": 379250 - }, - { - "epoch": 0.66, - "learning_rate": 1.6930806335166733e-05, - "loss": 2.0942, - "step": 379260 - }, - { - "epoch": 0.66, - "learning_rate": 1.6929934395239907e-05, - "loss": 2.2882, - "step": 379270 - }, - { - "epoch": 0.66, - "learning_rate": 1.692906245531308e-05, - "loss": 2.2856, - "step": 379280 - }, - { - "epoch": 0.66, - "learning_rate": 1.692819051538625e-05, - "loss": 2.2941, - "step": 379290 - }, - { - "epoch": 0.66, - "learning_rate": 1.6927318575459425e-05, - "loss": 2.2769, - "step": 379300 - }, - { - "epoch": 0.66, - "learning_rate": 1.6926446635532602e-05, - "loss": 2.211, - "step": 379310 - }, - { - "epoch": 0.66, - "learning_rate": 1.6925574695605772e-05, - "loss": 2.3323, - "step": 379320 - }, - { - "epoch": 0.66, - "learning_rate": 1.6924702755678946e-05, - "loss": 2.3426, - "step": 379330 - }, - { - "epoch": 0.66, - "learning_rate": 1.6923830815752116e-05, - "loss": 2.324, - "step": 379340 - }, - { - "epoch": 0.66, - "learning_rate": 1.6922958875825293e-05, - "loss": 2.3215, - "step": 379350 - }, - { - "epoch": 0.66, - "learning_rate": 1.6922086935898464e-05, - "loss": 2.2698, - "step": 379360 - }, - { - "epoch": 0.66, - "learning_rate": 1.6921214995971638e-05, - "loss": 2.3085, - "step": 379370 - }, - { - "epoch": 0.66, - "learning_rate": 1.692034305604481e-05, - "loss": 2.416, - "step": 379380 - }, - { - "epoch": 0.66, - "learning_rate": 1.6919471116117985e-05, - "loss": 2.3383, - "step": 379390 - }, - { - "epoch": 0.66, - "learning_rate": 1.691859917619116e-05, - "loss": 2.2851, - "step": 379400 - }, - { - "epoch": 0.66, - "learning_rate": 1.691772723626433e-05, - "loss": 2.21, - "step": 379410 - }, - { - "epoch": 0.66, - "learning_rate": 1.6916855296337506e-05, - "loss": 2.3843, - "step": 379420 - }, - { - "epoch": 0.66, - "learning_rate": 1.6915983356410677e-05, - "loss": 2.3665, - "step": 379430 - }, - { - "epoch": 0.66, - "learning_rate": 1.691511141648385e-05, - "loss": 2.3412, - "step": 379440 - }, - { - "epoch": 0.66, - "learning_rate": 1.6914239476557024e-05, - "loss": 2.2974, - "step": 379450 - }, - { - "epoch": 0.66, - "learning_rate": 1.6913367536630198e-05, - "loss": 2.3731, - "step": 379460 - }, - { - "epoch": 0.66, - "learning_rate": 1.6912495596703372e-05, - "loss": 2.3744, - "step": 379470 - }, - { - "epoch": 0.66, - "learning_rate": 1.6911623656776542e-05, - "loss": 2.3232, - "step": 379480 - }, - { - "epoch": 0.66, - "learning_rate": 1.6910751716849716e-05, - "loss": 2.3349, - "step": 379490 - }, - { - "epoch": 0.66, - "learning_rate": 1.690987977692289e-05, - "loss": 2.3764, - "step": 379500 - }, - { - "epoch": 0.66, - "learning_rate": 1.6909007836996064e-05, - "loss": 2.2937, - "step": 379510 - }, - { - "epoch": 0.66, - "learning_rate": 1.6908135897069234e-05, - "loss": 2.2463, - "step": 379520 - }, - { - "epoch": 0.66, - "learning_rate": 1.690726395714241e-05, - "loss": 2.3538, - "step": 379530 - }, - { - "epoch": 0.66, - "learning_rate": 1.690639201721558e-05, - "loss": 2.3329, - "step": 379540 - }, - { - "epoch": 0.66, - "learning_rate": 1.6905520077288755e-05, - "loss": 2.2844, - "step": 379550 - }, - { - "epoch": 0.66, - "learning_rate": 1.690464813736193e-05, - "loss": 2.2214, - "step": 379560 - }, - { - "epoch": 0.66, - "learning_rate": 1.6903776197435103e-05, - "loss": 2.3034, - "step": 379570 - }, - { - "epoch": 0.66, - "learning_rate": 1.6902904257508277e-05, - "loss": 2.3338, - "step": 379580 - }, - { - "epoch": 0.66, - "learning_rate": 1.6902032317581447e-05, - "loss": 2.304, - "step": 379590 - }, - { - "epoch": 0.66, - "learning_rate": 1.690116037765462e-05, - "loss": 2.3782, - "step": 379600 - }, - { - "epoch": 0.66, - "learning_rate": 1.6900288437727795e-05, - "loss": 2.2751, - "step": 379610 - }, - { - "epoch": 0.66, - "learning_rate": 1.6899416497800968e-05, - "loss": 2.2085, - "step": 379620 - }, - { - "epoch": 0.66, - "learning_rate": 1.6898544557874142e-05, - "loss": 2.3334, - "step": 379630 - }, - { - "epoch": 0.66, - "learning_rate": 1.6897672617947316e-05, - "loss": 2.3679, - "step": 379640 - }, - { - "epoch": 0.66, - "learning_rate": 1.689680067802049e-05, - "loss": 2.3393, - "step": 379650 - }, - { - "epoch": 0.66, - "learning_rate": 1.689592873809366e-05, - "loss": 2.2648, - "step": 379660 - }, - { - "epoch": 0.66, - "learning_rate": 1.6895056798166834e-05, - "loss": 2.2886, - "step": 379670 - }, - { - "epoch": 0.66, - "learning_rate": 1.6894184858240008e-05, - "loss": 2.3278, - "step": 379680 - }, - { - "epoch": 0.66, - "learning_rate": 1.689331291831318e-05, - "loss": 2.3329, - "step": 379690 - }, - { - "epoch": 0.66, - "learning_rate": 1.6892440978386355e-05, - "loss": 2.4276, - "step": 379700 - }, - { - "epoch": 0.66, - "learning_rate": 1.6891569038459525e-05, - "loss": 2.2105, - "step": 379710 - }, - { - "epoch": 0.66, - "learning_rate": 1.6890697098532703e-05, - "loss": 2.2439, - "step": 379720 - }, - { - "epoch": 0.66, - "learning_rate": 1.6889825158605873e-05, - "loss": 2.3772, - "step": 379730 - }, - { - "epoch": 0.66, - "learning_rate": 1.6888953218679047e-05, - "loss": 2.2888, - "step": 379740 - }, - { - "epoch": 0.66, - "learning_rate": 1.6888081278752217e-05, - "loss": 2.2695, - "step": 379750 - }, - { - "epoch": 0.66, - "learning_rate": 1.6887209338825394e-05, - "loss": 2.3107, - "step": 379760 - }, - { - "epoch": 0.66, - "learning_rate": 1.6886337398898565e-05, - "loss": 2.2761, - "step": 379770 - }, - { - "epoch": 0.66, - "learning_rate": 1.688546545897174e-05, - "loss": 2.457, - "step": 379780 - }, - { - "epoch": 0.66, - "learning_rate": 1.6884593519044916e-05, - "loss": 2.2228, - "step": 379790 - }, - { - "epoch": 0.66, - "learning_rate": 1.6883721579118086e-05, - "loss": 2.2323, - "step": 379800 - }, - { - "epoch": 0.66, - "learning_rate": 1.688284963919126e-05, - "loss": 2.2534, - "step": 379810 - }, - { - "epoch": 0.66, - "learning_rate": 1.688197769926443e-05, - "loss": 2.4035, - "step": 379820 - }, - { - "epoch": 0.66, - "learning_rate": 1.6881105759337607e-05, - "loss": 2.253, - "step": 379830 - }, - { - "epoch": 0.66, - "learning_rate": 1.6880233819410778e-05, - "loss": 2.2852, - "step": 379840 - }, - { - "epoch": 0.66, - "learning_rate": 1.687936187948395e-05, - "loss": 2.2404, - "step": 379850 - }, - { - "epoch": 0.66, - "learning_rate": 1.6878489939557125e-05, - "loss": 2.246, - "step": 379860 - }, - { - "epoch": 0.66, - "learning_rate": 1.68776179996303e-05, - "loss": 2.3661, - "step": 379870 - }, - { - "epoch": 0.66, - "learning_rate": 1.6876746059703473e-05, - "loss": 2.3608, - "step": 379880 - }, - { - "epoch": 0.66, - "learning_rate": 1.6875874119776643e-05, - "loss": 2.3421, - "step": 379890 - }, - { - "epoch": 0.66, - "learning_rate": 1.687500217984982e-05, - "loss": 2.3161, - "step": 379900 - }, - { - "epoch": 0.66, - "learning_rate": 1.687413023992299e-05, - "loss": 2.2616, - "step": 379910 - }, - { - "epoch": 0.66, - "learning_rate": 1.6873258299996164e-05, - "loss": 2.371, - "step": 379920 - }, - { - "epoch": 0.66, - "learning_rate": 1.6872386360069338e-05, - "loss": 2.2775, - "step": 379930 - }, - { - "epoch": 0.66, - "learning_rate": 1.6871514420142512e-05, - "loss": 2.4206, - "step": 379940 - }, - { - "epoch": 0.66, - "learning_rate": 1.6870642480215686e-05, - "loss": 2.2278, - "step": 379950 - }, - { - "epoch": 0.66, - "learning_rate": 1.6869770540288856e-05, - "loss": 2.3837, - "step": 379960 - }, - { - "epoch": 0.66, - "learning_rate": 1.686889860036203e-05, - "loss": 2.3524, - "step": 379970 - }, - { - "epoch": 0.66, - "learning_rate": 1.6868026660435204e-05, - "loss": 2.1719, - "step": 379980 - }, - { - "epoch": 0.66, - "learning_rate": 1.6867154720508377e-05, - "loss": 2.3342, - "step": 379990 - }, - { - "epoch": 0.66, - "learning_rate": 1.6866282780581548e-05, - "loss": 2.2199, - "step": 380000 - }, - { - "epoch": 0.66, - "learning_rate": 1.686541084065472e-05, - "loss": 2.2453, - "step": 380010 - }, - { - "epoch": 0.66, - "learning_rate": 1.6864538900727895e-05, - "loss": 2.3465, - "step": 380020 - }, - { - "epoch": 0.66, - "learning_rate": 1.686366696080107e-05, - "loss": 2.3753, - "step": 380030 - }, - { - "epoch": 0.66, - "learning_rate": 1.6862795020874243e-05, - "loss": 2.264, - "step": 380040 - }, - { - "epoch": 0.66, - "learning_rate": 1.6861923080947417e-05, - "loss": 2.2893, - "step": 380050 - }, - { - "epoch": 0.66, - "learning_rate": 1.686105114102059e-05, - "loss": 2.3556, - "step": 380060 - }, - { - "epoch": 0.66, - "learning_rate": 1.686017920109376e-05, - "loss": 2.3086, - "step": 380070 - }, - { - "epoch": 0.66, - "learning_rate": 1.6859307261166935e-05, - "loss": 2.4279, - "step": 380080 - }, - { - "epoch": 0.66, - "learning_rate": 1.685843532124011e-05, - "loss": 2.3985, - "step": 380090 - }, - { - "epoch": 0.66, - "learning_rate": 1.6857563381313282e-05, - "loss": 2.4798, - "step": 380100 - }, - { - "epoch": 0.66, - "learning_rate": 1.6856691441386456e-05, - "loss": 2.374, - "step": 380110 - }, - { - "epoch": 0.66, - "learning_rate": 1.6855819501459626e-05, - "loss": 2.3818, - "step": 380120 - }, - { - "epoch": 0.66, - "learning_rate": 1.6854947561532803e-05, - "loss": 2.322, - "step": 380130 - }, - { - "epoch": 0.66, - "learning_rate": 1.6854075621605974e-05, - "loss": 2.2352, - "step": 380140 - }, - { - "epoch": 0.66, - "learning_rate": 1.6853203681679148e-05, - "loss": 2.3014, - "step": 380150 - }, - { - "epoch": 0.66, - "learning_rate": 1.6852331741752318e-05, - "loss": 2.3552, - "step": 380160 - }, - { - "epoch": 0.66, - "learning_rate": 1.6851459801825495e-05, - "loss": 2.3067, - "step": 380170 - }, - { - "epoch": 0.66, - "learning_rate": 1.685058786189867e-05, - "loss": 2.293, - "step": 380180 - }, - { - "epoch": 0.66, - "learning_rate": 1.684971592197184e-05, - "loss": 2.3342, - "step": 380190 - }, - { - "epoch": 0.66, - "learning_rate": 1.6848843982045016e-05, - "loss": 2.2725, - "step": 380200 - }, - { - "epoch": 0.66, - "learning_rate": 1.6847972042118187e-05, - "loss": 2.3857, - "step": 380210 - }, - { - "epoch": 0.66, - "learning_rate": 1.684710010219136e-05, - "loss": 2.301, - "step": 380220 - }, - { - "epoch": 0.66, - "learning_rate": 1.684622816226453e-05, - "loss": 2.261, - "step": 380230 - }, - { - "epoch": 0.66, - "learning_rate": 1.6845356222337708e-05, - "loss": 2.2199, - "step": 380240 - }, - { - "epoch": 0.66, - "learning_rate": 1.684448428241088e-05, - "loss": 2.2441, - "step": 380250 - }, - { - "epoch": 0.66, - "learning_rate": 1.6843612342484052e-05, - "loss": 2.2964, - "step": 380260 - }, - { - "epoch": 0.66, - "learning_rate": 1.6842740402557226e-05, - "loss": 2.3813, - "step": 380270 - }, - { - "epoch": 0.66, - "learning_rate": 1.68418684626304e-05, - "loss": 2.2666, - "step": 380280 - }, - { - "epoch": 0.66, - "learning_rate": 1.6840996522703574e-05, - "loss": 2.2191, - "step": 380290 - }, - { - "epoch": 0.66, - "learning_rate": 1.6840124582776744e-05, - "loss": 2.2023, - "step": 380300 - }, - { - "epoch": 0.66, - "learning_rate": 1.683925264284992e-05, - "loss": 2.2864, - "step": 380310 - }, - { - "epoch": 0.66, - "learning_rate": 1.683838070292309e-05, - "loss": 2.1695, - "step": 380320 - }, - { - "epoch": 0.66, - "learning_rate": 1.6837508762996265e-05, - "loss": 2.2855, - "step": 380330 - }, - { - "epoch": 0.66, - "learning_rate": 1.683663682306944e-05, - "loss": 2.2957, - "step": 380340 - }, - { - "epoch": 0.66, - "learning_rate": 1.6835764883142613e-05, - "loss": 2.2979, - "step": 380350 - }, - { - "epoch": 0.66, - "learning_rate": 1.6834892943215787e-05, - "loss": 2.1446, - "step": 380360 - }, - { - "epoch": 0.66, - "learning_rate": 1.6834021003288957e-05, - "loss": 2.3181, - "step": 380370 - }, - { - "epoch": 0.66, - "learning_rate": 1.683314906336213e-05, - "loss": 2.4133, - "step": 380380 - }, - { - "epoch": 0.66, - "learning_rate": 1.6832277123435305e-05, - "loss": 2.3067, - "step": 380390 - }, - { - "epoch": 0.66, - "learning_rate": 1.6831405183508478e-05, - "loss": 2.4126, - "step": 380400 - }, - { - "epoch": 0.66, - "learning_rate": 1.6830533243581652e-05, - "loss": 2.3352, - "step": 380410 - }, - { - "epoch": 0.66, - "learning_rate": 1.6829661303654822e-05, - "loss": 2.3426, - "step": 380420 - }, - { - "epoch": 0.66, - "learning_rate": 1.6828789363728e-05, - "loss": 2.3011, - "step": 380430 - }, - { - "epoch": 0.66, - "learning_rate": 1.682791742380117e-05, - "loss": 2.3111, - "step": 380440 - }, - { - "epoch": 0.66, - "learning_rate": 1.6827045483874344e-05, - "loss": 2.3269, - "step": 380450 - }, - { - "epoch": 0.66, - "learning_rate": 1.6826173543947518e-05, - "loss": 2.3305, - "step": 380460 - }, - { - "epoch": 0.66, - "learning_rate": 1.682530160402069e-05, - "loss": 2.26, - "step": 380470 - }, - { - "epoch": 0.66, - "learning_rate": 1.682442966409386e-05, - "loss": 2.3864, - "step": 380480 - }, - { - "epoch": 0.66, - "learning_rate": 1.6823557724167035e-05, - "loss": 2.4437, - "step": 380490 - }, - { - "epoch": 0.66, - "learning_rate": 1.682268578424021e-05, - "loss": 2.3511, - "step": 380500 - }, - { - "epoch": 0.66, - "learning_rate": 1.6821813844313383e-05, - "loss": 2.2302, - "step": 380510 - }, - { - "epoch": 0.66, - "learning_rate": 1.6820941904386557e-05, - "loss": 2.2709, - "step": 380520 - }, - { - "epoch": 0.66, - "learning_rate": 1.6820069964459727e-05, - "loss": 2.335, - "step": 380530 - }, - { - "epoch": 0.66, - "learning_rate": 1.6819198024532904e-05, - "loss": 2.3432, - "step": 380540 - }, - { - "epoch": 0.66, - "learning_rate": 1.6818326084606075e-05, - "loss": 2.3193, - "step": 380550 - }, - { - "epoch": 0.66, - "learning_rate": 1.681745414467925e-05, - "loss": 2.2562, - "step": 380560 - }, - { - "epoch": 0.66, - "learning_rate": 1.6816582204752422e-05, - "loss": 2.3672, - "step": 380570 - }, - { - "epoch": 0.66, - "learning_rate": 1.6815710264825596e-05, - "loss": 2.3591, - "step": 380580 - }, - { - "epoch": 0.66, - "learning_rate": 1.681483832489877e-05, - "loss": 2.3295, - "step": 380590 - }, - { - "epoch": 0.66, - "learning_rate": 1.681396638497194e-05, - "loss": 2.3628, - "step": 380600 - }, - { - "epoch": 0.66, - "learning_rate": 1.6813094445045117e-05, - "loss": 2.2017, - "step": 380610 - }, - { - "epoch": 0.66, - "learning_rate": 1.6812222505118288e-05, - "loss": 2.3686, - "step": 380620 - }, - { - "epoch": 0.66, - "learning_rate": 1.681135056519146e-05, - "loss": 2.5002, - "step": 380630 - }, - { - "epoch": 0.66, - "learning_rate": 1.6810478625264632e-05, - "loss": 2.3416, - "step": 380640 - }, - { - "epoch": 0.66, - "learning_rate": 1.680960668533781e-05, - "loss": 2.4275, - "step": 380650 - }, - { - "epoch": 0.66, - "learning_rate": 1.6808734745410983e-05, - "loss": 2.4328, - "step": 380660 - }, - { - "epoch": 0.66, - "learning_rate": 1.6807862805484153e-05, - "loss": 2.2948, - "step": 380670 - }, - { - "epoch": 0.66, - "learning_rate": 1.6806990865557327e-05, - "loss": 2.0997, - "step": 380680 - }, - { - "epoch": 0.66, - "learning_rate": 1.68061189256305e-05, - "loss": 2.2759, - "step": 380690 - }, - { - "epoch": 0.66, - "learning_rate": 1.6805246985703674e-05, - "loss": 2.3087, - "step": 380700 - }, - { - "epoch": 0.66, - "learning_rate": 1.6804375045776845e-05, - "loss": 2.2831, - "step": 380710 - }, - { - "epoch": 0.66, - "learning_rate": 1.6803503105850022e-05, - "loss": 2.3341, - "step": 380720 - }, - { - "epoch": 0.66, - "learning_rate": 1.6802631165923192e-05, - "loss": 2.3705, - "step": 380730 - }, - { - "epoch": 0.66, - "learning_rate": 1.6801759225996366e-05, - "loss": 2.3316, - "step": 380740 - }, - { - "epoch": 0.66, - "learning_rate": 1.680088728606954e-05, - "loss": 2.2298, - "step": 380750 - }, - { - "epoch": 0.66, - "learning_rate": 1.6800015346142714e-05, - "loss": 2.3516, - "step": 380760 - }, - { - "epoch": 0.66, - "learning_rate": 1.6799143406215887e-05, - "loss": 2.2961, - "step": 380770 - }, - { - "epoch": 0.66, - "learning_rate": 1.6798271466289058e-05, - "loss": 2.3607, - "step": 380780 - }, - { - "epoch": 0.66, - "learning_rate": 1.679739952636223e-05, - "loss": 2.3258, - "step": 380790 - }, - { - "epoch": 0.66, - "learning_rate": 1.6796527586435405e-05, - "loss": 2.3854, - "step": 380800 - }, - { - "epoch": 0.66, - "learning_rate": 1.679565564650858e-05, - "loss": 2.3771, - "step": 380810 - }, - { - "epoch": 0.66, - "learning_rate": 1.6794783706581753e-05, - "loss": 2.3544, - "step": 380820 - }, - { - "epoch": 0.66, - "learning_rate": 1.6793911766654927e-05, - "loss": 2.2574, - "step": 380830 - }, - { - "epoch": 0.66, - "learning_rate": 1.67930398267281e-05, - "loss": 2.3378, - "step": 380840 - }, - { - "epoch": 0.66, - "learning_rate": 1.679216788680127e-05, - "loss": 2.3562, - "step": 380850 - }, - { - "epoch": 0.66, - "learning_rate": 1.6791295946874445e-05, - "loss": 2.2562, - "step": 380860 - }, - { - "epoch": 0.66, - "learning_rate": 1.679042400694762e-05, - "loss": 2.3436, - "step": 380870 - }, - { - "epoch": 0.66, - "learning_rate": 1.6789552067020792e-05, - "loss": 2.3967, - "step": 380880 - }, - { - "epoch": 0.66, - "learning_rate": 1.6788680127093963e-05, - "loss": 2.3783, - "step": 380890 - }, - { - "epoch": 0.66, - "learning_rate": 1.6787808187167136e-05, - "loss": 2.3623, - "step": 380900 - }, - { - "epoch": 0.66, - "learning_rate": 1.6786936247240313e-05, - "loss": 2.3202, - "step": 380910 - }, - { - "epoch": 0.66, - "learning_rate": 1.6786064307313484e-05, - "loss": 2.324, - "step": 380920 - }, - { - "epoch": 0.66, - "learning_rate": 1.6785192367386658e-05, - "loss": 2.3425, - "step": 380930 - }, - { - "epoch": 0.66, - "learning_rate": 1.6784320427459828e-05, - "loss": 2.2164, - "step": 380940 - }, - { - "epoch": 0.66, - "learning_rate": 1.6783448487533005e-05, - "loss": 2.231, - "step": 380950 - }, - { - "epoch": 0.66, - "learning_rate": 1.6782576547606176e-05, - "loss": 2.1572, - "step": 380960 - }, - { - "epoch": 0.66, - "learning_rate": 1.678170460767935e-05, - "loss": 2.2973, - "step": 380970 - }, - { - "epoch": 0.66, - "learning_rate": 1.6780832667752523e-05, - "loss": 2.4303, - "step": 380980 - }, - { - "epoch": 0.66, - "learning_rate": 1.6779960727825697e-05, - "loss": 2.3217, - "step": 380990 - }, - { - "epoch": 0.66, - "learning_rate": 1.677908878789887e-05, - "loss": 2.3767, - "step": 381000 - }, - { - "epoch": 0.66, - "learning_rate": 1.677821684797204e-05, - "loss": 2.3417, - "step": 381010 - }, - { - "epoch": 0.66, - "learning_rate": 1.6777344908045218e-05, - "loss": 2.3221, - "step": 381020 - }, - { - "epoch": 0.66, - "learning_rate": 1.677647296811839e-05, - "loss": 2.3262, - "step": 381030 - }, - { - "epoch": 0.66, - "learning_rate": 1.6775601028191562e-05, - "loss": 2.3885, - "step": 381040 - }, - { - "epoch": 0.66, - "learning_rate": 1.6774729088264736e-05, - "loss": 2.3872, - "step": 381050 - }, - { - "epoch": 0.66, - "learning_rate": 1.677385714833791e-05, - "loss": 2.3479, - "step": 381060 - }, - { - "epoch": 0.66, - "learning_rate": 1.6772985208411084e-05, - "loss": 2.3253, - "step": 381070 - }, - { - "epoch": 0.66, - "learning_rate": 1.6772113268484254e-05, - "loss": 2.4009, - "step": 381080 - }, - { - "epoch": 0.66, - "learning_rate": 1.6771241328557428e-05, - "loss": 2.2152, - "step": 381090 - }, - { - "epoch": 0.66, - "learning_rate": 1.67703693886306e-05, - "loss": 2.3132, - "step": 381100 - }, - { - "epoch": 0.66, - "learning_rate": 1.6769497448703775e-05, - "loss": 2.3162, - "step": 381110 - }, - { - "epoch": 0.66, - "learning_rate": 1.6768625508776946e-05, - "loss": 2.2663, - "step": 381120 - }, - { - "epoch": 0.66, - "learning_rate": 1.6767753568850123e-05, - "loss": 2.3349, - "step": 381130 - }, - { - "epoch": 0.66, - "learning_rate": 1.6766881628923297e-05, - "loss": 2.2674, - "step": 381140 - }, - { - "epoch": 0.66, - "learning_rate": 1.6766009688996467e-05, - "loss": 2.2741, - "step": 381150 - }, - { - "epoch": 0.66, - "learning_rate": 1.676513774906964e-05, - "loss": 2.3111, - "step": 381160 - }, - { - "epoch": 0.66, - "learning_rate": 1.6764265809142815e-05, - "loss": 2.3165, - "step": 381170 - }, - { - "epoch": 0.66, - "learning_rate": 1.6763393869215988e-05, - "loss": 2.3744, - "step": 381180 - }, - { - "epoch": 0.66, - "learning_rate": 1.676252192928916e-05, - "loss": 2.4097, - "step": 381190 - }, - { - "epoch": 0.66, - "learning_rate": 1.6761649989362332e-05, - "loss": 2.2289, - "step": 381200 - }, - { - "epoch": 0.66, - "learning_rate": 1.6760778049435506e-05, - "loss": 2.2472, - "step": 381210 - }, - { - "epoch": 0.66, - "learning_rate": 1.675990610950868e-05, - "loss": 2.3248, - "step": 381220 - }, - { - "epoch": 0.66, - "learning_rate": 1.6759034169581854e-05, - "loss": 2.3774, - "step": 381230 - }, - { - "epoch": 0.66, - "learning_rate": 1.6758162229655028e-05, - "loss": 2.3381, - "step": 381240 - }, - { - "epoch": 0.66, - "learning_rate": 1.67572902897282e-05, - "loss": 2.3237, - "step": 381250 - }, - { - "epoch": 0.66, - "learning_rate": 1.675641834980137e-05, - "loss": 2.3035, - "step": 381260 - }, - { - "epoch": 0.66, - "learning_rate": 1.6755546409874545e-05, - "loss": 2.3845, - "step": 381270 - }, - { - "epoch": 0.66, - "learning_rate": 1.675467446994772e-05, - "loss": 2.3683, - "step": 381280 - }, - { - "epoch": 0.66, - "learning_rate": 1.6753802530020893e-05, - "loss": 2.3038, - "step": 381290 - }, - { - "epoch": 0.66, - "learning_rate": 1.6752930590094067e-05, - "loss": 2.2709, - "step": 381300 - }, - { - "epoch": 0.66, - "learning_rate": 1.6752058650167237e-05, - "loss": 2.3742, - "step": 381310 - }, - { - "epoch": 0.66, - "learning_rate": 1.6751186710240414e-05, - "loss": 2.3038, - "step": 381320 - }, - { - "epoch": 0.66, - "learning_rate": 1.6750314770313585e-05, - "loss": 2.222, - "step": 381330 - }, - { - "epoch": 0.67, - "learning_rate": 1.674944283038676e-05, - "loss": 2.2368, - "step": 381340 - }, - { - "epoch": 0.67, - "learning_rate": 1.674857089045993e-05, - "loss": 2.3053, - "step": 381350 - }, - { - "epoch": 0.67, - "learning_rate": 1.6747698950533106e-05, - "loss": 2.3416, - "step": 381360 - }, - { - "epoch": 0.67, - "learning_rate": 1.6746827010606276e-05, - "loss": 2.2818, - "step": 381370 - }, - { - "epoch": 0.67, - "learning_rate": 1.674595507067945e-05, - "loss": 2.2532, - "step": 381380 - }, - { - "epoch": 0.67, - "learning_rate": 1.6745083130752627e-05, - "loss": 2.4118, - "step": 381390 - }, - { - "epoch": 0.67, - "learning_rate": 1.6744211190825798e-05, - "loss": 2.4454, - "step": 381400 - }, - { - "epoch": 0.67, - "learning_rate": 1.674333925089897e-05, - "loss": 2.3, - "step": 381410 - }, - { - "epoch": 0.67, - "learning_rate": 1.6742467310972142e-05, - "loss": 2.2294, - "step": 381420 - }, - { - "epoch": 0.67, - "learning_rate": 1.674159537104532e-05, - "loss": 2.2648, - "step": 381430 - }, - { - "epoch": 0.67, - "learning_rate": 1.674072343111849e-05, - "loss": 2.2745, - "step": 381440 - }, - { - "epoch": 0.67, - "learning_rate": 1.6739851491191663e-05, - "loss": 2.2487, - "step": 381450 - }, - { - "epoch": 0.67, - "learning_rate": 1.6738979551264837e-05, - "loss": 2.2755, - "step": 381460 - }, - { - "epoch": 0.67, - "learning_rate": 1.673810761133801e-05, - "loss": 2.2893, - "step": 381470 - }, - { - "epoch": 0.67, - "learning_rate": 1.6737235671411184e-05, - "loss": 2.1717, - "step": 381480 - }, - { - "epoch": 0.67, - "learning_rate": 1.6736363731484355e-05, - "loss": 2.4332, - "step": 381490 - }, - { - "epoch": 0.67, - "learning_rate": 1.6735491791557532e-05, - "loss": 2.2192, - "step": 381500 - }, - { - "epoch": 0.67, - "learning_rate": 1.6734619851630702e-05, - "loss": 2.1958, - "step": 381510 - }, - { - "epoch": 0.67, - "learning_rate": 1.6733747911703876e-05, - "loss": 2.3331, - "step": 381520 - }, - { - "epoch": 0.67, - "learning_rate": 1.673287597177705e-05, - "loss": 2.2132, - "step": 381530 - }, - { - "epoch": 0.67, - "learning_rate": 1.6732004031850224e-05, - "loss": 2.3302, - "step": 381540 - }, - { - "epoch": 0.67, - "learning_rate": 1.6731132091923397e-05, - "loss": 2.2009, - "step": 381550 - }, - { - "epoch": 0.67, - "learning_rate": 1.6730260151996568e-05, - "loss": 2.105, - "step": 381560 - }, - { - "epoch": 0.67, - "learning_rate": 1.672938821206974e-05, - "loss": 2.4053, - "step": 381570 - }, - { - "epoch": 0.67, - "learning_rate": 1.6728516272142915e-05, - "loss": 2.3903, - "step": 381580 - }, - { - "epoch": 0.67, - "learning_rate": 1.672764433221609e-05, - "loss": 2.276, - "step": 381590 - }, - { - "epoch": 0.67, - "learning_rate": 1.672677239228926e-05, - "loss": 2.2543, - "step": 381600 - }, - { - "epoch": 0.67, - "learning_rate": 1.6725900452362433e-05, - "loss": 2.3436, - "step": 381610 - }, - { - "epoch": 0.67, - "learning_rate": 1.6725028512435607e-05, - "loss": 2.3895, - "step": 381620 - }, - { - "epoch": 0.67, - "learning_rate": 1.672415657250878e-05, - "loss": 2.2618, - "step": 381630 - }, - { - "epoch": 0.67, - "learning_rate": 1.6723284632581955e-05, - "loss": 2.2718, - "step": 381640 - }, - { - "epoch": 0.67, - "learning_rate": 1.672241269265513e-05, - "loss": 2.4499, - "step": 381650 - }, - { - "epoch": 0.67, - "learning_rate": 1.6721540752728302e-05, - "loss": 2.4074, - "step": 381660 - }, - { - "epoch": 0.67, - "learning_rate": 1.6720668812801473e-05, - "loss": 2.4393, - "step": 381670 - }, - { - "epoch": 0.67, - "learning_rate": 1.6719796872874646e-05, - "loss": 2.3612, - "step": 381680 - }, - { - "epoch": 0.67, - "learning_rate": 1.671892493294782e-05, - "loss": 2.4161, - "step": 381690 - }, - { - "epoch": 0.67, - "learning_rate": 1.6718052993020994e-05, - "loss": 2.2755, - "step": 381700 - }, - { - "epoch": 0.67, - "learning_rate": 1.6717181053094168e-05, - "loss": 2.2729, - "step": 381710 - }, - { - "epoch": 0.67, - "learning_rate": 1.6716309113167338e-05, - "loss": 2.2601, - "step": 381720 - }, - { - "epoch": 0.67, - "learning_rate": 1.6715437173240515e-05, - "loss": 2.2911, - "step": 381730 - }, - { - "epoch": 0.67, - "learning_rate": 1.6714565233313686e-05, - "loss": 2.3988, - "step": 381740 - }, - { - "epoch": 0.67, - "learning_rate": 1.671369329338686e-05, - "loss": 2.2675, - "step": 381750 - }, - { - "epoch": 0.67, - "learning_rate": 1.6712821353460033e-05, - "loss": 2.2826, - "step": 381760 - }, - { - "epoch": 0.67, - "learning_rate": 1.6711949413533207e-05, - "loss": 2.3825, - "step": 381770 - }, - { - "epoch": 0.67, - "learning_rate": 1.671107747360638e-05, - "loss": 2.3493, - "step": 381780 - }, - { - "epoch": 0.67, - "learning_rate": 1.671020553367955e-05, - "loss": 2.2755, - "step": 381790 - }, - { - "epoch": 0.67, - "learning_rate": 1.6709333593752728e-05, - "loss": 2.3891, - "step": 381800 - }, - { - "epoch": 0.67, - "learning_rate": 1.67084616538259e-05, - "loss": 2.3658, - "step": 381810 - }, - { - "epoch": 0.67, - "learning_rate": 1.6707589713899072e-05, - "loss": 2.2783, - "step": 381820 - }, - { - "epoch": 0.67, - "learning_rate": 1.6706717773972243e-05, - "loss": 2.2849, - "step": 381830 - }, - { - "epoch": 0.67, - "learning_rate": 1.670584583404542e-05, - "loss": 2.2321, - "step": 381840 - }, - { - "epoch": 0.67, - "learning_rate": 1.670497389411859e-05, - "loss": 2.3126, - "step": 381850 - }, - { - "epoch": 0.67, - "learning_rate": 1.6704101954191764e-05, - "loss": 2.292, - "step": 381860 - }, - { - "epoch": 0.67, - "learning_rate": 1.6703230014264938e-05, - "loss": 2.3183, - "step": 381870 - }, - { - "epoch": 0.67, - "learning_rate": 1.670235807433811e-05, - "loss": 2.3744, - "step": 381880 - }, - { - "epoch": 0.67, - "learning_rate": 1.6701486134411285e-05, - "loss": 2.2655, - "step": 381890 - }, - { - "epoch": 0.67, - "learning_rate": 1.6700614194484456e-05, - "loss": 2.1732, - "step": 381900 - }, - { - "epoch": 0.67, - "learning_rate": 1.6699742254557633e-05, - "loss": 2.262, - "step": 381910 - }, - { - "epoch": 0.67, - "learning_rate": 1.6698870314630803e-05, - "loss": 2.2914, - "step": 381920 - }, - { - "epoch": 0.67, - "learning_rate": 1.6697998374703977e-05, - "loss": 2.4012, - "step": 381930 - }, - { - "epoch": 0.67, - "learning_rate": 1.669712643477715e-05, - "loss": 2.2583, - "step": 381940 - }, - { - "epoch": 0.67, - "learning_rate": 1.6696254494850325e-05, - "loss": 2.4114, - "step": 381950 - }, - { - "epoch": 0.67, - "learning_rate": 1.6695382554923498e-05, - "loss": 2.3333, - "step": 381960 - }, - { - "epoch": 0.67, - "learning_rate": 1.669451061499667e-05, - "loss": 2.3752, - "step": 381970 - }, - { - "epoch": 0.67, - "learning_rate": 1.6693638675069842e-05, - "loss": 2.3554, - "step": 381980 - }, - { - "epoch": 0.67, - "learning_rate": 1.6692766735143016e-05, - "loss": 2.3027, - "step": 381990 - }, - { - "epoch": 0.67, - "learning_rate": 1.669189479521619e-05, - "loss": 2.2993, - "step": 382000 - }, - { - "epoch": 0.67, - "learning_rate": 1.6691022855289364e-05, - "loss": 2.2655, - "step": 382010 - }, - { - "epoch": 0.67, - "learning_rate": 1.6690150915362534e-05, - "loss": 2.3321, - "step": 382020 - }, - { - "epoch": 0.67, - "learning_rate": 1.668927897543571e-05, - "loss": 2.4447, - "step": 382030 - }, - { - "epoch": 0.67, - "learning_rate": 1.668840703550888e-05, - "loss": 2.2549, - "step": 382040 - }, - { - "epoch": 0.67, - "learning_rate": 1.6687535095582055e-05, - "loss": 2.2789, - "step": 382050 - }, - { - "epoch": 0.67, - "learning_rate": 1.668666315565523e-05, - "loss": 2.241, - "step": 382060 - }, - { - "epoch": 0.67, - "learning_rate": 1.6685791215728403e-05, - "loss": 2.4286, - "step": 382070 - }, - { - "epoch": 0.67, - "learning_rate": 1.6684919275801573e-05, - "loss": 2.2884, - "step": 382080 - }, - { - "epoch": 0.67, - "learning_rate": 1.6684047335874747e-05, - "loss": 2.1699, - "step": 382090 - }, - { - "epoch": 0.67, - "learning_rate": 1.668317539594792e-05, - "loss": 2.3215, - "step": 382100 - }, - { - "epoch": 0.67, - "learning_rate": 1.6682303456021095e-05, - "loss": 2.3163, - "step": 382110 - }, - { - "epoch": 0.67, - "learning_rate": 1.668143151609427e-05, - "loss": 2.3717, - "step": 382120 - }, - { - "epoch": 0.67, - "learning_rate": 1.668055957616744e-05, - "loss": 2.3204, - "step": 382130 - }, - { - "epoch": 0.67, - "learning_rate": 1.6679687636240616e-05, - "loss": 2.3044, - "step": 382140 - }, - { - "epoch": 0.67, - "learning_rate": 1.6678815696313786e-05, - "loss": 2.4487, - "step": 382150 - }, - { - "epoch": 0.67, - "learning_rate": 1.667794375638696e-05, - "loss": 2.2324, - "step": 382160 - }, - { - "epoch": 0.67, - "learning_rate": 1.6677071816460134e-05, - "loss": 2.3678, - "step": 382170 - }, - { - "epoch": 0.67, - "learning_rate": 1.6676199876533308e-05, - "loss": 2.2596, - "step": 382180 - }, - { - "epoch": 0.67, - "learning_rate": 1.667532793660648e-05, - "loss": 2.4041, - "step": 382190 - }, - { - "epoch": 0.67, - "learning_rate": 1.6674455996679652e-05, - "loss": 2.2751, - "step": 382200 - }, - { - "epoch": 0.67, - "learning_rate": 1.667358405675283e-05, - "loss": 2.4896, - "step": 382210 - }, - { - "epoch": 0.67, - "learning_rate": 1.6672712116826e-05, - "loss": 2.3489, - "step": 382220 - }, - { - "epoch": 0.67, - "learning_rate": 1.6671840176899173e-05, - "loss": 2.3743, - "step": 382230 - }, - { - "epoch": 0.67, - "learning_rate": 1.6670968236972344e-05, - "loss": 2.3014, - "step": 382240 - }, - { - "epoch": 0.67, - "learning_rate": 1.667009629704552e-05, - "loss": 2.2474, - "step": 382250 - }, - { - "epoch": 0.67, - "learning_rate": 1.6669224357118694e-05, - "loss": 2.2287, - "step": 382260 - }, - { - "epoch": 0.67, - "learning_rate": 1.6668352417191865e-05, - "loss": 2.2225, - "step": 382270 - }, - { - "epoch": 0.67, - "learning_rate": 1.666748047726504e-05, - "loss": 2.3907, - "step": 382280 - }, - { - "epoch": 0.67, - "learning_rate": 1.6666608537338212e-05, - "loss": 2.2739, - "step": 382290 - }, - { - "epoch": 0.67, - "learning_rate": 1.6665736597411386e-05, - "loss": 2.2625, - "step": 382300 - }, - { - "epoch": 0.67, - "learning_rate": 1.6664864657484557e-05, - "loss": 2.3299, - "step": 382310 - }, - { - "epoch": 0.67, - "learning_rate": 1.6663992717557734e-05, - "loss": 2.2718, - "step": 382320 - }, - { - "epoch": 0.67, - "learning_rate": 1.6663120777630904e-05, - "loss": 2.3455, - "step": 382330 - }, - { - "epoch": 0.67, - "learning_rate": 1.6662248837704078e-05, - "loss": 2.2265, - "step": 382340 - }, - { - "epoch": 0.67, - "learning_rate": 1.666137689777725e-05, - "loss": 2.2434, - "step": 382350 - }, - { - "epoch": 0.67, - "learning_rate": 1.6660504957850425e-05, - "loss": 2.3076, - "step": 382360 - }, - { - "epoch": 0.67, - "learning_rate": 1.66596330179236e-05, - "loss": 2.3977, - "step": 382370 - }, - { - "epoch": 0.67, - "learning_rate": 1.665876107799677e-05, - "loss": 2.2089, - "step": 382380 - }, - { - "epoch": 0.67, - "learning_rate": 1.6657889138069943e-05, - "loss": 2.3769, - "step": 382390 - }, - { - "epoch": 0.67, - "learning_rate": 1.6657017198143117e-05, - "loss": 2.3012, - "step": 382400 - }, - { - "epoch": 0.67, - "learning_rate": 1.665614525821629e-05, - "loss": 2.2935, - "step": 382410 - }, - { - "epoch": 0.67, - "learning_rate": 1.6655273318289465e-05, - "loss": 2.3588, - "step": 382420 - }, - { - "epoch": 0.67, - "learning_rate": 1.665440137836264e-05, - "loss": 2.3297, - "step": 382430 - }, - { - "epoch": 0.67, - "learning_rate": 1.6653529438435812e-05, - "loss": 2.2667, - "step": 382440 - }, - { - "epoch": 0.67, - "learning_rate": 1.6652657498508983e-05, - "loss": 2.2719, - "step": 382450 - }, - { - "epoch": 0.67, - "learning_rate": 1.6651785558582156e-05, - "loss": 2.3995, - "step": 382460 - }, - { - "epoch": 0.67, - "learning_rate": 1.665091361865533e-05, - "loss": 2.4098, - "step": 382470 - }, - { - "epoch": 0.67, - "learning_rate": 1.6650041678728504e-05, - "loss": 2.3312, - "step": 382480 - }, - { - "epoch": 0.67, - "learning_rate": 1.6649169738801678e-05, - "loss": 2.2773, - "step": 382490 - }, - { - "epoch": 0.67, - "learning_rate": 1.6648297798874848e-05, - "loss": 2.244, - "step": 382500 - }, - { - "epoch": 0.67, - "learning_rate": 1.6647425858948025e-05, - "loss": 2.4912, - "step": 382510 - }, - { - "epoch": 0.67, - "learning_rate": 1.6646553919021196e-05, - "loss": 2.265, - "step": 382520 - }, - { - "epoch": 0.67, - "learning_rate": 1.664568197909437e-05, - "loss": 2.3089, - "step": 382530 - }, - { - "epoch": 0.67, - "learning_rate": 1.664481003916754e-05, - "loss": 2.3269, - "step": 382540 - }, - { - "epoch": 0.67, - "learning_rate": 1.6643938099240717e-05, - "loss": 2.3592, - "step": 382550 - }, - { - "epoch": 0.67, - "learning_rate": 1.6643066159313887e-05, - "loss": 2.3655, - "step": 382560 - }, - { - "epoch": 0.67, - "learning_rate": 1.664219421938706e-05, - "loss": 2.2792, - "step": 382570 - }, - { - "epoch": 0.67, - "learning_rate": 1.6641322279460235e-05, - "loss": 2.373, - "step": 382580 - }, - { - "epoch": 0.67, - "learning_rate": 1.664045033953341e-05, - "loss": 2.2498, - "step": 382590 - }, - { - "epoch": 0.67, - "learning_rate": 1.6639578399606582e-05, - "loss": 2.3309, - "step": 382600 - }, - { - "epoch": 0.67, - "learning_rate": 1.6638706459679753e-05, - "loss": 2.3463, - "step": 382610 - }, - { - "epoch": 0.67, - "learning_rate": 1.663783451975293e-05, - "loss": 2.3639, - "step": 382620 - }, - { - "epoch": 0.67, - "learning_rate": 1.66369625798261e-05, - "loss": 2.3404, - "step": 382630 - }, - { - "epoch": 0.67, - "learning_rate": 1.6636090639899274e-05, - "loss": 2.2475, - "step": 382640 - }, - { - "epoch": 0.67, - "learning_rate": 1.6635218699972448e-05, - "loss": 2.2402, - "step": 382650 - }, - { - "epoch": 0.67, - "learning_rate": 1.663434676004562e-05, - "loss": 2.3129, - "step": 382660 - }, - { - "epoch": 0.67, - "learning_rate": 1.6633474820118795e-05, - "loss": 2.2532, - "step": 382670 - }, - { - "epoch": 0.67, - "learning_rate": 1.6632602880191966e-05, - "loss": 2.3686, - "step": 382680 - }, - { - "epoch": 0.67, - "learning_rate": 1.6631730940265143e-05, - "loss": 2.4257, - "step": 382690 - }, - { - "epoch": 0.67, - "learning_rate": 1.6630859000338313e-05, - "loss": 2.2681, - "step": 382700 - }, - { - "epoch": 0.67, - "learning_rate": 1.6629987060411487e-05, - "loss": 2.1637, - "step": 382710 - }, - { - "epoch": 0.67, - "learning_rate": 1.6629115120484657e-05, - "loss": 2.327, - "step": 382720 - }, - { - "epoch": 0.67, - "learning_rate": 1.6628243180557835e-05, - "loss": 2.4227, - "step": 382730 - }, - { - "epoch": 0.67, - "learning_rate": 1.662737124063101e-05, - "loss": 2.1907, - "step": 382740 - }, - { - "epoch": 0.67, - "learning_rate": 1.662649930070418e-05, - "loss": 2.2382, - "step": 382750 - }, - { - "epoch": 0.67, - "learning_rate": 1.6625627360777352e-05, - "loss": 2.3263, - "step": 382760 - }, - { - "epoch": 0.67, - "learning_rate": 1.6624755420850526e-05, - "loss": 2.3531, - "step": 382770 - }, - { - "epoch": 0.67, - "learning_rate": 1.66238834809237e-05, - "loss": 2.2461, - "step": 382780 - }, - { - "epoch": 0.67, - "learning_rate": 1.662301154099687e-05, - "loss": 2.2548, - "step": 382790 - }, - { - "epoch": 0.67, - "learning_rate": 1.6622139601070044e-05, - "loss": 2.5073, - "step": 382800 - }, - { - "epoch": 0.67, - "learning_rate": 1.6621267661143218e-05, - "loss": 2.3713, - "step": 382810 - }, - { - "epoch": 0.67, - "learning_rate": 1.6620395721216392e-05, - "loss": 2.327, - "step": 382820 - }, - { - "epoch": 0.67, - "learning_rate": 1.6619523781289565e-05, - "loss": 2.3477, - "step": 382830 - }, - { - "epoch": 0.67, - "learning_rate": 1.661865184136274e-05, - "loss": 2.2649, - "step": 382840 - }, - { - "epoch": 0.67, - "learning_rate": 1.6617779901435913e-05, - "loss": 2.4099, - "step": 382850 - }, - { - "epoch": 0.67, - "learning_rate": 1.6616907961509083e-05, - "loss": 2.3712, - "step": 382860 - }, - { - "epoch": 0.67, - "learning_rate": 1.6616036021582257e-05, - "loss": 2.31, - "step": 382870 - }, - { - "epoch": 0.67, - "learning_rate": 1.661516408165543e-05, - "loss": 2.285, - "step": 382880 - }, - { - "epoch": 0.67, - "learning_rate": 1.6614292141728605e-05, - "loss": 2.3086, - "step": 382890 - }, - { - "epoch": 0.67, - "learning_rate": 1.661342020180178e-05, - "loss": 2.1909, - "step": 382900 - }, - { - "epoch": 0.67, - "learning_rate": 1.661254826187495e-05, - "loss": 2.3121, - "step": 382910 - }, - { - "epoch": 0.67, - "learning_rate": 1.6611676321948126e-05, - "loss": 2.427, - "step": 382920 - }, - { - "epoch": 0.67, - "learning_rate": 1.6610804382021296e-05, - "loss": 2.242, - "step": 382930 - }, - { - "epoch": 0.67, - "learning_rate": 1.660993244209447e-05, - "loss": 2.2848, - "step": 382940 - }, - { - "epoch": 0.67, - "learning_rate": 1.660906050216764e-05, - "loss": 2.3428, - "step": 382950 - }, - { - "epoch": 0.67, - "learning_rate": 1.6608188562240818e-05, - "loss": 2.321, - "step": 382960 - }, - { - "epoch": 0.67, - "learning_rate": 1.6607316622313988e-05, - "loss": 2.3361, - "step": 382970 - }, - { - "epoch": 0.67, - "learning_rate": 1.6606444682387162e-05, - "loss": 2.2707, - "step": 382980 - }, - { - "epoch": 0.67, - "learning_rate": 1.660557274246034e-05, - "loss": 2.2898, - "step": 382990 - }, - { - "epoch": 0.67, - "learning_rate": 1.660470080253351e-05, - "loss": 2.4615, - "step": 383000 - }, - { - "epoch": 0.67, - "learning_rate": 1.6603828862606683e-05, - "loss": 2.2185, - "step": 383010 - }, - { - "epoch": 0.67, - "learning_rate": 1.6602956922679854e-05, - "loss": 2.3627, - "step": 383020 - }, - { - "epoch": 0.67, - "learning_rate": 1.660208498275303e-05, - "loss": 2.3078, - "step": 383030 - }, - { - "epoch": 0.67, - "learning_rate": 1.66012130428262e-05, - "loss": 2.3984, - "step": 383040 - }, - { - "epoch": 0.67, - "learning_rate": 1.6600341102899375e-05, - "loss": 2.2819, - "step": 383050 - }, - { - "epoch": 0.67, - "learning_rate": 1.659946916297255e-05, - "loss": 2.2993, - "step": 383060 - }, - { - "epoch": 0.67, - "learning_rate": 1.6598597223045722e-05, - "loss": 2.3649, - "step": 383070 - }, - { - "epoch": 0.67, - "learning_rate": 1.6597725283118896e-05, - "loss": 2.304, - "step": 383080 - }, - { - "epoch": 0.67, - "learning_rate": 1.6596853343192067e-05, - "loss": 2.3458, - "step": 383090 - }, - { - "epoch": 0.67, - "learning_rate": 1.6595981403265244e-05, - "loss": 2.2676, - "step": 383100 - }, - { - "epoch": 0.67, - "learning_rate": 1.6595109463338414e-05, - "loss": 2.3454, - "step": 383110 - }, - { - "epoch": 0.67, - "learning_rate": 1.6594237523411588e-05, - "loss": 2.2956, - "step": 383120 - }, - { - "epoch": 0.67, - "learning_rate": 1.659336558348476e-05, - "loss": 2.3739, - "step": 383130 - }, - { - "epoch": 0.67, - "learning_rate": 1.6592493643557935e-05, - "loss": 2.2492, - "step": 383140 - }, - { - "epoch": 0.67, - "learning_rate": 1.659162170363111e-05, - "loss": 2.2938, - "step": 383150 - }, - { - "epoch": 0.67, - "learning_rate": 1.659074976370428e-05, - "loss": 2.2257, - "step": 383160 - }, - { - "epoch": 0.67, - "learning_rate": 1.6589877823777453e-05, - "loss": 2.2181, - "step": 383170 - }, - { - "epoch": 0.67, - "learning_rate": 1.6589005883850627e-05, - "loss": 2.272, - "step": 383180 - }, - { - "epoch": 0.67, - "learning_rate": 1.65881339439238e-05, - "loss": 2.2944, - "step": 383190 - }, - { - "epoch": 0.67, - "learning_rate": 1.658726200399697e-05, - "loss": 2.3857, - "step": 383200 - }, - { - "epoch": 0.67, - "learning_rate": 1.6586390064070145e-05, - "loss": 2.2274, - "step": 383210 - }, - { - "epoch": 0.67, - "learning_rate": 1.6585518124143322e-05, - "loss": 2.3581, - "step": 383220 - }, - { - "epoch": 0.67, - "learning_rate": 1.6584646184216493e-05, - "loss": 2.2171, - "step": 383230 - }, - { - "epoch": 0.67, - "learning_rate": 1.6583774244289666e-05, - "loss": 2.3184, - "step": 383240 - }, - { - "epoch": 0.67, - "learning_rate": 1.658290230436284e-05, - "loss": 2.3655, - "step": 383250 - }, - { - "epoch": 0.67, - "learning_rate": 1.6582030364436014e-05, - "loss": 2.3681, - "step": 383260 - }, - { - "epoch": 0.67, - "learning_rate": 1.6581158424509184e-05, - "loss": 2.3302, - "step": 383270 - }, - { - "epoch": 0.67, - "learning_rate": 1.6580286484582358e-05, - "loss": 2.2612, - "step": 383280 - }, - { - "epoch": 0.67, - "learning_rate": 1.6579414544655532e-05, - "loss": 2.3644, - "step": 383290 - }, - { - "epoch": 0.67, - "learning_rate": 1.6578542604728706e-05, - "loss": 2.2808, - "step": 383300 - }, - { - "epoch": 0.67, - "learning_rate": 1.657767066480188e-05, - "loss": 2.2947, - "step": 383310 - }, - { - "epoch": 0.67, - "learning_rate": 1.657679872487505e-05, - "loss": 2.388, - "step": 383320 - }, - { - "epoch": 0.67, - "learning_rate": 1.6575926784948227e-05, - "loss": 2.3094, - "step": 383330 - }, - { - "epoch": 0.67, - "learning_rate": 1.6575054845021397e-05, - "loss": 2.3513, - "step": 383340 - }, - { - "epoch": 0.67, - "learning_rate": 1.657418290509457e-05, - "loss": 2.3885, - "step": 383350 - }, - { - "epoch": 0.67, - "learning_rate": 1.6573310965167745e-05, - "loss": 2.4149, - "step": 383360 - }, - { - "epoch": 0.67, - "learning_rate": 1.657243902524092e-05, - "loss": 2.2335, - "step": 383370 - }, - { - "epoch": 0.67, - "learning_rate": 1.6571567085314092e-05, - "loss": 2.2693, - "step": 383380 - }, - { - "epoch": 0.67, - "learning_rate": 1.6570695145387263e-05, - "loss": 2.317, - "step": 383390 - }, - { - "epoch": 0.67, - "learning_rate": 1.656982320546044e-05, - "loss": 2.227, - "step": 383400 - }, - { - "epoch": 0.67, - "learning_rate": 1.656895126553361e-05, - "loss": 2.4342, - "step": 383410 - }, - { - "epoch": 0.67, - "learning_rate": 1.6568079325606784e-05, - "loss": 2.3441, - "step": 383420 - }, - { - "epoch": 0.67, - "learning_rate": 1.6567207385679954e-05, - "loss": 2.3078, - "step": 383430 - }, - { - "epoch": 0.67, - "learning_rate": 1.656633544575313e-05, - "loss": 2.2717, - "step": 383440 - }, - { - "epoch": 0.67, - "learning_rate": 1.6565463505826302e-05, - "loss": 2.2535, - "step": 383450 - }, - { - "epoch": 0.67, - "learning_rate": 1.6564591565899476e-05, - "loss": 2.3508, - "step": 383460 - }, - { - "epoch": 0.67, - "learning_rate": 1.656371962597265e-05, - "loss": 2.2249, - "step": 383470 - }, - { - "epoch": 0.67, - "learning_rate": 1.6562847686045823e-05, - "loss": 2.3052, - "step": 383480 - }, - { - "epoch": 0.67, - "learning_rate": 1.6561975746118997e-05, - "loss": 2.2736, - "step": 383490 - }, - { - "epoch": 0.67, - "learning_rate": 1.6561103806192167e-05, - "loss": 2.3362, - "step": 383500 - }, - { - "epoch": 0.67, - "learning_rate": 1.6560231866265345e-05, - "loss": 2.4029, - "step": 383510 - }, - { - "epoch": 0.67, - "learning_rate": 1.6559359926338515e-05, - "loss": 2.3601, - "step": 383520 - }, - { - "epoch": 0.67, - "learning_rate": 1.655848798641169e-05, - "loss": 2.4466, - "step": 383530 - }, - { - "epoch": 0.67, - "learning_rate": 1.6557616046484862e-05, - "loss": 2.2657, - "step": 383540 - }, - { - "epoch": 0.67, - "learning_rate": 1.6556744106558036e-05, - "loss": 2.3483, - "step": 383550 - }, - { - "epoch": 0.67, - "learning_rate": 1.655587216663121e-05, - "loss": 2.2738, - "step": 383560 - }, - { - "epoch": 0.67, - "learning_rate": 1.655500022670438e-05, - "loss": 2.2752, - "step": 383570 - }, - { - "epoch": 0.67, - "learning_rate": 1.6554128286777554e-05, - "loss": 2.1125, - "step": 383580 - }, - { - "epoch": 0.67, - "learning_rate": 1.6553256346850728e-05, - "loss": 2.2682, - "step": 383590 - }, - { - "epoch": 0.67, - "learning_rate": 1.6552384406923902e-05, - "loss": 2.2447, - "step": 383600 - }, - { - "epoch": 0.67, - "learning_rate": 1.6551512466997075e-05, - "loss": 2.2187, - "step": 383610 - }, - { - "epoch": 0.67, - "learning_rate": 1.655064052707025e-05, - "loss": 2.3112, - "step": 383620 - }, - { - "epoch": 0.67, - "learning_rate": 1.6549768587143423e-05, - "loss": 2.337, - "step": 383630 - }, - { - "epoch": 0.67, - "learning_rate": 1.6548896647216593e-05, - "loss": 2.3681, - "step": 383640 - }, - { - "epoch": 0.67, - "learning_rate": 1.6548024707289767e-05, - "loss": 2.2993, - "step": 383650 - }, - { - "epoch": 0.67, - "learning_rate": 1.654715276736294e-05, - "loss": 2.3044, - "step": 383660 - }, - { - "epoch": 0.67, - "learning_rate": 1.6546280827436115e-05, - "loss": 2.2956, - "step": 383670 - }, - { - "epoch": 0.67, - "learning_rate": 1.6545408887509285e-05, - "loss": 2.3278, - "step": 383680 - }, - { - "epoch": 0.67, - "learning_rate": 1.654453694758246e-05, - "loss": 2.3542, - "step": 383690 - }, - { - "epoch": 0.67, - "learning_rate": 1.6543665007655633e-05, - "loss": 2.3193, - "step": 383700 - }, - { - "epoch": 0.67, - "learning_rate": 1.6542793067728806e-05, - "loss": 2.3365, - "step": 383710 - }, - { - "epoch": 0.67, - "learning_rate": 1.654192112780198e-05, - "loss": 2.326, - "step": 383720 - }, - { - "epoch": 0.67, - "learning_rate": 1.654104918787515e-05, - "loss": 2.3246, - "step": 383730 - }, - { - "epoch": 0.67, - "learning_rate": 1.6540177247948328e-05, - "loss": 2.3278, - "step": 383740 - }, - { - "epoch": 0.67, - "learning_rate": 1.6539305308021498e-05, - "loss": 2.3247, - "step": 383750 - }, - { - "epoch": 0.67, - "learning_rate": 1.6538433368094672e-05, - "loss": 2.3438, - "step": 383760 - }, - { - "epoch": 0.67, - "learning_rate": 1.6537561428167846e-05, - "loss": 2.3283, - "step": 383770 - }, - { - "epoch": 0.67, - "learning_rate": 1.653668948824102e-05, - "loss": 2.2961, - "step": 383780 - }, - { - "epoch": 0.67, - "learning_rate": 1.6535817548314193e-05, - "loss": 2.3763, - "step": 383790 - }, - { - "epoch": 0.67, - "learning_rate": 1.6534945608387364e-05, - "loss": 2.329, - "step": 383800 - }, - { - "epoch": 0.67, - "learning_rate": 1.653407366846054e-05, - "loss": 2.2488, - "step": 383810 - }, - { - "epoch": 0.67, - "learning_rate": 1.653320172853371e-05, - "loss": 2.2662, - "step": 383820 - }, - { - "epoch": 0.67, - "learning_rate": 1.6532329788606885e-05, - "loss": 2.2902, - "step": 383830 - }, - { - "epoch": 0.67, - "learning_rate": 1.653145784868006e-05, - "loss": 2.2629, - "step": 383840 - }, - { - "epoch": 0.67, - "learning_rate": 1.6530585908753232e-05, - "loss": 2.1779, - "step": 383850 - }, - { - "epoch": 0.67, - "learning_rate": 1.6529713968826406e-05, - "loss": 2.2899, - "step": 383860 - }, - { - "epoch": 0.67, - "learning_rate": 1.6528842028899577e-05, - "loss": 2.3404, - "step": 383870 - }, - { - "epoch": 0.67, - "learning_rate": 1.652797008897275e-05, - "loss": 2.3683, - "step": 383880 - }, - { - "epoch": 0.67, - "learning_rate": 1.6527098149045924e-05, - "loss": 2.1878, - "step": 383890 - }, - { - "epoch": 0.67, - "learning_rate": 1.6526226209119098e-05, - "loss": 2.3709, - "step": 383900 - }, - { - "epoch": 0.67, - "learning_rate": 1.6525354269192268e-05, - "loss": 2.2331, - "step": 383910 - }, - { - "epoch": 0.67, - "learning_rate": 1.6524482329265445e-05, - "loss": 2.2887, - "step": 383920 - }, - { - "epoch": 0.67, - "learning_rate": 1.6523610389338616e-05, - "loss": 2.1949, - "step": 383930 - }, - { - "epoch": 0.67, - "learning_rate": 1.652273844941179e-05, - "loss": 2.2646, - "step": 383940 - }, - { - "epoch": 0.67, - "learning_rate": 1.6521866509484963e-05, - "loss": 2.3897, - "step": 383950 - }, - { - "epoch": 0.67, - "learning_rate": 1.6520994569558137e-05, - "loss": 2.3245, - "step": 383960 - }, - { - "epoch": 0.67, - "learning_rate": 1.652012262963131e-05, - "loss": 2.3813, - "step": 383970 - }, - { - "epoch": 0.67, - "learning_rate": 1.651925068970448e-05, - "loss": 2.2748, - "step": 383980 - }, - { - "epoch": 0.67, - "learning_rate": 1.6518378749777655e-05, - "loss": 2.4129, - "step": 383990 - }, - { - "epoch": 0.67, - "learning_rate": 1.651750680985083e-05, - "loss": 2.3229, - "step": 384000 - }, - { - "epoch": 0.67, - "learning_rate": 1.6516634869924003e-05, - "loss": 2.2889, - "step": 384010 - }, - { - "epoch": 0.67, - "learning_rate": 1.6515762929997176e-05, - "loss": 2.1643, - "step": 384020 - }, - { - "epoch": 0.67, - "learning_rate": 1.651489099007035e-05, - "loss": 2.3087, - "step": 384030 - }, - { - "epoch": 0.67, - "learning_rate": 1.6514019050143524e-05, - "loss": 2.2223, - "step": 384040 - }, - { - "epoch": 0.67, - "learning_rate": 1.6513147110216694e-05, - "loss": 2.3804, - "step": 384050 - }, - { - "epoch": 0.67, - "learning_rate": 1.6512275170289868e-05, - "loss": 2.417, - "step": 384060 - }, - { - "epoch": 0.67, - "learning_rate": 1.6511403230363042e-05, - "loss": 2.1915, - "step": 384070 - }, - { - "epoch": 0.67, - "learning_rate": 1.6510531290436216e-05, - "loss": 2.3911, - "step": 384080 - }, - { - "epoch": 0.67, - "learning_rate": 1.650965935050939e-05, - "loss": 2.3231, - "step": 384090 - }, - { - "epoch": 0.67, - "learning_rate": 1.650878741058256e-05, - "loss": 2.3895, - "step": 384100 - }, - { - "epoch": 0.67, - "learning_rate": 1.6507915470655737e-05, - "loss": 2.3471, - "step": 384110 - }, - { - "epoch": 0.67, - "learning_rate": 1.6507043530728907e-05, - "loss": 2.2365, - "step": 384120 - }, - { - "epoch": 0.67, - "learning_rate": 1.650617159080208e-05, - "loss": 2.2926, - "step": 384130 - }, - { - "epoch": 0.67, - "learning_rate": 1.650529965087525e-05, - "loss": 2.3215, - "step": 384140 - }, - { - "epoch": 0.67, - "learning_rate": 1.650442771094843e-05, - "loss": 2.286, - "step": 384150 - }, - { - "epoch": 0.67, - "learning_rate": 1.65035557710216e-05, - "loss": 2.429, - "step": 384160 - }, - { - "epoch": 0.67, - "learning_rate": 1.6502683831094773e-05, - "loss": 2.3624, - "step": 384170 - }, - { - "epoch": 0.67, - "learning_rate": 1.6501811891167946e-05, - "loss": 2.3039, - "step": 384180 - }, - { - "epoch": 0.67, - "learning_rate": 1.650093995124112e-05, - "loss": 2.2557, - "step": 384190 - }, - { - "epoch": 0.67, - "learning_rate": 1.6500068011314294e-05, - "loss": 2.4242, - "step": 384200 - }, - { - "epoch": 0.67, - "learning_rate": 1.6499196071387464e-05, - "loss": 2.341, - "step": 384210 - }, - { - "epoch": 0.67, - "learning_rate": 1.649832413146064e-05, - "loss": 2.2176, - "step": 384220 - }, - { - "epoch": 0.67, - "learning_rate": 1.6497452191533812e-05, - "loss": 2.3336, - "step": 384230 - }, - { - "epoch": 0.67, - "learning_rate": 1.6496580251606986e-05, - "loss": 2.2281, - "step": 384240 - }, - { - "epoch": 0.67, - "learning_rate": 1.649570831168016e-05, - "loss": 2.238, - "step": 384250 - }, - { - "epoch": 0.67, - "learning_rate": 1.6494836371753333e-05, - "loss": 2.2991, - "step": 384260 - }, - { - "epoch": 0.67, - "learning_rate": 1.6493964431826507e-05, - "loss": 2.2564, - "step": 384270 - }, - { - "epoch": 0.67, - "learning_rate": 1.6493092491899677e-05, - "loss": 2.332, - "step": 384280 - }, - { - "epoch": 0.67, - "learning_rate": 1.6492220551972855e-05, - "loss": 2.2224, - "step": 384290 - }, - { - "epoch": 0.67, - "learning_rate": 1.6491348612046025e-05, - "loss": 2.3799, - "step": 384300 - }, - { - "epoch": 0.67, - "learning_rate": 1.64904766721192e-05, - "loss": 2.313, - "step": 384310 - }, - { - "epoch": 0.67, - "learning_rate": 1.6489604732192372e-05, - "loss": 2.3546, - "step": 384320 - }, - { - "epoch": 0.67, - "learning_rate": 1.6488732792265546e-05, - "loss": 2.3152, - "step": 384330 - }, - { - "epoch": 0.67, - "learning_rate": 1.648786085233872e-05, - "loss": 2.3331, - "step": 384340 - }, - { - "epoch": 0.67, - "learning_rate": 1.648698891241189e-05, - "loss": 2.2596, - "step": 384350 - }, - { - "epoch": 0.67, - "learning_rate": 1.6486116972485064e-05, - "loss": 2.3657, - "step": 384360 - }, - { - "epoch": 0.67, - "learning_rate": 1.6485245032558238e-05, - "loss": 2.3099, - "step": 384370 - }, - { - "epoch": 0.67, - "learning_rate": 1.6484373092631412e-05, - "loss": 2.2383, - "step": 384380 - }, - { - "epoch": 0.67, - "learning_rate": 1.6483501152704582e-05, - "loss": 2.3243, - "step": 384390 - }, - { - "epoch": 0.67, - "learning_rate": 1.6482629212777756e-05, - "loss": 2.2838, - "step": 384400 - }, - { - "epoch": 0.67, - "learning_rate": 1.648175727285093e-05, - "loss": 2.3511, - "step": 384410 - }, - { - "epoch": 0.67, - "learning_rate": 1.6480885332924103e-05, - "loss": 2.3273, - "step": 384420 - }, - { - "epoch": 0.67, - "learning_rate": 1.6480013392997277e-05, - "loss": 2.2138, - "step": 384430 - }, - { - "epoch": 0.67, - "learning_rate": 1.647914145307045e-05, - "loss": 2.3739, - "step": 384440 - }, - { - "epoch": 0.67, - "learning_rate": 1.6478269513143625e-05, - "loss": 2.3068, - "step": 384450 - }, - { - "epoch": 0.67, - "learning_rate": 1.6477397573216795e-05, - "loss": 2.2871, - "step": 384460 - }, - { - "epoch": 0.67, - "learning_rate": 1.647652563328997e-05, - "loss": 2.3211, - "step": 384470 - }, - { - "epoch": 0.67, - "learning_rate": 1.6475653693363143e-05, - "loss": 2.3166, - "step": 384480 - }, - { - "epoch": 0.67, - "learning_rate": 1.6474781753436316e-05, - "loss": 2.3668, - "step": 384490 - }, - { - "epoch": 0.67, - "learning_rate": 1.647390981350949e-05, - "loss": 2.3507, - "step": 384500 - }, - { - "epoch": 0.67, - "learning_rate": 1.647303787358266e-05, - "loss": 2.3186, - "step": 384510 - }, - { - "epoch": 0.67, - "learning_rate": 1.6472165933655838e-05, - "loss": 2.3062, - "step": 384520 - }, - { - "epoch": 0.67, - "learning_rate": 1.6471293993729008e-05, - "loss": 2.3427, - "step": 384530 - }, - { - "epoch": 0.67, - "learning_rate": 1.6470422053802182e-05, - "loss": 2.2379, - "step": 384540 - }, - { - "epoch": 0.67, - "learning_rate": 1.6469550113875352e-05, - "loss": 2.2514, - "step": 384550 - }, - { - "epoch": 0.67, - "learning_rate": 1.646867817394853e-05, - "loss": 2.2184, - "step": 384560 - }, - { - "epoch": 0.67, - "learning_rate": 1.6467806234021703e-05, - "loss": 2.3732, - "step": 384570 - }, - { - "epoch": 0.67, - "learning_rate": 1.6466934294094874e-05, - "loss": 2.3661, - "step": 384580 - }, - { - "epoch": 0.67, - "learning_rate": 1.646606235416805e-05, - "loss": 2.2352, - "step": 384590 - }, - { - "epoch": 0.67, - "learning_rate": 1.646519041424122e-05, - "loss": 2.2022, - "step": 384600 - }, - { - "epoch": 0.67, - "learning_rate": 1.6464318474314395e-05, - "loss": 2.21, - "step": 384610 - }, - { - "epoch": 0.67, - "learning_rate": 1.6463446534387565e-05, - "loss": 2.3543, - "step": 384620 - }, - { - "epoch": 0.67, - "learning_rate": 1.6462574594460742e-05, - "loss": 2.3119, - "step": 384630 - }, - { - "epoch": 0.67, - "learning_rate": 1.6461702654533913e-05, - "loss": 2.2795, - "step": 384640 - }, - { - "epoch": 0.67, - "learning_rate": 1.6460830714607087e-05, - "loss": 2.2887, - "step": 384650 - }, - { - "epoch": 0.67, - "learning_rate": 1.645995877468026e-05, - "loss": 2.29, - "step": 384660 - }, - { - "epoch": 0.67, - "learning_rate": 1.6459086834753434e-05, - "loss": 2.2528, - "step": 384670 - }, - { - "epoch": 0.67, - "learning_rate": 1.6458214894826608e-05, - "loss": 2.2412, - "step": 384680 - }, - { - "epoch": 0.67, - "learning_rate": 1.6457342954899778e-05, - "loss": 2.2968, - "step": 384690 - }, - { - "epoch": 0.67, - "learning_rate": 1.6456471014972955e-05, - "loss": 2.2801, - "step": 384700 - }, - { - "epoch": 0.67, - "learning_rate": 1.6455599075046126e-05, - "loss": 2.1281, - "step": 384710 - }, - { - "epoch": 0.67, - "learning_rate": 1.64547271351193e-05, - "loss": 2.2011, - "step": 384720 - }, - { - "epoch": 0.67, - "learning_rate": 1.6453855195192473e-05, - "loss": 2.3534, - "step": 384730 - }, - { - "epoch": 0.67, - "learning_rate": 1.6452983255265647e-05, - "loss": 2.2849, - "step": 384740 - }, - { - "epoch": 0.67, - "learning_rate": 1.645211131533882e-05, - "loss": 2.2978, - "step": 384750 - }, - { - "epoch": 0.67, - "learning_rate": 1.645123937541199e-05, - "loss": 2.3677, - "step": 384760 - }, - { - "epoch": 0.67, - "learning_rate": 1.6450367435485165e-05, - "loss": 2.3098, - "step": 384770 - }, - { - "epoch": 0.67, - "learning_rate": 1.644949549555834e-05, - "loss": 2.3067, - "step": 384780 - }, - { - "epoch": 0.67, - "learning_rate": 1.6448623555631513e-05, - "loss": 2.3002, - "step": 384790 - }, - { - "epoch": 0.67, - "learning_rate": 1.6447751615704683e-05, - "loss": 2.3699, - "step": 384800 - }, - { - "epoch": 0.67, - "learning_rate": 1.6446879675777857e-05, - "loss": 2.3006, - "step": 384810 - }, - { - "epoch": 0.67, - "learning_rate": 1.6446007735851034e-05, - "loss": 2.2576, - "step": 384820 - }, - { - "epoch": 0.67, - "learning_rate": 1.6445135795924204e-05, - "loss": 2.3797, - "step": 384830 - }, - { - "epoch": 0.67, - "learning_rate": 1.6444263855997378e-05, - "loss": 2.2982, - "step": 384840 - }, - { - "epoch": 0.67, - "learning_rate": 1.6443391916070552e-05, - "loss": 2.2108, - "step": 384850 - }, - { - "epoch": 0.67, - "learning_rate": 1.6442519976143726e-05, - "loss": 2.3165, - "step": 384860 - }, - { - "epoch": 0.67, - "learning_rate": 1.6441648036216896e-05, - "loss": 2.2098, - "step": 384870 - }, - { - "epoch": 0.67, - "learning_rate": 1.644077609629007e-05, - "loss": 2.2942, - "step": 384880 - }, - { - "epoch": 0.67, - "learning_rate": 1.6439904156363243e-05, - "loss": 2.4215, - "step": 384890 - }, - { - "epoch": 0.67, - "learning_rate": 1.6439032216436417e-05, - "loss": 2.1985, - "step": 384900 - }, - { - "epoch": 0.67, - "learning_rate": 1.643816027650959e-05, - "loss": 2.3555, - "step": 384910 - }, - { - "epoch": 0.67, - "learning_rate": 1.643728833658276e-05, - "loss": 2.2582, - "step": 384920 - }, - { - "epoch": 0.67, - "learning_rate": 1.643641639665594e-05, - "loss": 2.2876, - "step": 384930 - }, - { - "epoch": 0.67, - "learning_rate": 1.643554445672911e-05, - "loss": 2.4529, - "step": 384940 - }, - { - "epoch": 0.67, - "learning_rate": 1.6434672516802283e-05, - "loss": 2.3395, - "step": 384950 - }, - { - "epoch": 0.67, - "learning_rate": 1.6433800576875456e-05, - "loss": 2.2897, - "step": 384960 - }, - { - "epoch": 0.67, - "learning_rate": 1.643292863694863e-05, - "loss": 2.4071, - "step": 384970 - }, - { - "epoch": 0.67, - "learning_rate": 1.6432056697021804e-05, - "loss": 2.3255, - "step": 384980 - }, - { - "epoch": 0.67, - "learning_rate": 1.6431184757094974e-05, - "loss": 2.3323, - "step": 384990 - }, - { - "epoch": 0.67, - "learning_rate": 1.643031281716815e-05, - "loss": 2.2351, - "step": 385000 - }, - { - "epoch": 0.67, - "learning_rate": 1.6429440877241322e-05, - "loss": 2.3315, - "step": 385010 - }, - { - "epoch": 0.67, - "learning_rate": 1.6428568937314496e-05, - "loss": 2.3603, - "step": 385020 - }, - { - "epoch": 0.67, - "learning_rate": 1.6427696997387666e-05, - "loss": 2.3197, - "step": 385030 - }, - { - "epoch": 0.67, - "learning_rate": 1.6426825057460843e-05, - "loss": 2.2585, - "step": 385040 - }, - { - "epoch": 0.67, - "learning_rate": 1.6425953117534017e-05, - "loss": 2.2167, - "step": 385050 - }, - { - "epoch": 0.67, - "learning_rate": 1.6425081177607187e-05, - "loss": 2.352, - "step": 385060 - }, - { - "epoch": 0.67, - "learning_rate": 1.642420923768036e-05, - "loss": 2.2672, - "step": 385070 - }, - { - "epoch": 0.67, - "learning_rate": 1.6423337297753535e-05, - "loss": 2.3062, - "step": 385080 - }, - { - "epoch": 0.67, - "learning_rate": 1.642246535782671e-05, - "loss": 2.349, - "step": 385090 - }, - { - "epoch": 0.67, - "learning_rate": 1.642159341789988e-05, - "loss": 2.3555, - "step": 385100 - }, - { - "epoch": 0.67, - "learning_rate": 1.6420721477973056e-05, - "loss": 2.2681, - "step": 385110 - }, - { - "epoch": 0.67, - "learning_rate": 1.6419849538046227e-05, - "loss": 2.4067, - "step": 385120 - }, - { - "epoch": 0.67, - "learning_rate": 1.64189775981194e-05, - "loss": 2.2577, - "step": 385130 - }, - { - "epoch": 0.67, - "learning_rate": 1.6418105658192574e-05, - "loss": 2.3237, - "step": 385140 - }, - { - "epoch": 0.67, - "learning_rate": 1.6417233718265748e-05, - "loss": 2.2397, - "step": 385150 - }, - { - "epoch": 0.67, - "learning_rate": 1.6416361778338922e-05, - "loss": 2.3509, - "step": 385160 - }, - { - "epoch": 0.67, - "learning_rate": 1.6415489838412092e-05, - "loss": 2.3446, - "step": 385170 - }, - { - "epoch": 0.67, - "learning_rate": 1.6414617898485266e-05, - "loss": 2.2651, - "step": 385180 - }, - { - "epoch": 0.67, - "learning_rate": 1.641374595855844e-05, - "loss": 2.2793, - "step": 385190 - }, - { - "epoch": 0.67, - "learning_rate": 1.6412874018631613e-05, - "loss": 2.403, - "step": 385200 - }, - { - "epoch": 0.67, - "learning_rate": 1.6412002078704787e-05, - "loss": 2.3456, - "step": 385210 - }, - { - "epoch": 0.67, - "learning_rate": 1.641113013877796e-05, - "loss": 2.1723, - "step": 385220 - }, - { - "epoch": 0.67, - "learning_rate": 1.6410258198851135e-05, - "loss": 2.249, - "step": 385230 - }, - { - "epoch": 0.67, - "learning_rate": 1.6409386258924305e-05, - "loss": 2.266, - "step": 385240 - }, - { - "epoch": 0.67, - "learning_rate": 1.640851431899748e-05, - "loss": 2.4174, - "step": 385250 - }, - { - "epoch": 0.67, - "learning_rate": 1.6407642379070653e-05, - "loss": 2.4106, - "step": 385260 - }, - { - "epoch": 0.67, - "learning_rate": 1.6406770439143826e-05, - "loss": 2.2748, - "step": 385270 - }, - { - "epoch": 0.67, - "learning_rate": 1.6405898499216997e-05, - "loss": 2.4139, - "step": 385280 - }, - { - "epoch": 0.67, - "learning_rate": 1.640502655929017e-05, - "loss": 2.3249, - "step": 385290 - }, - { - "epoch": 0.67, - "learning_rate": 1.6404154619363348e-05, - "loss": 2.3214, - "step": 385300 - }, - { - "epoch": 0.67, - "learning_rate": 1.6403282679436518e-05, - "loss": 2.4261, - "step": 385310 - }, - { - "epoch": 0.67, - "learning_rate": 1.6402410739509692e-05, - "loss": 2.2295, - "step": 385320 - }, - { - "epoch": 0.67, - "learning_rate": 1.6401538799582862e-05, - "loss": 2.2841, - "step": 385330 - }, - { - "epoch": 0.67, - "learning_rate": 1.640066685965604e-05, - "loss": 2.2783, - "step": 385340 - }, - { - "epoch": 0.67, - "learning_rate": 1.639979491972921e-05, - "loss": 2.2538, - "step": 385350 - }, - { - "epoch": 0.67, - "learning_rate": 1.6398922979802384e-05, - "loss": 2.3461, - "step": 385360 - }, - { - "epoch": 0.67, - "learning_rate": 1.6398051039875557e-05, - "loss": 2.2454, - "step": 385370 - }, - { - "epoch": 0.67, - "learning_rate": 1.639717909994873e-05, - "loss": 2.3445, - "step": 385380 - }, - { - "epoch": 0.67, - "learning_rate": 1.6396307160021905e-05, - "loss": 2.3208, - "step": 385390 - }, - { - "epoch": 0.67, - "learning_rate": 1.6395435220095075e-05, - "loss": 2.3916, - "step": 385400 - }, - { - "epoch": 0.67, - "learning_rate": 1.6394563280168252e-05, - "loss": 2.4126, - "step": 385410 - }, - { - "epoch": 0.67, - "learning_rate": 1.6393691340241423e-05, - "loss": 2.3623, - "step": 385420 - }, - { - "epoch": 0.67, - "learning_rate": 1.6392819400314597e-05, - "loss": 2.2613, - "step": 385430 - }, - { - "epoch": 0.67, - "learning_rate": 1.639194746038777e-05, - "loss": 2.1604, - "step": 385440 - }, - { - "epoch": 0.67, - "learning_rate": 1.6391075520460944e-05, - "loss": 2.3776, - "step": 385450 - }, - { - "epoch": 0.67, - "learning_rate": 1.6390203580534118e-05, - "loss": 2.2632, - "step": 385460 - }, - { - "epoch": 0.67, - "learning_rate": 1.6389331640607288e-05, - "loss": 2.3779, - "step": 385470 - }, - { - "epoch": 0.67, - "learning_rate": 1.6388459700680462e-05, - "loss": 2.3125, - "step": 385480 - }, - { - "epoch": 0.67, - "learning_rate": 1.6387587760753636e-05, - "loss": 2.261, - "step": 385490 - }, - { - "epoch": 0.67, - "learning_rate": 1.638671582082681e-05, - "loss": 2.3167, - "step": 385500 - }, - { - "epoch": 0.67, - "learning_rate": 1.638584388089998e-05, - "loss": 2.2813, - "step": 385510 - }, - { - "epoch": 0.67, - "learning_rate": 1.6384971940973157e-05, - "loss": 2.3636, - "step": 385520 - }, - { - "epoch": 0.67, - "learning_rate": 1.6384100001046327e-05, - "loss": 2.3255, - "step": 385530 - }, - { - "epoch": 0.67, - "learning_rate": 1.63832280611195e-05, - "loss": 2.3207, - "step": 385540 - }, - { - "epoch": 0.67, - "learning_rate": 1.6382356121192675e-05, - "loss": 2.3033, - "step": 385550 - }, - { - "epoch": 0.67, - "learning_rate": 1.638148418126585e-05, - "loss": 2.2208, - "step": 385560 - }, - { - "epoch": 0.67, - "learning_rate": 1.6380612241339023e-05, - "loss": 2.3159, - "step": 385570 - }, - { - "epoch": 0.67, - "learning_rate": 1.6379740301412193e-05, - "loss": 2.3398, - "step": 385580 - }, - { - "epoch": 0.67, - "learning_rate": 1.6378868361485367e-05, - "loss": 2.3172, - "step": 385590 - }, - { - "epoch": 0.67, - "learning_rate": 1.637799642155854e-05, - "loss": 2.3732, - "step": 385600 - }, - { - "epoch": 0.67, - "learning_rate": 1.6377124481631714e-05, - "loss": 2.4041, - "step": 385610 - }, - { - "epoch": 0.67, - "learning_rate": 1.6376252541704888e-05, - "loss": 2.2254, - "step": 385620 - }, - { - "epoch": 0.67, - "learning_rate": 1.6375380601778062e-05, - "loss": 2.4214, - "step": 385630 - }, - { - "epoch": 0.67, - "learning_rate": 1.6374508661851236e-05, - "loss": 2.2592, - "step": 385640 - }, - { - "epoch": 0.67, - "learning_rate": 1.6373636721924406e-05, - "loss": 2.2787, - "step": 385650 - }, - { - "epoch": 0.67, - "learning_rate": 1.637276478199758e-05, - "loss": 2.2956, - "step": 385660 - }, - { - "epoch": 0.67, - "learning_rate": 1.6371892842070753e-05, - "loss": 2.3091, - "step": 385670 - }, - { - "epoch": 0.67, - "learning_rate": 1.6371020902143927e-05, - "loss": 2.3977, - "step": 385680 - }, - { - "epoch": 0.67, - "learning_rate": 1.63701489622171e-05, - "loss": 2.3555, - "step": 385690 - }, - { - "epoch": 0.67, - "learning_rate": 1.636927702229027e-05, - "loss": 2.3177, - "step": 385700 - }, - { - "epoch": 0.67, - "learning_rate": 1.636840508236345e-05, - "loss": 2.4001, - "step": 385710 - }, - { - "epoch": 0.67, - "learning_rate": 1.636753314243662e-05, - "loss": 2.3269, - "step": 385720 - }, - { - "epoch": 0.67, - "learning_rate": 1.6366661202509793e-05, - "loss": 2.2939, - "step": 385730 - }, - { - "epoch": 0.67, - "learning_rate": 1.6365789262582963e-05, - "loss": 2.3137, - "step": 385740 - }, - { - "epoch": 0.67, - "learning_rate": 1.636491732265614e-05, - "loss": 2.3548, - "step": 385750 - }, - { - "epoch": 0.67, - "learning_rate": 1.636404538272931e-05, - "loss": 2.3632, - "step": 385760 - }, - { - "epoch": 0.67, - "learning_rate": 1.6363173442802484e-05, - "loss": 2.4345, - "step": 385770 - }, - { - "epoch": 0.67, - "learning_rate": 1.636230150287566e-05, - "loss": 2.2999, - "step": 385780 - }, - { - "epoch": 0.67, - "learning_rate": 1.6361429562948832e-05, - "loss": 2.3895, - "step": 385790 - }, - { - "epoch": 0.67, - "learning_rate": 1.6360557623022006e-05, - "loss": 2.3951, - "step": 385800 - }, - { - "epoch": 0.67, - "learning_rate": 1.6359685683095176e-05, - "loss": 2.3259, - "step": 385810 - }, - { - "epoch": 0.67, - "learning_rate": 1.6358813743168353e-05, - "loss": 2.2434, - "step": 385820 - }, - { - "epoch": 0.67, - "learning_rate": 1.6357941803241524e-05, - "loss": 2.3368, - "step": 385830 - }, - { - "epoch": 0.67, - "learning_rate": 1.6357069863314697e-05, - "loss": 2.2976, - "step": 385840 - }, - { - "epoch": 0.67, - "learning_rate": 1.635619792338787e-05, - "loss": 2.284, - "step": 385850 - }, - { - "epoch": 0.67, - "learning_rate": 1.6355325983461045e-05, - "loss": 2.2439, - "step": 385860 - }, - { - "epoch": 0.67, - "learning_rate": 1.635445404353422e-05, - "loss": 2.2904, - "step": 385870 - }, - { - "epoch": 0.67, - "learning_rate": 1.635358210360739e-05, - "loss": 2.2547, - "step": 385880 - }, - { - "epoch": 0.67, - "learning_rate": 1.6352710163680566e-05, - "loss": 2.3589, - "step": 385890 - }, - { - "epoch": 0.67, - "learning_rate": 1.6351838223753737e-05, - "loss": 2.3053, - "step": 385900 - }, - { - "epoch": 0.67, - "learning_rate": 1.635096628382691e-05, - "loss": 2.2555, - "step": 385910 - }, - { - "epoch": 0.67, - "learning_rate": 1.6350094343900084e-05, - "loss": 2.2956, - "step": 385920 - }, - { - "epoch": 0.67, - "learning_rate": 1.6349222403973258e-05, - "loss": 2.3162, - "step": 385930 - }, - { - "epoch": 0.67, - "learning_rate": 1.6348350464046432e-05, - "loss": 2.3408, - "step": 385940 - }, - { - "epoch": 0.67, - "learning_rate": 1.6347478524119602e-05, - "loss": 2.2444, - "step": 385950 - }, - { - "epoch": 0.67, - "learning_rate": 1.6346606584192776e-05, - "loss": 2.2127, - "step": 385960 - }, - { - "epoch": 0.67, - "learning_rate": 1.634573464426595e-05, - "loss": 2.2073, - "step": 385970 - }, - { - "epoch": 0.67, - "learning_rate": 1.6344862704339123e-05, - "loss": 2.1937, - "step": 385980 - }, - { - "epoch": 0.67, - "learning_rate": 1.6343990764412294e-05, - "loss": 2.3366, - "step": 385990 - }, - { - "epoch": 0.67, - "learning_rate": 1.6343118824485468e-05, - "loss": 2.3472, - "step": 386000 - }, - { - "epoch": 0.67, - "learning_rate": 1.634224688455864e-05, - "loss": 2.4187, - "step": 386010 - }, - { - "epoch": 0.67, - "learning_rate": 1.6341374944631815e-05, - "loss": 2.3379, - "step": 386020 - }, - { - "epoch": 0.67, - "learning_rate": 1.634050300470499e-05, - "loss": 2.3374, - "step": 386030 - }, - { - "epoch": 0.67, - "learning_rate": 1.6339631064778163e-05, - "loss": 2.2241, - "step": 386040 - }, - { - "epoch": 0.67, - "learning_rate": 1.6338759124851336e-05, - "loss": 2.289, - "step": 386050 - }, - { - "epoch": 0.67, - "learning_rate": 1.6337887184924507e-05, - "loss": 2.2513, - "step": 386060 - }, - { - "epoch": 0.67, - "learning_rate": 1.633701524499768e-05, - "loss": 2.3366, - "step": 386070 - }, - { - "epoch": 0.67, - "learning_rate": 1.6336143305070854e-05, - "loss": 2.3317, - "step": 386080 - }, - { - "epoch": 0.67, - "learning_rate": 1.6335271365144028e-05, - "loss": 2.2743, - "step": 386090 - }, - { - "epoch": 0.67, - "learning_rate": 1.6334399425217202e-05, - "loss": 2.3952, - "step": 386100 - }, - { - "epoch": 0.67, - "learning_rate": 1.6333527485290372e-05, - "loss": 2.3662, - "step": 386110 - }, - { - "epoch": 0.67, - "learning_rate": 1.633265554536355e-05, - "loss": 2.3667, - "step": 386120 - }, - { - "epoch": 0.67, - "learning_rate": 1.633178360543672e-05, - "loss": 2.3576, - "step": 386130 - }, - { - "epoch": 0.67, - "learning_rate": 1.6330911665509894e-05, - "loss": 2.2789, - "step": 386140 - }, - { - "epoch": 0.67, - "learning_rate": 1.6330039725583067e-05, - "loss": 2.2935, - "step": 386150 - }, - { - "epoch": 0.67, - "learning_rate": 1.632916778565624e-05, - "loss": 2.2922, - "step": 386160 - }, - { - "epoch": 0.67, - "learning_rate": 1.6328295845729415e-05, - "loss": 2.2855, - "step": 386170 - }, - { - "epoch": 0.67, - "learning_rate": 1.6327423905802585e-05, - "loss": 2.4108, - "step": 386180 - }, - { - "epoch": 0.67, - "learning_rate": 1.6326551965875762e-05, - "loss": 2.3397, - "step": 386190 - }, - { - "epoch": 0.67, - "learning_rate": 1.6325680025948933e-05, - "loss": 2.2701, - "step": 386200 - }, - { - "epoch": 0.67, - "learning_rate": 1.6324808086022107e-05, - "loss": 2.3671, - "step": 386210 - }, - { - "epoch": 0.67, - "learning_rate": 1.6323936146095277e-05, - "loss": 2.3247, - "step": 386220 - }, - { - "epoch": 0.67, - "learning_rate": 1.6323064206168454e-05, - "loss": 2.3158, - "step": 386230 - }, - { - "epoch": 0.67, - "learning_rate": 1.6322192266241624e-05, - "loss": 2.3157, - "step": 386240 - }, - { - "epoch": 0.67, - "learning_rate": 1.6321320326314798e-05, - "loss": 2.281, - "step": 386250 - }, - { - "epoch": 0.67, - "learning_rate": 1.6320448386387972e-05, - "loss": 2.4329, - "step": 386260 - }, - { - "epoch": 0.67, - "learning_rate": 1.6319576446461146e-05, - "loss": 2.3614, - "step": 386270 - }, - { - "epoch": 0.67, - "learning_rate": 1.631870450653432e-05, - "loss": 2.342, - "step": 386280 - }, - { - "epoch": 0.67, - "learning_rate": 1.631783256660749e-05, - "loss": 2.3859, - "step": 386290 - }, - { - "epoch": 0.67, - "learning_rate": 1.6316960626680667e-05, - "loss": 2.4238, - "step": 386300 - }, - { - "epoch": 0.67, - "learning_rate": 1.6316088686753837e-05, - "loss": 2.2738, - "step": 386310 - }, - { - "epoch": 0.67, - "learning_rate": 1.631521674682701e-05, - "loss": 2.3811, - "step": 386320 - }, - { - "epoch": 0.67, - "learning_rate": 1.6314344806900185e-05, - "loss": 2.2698, - "step": 386330 - }, - { - "epoch": 0.67, - "learning_rate": 1.631347286697336e-05, - "loss": 2.2429, - "step": 386340 - }, - { - "epoch": 0.67, - "learning_rate": 1.6312600927046533e-05, - "loss": 2.3438, - "step": 386350 - }, - { - "epoch": 0.67, - "learning_rate": 1.6311728987119703e-05, - "loss": 2.3092, - "step": 386360 - }, - { - "epoch": 0.67, - "learning_rate": 1.6310857047192877e-05, - "loss": 2.3755, - "step": 386370 - }, - { - "epoch": 0.67, - "learning_rate": 1.630998510726605e-05, - "loss": 2.3667, - "step": 386380 - }, - { - "epoch": 0.67, - "learning_rate": 1.6309113167339224e-05, - "loss": 2.39, - "step": 386390 - }, - { - "epoch": 0.67, - "learning_rate": 1.6308241227412398e-05, - "loss": 2.2362, - "step": 386400 - }, - { - "epoch": 0.67, - "learning_rate": 1.630736928748557e-05, - "loss": 2.3752, - "step": 386410 - }, - { - "epoch": 0.67, - "learning_rate": 1.6306497347558746e-05, - "loss": 2.4639, - "step": 386420 - }, - { - "epoch": 0.67, - "learning_rate": 1.6305625407631916e-05, - "loss": 2.3282, - "step": 386430 - }, - { - "epoch": 0.67, - "learning_rate": 1.630475346770509e-05, - "loss": 2.352, - "step": 386440 - }, - { - "epoch": 0.67, - "learning_rate": 1.6303881527778263e-05, - "loss": 2.3803, - "step": 386450 - }, - { - "epoch": 0.67, - "learning_rate": 1.6303009587851437e-05, - "loss": 2.2347, - "step": 386460 - }, - { - "epoch": 0.67, - "learning_rate": 1.6302137647924608e-05, - "loss": 2.3141, - "step": 386470 - }, - { - "epoch": 0.67, - "learning_rate": 1.630126570799778e-05, - "loss": 2.3596, - "step": 386480 - }, - { - "epoch": 0.67, - "learning_rate": 1.6300393768070955e-05, - "loss": 2.2752, - "step": 386490 - }, - { - "epoch": 0.67, - "learning_rate": 1.629952182814413e-05, - "loss": 2.306, - "step": 386500 - }, - { - "epoch": 0.67, - "learning_rate": 1.6298649888217303e-05, - "loss": 2.4311, - "step": 386510 - }, - { - "epoch": 0.67, - "learning_rate": 1.6297777948290473e-05, - "loss": 2.3405, - "step": 386520 - }, - { - "epoch": 0.67, - "learning_rate": 1.629690600836365e-05, - "loss": 2.3042, - "step": 386530 - }, - { - "epoch": 0.67, - "learning_rate": 1.629603406843682e-05, - "loss": 2.3447, - "step": 386540 - }, - { - "epoch": 0.67, - "learning_rate": 1.6295162128509994e-05, - "loss": 2.2854, - "step": 386550 - }, - { - "epoch": 0.67, - "learning_rate": 1.6294290188583168e-05, - "loss": 2.2284, - "step": 386560 - }, - { - "epoch": 0.67, - "learning_rate": 1.6293418248656342e-05, - "loss": 2.2605, - "step": 386570 - }, - { - "epoch": 0.67, - "learning_rate": 1.6292546308729516e-05, - "loss": 2.3753, - "step": 386580 - }, - { - "epoch": 0.67, - "learning_rate": 1.6291674368802686e-05, - "loss": 2.2278, - "step": 386590 - }, - { - "epoch": 0.67, - "learning_rate": 1.6290802428875863e-05, - "loss": 2.3057, - "step": 386600 - }, - { - "epoch": 0.67, - "learning_rate": 1.6289930488949034e-05, - "loss": 2.3556, - "step": 386610 - }, - { - "epoch": 0.67, - "learning_rate": 1.6289058549022207e-05, - "loss": 2.3263, - "step": 386620 - }, - { - "epoch": 0.67, - "learning_rate": 1.6288186609095378e-05, - "loss": 2.2824, - "step": 386630 - }, - { - "epoch": 0.67, - "learning_rate": 1.6287314669168555e-05, - "loss": 2.3695, - "step": 386640 - }, - { - "epoch": 0.67, - "learning_rate": 1.628644272924173e-05, - "loss": 2.1703, - "step": 386650 - }, - { - "epoch": 0.67, - "learning_rate": 1.62855707893149e-05, - "loss": 2.328, - "step": 386660 - }, - { - "epoch": 0.67, - "learning_rate": 1.6284698849388073e-05, - "loss": 2.3304, - "step": 386670 - }, - { - "epoch": 0.67, - "learning_rate": 1.6283826909461247e-05, - "loss": 2.1823, - "step": 386680 - }, - { - "epoch": 0.67, - "learning_rate": 1.628295496953442e-05, - "loss": 2.3588, - "step": 386690 - }, - { - "epoch": 0.67, - "learning_rate": 1.628208302960759e-05, - "loss": 2.4082, - "step": 386700 - }, - { - "epoch": 0.67, - "learning_rate": 1.6281211089680768e-05, - "loss": 2.3514, - "step": 386710 - }, - { - "epoch": 0.67, - "learning_rate": 1.628033914975394e-05, - "loss": 2.3155, - "step": 386720 - }, - { - "epoch": 0.67, - "learning_rate": 1.6279467209827112e-05, - "loss": 2.2995, - "step": 386730 - }, - { - "epoch": 0.67, - "learning_rate": 1.6278595269900286e-05, - "loss": 2.2435, - "step": 386740 - }, - { - "epoch": 0.67, - "learning_rate": 1.627772332997346e-05, - "loss": 2.281, - "step": 386750 - }, - { - "epoch": 0.67, - "learning_rate": 1.6276851390046633e-05, - "loss": 2.3669, - "step": 386760 - }, - { - "epoch": 0.67, - "learning_rate": 1.6275979450119804e-05, - "loss": 2.2698, - "step": 386770 - }, - { - "epoch": 0.67, - "learning_rate": 1.6275107510192978e-05, - "loss": 2.3557, - "step": 386780 - }, - { - "epoch": 0.67, - "learning_rate": 1.627423557026615e-05, - "loss": 2.3314, - "step": 386790 - }, - { - "epoch": 0.67, - "learning_rate": 1.6273363630339325e-05, - "loss": 2.2671, - "step": 386800 - }, - { - "epoch": 0.67, - "learning_rate": 1.62724916904125e-05, - "loss": 2.3079, - "step": 386810 - }, - { - "epoch": 0.67, - "learning_rate": 1.6271619750485673e-05, - "loss": 2.2319, - "step": 386820 - }, - { - "epoch": 0.67, - "learning_rate": 1.6270747810558846e-05, - "loss": 2.3525, - "step": 386830 - }, - { - "epoch": 0.67, - "learning_rate": 1.6269875870632017e-05, - "loss": 2.394, - "step": 386840 - }, - { - "epoch": 0.67, - "learning_rate": 1.626900393070519e-05, - "loss": 2.3832, - "step": 386850 - }, - { - "epoch": 0.67, - "learning_rate": 1.6268131990778364e-05, - "loss": 2.2328, - "step": 386860 - }, - { - "epoch": 0.67, - "learning_rate": 1.6267260050851538e-05, - "loss": 2.3464, - "step": 386870 - }, - { - "epoch": 0.67, - "learning_rate": 1.626638811092471e-05, - "loss": 2.4198, - "step": 386880 - }, - { - "epoch": 0.67, - "learning_rate": 1.6265516170997882e-05, - "loss": 2.273, - "step": 386890 - }, - { - "epoch": 0.67, - "learning_rate": 1.626464423107106e-05, - "loss": 2.2415, - "step": 386900 - }, - { - "epoch": 0.67, - "learning_rate": 1.626377229114423e-05, - "loss": 2.3243, - "step": 386910 - }, - { - "epoch": 0.67, - "learning_rate": 1.6262900351217404e-05, - "loss": 2.3539, - "step": 386920 - }, - { - "epoch": 0.67, - "learning_rate": 1.6262028411290574e-05, - "loss": 2.3748, - "step": 386930 - }, - { - "epoch": 0.67, - "learning_rate": 1.626115647136375e-05, - "loss": 2.2985, - "step": 386940 - }, - { - "epoch": 0.67, - "learning_rate": 1.626028453143692e-05, - "loss": 2.2816, - "step": 386950 - }, - { - "epoch": 0.67, - "learning_rate": 1.6259412591510095e-05, - "loss": 2.3641, - "step": 386960 - }, - { - "epoch": 0.67, - "learning_rate": 1.625854065158327e-05, - "loss": 2.2918, - "step": 386970 - }, - { - "epoch": 0.67, - "learning_rate": 1.6257668711656443e-05, - "loss": 2.3491, - "step": 386980 - }, - { - "epoch": 0.67, - "learning_rate": 1.6256796771729617e-05, - "loss": 2.3451, - "step": 386990 - }, - { - "epoch": 0.67, - "learning_rate": 1.6255924831802787e-05, - "loss": 2.3667, - "step": 387000 - }, - { - "epoch": 0.67, - "learning_rate": 1.6255052891875964e-05, - "loss": 2.2892, - "step": 387010 - }, - { - "epoch": 0.67, - "learning_rate": 1.6254180951949135e-05, - "loss": 2.2838, - "step": 387020 - }, - { - "epoch": 0.67, - "learning_rate": 1.6253309012022308e-05, - "loss": 2.328, - "step": 387030 - }, - { - "epoch": 0.67, - "learning_rate": 1.6252437072095482e-05, - "loss": 2.1384, - "step": 387040 - }, - { - "epoch": 0.67, - "learning_rate": 1.6251565132168656e-05, - "loss": 2.4142, - "step": 387050 - }, - { - "epoch": 0.67, - "learning_rate": 1.625069319224183e-05, - "loss": 2.2928, - "step": 387060 - }, - { - "epoch": 0.68, - "learning_rate": 1.6249821252315e-05, - "loss": 2.3024, - "step": 387070 - }, - { - "epoch": 0.68, - "learning_rate": 1.6248949312388177e-05, - "loss": 2.2663, - "step": 387080 - }, - { - "epoch": 0.68, - "learning_rate": 1.6248077372461348e-05, - "loss": 2.1834, - "step": 387090 - }, - { - "epoch": 0.68, - "learning_rate": 1.624720543253452e-05, - "loss": 2.3416, - "step": 387100 - }, - { - "epoch": 0.68, - "learning_rate": 1.624633349260769e-05, - "loss": 2.3492, - "step": 387110 - }, - { - "epoch": 0.68, - "learning_rate": 1.624546155268087e-05, - "loss": 2.2675, - "step": 387120 - }, - { - "epoch": 0.68, - "learning_rate": 1.6244589612754043e-05, - "loss": 2.2827, - "step": 387130 - }, - { - "epoch": 0.68, - "learning_rate": 1.6243717672827213e-05, - "loss": 2.3195, - "step": 387140 - }, - { - "epoch": 0.68, - "learning_rate": 1.6242845732900387e-05, - "loss": 2.4508, - "step": 387150 - }, - { - "epoch": 0.68, - "learning_rate": 1.624197379297356e-05, - "loss": 2.426, - "step": 387160 - }, - { - "epoch": 0.68, - "learning_rate": 1.6241101853046734e-05, - "loss": 2.4835, - "step": 387170 - }, - { - "epoch": 0.68, - "learning_rate": 1.6240229913119905e-05, - "loss": 2.3315, - "step": 387180 - }, - { - "epoch": 0.68, - "learning_rate": 1.623935797319308e-05, - "loss": 2.2216, - "step": 387190 - }, - { - "epoch": 0.68, - "learning_rate": 1.6238486033266252e-05, - "loss": 2.322, - "step": 387200 - }, - { - "epoch": 0.68, - "learning_rate": 1.6237614093339426e-05, - "loss": 2.2465, - "step": 387210 - }, - { - "epoch": 0.68, - "learning_rate": 1.62367421534126e-05, - "loss": 2.3499, - "step": 387220 - }, - { - "epoch": 0.68, - "learning_rate": 1.6235870213485774e-05, - "loss": 2.3219, - "step": 387230 - }, - { - "epoch": 0.68, - "learning_rate": 1.6234998273558947e-05, - "loss": 2.1485, - "step": 387240 - }, - { - "epoch": 0.68, - "learning_rate": 1.6234126333632118e-05, - "loss": 2.3783, - "step": 387250 - }, - { - "epoch": 0.68, - "learning_rate": 1.623325439370529e-05, - "loss": 2.2715, - "step": 387260 - }, - { - "epoch": 0.68, - "learning_rate": 1.6232382453778465e-05, - "loss": 2.4805, - "step": 387270 - }, - { - "epoch": 0.68, - "learning_rate": 1.623151051385164e-05, - "loss": 2.3308, - "step": 387280 - }, - { - "epoch": 0.68, - "learning_rate": 1.6230638573924813e-05, - "loss": 2.2245, - "step": 387290 - }, - { - "epoch": 0.68, - "learning_rate": 1.6229766633997983e-05, - "loss": 2.3253, - "step": 387300 - }, - { - "epoch": 0.68, - "learning_rate": 1.622889469407116e-05, - "loss": 2.3687, - "step": 387310 - }, - { - "epoch": 0.68, - "learning_rate": 1.622802275414433e-05, - "loss": 2.2319, - "step": 387320 - }, - { - "epoch": 0.68, - "learning_rate": 1.6227150814217504e-05, - "loss": 2.3558, - "step": 387330 - }, - { - "epoch": 0.68, - "learning_rate": 1.6226278874290675e-05, - "loss": 2.3656, - "step": 387340 - }, - { - "epoch": 0.68, - "learning_rate": 1.6225406934363852e-05, - "loss": 2.3759, - "step": 387350 - }, - { - "epoch": 0.68, - "learning_rate": 1.6224534994437022e-05, - "loss": 2.3565, - "step": 387360 - }, - { - "epoch": 0.68, - "learning_rate": 1.6223663054510196e-05, - "loss": 2.1966, - "step": 387370 - }, - { - "epoch": 0.68, - "learning_rate": 1.6222791114583373e-05, - "loss": 2.4492, - "step": 387380 - }, - { - "epoch": 0.68, - "learning_rate": 1.6221919174656544e-05, - "loss": 2.3403, - "step": 387390 - }, - { - "epoch": 0.68, - "learning_rate": 1.6221047234729717e-05, - "loss": 2.2344, - "step": 387400 - }, - { - "epoch": 0.68, - "learning_rate": 1.6220175294802888e-05, - "loss": 2.3281, - "step": 387410 - }, - { - "epoch": 0.68, - "learning_rate": 1.6219303354876065e-05, - "loss": 2.3207, - "step": 387420 - }, - { - "epoch": 0.68, - "learning_rate": 1.6218431414949235e-05, - "loss": 2.4075, - "step": 387430 - }, - { - "epoch": 0.68, - "learning_rate": 1.621755947502241e-05, - "loss": 2.3208, - "step": 387440 - }, - { - "epoch": 0.68, - "learning_rate": 1.6216687535095583e-05, - "loss": 2.2137, - "step": 387450 - }, - { - "epoch": 0.68, - "learning_rate": 1.6215815595168757e-05, - "loss": 2.1981, - "step": 387460 - }, - { - "epoch": 0.68, - "learning_rate": 1.621494365524193e-05, - "loss": 2.2527, - "step": 387470 - }, - { - "epoch": 0.68, - "learning_rate": 1.62140717153151e-05, - "loss": 2.3457, - "step": 387480 - }, - { - "epoch": 0.68, - "learning_rate": 1.6213199775388278e-05, - "loss": 2.2895, - "step": 387490 - }, - { - "epoch": 0.68, - "learning_rate": 1.621232783546145e-05, - "loss": 2.3069, - "step": 387500 - }, - { - "epoch": 0.68, - "learning_rate": 1.6211455895534622e-05, - "loss": 2.4264, - "step": 387510 - }, - { - "epoch": 0.68, - "learning_rate": 1.6210583955607796e-05, - "loss": 2.2451, - "step": 387520 - }, - { - "epoch": 0.68, - "learning_rate": 1.620971201568097e-05, - "loss": 2.2731, - "step": 387530 - }, - { - "epoch": 0.68, - "learning_rate": 1.6208840075754143e-05, - "loss": 2.2984, - "step": 387540 - }, - { - "epoch": 0.68, - "learning_rate": 1.6207968135827314e-05, - "loss": 2.3826, - "step": 387550 - }, - { - "epoch": 0.68, - "learning_rate": 1.6207096195900488e-05, - "loss": 2.1888, - "step": 387560 - }, - { - "epoch": 0.68, - "learning_rate": 1.620622425597366e-05, - "loss": 2.3541, - "step": 387570 - }, - { - "epoch": 0.68, - "learning_rate": 1.6205352316046835e-05, - "loss": 2.2529, - "step": 387580 - }, - { - "epoch": 0.68, - "learning_rate": 1.6204480376120006e-05, - "loss": 2.3685, - "step": 387590 - }, - { - "epoch": 0.68, - "learning_rate": 1.620360843619318e-05, - "loss": 2.2792, - "step": 387600 - }, - { - "epoch": 0.68, - "learning_rate": 1.6202736496266353e-05, - "loss": 2.322, - "step": 387610 - }, - { - "epoch": 0.68, - "learning_rate": 1.6201864556339527e-05, - "loss": 2.2865, - "step": 387620 - }, - { - "epoch": 0.68, - "learning_rate": 1.62009926164127e-05, - "loss": 2.3068, - "step": 387630 - }, - { - "epoch": 0.68, - "learning_rate": 1.6200120676485874e-05, - "loss": 2.3107, - "step": 387640 - }, - { - "epoch": 0.68, - "learning_rate": 1.6199248736559048e-05, - "loss": 2.2491, - "step": 387650 - }, - { - "epoch": 0.68, - "learning_rate": 1.619837679663222e-05, - "loss": 2.3052, - "step": 387660 - }, - { - "epoch": 0.68, - "learning_rate": 1.6197504856705392e-05, - "loss": 2.1886, - "step": 387670 - }, - { - "epoch": 0.68, - "learning_rate": 1.6196632916778566e-05, - "loss": 2.3736, - "step": 387680 - }, - { - "epoch": 0.68, - "learning_rate": 1.619576097685174e-05, - "loss": 2.2945, - "step": 387690 - }, - { - "epoch": 0.68, - "learning_rate": 1.6194889036924914e-05, - "loss": 2.29, - "step": 387700 - }, - { - "epoch": 0.68, - "learning_rate": 1.6194017096998084e-05, - "loss": 2.2418, - "step": 387710 - }, - { - "epoch": 0.68, - "learning_rate": 1.619314515707126e-05, - "loss": 2.2644, - "step": 387720 - }, - { - "epoch": 0.68, - "learning_rate": 1.619227321714443e-05, - "loss": 2.2217, - "step": 387730 - }, - { - "epoch": 0.68, - "learning_rate": 1.6191401277217605e-05, - "loss": 2.439, - "step": 387740 - }, - { - "epoch": 0.68, - "learning_rate": 1.619052933729078e-05, - "loss": 2.2994, - "step": 387750 - }, - { - "epoch": 0.68, - "learning_rate": 1.6189657397363953e-05, - "loss": 2.3447, - "step": 387760 - }, - { - "epoch": 0.68, - "learning_rate": 1.6188785457437127e-05, - "loss": 2.3121, - "step": 387770 - }, - { - "epoch": 0.68, - "learning_rate": 1.6187913517510297e-05, - "loss": 2.3786, - "step": 387780 - }, - { - "epoch": 0.68, - "learning_rate": 1.6187041577583474e-05, - "loss": 2.3283, - "step": 387790 - }, - { - "epoch": 0.68, - "learning_rate": 1.6186169637656645e-05, - "loss": 2.234, - "step": 387800 - }, - { - "epoch": 0.68, - "learning_rate": 1.6185297697729818e-05, - "loss": 2.273, - "step": 387810 - }, - { - "epoch": 0.68, - "learning_rate": 1.618442575780299e-05, - "loss": 2.3731, - "step": 387820 - }, - { - "epoch": 0.68, - "learning_rate": 1.6183553817876166e-05, - "loss": 2.2657, - "step": 387830 - }, - { - "epoch": 0.68, - "learning_rate": 1.6182681877949336e-05, - "loss": 2.301, - "step": 387840 - }, - { - "epoch": 0.68, - "learning_rate": 1.618180993802251e-05, - "loss": 2.3414, - "step": 387850 - }, - { - "epoch": 0.68, - "learning_rate": 1.6180937998095684e-05, - "loss": 2.3473, - "step": 387860 - }, - { - "epoch": 0.68, - "learning_rate": 1.6180066058168858e-05, - "loss": 2.2701, - "step": 387870 - }, - { - "epoch": 0.68, - "learning_rate": 1.617919411824203e-05, - "loss": 2.2662, - "step": 387880 - }, - { - "epoch": 0.68, - "learning_rate": 1.61783221783152e-05, - "loss": 2.2227, - "step": 387890 - }, - { - "epoch": 0.68, - "learning_rate": 1.617745023838838e-05, - "loss": 2.3756, - "step": 387900 - }, - { - "epoch": 0.68, - "learning_rate": 1.617657829846155e-05, - "loss": 2.2146, - "step": 387910 - }, - { - "epoch": 0.68, - "learning_rate": 1.6175706358534723e-05, - "loss": 2.1405, - "step": 387920 - }, - { - "epoch": 0.68, - "learning_rate": 1.6174834418607897e-05, - "loss": 2.2591, - "step": 387930 - }, - { - "epoch": 0.68, - "learning_rate": 1.617396247868107e-05, - "loss": 2.3837, - "step": 387940 - }, - { - "epoch": 0.68, - "learning_rate": 1.6173090538754244e-05, - "loss": 2.3438, - "step": 387950 - }, - { - "epoch": 0.68, - "learning_rate": 1.6172218598827415e-05, - "loss": 2.1956, - "step": 387960 - }, - { - "epoch": 0.68, - "learning_rate": 1.617134665890059e-05, - "loss": 2.3103, - "step": 387970 - }, - { - "epoch": 0.68, - "learning_rate": 1.6170474718973762e-05, - "loss": 2.2559, - "step": 387980 - }, - { - "epoch": 0.68, - "learning_rate": 1.6169602779046936e-05, - "loss": 2.318, - "step": 387990 - }, - { - "epoch": 0.68, - "learning_rate": 1.616873083912011e-05, - "loss": 2.2611, - "step": 388000 - }, - { - "epoch": 0.68, - "learning_rate": 1.6167858899193284e-05, - "loss": 2.3522, - "step": 388010 - }, - { - "epoch": 0.68, - "learning_rate": 1.6166986959266457e-05, - "loss": 2.3061, - "step": 388020 - }, - { - "epoch": 0.68, - "learning_rate": 1.6166115019339628e-05, - "loss": 2.301, - "step": 388030 - }, - { - "epoch": 0.68, - "learning_rate": 1.61652430794128e-05, - "loss": 2.3692, - "step": 388040 - }, - { - "epoch": 0.68, - "learning_rate": 1.6164371139485975e-05, - "loss": 2.2659, - "step": 388050 - }, - { - "epoch": 0.68, - "learning_rate": 1.616349919955915e-05, - "loss": 2.2612, - "step": 388060 - }, - { - "epoch": 0.68, - "learning_rate": 1.616262725963232e-05, - "loss": 2.3319, - "step": 388070 - }, - { - "epoch": 0.68, - "learning_rate": 1.6161755319705493e-05, - "loss": 2.1819, - "step": 388080 - }, - { - "epoch": 0.68, - "learning_rate": 1.6160883379778667e-05, - "loss": 2.3007, - "step": 388090 - }, - { - "epoch": 0.68, - "learning_rate": 1.616001143985184e-05, - "loss": 2.1902, - "step": 388100 - }, - { - "epoch": 0.68, - "learning_rate": 1.6159139499925014e-05, - "loss": 2.3051, - "step": 388110 - }, - { - "epoch": 0.68, - "learning_rate": 1.6158267559998185e-05, - "loss": 2.4543, - "step": 388120 - }, - { - "epoch": 0.68, - "learning_rate": 1.6157395620071362e-05, - "loss": 2.4128, - "step": 388130 - }, - { - "epoch": 0.68, - "learning_rate": 1.6156523680144532e-05, - "loss": 2.2664, - "step": 388140 - }, - { - "epoch": 0.68, - "learning_rate": 1.6155651740217706e-05, - "loss": 2.3513, - "step": 388150 - }, - { - "epoch": 0.68, - "learning_rate": 1.615477980029088e-05, - "loss": 2.3014, - "step": 388160 - }, - { - "epoch": 0.68, - "learning_rate": 1.6153907860364054e-05, - "loss": 2.2532, - "step": 388170 - }, - { - "epoch": 0.68, - "learning_rate": 1.6153035920437227e-05, - "loss": 2.237, - "step": 388180 - }, - { - "epoch": 0.68, - "learning_rate": 1.6152163980510398e-05, - "loss": 2.1962, - "step": 388190 - }, - { - "epoch": 0.68, - "learning_rate": 1.6151292040583575e-05, - "loss": 2.3498, - "step": 388200 - }, - { - "epoch": 0.68, - "learning_rate": 1.6150420100656745e-05, - "loss": 2.3133, - "step": 388210 - }, - { - "epoch": 0.68, - "learning_rate": 1.614954816072992e-05, - "loss": 2.2698, - "step": 388220 - }, - { - "epoch": 0.68, - "learning_rate": 1.614867622080309e-05, - "loss": 2.3502, - "step": 388230 - }, - { - "epoch": 0.68, - "learning_rate": 1.6147804280876267e-05, - "loss": 2.3797, - "step": 388240 - }, - { - "epoch": 0.68, - "learning_rate": 1.614693234094944e-05, - "loss": 2.3822, - "step": 388250 - }, - { - "epoch": 0.68, - "learning_rate": 1.614606040102261e-05, - "loss": 2.3534, - "step": 388260 - }, - { - "epoch": 0.68, - "learning_rate": 1.6145188461095785e-05, - "loss": 2.2668, - "step": 388270 - }, - { - "epoch": 0.68, - "learning_rate": 1.614431652116896e-05, - "loss": 2.305, - "step": 388280 - }, - { - "epoch": 0.68, - "learning_rate": 1.6143444581242132e-05, - "loss": 2.1329, - "step": 388290 - }, - { - "epoch": 0.68, - "learning_rate": 1.6142572641315303e-05, - "loss": 2.2608, - "step": 388300 - }, - { - "epoch": 0.68, - "learning_rate": 1.614170070138848e-05, - "loss": 2.2579, - "step": 388310 - }, - { - "epoch": 0.68, - "learning_rate": 1.614082876146165e-05, - "loss": 2.3078, - "step": 388320 - }, - { - "epoch": 0.68, - "learning_rate": 1.6139956821534824e-05, - "loss": 2.3155, - "step": 388330 - }, - { - "epoch": 0.68, - "learning_rate": 1.6139084881607998e-05, - "loss": 2.2566, - "step": 388340 - }, - { - "epoch": 0.68, - "learning_rate": 1.613821294168117e-05, - "loss": 2.3231, - "step": 388350 - }, - { - "epoch": 0.68, - "learning_rate": 1.6137341001754345e-05, - "loss": 2.3343, - "step": 388360 - }, - { - "epoch": 0.68, - "learning_rate": 1.6136469061827516e-05, - "loss": 2.2462, - "step": 388370 - }, - { - "epoch": 0.68, - "learning_rate": 1.613559712190069e-05, - "loss": 2.3064, - "step": 388380 - }, - { - "epoch": 0.68, - "learning_rate": 1.6134725181973863e-05, - "loss": 2.2149, - "step": 388390 - }, - { - "epoch": 0.68, - "learning_rate": 1.6133853242047037e-05, - "loss": 2.1952, - "step": 388400 - }, - { - "epoch": 0.68, - "learning_rate": 1.613298130212021e-05, - "loss": 2.4144, - "step": 388410 - }, - { - "epoch": 0.68, - "learning_rate": 1.6132109362193384e-05, - "loss": 2.2785, - "step": 388420 - }, - { - "epoch": 0.68, - "learning_rate": 1.6131237422266558e-05, - "loss": 2.3872, - "step": 388430 - }, - { - "epoch": 0.68, - "learning_rate": 1.613036548233973e-05, - "loss": 2.3137, - "step": 388440 - }, - { - "epoch": 0.68, - "learning_rate": 1.6129493542412902e-05, - "loss": 2.231, - "step": 388450 - }, - { - "epoch": 0.68, - "learning_rate": 1.6128621602486076e-05, - "loss": 2.3571, - "step": 388460 - }, - { - "epoch": 0.68, - "learning_rate": 1.612774966255925e-05, - "loss": 2.3547, - "step": 388470 - }, - { - "epoch": 0.68, - "learning_rate": 1.6126877722632424e-05, - "loss": 2.3144, - "step": 388480 - }, - { - "epoch": 0.68, - "learning_rate": 1.6126005782705594e-05, - "loss": 2.276, - "step": 388490 - }, - { - "epoch": 0.68, - "learning_rate": 1.612513384277877e-05, - "loss": 2.2616, - "step": 388500 - }, - { - "epoch": 0.68, - "learning_rate": 1.612426190285194e-05, - "loss": 2.2892, - "step": 388510 - }, - { - "epoch": 0.68, - "learning_rate": 1.6123389962925115e-05, - "loss": 2.3387, - "step": 388520 - }, - { - "epoch": 0.68, - "learning_rate": 1.6122518022998286e-05, - "loss": 2.328, - "step": 388530 - }, - { - "epoch": 0.68, - "learning_rate": 1.6121646083071463e-05, - "loss": 2.2679, - "step": 388540 - }, - { - "epoch": 0.68, - "learning_rate": 1.6120774143144633e-05, - "loss": 2.3201, - "step": 388550 - }, - { - "epoch": 0.68, - "learning_rate": 1.6119902203217807e-05, - "loss": 2.3339, - "step": 388560 - }, - { - "epoch": 0.68, - "learning_rate": 1.611903026329098e-05, - "loss": 2.2255, - "step": 388570 - }, - { - "epoch": 0.68, - "learning_rate": 1.6118158323364155e-05, - "loss": 2.2482, - "step": 388580 - }, - { - "epoch": 0.68, - "learning_rate": 1.6117286383437328e-05, - "loss": 2.2781, - "step": 388590 - }, - { - "epoch": 0.68, - "learning_rate": 1.61164144435105e-05, - "loss": 2.3049, - "step": 388600 - }, - { - "epoch": 0.68, - "learning_rate": 1.6115542503583676e-05, - "loss": 2.2597, - "step": 388610 - }, - { - "epoch": 0.68, - "learning_rate": 1.6114670563656846e-05, - "loss": 2.402, - "step": 388620 - }, - { - "epoch": 0.68, - "learning_rate": 1.611379862373002e-05, - "loss": 2.2346, - "step": 388630 - }, - { - "epoch": 0.68, - "learning_rate": 1.6112926683803194e-05, - "loss": 2.3401, - "step": 388640 - }, - { - "epoch": 0.68, - "learning_rate": 1.6112054743876368e-05, - "loss": 2.3761, - "step": 388650 - }, - { - "epoch": 0.68, - "learning_rate": 1.611118280394954e-05, - "loss": 2.3552, - "step": 388660 - }, - { - "epoch": 0.68, - "learning_rate": 1.611031086402271e-05, - "loss": 2.2666, - "step": 388670 - }, - { - "epoch": 0.68, - "learning_rate": 1.610943892409589e-05, - "loss": 2.2, - "step": 388680 - }, - { - "epoch": 0.68, - "learning_rate": 1.610856698416906e-05, - "loss": 2.2532, - "step": 388690 - }, - { - "epoch": 0.68, - "learning_rate": 1.6107695044242233e-05, - "loss": 2.3067, - "step": 388700 - }, - { - "epoch": 0.68, - "learning_rate": 1.6106823104315403e-05, - "loss": 2.3247, - "step": 388710 - }, - { - "epoch": 0.68, - "learning_rate": 1.610595116438858e-05, - "loss": 2.3331, - "step": 388720 - }, - { - "epoch": 0.68, - "learning_rate": 1.6105079224461754e-05, - "loss": 2.3182, - "step": 388730 - }, - { - "epoch": 0.68, - "learning_rate": 1.6104207284534925e-05, - "loss": 2.2404, - "step": 388740 - }, - { - "epoch": 0.68, - "learning_rate": 1.61033353446081e-05, - "loss": 2.2583, - "step": 388750 - }, - { - "epoch": 0.68, - "learning_rate": 1.6102463404681272e-05, - "loss": 2.3171, - "step": 388760 - }, - { - "epoch": 0.68, - "learning_rate": 1.6101591464754446e-05, - "loss": 2.2435, - "step": 388770 - }, - { - "epoch": 0.68, - "learning_rate": 1.6100719524827616e-05, - "loss": 2.3029, - "step": 388780 - }, - { - "epoch": 0.68, - "learning_rate": 1.609984758490079e-05, - "loss": 2.3802, - "step": 388790 - }, - { - "epoch": 0.68, - "learning_rate": 1.6098975644973964e-05, - "loss": 2.451, - "step": 388800 - }, - { - "epoch": 0.68, - "learning_rate": 1.6098103705047138e-05, - "loss": 2.1918, - "step": 388810 - }, - { - "epoch": 0.68, - "learning_rate": 1.609723176512031e-05, - "loss": 2.349, - "step": 388820 - }, - { - "epoch": 0.68, - "learning_rate": 1.6096359825193485e-05, - "loss": 2.3639, - "step": 388830 - }, - { - "epoch": 0.68, - "learning_rate": 1.609548788526666e-05, - "loss": 2.3476, - "step": 388840 - }, - { - "epoch": 0.68, - "learning_rate": 1.609461594533983e-05, - "loss": 2.2742, - "step": 388850 - }, - { - "epoch": 0.68, - "learning_rate": 1.6093744005413003e-05, - "loss": 2.3243, - "step": 388860 - }, - { - "epoch": 0.68, - "learning_rate": 1.6092872065486177e-05, - "loss": 2.3389, - "step": 388870 - }, - { - "epoch": 0.68, - "learning_rate": 1.609200012555935e-05, - "loss": 2.3322, - "step": 388880 - }, - { - "epoch": 0.68, - "learning_rate": 1.6091128185632524e-05, - "loss": 2.2602, - "step": 388890 - }, - { - "epoch": 0.68, - "learning_rate": 1.6090256245705695e-05, - "loss": 2.331, - "step": 388900 - }, - { - "epoch": 0.68, - "learning_rate": 1.6089384305778872e-05, - "loss": 2.2849, - "step": 388910 - }, - { - "epoch": 0.68, - "learning_rate": 1.6088512365852042e-05, - "loss": 2.2565, - "step": 388920 - }, - { - "epoch": 0.68, - "learning_rate": 1.6087640425925216e-05, - "loss": 2.3292, - "step": 388930 - }, - { - "epoch": 0.68, - "learning_rate": 1.6086768485998387e-05, - "loss": 2.3168, - "step": 388940 - }, - { - "epoch": 0.68, - "learning_rate": 1.6085896546071564e-05, - "loss": 2.3152, - "step": 388950 - }, - { - "epoch": 0.68, - "learning_rate": 1.6085024606144734e-05, - "loss": 2.4024, - "step": 388960 - }, - { - "epoch": 0.68, - "learning_rate": 1.6084152666217908e-05, - "loss": 2.3341, - "step": 388970 - }, - { - "epoch": 0.68, - "learning_rate": 1.6083280726291085e-05, - "loss": 2.3144, - "step": 388980 - }, - { - "epoch": 0.68, - "learning_rate": 1.6082408786364255e-05, - "loss": 2.3894, - "step": 388990 - }, - { - "epoch": 0.68, - "learning_rate": 1.608153684643743e-05, - "loss": 2.2611, - "step": 389000 - }, - { - "epoch": 0.68, - "learning_rate": 1.60806649065106e-05, - "loss": 2.3188, - "step": 389010 - }, - { - "epoch": 0.68, - "learning_rate": 1.6079792966583777e-05, - "loss": 2.3349, - "step": 389020 - }, - { - "epoch": 0.68, - "learning_rate": 1.6078921026656947e-05, - "loss": 2.2778, - "step": 389030 - }, - { - "epoch": 0.68, - "learning_rate": 1.607804908673012e-05, - "loss": 2.2993, - "step": 389040 - }, - { - "epoch": 0.68, - "learning_rate": 1.6077177146803295e-05, - "loss": 2.344, - "step": 389050 - }, - { - "epoch": 0.68, - "learning_rate": 1.607630520687647e-05, - "loss": 2.3117, - "step": 389060 - }, - { - "epoch": 0.68, - "learning_rate": 1.6075433266949642e-05, - "loss": 2.2752, - "step": 389070 - }, - { - "epoch": 0.68, - "learning_rate": 1.6074561327022813e-05, - "loss": 2.3101, - "step": 389080 - }, - { - "epoch": 0.68, - "learning_rate": 1.607368938709599e-05, - "loss": 2.2775, - "step": 389090 - }, - { - "epoch": 0.68, - "learning_rate": 1.607281744716916e-05, - "loss": 2.3851, - "step": 389100 - }, - { - "epoch": 0.68, - "learning_rate": 1.6071945507242334e-05, - "loss": 2.2854, - "step": 389110 - }, - { - "epoch": 0.68, - "learning_rate": 1.6071073567315508e-05, - "loss": 2.3641, - "step": 389120 - }, - { - "epoch": 0.68, - "learning_rate": 1.607020162738868e-05, - "loss": 2.2385, - "step": 389130 - }, - { - "epoch": 0.68, - "learning_rate": 1.6069329687461855e-05, - "loss": 2.3743, - "step": 389140 - }, - { - "epoch": 0.68, - "learning_rate": 1.6068457747535026e-05, - "loss": 2.2683, - "step": 389150 - }, - { - "epoch": 0.68, - "learning_rate": 1.60675858076082e-05, - "loss": 2.2131, - "step": 389160 - }, - { - "epoch": 0.68, - "learning_rate": 1.6066713867681373e-05, - "loss": 2.4416, - "step": 389170 - }, - { - "epoch": 0.68, - "learning_rate": 1.6065841927754547e-05, - "loss": 2.3581, - "step": 389180 - }, - { - "epoch": 0.68, - "learning_rate": 1.6064969987827717e-05, - "loss": 2.2665, - "step": 389190 - }, - { - "epoch": 0.68, - "learning_rate": 1.606409804790089e-05, - "loss": 2.2276, - "step": 389200 - }, - { - "epoch": 0.68, - "learning_rate": 1.6063226107974068e-05, - "loss": 2.2475, - "step": 389210 - }, - { - "epoch": 0.68, - "learning_rate": 1.606235416804724e-05, - "loss": 2.2552, - "step": 389220 - }, - { - "epoch": 0.68, - "learning_rate": 1.6061482228120412e-05, - "loss": 2.2502, - "step": 389230 - }, - { - "epoch": 0.68, - "learning_rate": 1.6060610288193586e-05, - "loss": 2.3266, - "step": 389240 - }, - { - "epoch": 0.68, - "learning_rate": 1.605973834826676e-05, - "loss": 2.3435, - "step": 389250 - }, - { - "epoch": 0.68, - "learning_rate": 1.605886640833993e-05, - "loss": 2.362, - "step": 389260 - }, - { - "epoch": 0.68, - "learning_rate": 1.6057994468413104e-05, - "loss": 2.2992, - "step": 389270 - }, - { - "epoch": 0.68, - "learning_rate": 1.6057122528486278e-05, - "loss": 2.2862, - "step": 389280 - }, - { - "epoch": 0.68, - "learning_rate": 1.605625058855945e-05, - "loss": 2.1968, - "step": 389290 - }, - { - "epoch": 0.68, - "learning_rate": 1.6055378648632625e-05, - "loss": 2.3302, - "step": 389300 - }, - { - "epoch": 0.68, - "learning_rate": 1.6054506708705796e-05, - "loss": 2.246, - "step": 389310 - }, - { - "epoch": 0.68, - "learning_rate": 1.6053634768778973e-05, - "loss": 2.2914, - "step": 389320 - }, - { - "epoch": 0.68, - "learning_rate": 1.6052762828852143e-05, - "loss": 2.3186, - "step": 389330 - }, - { - "epoch": 0.68, - "learning_rate": 1.6051890888925317e-05, - "loss": 2.3414, - "step": 389340 - }, - { - "epoch": 0.68, - "learning_rate": 1.605101894899849e-05, - "loss": 2.3009, - "step": 389350 - }, - { - "epoch": 0.68, - "learning_rate": 1.6050147009071665e-05, - "loss": 2.3298, - "step": 389360 - }, - { - "epoch": 0.68, - "learning_rate": 1.6049275069144838e-05, - "loss": 2.3557, - "step": 389370 - }, - { - "epoch": 0.68, - "learning_rate": 1.604840312921801e-05, - "loss": 2.2774, - "step": 389380 - }, - { - "epoch": 0.68, - "learning_rate": 1.6047531189291186e-05, - "loss": 2.2147, - "step": 389390 - }, - { - "epoch": 0.68, - "learning_rate": 1.6046659249364356e-05, - "loss": 2.37, - "step": 389400 - }, - { - "epoch": 0.68, - "learning_rate": 1.604578730943753e-05, - "loss": 2.4498, - "step": 389410 - }, - { - "epoch": 0.68, - "learning_rate": 1.60449153695107e-05, - "loss": 2.2915, - "step": 389420 - }, - { - "epoch": 0.68, - "learning_rate": 1.6044043429583878e-05, - "loss": 2.2791, - "step": 389430 - }, - { - "epoch": 0.68, - "learning_rate": 1.6043171489657048e-05, - "loss": 2.1935, - "step": 389440 - }, - { - "epoch": 0.68, - "learning_rate": 1.604229954973022e-05, - "loss": 2.4071, - "step": 389450 - }, - { - "epoch": 0.68, - "learning_rate": 1.6041427609803395e-05, - "loss": 2.2599, - "step": 389460 - }, - { - "epoch": 0.68, - "learning_rate": 1.604055566987657e-05, - "loss": 2.2515, - "step": 389470 - }, - { - "epoch": 0.68, - "learning_rate": 1.6039683729949743e-05, - "loss": 2.3087, - "step": 389480 - }, - { - "epoch": 0.68, - "learning_rate": 1.6038811790022913e-05, - "loss": 2.2876, - "step": 389490 - }, - { - "epoch": 0.68, - "learning_rate": 1.603793985009609e-05, - "loss": 2.3833, - "step": 389500 - }, - { - "epoch": 0.68, - "learning_rate": 1.603706791016926e-05, - "loss": 2.3058, - "step": 389510 - }, - { - "epoch": 0.68, - "learning_rate": 1.6036195970242435e-05, - "loss": 2.37, - "step": 389520 - }, - { - "epoch": 0.68, - "learning_rate": 1.603532403031561e-05, - "loss": 2.3089, - "step": 389530 - }, - { - "epoch": 0.68, - "learning_rate": 1.6034452090388782e-05, - "loss": 2.3132, - "step": 389540 - }, - { - "epoch": 0.68, - "learning_rate": 1.6033580150461956e-05, - "loss": 2.317, - "step": 389550 - }, - { - "epoch": 0.68, - "learning_rate": 1.6032708210535126e-05, - "loss": 2.3946, - "step": 389560 - }, - { - "epoch": 0.68, - "learning_rate": 1.60318362706083e-05, - "loss": 2.4033, - "step": 389570 - }, - { - "epoch": 0.68, - "learning_rate": 1.6030964330681474e-05, - "loss": 2.402, - "step": 389580 - }, - { - "epoch": 0.68, - "learning_rate": 1.6030092390754648e-05, - "loss": 2.2994, - "step": 389590 - }, - { - "epoch": 0.68, - "learning_rate": 1.602922045082782e-05, - "loss": 2.292, - "step": 389600 - }, - { - "epoch": 0.68, - "learning_rate": 1.6028348510900995e-05, - "loss": 2.4072, - "step": 389610 - }, - { - "epoch": 0.68, - "learning_rate": 1.602747657097417e-05, - "loss": 2.2963, - "step": 389620 - }, - { - "epoch": 0.68, - "learning_rate": 1.602660463104734e-05, - "loss": 2.3369, - "step": 389630 - }, - { - "epoch": 0.68, - "learning_rate": 1.6025732691120513e-05, - "loss": 2.3152, - "step": 389640 - }, - { - "epoch": 0.68, - "learning_rate": 1.6024860751193687e-05, - "loss": 2.3498, - "step": 389650 - }, - { - "epoch": 0.68, - "learning_rate": 1.602398881126686e-05, - "loss": 2.3316, - "step": 389660 - }, - { - "epoch": 0.68, - "learning_rate": 1.602311687134003e-05, - "loss": 2.2151, - "step": 389670 - }, - { - "epoch": 0.68, - "learning_rate": 1.6022244931413205e-05, - "loss": 2.2316, - "step": 389680 - }, - { - "epoch": 0.68, - "learning_rate": 1.602137299148638e-05, - "loss": 2.4338, - "step": 389690 - }, - { - "epoch": 0.68, - "learning_rate": 1.6020501051559552e-05, - "loss": 2.2665, - "step": 389700 - }, - { - "epoch": 0.68, - "learning_rate": 1.6019629111632726e-05, - "loss": 2.3353, - "step": 389710 - }, - { - "epoch": 0.68, - "learning_rate": 1.6018757171705897e-05, - "loss": 2.3065, - "step": 389720 - }, - { - "epoch": 0.68, - "learning_rate": 1.6017885231779074e-05, - "loss": 2.2952, - "step": 389730 - }, - { - "epoch": 0.68, - "learning_rate": 1.6017013291852244e-05, - "loss": 2.3506, - "step": 389740 - }, - { - "epoch": 0.68, - "learning_rate": 1.6016141351925418e-05, - "loss": 2.3162, - "step": 389750 - }, - { - "epoch": 0.68, - "learning_rate": 1.601526941199859e-05, - "loss": 2.3108, - "step": 389760 - }, - { - "epoch": 0.68, - "learning_rate": 1.6014397472071765e-05, - "loss": 2.3401, - "step": 389770 - }, - { - "epoch": 0.68, - "learning_rate": 1.601352553214494e-05, - "loss": 2.3904, - "step": 389780 - }, - { - "epoch": 0.68, - "learning_rate": 1.601265359221811e-05, - "loss": 2.3693, - "step": 389790 - }, - { - "epoch": 0.68, - "learning_rate": 1.6011781652291287e-05, - "loss": 2.2605, - "step": 389800 - }, - { - "epoch": 0.68, - "learning_rate": 1.6010909712364457e-05, - "loss": 2.3071, - "step": 389810 - }, - { - "epoch": 0.68, - "learning_rate": 1.601003777243763e-05, - "loss": 2.2686, - "step": 389820 - }, - { - "epoch": 0.68, - "learning_rate": 1.6009165832510805e-05, - "loss": 2.3455, - "step": 389830 - }, - { - "epoch": 0.68, - "learning_rate": 1.600829389258398e-05, - "loss": 2.3946, - "step": 389840 - }, - { - "epoch": 0.68, - "learning_rate": 1.6007421952657152e-05, - "loss": 2.3746, - "step": 389850 - }, - { - "epoch": 0.68, - "learning_rate": 1.6006550012730323e-05, - "loss": 2.2865, - "step": 389860 - }, - { - "epoch": 0.68, - "learning_rate": 1.6005678072803496e-05, - "loss": 2.2246, - "step": 389870 - }, - { - "epoch": 0.68, - "learning_rate": 1.600480613287667e-05, - "loss": 2.3543, - "step": 389880 - }, - { - "epoch": 0.68, - "learning_rate": 1.6003934192949844e-05, - "loss": 2.4073, - "step": 389890 - }, - { - "epoch": 0.68, - "learning_rate": 1.6003062253023014e-05, - "loss": 2.3762, - "step": 389900 - }, - { - "epoch": 0.68, - "learning_rate": 1.600219031309619e-05, - "loss": 2.24, - "step": 389910 - }, - { - "epoch": 0.68, - "learning_rate": 1.6001318373169362e-05, - "loss": 2.339, - "step": 389920 - }, - { - "epoch": 0.68, - "learning_rate": 1.6000446433242536e-05, - "loss": 2.3584, - "step": 389930 - }, - { - "epoch": 0.68, - "learning_rate": 1.599957449331571e-05, - "loss": 2.2874, - "step": 389940 - }, - { - "epoch": 0.68, - "learning_rate": 1.5998702553388883e-05, - "loss": 2.3044, - "step": 389950 - }, - { - "epoch": 0.68, - "learning_rate": 1.5997830613462057e-05, - "loss": 2.3621, - "step": 389960 - }, - { - "epoch": 0.68, - "learning_rate": 1.5996958673535227e-05, - "loss": 2.2493, - "step": 389970 - }, - { - "epoch": 0.68, - "learning_rate": 1.59960867336084e-05, - "loss": 2.2918, - "step": 389980 - }, - { - "epoch": 0.68, - "learning_rate": 1.5995214793681575e-05, - "loss": 2.2018, - "step": 389990 - }, - { - "epoch": 0.68, - "learning_rate": 1.599434285375475e-05, - "loss": 2.4768, - "step": 390000 - }, - { - "epoch": 0.68, - "learning_rate": 1.5993470913827922e-05, - "loss": 2.3249, - "step": 390010 - }, - { - "epoch": 0.68, - "learning_rate": 1.5992598973901096e-05, - "loss": 2.2317, - "step": 390020 - }, - { - "epoch": 0.68, - "learning_rate": 1.599172703397427e-05, - "loss": 2.2826, - "step": 390030 - }, - { - "epoch": 0.68, - "learning_rate": 1.599085509404744e-05, - "loss": 2.2686, - "step": 390040 - }, - { - "epoch": 0.68, - "learning_rate": 1.5989983154120614e-05, - "loss": 2.3737, - "step": 390050 - }, - { - "epoch": 0.68, - "learning_rate": 1.5989111214193788e-05, - "loss": 2.1848, - "step": 390060 - }, - { - "epoch": 0.68, - "learning_rate": 1.598823927426696e-05, - "loss": 2.3313, - "step": 390070 - }, - { - "epoch": 0.68, - "learning_rate": 1.5987367334340135e-05, - "loss": 2.2864, - "step": 390080 - }, - { - "epoch": 0.68, - "learning_rate": 1.5986495394413306e-05, - "loss": 2.3846, - "step": 390090 - }, - { - "epoch": 0.68, - "learning_rate": 1.5985623454486483e-05, - "loss": 2.3401, - "step": 390100 - }, - { - "epoch": 0.68, - "learning_rate": 1.5984751514559653e-05, - "loss": 2.3837, - "step": 390110 - }, - { - "epoch": 0.68, - "learning_rate": 1.5983879574632827e-05, - "loss": 2.3641, - "step": 390120 - }, - { - "epoch": 0.68, - "learning_rate": 1.5983007634705997e-05, - "loss": 2.2847, - "step": 390130 - }, - { - "epoch": 0.68, - "learning_rate": 1.5982135694779175e-05, - "loss": 2.3647, - "step": 390140 - }, - { - "epoch": 0.68, - "learning_rate": 1.5981263754852345e-05, - "loss": 2.3037, - "step": 390150 - }, - { - "epoch": 0.68, - "learning_rate": 1.598039181492552e-05, - "loss": 2.34, - "step": 390160 - }, - { - "epoch": 0.68, - "learning_rate": 1.5979519874998692e-05, - "loss": 2.407, - "step": 390170 - }, - { - "epoch": 0.68, - "learning_rate": 1.5978647935071866e-05, - "loss": 2.2737, - "step": 390180 - }, - { - "epoch": 0.68, - "learning_rate": 1.597777599514504e-05, - "loss": 2.3041, - "step": 390190 - }, - { - "epoch": 0.68, - "learning_rate": 1.597690405521821e-05, - "loss": 2.4365, - "step": 390200 - }, - { - "epoch": 0.68, - "learning_rate": 1.5976032115291388e-05, - "loss": 2.3545, - "step": 390210 - }, - { - "epoch": 0.68, - "learning_rate": 1.5975160175364558e-05, - "loss": 2.3361, - "step": 390220 - }, - { - "epoch": 0.68, - "learning_rate": 1.597428823543773e-05, - "loss": 2.308, - "step": 390230 - }, - { - "epoch": 0.68, - "learning_rate": 1.5973416295510905e-05, - "loss": 2.3629, - "step": 390240 - }, - { - "epoch": 0.68, - "learning_rate": 1.597254435558408e-05, - "loss": 2.2241, - "step": 390250 - }, - { - "epoch": 0.68, - "learning_rate": 1.5971672415657253e-05, - "loss": 2.2521, - "step": 390260 - }, - { - "epoch": 0.68, - "learning_rate": 1.5970800475730423e-05, - "loss": 2.2772, - "step": 390270 - }, - { - "epoch": 0.68, - "learning_rate": 1.59699285358036e-05, - "loss": 2.324, - "step": 390280 - }, - { - "epoch": 0.68, - "learning_rate": 1.596905659587677e-05, - "loss": 2.2756, - "step": 390290 - }, - { - "epoch": 0.68, - "learning_rate": 1.5968184655949945e-05, - "loss": 2.4016, - "step": 390300 - }, - { - "epoch": 0.68, - "learning_rate": 1.5967312716023115e-05, - "loss": 2.3166, - "step": 390310 - }, - { - "epoch": 0.68, - "learning_rate": 1.5966440776096292e-05, - "loss": 2.43, - "step": 390320 - }, - { - "epoch": 0.68, - "learning_rate": 1.5965568836169466e-05, - "loss": 2.3729, - "step": 390330 - }, - { - "epoch": 0.68, - "learning_rate": 1.5964696896242636e-05, - "loss": 2.3252, - "step": 390340 - }, - { - "epoch": 0.68, - "learning_rate": 1.596382495631581e-05, - "loss": 2.244, - "step": 390350 - }, - { - "epoch": 0.68, - "learning_rate": 1.5962953016388984e-05, - "loss": 2.3535, - "step": 390360 - }, - { - "epoch": 0.68, - "learning_rate": 1.5962081076462158e-05, - "loss": 2.2126, - "step": 390370 - }, - { - "epoch": 0.68, - "learning_rate": 1.5961209136535328e-05, - "loss": 2.2382, - "step": 390380 - }, - { - "epoch": 0.68, - "learning_rate": 1.5960337196608502e-05, - "loss": 2.3077, - "step": 390390 - }, - { - "epoch": 0.68, - "learning_rate": 1.5959465256681676e-05, - "loss": 2.2771, - "step": 390400 - }, - { - "epoch": 0.68, - "learning_rate": 1.595859331675485e-05, - "loss": 2.3879, - "step": 390410 - }, - { - "epoch": 0.68, - "learning_rate": 1.5957721376828023e-05, - "loss": 2.3372, - "step": 390420 - }, - { - "epoch": 0.68, - "learning_rate": 1.5956849436901197e-05, - "loss": 2.3069, - "step": 390430 - }, - { - "epoch": 0.68, - "learning_rate": 1.595597749697437e-05, - "loss": 2.2456, - "step": 390440 - }, - { - "epoch": 0.68, - "learning_rate": 1.595510555704754e-05, - "loss": 2.1769, - "step": 390450 - }, - { - "epoch": 0.68, - "learning_rate": 1.5954233617120715e-05, - "loss": 2.2579, - "step": 390460 - }, - { - "epoch": 0.68, - "learning_rate": 1.595336167719389e-05, - "loss": 2.2818, - "step": 390470 - }, - { - "epoch": 0.68, - "learning_rate": 1.5952489737267062e-05, - "loss": 2.3678, - "step": 390480 - }, - { - "epoch": 0.68, - "learning_rate": 1.5951617797340236e-05, - "loss": 2.3031, - "step": 390490 - }, - { - "epoch": 0.68, - "learning_rate": 1.5950745857413407e-05, - "loss": 2.3205, - "step": 390500 - }, - { - "epoch": 0.68, - "learning_rate": 1.5949873917486584e-05, - "loss": 2.3239, - "step": 390510 - }, - { - "epoch": 0.68, - "learning_rate": 1.5949001977559754e-05, - "loss": 2.4075, - "step": 390520 - }, - { - "epoch": 0.68, - "learning_rate": 1.5948130037632928e-05, - "loss": 2.3097, - "step": 390530 - }, - { - "epoch": 0.68, - "learning_rate": 1.59472580977061e-05, - "loss": 2.2551, - "step": 390540 - }, - { - "epoch": 0.68, - "learning_rate": 1.5946386157779275e-05, - "loss": 2.3264, - "step": 390550 - }, - { - "epoch": 0.68, - "learning_rate": 1.594551421785245e-05, - "loss": 2.2655, - "step": 390560 - }, - { - "epoch": 0.68, - "learning_rate": 1.594464227792562e-05, - "loss": 2.2184, - "step": 390570 - }, - { - "epoch": 0.68, - "learning_rate": 1.5943770337998797e-05, - "loss": 2.2413, - "step": 390580 - }, - { - "epoch": 0.68, - "learning_rate": 1.5942898398071967e-05, - "loss": 2.356, - "step": 390590 - }, - { - "epoch": 0.68, - "learning_rate": 1.594202645814514e-05, - "loss": 2.3301, - "step": 390600 - }, - { - "epoch": 0.68, - "learning_rate": 1.594115451821831e-05, - "loss": 2.2759, - "step": 390610 - }, - { - "epoch": 0.68, - "learning_rate": 1.594028257829149e-05, - "loss": 2.2273, - "step": 390620 - }, - { - "epoch": 0.68, - "learning_rate": 1.593941063836466e-05, - "loss": 2.3807, - "step": 390630 - }, - { - "epoch": 0.68, - "learning_rate": 1.5938538698437833e-05, - "loss": 2.3054, - "step": 390640 - }, - { - "epoch": 0.68, - "learning_rate": 1.5937666758511006e-05, - "loss": 2.2265, - "step": 390650 - }, - { - "epoch": 0.68, - "learning_rate": 1.593679481858418e-05, - "loss": 2.2518, - "step": 390660 - }, - { - "epoch": 0.68, - "learning_rate": 1.5935922878657354e-05, - "loss": 2.3048, - "step": 390670 - }, - { - "epoch": 0.68, - "learning_rate": 1.5935050938730524e-05, - "loss": 2.3092, - "step": 390680 - }, - { - "epoch": 0.68, - "learning_rate": 1.59341789988037e-05, - "loss": 2.4397, - "step": 390690 - }, - { - "epoch": 0.68, - "learning_rate": 1.5933307058876872e-05, - "loss": 2.2872, - "step": 390700 - }, - { - "epoch": 0.68, - "learning_rate": 1.5932435118950046e-05, - "loss": 2.3086, - "step": 390710 - }, - { - "epoch": 0.68, - "learning_rate": 1.593156317902322e-05, - "loss": 2.3189, - "step": 390720 - }, - { - "epoch": 0.68, - "learning_rate": 1.5930691239096393e-05, - "loss": 2.3358, - "step": 390730 - }, - { - "epoch": 0.68, - "learning_rate": 1.5929819299169567e-05, - "loss": 2.341, - "step": 390740 - }, - { - "epoch": 0.68, - "learning_rate": 1.5928947359242737e-05, - "loss": 2.3128, - "step": 390750 - }, - { - "epoch": 0.68, - "learning_rate": 1.592807541931591e-05, - "loss": 2.3712, - "step": 390760 - }, - { - "epoch": 0.68, - "learning_rate": 1.5927203479389085e-05, - "loss": 2.3202, - "step": 390770 - }, - { - "epoch": 0.68, - "learning_rate": 1.592633153946226e-05, - "loss": 2.3053, - "step": 390780 - }, - { - "epoch": 0.68, - "learning_rate": 1.592545959953543e-05, - "loss": 2.2493, - "step": 390790 - }, - { - "epoch": 0.68, - "learning_rate": 1.5924587659608603e-05, - "loss": 2.2907, - "step": 390800 - }, - { - "epoch": 0.68, - "learning_rate": 1.592371571968178e-05, - "loss": 2.4087, - "step": 390810 - }, - { - "epoch": 0.68, - "learning_rate": 1.592284377975495e-05, - "loss": 2.29, - "step": 390820 - }, - { - "epoch": 0.68, - "learning_rate": 1.5921971839828124e-05, - "loss": 2.3427, - "step": 390830 - }, - { - "epoch": 0.68, - "learning_rate": 1.5921099899901298e-05, - "loss": 2.3398, - "step": 390840 - }, - { - "epoch": 0.68, - "learning_rate": 1.592022795997447e-05, - "loss": 2.2975, - "step": 390850 - }, - { - "epoch": 0.68, - "learning_rate": 1.5919356020047642e-05, - "loss": 2.4008, - "step": 390860 - }, - { - "epoch": 0.68, - "learning_rate": 1.5918484080120816e-05, - "loss": 2.3011, - "step": 390870 - }, - { - "epoch": 0.68, - "learning_rate": 1.591761214019399e-05, - "loss": 2.2187, - "step": 390880 - }, - { - "epoch": 0.68, - "learning_rate": 1.5916740200267163e-05, - "loss": 2.1479, - "step": 390890 - }, - { - "epoch": 0.68, - "learning_rate": 1.5915868260340337e-05, - "loss": 2.4636, - "step": 390900 - }, - { - "epoch": 0.68, - "learning_rate": 1.5914996320413507e-05, - "loss": 2.2456, - "step": 390910 - }, - { - "epoch": 0.68, - "learning_rate": 1.5914124380486685e-05, - "loss": 2.3569, - "step": 390920 - }, - { - "epoch": 0.68, - "learning_rate": 1.5913252440559855e-05, - "loss": 2.3442, - "step": 390930 - }, - { - "epoch": 0.68, - "learning_rate": 1.591238050063303e-05, - "loss": 2.2646, - "step": 390940 - }, - { - "epoch": 0.68, - "learning_rate": 1.5911508560706202e-05, - "loss": 2.3772, - "step": 390950 - }, - { - "epoch": 0.68, - "learning_rate": 1.5910636620779376e-05, - "loss": 2.2648, - "step": 390960 - }, - { - "epoch": 0.68, - "learning_rate": 1.590976468085255e-05, - "loss": 2.2739, - "step": 390970 - }, - { - "epoch": 0.68, - "learning_rate": 1.590889274092572e-05, - "loss": 2.1613, - "step": 390980 - }, - { - "epoch": 0.68, - "learning_rate": 1.5908020800998898e-05, - "loss": 2.3222, - "step": 390990 - }, - { - "epoch": 0.68, - "learning_rate": 1.5907148861072068e-05, - "loss": 2.3008, - "step": 391000 - }, - { - "epoch": 0.68, - "learning_rate": 1.590627692114524e-05, - "loss": 2.2727, - "step": 391010 - }, - { - "epoch": 0.68, - "learning_rate": 1.5905404981218412e-05, - "loss": 2.3853, - "step": 391020 - }, - { - "epoch": 0.68, - "learning_rate": 1.590453304129159e-05, - "loss": 2.3491, - "step": 391030 - }, - { - "epoch": 0.68, - "learning_rate": 1.590366110136476e-05, - "loss": 2.262, - "step": 391040 - }, - { - "epoch": 0.68, - "learning_rate": 1.5902789161437933e-05, - "loss": 2.3055, - "step": 391050 - }, - { - "epoch": 0.68, - "learning_rate": 1.5901917221511107e-05, - "loss": 2.3221, - "step": 391060 - }, - { - "epoch": 0.68, - "learning_rate": 1.590104528158428e-05, - "loss": 2.3747, - "step": 391070 - }, - { - "epoch": 0.68, - "learning_rate": 1.5900173341657455e-05, - "loss": 2.37, - "step": 391080 - }, - { - "epoch": 0.68, - "learning_rate": 1.5899301401730625e-05, - "loss": 2.3406, - "step": 391090 - }, - { - "epoch": 0.68, - "learning_rate": 1.5898429461803802e-05, - "loss": 2.3394, - "step": 391100 - }, - { - "epoch": 0.68, - "learning_rate": 1.5897557521876973e-05, - "loss": 2.266, - "step": 391110 - }, - { - "epoch": 0.68, - "learning_rate": 1.5896685581950146e-05, - "loss": 2.2881, - "step": 391120 - }, - { - "epoch": 0.68, - "learning_rate": 1.589581364202332e-05, - "loss": 2.3114, - "step": 391130 - }, - { - "epoch": 0.68, - "learning_rate": 1.5894941702096494e-05, - "loss": 2.303, - "step": 391140 - }, - { - "epoch": 0.68, - "learning_rate": 1.5894069762169668e-05, - "loss": 2.3888, - "step": 391150 - }, - { - "epoch": 0.68, - "learning_rate": 1.5893197822242838e-05, - "loss": 2.3135, - "step": 391160 - }, - { - "epoch": 0.68, - "learning_rate": 1.5892325882316012e-05, - "loss": 2.2574, - "step": 391170 - }, - { - "epoch": 0.68, - "learning_rate": 1.5891453942389186e-05, - "loss": 2.302, - "step": 391180 - }, - { - "epoch": 0.68, - "learning_rate": 1.589058200246236e-05, - "loss": 2.3527, - "step": 391190 - }, - { - "epoch": 0.68, - "learning_rate": 1.5889710062535533e-05, - "loss": 2.3467, - "step": 391200 - }, - { - "epoch": 0.68, - "learning_rate": 1.5888838122608707e-05, - "loss": 2.3434, - "step": 391210 - }, - { - "epoch": 0.68, - "learning_rate": 1.588796618268188e-05, - "loss": 2.4504, - "step": 391220 - }, - { - "epoch": 0.68, - "learning_rate": 1.588709424275505e-05, - "loss": 2.3672, - "step": 391230 - }, - { - "epoch": 0.68, - "learning_rate": 1.5886222302828225e-05, - "loss": 2.4139, - "step": 391240 - }, - { - "epoch": 0.68, - "learning_rate": 1.58853503629014e-05, - "loss": 2.2881, - "step": 391250 - }, - { - "epoch": 0.68, - "learning_rate": 1.5884478422974572e-05, - "loss": 2.3084, - "step": 391260 - }, - { - "epoch": 0.68, - "learning_rate": 1.5883606483047743e-05, - "loss": 2.3502, - "step": 391270 - }, - { - "epoch": 0.68, - "learning_rate": 1.5882734543120917e-05, - "loss": 2.2187, - "step": 391280 - }, - { - "epoch": 0.68, - "learning_rate": 1.5881862603194094e-05, - "loss": 2.249, - "step": 391290 - }, - { - "epoch": 0.68, - "learning_rate": 1.5880990663267264e-05, - "loss": 2.1938, - "step": 391300 - }, - { - "epoch": 0.68, - "learning_rate": 1.5880118723340438e-05, - "loss": 2.2939, - "step": 391310 - }, - { - "epoch": 0.68, - "learning_rate": 1.5879246783413608e-05, - "loss": 2.3734, - "step": 391320 - }, - { - "epoch": 0.68, - "learning_rate": 1.5878374843486785e-05, - "loss": 2.3384, - "step": 391330 - }, - { - "epoch": 0.68, - "learning_rate": 1.5877502903559956e-05, - "loss": 2.4195, - "step": 391340 - }, - { - "epoch": 0.68, - "learning_rate": 1.587663096363313e-05, - "loss": 2.0815, - "step": 391350 - }, - { - "epoch": 0.68, - "learning_rate": 1.5875759023706303e-05, - "loss": 2.3929, - "step": 391360 - }, - { - "epoch": 0.68, - "learning_rate": 1.5874887083779477e-05, - "loss": 2.2279, - "step": 391370 - }, - { - "epoch": 0.68, - "learning_rate": 1.587401514385265e-05, - "loss": 2.3749, - "step": 391380 - }, - { - "epoch": 0.68, - "learning_rate": 1.587314320392582e-05, - "loss": 2.1414, - "step": 391390 - }, - { - "epoch": 0.68, - "learning_rate": 1.5872271263999e-05, - "loss": 2.3219, - "step": 391400 - }, - { - "epoch": 0.68, - "learning_rate": 1.587139932407217e-05, - "loss": 2.2351, - "step": 391410 - }, - { - "epoch": 0.68, - "learning_rate": 1.5870527384145343e-05, - "loss": 2.2712, - "step": 391420 - }, - { - "epoch": 0.68, - "learning_rate": 1.5869655444218516e-05, - "loss": 2.2513, - "step": 391430 - }, - { - "epoch": 0.68, - "learning_rate": 1.586878350429169e-05, - "loss": 2.3922, - "step": 391440 - }, - { - "epoch": 0.68, - "learning_rate": 1.5867911564364864e-05, - "loss": 2.2051, - "step": 391450 - }, - { - "epoch": 0.68, - "learning_rate": 1.5867039624438034e-05, - "loss": 2.3934, - "step": 391460 - }, - { - "epoch": 0.68, - "learning_rate": 1.586616768451121e-05, - "loss": 2.2629, - "step": 391470 - }, - { - "epoch": 0.68, - "learning_rate": 1.5865295744584382e-05, - "loss": 2.2959, - "step": 391480 - }, - { - "epoch": 0.68, - "learning_rate": 1.5864423804657556e-05, - "loss": 2.3307, - "step": 391490 - }, - { - "epoch": 0.68, - "learning_rate": 1.5863551864730726e-05, - "loss": 2.1836, - "step": 391500 - }, - { - "epoch": 0.68, - "learning_rate": 1.5862679924803903e-05, - "loss": 2.2554, - "step": 391510 - }, - { - "epoch": 0.68, - "learning_rate": 1.5861807984877073e-05, - "loss": 2.2118, - "step": 391520 - }, - { - "epoch": 0.68, - "learning_rate": 1.5860936044950247e-05, - "loss": 2.381, - "step": 391530 - }, - { - "epoch": 0.68, - "learning_rate": 1.586006410502342e-05, - "loss": 2.3692, - "step": 391540 - }, - { - "epoch": 0.68, - "learning_rate": 1.5859192165096595e-05, - "loss": 2.1428, - "step": 391550 - }, - { - "epoch": 0.68, - "learning_rate": 1.585832022516977e-05, - "loss": 2.4009, - "step": 391560 - }, - { - "epoch": 0.68, - "learning_rate": 1.585744828524294e-05, - "loss": 2.3524, - "step": 391570 - }, - { - "epoch": 0.68, - "learning_rate": 1.5856576345316113e-05, - "loss": 2.3244, - "step": 391580 - }, - { - "epoch": 0.68, - "learning_rate": 1.5855704405389286e-05, - "loss": 2.3223, - "step": 391590 - }, - { - "epoch": 0.68, - "learning_rate": 1.585483246546246e-05, - "loss": 2.2617, - "step": 391600 - }, - { - "epoch": 0.68, - "learning_rate": 1.5853960525535634e-05, - "loss": 2.275, - "step": 391610 - }, - { - "epoch": 0.68, - "learning_rate": 1.5853088585608808e-05, - "loss": 2.3008, - "step": 391620 - }, - { - "epoch": 0.68, - "learning_rate": 1.585221664568198e-05, - "loss": 2.2634, - "step": 391630 - }, - { - "epoch": 0.68, - "learning_rate": 1.5851344705755152e-05, - "loss": 2.2399, - "step": 391640 - }, - { - "epoch": 0.68, - "learning_rate": 1.5850472765828326e-05, - "loss": 2.2583, - "step": 391650 - }, - { - "epoch": 0.68, - "learning_rate": 1.58496008259015e-05, - "loss": 2.3183, - "step": 391660 - }, - { - "epoch": 0.68, - "learning_rate": 1.5848728885974673e-05, - "loss": 2.159, - "step": 391670 - }, - { - "epoch": 0.68, - "learning_rate": 1.5847856946047847e-05, - "loss": 2.1771, - "step": 391680 - }, - { - "epoch": 0.68, - "learning_rate": 1.5846985006121017e-05, - "loss": 2.3488, - "step": 391690 - }, - { - "epoch": 0.68, - "learning_rate": 1.5846113066194195e-05, - "loss": 2.3316, - "step": 391700 - }, - { - "epoch": 0.68, - "learning_rate": 1.5845241126267365e-05, - "loss": 2.3274, - "step": 391710 - }, - { - "epoch": 0.68, - "learning_rate": 1.584436918634054e-05, - "loss": 2.4284, - "step": 391720 - }, - { - "epoch": 0.68, - "learning_rate": 1.584349724641371e-05, - "loss": 2.2582, - "step": 391730 - }, - { - "epoch": 0.68, - "learning_rate": 1.5842625306486886e-05, - "loss": 2.3055, - "step": 391740 - }, - { - "epoch": 0.68, - "learning_rate": 1.5841753366560057e-05, - "loss": 2.3306, - "step": 391750 - }, - { - "epoch": 0.68, - "learning_rate": 1.584088142663323e-05, - "loss": 2.3548, - "step": 391760 - }, - { - "epoch": 0.68, - "learning_rate": 1.5840009486706404e-05, - "loss": 2.3519, - "step": 391770 - }, - { - "epoch": 0.68, - "learning_rate": 1.5839137546779578e-05, - "loss": 2.3234, - "step": 391780 - }, - { - "epoch": 0.68, - "learning_rate": 1.5838265606852752e-05, - "loss": 2.2974, - "step": 391790 - }, - { - "epoch": 0.68, - "learning_rate": 1.5837393666925922e-05, - "loss": 2.2581, - "step": 391800 - }, - { - "epoch": 0.68, - "learning_rate": 1.58365217269991e-05, - "loss": 2.2507, - "step": 391810 - }, - { - "epoch": 0.68, - "learning_rate": 1.583564978707227e-05, - "loss": 2.1494, - "step": 391820 - }, - { - "epoch": 0.68, - "learning_rate": 1.5834777847145443e-05, - "loss": 2.2824, - "step": 391830 - }, - { - "epoch": 0.68, - "learning_rate": 1.5833905907218617e-05, - "loss": 2.3391, - "step": 391840 - }, - { - "epoch": 0.68, - "learning_rate": 1.583303396729179e-05, - "loss": 2.2957, - "step": 391850 - }, - { - "epoch": 0.68, - "learning_rate": 1.5832162027364965e-05, - "loss": 2.3626, - "step": 391860 - }, - { - "epoch": 0.68, - "learning_rate": 1.5831290087438135e-05, - "loss": 2.3594, - "step": 391870 - }, - { - "epoch": 0.68, - "learning_rate": 1.5830418147511312e-05, - "loss": 2.3654, - "step": 391880 - }, - { - "epoch": 0.68, - "learning_rate": 1.5829546207584483e-05, - "loss": 2.2537, - "step": 391890 - }, - { - "epoch": 0.68, - "learning_rate": 1.5828674267657656e-05, - "loss": 2.2806, - "step": 391900 - }, - { - "epoch": 0.68, - "learning_rate": 1.582780232773083e-05, - "loss": 2.3088, - "step": 391910 - }, - { - "epoch": 0.68, - "learning_rate": 1.5826930387804004e-05, - "loss": 2.273, - "step": 391920 - }, - { - "epoch": 0.68, - "learning_rate": 1.5826058447877178e-05, - "loss": 2.2114, - "step": 391930 - }, - { - "epoch": 0.68, - "learning_rate": 1.5825186507950348e-05, - "loss": 2.2731, - "step": 391940 - }, - { - "epoch": 0.68, - "learning_rate": 1.5824314568023522e-05, - "loss": 2.3592, - "step": 391950 - }, - { - "epoch": 0.68, - "learning_rate": 1.5823442628096696e-05, - "loss": 2.3905, - "step": 391960 - }, - { - "epoch": 0.68, - "learning_rate": 1.582257068816987e-05, - "loss": 2.2106, - "step": 391970 - }, - { - "epoch": 0.68, - "learning_rate": 1.582169874824304e-05, - "loss": 2.2491, - "step": 391980 - }, - { - "epoch": 0.68, - "learning_rate": 1.5820826808316214e-05, - "loss": 2.2564, - "step": 391990 - }, - { - "epoch": 0.68, - "learning_rate": 1.5819954868389387e-05, - "loss": 2.2582, - "step": 392000 - }, - { - "epoch": 0.68, - "learning_rate": 1.581908292846256e-05, - "loss": 2.0975, - "step": 392010 - }, - { - "epoch": 0.68, - "learning_rate": 1.5818210988535735e-05, - "loss": 2.291, - "step": 392020 - }, - { - "epoch": 0.68, - "learning_rate": 1.581733904860891e-05, - "loss": 2.1803, - "step": 392030 - }, - { - "epoch": 0.68, - "learning_rate": 1.5816467108682082e-05, - "loss": 2.3194, - "step": 392040 - }, - { - "epoch": 0.68, - "learning_rate": 1.5815595168755253e-05, - "loss": 2.1958, - "step": 392050 - }, - { - "epoch": 0.68, - "learning_rate": 1.5814723228828427e-05, - "loss": 2.3078, - "step": 392060 - }, - { - "epoch": 0.68, - "learning_rate": 1.58138512889016e-05, - "loss": 2.2691, - "step": 392070 - }, - { - "epoch": 0.68, - "learning_rate": 1.5812979348974774e-05, - "loss": 2.2867, - "step": 392080 - }, - { - "epoch": 0.68, - "learning_rate": 1.5812107409047948e-05, - "loss": 2.4097, - "step": 392090 - }, - { - "epoch": 0.68, - "learning_rate": 1.5811235469121118e-05, - "loss": 2.2522, - "step": 392100 - }, - { - "epoch": 0.68, - "learning_rate": 1.5810363529194295e-05, - "loss": 2.2104, - "step": 392110 - }, - { - "epoch": 0.68, - "learning_rate": 1.5809491589267466e-05, - "loss": 2.351, - "step": 392120 - }, - { - "epoch": 0.68, - "learning_rate": 1.580861964934064e-05, - "loss": 2.3567, - "step": 392130 - }, - { - "epoch": 0.68, - "learning_rate": 1.5807747709413813e-05, - "loss": 2.2424, - "step": 392140 - }, - { - "epoch": 0.68, - "learning_rate": 1.5806875769486987e-05, - "loss": 2.1597, - "step": 392150 - }, - { - "epoch": 0.68, - "learning_rate": 1.580600382956016e-05, - "loss": 2.3506, - "step": 392160 - }, - { - "epoch": 0.68, - "learning_rate": 1.580513188963333e-05, - "loss": 2.2791, - "step": 392170 - }, - { - "epoch": 0.68, - "learning_rate": 1.580425994970651e-05, - "loss": 2.1875, - "step": 392180 - }, - { - "epoch": 0.68, - "learning_rate": 1.580338800977968e-05, - "loss": 2.312, - "step": 392190 - }, - { - "epoch": 0.68, - "learning_rate": 1.5802516069852853e-05, - "loss": 2.206, - "step": 392200 - }, - { - "epoch": 0.68, - "learning_rate": 1.5801644129926023e-05, - "loss": 2.3332, - "step": 392210 - }, - { - "epoch": 0.68, - "learning_rate": 1.58007721899992e-05, - "loss": 2.2836, - "step": 392220 - }, - { - "epoch": 0.68, - "learning_rate": 1.579990025007237e-05, - "loss": 2.3922, - "step": 392230 - }, - { - "epoch": 0.68, - "learning_rate": 1.5799028310145544e-05, - "loss": 2.266, - "step": 392240 - }, - { - "epoch": 0.68, - "learning_rate": 1.5798156370218718e-05, - "loss": 2.4304, - "step": 392250 - }, - { - "epoch": 0.68, - "learning_rate": 1.5797284430291892e-05, - "loss": 2.3437, - "step": 392260 - }, - { - "epoch": 0.68, - "learning_rate": 1.5796412490365066e-05, - "loss": 2.3491, - "step": 392270 - }, - { - "epoch": 0.68, - "learning_rate": 1.5795540550438236e-05, - "loss": 2.2224, - "step": 392280 - }, - { - "epoch": 0.68, - "learning_rate": 1.5794668610511413e-05, - "loss": 2.2815, - "step": 392290 - }, - { - "epoch": 0.68, - "learning_rate": 1.5793796670584583e-05, - "loss": 2.254, - "step": 392300 - }, - { - "epoch": 0.68, - "learning_rate": 1.5792924730657757e-05, - "loss": 2.2111, - "step": 392310 - }, - { - "epoch": 0.68, - "learning_rate": 1.579205279073093e-05, - "loss": 2.2964, - "step": 392320 - }, - { - "epoch": 0.68, - "learning_rate": 1.5791180850804105e-05, - "loss": 2.2012, - "step": 392330 - }, - { - "epoch": 0.68, - "learning_rate": 1.579030891087728e-05, - "loss": 2.2447, - "step": 392340 - }, - { - "epoch": 0.68, - "learning_rate": 1.578943697095045e-05, - "loss": 2.3899, - "step": 392350 - }, - { - "epoch": 0.68, - "learning_rate": 1.5788565031023623e-05, - "loss": 2.3952, - "step": 392360 - }, - { - "epoch": 0.68, - "learning_rate": 1.5787693091096796e-05, - "loss": 2.3136, - "step": 392370 - }, - { - "epoch": 0.68, - "learning_rate": 1.578682115116997e-05, - "loss": 2.2071, - "step": 392380 - }, - { - "epoch": 0.68, - "learning_rate": 1.578594921124314e-05, - "loss": 2.3228, - "step": 392390 - }, - { - "epoch": 0.68, - "learning_rate": 1.5785077271316318e-05, - "loss": 2.3382, - "step": 392400 - }, - { - "epoch": 0.68, - "learning_rate": 1.578420533138949e-05, - "loss": 2.3968, - "step": 392410 - }, - { - "epoch": 0.68, - "learning_rate": 1.5783333391462662e-05, - "loss": 2.3238, - "step": 392420 - }, - { - "epoch": 0.68, - "learning_rate": 1.5782461451535836e-05, - "loss": 2.4164, - "step": 392430 - }, - { - "epoch": 0.68, - "learning_rate": 1.578158951160901e-05, - "loss": 2.2935, - "step": 392440 - }, - { - "epoch": 0.68, - "learning_rate": 1.5780717571682183e-05, - "loss": 2.1633, - "step": 392450 - }, - { - "epoch": 0.68, - "learning_rate": 1.5779845631755354e-05, - "loss": 2.3777, - "step": 392460 - }, - { - "epoch": 0.68, - "learning_rate": 1.5778973691828527e-05, - "loss": 2.3679, - "step": 392470 - }, - { - "epoch": 0.68, - "learning_rate": 1.57781017519017e-05, - "loss": 2.2691, - "step": 392480 - }, - { - "epoch": 0.68, - "learning_rate": 1.5777229811974875e-05, - "loss": 2.2483, - "step": 392490 - }, - { - "epoch": 0.68, - "learning_rate": 1.577635787204805e-05, - "loss": 2.3063, - "step": 392500 - }, - { - "epoch": 0.68, - "learning_rate": 1.577548593212122e-05, - "loss": 2.2587, - "step": 392510 - }, - { - "epoch": 0.68, - "learning_rate": 1.5774613992194396e-05, - "loss": 2.2477, - "step": 392520 - }, - { - "epoch": 0.68, - "learning_rate": 1.5773742052267567e-05, - "loss": 2.3698, - "step": 392530 - }, - { - "epoch": 0.68, - "learning_rate": 1.577287011234074e-05, - "loss": 2.2894, - "step": 392540 - }, - { - "epoch": 0.68, - "learning_rate": 1.5771998172413914e-05, - "loss": 2.3499, - "step": 392550 - }, - { - "epoch": 0.68, - "learning_rate": 1.5771126232487088e-05, - "loss": 2.3456, - "step": 392560 - }, - { - "epoch": 0.68, - "learning_rate": 1.5770254292560262e-05, - "loss": 2.3276, - "step": 392570 - }, - { - "epoch": 0.68, - "learning_rate": 1.5769382352633432e-05, - "loss": 2.3749, - "step": 392580 - }, - { - "epoch": 0.68, - "learning_rate": 1.576851041270661e-05, - "loss": 2.2454, - "step": 392590 - }, - { - "epoch": 0.68, - "learning_rate": 1.576763847277978e-05, - "loss": 2.2309, - "step": 392600 - }, - { - "epoch": 0.68, - "learning_rate": 1.5766766532852953e-05, - "loss": 2.2784, - "step": 392610 - }, - { - "epoch": 0.68, - "learning_rate": 1.5765894592926124e-05, - "loss": 2.3178, - "step": 392620 - }, - { - "epoch": 0.68, - "learning_rate": 1.57650226529993e-05, - "loss": 2.3932, - "step": 392630 - }, - { - "epoch": 0.68, - "learning_rate": 1.5764150713072475e-05, - "loss": 2.3966, - "step": 392640 - }, - { - "epoch": 0.68, - "learning_rate": 1.5763278773145645e-05, - "loss": 2.3525, - "step": 392650 - }, - { - "epoch": 0.68, - "learning_rate": 1.576240683321882e-05, - "loss": 2.3864, - "step": 392660 - }, - { - "epoch": 0.68, - "learning_rate": 1.5761534893291993e-05, - "loss": 2.2953, - "step": 392670 - }, - { - "epoch": 0.68, - "learning_rate": 1.5760662953365166e-05, - "loss": 2.2973, - "step": 392680 - }, - { - "epoch": 0.68, - "learning_rate": 1.5759791013438337e-05, - "loss": 2.2768, - "step": 392690 - }, - { - "epoch": 0.68, - "learning_rate": 1.5758919073511514e-05, - "loss": 2.3058, - "step": 392700 - }, - { - "epoch": 0.68, - "learning_rate": 1.5758047133584684e-05, - "loss": 2.323, - "step": 392710 - }, - { - "epoch": 0.68, - "learning_rate": 1.5757175193657858e-05, - "loss": 2.3241, - "step": 392720 - }, - { - "epoch": 0.68, - "learning_rate": 1.5756303253731032e-05, - "loss": 2.3068, - "step": 392730 - }, - { - "epoch": 0.68, - "learning_rate": 1.5755431313804206e-05, - "loss": 2.3078, - "step": 392740 - }, - { - "epoch": 0.68, - "learning_rate": 1.575455937387738e-05, - "loss": 2.2829, - "step": 392750 - }, - { - "epoch": 0.68, - "learning_rate": 1.575368743395055e-05, - "loss": 2.2243, - "step": 392760 - }, - { - "epoch": 0.68, - "learning_rate": 1.5752815494023724e-05, - "loss": 2.3625, - "step": 392770 - }, - { - "epoch": 0.68, - "learning_rate": 1.5751943554096897e-05, - "loss": 2.2287, - "step": 392780 - }, - { - "epoch": 0.68, - "learning_rate": 1.575107161417007e-05, - "loss": 2.3678, - "step": 392790 - }, - { - "epoch": 0.68, - "learning_rate": 1.5750199674243245e-05, - "loss": 2.2152, - "step": 392800 - }, - { - "epoch": 0.69, - "learning_rate": 1.574932773431642e-05, - "loss": 2.3582, - "step": 392810 - }, - { - "epoch": 0.69, - "learning_rate": 1.5748455794389592e-05, - "loss": 2.2649, - "step": 392820 - }, - { - "epoch": 0.69, - "learning_rate": 1.5747583854462763e-05, - "loss": 2.2394, - "step": 392830 - }, - { - "epoch": 0.69, - "learning_rate": 1.5746711914535937e-05, - "loss": 2.2726, - "step": 392840 - }, - { - "epoch": 0.69, - "learning_rate": 1.574583997460911e-05, - "loss": 2.183, - "step": 392850 - }, - { - "epoch": 0.69, - "learning_rate": 1.5744968034682284e-05, - "loss": 2.2805, - "step": 392860 - }, - { - "epoch": 0.69, - "learning_rate": 1.5744096094755454e-05, - "loss": 2.2444, - "step": 392870 - }, - { - "epoch": 0.69, - "learning_rate": 1.5743224154828628e-05, - "loss": 2.3211, - "step": 392880 - }, - { - "epoch": 0.69, - "learning_rate": 1.5742352214901805e-05, - "loss": 2.2253, - "step": 392890 - }, - { - "epoch": 0.69, - "learning_rate": 1.5741480274974976e-05, - "loss": 2.3672, - "step": 392900 - }, - { - "epoch": 0.69, - "learning_rate": 1.574060833504815e-05, - "loss": 2.3297, - "step": 392910 - }, - { - "epoch": 0.69, - "learning_rate": 1.573973639512132e-05, - "loss": 2.2338, - "step": 392920 - }, - { - "epoch": 0.69, - "learning_rate": 1.5738864455194497e-05, - "loss": 2.2223, - "step": 392930 - }, - { - "epoch": 0.69, - "learning_rate": 1.5737992515267667e-05, - "loss": 2.246, - "step": 392940 - }, - { - "epoch": 0.69, - "learning_rate": 1.573712057534084e-05, - "loss": 2.3785, - "step": 392950 - }, - { - "epoch": 0.69, - "learning_rate": 1.5736248635414015e-05, - "loss": 2.3309, - "step": 392960 - }, - { - "epoch": 0.69, - "learning_rate": 1.573537669548719e-05, - "loss": 2.2634, - "step": 392970 - }, - { - "epoch": 0.69, - "learning_rate": 1.5734504755560363e-05, - "loss": 2.4528, - "step": 392980 - }, - { - "epoch": 0.69, - "learning_rate": 1.5733632815633533e-05, - "loss": 2.2897, - "step": 392990 - }, - { - "epoch": 0.69, - "learning_rate": 1.573276087570671e-05, - "loss": 2.2529, - "step": 393000 - }, - { - "epoch": 0.69, - "learning_rate": 1.573188893577988e-05, - "loss": 2.3341, - "step": 393010 - }, - { - "epoch": 0.69, - "learning_rate": 1.5731016995853054e-05, - "loss": 2.2444, - "step": 393020 - }, - { - "epoch": 0.69, - "learning_rate": 1.5730145055926228e-05, - "loss": 2.3314, - "step": 393030 - }, - { - "epoch": 0.69, - "learning_rate": 1.5729273115999402e-05, - "loss": 2.3303, - "step": 393040 - }, - { - "epoch": 0.69, - "learning_rate": 1.5728401176072576e-05, - "loss": 2.3383, - "step": 393050 - }, - { - "epoch": 0.69, - "learning_rate": 1.5727529236145746e-05, - "loss": 2.2323, - "step": 393060 - }, - { - "epoch": 0.69, - "learning_rate": 1.5726657296218923e-05, - "loss": 2.3111, - "step": 393070 - }, - { - "epoch": 0.69, - "learning_rate": 1.5725785356292093e-05, - "loss": 2.4157, - "step": 393080 - }, - { - "epoch": 0.69, - "learning_rate": 1.5724913416365267e-05, - "loss": 2.3736, - "step": 393090 - }, - { - "epoch": 0.69, - "learning_rate": 1.5724041476438438e-05, - "loss": 2.3733, - "step": 393100 - }, - { - "epoch": 0.69, - "learning_rate": 1.5723169536511615e-05, - "loss": 2.2952, - "step": 393110 - }, - { - "epoch": 0.69, - "learning_rate": 1.5722297596584785e-05, - "loss": 2.2612, - "step": 393120 - }, - { - "epoch": 0.69, - "learning_rate": 1.572142565665796e-05, - "loss": 2.2233, - "step": 393130 - }, - { - "epoch": 0.69, - "learning_rate": 1.5720553716731133e-05, - "loss": 2.2468, - "step": 393140 - }, - { - "epoch": 0.69, - "learning_rate": 1.5719681776804306e-05, - "loss": 2.3753, - "step": 393150 - }, - { - "epoch": 0.69, - "learning_rate": 1.571880983687748e-05, - "loss": 2.3325, - "step": 393160 - }, - { - "epoch": 0.69, - "learning_rate": 1.571793789695065e-05, - "loss": 2.3534, - "step": 393170 - }, - { - "epoch": 0.69, - "learning_rate": 1.5717065957023824e-05, - "loss": 2.3322, - "step": 393180 - }, - { - "epoch": 0.69, - "learning_rate": 1.5716194017096998e-05, - "loss": 2.3921, - "step": 393190 - }, - { - "epoch": 0.69, - "learning_rate": 1.5715322077170172e-05, - "loss": 2.3428, - "step": 393200 - }, - { - "epoch": 0.69, - "learning_rate": 1.5714450137243346e-05, - "loss": 2.3986, - "step": 393210 - }, - { - "epoch": 0.69, - "learning_rate": 1.571357819731652e-05, - "loss": 2.4193, - "step": 393220 - }, - { - "epoch": 0.69, - "learning_rate": 1.5712706257389693e-05, - "loss": 2.297, - "step": 393230 - }, - { - "epoch": 0.69, - "learning_rate": 1.5711834317462864e-05, - "loss": 2.2234, - "step": 393240 - }, - { - "epoch": 0.69, - "learning_rate": 1.5710962377536037e-05, - "loss": 2.334, - "step": 393250 - }, - { - "epoch": 0.69, - "learning_rate": 1.571009043760921e-05, - "loss": 2.2369, - "step": 393260 - }, - { - "epoch": 0.69, - "learning_rate": 1.5709218497682385e-05, - "loss": 2.3147, - "step": 393270 - }, - { - "epoch": 0.69, - "learning_rate": 1.570834655775556e-05, - "loss": 2.2475, - "step": 393280 - }, - { - "epoch": 0.69, - "learning_rate": 1.570747461782873e-05, - "loss": 2.1974, - "step": 393290 - }, - { - "epoch": 0.69, - "learning_rate": 1.5706602677901906e-05, - "loss": 2.2721, - "step": 393300 - }, - { - "epoch": 0.69, - "learning_rate": 1.5705730737975077e-05, - "loss": 2.2605, - "step": 393310 - }, - { - "epoch": 0.69, - "learning_rate": 1.570485879804825e-05, - "loss": 2.3117, - "step": 393320 - }, - { - "epoch": 0.69, - "learning_rate": 1.5703986858121424e-05, - "loss": 2.3696, - "step": 393330 - }, - { - "epoch": 0.69, - "learning_rate": 1.5703114918194598e-05, - "loss": 2.2218, - "step": 393340 - }, - { - "epoch": 0.69, - "learning_rate": 1.570224297826777e-05, - "loss": 2.4, - "step": 393350 - }, - { - "epoch": 0.69, - "learning_rate": 1.5701371038340942e-05, - "loss": 2.4373, - "step": 393360 - }, - { - "epoch": 0.69, - "learning_rate": 1.570049909841412e-05, - "loss": 2.1649, - "step": 393370 - }, - { - "epoch": 0.69, - "learning_rate": 1.569962715848729e-05, - "loss": 2.199, - "step": 393380 - }, - { - "epoch": 0.69, - "learning_rate": 1.5698755218560463e-05, - "loss": 2.2797, - "step": 393390 - }, - { - "epoch": 0.69, - "learning_rate": 1.5697883278633634e-05, - "loss": 2.2641, - "step": 393400 - }, - { - "epoch": 0.69, - "learning_rate": 1.569701133870681e-05, - "loss": 2.4265, - "step": 393410 - }, - { - "epoch": 0.69, - "learning_rate": 1.569613939877998e-05, - "loss": 2.1443, - "step": 393420 - }, - { - "epoch": 0.69, - "learning_rate": 1.5695267458853155e-05, - "loss": 2.4062, - "step": 393430 - }, - { - "epoch": 0.69, - "learning_rate": 1.569439551892633e-05, - "loss": 2.3335, - "step": 393440 - }, - { - "epoch": 0.69, - "learning_rate": 1.5693523578999503e-05, - "loss": 2.1734, - "step": 393450 - }, - { - "epoch": 0.69, - "learning_rate": 1.5692651639072676e-05, - "loss": 2.324, - "step": 393460 - }, - { - "epoch": 0.69, - "learning_rate": 1.5691779699145847e-05, - "loss": 2.3696, - "step": 393470 - }, - { - "epoch": 0.69, - "learning_rate": 1.5690907759219024e-05, - "loss": 2.2167, - "step": 393480 - }, - { - "epoch": 0.69, - "learning_rate": 1.5690035819292194e-05, - "loss": 2.3352, - "step": 393490 - }, - { - "epoch": 0.69, - "learning_rate": 1.5689163879365368e-05, - "loss": 2.3783, - "step": 393500 - }, - { - "epoch": 0.69, - "learning_rate": 1.5688291939438542e-05, - "loss": 2.3169, - "step": 393510 - }, - { - "epoch": 0.69, - "learning_rate": 1.5687419999511716e-05, - "loss": 2.2479, - "step": 393520 - }, - { - "epoch": 0.69, - "learning_rate": 1.568654805958489e-05, - "loss": 2.4021, - "step": 393530 - }, - { - "epoch": 0.69, - "learning_rate": 1.568567611965806e-05, - "loss": 2.3149, - "step": 393540 - }, - { - "epoch": 0.69, - "learning_rate": 1.5684804179731234e-05, - "loss": 2.3804, - "step": 393550 - }, - { - "epoch": 0.69, - "learning_rate": 1.5683932239804407e-05, - "loss": 2.3314, - "step": 393560 - }, - { - "epoch": 0.69, - "learning_rate": 1.568306029987758e-05, - "loss": 2.4249, - "step": 393570 - }, - { - "epoch": 0.69, - "learning_rate": 1.568218835995075e-05, - "loss": 2.2635, - "step": 393580 - }, - { - "epoch": 0.69, - "learning_rate": 1.5681316420023925e-05, - "loss": 2.3269, - "step": 393590 - }, - { - "epoch": 0.69, - "learning_rate": 1.56804444800971e-05, - "loss": 2.3827, - "step": 393600 - }, - { - "epoch": 0.69, - "learning_rate": 1.5679572540170273e-05, - "loss": 2.357, - "step": 393610 - }, - { - "epoch": 0.69, - "learning_rate": 1.5678700600243447e-05, - "loss": 2.3891, - "step": 393620 - }, - { - "epoch": 0.69, - "learning_rate": 1.567782866031662e-05, - "loss": 2.2876, - "step": 393630 - }, - { - "epoch": 0.69, - "learning_rate": 1.5676956720389794e-05, - "loss": 2.3675, - "step": 393640 - }, - { - "epoch": 0.69, - "learning_rate": 1.5676084780462964e-05, - "loss": 2.2496, - "step": 393650 - }, - { - "epoch": 0.69, - "learning_rate": 1.5675212840536138e-05, - "loss": 2.3112, - "step": 393660 - }, - { - "epoch": 0.69, - "learning_rate": 1.5674340900609312e-05, - "loss": 2.4226, - "step": 393670 - }, - { - "epoch": 0.69, - "learning_rate": 1.5673468960682486e-05, - "loss": 2.2863, - "step": 393680 - }, - { - "epoch": 0.69, - "learning_rate": 1.567259702075566e-05, - "loss": 2.4124, - "step": 393690 - }, - { - "epoch": 0.69, - "learning_rate": 1.567172508082883e-05, - "loss": 2.3001, - "step": 393700 - }, - { - "epoch": 0.69, - "learning_rate": 1.5670853140902007e-05, - "loss": 2.2604, - "step": 393710 - }, - { - "epoch": 0.69, - "learning_rate": 1.5669981200975177e-05, - "loss": 2.3939, - "step": 393720 - }, - { - "epoch": 0.69, - "learning_rate": 1.566910926104835e-05, - "loss": 2.2902, - "step": 393730 - }, - { - "epoch": 0.69, - "learning_rate": 1.5668237321121525e-05, - "loss": 2.3638, - "step": 393740 - }, - { - "epoch": 0.69, - "learning_rate": 1.56673653811947e-05, - "loss": 2.3554, - "step": 393750 - }, - { - "epoch": 0.69, - "learning_rate": 1.5666493441267873e-05, - "loss": 2.3898, - "step": 393760 - }, - { - "epoch": 0.69, - "learning_rate": 1.5665621501341043e-05, - "loss": 2.3239, - "step": 393770 - }, - { - "epoch": 0.69, - "learning_rate": 1.566474956141422e-05, - "loss": 2.2882, - "step": 393780 - }, - { - "epoch": 0.69, - "learning_rate": 1.566387762148739e-05, - "loss": 2.3299, - "step": 393790 - }, - { - "epoch": 0.69, - "learning_rate": 1.5663005681560564e-05, - "loss": 2.3978, - "step": 393800 - }, - { - "epoch": 0.69, - "learning_rate": 1.5662133741633735e-05, - "loss": 2.271, - "step": 393810 - }, - { - "epoch": 0.69, - "learning_rate": 1.5661261801706912e-05, - "loss": 2.3018, - "step": 393820 - }, - { - "epoch": 0.69, - "learning_rate": 1.5660389861780082e-05, - "loss": 2.3367, - "step": 393830 - }, - { - "epoch": 0.69, - "learning_rate": 1.5659517921853256e-05, - "loss": 2.2692, - "step": 393840 - }, - { - "epoch": 0.69, - "learning_rate": 1.565864598192643e-05, - "loss": 2.2265, - "step": 393850 - }, - { - "epoch": 0.69, - "learning_rate": 1.5657774041999603e-05, - "loss": 2.2946, - "step": 393860 - }, - { - "epoch": 0.69, - "learning_rate": 1.5656902102072777e-05, - "loss": 2.221, - "step": 393870 - }, - { - "epoch": 0.69, - "learning_rate": 1.5656030162145948e-05, - "loss": 2.3346, - "step": 393880 - }, - { - "epoch": 0.69, - "learning_rate": 1.5655158222219125e-05, - "loss": 2.2784, - "step": 393890 - }, - { - "epoch": 0.69, - "learning_rate": 1.5654286282292295e-05, - "loss": 2.2723, - "step": 393900 - }, - { - "epoch": 0.69, - "learning_rate": 1.565341434236547e-05, - "loss": 2.2093, - "step": 393910 - }, - { - "epoch": 0.69, - "learning_rate": 1.5652542402438643e-05, - "loss": 2.2655, - "step": 393920 - }, - { - "epoch": 0.69, - "learning_rate": 1.5651670462511816e-05, - "loss": 2.3587, - "step": 393930 - }, - { - "epoch": 0.69, - "learning_rate": 1.565079852258499e-05, - "loss": 2.3487, - "step": 393940 - }, - { - "epoch": 0.69, - "learning_rate": 1.564992658265816e-05, - "loss": 2.3593, - "step": 393950 - }, - { - "epoch": 0.69, - "learning_rate": 1.5649054642731334e-05, - "loss": 2.326, - "step": 393960 - }, - { - "epoch": 0.69, - "learning_rate": 1.5648182702804508e-05, - "loss": 2.3346, - "step": 393970 - }, - { - "epoch": 0.69, - "learning_rate": 1.5647310762877682e-05, - "loss": 2.2808, - "step": 393980 - }, - { - "epoch": 0.69, - "learning_rate": 1.5646438822950856e-05, - "loss": 2.236, - "step": 393990 - }, - { - "epoch": 0.69, - "learning_rate": 1.564556688302403e-05, - "loss": 2.2877, - "step": 394000 - }, - { - "epoch": 0.69, - "learning_rate": 1.5644694943097203e-05, - "loss": 2.2897, - "step": 394010 - }, - { - "epoch": 0.69, - "learning_rate": 1.5643823003170374e-05, - "loss": 2.2505, - "step": 394020 - }, - { - "epoch": 0.69, - "learning_rate": 1.5642951063243547e-05, - "loss": 2.2065, - "step": 394030 - }, - { - "epoch": 0.69, - "learning_rate": 1.564207912331672e-05, - "loss": 2.2808, - "step": 394040 - }, - { - "epoch": 0.69, - "learning_rate": 1.5641207183389895e-05, - "loss": 2.4624, - "step": 394050 - }, - { - "epoch": 0.69, - "learning_rate": 1.5640335243463065e-05, - "loss": 2.4113, - "step": 394060 - }, - { - "epoch": 0.69, - "learning_rate": 1.563946330353624e-05, - "loss": 2.4141, - "step": 394070 - }, - { - "epoch": 0.69, - "learning_rate": 1.5638591363609413e-05, - "loss": 2.2436, - "step": 394080 - }, - { - "epoch": 0.69, - "learning_rate": 1.5637719423682587e-05, - "loss": 2.4314, - "step": 394090 - }, - { - "epoch": 0.69, - "learning_rate": 1.563684748375576e-05, - "loss": 2.2061, - "step": 394100 - }, - { - "epoch": 0.69, - "learning_rate": 1.563597554382893e-05, - "loss": 2.2542, - "step": 394110 - }, - { - "epoch": 0.69, - "learning_rate": 1.5635103603902108e-05, - "loss": 2.1864, - "step": 394120 - }, - { - "epoch": 0.69, - "learning_rate": 1.563423166397528e-05, - "loss": 2.3405, - "step": 394130 - }, - { - "epoch": 0.69, - "learning_rate": 1.5633359724048452e-05, - "loss": 2.2129, - "step": 394140 - }, - { - "epoch": 0.69, - "learning_rate": 1.5632487784121626e-05, - "loss": 2.4347, - "step": 394150 - }, - { - "epoch": 0.69, - "learning_rate": 1.56316158441948e-05, - "loss": 2.316, - "step": 394160 - }, - { - "epoch": 0.69, - "learning_rate": 1.5630743904267973e-05, - "loss": 2.226, - "step": 394170 - }, - { - "epoch": 0.69, - "learning_rate": 1.5629871964341144e-05, - "loss": 2.2035, - "step": 394180 - }, - { - "epoch": 0.69, - "learning_rate": 1.562900002441432e-05, - "loss": 2.28, - "step": 394190 - }, - { - "epoch": 0.69, - "learning_rate": 1.562812808448749e-05, - "loss": 2.3183, - "step": 394200 - }, - { - "epoch": 0.69, - "learning_rate": 1.5627256144560665e-05, - "loss": 2.3663, - "step": 394210 - }, - { - "epoch": 0.69, - "learning_rate": 1.5626384204633835e-05, - "loss": 2.4345, - "step": 394220 - }, - { - "epoch": 0.69, - "learning_rate": 1.5625512264707013e-05, - "loss": 2.2684, - "step": 394230 - }, - { - "epoch": 0.69, - "learning_rate": 1.5624640324780186e-05, - "loss": 2.2658, - "step": 394240 - }, - { - "epoch": 0.69, - "learning_rate": 1.5623768384853357e-05, - "loss": 2.3504, - "step": 394250 - }, - { - "epoch": 0.69, - "learning_rate": 1.562289644492653e-05, - "loss": 2.2816, - "step": 394260 - }, - { - "epoch": 0.69, - "learning_rate": 1.5622024504999704e-05, - "loss": 2.2944, - "step": 394270 - }, - { - "epoch": 0.69, - "learning_rate": 1.5621152565072878e-05, - "loss": 2.3261, - "step": 394280 - }, - { - "epoch": 0.69, - "learning_rate": 1.562028062514605e-05, - "loss": 2.3688, - "step": 394290 - }, - { - "epoch": 0.69, - "learning_rate": 1.5619408685219226e-05, - "loss": 2.3641, - "step": 394300 - }, - { - "epoch": 0.69, - "learning_rate": 1.5618536745292396e-05, - "loss": 2.3835, - "step": 394310 - }, - { - "epoch": 0.69, - "learning_rate": 1.561766480536557e-05, - "loss": 2.3628, - "step": 394320 - }, - { - "epoch": 0.69, - "learning_rate": 1.5616792865438744e-05, - "loss": 2.2645, - "step": 394330 - }, - { - "epoch": 0.69, - "learning_rate": 1.5615920925511917e-05, - "loss": 2.3923, - "step": 394340 - }, - { - "epoch": 0.69, - "learning_rate": 1.561504898558509e-05, - "loss": 2.1688, - "step": 394350 - }, - { - "epoch": 0.69, - "learning_rate": 1.561417704565826e-05, - "loss": 2.2958, - "step": 394360 - }, - { - "epoch": 0.69, - "learning_rate": 1.5613305105731435e-05, - "loss": 2.3899, - "step": 394370 - }, - { - "epoch": 0.69, - "learning_rate": 1.561243316580461e-05, - "loss": 2.412, - "step": 394380 - }, - { - "epoch": 0.69, - "learning_rate": 1.5611561225877783e-05, - "loss": 2.2463, - "step": 394390 - }, - { - "epoch": 0.69, - "learning_rate": 1.5610689285950957e-05, - "loss": 2.321, - "step": 394400 - }, - { - "epoch": 0.69, - "learning_rate": 1.560981734602413e-05, - "loss": 2.3217, - "step": 394410 - }, - { - "epoch": 0.69, - "learning_rate": 1.5608945406097304e-05, - "loss": 2.3434, - "step": 394420 - }, - { - "epoch": 0.69, - "learning_rate": 1.5608073466170474e-05, - "loss": 2.3581, - "step": 394430 - }, - { - "epoch": 0.69, - "learning_rate": 1.5607201526243648e-05, - "loss": 2.275, - "step": 394440 - }, - { - "epoch": 0.69, - "learning_rate": 1.5606329586316822e-05, - "loss": 2.3837, - "step": 394450 - }, - { - "epoch": 0.69, - "learning_rate": 1.5605457646389996e-05, - "loss": 2.4262, - "step": 394460 - }, - { - "epoch": 0.69, - "learning_rate": 1.5604585706463166e-05, - "loss": 2.262, - "step": 394470 - }, - { - "epoch": 0.69, - "learning_rate": 1.560371376653634e-05, - "loss": 2.2909, - "step": 394480 - }, - { - "epoch": 0.69, - "learning_rate": 1.5602841826609517e-05, - "loss": 2.2969, - "step": 394490 - }, - { - "epoch": 0.69, - "learning_rate": 1.5601969886682687e-05, - "loss": 2.3265, - "step": 394500 - }, - { - "epoch": 0.69, - "learning_rate": 1.560109794675586e-05, - "loss": 2.2174, - "step": 394510 - }, - { - "epoch": 0.69, - "learning_rate": 1.560022600682903e-05, - "loss": 2.279, - "step": 394520 - }, - { - "epoch": 0.69, - "learning_rate": 1.559935406690221e-05, - "loss": 2.3344, - "step": 394530 - }, - { - "epoch": 0.69, - "learning_rate": 1.559848212697538e-05, - "loss": 2.3447, - "step": 394540 - }, - { - "epoch": 0.69, - "learning_rate": 1.5597610187048553e-05, - "loss": 2.3354, - "step": 394550 - }, - { - "epoch": 0.69, - "learning_rate": 1.5596738247121727e-05, - "loss": 2.136, - "step": 394560 - }, - { - "epoch": 0.69, - "learning_rate": 1.55958663071949e-05, - "loss": 2.4076, - "step": 394570 - }, - { - "epoch": 0.69, - "learning_rate": 1.5594994367268074e-05, - "loss": 2.2347, - "step": 394580 - }, - { - "epoch": 0.69, - "learning_rate": 1.5594122427341245e-05, - "loss": 2.2667, - "step": 394590 - }, - { - "epoch": 0.69, - "learning_rate": 1.5593250487414422e-05, - "loss": 2.3372, - "step": 394600 - }, - { - "epoch": 0.69, - "learning_rate": 1.5592378547487592e-05, - "loss": 2.3842, - "step": 394610 - }, - { - "epoch": 0.69, - "learning_rate": 1.5591506607560766e-05, - "loss": 2.2961, - "step": 394620 - }, - { - "epoch": 0.69, - "learning_rate": 1.559063466763394e-05, - "loss": 2.2801, - "step": 394630 - }, - { - "epoch": 0.69, - "learning_rate": 1.5589762727707113e-05, - "loss": 2.388, - "step": 394640 - }, - { - "epoch": 0.69, - "learning_rate": 1.5588890787780287e-05, - "loss": 2.2325, - "step": 394650 - }, - { - "epoch": 0.69, - "learning_rate": 1.5588018847853458e-05, - "loss": 2.3225, - "step": 394660 - }, - { - "epoch": 0.69, - "learning_rate": 1.5587146907926635e-05, - "loss": 2.2987, - "step": 394670 - }, - { - "epoch": 0.69, - "learning_rate": 1.5586274967999805e-05, - "loss": 2.3647, - "step": 394680 - }, - { - "epoch": 0.69, - "learning_rate": 1.558540302807298e-05, - "loss": 2.3401, - "step": 394690 - }, - { - "epoch": 0.69, - "learning_rate": 1.558453108814615e-05, - "loss": 2.3465, - "step": 394700 - }, - { - "epoch": 0.69, - "learning_rate": 1.5583659148219326e-05, - "loss": 2.3885, - "step": 394710 - }, - { - "epoch": 0.69, - "learning_rate": 1.55827872082925e-05, - "loss": 2.3566, - "step": 394720 - }, - { - "epoch": 0.69, - "learning_rate": 1.558191526836567e-05, - "loss": 2.299, - "step": 394730 - }, - { - "epoch": 0.69, - "learning_rate": 1.5581043328438844e-05, - "loss": 2.1961, - "step": 394740 - }, - { - "epoch": 0.69, - "learning_rate": 1.5580171388512018e-05, - "loss": 2.2944, - "step": 394750 - }, - { - "epoch": 0.69, - "learning_rate": 1.5579299448585192e-05, - "loss": 2.2664, - "step": 394760 - }, - { - "epoch": 0.69, - "learning_rate": 1.5578427508658362e-05, - "loss": 2.299, - "step": 394770 - }, - { - "epoch": 0.69, - "learning_rate": 1.5577555568731536e-05, - "loss": 2.4043, - "step": 394780 - }, - { - "epoch": 0.69, - "learning_rate": 1.557668362880471e-05, - "loss": 2.2369, - "step": 394790 - }, - { - "epoch": 0.69, - "learning_rate": 1.5575811688877884e-05, - "loss": 2.3919, - "step": 394800 - }, - { - "epoch": 0.69, - "learning_rate": 1.5574939748951057e-05, - "loss": 2.2028, - "step": 394810 - }, - { - "epoch": 0.69, - "learning_rate": 1.557406780902423e-05, - "loss": 2.2179, - "step": 394820 - }, - { - "epoch": 0.69, - "learning_rate": 1.5573195869097405e-05, - "loss": 2.3701, - "step": 394830 - }, - { - "epoch": 0.69, - "learning_rate": 1.5572323929170575e-05, - "loss": 2.2566, - "step": 394840 - }, - { - "epoch": 0.69, - "learning_rate": 1.557145198924375e-05, - "loss": 2.3268, - "step": 394850 - }, - { - "epoch": 0.69, - "learning_rate": 1.5570580049316923e-05, - "loss": 2.2484, - "step": 394860 - }, - { - "epoch": 0.69, - "learning_rate": 1.5569708109390097e-05, - "loss": 2.2993, - "step": 394870 - }, - { - "epoch": 0.69, - "learning_rate": 1.556883616946327e-05, - "loss": 2.3486, - "step": 394880 - }, - { - "epoch": 0.69, - "learning_rate": 1.556796422953644e-05, - "loss": 2.3381, - "step": 394890 - }, - { - "epoch": 0.69, - "learning_rate": 1.5567092289609618e-05, - "loss": 2.3471, - "step": 394900 - }, - { - "epoch": 0.69, - "learning_rate": 1.556622034968279e-05, - "loss": 2.3526, - "step": 394910 - }, - { - "epoch": 0.69, - "learning_rate": 1.5565348409755962e-05, - "loss": 2.3438, - "step": 394920 - }, - { - "epoch": 0.69, - "learning_rate": 1.5564476469829136e-05, - "loss": 2.3181, - "step": 394930 - }, - { - "epoch": 0.69, - "learning_rate": 1.556360452990231e-05, - "loss": 2.2979, - "step": 394940 - }, - { - "epoch": 0.69, - "learning_rate": 1.556273258997548e-05, - "loss": 2.4284, - "step": 394950 - }, - { - "epoch": 0.69, - "learning_rate": 1.5561860650048654e-05, - "loss": 2.2853, - "step": 394960 - }, - { - "epoch": 0.69, - "learning_rate": 1.556098871012183e-05, - "loss": 2.3633, - "step": 394970 - }, - { - "epoch": 0.69, - "learning_rate": 1.5560116770195e-05, - "loss": 2.3276, - "step": 394980 - }, - { - "epoch": 0.69, - "learning_rate": 1.5559244830268175e-05, - "loss": 2.2887, - "step": 394990 - }, - { - "epoch": 0.69, - "learning_rate": 1.5558372890341345e-05, - "loss": 2.376, - "step": 395000 - }, - { - "epoch": 0.69, - "learning_rate": 1.5557500950414523e-05, - "loss": 2.3267, - "step": 395010 - }, - { - "epoch": 0.69, - "learning_rate": 1.5556629010487693e-05, - "loss": 2.3067, - "step": 395020 - }, - { - "epoch": 0.69, - "learning_rate": 1.5555757070560867e-05, - "loss": 2.3042, - "step": 395030 - }, - { - "epoch": 0.69, - "learning_rate": 1.555488513063404e-05, - "loss": 2.3333, - "step": 395040 - }, - { - "epoch": 0.69, - "learning_rate": 1.5554013190707214e-05, - "loss": 2.333, - "step": 395050 - }, - { - "epoch": 0.69, - "learning_rate": 1.5553141250780388e-05, - "loss": 2.3083, - "step": 395060 - }, - { - "epoch": 0.69, - "learning_rate": 1.555226931085356e-05, - "loss": 2.2561, - "step": 395070 - }, - { - "epoch": 0.69, - "learning_rate": 1.5551397370926736e-05, - "loss": 2.351, - "step": 395080 - }, - { - "epoch": 0.69, - "learning_rate": 1.5550525430999906e-05, - "loss": 2.3132, - "step": 395090 - }, - { - "epoch": 0.69, - "learning_rate": 1.554965349107308e-05, - "loss": 2.2365, - "step": 395100 - }, - { - "epoch": 0.69, - "learning_rate": 1.5548781551146254e-05, - "loss": 2.28, - "step": 395110 - }, - { - "epoch": 0.69, - "learning_rate": 1.5547909611219427e-05, - "loss": 2.2771, - "step": 395120 - }, - { - "epoch": 0.69, - "learning_rate": 1.55470376712926e-05, - "loss": 2.3436, - "step": 395130 - }, - { - "epoch": 0.69, - "learning_rate": 1.554616573136577e-05, - "loss": 2.2564, - "step": 395140 - }, - { - "epoch": 0.69, - "learning_rate": 1.5545293791438945e-05, - "loss": 2.2285, - "step": 395150 - }, - { - "epoch": 0.69, - "learning_rate": 1.554442185151212e-05, - "loss": 2.3812, - "step": 395160 - }, - { - "epoch": 0.69, - "learning_rate": 1.5543549911585293e-05, - "loss": 2.3396, - "step": 395170 - }, - { - "epoch": 0.69, - "learning_rate": 1.5542677971658463e-05, - "loss": 2.4031, - "step": 395180 - }, - { - "epoch": 0.69, - "learning_rate": 1.5541806031731637e-05, - "loss": 2.3025, - "step": 395190 - }, - { - "epoch": 0.69, - "learning_rate": 1.554093409180481e-05, - "loss": 2.2801, - "step": 395200 - }, - { - "epoch": 0.69, - "learning_rate": 1.5540062151877984e-05, - "loss": 2.2484, - "step": 395210 - }, - { - "epoch": 0.69, - "learning_rate": 1.5539190211951158e-05, - "loss": 2.2389, - "step": 395220 - }, - { - "epoch": 0.69, - "learning_rate": 1.5538318272024332e-05, - "loss": 2.2409, - "step": 395230 - }, - { - "epoch": 0.69, - "learning_rate": 1.5537446332097506e-05, - "loss": 2.1979, - "step": 395240 - }, - { - "epoch": 0.69, - "learning_rate": 1.5536574392170676e-05, - "loss": 2.278, - "step": 395250 - }, - { - "epoch": 0.69, - "learning_rate": 1.553570245224385e-05, - "loss": 2.3018, - "step": 395260 - }, - { - "epoch": 0.69, - "learning_rate": 1.5534830512317024e-05, - "loss": 2.3161, - "step": 395270 - }, - { - "epoch": 0.69, - "learning_rate": 1.5533958572390197e-05, - "loss": 2.3074, - "step": 395280 - }, - { - "epoch": 0.69, - "learning_rate": 1.553308663246337e-05, - "loss": 2.3141, - "step": 395290 - }, - { - "epoch": 0.69, - "learning_rate": 1.553221469253654e-05, - "loss": 2.3614, - "step": 395300 - }, - { - "epoch": 0.69, - "learning_rate": 1.553134275260972e-05, - "loss": 2.289, - "step": 395310 - }, - { - "epoch": 0.69, - "learning_rate": 1.553047081268289e-05, - "loss": 2.301, - "step": 395320 - }, - { - "epoch": 0.69, - "learning_rate": 1.5529598872756063e-05, - "loss": 2.3211, - "step": 395330 - }, - { - "epoch": 0.69, - "learning_rate": 1.5528726932829237e-05, - "loss": 2.3457, - "step": 395340 - }, - { - "epoch": 0.69, - "learning_rate": 1.552785499290241e-05, - "loss": 2.3753, - "step": 395350 - }, - { - "epoch": 0.69, - "learning_rate": 1.5526983052975584e-05, - "loss": 2.3055, - "step": 395360 - }, - { - "epoch": 0.69, - "learning_rate": 1.5526111113048755e-05, - "loss": 2.3308, - "step": 395370 - }, - { - "epoch": 0.69, - "learning_rate": 1.5525239173121932e-05, - "loss": 2.4514, - "step": 395380 - }, - { - "epoch": 0.69, - "learning_rate": 1.5524367233195102e-05, - "loss": 2.369, - "step": 395390 - }, - { - "epoch": 0.69, - "learning_rate": 1.5523495293268276e-05, - "loss": 2.3788, - "step": 395400 - }, - { - "epoch": 0.69, - "learning_rate": 1.5522623353341446e-05, - "loss": 2.3803, - "step": 395410 - }, - { - "epoch": 0.69, - "learning_rate": 1.5521751413414623e-05, - "loss": 2.2862, - "step": 395420 - }, - { - "epoch": 0.69, - "learning_rate": 1.5520879473487794e-05, - "loss": 2.2683, - "step": 395430 - }, - { - "epoch": 0.69, - "learning_rate": 1.5520007533560968e-05, - "loss": 2.3677, - "step": 395440 - }, - { - "epoch": 0.69, - "learning_rate": 1.551913559363414e-05, - "loss": 2.2608, - "step": 395450 - }, - { - "epoch": 0.69, - "learning_rate": 1.5518263653707315e-05, - "loss": 2.1581, - "step": 395460 - }, - { - "epoch": 0.69, - "learning_rate": 1.551739171378049e-05, - "loss": 2.3565, - "step": 395470 - }, - { - "epoch": 0.69, - "learning_rate": 1.551651977385366e-05, - "loss": 2.3942, - "step": 395480 - }, - { - "epoch": 0.69, - "learning_rate": 1.5515647833926836e-05, - "loss": 2.3058, - "step": 395490 - }, - { - "epoch": 0.69, - "learning_rate": 1.5514775894000007e-05, - "loss": 2.3014, - "step": 395500 - }, - { - "epoch": 0.69, - "learning_rate": 1.551390395407318e-05, - "loss": 2.2742, - "step": 395510 - }, - { - "epoch": 0.69, - "learning_rate": 1.5513032014146354e-05, - "loss": 2.2299, - "step": 395520 - }, - { - "epoch": 0.69, - "learning_rate": 1.5512160074219528e-05, - "loss": 2.305, - "step": 395530 - }, - { - "epoch": 0.69, - "learning_rate": 1.5511288134292702e-05, - "loss": 2.3825, - "step": 395540 - }, - { - "epoch": 0.69, - "learning_rate": 1.5510416194365872e-05, - "loss": 2.4033, - "step": 395550 - }, - { - "epoch": 0.69, - "learning_rate": 1.5509544254439046e-05, - "loss": 2.3164, - "step": 395560 - }, - { - "epoch": 0.69, - "learning_rate": 1.550867231451222e-05, - "loss": 2.3531, - "step": 395570 - }, - { - "epoch": 0.69, - "learning_rate": 1.5507800374585394e-05, - "loss": 2.2184, - "step": 395580 - }, - { - "epoch": 0.69, - "learning_rate": 1.5506928434658567e-05, - "loss": 2.3198, - "step": 395590 - }, - { - "epoch": 0.69, - "learning_rate": 1.550605649473174e-05, - "loss": 2.3531, - "step": 395600 - }, - { - "epoch": 0.69, - "learning_rate": 1.5505184554804915e-05, - "loss": 2.3231, - "step": 395610 - }, - { - "epoch": 0.69, - "learning_rate": 1.5504312614878085e-05, - "loss": 2.2097, - "step": 395620 - }, - { - "epoch": 0.69, - "learning_rate": 1.550344067495126e-05, - "loss": 2.2134, - "step": 395630 - }, - { - "epoch": 0.69, - "learning_rate": 1.5502568735024433e-05, - "loss": 2.3955, - "step": 395640 - }, - { - "epoch": 0.69, - "learning_rate": 1.5501696795097607e-05, - "loss": 2.2632, - "step": 395650 - }, - { - "epoch": 0.69, - "learning_rate": 1.5500824855170777e-05, - "loss": 2.2248, - "step": 395660 - }, - { - "epoch": 0.69, - "learning_rate": 1.549995291524395e-05, - "loss": 2.3556, - "step": 395670 - }, - { - "epoch": 0.69, - "learning_rate": 1.5499080975317125e-05, - "loss": 2.2602, - "step": 395680 - }, - { - "epoch": 0.69, - "learning_rate": 1.54982090353903e-05, - "loss": 2.2735, - "step": 395690 - }, - { - "epoch": 0.69, - "learning_rate": 1.5497337095463472e-05, - "loss": 2.32, - "step": 395700 - }, - { - "epoch": 0.69, - "learning_rate": 1.5496465155536642e-05, - "loss": 2.2308, - "step": 395710 - }, - { - "epoch": 0.69, - "learning_rate": 1.549559321560982e-05, - "loss": 2.2699, - "step": 395720 - }, - { - "epoch": 0.69, - "learning_rate": 1.549472127568299e-05, - "loss": 2.3635, - "step": 395730 - }, - { - "epoch": 0.69, - "learning_rate": 1.5493849335756164e-05, - "loss": 2.3517, - "step": 395740 - }, - { - "epoch": 0.69, - "learning_rate": 1.5492977395829338e-05, - "loss": 2.3426, - "step": 395750 - }, - { - "epoch": 0.69, - "learning_rate": 1.549210545590251e-05, - "loss": 2.28, - "step": 395760 - }, - { - "epoch": 0.69, - "learning_rate": 1.5491233515975685e-05, - "loss": 2.4201, - "step": 395770 - }, - { - "epoch": 0.69, - "learning_rate": 1.5490361576048855e-05, - "loss": 2.2772, - "step": 395780 - }, - { - "epoch": 0.69, - "learning_rate": 1.5489489636122033e-05, - "loss": 2.4159, - "step": 395790 - }, - { - "epoch": 0.69, - "learning_rate": 1.5488617696195203e-05, - "loss": 2.3472, - "step": 395800 - }, - { - "epoch": 0.69, - "learning_rate": 1.5487745756268377e-05, - "loss": 2.2485, - "step": 395810 - }, - { - "epoch": 0.69, - "learning_rate": 1.5486873816341547e-05, - "loss": 2.2883, - "step": 395820 - }, - { - "epoch": 0.69, - "learning_rate": 1.5486001876414724e-05, - "loss": 2.3535, - "step": 395830 - }, - { - "epoch": 0.69, - "learning_rate": 1.5485129936487898e-05, - "loss": 2.2573, - "step": 395840 - }, - { - "epoch": 0.69, - "learning_rate": 1.548425799656107e-05, - "loss": 2.2468, - "step": 395850 - }, - { - "epoch": 0.69, - "learning_rate": 1.5483386056634246e-05, - "loss": 2.3805, - "step": 395860 - }, - { - "epoch": 0.69, - "learning_rate": 1.5482514116707416e-05, - "loss": 2.1986, - "step": 395870 - }, - { - "epoch": 0.69, - "learning_rate": 1.548164217678059e-05, - "loss": 2.3739, - "step": 395880 - }, - { - "epoch": 0.69, - "learning_rate": 1.548077023685376e-05, - "loss": 2.262, - "step": 395890 - }, - { - "epoch": 0.69, - "learning_rate": 1.5479898296926937e-05, - "loss": 2.3751, - "step": 395900 - }, - { - "epoch": 0.69, - "learning_rate": 1.5479026357000108e-05, - "loss": 2.3785, - "step": 395910 - }, - { - "epoch": 0.69, - "learning_rate": 1.547815441707328e-05, - "loss": 2.3951, - "step": 395920 - }, - { - "epoch": 0.69, - "learning_rate": 1.5477282477146455e-05, - "loss": 2.3301, - "step": 395930 - }, - { - "epoch": 0.69, - "learning_rate": 1.547641053721963e-05, - "loss": 2.2652, - "step": 395940 - }, - { - "epoch": 0.69, - "learning_rate": 1.5475538597292803e-05, - "loss": 2.2359, - "step": 395950 - }, - { - "epoch": 0.69, - "learning_rate": 1.5474666657365973e-05, - "loss": 2.4125, - "step": 395960 - }, - { - "epoch": 0.69, - "learning_rate": 1.5473794717439147e-05, - "loss": 2.2798, - "step": 395970 - }, - { - "epoch": 0.69, - "learning_rate": 1.547292277751232e-05, - "loss": 2.3076, - "step": 395980 - }, - { - "epoch": 0.69, - "learning_rate": 1.5472050837585495e-05, - "loss": 2.2653, - "step": 395990 - }, - { - "epoch": 0.69, - "learning_rate": 1.5471178897658668e-05, - "loss": 2.277, - "step": 396000 - }, - { - "epoch": 0.69, - "learning_rate": 1.5470306957731842e-05, - "loss": 2.3755, - "step": 396010 - }, - { - "epoch": 0.69, - "learning_rate": 1.5469435017805016e-05, - "loss": 2.2765, - "step": 396020 - }, - { - "epoch": 0.69, - "learning_rate": 1.5468563077878186e-05, - "loss": 2.3161, - "step": 396030 - }, - { - "epoch": 0.69, - "learning_rate": 1.546769113795136e-05, - "loss": 2.4009, - "step": 396040 - }, - { - "epoch": 0.69, - "learning_rate": 1.5466819198024534e-05, - "loss": 2.2029, - "step": 396050 - }, - { - "epoch": 0.69, - "learning_rate": 1.5465947258097708e-05, - "loss": 2.3889, - "step": 396060 - }, - { - "epoch": 0.69, - "learning_rate": 1.546507531817088e-05, - "loss": 2.3063, - "step": 396070 - }, - { - "epoch": 0.69, - "learning_rate": 1.546420337824405e-05, - "loss": 2.2994, - "step": 396080 - }, - { - "epoch": 0.69, - "learning_rate": 1.546333143831723e-05, - "loss": 2.2075, - "step": 396090 - }, - { - "epoch": 0.69, - "learning_rate": 1.54624594983904e-05, - "loss": 2.3803, - "step": 396100 - }, - { - "epoch": 0.69, - "learning_rate": 1.5461587558463573e-05, - "loss": 2.3699, - "step": 396110 - }, - { - "epoch": 0.69, - "learning_rate": 1.5460715618536743e-05, - "loss": 2.2639, - "step": 396120 - }, - { - "epoch": 0.69, - "learning_rate": 1.545984367860992e-05, - "loss": 2.1862, - "step": 396130 - }, - { - "epoch": 0.69, - "learning_rate": 1.545897173868309e-05, - "loss": 2.2633, - "step": 396140 - }, - { - "epoch": 0.69, - "learning_rate": 1.5458099798756265e-05, - "loss": 2.3473, - "step": 396150 - }, - { - "epoch": 0.69, - "learning_rate": 1.545722785882944e-05, - "loss": 2.3035, - "step": 396160 - }, - { - "epoch": 0.69, - "learning_rate": 1.5456355918902612e-05, - "loss": 2.4039, - "step": 396170 - }, - { - "epoch": 0.69, - "learning_rate": 1.5455483978975786e-05, - "loss": 2.2843, - "step": 396180 - }, - { - "epoch": 0.69, - "learning_rate": 1.5454612039048956e-05, - "loss": 2.3618, - "step": 396190 - }, - { - "epoch": 0.69, - "learning_rate": 1.5453740099122134e-05, - "loss": 2.3015, - "step": 396200 - }, - { - "epoch": 0.69, - "learning_rate": 1.5452868159195304e-05, - "loss": 2.3223, - "step": 396210 - }, - { - "epoch": 0.69, - "learning_rate": 1.5451996219268478e-05, - "loss": 2.3696, - "step": 396220 - }, - { - "epoch": 0.69, - "learning_rate": 1.545112427934165e-05, - "loss": 2.1819, - "step": 396230 - }, - { - "epoch": 0.69, - "learning_rate": 1.5450252339414825e-05, - "loss": 2.3864, - "step": 396240 - }, - { - "epoch": 0.69, - "learning_rate": 1.5449380399488e-05, - "loss": 2.2728, - "step": 396250 - }, - { - "epoch": 0.69, - "learning_rate": 1.544850845956117e-05, - "loss": 2.1907, - "step": 396260 - }, - { - "epoch": 0.69, - "learning_rate": 1.5447636519634347e-05, - "loss": 2.2569, - "step": 396270 - }, - { - "epoch": 0.69, - "learning_rate": 1.5446764579707517e-05, - "loss": 2.1923, - "step": 396280 - }, - { - "epoch": 0.69, - "learning_rate": 1.544589263978069e-05, - "loss": 2.2929, - "step": 396290 - }, - { - "epoch": 0.69, - "learning_rate": 1.544502069985386e-05, - "loss": 2.2554, - "step": 396300 - }, - { - "epoch": 0.69, - "learning_rate": 1.5444148759927038e-05, - "loss": 2.4119, - "step": 396310 - }, - { - "epoch": 0.69, - "learning_rate": 1.5443276820000212e-05, - "loss": 2.312, - "step": 396320 - }, - { - "epoch": 0.69, - "learning_rate": 1.5442404880073382e-05, - "loss": 2.2583, - "step": 396330 - }, - { - "epoch": 0.69, - "learning_rate": 1.5441532940146556e-05, - "loss": 2.3277, - "step": 396340 - }, - { - "epoch": 0.69, - "learning_rate": 1.544066100021973e-05, - "loss": 2.3189, - "step": 396350 - }, - { - "epoch": 0.69, - "learning_rate": 1.5439789060292904e-05, - "loss": 2.3145, - "step": 396360 - }, - { - "epoch": 0.69, - "learning_rate": 1.5438917120366074e-05, - "loss": 2.4206, - "step": 396370 - }, - { - "epoch": 0.69, - "learning_rate": 1.5438045180439248e-05, - "loss": 2.2821, - "step": 396380 - }, - { - "epoch": 0.69, - "learning_rate": 1.543717324051242e-05, - "loss": 2.4179, - "step": 396390 - }, - { - "epoch": 0.69, - "learning_rate": 1.5436301300585595e-05, - "loss": 2.2795, - "step": 396400 - }, - { - "epoch": 0.69, - "learning_rate": 1.543542936065877e-05, - "loss": 2.2551, - "step": 396410 - }, - { - "epoch": 0.69, - "learning_rate": 1.5434557420731943e-05, - "loss": 2.2993, - "step": 396420 - }, - { - "epoch": 0.69, - "learning_rate": 1.5433685480805117e-05, - "loss": 2.2638, - "step": 396430 - }, - { - "epoch": 0.69, - "learning_rate": 1.5432813540878287e-05, - "loss": 2.4121, - "step": 396440 - }, - { - "epoch": 0.69, - "learning_rate": 1.543194160095146e-05, - "loss": 2.4194, - "step": 396450 - }, - { - "epoch": 0.69, - "learning_rate": 1.5431069661024635e-05, - "loss": 2.2919, - "step": 396460 - }, - { - "epoch": 0.69, - "learning_rate": 1.543019772109781e-05, - "loss": 2.2703, - "step": 396470 - }, - { - "epoch": 0.69, - "learning_rate": 1.5429325781170982e-05, - "loss": 2.3149, - "step": 396480 - }, - { - "epoch": 0.69, - "learning_rate": 1.5428453841244153e-05, - "loss": 2.3277, - "step": 396490 - }, - { - "epoch": 0.69, - "learning_rate": 1.542758190131733e-05, - "loss": 2.446, - "step": 396500 - }, - { - "epoch": 0.69, - "learning_rate": 1.54267099613905e-05, - "loss": 2.3854, - "step": 396510 - }, - { - "epoch": 0.69, - "learning_rate": 1.5425838021463674e-05, - "loss": 2.2283, - "step": 396520 - }, - { - "epoch": 0.69, - "learning_rate": 1.5424966081536848e-05, - "loss": 2.2674, - "step": 396530 - }, - { - "epoch": 0.69, - "learning_rate": 1.542409414161002e-05, - "loss": 2.379, - "step": 396540 - }, - { - "epoch": 0.69, - "learning_rate": 1.5423222201683192e-05, - "loss": 2.3307, - "step": 396550 - }, - { - "epoch": 0.69, - "learning_rate": 1.5422350261756366e-05, - "loss": 2.2013, - "step": 396560 - }, - { - "epoch": 0.69, - "learning_rate": 1.5421478321829543e-05, - "loss": 2.4225, - "step": 396570 - }, - { - "epoch": 0.69, - "learning_rate": 1.5420606381902713e-05, - "loss": 2.3182, - "step": 396580 - }, - { - "epoch": 0.69, - "learning_rate": 1.5419734441975887e-05, - "loss": 2.2513, - "step": 396590 - }, - { - "epoch": 0.69, - "learning_rate": 1.5418862502049057e-05, - "loss": 2.3567, - "step": 396600 - }, - { - "epoch": 0.69, - "learning_rate": 1.5417990562122234e-05, - "loss": 2.1942, - "step": 396610 - }, - { - "epoch": 0.69, - "learning_rate": 1.5417118622195405e-05, - "loss": 2.3136, - "step": 396620 - }, - { - "epoch": 0.69, - "learning_rate": 1.541624668226858e-05, - "loss": 2.2089, - "step": 396630 - }, - { - "epoch": 0.69, - "learning_rate": 1.5415374742341752e-05, - "loss": 2.3091, - "step": 396640 - }, - { - "epoch": 0.69, - "learning_rate": 1.5414502802414926e-05, - "loss": 2.2761, - "step": 396650 - }, - { - "epoch": 0.69, - "learning_rate": 1.54136308624881e-05, - "loss": 2.2758, - "step": 396660 - }, - { - "epoch": 0.69, - "learning_rate": 1.541275892256127e-05, - "loss": 2.2872, - "step": 396670 - }, - { - "epoch": 0.69, - "learning_rate": 1.5411886982634447e-05, - "loss": 2.3283, - "step": 396680 - }, - { - "epoch": 0.69, - "learning_rate": 1.5411015042707618e-05, - "loss": 2.3407, - "step": 396690 - }, - { - "epoch": 0.69, - "learning_rate": 1.541014310278079e-05, - "loss": 2.175, - "step": 396700 - }, - { - "epoch": 0.69, - "learning_rate": 1.5409271162853965e-05, - "loss": 2.4709, - "step": 396710 - }, - { - "epoch": 0.69, - "learning_rate": 1.540839922292714e-05, - "loss": 2.3246, - "step": 396720 - }, - { - "epoch": 0.69, - "learning_rate": 1.5407527283000313e-05, - "loss": 2.3841, - "step": 396730 - }, - { - "epoch": 0.69, - "learning_rate": 1.5406655343073483e-05, - "loss": 2.2988, - "step": 396740 - }, - { - "epoch": 0.69, - "learning_rate": 1.5405783403146657e-05, - "loss": 2.3253, - "step": 396750 - }, - { - "epoch": 0.69, - "learning_rate": 1.540491146321983e-05, - "loss": 2.2669, - "step": 396760 - }, - { - "epoch": 0.69, - "learning_rate": 1.5404039523293005e-05, - "loss": 2.1275, - "step": 396770 - }, - { - "epoch": 0.69, - "learning_rate": 1.5403167583366175e-05, - "loss": 2.2495, - "step": 396780 - }, - { - "epoch": 0.69, - "learning_rate": 1.5402295643439352e-05, - "loss": 2.3549, - "step": 396790 - }, - { - "epoch": 0.69, - "learning_rate": 1.5401423703512526e-05, - "loss": 2.3201, - "step": 396800 - }, - { - "epoch": 0.69, - "learning_rate": 1.5400551763585696e-05, - "loss": 2.3674, - "step": 396810 - }, - { - "epoch": 0.69, - "learning_rate": 1.539967982365887e-05, - "loss": 2.2574, - "step": 396820 - }, - { - "epoch": 0.69, - "learning_rate": 1.5398807883732044e-05, - "loss": 2.2853, - "step": 396830 - }, - { - "epoch": 0.69, - "learning_rate": 1.5397935943805218e-05, - "loss": 2.3814, - "step": 396840 - }, - { - "epoch": 0.69, - "learning_rate": 1.5397064003878388e-05, - "loss": 2.3429, - "step": 396850 - }, - { - "epoch": 0.69, - "learning_rate": 1.539619206395156e-05, - "loss": 2.329, - "step": 396860 - }, - { - "epoch": 0.69, - "learning_rate": 1.5395320124024735e-05, - "loss": 2.4073, - "step": 396870 - }, - { - "epoch": 0.69, - "learning_rate": 1.539444818409791e-05, - "loss": 2.2175, - "step": 396880 - }, - { - "epoch": 0.69, - "learning_rate": 1.5393576244171083e-05, - "loss": 2.2429, - "step": 396890 - }, - { - "epoch": 0.69, - "learning_rate": 1.5392704304244253e-05, - "loss": 2.3169, - "step": 396900 - }, - { - "epoch": 0.69, - "learning_rate": 1.539183236431743e-05, - "loss": 2.3209, - "step": 396910 - }, - { - "epoch": 0.69, - "learning_rate": 1.53909604243906e-05, - "loss": 2.3308, - "step": 396920 - }, - { - "epoch": 0.69, - "learning_rate": 1.5390088484463775e-05, - "loss": 2.2785, - "step": 396930 - }, - { - "epoch": 0.69, - "learning_rate": 1.538921654453695e-05, - "loss": 2.3832, - "step": 396940 - }, - { - "epoch": 0.69, - "learning_rate": 1.5388344604610122e-05, - "loss": 2.4079, - "step": 396950 - }, - { - "epoch": 0.69, - "learning_rate": 1.5387472664683296e-05, - "loss": 2.3713, - "step": 396960 - }, - { - "epoch": 0.69, - "learning_rate": 1.5386600724756466e-05, - "loss": 2.2909, - "step": 396970 - }, - { - "epoch": 0.69, - "learning_rate": 1.5385728784829644e-05, - "loss": 2.2836, - "step": 396980 - }, - { - "epoch": 0.69, - "learning_rate": 1.5384856844902814e-05, - "loss": 2.2994, - "step": 396990 - }, - { - "epoch": 0.69, - "learning_rate": 1.5383984904975988e-05, - "loss": 2.2853, - "step": 397000 - }, - { - "epoch": 0.69, - "learning_rate": 1.5383112965049158e-05, - "loss": 2.2705, - "step": 397010 - }, - { - "epoch": 0.69, - "learning_rate": 1.5382241025122335e-05, - "loss": 2.3626, - "step": 397020 - }, - { - "epoch": 0.69, - "learning_rate": 1.5381369085195506e-05, - "loss": 2.3657, - "step": 397030 - }, - { - "epoch": 0.69, - "learning_rate": 1.538049714526868e-05, - "loss": 2.2865, - "step": 397040 - }, - { - "epoch": 0.69, - "learning_rate": 1.5379625205341853e-05, - "loss": 2.3215, - "step": 397050 - }, - { - "epoch": 0.69, - "learning_rate": 1.5378753265415027e-05, - "loss": 2.2779, - "step": 397060 - }, - { - "epoch": 0.69, - "learning_rate": 1.53778813254882e-05, - "loss": 2.318, - "step": 397070 - }, - { - "epoch": 0.69, - "learning_rate": 1.537700938556137e-05, - "loss": 2.2654, - "step": 397080 - }, - { - "epoch": 0.69, - "learning_rate": 1.5376137445634548e-05, - "loss": 2.3914, - "step": 397090 - }, - { - "epoch": 0.69, - "learning_rate": 1.537526550570772e-05, - "loss": 2.2859, - "step": 397100 - }, - { - "epoch": 0.69, - "learning_rate": 1.5374393565780892e-05, - "loss": 2.2715, - "step": 397110 - }, - { - "epoch": 0.69, - "learning_rate": 1.5373521625854066e-05, - "loss": 2.2473, - "step": 397120 - }, - { - "epoch": 0.69, - "learning_rate": 1.537264968592724e-05, - "loss": 2.2281, - "step": 397130 - }, - { - "epoch": 0.69, - "learning_rate": 1.5371777746000414e-05, - "loss": 2.286, - "step": 397140 - }, - { - "epoch": 0.69, - "learning_rate": 1.5370905806073584e-05, - "loss": 2.4335, - "step": 397150 - }, - { - "epoch": 0.69, - "learning_rate": 1.5370033866146758e-05, - "loss": 2.2875, - "step": 397160 - }, - { - "epoch": 0.69, - "learning_rate": 1.536916192621993e-05, - "loss": 2.3389, - "step": 397170 - }, - { - "epoch": 0.69, - "learning_rate": 1.5368289986293105e-05, - "loss": 2.3979, - "step": 397180 - }, - { - "epoch": 0.69, - "learning_rate": 1.536741804636628e-05, - "loss": 2.34, - "step": 397190 - }, - { - "epoch": 0.69, - "learning_rate": 1.5366546106439453e-05, - "loss": 2.2795, - "step": 397200 - }, - { - "epoch": 0.69, - "learning_rate": 1.5365674166512627e-05, - "loss": 2.3282, - "step": 397210 - }, - { - "epoch": 0.69, - "learning_rate": 1.5364802226585797e-05, - "loss": 2.3454, - "step": 397220 - }, - { - "epoch": 0.69, - "learning_rate": 1.536393028665897e-05, - "loss": 2.252, - "step": 397230 - }, - { - "epoch": 0.69, - "learning_rate": 1.5363058346732145e-05, - "loss": 2.2852, - "step": 397240 - }, - { - "epoch": 0.69, - "learning_rate": 1.536218640680532e-05, - "loss": 2.362, - "step": 397250 - }, - { - "epoch": 0.69, - "learning_rate": 1.536131446687849e-05, - "loss": 2.2083, - "step": 397260 - }, - { - "epoch": 0.69, - "learning_rate": 1.5360442526951663e-05, - "loss": 2.2981, - "step": 397270 - }, - { - "epoch": 0.69, - "learning_rate": 1.535957058702484e-05, - "loss": 2.3123, - "step": 397280 - }, - { - "epoch": 0.69, - "learning_rate": 1.535869864709801e-05, - "loss": 2.314, - "step": 397290 - }, - { - "epoch": 0.69, - "learning_rate": 1.5357826707171184e-05, - "loss": 2.304, - "step": 397300 - }, - { - "epoch": 0.69, - "learning_rate": 1.5356954767244354e-05, - "loss": 2.2802, - "step": 397310 - }, - { - "epoch": 0.69, - "learning_rate": 1.535608282731753e-05, - "loss": 2.2816, - "step": 397320 - }, - { - "epoch": 0.69, - "learning_rate": 1.5355210887390702e-05, - "loss": 2.2673, - "step": 397330 - }, - { - "epoch": 0.69, - "learning_rate": 1.5354338947463876e-05, - "loss": 2.2474, - "step": 397340 - }, - { - "epoch": 0.69, - "learning_rate": 1.535346700753705e-05, - "loss": 2.4621, - "step": 397350 - }, - { - "epoch": 0.69, - "learning_rate": 1.5352595067610223e-05, - "loss": 2.3762, - "step": 397360 - }, - { - "epoch": 0.69, - "learning_rate": 1.5351723127683397e-05, - "loss": 2.2136, - "step": 397370 - }, - { - "epoch": 0.69, - "learning_rate": 1.5350851187756567e-05, - "loss": 2.3029, - "step": 397380 - }, - { - "epoch": 0.69, - "learning_rate": 1.5349979247829744e-05, - "loss": 2.3313, - "step": 397390 - }, - { - "epoch": 0.69, - "learning_rate": 1.5349107307902915e-05, - "loss": 2.2845, - "step": 397400 - }, - { - "epoch": 0.69, - "learning_rate": 1.534823536797609e-05, - "loss": 2.3748, - "step": 397410 - }, - { - "epoch": 0.69, - "learning_rate": 1.5347363428049262e-05, - "loss": 2.3053, - "step": 397420 - }, - { - "epoch": 0.69, - "learning_rate": 1.5346491488122436e-05, - "loss": 2.3873, - "step": 397430 - }, - { - "epoch": 0.69, - "learning_rate": 1.534561954819561e-05, - "loss": 2.2546, - "step": 397440 - }, - { - "epoch": 0.69, - "learning_rate": 1.534474760826878e-05, - "loss": 2.4081, - "step": 397450 - }, - { - "epoch": 0.69, - "learning_rate": 1.5343875668341957e-05, - "loss": 2.3718, - "step": 397460 - }, - { - "epoch": 0.69, - "learning_rate": 1.5343003728415128e-05, - "loss": 2.4268, - "step": 397470 - }, - { - "epoch": 0.69, - "learning_rate": 1.53421317884883e-05, - "loss": 2.356, - "step": 397480 - }, - { - "epoch": 0.69, - "learning_rate": 1.5341259848561472e-05, - "loss": 2.4205, - "step": 397490 - }, - { - "epoch": 0.69, - "learning_rate": 1.534038790863465e-05, - "loss": 2.2566, - "step": 397500 - }, - { - "epoch": 0.69, - "learning_rate": 1.533951596870782e-05, - "loss": 2.3289, - "step": 397510 - }, - { - "epoch": 0.69, - "learning_rate": 1.5338644028780993e-05, - "loss": 2.2578, - "step": 397520 - }, - { - "epoch": 0.69, - "learning_rate": 1.5337772088854167e-05, - "loss": 2.3334, - "step": 397530 - }, - { - "epoch": 0.69, - "learning_rate": 1.533690014892734e-05, - "loss": 2.3298, - "step": 397540 - }, - { - "epoch": 0.69, - "learning_rate": 1.5336028209000515e-05, - "loss": 2.141, - "step": 397550 - }, - { - "epoch": 0.69, - "learning_rate": 1.5335156269073685e-05, - "loss": 2.2419, - "step": 397560 - }, - { - "epoch": 0.69, - "learning_rate": 1.533428432914686e-05, - "loss": 2.2974, - "step": 397570 - }, - { - "epoch": 0.69, - "learning_rate": 1.5333412389220032e-05, - "loss": 2.3032, - "step": 397580 - }, - { - "epoch": 0.69, - "learning_rate": 1.5332540449293206e-05, - "loss": 2.3134, - "step": 397590 - }, - { - "epoch": 0.69, - "learning_rate": 1.533166850936638e-05, - "loss": 2.3651, - "step": 397600 - }, - { - "epoch": 0.69, - "learning_rate": 1.5330796569439554e-05, - "loss": 2.3105, - "step": 397610 - }, - { - "epoch": 0.69, - "learning_rate": 1.5329924629512728e-05, - "loss": 2.3277, - "step": 397620 - }, - { - "epoch": 0.69, - "learning_rate": 1.5329052689585898e-05, - "loss": 2.3321, - "step": 397630 - }, - { - "epoch": 0.69, - "learning_rate": 1.532818074965907e-05, - "loss": 2.2878, - "step": 397640 - }, - { - "epoch": 0.69, - "learning_rate": 1.5327308809732245e-05, - "loss": 2.2543, - "step": 397650 - }, - { - "epoch": 0.69, - "learning_rate": 1.532643686980542e-05, - "loss": 2.3129, - "step": 397660 - }, - { - "epoch": 0.69, - "learning_rate": 1.5325564929878593e-05, - "loss": 2.2757, - "step": 397670 - }, - { - "epoch": 0.69, - "learning_rate": 1.5324692989951763e-05, - "loss": 2.2983, - "step": 397680 - }, - { - "epoch": 0.69, - "learning_rate": 1.532382105002494e-05, - "loss": 2.2269, - "step": 397690 - }, - { - "epoch": 0.69, - "learning_rate": 1.532294911009811e-05, - "loss": 2.2703, - "step": 397700 - }, - { - "epoch": 0.69, - "learning_rate": 1.5322077170171285e-05, - "loss": 2.2738, - "step": 397710 - }, - { - "epoch": 0.69, - "learning_rate": 1.532120523024446e-05, - "loss": 2.2162, - "step": 397720 - }, - { - "epoch": 0.69, - "learning_rate": 1.5320333290317632e-05, - "loss": 2.3062, - "step": 397730 - }, - { - "epoch": 0.69, - "learning_rate": 1.5319461350390803e-05, - "loss": 2.4196, - "step": 397740 - }, - { - "epoch": 0.69, - "learning_rate": 1.5318589410463976e-05, - "loss": 2.4371, - "step": 397750 - }, - { - "epoch": 0.69, - "learning_rate": 1.531771747053715e-05, - "loss": 2.345, - "step": 397760 - }, - { - "epoch": 0.69, - "learning_rate": 1.5316845530610324e-05, - "loss": 2.3785, - "step": 397770 - }, - { - "epoch": 0.69, - "learning_rate": 1.5315973590683498e-05, - "loss": 2.3155, - "step": 397780 - }, - { - "epoch": 0.69, - "learning_rate": 1.5315101650756668e-05, - "loss": 2.2764, - "step": 397790 - }, - { - "epoch": 0.69, - "learning_rate": 1.5314229710829845e-05, - "loss": 2.3887, - "step": 397800 - }, - { - "epoch": 0.69, - "learning_rate": 1.5313357770903016e-05, - "loss": 2.3019, - "step": 397810 - }, - { - "epoch": 0.69, - "learning_rate": 1.531248583097619e-05, - "loss": 2.3632, - "step": 397820 - }, - { - "epoch": 0.69, - "learning_rate": 1.5311613891049363e-05, - "loss": 2.3322, - "step": 397830 - }, - { - "epoch": 0.69, - "learning_rate": 1.5310741951122537e-05, - "loss": 2.3158, - "step": 397840 - }, - { - "epoch": 0.69, - "learning_rate": 1.530987001119571e-05, - "loss": 2.2786, - "step": 397850 - }, - { - "epoch": 0.69, - "learning_rate": 1.530899807126888e-05, - "loss": 2.2971, - "step": 397860 - }, - { - "epoch": 0.69, - "learning_rate": 1.5308126131342058e-05, - "loss": 2.2399, - "step": 397870 - }, - { - "epoch": 0.69, - "learning_rate": 1.530725419141523e-05, - "loss": 2.2705, - "step": 397880 - }, - { - "epoch": 0.69, - "learning_rate": 1.5306382251488402e-05, - "loss": 2.2576, - "step": 397890 - }, - { - "epoch": 0.69, - "learning_rate": 1.5305510311561576e-05, - "loss": 2.321, - "step": 397900 - }, - { - "epoch": 0.69, - "learning_rate": 1.530463837163475e-05, - "loss": 2.2492, - "step": 397910 - }, - { - "epoch": 0.69, - "learning_rate": 1.5303766431707924e-05, - "loss": 2.3147, - "step": 397920 - }, - { - "epoch": 0.69, - "learning_rate": 1.5302894491781094e-05, - "loss": 2.2829, - "step": 397930 - }, - { - "epoch": 0.69, - "learning_rate": 1.5302022551854268e-05, - "loss": 2.2388, - "step": 397940 - }, - { - "epoch": 0.69, - "learning_rate": 1.530115061192744e-05, - "loss": 2.3234, - "step": 397950 - }, - { - "epoch": 0.69, - "learning_rate": 1.5300278672000615e-05, - "loss": 2.2323, - "step": 397960 - }, - { - "epoch": 0.69, - "learning_rate": 1.5299406732073786e-05, - "loss": 2.3307, - "step": 397970 - }, - { - "epoch": 0.69, - "learning_rate": 1.529853479214696e-05, - "loss": 2.2935, - "step": 397980 - }, - { - "epoch": 0.69, - "learning_rate": 1.5297662852220133e-05, - "loss": 2.2337, - "step": 397990 - }, - { - "epoch": 0.69, - "learning_rate": 1.5296790912293307e-05, - "loss": 2.3382, - "step": 398000 - }, - { - "epoch": 0.69, - "learning_rate": 1.529591897236648e-05, - "loss": 2.226, - "step": 398010 - }, - { - "epoch": 0.69, - "learning_rate": 1.5295047032439655e-05, - "loss": 2.1419, - "step": 398020 - }, - { - "epoch": 0.69, - "learning_rate": 1.529417509251283e-05, - "loss": 2.3141, - "step": 398030 - }, - { - "epoch": 0.69, - "learning_rate": 1.5293303152586e-05, - "loss": 2.3895, - "step": 398040 - }, - { - "epoch": 0.69, - "learning_rate": 1.5292431212659173e-05, - "loss": 2.3832, - "step": 398050 - }, - { - "epoch": 0.69, - "learning_rate": 1.5291559272732346e-05, - "loss": 2.4115, - "step": 398060 - }, - { - "epoch": 0.69, - "learning_rate": 1.529068733280552e-05, - "loss": 2.238, - "step": 398070 - }, - { - "epoch": 0.69, - "learning_rate": 1.5289815392878694e-05, - "loss": 2.4244, - "step": 398080 - }, - { - "epoch": 0.69, - "learning_rate": 1.5288943452951864e-05, - "loss": 2.435, - "step": 398090 - }, - { - "epoch": 0.69, - "learning_rate": 1.528807151302504e-05, - "loss": 2.3677, - "step": 398100 - }, - { - "epoch": 0.69, - "learning_rate": 1.5287199573098212e-05, - "loss": 2.415, - "step": 398110 - }, - { - "epoch": 0.69, - "learning_rate": 1.5286327633171386e-05, - "loss": 2.293, - "step": 398120 - }, - { - "epoch": 0.69, - "learning_rate": 1.528545569324456e-05, - "loss": 2.2891, - "step": 398130 - }, - { - "epoch": 0.69, - "learning_rate": 1.5284583753317733e-05, - "loss": 2.3227, - "step": 398140 - }, - { - "epoch": 0.69, - "learning_rate": 1.5283711813390907e-05, - "loss": 2.2517, - "step": 398150 - }, - { - "epoch": 0.69, - "learning_rate": 1.5282839873464077e-05, - "loss": 2.3309, - "step": 398160 - }, - { - "epoch": 0.69, - "learning_rate": 1.5281967933537254e-05, - "loss": 2.3424, - "step": 398170 - }, - { - "epoch": 0.69, - "learning_rate": 1.5281095993610425e-05, - "loss": 2.2622, - "step": 398180 - }, - { - "epoch": 0.69, - "learning_rate": 1.52802240536836e-05, - "loss": 2.3076, - "step": 398190 - }, - { - "epoch": 0.69, - "learning_rate": 1.527935211375677e-05, - "loss": 2.3092, - "step": 398200 - }, - { - "epoch": 0.69, - "learning_rate": 1.5278480173829946e-05, - "loss": 2.328, - "step": 398210 - }, - { - "epoch": 0.69, - "learning_rate": 1.5277608233903116e-05, - "loss": 2.2264, - "step": 398220 - }, - { - "epoch": 0.69, - "learning_rate": 1.527673629397629e-05, - "loss": 2.3936, - "step": 398230 - }, - { - "epoch": 0.69, - "learning_rate": 1.5275864354049464e-05, - "loss": 2.2692, - "step": 398240 - }, - { - "epoch": 0.69, - "learning_rate": 1.5274992414122638e-05, - "loss": 2.3768, - "step": 398250 - }, - { - "epoch": 0.69, - "learning_rate": 1.527412047419581e-05, - "loss": 2.2573, - "step": 398260 - }, - { - "epoch": 0.69, - "learning_rate": 1.5273248534268982e-05, - "loss": 2.4525, - "step": 398270 - }, - { - "epoch": 0.69, - "learning_rate": 1.527237659434216e-05, - "loss": 2.4224, - "step": 398280 - }, - { - "epoch": 0.69, - "learning_rate": 1.527150465441533e-05, - "loss": 2.2197, - "step": 398290 - }, - { - "epoch": 0.69, - "learning_rate": 1.5270632714488503e-05, - "loss": 2.3149, - "step": 398300 - }, - { - "epoch": 0.69, - "learning_rate": 1.5269760774561677e-05, - "loss": 2.1988, - "step": 398310 - }, - { - "epoch": 0.69, - "learning_rate": 1.526888883463485e-05, - "loss": 2.3999, - "step": 398320 - }, - { - "epoch": 0.69, - "learning_rate": 1.5268016894708025e-05, - "loss": 2.2879, - "step": 398330 - }, - { - "epoch": 0.69, - "learning_rate": 1.5267144954781195e-05, - "loss": 2.3095, - "step": 398340 - }, - { - "epoch": 0.69, - "learning_rate": 1.526627301485437e-05, - "loss": 2.29, - "step": 398350 - }, - { - "epoch": 0.69, - "learning_rate": 1.5265401074927542e-05, - "loss": 2.1799, - "step": 398360 - }, - { - "epoch": 0.69, - "learning_rate": 1.5264529135000716e-05, - "loss": 2.3708, - "step": 398370 - }, - { - "epoch": 0.69, - "learning_rate": 1.5263657195073887e-05, - "loss": 2.328, - "step": 398380 - }, - { - "epoch": 0.69, - "learning_rate": 1.5262785255147064e-05, - "loss": 2.2672, - "step": 398390 - }, - { - "epoch": 0.69, - "learning_rate": 1.5261913315220238e-05, - "loss": 2.2802, - "step": 398400 - }, - { - "epoch": 0.69, - "learning_rate": 1.5261041375293408e-05, - "loss": 2.3122, - "step": 398410 - }, - { - "epoch": 0.69, - "learning_rate": 1.526016943536658e-05, - "loss": 2.1281, - "step": 398420 - }, - { - "epoch": 0.69, - "learning_rate": 1.5259297495439755e-05, - "loss": 2.3292, - "step": 398430 - }, - { - "epoch": 0.69, - "learning_rate": 1.525842555551293e-05, - "loss": 2.3434, - "step": 398440 - }, - { - "epoch": 0.69, - "learning_rate": 1.5257553615586101e-05, - "loss": 2.2391, - "step": 398450 - }, - { - "epoch": 0.69, - "learning_rate": 1.5256681675659273e-05, - "loss": 2.2508, - "step": 398460 - }, - { - "epoch": 0.69, - "learning_rate": 1.5255809735732449e-05, - "loss": 2.3562, - "step": 398470 - }, - { - "epoch": 0.69, - "learning_rate": 1.5254937795805621e-05, - "loss": 2.3362, - "step": 398480 - }, - { - "epoch": 0.69, - "learning_rate": 1.5254065855878793e-05, - "loss": 2.2035, - "step": 398490 - }, - { - "epoch": 0.69, - "learning_rate": 1.5253193915951967e-05, - "loss": 2.4258, - "step": 398500 - }, - { - "epoch": 0.69, - "learning_rate": 1.525232197602514e-05, - "loss": 2.3688, - "step": 398510 - }, - { - "epoch": 0.69, - "learning_rate": 1.5251450036098314e-05, - "loss": 2.2958, - "step": 398520 - }, - { - "epoch": 0.69, - "learning_rate": 1.5250578096171486e-05, - "loss": 2.2612, - "step": 398530 - }, - { - "epoch": 0.7, - "learning_rate": 1.5249706156244662e-05, - "loss": 2.2705, - "step": 398540 - }, - { - "epoch": 0.7, - "learning_rate": 1.5248834216317834e-05, - "loss": 2.2602, - "step": 398550 - }, - { - "epoch": 0.7, - "learning_rate": 1.5247962276391006e-05, - "loss": 2.1693, - "step": 398560 - }, - { - "epoch": 0.7, - "learning_rate": 1.5247090336464178e-05, - "loss": 2.3598, - "step": 398570 - }, - { - "epoch": 0.7, - "learning_rate": 1.5246218396537354e-05, - "loss": 2.3635, - "step": 398580 - }, - { - "epoch": 0.7, - "learning_rate": 1.5245346456610526e-05, - "loss": 2.328, - "step": 398590 - }, - { - "epoch": 0.7, - "learning_rate": 1.52444745166837e-05, - "loss": 2.2707, - "step": 398600 - }, - { - "epoch": 0.7, - "learning_rate": 1.5243602576756871e-05, - "loss": 2.3478, - "step": 398610 - }, - { - "epoch": 0.7, - "learning_rate": 1.5242730636830047e-05, - "loss": 2.3767, - "step": 398620 - }, - { - "epoch": 0.7, - "learning_rate": 1.5241858696903219e-05, - "loss": 2.17, - "step": 398630 - }, - { - "epoch": 0.7, - "learning_rate": 1.5240986756976391e-05, - "loss": 2.2585, - "step": 398640 - }, - { - "epoch": 0.7, - "learning_rate": 1.5240114817049563e-05, - "loss": 2.2552, - "step": 398650 - }, - { - "epoch": 0.7, - "learning_rate": 1.5239242877122739e-05, - "loss": 2.304, - "step": 398660 - }, - { - "epoch": 0.7, - "learning_rate": 1.5238370937195912e-05, - "loss": 2.3271, - "step": 398670 - }, - { - "epoch": 0.7, - "learning_rate": 1.5237498997269084e-05, - "loss": 2.4087, - "step": 398680 - }, - { - "epoch": 0.7, - "learning_rate": 1.523662705734226e-05, - "loss": 2.2433, - "step": 398690 - }, - { - "epoch": 0.7, - "learning_rate": 1.5235755117415432e-05, - "loss": 2.3141, - "step": 398700 - }, - { - "epoch": 0.7, - "learning_rate": 1.5234883177488604e-05, - "loss": 2.3355, - "step": 398710 - }, - { - "epoch": 0.7, - "learning_rate": 1.5234011237561776e-05, - "loss": 2.3807, - "step": 398720 - }, - { - "epoch": 0.7, - "learning_rate": 1.5233139297634952e-05, - "loss": 2.2294, - "step": 398730 - }, - { - "epoch": 0.7, - "learning_rate": 1.5232267357708124e-05, - "loss": 2.1472, - "step": 398740 - }, - { - "epoch": 0.7, - "learning_rate": 1.5231395417781297e-05, - "loss": 2.2988, - "step": 398750 - }, - { - "epoch": 0.7, - "learning_rate": 1.523052347785447e-05, - "loss": 2.3928, - "step": 398760 - }, - { - "epoch": 0.7, - "learning_rate": 1.5229651537927645e-05, - "loss": 2.3178, - "step": 398770 - }, - { - "epoch": 0.7, - "learning_rate": 1.5228779598000817e-05, - "loss": 2.3277, - "step": 398780 - }, - { - "epoch": 0.7, - "learning_rate": 1.5227907658073989e-05, - "loss": 2.1567, - "step": 398790 - }, - { - "epoch": 0.7, - "learning_rate": 1.5227035718147165e-05, - "loss": 2.2519, - "step": 398800 - }, - { - "epoch": 0.7, - "learning_rate": 1.5226163778220337e-05, - "loss": 2.2675, - "step": 398810 - }, - { - "epoch": 0.7, - "learning_rate": 1.5225291838293509e-05, - "loss": 2.2054, - "step": 398820 - }, - { - "epoch": 0.7, - "learning_rate": 1.5224419898366683e-05, - "loss": 2.3419, - "step": 398830 - }, - { - "epoch": 0.7, - "learning_rate": 1.5223547958439858e-05, - "loss": 2.1841, - "step": 398840 - }, - { - "epoch": 0.7, - "learning_rate": 1.522267601851303e-05, - "loss": 2.2743, - "step": 398850 - }, - { - "epoch": 0.7, - "learning_rate": 1.5221804078586202e-05, - "loss": 2.3222, - "step": 398860 - }, - { - "epoch": 0.7, - "learning_rate": 1.5220932138659374e-05, - "loss": 2.2289, - "step": 398870 - }, - { - "epoch": 0.7, - "learning_rate": 1.522006019873255e-05, - "loss": 2.3902, - "step": 398880 - }, - { - "epoch": 0.7, - "learning_rate": 1.5219188258805722e-05, - "loss": 2.2041, - "step": 398890 - }, - { - "epoch": 0.7, - "learning_rate": 1.5218316318878894e-05, - "loss": 2.1734, - "step": 398900 - }, - { - "epoch": 0.7, - "learning_rate": 1.5217444378952068e-05, - "loss": 2.3725, - "step": 398910 - }, - { - "epoch": 0.7, - "learning_rate": 1.5216572439025243e-05, - "loss": 2.3601, - "step": 398920 - }, - { - "epoch": 0.7, - "learning_rate": 1.5215700499098415e-05, - "loss": 2.2902, - "step": 398930 - }, - { - "epoch": 0.7, - "learning_rate": 1.5214828559171587e-05, - "loss": 2.3189, - "step": 398940 - }, - { - "epoch": 0.7, - "learning_rate": 1.5213956619244763e-05, - "loss": 2.1762, - "step": 398950 - }, - { - "epoch": 0.7, - "learning_rate": 1.5213084679317935e-05, - "loss": 2.3245, - "step": 398960 - }, - { - "epoch": 0.7, - "learning_rate": 1.5212212739391107e-05, - "loss": 2.343, - "step": 398970 - }, - { - "epoch": 0.7, - "learning_rate": 1.521134079946428e-05, - "loss": 2.3868, - "step": 398980 - }, - { - "epoch": 0.7, - "learning_rate": 1.5210468859537454e-05, - "loss": 2.3304, - "step": 398990 - }, - { - "epoch": 0.7, - "learning_rate": 1.5209596919610628e-05, - "loss": 2.3113, - "step": 399000 - }, - { - "epoch": 0.7, - "learning_rate": 1.52087249796838e-05, - "loss": 2.0861, - "step": 399010 - }, - { - "epoch": 0.7, - "learning_rate": 1.5207853039756972e-05, - "loss": 2.2944, - "step": 399020 - }, - { - "epoch": 0.7, - "learning_rate": 1.5206981099830148e-05, - "loss": 2.4091, - "step": 399030 - }, - { - "epoch": 0.7, - "learning_rate": 1.520610915990332e-05, - "loss": 2.2496, - "step": 399040 - }, - { - "epoch": 0.7, - "learning_rate": 1.5205237219976492e-05, - "loss": 2.3181, - "step": 399050 - }, - { - "epoch": 0.7, - "learning_rate": 1.5204365280049667e-05, - "loss": 2.2907, - "step": 399060 - }, - { - "epoch": 0.7, - "learning_rate": 1.520349334012284e-05, - "loss": 2.2826, - "step": 399070 - }, - { - "epoch": 0.7, - "learning_rate": 1.5202621400196013e-05, - "loss": 2.2661, - "step": 399080 - }, - { - "epoch": 0.7, - "learning_rate": 1.5201749460269185e-05, - "loss": 2.2618, - "step": 399090 - }, - { - "epoch": 0.7, - "learning_rate": 1.520087752034236e-05, - "loss": 2.3369, - "step": 399100 - }, - { - "epoch": 0.7, - "learning_rate": 1.5200005580415533e-05, - "loss": 2.3886, - "step": 399110 - }, - { - "epoch": 0.7, - "learning_rate": 1.5199133640488705e-05, - "loss": 2.3669, - "step": 399120 - }, - { - "epoch": 0.7, - "learning_rate": 1.5198261700561877e-05, - "loss": 2.2292, - "step": 399130 - }, - { - "epoch": 0.7, - "learning_rate": 1.5197389760635052e-05, - "loss": 2.2915, - "step": 399140 - }, - { - "epoch": 0.7, - "learning_rate": 1.5196517820708226e-05, - "loss": 2.286, - "step": 399150 - }, - { - "epoch": 0.7, - "learning_rate": 1.5195645880781398e-05, - "loss": 2.3198, - "step": 399160 - }, - { - "epoch": 0.7, - "learning_rate": 1.519477394085457e-05, - "loss": 2.2054, - "step": 399170 - }, - { - "epoch": 0.7, - "learning_rate": 1.5193902000927746e-05, - "loss": 2.3742, - "step": 399180 - }, - { - "epoch": 0.7, - "learning_rate": 1.5193030061000918e-05, - "loss": 2.2231, - "step": 399190 - }, - { - "epoch": 0.7, - "learning_rate": 1.519215812107409e-05, - "loss": 2.3406, - "step": 399200 - }, - { - "epoch": 0.7, - "learning_rate": 1.5191286181147265e-05, - "loss": 2.2697, - "step": 399210 - }, - { - "epoch": 0.7, - "learning_rate": 1.5190414241220438e-05, - "loss": 2.2328, - "step": 399220 - }, - { - "epoch": 0.7, - "learning_rate": 1.5189542301293611e-05, - "loss": 2.2116, - "step": 399230 - }, - { - "epoch": 0.7, - "learning_rate": 1.5188670361366783e-05, - "loss": 2.1739, - "step": 399240 - }, - { - "epoch": 0.7, - "learning_rate": 1.5187798421439959e-05, - "loss": 2.3312, - "step": 399250 - }, - { - "epoch": 0.7, - "learning_rate": 1.5186926481513131e-05, - "loss": 2.3088, - "step": 399260 - }, - { - "epoch": 0.7, - "learning_rate": 1.5186054541586303e-05, - "loss": 2.4505, - "step": 399270 - }, - { - "epoch": 0.7, - "learning_rate": 1.5185182601659475e-05, - "loss": 2.3479, - "step": 399280 - }, - { - "epoch": 0.7, - "learning_rate": 1.518431066173265e-05, - "loss": 2.3414, - "step": 399290 - }, - { - "epoch": 0.7, - "learning_rate": 1.5183438721805823e-05, - "loss": 2.2441, - "step": 399300 - }, - { - "epoch": 0.7, - "learning_rate": 1.5182566781878996e-05, - "loss": 2.2602, - "step": 399310 - }, - { - "epoch": 0.7, - "learning_rate": 1.518169484195217e-05, - "loss": 2.2562, - "step": 399320 - }, - { - "epoch": 0.7, - "learning_rate": 1.5180822902025344e-05, - "loss": 2.3237, - "step": 399330 - }, - { - "epoch": 0.7, - "learning_rate": 1.5179950962098516e-05, - "loss": 2.2518, - "step": 399340 - }, - { - "epoch": 0.7, - "learning_rate": 1.5179079022171688e-05, - "loss": 2.3438, - "step": 399350 - }, - { - "epoch": 0.7, - "learning_rate": 1.5178207082244864e-05, - "loss": 2.2361, - "step": 399360 - }, - { - "epoch": 0.7, - "learning_rate": 1.5177335142318036e-05, - "loss": 2.4049, - "step": 399370 - }, - { - "epoch": 0.7, - "learning_rate": 1.5176463202391208e-05, - "loss": 2.2407, - "step": 399380 - }, - { - "epoch": 0.7, - "learning_rate": 1.5175591262464381e-05, - "loss": 2.2378, - "step": 399390 - }, - { - "epoch": 0.7, - "learning_rate": 1.5174719322537557e-05, - "loss": 2.1391, - "step": 399400 - }, - { - "epoch": 0.7, - "learning_rate": 1.5173847382610729e-05, - "loss": 2.3556, - "step": 399410 - }, - { - "epoch": 0.7, - "learning_rate": 1.5172975442683901e-05, - "loss": 2.3587, - "step": 399420 - }, - { - "epoch": 0.7, - "learning_rate": 1.5172103502757073e-05, - "loss": 2.3495, - "step": 399430 - }, - { - "epoch": 0.7, - "learning_rate": 1.5171231562830249e-05, - "loss": 2.266, - "step": 399440 - }, - { - "epoch": 0.7, - "learning_rate": 1.517035962290342e-05, - "loss": 2.3385, - "step": 399450 - }, - { - "epoch": 0.7, - "learning_rate": 1.5169487682976594e-05, - "loss": 2.3987, - "step": 399460 - }, - { - "epoch": 0.7, - "learning_rate": 1.5168615743049768e-05, - "loss": 2.1875, - "step": 399470 - }, - { - "epoch": 0.7, - "learning_rate": 1.5167743803122942e-05, - "loss": 2.2809, - "step": 399480 - }, - { - "epoch": 0.7, - "learning_rate": 1.5166871863196114e-05, - "loss": 2.1601, - "step": 399490 - }, - { - "epoch": 0.7, - "learning_rate": 1.5165999923269286e-05, - "loss": 2.3426, - "step": 399500 - }, - { - "epoch": 0.7, - "learning_rate": 1.5165127983342462e-05, - "loss": 2.2558, - "step": 399510 - }, - { - "epoch": 0.7, - "learning_rate": 1.5164256043415634e-05, - "loss": 2.3171, - "step": 399520 - }, - { - "epoch": 0.7, - "learning_rate": 1.5163384103488806e-05, - "loss": 2.2165, - "step": 399530 - }, - { - "epoch": 0.7, - "learning_rate": 1.516251216356198e-05, - "loss": 2.2667, - "step": 399540 - }, - { - "epoch": 0.7, - "learning_rate": 1.5161640223635153e-05, - "loss": 2.2008, - "step": 399550 - }, - { - "epoch": 0.7, - "learning_rate": 1.5160768283708327e-05, - "loss": 2.3407, - "step": 399560 - }, - { - "epoch": 0.7, - "learning_rate": 1.5159896343781499e-05, - "loss": 2.2799, - "step": 399570 - }, - { - "epoch": 0.7, - "learning_rate": 1.5159024403854671e-05, - "loss": 2.3064, - "step": 399580 - }, - { - "epoch": 0.7, - "learning_rate": 1.5158152463927847e-05, - "loss": 2.2539, - "step": 399590 - }, - { - "epoch": 0.7, - "learning_rate": 1.5157280524001019e-05, - "loss": 2.2829, - "step": 399600 - }, - { - "epoch": 0.7, - "learning_rate": 1.515640858407419e-05, - "loss": 2.265, - "step": 399610 - }, - { - "epoch": 0.7, - "learning_rate": 1.5155536644147366e-05, - "loss": 2.3754, - "step": 399620 - }, - { - "epoch": 0.7, - "learning_rate": 1.5154664704220538e-05, - "loss": 2.3593, - "step": 399630 - }, - { - "epoch": 0.7, - "learning_rate": 1.5153792764293712e-05, - "loss": 2.2924, - "step": 399640 - }, - { - "epoch": 0.7, - "learning_rate": 1.5152920824366884e-05, - "loss": 2.262, - "step": 399650 - }, - { - "epoch": 0.7, - "learning_rate": 1.515204888444006e-05, - "loss": 2.2722, - "step": 399660 - }, - { - "epoch": 0.7, - "learning_rate": 1.5151176944513232e-05, - "loss": 2.317, - "step": 399670 - }, - { - "epoch": 0.7, - "learning_rate": 1.5150305004586404e-05, - "loss": 2.2415, - "step": 399680 - }, - { - "epoch": 0.7, - "learning_rate": 1.5149433064659576e-05, - "loss": 2.2741, - "step": 399690 - }, - { - "epoch": 0.7, - "learning_rate": 1.5148561124732751e-05, - "loss": 2.3447, - "step": 399700 - }, - { - "epoch": 0.7, - "learning_rate": 1.5147689184805925e-05, - "loss": 2.2687, - "step": 399710 - }, - { - "epoch": 0.7, - "learning_rate": 1.5146817244879097e-05, - "loss": 2.3792, - "step": 399720 - }, - { - "epoch": 0.7, - "learning_rate": 1.5145945304952273e-05, - "loss": 2.3499, - "step": 399730 - }, - { - "epoch": 0.7, - "learning_rate": 1.5145073365025445e-05, - "loss": 2.3838, - "step": 399740 - }, - { - "epoch": 0.7, - "learning_rate": 1.5144201425098617e-05, - "loss": 2.1788, - "step": 399750 - }, - { - "epoch": 0.7, - "learning_rate": 1.5143329485171789e-05, - "loss": 2.3289, - "step": 399760 - }, - { - "epoch": 0.7, - "learning_rate": 1.5142457545244964e-05, - "loss": 2.3245, - "step": 399770 - }, - { - "epoch": 0.7, - "learning_rate": 1.5141585605318136e-05, - "loss": 2.2909, - "step": 399780 - }, - { - "epoch": 0.7, - "learning_rate": 1.514071366539131e-05, - "loss": 2.3831, - "step": 399790 - }, - { - "epoch": 0.7, - "learning_rate": 1.5139841725464482e-05, - "loss": 2.3554, - "step": 399800 - }, - { - "epoch": 0.7, - "learning_rate": 1.5138969785537658e-05, - "loss": 2.2683, - "step": 399810 - }, - { - "epoch": 0.7, - "learning_rate": 1.513809784561083e-05, - "loss": 2.1912, - "step": 399820 - }, - { - "epoch": 0.7, - "learning_rate": 1.5137225905684002e-05, - "loss": 2.202, - "step": 399830 - }, - { - "epoch": 0.7, - "learning_rate": 1.5136353965757174e-05, - "loss": 2.403, - "step": 399840 - }, - { - "epoch": 0.7, - "learning_rate": 1.513548202583035e-05, - "loss": 2.322, - "step": 399850 - }, - { - "epoch": 0.7, - "learning_rate": 1.5134610085903522e-05, - "loss": 2.3893, - "step": 399860 - }, - { - "epoch": 0.7, - "learning_rate": 1.5133738145976695e-05, - "loss": 2.2471, - "step": 399870 - }, - { - "epoch": 0.7, - "learning_rate": 1.513286620604987e-05, - "loss": 2.2812, - "step": 399880 - }, - { - "epoch": 0.7, - "learning_rate": 1.5131994266123043e-05, - "loss": 2.424, - "step": 399890 - }, - { - "epoch": 0.7, - "learning_rate": 1.5131122326196215e-05, - "loss": 2.4303, - "step": 399900 - }, - { - "epoch": 0.7, - "learning_rate": 1.5130250386269387e-05, - "loss": 2.3253, - "step": 399910 - }, - { - "epoch": 0.7, - "learning_rate": 1.5129378446342562e-05, - "loss": 2.303, - "step": 399920 - }, - { - "epoch": 0.7, - "learning_rate": 1.5128506506415735e-05, - "loss": 2.2859, - "step": 399930 - }, - { - "epoch": 0.7, - "learning_rate": 1.5127634566488907e-05, - "loss": 2.4975, - "step": 399940 - }, - { - "epoch": 0.7, - "learning_rate": 1.512676262656208e-05, - "loss": 2.2584, - "step": 399950 - }, - { - "epoch": 0.7, - "learning_rate": 1.5125890686635256e-05, - "loss": 2.2841, - "step": 399960 - }, - { - "epoch": 0.7, - "learning_rate": 1.5125018746708428e-05, - "loss": 2.4113, - "step": 399970 - }, - { - "epoch": 0.7, - "learning_rate": 1.51241468067816e-05, - "loss": 2.3934, - "step": 399980 - }, - { - "epoch": 0.7, - "learning_rate": 1.5123274866854775e-05, - "loss": 2.3295, - "step": 399990 - }, - { - "epoch": 0.7, - "learning_rate": 1.5122402926927948e-05, - "loss": 2.2265, - "step": 400000 - }, - { - "epoch": 0.7, - "learning_rate": 1.512153098700112e-05, - "loss": 2.2558, - "step": 400010 - }, - { - "epoch": 0.7, - "learning_rate": 1.5120659047074293e-05, - "loss": 2.3104, - "step": 400020 - }, - { - "epoch": 0.7, - "learning_rate": 1.5119787107147467e-05, - "loss": 2.3432, - "step": 400030 - }, - { - "epoch": 0.7, - "learning_rate": 1.5118915167220641e-05, - "loss": 2.2026, - "step": 400040 - }, - { - "epoch": 0.7, - "learning_rate": 1.5118043227293813e-05, - "loss": 2.3438, - "step": 400050 - }, - { - "epoch": 0.7, - "learning_rate": 1.5117171287366985e-05, - "loss": 2.2399, - "step": 400060 - }, - { - "epoch": 0.7, - "learning_rate": 1.511629934744016e-05, - "loss": 2.2797, - "step": 400070 - }, - { - "epoch": 0.7, - "learning_rate": 1.5115427407513333e-05, - "loss": 2.2995, - "step": 400080 - }, - { - "epoch": 0.7, - "learning_rate": 1.5114555467586505e-05, - "loss": 2.4303, - "step": 400090 - }, - { - "epoch": 0.7, - "learning_rate": 1.5113683527659678e-05, - "loss": 2.319, - "step": 400100 - }, - { - "epoch": 0.7, - "learning_rate": 1.5112811587732852e-05, - "loss": 2.3175, - "step": 400110 - }, - { - "epoch": 0.7, - "learning_rate": 1.5111939647806026e-05, - "loss": 2.4791, - "step": 400120 - }, - { - "epoch": 0.7, - "learning_rate": 1.5111067707879198e-05, - "loss": 2.2435, - "step": 400130 - }, - { - "epoch": 0.7, - "learning_rate": 1.5110195767952374e-05, - "loss": 2.3577, - "step": 400140 - }, - { - "epoch": 0.7, - "learning_rate": 1.5109323828025546e-05, - "loss": 2.3702, - "step": 400150 - }, - { - "epoch": 0.7, - "learning_rate": 1.5108451888098718e-05, - "loss": 2.2402, - "step": 400160 - }, - { - "epoch": 0.7, - "learning_rate": 1.510757994817189e-05, - "loss": 2.2862, - "step": 400170 - }, - { - "epoch": 0.7, - "learning_rate": 1.5106708008245065e-05, - "loss": 2.2193, - "step": 400180 - }, - { - "epoch": 0.7, - "learning_rate": 1.5105836068318239e-05, - "loss": 2.1555, - "step": 400190 - }, - { - "epoch": 0.7, - "learning_rate": 1.5104964128391411e-05, - "loss": 2.2112, - "step": 400200 - }, - { - "epoch": 0.7, - "learning_rate": 1.5104092188464583e-05, - "loss": 2.4192, - "step": 400210 - }, - { - "epoch": 0.7, - "learning_rate": 1.5103220248537759e-05, - "loss": 2.3441, - "step": 400220 - }, - { - "epoch": 0.7, - "learning_rate": 1.510234830861093e-05, - "loss": 2.2329, - "step": 400230 - }, - { - "epoch": 0.7, - "learning_rate": 1.5101476368684103e-05, - "loss": 2.4366, - "step": 400240 - }, - { - "epoch": 0.7, - "learning_rate": 1.5100604428757278e-05, - "loss": 2.3247, - "step": 400250 - }, - { - "epoch": 0.7, - "learning_rate": 1.509973248883045e-05, - "loss": 2.2826, - "step": 400260 - }, - { - "epoch": 0.7, - "learning_rate": 1.5098860548903624e-05, - "loss": 2.2887, - "step": 400270 - }, - { - "epoch": 0.7, - "learning_rate": 1.5097988608976796e-05, - "loss": 2.3439, - "step": 400280 - }, - { - "epoch": 0.7, - "learning_rate": 1.5097116669049972e-05, - "loss": 2.3632, - "step": 400290 - }, - { - "epoch": 0.7, - "learning_rate": 1.5096244729123144e-05, - "loss": 2.2308, - "step": 400300 - }, - { - "epoch": 0.7, - "learning_rate": 1.5095372789196316e-05, - "loss": 2.2254, - "step": 400310 - }, - { - "epoch": 0.7, - "learning_rate": 1.5094500849269488e-05, - "loss": 2.3112, - "step": 400320 - }, - { - "epoch": 0.7, - "learning_rate": 1.5093628909342663e-05, - "loss": 2.4018, - "step": 400330 - }, - { - "epoch": 0.7, - "learning_rate": 1.5092756969415835e-05, - "loss": 2.3322, - "step": 400340 - }, - { - "epoch": 0.7, - "learning_rate": 1.509188502948901e-05, - "loss": 2.3031, - "step": 400350 - }, - { - "epoch": 0.7, - "learning_rate": 1.5091013089562181e-05, - "loss": 2.2672, - "step": 400360 - }, - { - "epoch": 0.7, - "learning_rate": 1.5090141149635357e-05, - "loss": 2.252, - "step": 400370 - }, - { - "epoch": 0.7, - "learning_rate": 1.5089269209708529e-05, - "loss": 2.3581, - "step": 400380 - }, - { - "epoch": 0.7, - "learning_rate": 1.50883972697817e-05, - "loss": 2.3934, - "step": 400390 - }, - { - "epoch": 0.7, - "learning_rate": 1.5087525329854876e-05, - "loss": 2.2679, - "step": 400400 - }, - { - "epoch": 0.7, - "learning_rate": 1.5086653389928048e-05, - "loss": 2.3268, - "step": 400410 - }, - { - "epoch": 0.7, - "learning_rate": 1.508578145000122e-05, - "loss": 2.353, - "step": 400420 - }, - { - "epoch": 0.7, - "learning_rate": 1.5084909510074394e-05, - "loss": 2.2451, - "step": 400430 - }, - { - "epoch": 0.7, - "learning_rate": 1.508403757014757e-05, - "loss": 2.2552, - "step": 400440 - }, - { - "epoch": 0.7, - "learning_rate": 1.5083165630220742e-05, - "loss": 2.2241, - "step": 400450 - }, - { - "epoch": 0.7, - "learning_rate": 1.5082293690293914e-05, - "loss": 2.3158, - "step": 400460 - }, - { - "epoch": 0.7, - "learning_rate": 1.5081421750367086e-05, - "loss": 2.3128, - "step": 400470 - }, - { - "epoch": 0.7, - "learning_rate": 1.5080549810440261e-05, - "loss": 2.3517, - "step": 400480 - }, - { - "epoch": 0.7, - "learning_rate": 1.5079677870513433e-05, - "loss": 2.2926, - "step": 400490 - }, - { - "epoch": 0.7, - "learning_rate": 1.5078805930586607e-05, - "loss": 2.3091, - "step": 400500 - }, - { - "epoch": 0.7, - "learning_rate": 1.507793399065978e-05, - "loss": 2.1556, - "step": 400510 - }, - { - "epoch": 0.7, - "learning_rate": 1.5077062050732955e-05, - "loss": 2.3562, - "step": 400520 - }, - { - "epoch": 0.7, - "learning_rate": 1.5076190110806127e-05, - "loss": 2.3799, - "step": 400530 - }, - { - "epoch": 0.7, - "learning_rate": 1.5075318170879299e-05, - "loss": 2.4081, - "step": 400540 - }, - { - "epoch": 0.7, - "learning_rate": 1.5074446230952474e-05, - "loss": 2.2503, - "step": 400550 - }, - { - "epoch": 0.7, - "learning_rate": 1.5073574291025646e-05, - "loss": 2.2873, - "step": 400560 - }, - { - "epoch": 0.7, - "learning_rate": 1.5072702351098819e-05, - "loss": 2.3453, - "step": 400570 - }, - { - "epoch": 0.7, - "learning_rate": 1.5071830411171992e-05, - "loss": 2.2834, - "step": 400580 - }, - { - "epoch": 0.7, - "learning_rate": 1.5070958471245166e-05, - "loss": 2.2758, - "step": 400590 - }, - { - "epoch": 0.7, - "learning_rate": 1.507008653131834e-05, - "loss": 2.1469, - "step": 400600 - }, - { - "epoch": 0.7, - "learning_rate": 1.5069214591391512e-05, - "loss": 2.2566, - "step": 400610 - }, - { - "epoch": 0.7, - "learning_rate": 1.5068342651464684e-05, - "loss": 2.1736, - "step": 400620 - }, - { - "epoch": 0.7, - "learning_rate": 1.506747071153786e-05, - "loss": 2.336, - "step": 400630 - }, - { - "epoch": 0.7, - "learning_rate": 1.5066598771611032e-05, - "loss": 2.181, - "step": 400640 - }, - { - "epoch": 0.7, - "learning_rate": 1.5065726831684204e-05, - "loss": 2.234, - "step": 400650 - }, - { - "epoch": 0.7, - "learning_rate": 1.5064854891757379e-05, - "loss": 2.2929, - "step": 400660 - }, - { - "epoch": 0.7, - "learning_rate": 1.5063982951830551e-05, - "loss": 2.2963, - "step": 400670 - }, - { - "epoch": 0.7, - "learning_rate": 1.5063111011903725e-05, - "loss": 2.3096, - "step": 400680 - }, - { - "epoch": 0.7, - "learning_rate": 1.5062239071976897e-05, - "loss": 2.3106, - "step": 400690 - }, - { - "epoch": 0.7, - "learning_rate": 1.5061367132050072e-05, - "loss": 2.2022, - "step": 400700 - }, - { - "epoch": 0.7, - "learning_rate": 1.5060495192123245e-05, - "loss": 2.3847, - "step": 400710 - }, - { - "epoch": 0.7, - "learning_rate": 1.5059623252196417e-05, - "loss": 2.2776, - "step": 400720 - }, - { - "epoch": 0.7, - "learning_rate": 1.5058751312269589e-05, - "loss": 2.2245, - "step": 400730 - }, - { - "epoch": 0.7, - "learning_rate": 1.5057879372342764e-05, - "loss": 2.4228, - "step": 400740 - }, - { - "epoch": 0.7, - "learning_rate": 1.5057007432415938e-05, - "loss": 2.3049, - "step": 400750 - }, - { - "epoch": 0.7, - "learning_rate": 1.505613549248911e-05, - "loss": 2.2536, - "step": 400760 - }, - { - "epoch": 0.7, - "learning_rate": 1.5055263552562282e-05, - "loss": 2.2973, - "step": 400770 - }, - { - "epoch": 0.7, - "learning_rate": 1.5054391612635458e-05, - "loss": 2.3622, - "step": 400780 - }, - { - "epoch": 0.7, - "learning_rate": 1.505351967270863e-05, - "loss": 2.3559, - "step": 400790 - }, - { - "epoch": 0.7, - "learning_rate": 1.5052647732781802e-05, - "loss": 2.3914, - "step": 400800 - }, - { - "epoch": 0.7, - "learning_rate": 1.5051775792854977e-05, - "loss": 2.2839, - "step": 400810 - }, - { - "epoch": 0.7, - "learning_rate": 1.505090385292815e-05, - "loss": 2.2659, - "step": 400820 - }, - { - "epoch": 0.7, - "learning_rate": 1.5050031913001323e-05, - "loss": 2.3192, - "step": 400830 - }, - { - "epoch": 0.7, - "learning_rate": 1.5049159973074495e-05, - "loss": 2.4039, - "step": 400840 - }, - { - "epoch": 0.7, - "learning_rate": 1.504828803314767e-05, - "loss": 2.2961, - "step": 400850 - }, - { - "epoch": 0.7, - "learning_rate": 1.5047416093220843e-05, - "loss": 2.2537, - "step": 400860 - }, - { - "epoch": 0.7, - "learning_rate": 1.5046544153294015e-05, - "loss": 2.2784, - "step": 400870 - }, - { - "epoch": 0.7, - "learning_rate": 1.5045672213367187e-05, - "loss": 2.2748, - "step": 400880 - }, - { - "epoch": 0.7, - "learning_rate": 1.5044800273440362e-05, - "loss": 2.3528, - "step": 400890 - }, - { - "epoch": 0.7, - "learning_rate": 1.5043928333513534e-05, - "loss": 2.2669, - "step": 400900 - }, - { - "epoch": 0.7, - "learning_rate": 1.5043056393586708e-05, - "loss": 2.219, - "step": 400910 - }, - { - "epoch": 0.7, - "learning_rate": 1.5042184453659884e-05, - "loss": 2.3566, - "step": 400920 - }, - { - "epoch": 0.7, - "learning_rate": 1.5041312513733056e-05, - "loss": 2.3912, - "step": 400930 - }, - { - "epoch": 0.7, - "learning_rate": 1.5040440573806228e-05, - "loss": 2.3176, - "step": 400940 - }, - { - "epoch": 0.7, - "learning_rate": 1.50395686338794e-05, - "loss": 2.2482, - "step": 400950 - }, - { - "epoch": 0.7, - "learning_rate": 1.5038696693952575e-05, - "loss": 2.3404, - "step": 400960 - }, - { - "epoch": 0.7, - "learning_rate": 1.5037824754025747e-05, - "loss": 2.3542, - "step": 400970 - }, - { - "epoch": 0.7, - "learning_rate": 1.503695281409892e-05, - "loss": 2.3866, - "step": 400980 - }, - { - "epoch": 0.7, - "learning_rate": 1.5036080874172093e-05, - "loss": 2.2588, - "step": 400990 - }, - { - "epoch": 0.7, - "learning_rate": 1.5035208934245269e-05, - "loss": 2.4393, - "step": 401000 - }, - { - "epoch": 0.7, - "learning_rate": 1.503433699431844e-05, - "loss": 2.3049, - "step": 401010 - }, - { - "epoch": 0.7, - "learning_rate": 1.5033465054391613e-05, - "loss": 2.2878, - "step": 401020 - }, - { - "epoch": 0.7, - "learning_rate": 1.5032593114464785e-05, - "loss": 2.3208, - "step": 401030 - }, - { - "epoch": 0.7, - "learning_rate": 1.503172117453796e-05, - "loss": 2.2407, - "step": 401040 - }, - { - "epoch": 0.7, - "learning_rate": 1.5030849234611132e-05, - "loss": 2.4005, - "step": 401050 - }, - { - "epoch": 0.7, - "learning_rate": 1.5029977294684306e-05, - "loss": 2.4162, - "step": 401060 - }, - { - "epoch": 0.7, - "learning_rate": 1.502910535475748e-05, - "loss": 2.2772, - "step": 401070 - }, - { - "epoch": 0.7, - "learning_rate": 1.5028233414830654e-05, - "loss": 2.2609, - "step": 401080 - }, - { - "epoch": 0.7, - "learning_rate": 1.5027361474903826e-05, - "loss": 2.2989, - "step": 401090 - }, - { - "epoch": 0.7, - "learning_rate": 1.5026489534976998e-05, - "loss": 2.3655, - "step": 401100 - }, - { - "epoch": 0.7, - "learning_rate": 1.5025617595050173e-05, - "loss": 2.3431, - "step": 401110 - }, - { - "epoch": 0.7, - "learning_rate": 1.5024745655123345e-05, - "loss": 2.3721, - "step": 401120 - }, - { - "epoch": 0.7, - "learning_rate": 1.5023873715196517e-05, - "loss": 2.3714, - "step": 401130 - }, - { - "epoch": 0.7, - "learning_rate": 1.5023001775269691e-05, - "loss": 2.2265, - "step": 401140 - }, - { - "epoch": 0.7, - "learning_rate": 1.5022129835342865e-05, - "loss": 2.2432, - "step": 401150 - }, - { - "epoch": 0.7, - "learning_rate": 1.5021257895416039e-05, - "loss": 2.2426, - "step": 401160 - }, - { - "epoch": 0.7, - "learning_rate": 1.5020385955489211e-05, - "loss": 2.3351, - "step": 401170 - }, - { - "epoch": 0.7, - "learning_rate": 1.5019514015562386e-05, - "loss": 2.294, - "step": 401180 - }, - { - "epoch": 0.7, - "learning_rate": 1.5018642075635558e-05, - "loss": 2.3279, - "step": 401190 - }, - { - "epoch": 0.7, - "learning_rate": 1.501777013570873e-05, - "loss": 2.3737, - "step": 401200 - }, - { - "epoch": 0.7, - "learning_rate": 1.5016898195781903e-05, - "loss": 2.3627, - "step": 401210 - }, - { - "epoch": 0.7, - "learning_rate": 1.5016026255855078e-05, - "loss": 2.1763, - "step": 401220 - }, - { - "epoch": 0.7, - "learning_rate": 1.5015154315928252e-05, - "loss": 2.3371, - "step": 401230 - }, - { - "epoch": 0.7, - "learning_rate": 1.5014282376001424e-05, - "loss": 2.2448, - "step": 401240 - }, - { - "epoch": 0.7, - "learning_rate": 1.5013410436074596e-05, - "loss": 2.4475, - "step": 401250 - }, - { - "epoch": 0.7, - "learning_rate": 1.5012538496147771e-05, - "loss": 2.3353, - "step": 401260 - }, - { - "epoch": 0.7, - "learning_rate": 1.5011666556220943e-05, - "loss": 2.2933, - "step": 401270 - }, - { - "epoch": 0.7, - "learning_rate": 1.5010794616294116e-05, - "loss": 2.3298, - "step": 401280 - }, - { - "epoch": 0.7, - "learning_rate": 1.5009922676367288e-05, - "loss": 2.2345, - "step": 401290 - }, - { - "epoch": 0.7, - "learning_rate": 1.5009050736440463e-05, - "loss": 2.2295, - "step": 401300 - }, - { - "epoch": 0.7, - "learning_rate": 1.5008178796513637e-05, - "loss": 2.2706, - "step": 401310 - }, - { - "epoch": 0.7, - "learning_rate": 1.5007306856586809e-05, - "loss": 2.2174, - "step": 401320 - }, - { - "epoch": 0.7, - "learning_rate": 1.5006434916659984e-05, - "loss": 2.32, - "step": 401330 - }, - { - "epoch": 0.7, - "learning_rate": 1.5005562976733156e-05, - "loss": 2.2256, - "step": 401340 - }, - { - "epoch": 0.7, - "learning_rate": 1.5004691036806329e-05, - "loss": 2.1894, - "step": 401350 - }, - { - "epoch": 0.7, - "learning_rate": 1.50038190968795e-05, - "loss": 2.2735, - "step": 401360 - }, - { - "epoch": 0.7, - "learning_rate": 1.5002947156952676e-05, - "loss": 2.3745, - "step": 401370 - }, - { - "epoch": 0.7, - "learning_rate": 1.5002075217025848e-05, - "loss": 2.2702, - "step": 401380 - }, - { - "epoch": 0.7, - "learning_rate": 1.5001203277099022e-05, - "loss": 2.2919, - "step": 401390 - }, - { - "epoch": 0.7, - "learning_rate": 1.5000331337172194e-05, - "loss": 2.3258, - "step": 401400 - }, - { - "epoch": 0.7, - "learning_rate": 1.499945939724537e-05, - "loss": 2.3299, - "step": 401410 - }, - { - "epoch": 0.7, - "learning_rate": 1.4998587457318542e-05, - "loss": 2.2997, - "step": 401420 - }, - { - "epoch": 0.7, - "learning_rate": 1.4997715517391714e-05, - "loss": 2.2505, - "step": 401430 - }, - { - "epoch": 0.7, - "learning_rate": 1.4996843577464886e-05, - "loss": 2.4142, - "step": 401440 - }, - { - "epoch": 0.7, - "learning_rate": 1.4995971637538061e-05, - "loss": 2.3535, - "step": 401450 - }, - { - "epoch": 0.7, - "learning_rate": 1.4995099697611233e-05, - "loss": 2.3525, - "step": 401460 - }, - { - "epoch": 0.7, - "learning_rate": 1.4994227757684407e-05, - "loss": 2.248, - "step": 401470 - }, - { - "epoch": 0.7, - "learning_rate": 1.4993355817757582e-05, - "loss": 2.35, - "step": 401480 - }, - { - "epoch": 0.7, - "learning_rate": 1.4992483877830755e-05, - "loss": 2.3696, - "step": 401490 - }, - { - "epoch": 0.7, - "learning_rate": 1.4991611937903927e-05, - "loss": 2.2609, - "step": 401500 - }, - { - "epoch": 0.7, - "learning_rate": 1.4990739997977099e-05, - "loss": 2.3561, - "step": 401510 - }, - { - "epoch": 0.7, - "learning_rate": 1.4989868058050274e-05, - "loss": 2.2433, - "step": 401520 - }, - { - "epoch": 0.7, - "learning_rate": 1.4988996118123446e-05, - "loss": 2.3131, - "step": 401530 - }, - { - "epoch": 0.7, - "learning_rate": 1.498812417819662e-05, - "loss": 2.2956, - "step": 401540 - }, - { - "epoch": 0.7, - "learning_rate": 1.4987252238269792e-05, - "loss": 2.3202, - "step": 401550 - }, - { - "epoch": 0.7, - "learning_rate": 1.4986380298342968e-05, - "loss": 2.3046, - "step": 401560 - }, - { - "epoch": 0.7, - "learning_rate": 1.498550835841614e-05, - "loss": 2.2931, - "step": 401570 - }, - { - "epoch": 0.7, - "learning_rate": 1.4984636418489312e-05, - "loss": 2.4354, - "step": 401580 - }, - { - "epoch": 0.7, - "learning_rate": 1.4983764478562487e-05, - "loss": 2.229, - "step": 401590 - }, - { - "epoch": 0.7, - "learning_rate": 1.498289253863566e-05, - "loss": 2.3572, - "step": 401600 - }, - { - "epoch": 0.7, - "learning_rate": 1.4982020598708831e-05, - "loss": 2.2381, - "step": 401610 - }, - { - "epoch": 0.7, - "learning_rate": 1.4981148658782005e-05, - "loss": 2.4016, - "step": 401620 - }, - { - "epoch": 0.7, - "learning_rate": 1.4980276718855179e-05, - "loss": 2.4185, - "step": 401630 - }, - { - "epoch": 0.7, - "learning_rate": 1.4979404778928353e-05, - "loss": 2.2682, - "step": 401640 - }, - { - "epoch": 0.7, - "learning_rate": 1.4978532839001525e-05, - "loss": 2.2275, - "step": 401650 - }, - { - "epoch": 0.7, - "learning_rate": 1.4977660899074697e-05, - "loss": 2.4249, - "step": 401660 - }, - { - "epoch": 0.7, - "learning_rate": 1.4976788959147872e-05, - "loss": 2.3111, - "step": 401670 - }, - { - "epoch": 0.7, - "learning_rate": 1.4975917019221044e-05, - "loss": 2.374, - "step": 401680 - }, - { - "epoch": 0.7, - "learning_rate": 1.4975045079294216e-05, - "loss": 2.493, - "step": 401690 - }, - { - "epoch": 0.7, - "learning_rate": 1.497417313936739e-05, - "loss": 2.3374, - "step": 401700 - }, - { - "epoch": 0.7, - "learning_rate": 1.4973301199440564e-05, - "loss": 2.3457, - "step": 401710 - }, - { - "epoch": 0.7, - "learning_rate": 1.4972429259513738e-05, - "loss": 2.4315, - "step": 401720 - }, - { - "epoch": 0.7, - "learning_rate": 1.497155731958691e-05, - "loss": 2.3647, - "step": 401730 - }, - { - "epoch": 0.7, - "learning_rate": 1.4970685379660085e-05, - "loss": 2.3469, - "step": 401740 - }, - { - "epoch": 0.7, - "learning_rate": 1.4969813439733257e-05, - "loss": 2.3887, - "step": 401750 - }, - { - "epoch": 0.7, - "learning_rate": 1.496894149980643e-05, - "loss": 2.3686, - "step": 401760 - }, - { - "epoch": 0.7, - "learning_rate": 1.4968069559879601e-05, - "loss": 2.303, - "step": 401770 - }, - { - "epoch": 0.7, - "learning_rate": 1.4967197619952777e-05, - "loss": 2.3221, - "step": 401780 - }, - { - "epoch": 0.7, - "learning_rate": 1.496632568002595e-05, - "loss": 2.1624, - "step": 401790 - }, - { - "epoch": 0.7, - "learning_rate": 1.4965453740099123e-05, - "loss": 2.2366, - "step": 401800 - }, - { - "epoch": 0.7, - "learning_rate": 1.4964581800172295e-05, - "loss": 2.299, - "step": 401810 - }, - { - "epoch": 0.7, - "learning_rate": 1.496370986024547e-05, - "loss": 2.3569, - "step": 401820 - }, - { - "epoch": 0.7, - "learning_rate": 1.4962837920318642e-05, - "loss": 2.2562, - "step": 401830 - }, - { - "epoch": 0.7, - "learning_rate": 1.4961965980391814e-05, - "loss": 2.2854, - "step": 401840 - }, - { - "epoch": 0.7, - "learning_rate": 1.496109404046499e-05, - "loss": 2.295, - "step": 401850 - }, - { - "epoch": 0.7, - "learning_rate": 1.4960222100538162e-05, - "loss": 2.2469, - "step": 401860 - }, - { - "epoch": 0.7, - "learning_rate": 1.4959350160611336e-05, - "loss": 2.245, - "step": 401870 - }, - { - "epoch": 0.7, - "learning_rate": 1.4958478220684508e-05, - "loss": 2.1099, - "step": 401880 - }, - { - "epoch": 0.7, - "learning_rate": 1.4957606280757683e-05, - "loss": 2.2834, - "step": 401890 - }, - { - "epoch": 0.7, - "learning_rate": 1.4956734340830855e-05, - "loss": 2.2836, - "step": 401900 - }, - { - "epoch": 0.7, - "learning_rate": 1.4955862400904027e-05, - "loss": 2.2892, - "step": 401910 - }, - { - "epoch": 0.7, - "learning_rate": 1.49549904609772e-05, - "loss": 2.3819, - "step": 401920 - }, - { - "epoch": 0.7, - "learning_rate": 1.4954118521050375e-05, - "loss": 2.3125, - "step": 401930 - }, - { - "epoch": 0.7, - "learning_rate": 1.4953246581123547e-05, - "loss": 2.3021, - "step": 401940 - }, - { - "epoch": 0.7, - "learning_rate": 1.4952374641196721e-05, - "loss": 2.2966, - "step": 401950 - }, - { - "epoch": 0.7, - "learning_rate": 1.4951502701269893e-05, - "loss": 2.3441, - "step": 401960 - }, - { - "epoch": 0.7, - "learning_rate": 1.4950630761343068e-05, - "loss": 2.1984, - "step": 401970 - }, - { - "epoch": 0.7, - "learning_rate": 1.494975882141624e-05, - "loss": 2.269, - "step": 401980 - }, - { - "epoch": 0.7, - "learning_rate": 1.4948886881489413e-05, - "loss": 2.3389, - "step": 401990 - }, - { - "epoch": 0.7, - "learning_rate": 1.4948014941562588e-05, - "loss": 2.3479, - "step": 402000 - }, - { - "epoch": 0.7, - "learning_rate": 1.494714300163576e-05, - "loss": 2.2671, - "step": 402010 - }, - { - "epoch": 0.7, - "learning_rate": 1.4946271061708932e-05, - "loss": 2.3166, - "step": 402020 - }, - { - "epoch": 0.7, - "learning_rate": 1.4945399121782106e-05, - "loss": 2.4144, - "step": 402030 - }, - { - "epoch": 0.7, - "learning_rate": 1.4944527181855281e-05, - "loss": 2.1952, - "step": 402040 - }, - { - "epoch": 0.7, - "learning_rate": 1.4943655241928453e-05, - "loss": 2.2193, - "step": 402050 - }, - { - "epoch": 0.7, - "learning_rate": 1.4942783302001626e-05, - "loss": 2.3611, - "step": 402060 - }, - { - "epoch": 0.7, - "learning_rate": 1.4941911362074798e-05, - "loss": 2.3603, - "step": 402070 - }, - { - "epoch": 0.7, - "learning_rate": 1.4941039422147973e-05, - "loss": 2.3544, - "step": 402080 - }, - { - "epoch": 0.7, - "learning_rate": 1.4940167482221145e-05, - "loss": 2.2841, - "step": 402090 - }, - { - "epoch": 0.7, - "learning_rate": 1.4939295542294319e-05, - "loss": 2.2035, - "step": 402100 - }, - { - "epoch": 0.7, - "learning_rate": 1.4938423602367493e-05, - "loss": 2.3199, - "step": 402110 - }, - { - "epoch": 0.7, - "learning_rate": 1.4937551662440666e-05, - "loss": 2.3762, - "step": 402120 - }, - { - "epoch": 0.7, - "learning_rate": 1.4936679722513839e-05, - "loss": 2.301, - "step": 402130 - }, - { - "epoch": 0.7, - "learning_rate": 1.493580778258701e-05, - "loss": 2.4507, - "step": 402140 - }, - { - "epoch": 0.7, - "learning_rate": 1.4934935842660186e-05, - "loss": 2.3771, - "step": 402150 - }, - { - "epoch": 0.7, - "learning_rate": 1.4934063902733358e-05, - "loss": 2.2751, - "step": 402160 - }, - { - "epoch": 0.7, - "learning_rate": 1.493319196280653e-05, - "loss": 2.2724, - "step": 402170 - }, - { - "epoch": 0.7, - "learning_rate": 1.4932320022879704e-05, - "loss": 2.4229, - "step": 402180 - }, - { - "epoch": 0.7, - "learning_rate": 1.4931448082952878e-05, - "loss": 2.3139, - "step": 402190 - }, - { - "epoch": 0.7, - "learning_rate": 1.4930576143026052e-05, - "loss": 2.3176, - "step": 402200 - }, - { - "epoch": 0.7, - "learning_rate": 1.4929704203099224e-05, - "loss": 2.3241, - "step": 402210 - }, - { - "epoch": 0.7, - "learning_rate": 1.4928832263172396e-05, - "loss": 2.4747, - "step": 402220 - }, - { - "epoch": 0.7, - "learning_rate": 1.4927960323245571e-05, - "loss": 2.2529, - "step": 402230 - }, - { - "epoch": 0.7, - "learning_rate": 1.4927088383318743e-05, - "loss": 2.2225, - "step": 402240 - }, - { - "epoch": 0.7, - "learning_rate": 1.4926216443391915e-05, - "loss": 2.2393, - "step": 402250 - }, - { - "epoch": 0.7, - "learning_rate": 1.492534450346509e-05, - "loss": 2.3659, - "step": 402260 - }, - { - "epoch": 0.7, - "learning_rate": 1.4924472563538265e-05, - "loss": 2.2129, - "step": 402270 - }, - { - "epoch": 0.7, - "learning_rate": 1.4923600623611437e-05, - "loss": 2.3242, - "step": 402280 - }, - { - "epoch": 0.7, - "learning_rate": 1.4922728683684609e-05, - "loss": 2.3423, - "step": 402290 - }, - { - "epoch": 0.7, - "learning_rate": 1.4921856743757784e-05, - "loss": 2.4096, - "step": 402300 - }, - { - "epoch": 0.7, - "learning_rate": 1.4920984803830956e-05, - "loss": 2.3049, - "step": 402310 - }, - { - "epoch": 0.7, - "learning_rate": 1.4920112863904128e-05, - "loss": 2.2676, - "step": 402320 - }, - { - "epoch": 0.7, - "learning_rate": 1.49192409239773e-05, - "loss": 2.2346, - "step": 402330 - }, - { - "epoch": 0.7, - "learning_rate": 1.4918368984050476e-05, - "loss": 2.2865, - "step": 402340 - }, - { - "epoch": 0.7, - "learning_rate": 1.491749704412365e-05, - "loss": 2.3214, - "step": 402350 - }, - { - "epoch": 0.7, - "learning_rate": 1.4916625104196822e-05, - "loss": 2.3431, - "step": 402360 - }, - { - "epoch": 0.7, - "learning_rate": 1.4915753164269994e-05, - "loss": 2.3429, - "step": 402370 - }, - { - "epoch": 0.7, - "learning_rate": 1.491488122434317e-05, - "loss": 2.3089, - "step": 402380 - }, - { - "epoch": 0.7, - "learning_rate": 1.4914009284416341e-05, - "loss": 2.2511, - "step": 402390 - }, - { - "epoch": 0.7, - "learning_rate": 1.4913137344489513e-05, - "loss": 2.105, - "step": 402400 - }, - { - "epoch": 0.7, - "learning_rate": 1.4912265404562689e-05, - "loss": 2.2628, - "step": 402410 - }, - { - "epoch": 0.7, - "learning_rate": 1.4911393464635861e-05, - "loss": 2.2927, - "step": 402420 - }, - { - "epoch": 0.7, - "learning_rate": 1.4910521524709035e-05, - "loss": 2.3772, - "step": 402430 - }, - { - "epoch": 0.7, - "learning_rate": 1.4909649584782207e-05, - "loss": 2.2567, - "step": 402440 - }, - { - "epoch": 0.7, - "learning_rate": 1.4908777644855382e-05, - "loss": 2.3654, - "step": 402450 - }, - { - "epoch": 0.7, - "learning_rate": 1.4907905704928554e-05, - "loss": 2.3402, - "step": 402460 - }, - { - "epoch": 0.7, - "learning_rate": 1.4907033765001726e-05, - "loss": 2.2457, - "step": 402470 - }, - { - "epoch": 0.7, - "learning_rate": 1.4906161825074898e-05, - "loss": 2.4582, - "step": 402480 - }, - { - "epoch": 0.7, - "learning_rate": 1.4905289885148074e-05, - "loss": 2.1535, - "step": 402490 - }, - { - "epoch": 0.7, - "learning_rate": 1.4904417945221246e-05, - "loss": 2.3923, - "step": 402500 - }, - { - "epoch": 0.7, - "learning_rate": 1.490354600529442e-05, - "loss": 2.3615, - "step": 402510 - }, - { - "epoch": 0.7, - "learning_rate": 1.4902674065367595e-05, - "loss": 2.3886, - "step": 402520 - }, - { - "epoch": 0.7, - "learning_rate": 1.4901802125440767e-05, - "loss": 2.2895, - "step": 402530 - }, - { - "epoch": 0.7, - "learning_rate": 1.490093018551394e-05, - "loss": 2.3563, - "step": 402540 - }, - { - "epoch": 0.7, - "learning_rate": 1.4900058245587111e-05, - "loss": 2.2678, - "step": 402550 - }, - { - "epoch": 0.7, - "learning_rate": 1.4899186305660287e-05, - "loss": 2.2645, - "step": 402560 - }, - { - "epoch": 0.7, - "learning_rate": 1.4898314365733459e-05, - "loss": 2.2359, - "step": 402570 - }, - { - "epoch": 0.7, - "learning_rate": 1.4897442425806633e-05, - "loss": 2.2964, - "step": 402580 - }, - { - "epoch": 0.7, - "learning_rate": 1.4896570485879805e-05, - "loss": 2.308, - "step": 402590 - }, - { - "epoch": 0.7, - "learning_rate": 1.489569854595298e-05, - "loss": 2.4024, - "step": 402600 - }, - { - "epoch": 0.7, - "learning_rate": 1.4894826606026152e-05, - "loss": 2.2477, - "step": 402610 - }, - { - "epoch": 0.7, - "learning_rate": 1.4893954666099324e-05, - "loss": 2.3617, - "step": 402620 - }, - { - "epoch": 0.7, - "learning_rate": 1.4893082726172497e-05, - "loss": 2.2477, - "step": 402630 - }, - { - "epoch": 0.7, - "learning_rate": 1.4892210786245672e-05, - "loss": 2.2847, - "step": 402640 - }, - { - "epoch": 0.7, - "learning_rate": 1.4891338846318844e-05, - "loss": 2.21, - "step": 402650 - }, - { - "epoch": 0.7, - "learning_rate": 1.4890466906392018e-05, - "loss": 2.3918, - "step": 402660 - }, - { - "epoch": 0.7, - "learning_rate": 1.4889594966465192e-05, - "loss": 2.3722, - "step": 402670 - }, - { - "epoch": 0.7, - "learning_rate": 1.4888723026538365e-05, - "loss": 2.2617, - "step": 402680 - }, - { - "epoch": 0.7, - "learning_rate": 1.4887851086611537e-05, - "loss": 2.3492, - "step": 402690 - }, - { - "epoch": 0.7, - "learning_rate": 1.488697914668471e-05, - "loss": 2.3192, - "step": 402700 - }, - { - "epoch": 0.7, - "learning_rate": 1.4886107206757885e-05, - "loss": 2.2869, - "step": 402710 - }, - { - "epoch": 0.7, - "learning_rate": 1.4885235266831057e-05, - "loss": 2.2716, - "step": 402720 - }, - { - "epoch": 0.7, - "learning_rate": 1.488436332690423e-05, - "loss": 2.1945, - "step": 402730 - }, - { - "epoch": 0.7, - "learning_rate": 1.4883491386977403e-05, - "loss": 2.3466, - "step": 402740 - }, - { - "epoch": 0.7, - "learning_rate": 1.4882619447050577e-05, - "loss": 2.3043, - "step": 402750 - }, - { - "epoch": 0.7, - "learning_rate": 1.488174750712375e-05, - "loss": 2.391, - "step": 402760 - }, - { - "epoch": 0.7, - "learning_rate": 1.4880875567196923e-05, - "loss": 2.2504, - "step": 402770 - }, - { - "epoch": 0.7, - "learning_rate": 1.4880003627270098e-05, - "loss": 2.2986, - "step": 402780 - }, - { - "epoch": 0.7, - "learning_rate": 1.487913168734327e-05, - "loss": 2.2819, - "step": 402790 - }, - { - "epoch": 0.7, - "learning_rate": 1.4878259747416442e-05, - "loss": 2.2186, - "step": 402800 - }, - { - "epoch": 0.7, - "learning_rate": 1.4877387807489614e-05, - "loss": 2.211, - "step": 402810 - }, - { - "epoch": 0.7, - "learning_rate": 1.487651586756279e-05, - "loss": 2.2764, - "step": 402820 - }, - { - "epoch": 0.7, - "learning_rate": 1.4875643927635963e-05, - "loss": 2.2068, - "step": 402830 - }, - { - "epoch": 0.7, - "learning_rate": 1.4874771987709136e-05, - "loss": 2.3025, - "step": 402840 - }, - { - "epoch": 0.7, - "learning_rate": 1.4873900047782308e-05, - "loss": 2.3346, - "step": 402850 - }, - { - "epoch": 0.7, - "learning_rate": 1.4873028107855483e-05, - "loss": 2.2278, - "step": 402860 - }, - { - "epoch": 0.7, - "learning_rate": 1.4872156167928655e-05, - "loss": 2.3399, - "step": 402870 - }, - { - "epoch": 0.7, - "learning_rate": 1.4871284228001827e-05, - "loss": 2.2974, - "step": 402880 - }, - { - "epoch": 0.7, - "learning_rate": 1.4870412288075001e-05, - "loss": 2.2443, - "step": 402890 - }, - { - "epoch": 0.7, - "learning_rate": 1.4869540348148175e-05, - "loss": 2.369, - "step": 402900 - }, - { - "epoch": 0.7, - "learning_rate": 1.4868668408221349e-05, - "loss": 2.2771, - "step": 402910 - }, - { - "epoch": 0.7, - "learning_rate": 1.486779646829452e-05, - "loss": 2.3354, - "step": 402920 - }, - { - "epoch": 0.7, - "learning_rate": 1.4866924528367696e-05, - "loss": 2.3038, - "step": 402930 - }, - { - "epoch": 0.7, - "learning_rate": 1.4866052588440868e-05, - "loss": 2.3768, - "step": 402940 - }, - { - "epoch": 0.7, - "learning_rate": 1.486518064851404e-05, - "loss": 2.2394, - "step": 402950 - }, - { - "epoch": 0.7, - "learning_rate": 1.4864308708587212e-05, - "loss": 2.3156, - "step": 402960 - }, - { - "epoch": 0.7, - "learning_rate": 1.4863436768660388e-05, - "loss": 2.3541, - "step": 402970 - }, - { - "epoch": 0.7, - "learning_rate": 1.486256482873356e-05, - "loss": 2.3227, - "step": 402980 - }, - { - "epoch": 0.7, - "learning_rate": 1.4861692888806734e-05, - "loss": 2.3144, - "step": 402990 - }, - { - "epoch": 0.7, - "learning_rate": 1.4860820948879906e-05, - "loss": 2.1914, - "step": 403000 - }, - { - "epoch": 0.7, - "learning_rate": 1.4859949008953081e-05, - "loss": 2.2744, - "step": 403010 - }, - { - "epoch": 0.7, - "learning_rate": 1.4859077069026253e-05, - "loss": 2.2181, - "step": 403020 - }, - { - "epoch": 0.7, - "learning_rate": 1.4858205129099425e-05, - "loss": 2.305, - "step": 403030 - }, - { - "epoch": 0.7, - "learning_rate": 1.48573331891726e-05, - "loss": 2.3908, - "step": 403040 - }, - { - "epoch": 0.7, - "learning_rate": 1.4856461249245773e-05, - "loss": 2.289, - "step": 403050 - }, - { - "epoch": 0.7, - "learning_rate": 1.4855589309318945e-05, - "loss": 2.2859, - "step": 403060 - }, - { - "epoch": 0.7, - "learning_rate": 1.4854717369392119e-05, - "loss": 2.2698, - "step": 403070 - }, - { - "epoch": 0.7, - "learning_rate": 1.4853845429465294e-05, - "loss": 2.2977, - "step": 403080 - }, - { - "epoch": 0.7, - "learning_rate": 1.4852973489538466e-05, - "loss": 2.2656, - "step": 403090 - }, - { - "epoch": 0.7, - "learning_rate": 1.4852101549611638e-05, - "loss": 2.3393, - "step": 403100 - }, - { - "epoch": 0.7, - "learning_rate": 1.485122960968481e-05, - "loss": 2.2813, - "step": 403110 - }, - { - "epoch": 0.7, - "learning_rate": 1.4850357669757986e-05, - "loss": 2.1651, - "step": 403120 - }, - { - "epoch": 0.7, - "learning_rate": 1.4849485729831158e-05, - "loss": 2.3131, - "step": 403130 - }, - { - "epoch": 0.7, - "learning_rate": 1.4848613789904332e-05, - "loss": 2.3648, - "step": 403140 - }, - { - "epoch": 0.7, - "learning_rate": 1.4847741849977504e-05, - "loss": 2.4047, - "step": 403150 - }, - { - "epoch": 0.7, - "learning_rate": 1.484686991005068e-05, - "loss": 2.147, - "step": 403160 - }, - { - "epoch": 0.7, - "learning_rate": 1.4845997970123851e-05, - "loss": 2.3275, - "step": 403170 - }, - { - "epoch": 0.7, - "learning_rate": 1.4845126030197023e-05, - "loss": 2.3493, - "step": 403180 - }, - { - "epoch": 0.7, - "learning_rate": 1.4844254090270199e-05, - "loss": 2.3929, - "step": 403190 - }, - { - "epoch": 0.7, - "learning_rate": 1.4843382150343371e-05, - "loss": 2.405, - "step": 403200 - }, - { - "epoch": 0.7, - "learning_rate": 1.4842510210416543e-05, - "loss": 2.2641, - "step": 403210 - }, - { - "epoch": 0.7, - "learning_rate": 1.4841638270489717e-05, - "loss": 2.3638, - "step": 403220 - }, - { - "epoch": 0.7, - "learning_rate": 1.484076633056289e-05, - "loss": 2.2606, - "step": 403230 - }, - { - "epoch": 0.7, - "learning_rate": 1.4839894390636064e-05, - "loss": 2.2041, - "step": 403240 - }, - { - "epoch": 0.7, - "learning_rate": 1.4839022450709236e-05, - "loss": 2.3283, - "step": 403250 - }, - { - "epoch": 0.7, - "learning_rate": 1.4838150510782408e-05, - "loss": 2.3704, - "step": 403260 - }, - { - "epoch": 0.7, - "learning_rate": 1.4837278570855584e-05, - "loss": 2.3204, - "step": 403270 - }, - { - "epoch": 0.7, - "learning_rate": 1.4836406630928756e-05, - "loss": 2.4268, - "step": 403280 - }, - { - "epoch": 0.7, - "learning_rate": 1.4835534691001928e-05, - "loss": 2.247, - "step": 403290 - }, - { - "epoch": 0.7, - "learning_rate": 1.4834662751075102e-05, - "loss": 2.3306, - "step": 403300 - }, - { - "epoch": 0.7, - "learning_rate": 1.4833790811148277e-05, - "loss": 2.3726, - "step": 403310 - }, - { - "epoch": 0.7, - "learning_rate": 1.483291887122145e-05, - "loss": 2.2505, - "step": 403320 - }, - { - "epoch": 0.7, - "learning_rate": 1.4832046931294621e-05, - "loss": 2.2739, - "step": 403330 - }, - { - "epoch": 0.7, - "learning_rate": 1.4831174991367797e-05, - "loss": 2.3703, - "step": 403340 - }, - { - "epoch": 0.7, - "learning_rate": 1.4830303051440969e-05, - "loss": 2.1819, - "step": 403350 - }, - { - "epoch": 0.7, - "learning_rate": 1.4829431111514141e-05, - "loss": 2.2324, - "step": 403360 - }, - { - "epoch": 0.7, - "learning_rate": 1.4828559171587313e-05, - "loss": 2.3182, - "step": 403370 - }, - { - "epoch": 0.7, - "learning_rate": 1.4827687231660489e-05, - "loss": 2.3734, - "step": 403380 - }, - { - "epoch": 0.7, - "learning_rate": 1.4826815291733662e-05, - "loss": 2.2756, - "step": 403390 - }, - { - "epoch": 0.7, - "learning_rate": 1.4825943351806834e-05, - "loss": 2.3313, - "step": 403400 - }, - { - "epoch": 0.7, - "learning_rate": 1.4825071411880007e-05, - "loss": 2.3865, - "step": 403410 - }, - { - "epoch": 0.7, - "learning_rate": 1.4824199471953182e-05, - "loss": 2.3286, - "step": 403420 - }, - { - "epoch": 0.7, - "learning_rate": 1.4823327532026354e-05, - "loss": 2.3766, - "step": 403430 - }, - { - "epoch": 0.7, - "learning_rate": 1.4822455592099526e-05, - "loss": 2.2864, - "step": 403440 - }, - { - "epoch": 0.7, - "learning_rate": 1.4821583652172702e-05, - "loss": 2.3434, - "step": 403450 - }, - { - "epoch": 0.7, - "learning_rate": 1.4820711712245874e-05, - "loss": 2.308, - "step": 403460 - }, - { - "epoch": 0.7, - "learning_rate": 1.4819839772319047e-05, - "loss": 2.3884, - "step": 403470 - }, - { - "epoch": 0.7, - "learning_rate": 1.481896783239222e-05, - "loss": 2.2191, - "step": 403480 - }, - { - "epoch": 0.7, - "learning_rate": 1.4818095892465395e-05, - "loss": 2.3903, - "step": 403490 - }, - { - "epoch": 0.7, - "learning_rate": 1.4817223952538567e-05, - "loss": 2.3731, - "step": 403500 - }, - { - "epoch": 0.7, - "learning_rate": 1.481635201261174e-05, - "loss": 2.3489, - "step": 403510 - }, - { - "epoch": 0.7, - "learning_rate": 1.4815480072684911e-05, - "loss": 2.277, - "step": 403520 - }, - { - "epoch": 0.7, - "learning_rate": 1.4814608132758087e-05, - "loss": 2.2992, - "step": 403530 - }, - { - "epoch": 0.7, - "learning_rate": 1.4813736192831259e-05, - "loss": 2.294, - "step": 403540 - }, - { - "epoch": 0.7, - "learning_rate": 1.4812864252904433e-05, - "loss": 2.3183, - "step": 403550 - }, - { - "epoch": 0.7, - "learning_rate": 1.4811992312977605e-05, - "loss": 2.3045, - "step": 403560 - }, - { - "epoch": 0.7, - "learning_rate": 1.481112037305078e-05, - "loss": 2.2758, - "step": 403570 - }, - { - "epoch": 0.7, - "learning_rate": 1.4810248433123952e-05, - "loss": 2.3286, - "step": 403580 - }, - { - "epoch": 0.7, - "learning_rate": 1.4809376493197124e-05, - "loss": 2.2508, - "step": 403590 - }, - { - "epoch": 0.7, - "learning_rate": 1.48085045532703e-05, - "loss": 2.3015, - "step": 403600 - }, - { - "epoch": 0.7, - "learning_rate": 1.4807632613343472e-05, - "loss": 2.3567, - "step": 403610 - }, - { - "epoch": 0.7, - "learning_rate": 1.4806760673416646e-05, - "loss": 2.2523, - "step": 403620 - }, - { - "epoch": 0.7, - "learning_rate": 1.4805888733489818e-05, - "loss": 2.29, - "step": 403630 - }, - { - "epoch": 0.7, - "learning_rate": 1.4805016793562993e-05, - "loss": 2.2832, - "step": 403640 - }, - { - "epoch": 0.7, - "learning_rate": 1.4804144853636165e-05, - "loss": 2.3941, - "step": 403650 - }, - { - "epoch": 0.7, - "learning_rate": 1.4803272913709337e-05, - "loss": 2.347, - "step": 403660 - }, - { - "epoch": 0.7, - "learning_rate": 1.480240097378251e-05, - "loss": 2.3361, - "step": 403670 - }, - { - "epoch": 0.7, - "learning_rate": 1.4801529033855685e-05, - "loss": 2.2824, - "step": 403680 - }, - { - "epoch": 0.7, - "learning_rate": 1.4800657093928857e-05, - "loss": 2.2824, - "step": 403690 - }, - { - "epoch": 0.7, - "learning_rate": 1.479978515400203e-05, - "loss": 2.3557, - "step": 403700 - }, - { - "epoch": 0.7, - "learning_rate": 1.4798913214075204e-05, - "loss": 2.3189, - "step": 403710 - }, - { - "epoch": 0.7, - "learning_rate": 1.4798041274148378e-05, - "loss": 2.3162, - "step": 403720 - }, - { - "epoch": 0.7, - "learning_rate": 1.479716933422155e-05, - "loss": 2.2994, - "step": 403730 - }, - { - "epoch": 0.7, - "learning_rate": 1.4796297394294722e-05, - "loss": 2.3294, - "step": 403740 - }, - { - "epoch": 0.7, - "learning_rate": 1.4795425454367898e-05, - "loss": 2.3543, - "step": 403750 - }, - { - "epoch": 0.7, - "learning_rate": 1.479455351444107e-05, - "loss": 2.3779, - "step": 403760 - }, - { - "epoch": 0.7, - "learning_rate": 1.4793681574514242e-05, - "loss": 2.2753, - "step": 403770 - }, - { - "epoch": 0.7, - "learning_rate": 1.4792809634587416e-05, - "loss": 2.2847, - "step": 403780 - }, - { - "epoch": 0.7, - "learning_rate": 1.479193769466059e-05, - "loss": 2.3245, - "step": 403790 - }, - { - "epoch": 0.7, - "learning_rate": 1.4791065754733763e-05, - "loss": 2.3493, - "step": 403800 - }, - { - "epoch": 0.7, - "learning_rate": 1.4790193814806935e-05, - "loss": 2.3645, - "step": 403810 - }, - { - "epoch": 0.7, - "learning_rate": 1.4789321874880107e-05, - "loss": 2.4687, - "step": 403820 - }, - { - "epoch": 0.7, - "learning_rate": 1.4788449934953283e-05, - "loss": 2.302, - "step": 403830 - }, - { - "epoch": 0.7, - "learning_rate": 1.4787577995026455e-05, - "loss": 2.3528, - "step": 403840 - }, - { - "epoch": 0.7, - "learning_rate": 1.4786706055099627e-05, - "loss": 2.2615, - "step": 403850 - }, - { - "epoch": 0.7, - "learning_rate": 1.4785834115172802e-05, - "loss": 2.2823, - "step": 403860 - }, - { - "epoch": 0.7, - "learning_rate": 1.4784962175245976e-05, - "loss": 2.2736, - "step": 403870 - }, - { - "epoch": 0.7, - "learning_rate": 1.4784090235319148e-05, - "loss": 2.3577, - "step": 403880 - }, - { - "epoch": 0.7, - "learning_rate": 1.478321829539232e-05, - "loss": 2.2179, - "step": 403890 - }, - { - "epoch": 0.7, - "learning_rate": 1.4782346355465496e-05, - "loss": 2.4429, - "step": 403900 - }, - { - "epoch": 0.7, - "learning_rate": 1.4781474415538668e-05, - "loss": 2.3053, - "step": 403910 - }, - { - "epoch": 0.7, - "learning_rate": 1.478060247561184e-05, - "loss": 2.2781, - "step": 403920 - }, - { - "epoch": 0.7, - "learning_rate": 1.4779730535685014e-05, - "loss": 2.4213, - "step": 403930 - }, - { - "epoch": 0.7, - "learning_rate": 1.4778858595758188e-05, - "loss": 2.4395, - "step": 403940 - }, - { - "epoch": 0.7, - "learning_rate": 1.4777986655831361e-05, - "loss": 2.2535, - "step": 403950 - }, - { - "epoch": 0.7, - "learning_rate": 1.4777114715904533e-05, - "loss": 2.2925, - "step": 403960 - }, - { - "epoch": 0.7, - "learning_rate": 1.4776242775977705e-05, - "loss": 2.3395, - "step": 403970 - }, - { - "epoch": 0.7, - "learning_rate": 1.4775370836050881e-05, - "loss": 2.2903, - "step": 403980 - }, - { - "epoch": 0.7, - "learning_rate": 1.4774498896124053e-05, - "loss": 2.3215, - "step": 403990 - }, - { - "epoch": 0.7, - "learning_rate": 1.4773626956197225e-05, - "loss": 2.2772, - "step": 404000 - }, - { - "epoch": 0.7, - "learning_rate": 1.47727550162704e-05, - "loss": 2.3939, - "step": 404010 - }, - { - "epoch": 0.7, - "learning_rate": 1.4771883076343573e-05, - "loss": 2.2796, - "step": 404020 - }, - { - "epoch": 0.7, - "learning_rate": 1.4771011136416746e-05, - "loss": 2.2946, - "step": 404030 - }, - { - "epoch": 0.7, - "learning_rate": 1.4770139196489918e-05, - "loss": 2.2736, - "step": 404040 - }, - { - "epoch": 0.7, - "learning_rate": 1.4769267256563094e-05, - "loss": 2.2854, - "step": 404050 - }, - { - "epoch": 0.7, - "learning_rate": 1.4768395316636266e-05, - "loss": 2.3291, - "step": 404060 - }, - { - "epoch": 0.7, - "learning_rate": 1.4767523376709438e-05, - "loss": 2.2812, - "step": 404070 - }, - { - "epoch": 0.7, - "learning_rate": 1.476665143678261e-05, - "loss": 2.317, - "step": 404080 - }, - { - "epoch": 0.7, - "learning_rate": 1.4765779496855786e-05, - "loss": 2.2407, - "step": 404090 - }, - { - "epoch": 0.7, - "learning_rate": 1.4764907556928958e-05, - "loss": 2.2345, - "step": 404100 - }, - { - "epoch": 0.7, - "learning_rate": 1.4764035617002131e-05, - "loss": 2.3509, - "step": 404110 - }, - { - "epoch": 0.7, - "learning_rate": 1.4763163677075307e-05, - "loss": 2.194, - "step": 404120 - }, - { - "epoch": 0.7, - "learning_rate": 1.4762291737148479e-05, - "loss": 2.4011, - "step": 404130 - }, - { - "epoch": 0.7, - "learning_rate": 1.4761419797221651e-05, - "loss": 2.2844, - "step": 404140 - }, - { - "epoch": 0.7, - "learning_rate": 1.4760547857294823e-05, - "loss": 2.3464, - "step": 404150 - }, - { - "epoch": 0.7, - "learning_rate": 1.4759675917367999e-05, - "loss": 2.2672, - "step": 404160 - }, - { - "epoch": 0.7, - "learning_rate": 1.475880397744117e-05, - "loss": 2.2867, - "step": 404170 - }, - { - "epoch": 0.7, - "learning_rate": 1.4757932037514344e-05, - "loss": 2.3923, - "step": 404180 - }, - { - "epoch": 0.7, - "learning_rate": 1.4757060097587517e-05, - "loss": 2.2955, - "step": 404190 - }, - { - "epoch": 0.7, - "learning_rate": 1.4756188157660692e-05, - "loss": 2.292, - "step": 404200 - }, - { - "epoch": 0.7, - "learning_rate": 1.4755316217733864e-05, - "loss": 2.267, - "step": 404210 - }, - { - "epoch": 0.7, - "learning_rate": 1.4754444277807036e-05, - "loss": 2.2697, - "step": 404220 - }, - { - "epoch": 0.7, - "learning_rate": 1.4753572337880208e-05, - "loss": 2.294, - "step": 404230 - }, - { - "epoch": 0.7, - "learning_rate": 1.4752700397953384e-05, - "loss": 2.2056, - "step": 404240 - }, - { - "epoch": 0.7, - "learning_rate": 1.4751828458026556e-05, - "loss": 2.2641, - "step": 404250 - }, - { - "epoch": 0.7, - "learning_rate": 1.475095651809973e-05, - "loss": 2.3967, - "step": 404260 - }, - { - "epoch": 0.7, - "learning_rate": 1.4750084578172903e-05, - "loss": 2.3665, - "step": 404270 - }, - { - "epoch": 0.71, - "learning_rate": 1.4749212638246077e-05, - "loss": 2.2526, - "step": 404280 - }, - { - "epoch": 0.71, - "learning_rate": 1.474834069831925e-05, - "loss": 2.3094, - "step": 404290 - }, - { - "epoch": 0.71, - "learning_rate": 1.4747468758392421e-05, - "loss": 2.2828, - "step": 404300 - }, - { - "epoch": 0.71, - "learning_rate": 1.4746596818465597e-05, - "loss": 2.3039, - "step": 404310 - }, - { - "epoch": 0.71, - "learning_rate": 1.4745724878538769e-05, - "loss": 2.4298, - "step": 404320 - }, - { - "epoch": 0.71, - "learning_rate": 1.4744852938611941e-05, - "loss": 2.3901, - "step": 404330 - }, - { - "epoch": 0.71, - "learning_rate": 1.4743980998685115e-05, - "loss": 2.4151, - "step": 404340 - }, - { - "epoch": 0.71, - "learning_rate": 1.474310905875829e-05, - "loss": 2.3485, - "step": 404350 - }, - { - "epoch": 0.71, - "learning_rate": 1.4742237118831462e-05, - "loss": 2.2297, - "step": 404360 - }, - { - "epoch": 0.71, - "learning_rate": 1.4741365178904634e-05, - "loss": 2.3955, - "step": 404370 - }, - { - "epoch": 0.71, - "learning_rate": 1.474049323897781e-05, - "loss": 2.3048, - "step": 404380 - }, - { - "epoch": 0.71, - "learning_rate": 1.4739621299050982e-05, - "loss": 2.3284, - "step": 404390 - }, - { - "epoch": 0.71, - "learning_rate": 1.4738749359124154e-05, - "loss": 2.2376, - "step": 404400 - }, - { - "epoch": 0.71, - "learning_rate": 1.4737877419197326e-05, - "loss": 2.2969, - "step": 404410 - }, - { - "epoch": 0.71, - "learning_rate": 1.4737005479270501e-05, - "loss": 2.3709, - "step": 404420 - }, - { - "epoch": 0.71, - "learning_rate": 1.4736133539343675e-05, - "loss": 2.2556, - "step": 404430 - }, - { - "epoch": 0.71, - "learning_rate": 1.4735261599416847e-05, - "loss": 2.21, - "step": 404440 - }, - { - "epoch": 0.71, - "learning_rate": 1.473438965949002e-05, - "loss": 2.255, - "step": 404450 - }, - { - "epoch": 0.71, - "learning_rate": 1.4733517719563195e-05, - "loss": 2.1935, - "step": 404460 - }, - { - "epoch": 0.71, - "learning_rate": 1.4732645779636367e-05, - "loss": 2.3582, - "step": 404470 - }, - { - "epoch": 0.71, - "learning_rate": 1.4731773839709539e-05, - "loss": 2.268, - "step": 404480 - }, - { - "epoch": 0.71, - "learning_rate": 1.4730901899782713e-05, - "loss": 2.3245, - "step": 404490 - }, - { - "epoch": 0.71, - "learning_rate": 1.4730029959855886e-05, - "loss": 2.3566, - "step": 404500 - }, - { - "epoch": 0.71, - "learning_rate": 1.472915801992906e-05, - "loss": 2.3303, - "step": 404510 - }, - { - "epoch": 0.71, - "learning_rate": 1.4728286080002232e-05, - "loss": 2.3134, - "step": 404520 - }, - { - "epoch": 0.71, - "learning_rate": 1.4727414140075408e-05, - "loss": 2.316, - "step": 404530 - }, - { - "epoch": 0.71, - "learning_rate": 1.472654220014858e-05, - "loss": 2.3314, - "step": 404540 - }, - { - "epoch": 0.71, - "learning_rate": 1.4725670260221752e-05, - "loss": 2.2756, - "step": 404550 - }, - { - "epoch": 0.71, - "learning_rate": 1.4724798320294924e-05, - "loss": 2.3111, - "step": 404560 - }, - { - "epoch": 0.71, - "learning_rate": 1.47239263803681e-05, - "loss": 2.2404, - "step": 404570 - }, - { - "epoch": 0.71, - "learning_rate": 1.4723054440441272e-05, - "loss": 2.2482, - "step": 404580 - }, - { - "epoch": 0.71, - "learning_rate": 1.4722182500514445e-05, - "loss": 2.2734, - "step": 404590 - }, - { - "epoch": 0.71, - "learning_rate": 1.4721310560587617e-05, - "loss": 2.1869, - "step": 404600 - }, - { - "epoch": 0.71, - "learning_rate": 1.4720438620660793e-05, - "loss": 2.2696, - "step": 404610 - }, - { - "epoch": 0.71, - "learning_rate": 1.4719566680733965e-05, - "loss": 2.3672, - "step": 404620 - }, - { - "epoch": 0.71, - "learning_rate": 1.4718694740807137e-05, - "loss": 2.2506, - "step": 404630 - }, - { - "epoch": 0.71, - "learning_rate": 1.4717822800880313e-05, - "loss": 2.3698, - "step": 404640 - }, - { - "epoch": 0.71, - "learning_rate": 1.4716950860953485e-05, - "loss": 2.3726, - "step": 404650 - }, - { - "epoch": 0.71, - "learning_rate": 1.4716078921026658e-05, - "loss": 2.2425, - "step": 404660 - }, - { - "epoch": 0.71, - "learning_rate": 1.471520698109983e-05, - "loss": 2.3471, - "step": 404670 - }, - { - "epoch": 0.71, - "learning_rate": 1.4714335041173006e-05, - "loss": 2.2781, - "step": 404680 - }, - { - "epoch": 0.71, - "learning_rate": 1.4713463101246178e-05, - "loss": 2.2313, - "step": 404690 - }, - { - "epoch": 0.71, - "learning_rate": 1.471259116131935e-05, - "loss": 2.2636, - "step": 404700 - }, - { - "epoch": 0.71, - "learning_rate": 1.4711719221392522e-05, - "loss": 2.3778, - "step": 404710 - }, - { - "epoch": 0.71, - "learning_rate": 1.4710847281465698e-05, - "loss": 2.3587, - "step": 404720 - }, - { - "epoch": 0.71, - "learning_rate": 1.470997534153887e-05, - "loss": 2.3345, - "step": 404730 - }, - { - "epoch": 0.71, - "learning_rate": 1.4709103401612043e-05, - "loss": 2.3122, - "step": 404740 - }, - { - "epoch": 0.71, - "learning_rate": 1.4708231461685215e-05, - "loss": 2.3332, - "step": 404750 - }, - { - "epoch": 0.71, - "learning_rate": 1.4707359521758391e-05, - "loss": 2.2986, - "step": 404760 - }, - { - "epoch": 0.71, - "learning_rate": 1.4706487581831563e-05, - "loss": 2.2207, - "step": 404770 - }, - { - "epoch": 0.71, - "learning_rate": 1.4705615641904735e-05, - "loss": 2.2933, - "step": 404780 - }, - { - "epoch": 0.71, - "learning_rate": 1.470474370197791e-05, - "loss": 2.3005, - "step": 404790 - }, - { - "epoch": 0.71, - "learning_rate": 1.4703871762051083e-05, - "loss": 2.3285, - "step": 404800 - }, - { - "epoch": 0.71, - "learning_rate": 1.4702999822124255e-05, - "loss": 2.4306, - "step": 404810 - }, - { - "epoch": 0.71, - "learning_rate": 1.4702127882197429e-05, - "loss": 2.185, - "step": 404820 - }, - { - "epoch": 0.71, - "learning_rate": 1.4701255942270602e-05, - "loss": 2.3834, - "step": 404830 - }, - { - "epoch": 0.71, - "learning_rate": 1.4700384002343776e-05, - "loss": 2.3335, - "step": 404840 - }, - { - "epoch": 0.71, - "learning_rate": 1.4699512062416948e-05, - "loss": 2.3367, - "step": 404850 - }, - { - "epoch": 0.71, - "learning_rate": 1.469864012249012e-05, - "loss": 2.3473, - "step": 404860 - }, - { - "epoch": 0.71, - "learning_rate": 1.4697768182563296e-05, - "loss": 2.2252, - "step": 404870 - }, - { - "epoch": 0.71, - "learning_rate": 1.4696896242636468e-05, - "loss": 2.3771, - "step": 404880 - }, - { - "epoch": 0.71, - "learning_rate": 1.469602430270964e-05, - "loss": 2.325, - "step": 404890 - }, - { - "epoch": 0.71, - "learning_rate": 1.4695152362782814e-05, - "loss": 2.331, - "step": 404900 - }, - { - "epoch": 0.71, - "learning_rate": 1.4694280422855989e-05, - "loss": 2.3362, - "step": 404910 - }, - { - "epoch": 0.71, - "learning_rate": 1.4693408482929161e-05, - "loss": 2.3556, - "step": 404920 - }, - { - "epoch": 0.71, - "learning_rate": 1.4692536543002333e-05, - "loss": 2.3203, - "step": 404930 - }, - { - "epoch": 0.71, - "learning_rate": 1.4691664603075509e-05, - "loss": 2.4027, - "step": 404940 - }, - { - "epoch": 0.71, - "learning_rate": 1.469079266314868e-05, - "loss": 2.2577, - "step": 404950 - }, - { - "epoch": 0.71, - "learning_rate": 1.4689920723221853e-05, - "loss": 2.2799, - "step": 404960 - }, - { - "epoch": 0.71, - "learning_rate": 1.4689048783295027e-05, - "loss": 2.271, - "step": 404970 - }, - { - "epoch": 0.71, - "learning_rate": 1.46881768433682e-05, - "loss": 2.3234, - "step": 404980 - }, - { - "epoch": 0.71, - "learning_rate": 1.4687304903441374e-05, - "loss": 2.2289, - "step": 404990 - }, - { - "epoch": 0.71, - "learning_rate": 1.4686432963514546e-05, - "loss": 2.2303, - "step": 405000 - }, - { - "epoch": 0.71, - "learning_rate": 1.4685561023587718e-05, - "loss": 2.3355, - "step": 405010 - }, - { - "epoch": 0.71, - "learning_rate": 1.4684689083660894e-05, - "loss": 2.3081, - "step": 405020 - }, - { - "epoch": 0.71, - "learning_rate": 1.4683817143734066e-05, - "loss": 2.2528, - "step": 405030 - }, - { - "epoch": 0.71, - "learning_rate": 1.4682945203807238e-05, - "loss": 2.3264, - "step": 405040 - }, - { - "epoch": 0.71, - "learning_rate": 1.4682073263880413e-05, - "loss": 2.3082, - "step": 405050 - }, - { - "epoch": 0.71, - "learning_rate": 1.4681201323953585e-05, - "loss": 2.3139, - "step": 405060 - }, - { - "epoch": 0.71, - "learning_rate": 1.468032938402676e-05, - "loss": 2.1947, - "step": 405070 - }, - { - "epoch": 0.71, - "learning_rate": 1.4679457444099931e-05, - "loss": 2.336, - "step": 405080 - }, - { - "epoch": 0.71, - "learning_rate": 1.4678585504173107e-05, - "loss": 2.3672, - "step": 405090 - }, - { - "epoch": 0.71, - "learning_rate": 1.4677713564246279e-05, - "loss": 2.2876, - "step": 405100 - }, - { - "epoch": 0.71, - "learning_rate": 1.4676841624319451e-05, - "loss": 2.2318, - "step": 405110 - }, - { - "epoch": 0.71, - "learning_rate": 1.4675969684392623e-05, - "loss": 2.2785, - "step": 405120 - }, - { - "epoch": 0.71, - "learning_rate": 1.4675097744465798e-05, - "loss": 2.26, - "step": 405130 - }, - { - "epoch": 0.71, - "learning_rate": 1.467422580453897e-05, - "loss": 2.2721, - "step": 405140 - }, - { - "epoch": 0.71, - "learning_rate": 1.4673353864612144e-05, - "loss": 2.3147, - "step": 405150 - }, - { - "epoch": 0.71, - "learning_rate": 1.4672481924685316e-05, - "loss": 2.2652, - "step": 405160 - }, - { - "epoch": 0.71, - "learning_rate": 1.4671609984758492e-05, - "loss": 2.3489, - "step": 405170 - }, - { - "epoch": 0.71, - "learning_rate": 1.4670738044831664e-05, - "loss": 2.2394, - "step": 405180 - }, - { - "epoch": 0.71, - "learning_rate": 1.4669866104904836e-05, - "loss": 2.392, - "step": 405190 - }, - { - "epoch": 0.71, - "learning_rate": 1.4668994164978011e-05, - "loss": 2.1843, - "step": 405200 - }, - { - "epoch": 0.71, - "learning_rate": 1.4668122225051184e-05, - "loss": 2.3436, - "step": 405210 - }, - { - "epoch": 0.71, - "learning_rate": 1.4667250285124357e-05, - "loss": 2.3696, - "step": 405220 - }, - { - "epoch": 0.71, - "learning_rate": 1.466637834519753e-05, - "loss": 2.167, - "step": 405230 - }, - { - "epoch": 0.71, - "learning_rate": 1.4665506405270705e-05, - "loss": 2.325, - "step": 405240 - }, - { - "epoch": 0.71, - "learning_rate": 1.4664634465343877e-05, - "loss": 2.2067, - "step": 405250 - }, - { - "epoch": 0.71, - "learning_rate": 1.4663762525417049e-05, - "loss": 2.4072, - "step": 405260 - }, - { - "epoch": 0.71, - "learning_rate": 1.4662890585490221e-05, - "loss": 2.33, - "step": 405270 - }, - { - "epoch": 0.71, - "learning_rate": 1.4662018645563397e-05, - "loss": 2.3152, - "step": 405280 - }, - { - "epoch": 0.71, - "learning_rate": 1.4661146705636569e-05, - "loss": 2.247, - "step": 405290 - }, - { - "epoch": 0.71, - "learning_rate": 1.4660274765709742e-05, - "loss": 2.3903, - "step": 405300 - }, - { - "epoch": 0.71, - "learning_rate": 1.4659402825782916e-05, - "loss": 2.3047, - "step": 405310 - }, - { - "epoch": 0.71, - "learning_rate": 1.465853088585609e-05, - "loss": 2.2341, - "step": 405320 - }, - { - "epoch": 0.71, - "learning_rate": 1.4657658945929262e-05, - "loss": 2.2593, - "step": 405330 - }, - { - "epoch": 0.71, - "learning_rate": 1.4656787006002434e-05, - "loss": 2.2686, - "step": 405340 - }, - { - "epoch": 0.71, - "learning_rate": 1.465591506607561e-05, - "loss": 2.3717, - "step": 405350 - }, - { - "epoch": 0.71, - "learning_rate": 1.4655043126148782e-05, - "loss": 2.3166, - "step": 405360 - }, - { - "epoch": 0.71, - "learning_rate": 1.4654171186221954e-05, - "loss": 2.3889, - "step": 405370 - }, - { - "epoch": 0.71, - "learning_rate": 1.4653299246295127e-05, - "loss": 2.2835, - "step": 405380 - }, - { - "epoch": 0.71, - "learning_rate": 1.4652427306368303e-05, - "loss": 2.2791, - "step": 405390 - }, - { - "epoch": 0.71, - "learning_rate": 1.4651555366441475e-05, - "loss": 2.3842, - "step": 405400 - }, - { - "epoch": 0.71, - "learning_rate": 1.4650683426514647e-05, - "loss": 2.3392, - "step": 405410 - }, - { - "epoch": 0.71, - "learning_rate": 1.4649811486587819e-05, - "loss": 2.3122, - "step": 405420 - }, - { - "epoch": 0.71, - "learning_rate": 1.4648939546660995e-05, - "loss": 2.3388, - "step": 405430 - }, - { - "epoch": 0.71, - "learning_rate": 1.4648067606734167e-05, - "loss": 2.3371, - "step": 405440 - }, - { - "epoch": 0.71, - "learning_rate": 1.4647195666807339e-05, - "loss": 2.342, - "step": 405450 - }, - { - "epoch": 0.71, - "learning_rate": 1.4646323726880514e-05, - "loss": 2.2974, - "step": 405460 - }, - { - "epoch": 0.71, - "learning_rate": 1.4645451786953688e-05, - "loss": 2.2981, - "step": 405470 - }, - { - "epoch": 0.71, - "learning_rate": 1.464457984702686e-05, - "loss": 2.2609, - "step": 405480 - }, - { - "epoch": 0.71, - "learning_rate": 1.4643707907100032e-05, - "loss": 2.3585, - "step": 405490 - }, - { - "epoch": 0.71, - "learning_rate": 1.4642835967173208e-05, - "loss": 2.2998, - "step": 405500 - }, - { - "epoch": 0.71, - "learning_rate": 1.464196402724638e-05, - "loss": 2.3295, - "step": 405510 - }, - { - "epoch": 0.71, - "learning_rate": 1.4641092087319552e-05, - "loss": 2.3237, - "step": 405520 - }, - { - "epoch": 0.71, - "learning_rate": 1.4640220147392726e-05, - "loss": 2.2822, - "step": 405530 - }, - { - "epoch": 0.71, - "learning_rate": 1.46393482074659e-05, - "loss": 2.259, - "step": 405540 - }, - { - "epoch": 0.71, - "learning_rate": 1.4638476267539073e-05, - "loss": 2.2917, - "step": 405550 - }, - { - "epoch": 0.71, - "learning_rate": 1.4637604327612245e-05, - "loss": 2.2778, - "step": 405560 - }, - { - "epoch": 0.71, - "learning_rate": 1.463673238768542e-05, - "loss": 2.2588, - "step": 405570 - }, - { - "epoch": 0.71, - "learning_rate": 1.4635860447758593e-05, - "loss": 2.3896, - "step": 405580 - }, - { - "epoch": 0.71, - "learning_rate": 1.4634988507831765e-05, - "loss": 2.2729, - "step": 405590 - }, - { - "epoch": 0.71, - "learning_rate": 1.4634116567904937e-05, - "loss": 2.2293, - "step": 405600 - }, - { - "epoch": 0.71, - "learning_rate": 1.4633244627978112e-05, - "loss": 2.2916, - "step": 405610 - }, - { - "epoch": 0.71, - "learning_rate": 1.4632372688051284e-05, - "loss": 2.341, - "step": 405620 - }, - { - "epoch": 0.71, - "learning_rate": 1.4631500748124458e-05, - "loss": 2.3481, - "step": 405630 - }, - { - "epoch": 0.71, - "learning_rate": 1.463062880819763e-05, - "loss": 2.3005, - "step": 405640 - }, - { - "epoch": 0.71, - "learning_rate": 1.4629756868270806e-05, - "loss": 2.2919, - "step": 405650 - }, - { - "epoch": 0.71, - "learning_rate": 1.4628884928343978e-05, - "loss": 2.2994, - "step": 405660 - }, - { - "epoch": 0.71, - "learning_rate": 1.462801298841715e-05, - "loss": 2.1775, - "step": 405670 - }, - { - "epoch": 0.71, - "learning_rate": 1.4627141048490322e-05, - "loss": 2.2564, - "step": 405680 - }, - { - "epoch": 0.71, - "learning_rate": 1.4626269108563497e-05, - "loss": 2.3848, - "step": 405690 - }, - { - "epoch": 0.71, - "learning_rate": 1.4625397168636671e-05, - "loss": 2.3866, - "step": 405700 - }, - { - "epoch": 0.71, - "learning_rate": 1.4624525228709843e-05, - "loss": 2.3366, - "step": 405710 - }, - { - "epoch": 0.71, - "learning_rate": 1.4623653288783019e-05, - "loss": 2.2779, - "step": 405720 - }, - { - "epoch": 0.71, - "learning_rate": 1.462278134885619e-05, - "loss": 2.3646, - "step": 405730 - }, - { - "epoch": 0.71, - "learning_rate": 1.4621909408929363e-05, - "loss": 2.3205, - "step": 405740 - }, - { - "epoch": 0.71, - "learning_rate": 1.4621037469002535e-05, - "loss": 2.3229, - "step": 405750 - }, - { - "epoch": 0.71, - "learning_rate": 1.462016552907571e-05, - "loss": 2.2258, - "step": 405760 - }, - { - "epoch": 0.71, - "learning_rate": 1.4619293589148882e-05, - "loss": 2.2275, - "step": 405770 - }, - { - "epoch": 0.71, - "learning_rate": 1.4618421649222056e-05, - "loss": 2.3233, - "step": 405780 - }, - { - "epoch": 0.71, - "learning_rate": 1.4617549709295228e-05, - "loss": 2.4321, - "step": 405790 - }, - { - "epoch": 0.71, - "learning_rate": 1.4616677769368404e-05, - "loss": 2.2646, - "step": 405800 - }, - { - "epoch": 0.71, - "learning_rate": 1.4615805829441576e-05, - "loss": 2.3205, - "step": 405810 - }, - { - "epoch": 0.71, - "learning_rate": 1.4614933889514748e-05, - "loss": 2.3677, - "step": 405820 - }, - { - "epoch": 0.71, - "learning_rate": 1.461406194958792e-05, - "loss": 2.3217, - "step": 405830 - }, - { - "epoch": 0.71, - "learning_rate": 1.4613190009661095e-05, - "loss": 2.2297, - "step": 405840 - }, - { - "epoch": 0.71, - "learning_rate": 1.4612318069734268e-05, - "loss": 2.1955, - "step": 405850 - }, - { - "epoch": 0.71, - "learning_rate": 1.4611446129807441e-05, - "loss": 2.3676, - "step": 405860 - }, - { - "epoch": 0.71, - "learning_rate": 1.4610574189880615e-05, - "loss": 2.2545, - "step": 405870 - }, - { - "epoch": 0.71, - "learning_rate": 1.4609702249953789e-05, - "loss": 2.3455, - "step": 405880 - }, - { - "epoch": 0.71, - "learning_rate": 1.4608830310026961e-05, - "loss": 2.2587, - "step": 405890 - }, - { - "epoch": 0.71, - "learning_rate": 1.4607958370100133e-05, - "loss": 2.3584, - "step": 405900 - }, - { - "epoch": 0.71, - "learning_rate": 1.4607086430173308e-05, - "loss": 2.2252, - "step": 405910 - }, - { - "epoch": 0.71, - "learning_rate": 1.460621449024648e-05, - "loss": 2.3208, - "step": 405920 - }, - { - "epoch": 0.71, - "learning_rate": 1.4605342550319653e-05, - "loss": 2.3625, - "step": 405930 - }, - { - "epoch": 0.71, - "learning_rate": 1.4604470610392826e-05, - "loss": 2.2457, - "step": 405940 - }, - { - "epoch": 0.71, - "learning_rate": 1.4603598670466002e-05, - "loss": 2.2162, - "step": 405950 - }, - { - "epoch": 0.71, - "learning_rate": 1.4602726730539174e-05, - "loss": 2.2952, - "step": 405960 - }, - { - "epoch": 0.71, - "learning_rate": 1.4601854790612346e-05, - "loss": 2.3628, - "step": 405970 - }, - { - "epoch": 0.71, - "learning_rate": 1.4600982850685521e-05, - "loss": 2.3549, - "step": 405980 - }, - { - "epoch": 0.71, - "learning_rate": 1.4600110910758694e-05, - "loss": 2.3194, - "step": 405990 - }, - { - "epoch": 0.71, - "learning_rate": 1.4599238970831866e-05, - "loss": 2.3571, - "step": 406000 - }, - { - "epoch": 0.71, - "learning_rate": 1.459836703090504e-05, - "loss": 2.3875, - "step": 406010 - }, - { - "epoch": 0.71, - "learning_rate": 1.4597495090978213e-05, - "loss": 2.3327, - "step": 406020 - }, - { - "epoch": 0.71, - "learning_rate": 1.4596623151051387e-05, - "loss": 2.2434, - "step": 406030 - }, - { - "epoch": 0.71, - "learning_rate": 1.4595751211124559e-05, - "loss": 2.2908, - "step": 406040 - }, - { - "epoch": 0.71, - "learning_rate": 1.4594879271197731e-05, - "loss": 2.2484, - "step": 406050 - }, - { - "epoch": 0.71, - "learning_rate": 1.4594007331270907e-05, - "loss": 2.2777, - "step": 406060 - }, - { - "epoch": 0.71, - "learning_rate": 1.4593135391344079e-05, - "loss": 2.3066, - "step": 406070 - }, - { - "epoch": 0.71, - "learning_rate": 1.459226345141725e-05, - "loss": 2.2157, - "step": 406080 - }, - { - "epoch": 0.71, - "learning_rate": 1.4591391511490424e-05, - "loss": 2.2501, - "step": 406090 - }, - { - "epoch": 0.71, - "learning_rate": 1.4590519571563598e-05, - "loss": 2.3046, - "step": 406100 - }, - { - "epoch": 0.71, - "learning_rate": 1.4589647631636772e-05, - "loss": 2.3513, - "step": 406110 - }, - { - "epoch": 0.71, - "learning_rate": 1.4588775691709944e-05, - "loss": 2.302, - "step": 406120 - }, - { - "epoch": 0.71, - "learning_rate": 1.458790375178312e-05, - "loss": 2.3496, - "step": 406130 - }, - { - "epoch": 0.71, - "learning_rate": 1.4587031811856292e-05, - "loss": 2.3269, - "step": 406140 - }, - { - "epoch": 0.71, - "learning_rate": 1.4586159871929464e-05, - "loss": 2.3033, - "step": 406150 - }, - { - "epoch": 0.71, - "learning_rate": 1.4585287932002636e-05, - "loss": 2.2392, - "step": 406160 - }, - { - "epoch": 0.71, - "learning_rate": 1.4584415992075811e-05, - "loss": 2.2866, - "step": 406170 - }, - { - "epoch": 0.71, - "learning_rate": 1.4583544052148983e-05, - "loss": 2.3122, - "step": 406180 - }, - { - "epoch": 0.71, - "learning_rate": 1.4582672112222157e-05, - "loss": 2.3633, - "step": 406190 - }, - { - "epoch": 0.71, - "learning_rate": 1.4581800172295329e-05, - "loss": 2.427, - "step": 406200 - }, - { - "epoch": 0.71, - "learning_rate": 1.4580928232368505e-05, - "loss": 2.4307, - "step": 406210 - }, - { - "epoch": 0.71, - "learning_rate": 1.4580056292441677e-05, - "loss": 2.3017, - "step": 406220 - }, - { - "epoch": 0.71, - "learning_rate": 1.4579184352514849e-05, - "loss": 2.3263, - "step": 406230 - }, - { - "epoch": 0.71, - "learning_rate": 1.4578312412588024e-05, - "loss": 2.3203, - "step": 406240 - }, - { - "epoch": 0.71, - "learning_rate": 1.4577440472661196e-05, - "loss": 2.2139, - "step": 406250 - }, - { - "epoch": 0.71, - "learning_rate": 1.457656853273437e-05, - "loss": 2.1539, - "step": 406260 - }, - { - "epoch": 0.71, - "learning_rate": 1.4575696592807542e-05, - "loss": 2.3035, - "step": 406270 - }, - { - "epoch": 0.71, - "learning_rate": 1.4574824652880718e-05, - "loss": 2.3462, - "step": 406280 - }, - { - "epoch": 0.71, - "learning_rate": 1.457395271295389e-05, - "loss": 2.2276, - "step": 406290 - }, - { - "epoch": 0.71, - "learning_rate": 1.4573080773027062e-05, - "loss": 2.3536, - "step": 406300 - }, - { - "epoch": 0.71, - "learning_rate": 1.4572208833100234e-05, - "loss": 2.2612, - "step": 406310 - }, - { - "epoch": 0.71, - "learning_rate": 1.457133689317341e-05, - "loss": 2.3002, - "step": 406320 - }, - { - "epoch": 0.71, - "learning_rate": 1.4570464953246581e-05, - "loss": 2.2195, - "step": 406330 - }, - { - "epoch": 0.71, - "learning_rate": 1.4569593013319755e-05, - "loss": 2.2572, - "step": 406340 - }, - { - "epoch": 0.71, - "learning_rate": 1.4568721073392927e-05, - "loss": 2.3544, - "step": 406350 - }, - { - "epoch": 0.71, - "learning_rate": 1.4567849133466103e-05, - "loss": 2.1754, - "step": 406360 - }, - { - "epoch": 0.71, - "learning_rate": 1.4566977193539275e-05, - "loss": 2.1899, - "step": 406370 - }, - { - "epoch": 0.71, - "learning_rate": 1.4566105253612447e-05, - "loss": 2.2235, - "step": 406380 - }, - { - "epoch": 0.71, - "learning_rate": 1.4565233313685622e-05, - "loss": 2.2945, - "step": 406390 - }, - { - "epoch": 0.71, - "learning_rate": 1.4564361373758794e-05, - "loss": 2.3305, - "step": 406400 - }, - { - "epoch": 0.71, - "learning_rate": 1.4563489433831966e-05, - "loss": 2.2789, - "step": 406410 - }, - { - "epoch": 0.71, - "learning_rate": 1.456261749390514e-05, - "loss": 2.327, - "step": 406420 - }, - { - "epoch": 0.71, - "learning_rate": 1.4561745553978316e-05, - "loss": 2.1705, - "step": 406430 - }, - { - "epoch": 0.71, - "learning_rate": 1.4560873614051488e-05, - "loss": 2.3384, - "step": 406440 - }, - { - "epoch": 0.71, - "learning_rate": 1.456000167412466e-05, - "loss": 2.1935, - "step": 406450 - }, - { - "epoch": 0.71, - "learning_rate": 1.4559129734197832e-05, - "loss": 2.2937, - "step": 406460 - }, - { - "epoch": 0.71, - "learning_rate": 1.4558257794271007e-05, - "loss": 2.2786, - "step": 406470 - }, - { - "epoch": 0.71, - "learning_rate": 1.455738585434418e-05, - "loss": 2.2411, - "step": 406480 - }, - { - "epoch": 0.71, - "learning_rate": 1.4556513914417352e-05, - "loss": 2.3001, - "step": 406490 - }, - { - "epoch": 0.71, - "learning_rate": 1.4555641974490527e-05, - "loss": 2.3357, - "step": 406500 - }, - { - "epoch": 0.71, - "learning_rate": 1.45547700345637e-05, - "loss": 2.3119, - "step": 406510 - }, - { - "epoch": 0.71, - "learning_rate": 1.4553898094636873e-05, - "loss": 2.3392, - "step": 406520 - }, - { - "epoch": 0.71, - "learning_rate": 1.4553026154710045e-05, - "loss": 2.2411, - "step": 406530 - }, - { - "epoch": 0.71, - "learning_rate": 1.455215421478322e-05, - "loss": 2.2285, - "step": 406540 - }, - { - "epoch": 0.71, - "learning_rate": 1.4551282274856392e-05, - "loss": 2.3513, - "step": 406550 - }, - { - "epoch": 0.71, - "learning_rate": 1.4550410334929565e-05, - "loss": 2.3249, - "step": 406560 - }, - { - "epoch": 0.71, - "learning_rate": 1.4549538395002738e-05, - "loss": 2.2917, - "step": 406570 - }, - { - "epoch": 0.71, - "learning_rate": 1.4548666455075912e-05, - "loss": 2.3717, - "step": 406580 - }, - { - "epoch": 0.71, - "learning_rate": 1.4547794515149086e-05, - "loss": 2.185, - "step": 406590 - }, - { - "epoch": 0.71, - "learning_rate": 1.4546922575222258e-05, - "loss": 2.2745, - "step": 406600 - }, - { - "epoch": 0.71, - "learning_rate": 1.454605063529543e-05, - "loss": 2.2326, - "step": 406610 - }, - { - "epoch": 0.71, - "learning_rate": 1.4545178695368605e-05, - "loss": 2.3097, - "step": 406620 - }, - { - "epoch": 0.71, - "learning_rate": 1.4544306755441778e-05, - "loss": 2.1192, - "step": 406630 - }, - { - "epoch": 0.71, - "learning_rate": 1.454343481551495e-05, - "loss": 2.3642, - "step": 406640 - }, - { - "epoch": 0.71, - "learning_rate": 1.4542562875588125e-05, - "loss": 2.4093, - "step": 406650 - }, - { - "epoch": 0.71, - "learning_rate": 1.4541690935661297e-05, - "loss": 2.2512, - "step": 406660 - }, - { - "epoch": 0.71, - "learning_rate": 1.4540818995734471e-05, - "loss": 2.2511, - "step": 406670 - }, - { - "epoch": 0.71, - "learning_rate": 1.4539947055807643e-05, - "loss": 2.2553, - "step": 406680 - }, - { - "epoch": 0.71, - "learning_rate": 1.4539075115880818e-05, - "loss": 2.3681, - "step": 406690 - }, - { - "epoch": 0.71, - "learning_rate": 1.453820317595399e-05, - "loss": 2.3349, - "step": 406700 - }, - { - "epoch": 0.71, - "learning_rate": 1.4537331236027163e-05, - "loss": 2.286, - "step": 406710 - }, - { - "epoch": 0.71, - "learning_rate": 1.4536459296100335e-05, - "loss": 2.3432, - "step": 406720 - }, - { - "epoch": 0.71, - "learning_rate": 1.453558735617351e-05, - "loss": 2.2672, - "step": 406730 - }, - { - "epoch": 0.71, - "learning_rate": 1.4534715416246684e-05, - "loss": 2.3193, - "step": 406740 - }, - { - "epoch": 0.71, - "learning_rate": 1.4533843476319856e-05, - "loss": 2.3213, - "step": 406750 - }, - { - "epoch": 0.71, - "learning_rate": 1.4532971536393028e-05, - "loss": 2.3073, - "step": 406760 - }, - { - "epoch": 0.71, - "learning_rate": 1.4532099596466204e-05, - "loss": 2.3808, - "step": 406770 - }, - { - "epoch": 0.71, - "learning_rate": 1.4531227656539376e-05, - "loss": 2.282, - "step": 406780 - }, - { - "epoch": 0.71, - "learning_rate": 1.4530355716612548e-05, - "loss": 2.3605, - "step": 406790 - }, - { - "epoch": 0.71, - "learning_rate": 1.4529483776685723e-05, - "loss": 2.2274, - "step": 406800 - }, - { - "epoch": 0.71, - "learning_rate": 1.4528611836758895e-05, - "loss": 2.2345, - "step": 406810 - }, - { - "epoch": 0.71, - "learning_rate": 1.4527739896832069e-05, - "loss": 2.3542, - "step": 406820 - }, - { - "epoch": 0.71, - "learning_rate": 1.4526867956905241e-05, - "loss": 2.3284, - "step": 406830 - }, - { - "epoch": 0.71, - "learning_rate": 1.4525996016978417e-05, - "loss": 2.3225, - "step": 406840 - }, - { - "epoch": 0.71, - "learning_rate": 1.4525124077051589e-05, - "loss": 2.3539, - "step": 406850 - }, - { - "epoch": 0.71, - "learning_rate": 1.452425213712476e-05, - "loss": 2.2642, - "step": 406860 - }, - { - "epoch": 0.71, - "learning_rate": 1.4523380197197933e-05, - "loss": 2.1956, - "step": 406870 - }, - { - "epoch": 0.71, - "learning_rate": 1.4522508257271108e-05, - "loss": 2.3357, - "step": 406880 - }, - { - "epoch": 0.71, - "learning_rate": 1.452163631734428e-05, - "loss": 2.2694, - "step": 406890 - }, - { - "epoch": 0.71, - "learning_rate": 1.4520764377417454e-05, - "loss": 2.2282, - "step": 406900 - }, - { - "epoch": 0.71, - "learning_rate": 1.4519892437490628e-05, - "loss": 2.2994, - "step": 406910 - }, - { - "epoch": 0.71, - "learning_rate": 1.4519020497563802e-05, - "loss": 2.27, - "step": 406920 - }, - { - "epoch": 0.71, - "learning_rate": 1.4518148557636974e-05, - "loss": 2.2855, - "step": 406930 - }, - { - "epoch": 0.71, - "learning_rate": 1.4517276617710146e-05, - "loss": 2.4237, - "step": 406940 - }, - { - "epoch": 0.71, - "learning_rate": 1.4516404677783321e-05, - "loss": 2.3458, - "step": 406950 - }, - { - "epoch": 0.71, - "learning_rate": 1.4515532737856493e-05, - "loss": 2.308, - "step": 406960 - }, - { - "epoch": 0.71, - "learning_rate": 1.4514660797929665e-05, - "loss": 2.303, - "step": 406970 - }, - { - "epoch": 0.71, - "learning_rate": 1.4513788858002839e-05, - "loss": 2.2444, - "step": 406980 - }, - { - "epoch": 0.71, - "learning_rate": 1.4512916918076015e-05, - "loss": 2.1528, - "step": 406990 - }, - { - "epoch": 0.71, - "learning_rate": 1.4512044978149187e-05, - "loss": 2.3256, - "step": 407000 - }, - { - "epoch": 0.71, - "learning_rate": 1.4511173038222359e-05, - "loss": 2.354, - "step": 407010 - }, - { - "epoch": 0.71, - "learning_rate": 1.451030109829553e-05, - "loss": 2.4322, - "step": 407020 - }, - { - "epoch": 0.71, - "learning_rate": 1.4509429158368706e-05, - "loss": 2.355, - "step": 407030 - }, - { - "epoch": 0.71, - "learning_rate": 1.4508557218441878e-05, - "loss": 2.263, - "step": 407040 - }, - { - "epoch": 0.71, - "learning_rate": 1.4507685278515052e-05, - "loss": 2.2444, - "step": 407050 - }, - { - "epoch": 0.71, - "learning_rate": 1.4506813338588226e-05, - "loss": 2.2639, - "step": 407060 - }, - { - "epoch": 0.71, - "learning_rate": 1.45059413986614e-05, - "loss": 2.3254, - "step": 407070 - }, - { - "epoch": 0.71, - "learning_rate": 1.4505069458734572e-05, - "loss": 2.2285, - "step": 407080 - }, - { - "epoch": 0.71, - "learning_rate": 1.4504197518807744e-05, - "loss": 2.1984, - "step": 407090 - }, - { - "epoch": 0.71, - "learning_rate": 1.450332557888092e-05, - "loss": 2.4729, - "step": 407100 - }, - { - "epoch": 0.71, - "learning_rate": 1.4502453638954091e-05, - "loss": 2.2883, - "step": 407110 - }, - { - "epoch": 0.71, - "learning_rate": 1.4501581699027263e-05, - "loss": 2.238, - "step": 407120 - }, - { - "epoch": 0.71, - "learning_rate": 1.4500709759100437e-05, - "loss": 2.2113, - "step": 407130 - }, - { - "epoch": 0.71, - "learning_rate": 1.4499837819173611e-05, - "loss": 2.3442, - "step": 407140 - }, - { - "epoch": 0.71, - "learning_rate": 1.4498965879246785e-05, - "loss": 2.2011, - "step": 407150 - }, - { - "epoch": 0.71, - "learning_rate": 1.4498093939319957e-05, - "loss": 2.407, - "step": 407160 - }, - { - "epoch": 0.71, - "learning_rate": 1.4497221999393132e-05, - "loss": 2.361, - "step": 407170 - }, - { - "epoch": 0.71, - "learning_rate": 1.4496350059466304e-05, - "loss": 2.2028, - "step": 407180 - }, - { - "epoch": 0.71, - "learning_rate": 1.4495478119539476e-05, - "loss": 2.3988, - "step": 407190 - }, - { - "epoch": 0.71, - "learning_rate": 1.4494606179612649e-05, - "loss": 2.2833, - "step": 407200 - }, - { - "epoch": 0.71, - "learning_rate": 1.4493734239685824e-05, - "loss": 2.3814, - "step": 407210 - }, - { - "epoch": 0.71, - "learning_rate": 1.4492862299758996e-05, - "loss": 2.3984, - "step": 407220 - }, - { - "epoch": 0.71, - "learning_rate": 1.449199035983217e-05, - "loss": 2.4355, - "step": 407230 - }, - { - "epoch": 0.71, - "learning_rate": 1.4491118419905342e-05, - "loss": 2.3801, - "step": 407240 - }, - { - "epoch": 0.71, - "learning_rate": 1.4490246479978517e-05, - "loss": 2.3082, - "step": 407250 - }, - { - "epoch": 0.71, - "learning_rate": 1.448937454005169e-05, - "loss": 2.3526, - "step": 407260 - }, - { - "epoch": 0.71, - "learning_rate": 1.4488502600124862e-05, - "loss": 2.2429, - "step": 407270 - }, - { - "epoch": 0.71, - "learning_rate": 1.4487630660198034e-05, - "loss": 2.3291, - "step": 407280 - }, - { - "epoch": 0.71, - "learning_rate": 1.4486758720271209e-05, - "loss": 2.2962, - "step": 407290 - }, - { - "epoch": 0.71, - "learning_rate": 1.4485886780344383e-05, - "loss": 2.228, - "step": 407300 - }, - { - "epoch": 0.71, - "learning_rate": 1.4485014840417555e-05, - "loss": 2.3131, - "step": 407310 - }, - { - "epoch": 0.71, - "learning_rate": 1.448414290049073e-05, - "loss": 2.2817, - "step": 407320 - }, - { - "epoch": 0.71, - "learning_rate": 1.4483270960563902e-05, - "loss": 2.3272, - "step": 407330 - }, - { - "epoch": 0.71, - "learning_rate": 1.4482399020637075e-05, - "loss": 2.3096, - "step": 407340 - }, - { - "epoch": 0.71, - "learning_rate": 1.4481527080710247e-05, - "loss": 2.3315, - "step": 407350 - }, - { - "epoch": 0.71, - "learning_rate": 1.4480655140783422e-05, - "loss": 2.3018, - "step": 407360 - }, - { - "epoch": 0.71, - "learning_rate": 1.4479783200856594e-05, - "loss": 2.322, - "step": 407370 - }, - { - "epoch": 0.71, - "learning_rate": 1.4478911260929768e-05, - "loss": 2.3497, - "step": 407380 - }, - { - "epoch": 0.71, - "learning_rate": 1.447803932100294e-05, - "loss": 2.2925, - "step": 407390 - }, - { - "epoch": 0.71, - "learning_rate": 1.4477167381076115e-05, - "loss": 2.2791, - "step": 407400 - }, - { - "epoch": 0.71, - "learning_rate": 1.4476295441149288e-05, - "loss": 2.3135, - "step": 407410 - }, - { - "epoch": 0.71, - "learning_rate": 1.447542350122246e-05, - "loss": 2.2977, - "step": 407420 - }, - { - "epoch": 0.71, - "learning_rate": 1.4474551561295635e-05, - "loss": 2.3538, - "step": 407430 - }, - { - "epoch": 0.71, - "learning_rate": 1.4473679621368807e-05, - "loss": 2.3209, - "step": 407440 - }, - { - "epoch": 0.71, - "learning_rate": 1.447280768144198e-05, - "loss": 2.2611, - "step": 407450 - }, - { - "epoch": 0.71, - "learning_rate": 1.4471935741515153e-05, - "loss": 2.2475, - "step": 407460 - }, - { - "epoch": 0.71, - "learning_rate": 1.4471063801588328e-05, - "loss": 2.389, - "step": 407470 - }, - { - "epoch": 0.71, - "learning_rate": 1.44701918616615e-05, - "loss": 2.2823, - "step": 407480 - }, - { - "epoch": 0.71, - "learning_rate": 1.4469319921734673e-05, - "loss": 2.2456, - "step": 407490 - }, - { - "epoch": 0.71, - "learning_rate": 1.4468447981807845e-05, - "loss": 2.2022, - "step": 407500 - }, - { - "epoch": 0.71, - "learning_rate": 1.446757604188102e-05, - "loss": 2.3355, - "step": 407510 - }, - { - "epoch": 0.71, - "learning_rate": 1.4466704101954192e-05, - "loss": 2.3167, - "step": 407520 - }, - { - "epoch": 0.71, - "learning_rate": 1.4465832162027364e-05, - "loss": 2.2937, - "step": 407530 - }, - { - "epoch": 0.71, - "learning_rate": 1.4464960222100538e-05, - "loss": 2.308, - "step": 407540 - }, - { - "epoch": 0.71, - "learning_rate": 1.4464088282173714e-05, - "loss": 2.3358, - "step": 407550 - }, - { - "epoch": 0.71, - "learning_rate": 1.4463216342246886e-05, - "loss": 2.3867, - "step": 407560 - }, - { - "epoch": 0.71, - "learning_rate": 1.4462344402320058e-05, - "loss": 2.2005, - "step": 407570 - }, - { - "epoch": 0.71, - "learning_rate": 1.4461472462393233e-05, - "loss": 2.2486, - "step": 407580 - }, - { - "epoch": 0.71, - "learning_rate": 1.4460600522466405e-05, - "loss": 2.3812, - "step": 407590 - }, - { - "epoch": 0.71, - "learning_rate": 1.4459728582539577e-05, - "loss": 2.2572, - "step": 407600 - }, - { - "epoch": 0.71, - "learning_rate": 1.4458856642612751e-05, - "loss": 2.3243, - "step": 407610 - }, - { - "epoch": 0.71, - "learning_rate": 1.4457984702685925e-05, - "loss": 2.1795, - "step": 407620 - }, - { - "epoch": 0.71, - "learning_rate": 1.4457112762759099e-05, - "loss": 2.3515, - "step": 407630 - }, - { - "epoch": 0.71, - "learning_rate": 1.445624082283227e-05, - "loss": 2.3927, - "step": 407640 - }, - { - "epoch": 0.71, - "learning_rate": 1.4455368882905443e-05, - "loss": 2.3575, - "step": 407650 - }, - { - "epoch": 0.71, - "learning_rate": 1.4454496942978618e-05, - "loss": 2.3282, - "step": 407660 - }, - { - "epoch": 0.71, - "learning_rate": 1.445362500305179e-05, - "loss": 2.1839, - "step": 407670 - }, - { - "epoch": 0.71, - "learning_rate": 1.4452753063124962e-05, - "loss": 2.2535, - "step": 407680 - }, - { - "epoch": 0.71, - "learning_rate": 1.4451881123198136e-05, - "loss": 2.4169, - "step": 407690 - }, - { - "epoch": 0.71, - "learning_rate": 1.445100918327131e-05, - "loss": 2.2609, - "step": 407700 - }, - { - "epoch": 0.71, - "learning_rate": 1.4450137243344484e-05, - "loss": 2.2888, - "step": 407710 - }, - { - "epoch": 0.71, - "learning_rate": 1.4449265303417656e-05, - "loss": 2.1859, - "step": 407720 - }, - { - "epoch": 0.71, - "learning_rate": 1.4448393363490831e-05, - "loss": 2.2598, - "step": 407730 - }, - { - "epoch": 0.71, - "learning_rate": 1.4447521423564003e-05, - "loss": 2.3568, - "step": 407740 - }, - { - "epoch": 0.71, - "learning_rate": 1.4446649483637175e-05, - "loss": 2.1986, - "step": 407750 - }, - { - "epoch": 0.71, - "learning_rate": 1.4445777543710347e-05, - "loss": 2.2994, - "step": 407760 - }, - { - "epoch": 0.71, - "learning_rate": 1.4444905603783523e-05, - "loss": 2.2179, - "step": 407770 - }, - { - "epoch": 0.71, - "learning_rate": 1.4444033663856697e-05, - "loss": 2.2459, - "step": 407780 - }, - { - "epoch": 0.71, - "learning_rate": 1.4443161723929869e-05, - "loss": 2.2763, - "step": 407790 - }, - { - "epoch": 0.71, - "learning_rate": 1.444228978400304e-05, - "loss": 2.2773, - "step": 407800 - }, - { - "epoch": 0.71, - "learning_rate": 1.4441417844076216e-05, - "loss": 2.4279, - "step": 407810 - }, - { - "epoch": 0.71, - "learning_rate": 1.4440545904149388e-05, - "loss": 2.3567, - "step": 407820 - }, - { - "epoch": 0.71, - "learning_rate": 1.443967396422256e-05, - "loss": 2.4124, - "step": 407830 - }, - { - "epoch": 0.71, - "learning_rate": 1.4438802024295736e-05, - "loss": 2.2866, - "step": 407840 - }, - { - "epoch": 0.71, - "learning_rate": 1.4437930084368908e-05, - "loss": 2.2348, - "step": 407850 - }, - { - "epoch": 0.71, - "learning_rate": 1.4437058144442082e-05, - "loss": 2.495, - "step": 407860 - }, - { - "epoch": 0.71, - "learning_rate": 1.4436186204515254e-05, - "loss": 2.2972, - "step": 407870 - }, - { - "epoch": 0.71, - "learning_rate": 1.443531426458843e-05, - "loss": 2.3601, - "step": 407880 - }, - { - "epoch": 0.71, - "learning_rate": 1.4434442324661601e-05, - "loss": 2.4092, - "step": 407890 - }, - { - "epoch": 0.71, - "learning_rate": 1.4433570384734773e-05, - "loss": 2.3152, - "step": 407900 - }, - { - "epoch": 0.71, - "learning_rate": 1.4432698444807946e-05, - "loss": 2.2764, - "step": 407910 - }, - { - "epoch": 0.71, - "learning_rate": 1.4431826504881121e-05, - "loss": 2.2799, - "step": 407920 - }, - { - "epoch": 0.71, - "learning_rate": 1.4430954564954293e-05, - "loss": 2.2807, - "step": 407930 - }, - { - "epoch": 0.71, - "learning_rate": 1.4430082625027467e-05, - "loss": 2.3516, - "step": 407940 - }, - { - "epoch": 0.71, - "learning_rate": 1.4429210685100639e-05, - "loss": 2.249, - "step": 407950 - }, - { - "epoch": 0.71, - "learning_rate": 1.4428338745173814e-05, - "loss": 2.4031, - "step": 407960 - }, - { - "epoch": 0.71, - "learning_rate": 1.4427466805246986e-05, - "loss": 2.2901, - "step": 407970 - }, - { - "epoch": 0.71, - "learning_rate": 1.4426594865320159e-05, - "loss": 2.2195, - "step": 407980 - }, - { - "epoch": 0.71, - "learning_rate": 1.4425722925393334e-05, - "loss": 2.3116, - "step": 407990 - }, - { - "epoch": 0.71, - "learning_rate": 1.4424850985466506e-05, - "loss": 2.2136, - "step": 408000 - }, - { - "epoch": 0.71, - "learning_rate": 1.4423979045539678e-05, - "loss": 2.2927, - "step": 408010 - }, - { - "epoch": 0.71, - "learning_rate": 1.4423107105612852e-05, - "loss": 2.3139, - "step": 408020 - }, - { - "epoch": 0.71, - "learning_rate": 1.4422235165686027e-05, - "loss": 2.425, - "step": 408030 - }, - { - "epoch": 0.71, - "learning_rate": 1.44213632257592e-05, - "loss": 2.3279, - "step": 408040 - }, - { - "epoch": 0.71, - "learning_rate": 1.4420491285832372e-05, - "loss": 2.3102, - "step": 408050 - }, - { - "epoch": 0.71, - "learning_rate": 1.4419619345905544e-05, - "loss": 2.3882, - "step": 408060 - }, - { - "epoch": 0.71, - "learning_rate": 1.4418747405978719e-05, - "loss": 2.2339, - "step": 408070 - }, - { - "epoch": 0.71, - "learning_rate": 1.4417875466051891e-05, - "loss": 2.2357, - "step": 408080 - }, - { - "epoch": 0.71, - "learning_rate": 1.4417003526125065e-05, - "loss": 2.3939, - "step": 408090 - }, - { - "epoch": 0.71, - "learning_rate": 1.4416131586198239e-05, - "loss": 2.3245, - "step": 408100 - }, - { - "epoch": 0.71, - "learning_rate": 1.4415259646271412e-05, - "loss": 2.2751, - "step": 408110 - }, - { - "epoch": 0.71, - "learning_rate": 1.4414387706344585e-05, - "loss": 2.3206, - "step": 408120 - }, - { - "epoch": 0.71, - "learning_rate": 1.4413515766417757e-05, - "loss": 2.2985, - "step": 408130 - }, - { - "epoch": 0.71, - "learning_rate": 1.4412643826490932e-05, - "loss": 2.3406, - "step": 408140 - }, - { - "epoch": 0.71, - "learning_rate": 1.4411771886564104e-05, - "loss": 2.3532, - "step": 408150 - }, - { - "epoch": 0.71, - "learning_rate": 1.4410899946637276e-05, - "loss": 2.2949, - "step": 408160 - }, - { - "epoch": 0.71, - "learning_rate": 1.441002800671045e-05, - "loss": 2.3744, - "step": 408170 - }, - { - "epoch": 0.71, - "learning_rate": 1.4409156066783624e-05, - "loss": 2.3075, - "step": 408180 - }, - { - "epoch": 0.71, - "learning_rate": 1.4408284126856798e-05, - "loss": 2.3565, - "step": 408190 - }, - { - "epoch": 0.71, - "learning_rate": 1.440741218692997e-05, - "loss": 2.3428, - "step": 408200 - }, - { - "epoch": 0.71, - "learning_rate": 1.4406540247003142e-05, - "loss": 2.2797, - "step": 408210 - }, - { - "epoch": 0.71, - "learning_rate": 1.4405668307076317e-05, - "loss": 2.2953, - "step": 408220 - }, - { - "epoch": 0.71, - "learning_rate": 1.440479636714949e-05, - "loss": 2.2863, - "step": 408230 - }, - { - "epoch": 0.71, - "learning_rate": 1.4403924427222661e-05, - "loss": 2.2384, - "step": 408240 - }, - { - "epoch": 0.71, - "learning_rate": 1.4403052487295837e-05, - "loss": 2.4241, - "step": 408250 - }, - { - "epoch": 0.71, - "learning_rate": 1.4402180547369009e-05, - "loss": 2.3176, - "step": 408260 - }, - { - "epoch": 0.71, - "learning_rate": 1.4401308607442183e-05, - "loss": 2.3128, - "step": 408270 - }, - { - "epoch": 0.71, - "learning_rate": 1.4400436667515355e-05, - "loss": 2.3669, - "step": 408280 - }, - { - "epoch": 0.71, - "learning_rate": 1.439956472758853e-05, - "loss": 2.3838, - "step": 408290 - }, - { - "epoch": 0.71, - "learning_rate": 1.4398692787661702e-05, - "loss": 2.2707, - "step": 408300 - }, - { - "epoch": 0.71, - "learning_rate": 1.4397820847734874e-05, - "loss": 2.3564, - "step": 408310 - }, - { - "epoch": 0.71, - "learning_rate": 1.4396948907808046e-05, - "loss": 2.3043, - "step": 408320 - }, - { - "epoch": 0.71, - "learning_rate": 1.4396076967881222e-05, - "loss": 2.3112, - "step": 408330 - }, - { - "epoch": 0.71, - "learning_rate": 1.4395205027954396e-05, - "loss": 2.2781, - "step": 408340 - }, - { - "epoch": 0.71, - "learning_rate": 1.4394333088027568e-05, - "loss": 2.4628, - "step": 408350 - }, - { - "epoch": 0.71, - "learning_rate": 1.439346114810074e-05, - "loss": 2.264, - "step": 408360 - }, - { - "epoch": 0.71, - "learning_rate": 1.4392589208173915e-05, - "loss": 2.2842, - "step": 408370 - }, - { - "epoch": 0.71, - "learning_rate": 1.4391717268247087e-05, - "loss": 2.2841, - "step": 408380 - }, - { - "epoch": 0.71, - "learning_rate": 1.439084532832026e-05, - "loss": 2.2837, - "step": 408390 - }, - { - "epoch": 0.71, - "learning_rate": 1.4389973388393435e-05, - "loss": 2.3412, - "step": 408400 - }, - { - "epoch": 0.71, - "learning_rate": 1.4389101448466607e-05, - "loss": 2.2453, - "step": 408410 - }, - { - "epoch": 0.71, - "learning_rate": 1.438822950853978e-05, - "loss": 2.4157, - "step": 408420 - }, - { - "epoch": 0.71, - "learning_rate": 1.4387357568612953e-05, - "loss": 2.3599, - "step": 408430 - }, - { - "epoch": 0.71, - "learning_rate": 1.4386485628686128e-05, - "loss": 2.3135, - "step": 408440 - }, - { - "epoch": 0.71, - "learning_rate": 1.43856136887593e-05, - "loss": 2.3133, - "step": 408450 - }, - { - "epoch": 0.71, - "learning_rate": 1.4384741748832472e-05, - "loss": 2.2692, - "step": 408460 - }, - { - "epoch": 0.71, - "learning_rate": 1.4383869808905644e-05, - "loss": 2.318, - "step": 408470 - }, - { - "epoch": 0.71, - "learning_rate": 1.438299786897882e-05, - "loss": 2.324, - "step": 408480 - }, - { - "epoch": 0.71, - "learning_rate": 1.4382125929051992e-05, - "loss": 2.4057, - "step": 408490 - }, - { - "epoch": 0.71, - "learning_rate": 1.4381253989125166e-05, - "loss": 2.3576, - "step": 408500 - }, - { - "epoch": 0.71, - "learning_rate": 1.4380382049198341e-05, - "loss": 2.1252, - "step": 408510 - }, - { - "epoch": 0.71, - "learning_rate": 1.4379510109271513e-05, - "loss": 2.2164, - "step": 408520 - }, - { - "epoch": 0.71, - "learning_rate": 1.4378638169344685e-05, - "loss": 2.3065, - "step": 408530 - }, - { - "epoch": 0.71, - "learning_rate": 1.4377766229417857e-05, - "loss": 2.2948, - "step": 408540 - }, - { - "epoch": 0.71, - "learning_rate": 1.4376894289491033e-05, - "loss": 2.3043, - "step": 408550 - }, - { - "epoch": 0.71, - "learning_rate": 1.4376022349564205e-05, - "loss": 2.2799, - "step": 408560 - }, - { - "epoch": 0.71, - "learning_rate": 1.4375150409637377e-05, - "loss": 2.2938, - "step": 408570 - }, - { - "epoch": 0.71, - "learning_rate": 1.437427846971055e-05, - "loss": 2.3348, - "step": 408580 - }, - { - "epoch": 0.71, - "learning_rate": 1.4373406529783726e-05, - "loss": 2.2504, - "step": 408590 - }, - { - "epoch": 0.71, - "learning_rate": 1.4372534589856898e-05, - "loss": 2.2351, - "step": 408600 - }, - { - "epoch": 0.71, - "learning_rate": 1.437166264993007e-05, - "loss": 2.2892, - "step": 408610 - }, - { - "epoch": 0.71, - "learning_rate": 1.4370790710003243e-05, - "loss": 2.2084, - "step": 408620 - }, - { - "epoch": 0.71, - "learning_rate": 1.4369918770076418e-05, - "loss": 2.1785, - "step": 408630 - }, - { - "epoch": 0.71, - "learning_rate": 1.436904683014959e-05, - "loss": 2.2998, - "step": 408640 - }, - { - "epoch": 0.71, - "learning_rate": 1.4368174890222764e-05, - "loss": 2.3574, - "step": 408650 - }, - { - "epoch": 0.71, - "learning_rate": 1.4367302950295938e-05, - "loss": 2.1762, - "step": 408660 - }, - { - "epoch": 0.71, - "learning_rate": 1.4366431010369111e-05, - "loss": 2.2407, - "step": 408670 - }, - { - "epoch": 0.71, - "learning_rate": 1.4365559070442283e-05, - "loss": 2.4483, - "step": 408680 - }, - { - "epoch": 0.71, - "learning_rate": 1.4364687130515456e-05, - "loss": 2.2409, - "step": 408690 - }, - { - "epoch": 0.71, - "learning_rate": 1.4363815190588631e-05, - "loss": 2.2121, - "step": 408700 - }, - { - "epoch": 0.71, - "learning_rate": 1.4362943250661803e-05, - "loss": 2.2524, - "step": 408710 - }, - { - "epoch": 0.71, - "learning_rate": 1.4362071310734975e-05, - "loss": 2.3783, - "step": 408720 - }, - { - "epoch": 0.71, - "learning_rate": 1.4361199370808149e-05, - "loss": 2.2969, - "step": 408730 - }, - { - "epoch": 0.71, - "learning_rate": 1.4360327430881323e-05, - "loss": 2.2141, - "step": 408740 - }, - { - "epoch": 0.71, - "learning_rate": 1.4359455490954496e-05, - "loss": 2.1993, - "step": 408750 - }, - { - "epoch": 0.71, - "learning_rate": 1.4358583551027669e-05, - "loss": 2.3092, - "step": 408760 - }, - { - "epoch": 0.71, - "learning_rate": 1.4357711611100844e-05, - "loss": 2.3733, - "step": 408770 - }, - { - "epoch": 0.71, - "learning_rate": 1.4356839671174016e-05, - "loss": 2.3076, - "step": 408780 - }, - { - "epoch": 0.71, - "learning_rate": 1.4355967731247188e-05, - "loss": 2.3512, - "step": 408790 - }, - { - "epoch": 0.71, - "learning_rate": 1.435509579132036e-05, - "loss": 2.2937, - "step": 408800 - }, - { - "epoch": 0.71, - "learning_rate": 1.4354223851393536e-05, - "loss": 2.348, - "step": 408810 - }, - { - "epoch": 0.71, - "learning_rate": 1.435335191146671e-05, - "loss": 2.2995, - "step": 408820 - }, - { - "epoch": 0.71, - "learning_rate": 1.4352479971539882e-05, - "loss": 2.2485, - "step": 408830 - }, - { - "epoch": 0.71, - "learning_rate": 1.4351608031613054e-05, - "loss": 2.2533, - "step": 408840 - }, - { - "epoch": 0.71, - "learning_rate": 1.4350736091686229e-05, - "loss": 2.2013, - "step": 408850 - }, - { - "epoch": 0.71, - "learning_rate": 1.4349864151759401e-05, - "loss": 2.324, - "step": 408860 - }, - { - "epoch": 0.71, - "learning_rate": 1.4348992211832573e-05, - "loss": 2.3637, - "step": 408870 - }, - { - "epoch": 0.71, - "learning_rate": 1.4348120271905745e-05, - "loss": 2.3654, - "step": 408880 - }, - { - "epoch": 0.71, - "learning_rate": 1.434724833197892e-05, - "loss": 2.2479, - "step": 408890 - }, - { - "epoch": 0.71, - "learning_rate": 1.4346376392052095e-05, - "loss": 2.3415, - "step": 408900 - }, - { - "epoch": 0.71, - "learning_rate": 1.4345504452125267e-05, - "loss": 2.3552, - "step": 408910 - }, - { - "epoch": 0.71, - "learning_rate": 1.4344632512198442e-05, - "loss": 2.4181, - "step": 408920 - }, - { - "epoch": 0.71, - "learning_rate": 1.4343760572271614e-05, - "loss": 2.372, - "step": 408930 - }, - { - "epoch": 0.71, - "learning_rate": 1.4342888632344786e-05, - "loss": 2.3413, - "step": 408940 - }, - { - "epoch": 0.71, - "learning_rate": 1.4342016692417958e-05, - "loss": 2.2577, - "step": 408950 - }, - { - "epoch": 0.71, - "learning_rate": 1.4341144752491134e-05, - "loss": 2.3983, - "step": 408960 - }, - { - "epoch": 0.71, - "learning_rate": 1.4340272812564306e-05, - "loss": 2.3052, - "step": 408970 - }, - { - "epoch": 0.71, - "learning_rate": 1.433940087263748e-05, - "loss": 2.2906, - "step": 408980 - }, - { - "epoch": 0.71, - "learning_rate": 1.4338528932710652e-05, - "loss": 2.2871, - "step": 408990 - }, - { - "epoch": 0.71, - "learning_rate": 1.4337656992783827e-05, - "loss": 2.1225, - "step": 409000 - }, - { - "epoch": 0.71, - "learning_rate": 1.4336785052857e-05, - "loss": 2.3252, - "step": 409010 - }, - { - "epoch": 0.71, - "learning_rate": 1.4335913112930171e-05, - "loss": 2.2685, - "step": 409020 - }, - { - "epoch": 0.71, - "learning_rate": 1.4335041173003347e-05, - "loss": 2.2406, - "step": 409030 - }, - { - "epoch": 0.71, - "learning_rate": 1.4334169233076519e-05, - "loss": 2.2536, - "step": 409040 - }, - { - "epoch": 0.71, - "learning_rate": 1.4333297293149691e-05, - "loss": 2.3156, - "step": 409050 - }, - { - "epoch": 0.71, - "learning_rate": 1.4332425353222865e-05, - "loss": 2.2555, - "step": 409060 - }, - { - "epoch": 0.71, - "learning_rate": 1.433155341329604e-05, - "loss": 2.2265, - "step": 409070 - }, - { - "epoch": 0.71, - "learning_rate": 1.4330681473369212e-05, - "loss": 2.2522, - "step": 409080 - }, - { - "epoch": 0.71, - "learning_rate": 1.4329809533442384e-05, - "loss": 2.2378, - "step": 409090 - }, - { - "epoch": 0.71, - "learning_rate": 1.4328937593515556e-05, - "loss": 2.2536, - "step": 409100 - }, - { - "epoch": 0.71, - "learning_rate": 1.4328065653588732e-05, - "loss": 2.1252, - "step": 409110 - }, - { - "epoch": 0.71, - "learning_rate": 1.4327193713661904e-05, - "loss": 2.3894, - "step": 409120 - }, - { - "epoch": 0.71, - "learning_rate": 1.4326321773735078e-05, - "loss": 2.4247, - "step": 409130 - }, - { - "epoch": 0.71, - "learning_rate": 1.432544983380825e-05, - "loss": 2.3062, - "step": 409140 - }, - { - "epoch": 0.71, - "learning_rate": 1.4324577893881425e-05, - "loss": 2.2832, - "step": 409150 - }, - { - "epoch": 0.71, - "learning_rate": 1.4323705953954597e-05, - "loss": 2.1436, - "step": 409160 - }, - { - "epoch": 0.71, - "learning_rate": 1.432283401402777e-05, - "loss": 2.3635, - "step": 409170 - }, - { - "epoch": 0.71, - "learning_rate": 1.4321962074100945e-05, - "loss": 2.2255, - "step": 409180 - }, - { - "epoch": 0.71, - "learning_rate": 1.4321090134174117e-05, - "loss": 2.3225, - "step": 409190 - }, - { - "epoch": 0.71, - "learning_rate": 1.4320218194247289e-05, - "loss": 2.2516, - "step": 409200 - }, - { - "epoch": 0.71, - "learning_rate": 1.4319346254320463e-05, - "loss": 2.2993, - "step": 409210 - }, - { - "epoch": 0.71, - "learning_rate": 1.4318474314393637e-05, - "loss": 2.2694, - "step": 409220 - }, - { - "epoch": 0.71, - "learning_rate": 1.431760237446681e-05, - "loss": 2.4361, - "step": 409230 - }, - { - "epoch": 0.71, - "learning_rate": 1.4316730434539982e-05, - "loss": 2.3495, - "step": 409240 - }, - { - "epoch": 0.71, - "learning_rate": 1.4315858494613154e-05, - "loss": 2.2524, - "step": 409250 - }, - { - "epoch": 0.71, - "learning_rate": 1.431498655468633e-05, - "loss": 2.2208, - "step": 409260 - }, - { - "epoch": 0.71, - "learning_rate": 1.4314114614759502e-05, - "loss": 2.3427, - "step": 409270 - }, - { - "epoch": 0.71, - "learning_rate": 1.4313242674832674e-05, - "loss": 2.345, - "step": 409280 - }, - { - "epoch": 0.71, - "learning_rate": 1.4312370734905848e-05, - "loss": 2.3288, - "step": 409290 - }, - { - "epoch": 0.71, - "learning_rate": 1.4311498794979022e-05, - "loss": 2.2919, - "step": 409300 - }, - { - "epoch": 0.71, - "learning_rate": 1.4310626855052195e-05, - "loss": 2.3329, - "step": 409310 - }, - { - "epoch": 0.71, - "learning_rate": 1.4309754915125367e-05, - "loss": 2.2208, - "step": 409320 - }, - { - "epoch": 0.71, - "learning_rate": 1.4308882975198543e-05, - "loss": 2.3314, - "step": 409330 - }, - { - "epoch": 0.71, - "learning_rate": 1.4308011035271715e-05, - "loss": 2.3461, - "step": 409340 - }, - { - "epoch": 0.71, - "learning_rate": 1.4307139095344887e-05, - "loss": 2.2917, - "step": 409350 - }, - { - "epoch": 0.71, - "learning_rate": 1.430626715541806e-05, - "loss": 2.2453, - "step": 409360 - }, - { - "epoch": 0.71, - "learning_rate": 1.4305395215491235e-05, - "loss": 2.3483, - "step": 409370 - }, - { - "epoch": 0.71, - "learning_rate": 1.4304523275564408e-05, - "loss": 2.2584, - "step": 409380 - }, - { - "epoch": 0.71, - "learning_rate": 1.430365133563758e-05, - "loss": 2.2354, - "step": 409390 - }, - { - "epoch": 0.71, - "learning_rate": 1.4302779395710753e-05, - "loss": 2.3285, - "step": 409400 - }, - { - "epoch": 0.71, - "learning_rate": 1.4301907455783928e-05, - "loss": 2.3826, - "step": 409410 - }, - { - "epoch": 0.71, - "learning_rate": 1.43010355158571e-05, - "loss": 2.1855, - "step": 409420 - }, - { - "epoch": 0.71, - "learning_rate": 1.4300163575930272e-05, - "loss": 2.3253, - "step": 409430 - }, - { - "epoch": 0.71, - "learning_rate": 1.4299291636003448e-05, - "loss": 2.3005, - "step": 409440 - }, - { - "epoch": 0.71, - "learning_rate": 1.429841969607662e-05, - "loss": 2.2126, - "step": 409450 - }, - { - "epoch": 0.71, - "learning_rate": 1.4297547756149793e-05, - "loss": 2.2641, - "step": 409460 - }, - { - "epoch": 0.71, - "learning_rate": 1.4296675816222966e-05, - "loss": 2.2584, - "step": 409470 - }, - { - "epoch": 0.71, - "learning_rate": 1.4295803876296141e-05, - "loss": 2.3062, - "step": 409480 - }, - { - "epoch": 0.71, - "learning_rate": 1.4294931936369313e-05, - "loss": 2.2829, - "step": 409490 - }, - { - "epoch": 0.71, - "learning_rate": 1.4294059996442485e-05, - "loss": 2.2646, - "step": 409500 - }, - { - "epoch": 0.71, - "learning_rate": 1.4293188056515657e-05, - "loss": 2.3772, - "step": 409510 - }, - { - "epoch": 0.71, - "learning_rate": 1.4292316116588833e-05, - "loss": 2.2987, - "step": 409520 - }, - { - "epoch": 0.71, - "learning_rate": 1.4291444176662005e-05, - "loss": 2.259, - "step": 409530 - }, - { - "epoch": 0.71, - "learning_rate": 1.4290572236735179e-05, - "loss": 2.353, - "step": 409540 - }, - { - "epoch": 0.71, - "learning_rate": 1.428970029680835e-05, - "loss": 2.2897, - "step": 409550 - }, - { - "epoch": 0.71, - "learning_rate": 1.4288828356881526e-05, - "loss": 2.2648, - "step": 409560 - }, - { - "epoch": 0.71, - "learning_rate": 1.4287956416954698e-05, - "loss": 2.2268, - "step": 409570 - }, - { - "epoch": 0.71, - "learning_rate": 1.428708447702787e-05, - "loss": 2.3063, - "step": 409580 - }, - { - "epoch": 0.71, - "learning_rate": 1.4286212537101046e-05, - "loss": 2.1523, - "step": 409590 - }, - { - "epoch": 0.71, - "learning_rate": 1.4285340597174218e-05, - "loss": 2.1455, - "step": 409600 - }, - { - "epoch": 0.71, - "learning_rate": 1.4284468657247392e-05, - "loss": 2.3609, - "step": 409610 - }, - { - "epoch": 0.71, - "learning_rate": 1.4283596717320564e-05, - "loss": 2.3014, - "step": 409620 - }, - { - "epoch": 0.71, - "learning_rate": 1.4282724777393739e-05, - "loss": 2.3922, - "step": 409630 - }, - { - "epoch": 0.71, - "learning_rate": 1.4281852837466911e-05, - "loss": 2.3175, - "step": 409640 - }, - { - "epoch": 0.71, - "learning_rate": 1.4280980897540083e-05, - "loss": 2.3396, - "step": 409650 - }, - { - "epoch": 0.71, - "learning_rate": 1.4280108957613255e-05, - "loss": 2.2448, - "step": 409660 - }, - { - "epoch": 0.71, - "learning_rate": 1.427923701768643e-05, - "loss": 2.3112, - "step": 409670 - }, - { - "epoch": 0.71, - "learning_rate": 1.4278365077759603e-05, - "loss": 2.2698, - "step": 409680 - }, - { - "epoch": 0.71, - "learning_rate": 1.4277493137832777e-05, - "loss": 2.3672, - "step": 409690 - }, - { - "epoch": 0.71, - "learning_rate": 1.427662119790595e-05, - "loss": 2.2177, - "step": 409700 - }, - { - "epoch": 0.71, - "learning_rate": 1.4275749257979124e-05, - "loss": 2.3918, - "step": 409710 - }, - { - "epoch": 0.71, - "learning_rate": 1.4274877318052296e-05, - "loss": 2.3946, - "step": 409720 - }, - { - "epoch": 0.71, - "learning_rate": 1.4274005378125468e-05, - "loss": 2.3199, - "step": 409730 - }, - { - "epoch": 0.71, - "learning_rate": 1.4273133438198644e-05, - "loss": 2.3151, - "step": 409740 - }, - { - "epoch": 0.71, - "learning_rate": 1.4272261498271816e-05, - "loss": 2.3199, - "step": 409750 - }, - { - "epoch": 0.71, - "learning_rate": 1.4271389558344988e-05, - "loss": 2.3063, - "step": 409760 - }, - { - "epoch": 0.71, - "learning_rate": 1.4270517618418162e-05, - "loss": 2.2657, - "step": 409770 - }, - { - "epoch": 0.71, - "learning_rate": 1.4269645678491335e-05, - "loss": 2.2742, - "step": 409780 - }, - { - "epoch": 0.71, - "learning_rate": 1.426877373856451e-05, - "loss": 2.2852, - "step": 409790 - }, - { - "epoch": 0.71, - "learning_rate": 1.4267901798637681e-05, - "loss": 2.3933, - "step": 409800 - }, - { - "epoch": 0.71, - "learning_rate": 1.4267029858710853e-05, - "loss": 2.3493, - "step": 409810 - }, - { - "epoch": 0.71, - "learning_rate": 1.4266157918784029e-05, - "loss": 2.2732, - "step": 409820 - }, - { - "epoch": 0.71, - "learning_rate": 1.4265285978857201e-05, - "loss": 2.2529, - "step": 409830 - }, - { - "epoch": 0.71, - "learning_rate": 1.4264414038930373e-05, - "loss": 2.41, - "step": 409840 - }, - { - "epoch": 0.71, - "learning_rate": 1.4263542099003548e-05, - "loss": 2.3889, - "step": 409850 - }, - { - "epoch": 0.71, - "learning_rate": 1.4262670159076722e-05, - "loss": 2.3161, - "step": 409860 - }, - { - "epoch": 0.71, - "learning_rate": 1.4261798219149894e-05, - "loss": 2.268, - "step": 409870 - }, - { - "epoch": 0.71, - "learning_rate": 1.4260926279223066e-05, - "loss": 2.2463, - "step": 409880 - }, - { - "epoch": 0.71, - "learning_rate": 1.4260054339296242e-05, - "loss": 2.4281, - "step": 409890 - }, - { - "epoch": 0.71, - "learning_rate": 1.4259182399369414e-05, - "loss": 2.3234, - "step": 409900 - }, - { - "epoch": 0.71, - "learning_rate": 1.4258310459442586e-05, - "loss": 2.2609, - "step": 409910 - }, - { - "epoch": 0.71, - "learning_rate": 1.425743851951576e-05, - "loss": 2.2702, - "step": 409920 - }, - { - "epoch": 0.71, - "learning_rate": 1.4256566579588934e-05, - "loss": 2.1751, - "step": 409930 - }, - { - "epoch": 0.71, - "learning_rate": 1.4255694639662107e-05, - "loss": 2.3381, - "step": 409940 - }, - { - "epoch": 0.71, - "learning_rate": 1.425482269973528e-05, - "loss": 2.3776, - "step": 409950 - }, - { - "epoch": 0.71, - "learning_rate": 1.4253950759808455e-05, - "loss": 2.2819, - "step": 409960 - }, - { - "epoch": 0.71, - "learning_rate": 1.4253078819881627e-05, - "loss": 2.225, - "step": 409970 - }, - { - "epoch": 0.71, - "learning_rate": 1.4252206879954799e-05, - "loss": 2.4418, - "step": 409980 - }, - { - "epoch": 0.71, - "learning_rate": 1.4251334940027971e-05, - "loss": 2.2392, - "step": 409990 - }, - { - "epoch": 0.71, - "learning_rate": 1.4250463000101147e-05, - "loss": 2.3815, - "step": 410000 - }, - { - "epoch": 0.72, - "learning_rate": 1.4249591060174319e-05, - "loss": 2.3014, - "step": 410010 - }, - { - "epoch": 0.72, - "learning_rate": 1.4248719120247492e-05, - "loss": 2.3152, - "step": 410020 - }, - { - "epoch": 0.72, - "learning_rate": 1.4247847180320664e-05, - "loss": 2.4168, - "step": 410030 - }, - { - "epoch": 0.72, - "learning_rate": 1.424697524039384e-05, - "loss": 2.2639, - "step": 410040 - }, - { - "epoch": 0.72, - "learning_rate": 1.4246103300467012e-05, - "loss": 2.2753, - "step": 410050 - }, - { - "epoch": 0.72, - "learning_rate": 1.4245231360540184e-05, - "loss": 2.2441, - "step": 410060 - }, - { - "epoch": 0.72, - "learning_rate": 1.4244359420613356e-05, - "loss": 2.2051, - "step": 410070 - }, - { - "epoch": 0.72, - "learning_rate": 1.4243487480686532e-05, - "loss": 2.2733, - "step": 410080 - }, - { - "epoch": 0.72, - "learning_rate": 1.4242615540759704e-05, - "loss": 2.3304, - "step": 410090 - }, - { - "epoch": 0.72, - "learning_rate": 1.4241743600832877e-05, - "loss": 2.357, - "step": 410100 - }, - { - "epoch": 0.72, - "learning_rate": 1.4240871660906053e-05, - "loss": 2.2929, - "step": 410110 - }, - { - "epoch": 0.72, - "learning_rate": 1.4239999720979225e-05, - "loss": 2.2572, - "step": 410120 - }, - { - "epoch": 0.72, - "learning_rate": 1.4239127781052397e-05, - "loss": 2.3366, - "step": 410130 - }, - { - "epoch": 0.72, - "learning_rate": 1.423825584112557e-05, - "loss": 2.4477, - "step": 410140 - }, - { - "epoch": 0.72, - "learning_rate": 1.4237383901198745e-05, - "loss": 2.1976, - "step": 410150 - }, - { - "epoch": 0.72, - "learning_rate": 1.4236511961271917e-05, - "loss": 2.3262, - "step": 410160 - }, - { - "epoch": 0.72, - "learning_rate": 1.423564002134509e-05, - "loss": 2.2981, - "step": 410170 - }, - { - "epoch": 0.72, - "learning_rate": 1.4234768081418263e-05, - "loss": 2.1583, - "step": 410180 - }, - { - "epoch": 0.72, - "learning_rate": 1.4233896141491438e-05, - "loss": 2.3859, - "step": 410190 - }, - { - "epoch": 0.72, - "learning_rate": 1.423302420156461e-05, - "loss": 2.1584, - "step": 410200 - }, - { - "epoch": 0.72, - "learning_rate": 1.4232152261637782e-05, - "loss": 2.3434, - "step": 410210 - }, - { - "epoch": 0.72, - "learning_rate": 1.4231280321710954e-05, - "loss": 2.3099, - "step": 410220 - }, - { - "epoch": 0.72, - "learning_rate": 1.423040838178413e-05, - "loss": 2.3484, - "step": 410230 - }, - { - "epoch": 0.72, - "learning_rate": 1.4229536441857302e-05, - "loss": 2.2554, - "step": 410240 - }, - { - "epoch": 0.72, - "learning_rate": 1.4228664501930476e-05, - "loss": 2.2434, - "step": 410250 - }, - { - "epoch": 0.72, - "learning_rate": 1.422779256200365e-05, - "loss": 2.3826, - "step": 410260 - }, - { - "epoch": 0.72, - "learning_rate": 1.4226920622076823e-05, - "loss": 2.3317, - "step": 410270 - }, - { - "epoch": 0.72, - "learning_rate": 1.4226048682149995e-05, - "loss": 2.2783, - "step": 410280 - }, - { - "epoch": 0.72, - "learning_rate": 1.4225176742223167e-05, - "loss": 2.3188, - "step": 410290 - }, - { - "epoch": 0.72, - "learning_rate": 1.4224304802296343e-05, - "loss": 2.3342, - "step": 410300 - }, - { - "epoch": 0.72, - "learning_rate": 1.4223432862369515e-05, - "loss": 2.3644, - "step": 410310 - }, - { - "epoch": 0.72, - "learning_rate": 1.4222560922442687e-05, - "loss": 2.3331, - "step": 410320 - }, - { - "epoch": 0.72, - "learning_rate": 1.422168898251586e-05, - "loss": 2.3564, - "step": 410330 - }, - { - "epoch": 0.72, - "learning_rate": 1.4220817042589036e-05, - "loss": 2.2653, - "step": 410340 - }, - { - "epoch": 0.72, - "learning_rate": 1.4219945102662208e-05, - "loss": 2.3658, - "step": 410350 - }, - { - "epoch": 0.72, - "learning_rate": 1.421907316273538e-05, - "loss": 2.252, - "step": 410360 - }, - { - "epoch": 0.72, - "learning_rate": 1.4218201222808556e-05, - "loss": 2.3111, - "step": 410370 - }, - { - "epoch": 0.72, - "learning_rate": 1.4217329282881728e-05, - "loss": 2.2692, - "step": 410380 - }, - { - "epoch": 0.72, - "learning_rate": 1.42164573429549e-05, - "loss": 2.2606, - "step": 410390 - }, - { - "epoch": 0.72, - "learning_rate": 1.4215585403028072e-05, - "loss": 2.3221, - "step": 410400 - }, - { - "epoch": 0.72, - "learning_rate": 1.4214713463101247e-05, - "loss": 2.4038, - "step": 410410 - }, - { - "epoch": 0.72, - "learning_rate": 1.4213841523174421e-05, - "loss": 2.3396, - "step": 410420 - }, - { - "epoch": 0.72, - "learning_rate": 1.4212969583247593e-05, - "loss": 2.3541, - "step": 410430 - }, - { - "epoch": 0.72, - "learning_rate": 1.4212097643320765e-05, - "loss": 2.3612, - "step": 410440 - }, - { - "epoch": 0.72, - "learning_rate": 1.421122570339394e-05, - "loss": 2.2785, - "step": 410450 - }, - { - "epoch": 0.72, - "learning_rate": 1.4210353763467113e-05, - "loss": 2.2564, - "step": 410460 - }, - { - "epoch": 0.72, - "learning_rate": 1.4209481823540285e-05, - "loss": 2.313, - "step": 410470 - }, - { - "epoch": 0.72, - "learning_rate": 1.4208609883613459e-05, - "loss": 2.3403, - "step": 410480 - }, - { - "epoch": 0.72, - "learning_rate": 1.4207737943686632e-05, - "loss": 2.2731, - "step": 410490 - }, - { - "epoch": 0.72, - "learning_rate": 1.4206866003759806e-05, - "loss": 2.3236, - "step": 410500 - }, - { - "epoch": 0.72, - "learning_rate": 1.4205994063832978e-05, - "loss": 2.395, - "step": 410510 - }, - { - "epoch": 0.72, - "learning_rate": 1.4205122123906154e-05, - "loss": 2.3283, - "step": 410520 - }, - { - "epoch": 0.72, - "learning_rate": 1.4204250183979326e-05, - "loss": 2.3497, - "step": 410530 - }, - { - "epoch": 0.72, - "learning_rate": 1.4203378244052498e-05, - "loss": 2.3239, - "step": 410540 - }, - { - "epoch": 0.72, - "learning_rate": 1.420250630412567e-05, - "loss": 2.2123, - "step": 410550 - }, - { - "epoch": 0.72, - "learning_rate": 1.4201634364198845e-05, - "loss": 2.2706, - "step": 410560 - }, - { - "epoch": 0.72, - "learning_rate": 1.4200762424272018e-05, - "loss": 2.3515, - "step": 410570 - }, - { - "epoch": 0.72, - "learning_rate": 1.4199890484345191e-05, - "loss": 2.326, - "step": 410580 - }, - { - "epoch": 0.72, - "learning_rate": 1.4199018544418363e-05, - "loss": 2.3037, - "step": 410590 - }, - { - "epoch": 0.72, - "learning_rate": 1.4198146604491539e-05, - "loss": 2.397, - "step": 410600 - }, - { - "epoch": 0.72, - "learning_rate": 1.4197274664564711e-05, - "loss": 2.3575, - "step": 410610 - }, - { - "epoch": 0.72, - "learning_rate": 1.4196402724637883e-05, - "loss": 2.1267, - "step": 410620 - }, - { - "epoch": 0.72, - "learning_rate": 1.4195530784711058e-05, - "loss": 2.2598, - "step": 410630 - }, - { - "epoch": 0.72, - "learning_rate": 1.419465884478423e-05, - "loss": 2.3186, - "step": 410640 - }, - { - "epoch": 0.72, - "learning_rate": 1.4193786904857404e-05, - "loss": 2.2474, - "step": 410650 - }, - { - "epoch": 0.72, - "learning_rate": 1.4192914964930576e-05, - "loss": 2.2446, - "step": 410660 - }, - { - "epoch": 0.72, - "learning_rate": 1.4192043025003752e-05, - "loss": 2.4465, - "step": 410670 - }, - { - "epoch": 0.72, - "learning_rate": 1.4191171085076924e-05, - "loss": 2.337, - "step": 410680 - }, - { - "epoch": 0.72, - "learning_rate": 1.4190299145150096e-05, - "loss": 2.3668, - "step": 410690 - }, - { - "epoch": 0.72, - "learning_rate": 1.4189427205223268e-05, - "loss": 2.303, - "step": 410700 - }, - { - "epoch": 0.72, - "learning_rate": 1.4188555265296444e-05, - "loss": 2.2933, - "step": 410710 - }, - { - "epoch": 0.72, - "learning_rate": 1.4187683325369616e-05, - "loss": 2.2902, - "step": 410720 - }, - { - "epoch": 0.72, - "learning_rate": 1.418681138544279e-05, - "loss": 2.2665, - "step": 410730 - }, - { - "epoch": 0.72, - "learning_rate": 1.4185939445515961e-05, - "loss": 2.1693, - "step": 410740 - }, - { - "epoch": 0.72, - "learning_rate": 1.4185067505589137e-05, - "loss": 2.3445, - "step": 410750 - }, - { - "epoch": 0.72, - "learning_rate": 1.4184195565662309e-05, - "loss": 2.1984, - "step": 410760 - }, - { - "epoch": 0.72, - "learning_rate": 1.4183323625735481e-05, - "loss": 2.2971, - "step": 410770 - }, - { - "epoch": 0.72, - "learning_rate": 1.4182451685808657e-05, - "loss": 2.3154, - "step": 410780 - }, - { - "epoch": 0.72, - "learning_rate": 1.4181579745881829e-05, - "loss": 2.3419, - "step": 410790 - }, - { - "epoch": 0.72, - "learning_rate": 1.4180707805955e-05, - "loss": 2.2443, - "step": 410800 - }, - { - "epoch": 0.72, - "learning_rate": 1.4179835866028174e-05, - "loss": 2.368, - "step": 410810 - }, - { - "epoch": 0.72, - "learning_rate": 1.4178963926101348e-05, - "loss": 2.3034, - "step": 410820 - }, - { - "epoch": 0.72, - "learning_rate": 1.4178091986174522e-05, - "loss": 2.3355, - "step": 410830 - }, - { - "epoch": 0.72, - "learning_rate": 1.4177220046247694e-05, - "loss": 2.2877, - "step": 410840 - }, - { - "epoch": 0.72, - "learning_rate": 1.4176348106320866e-05, - "loss": 2.2348, - "step": 410850 - }, - { - "epoch": 0.72, - "learning_rate": 1.4175476166394042e-05, - "loss": 2.3338, - "step": 410860 - }, - { - "epoch": 0.72, - "learning_rate": 1.4174604226467214e-05, - "loss": 2.2395, - "step": 410870 - }, - { - "epoch": 0.72, - "learning_rate": 1.4173732286540386e-05, - "loss": 2.1864, - "step": 410880 - }, - { - "epoch": 0.72, - "learning_rate": 1.4172860346613561e-05, - "loss": 2.2465, - "step": 410890 - }, - { - "epoch": 0.72, - "learning_rate": 1.4171988406686735e-05, - "loss": 2.2038, - "step": 410900 - }, - { - "epoch": 0.72, - "learning_rate": 1.4171116466759907e-05, - "loss": 2.3138, - "step": 410910 - }, - { - "epoch": 0.72, - "learning_rate": 1.417024452683308e-05, - "loss": 2.1939, - "step": 410920 - }, - { - "epoch": 0.72, - "learning_rate": 1.4169372586906255e-05, - "loss": 2.2879, - "step": 410930 - }, - { - "epoch": 0.72, - "learning_rate": 1.4168500646979427e-05, - "loss": 2.1923, - "step": 410940 - }, - { - "epoch": 0.72, - "learning_rate": 1.4167628707052599e-05, - "loss": 2.3466, - "step": 410950 - }, - { - "epoch": 0.72, - "learning_rate": 1.4166756767125773e-05, - "loss": 2.2715, - "step": 410960 - }, - { - "epoch": 0.72, - "learning_rate": 1.4165884827198946e-05, - "loss": 2.2879, - "step": 410970 - }, - { - "epoch": 0.72, - "learning_rate": 1.416501288727212e-05, - "loss": 2.2736, - "step": 410980 - }, - { - "epoch": 0.72, - "learning_rate": 1.4164140947345292e-05, - "loss": 2.2953, - "step": 410990 - }, - { - "epoch": 0.72, - "learning_rate": 1.4163269007418464e-05, - "loss": 2.3679, - "step": 411000 - }, - { - "epoch": 0.72, - "learning_rate": 1.416239706749164e-05, - "loss": 2.37, - "step": 411010 - }, - { - "epoch": 0.72, - "learning_rate": 1.4161525127564812e-05, - "loss": 2.2003, - "step": 411020 - }, - { - "epoch": 0.72, - "learning_rate": 1.4160653187637984e-05, - "loss": 2.2488, - "step": 411030 - }, - { - "epoch": 0.72, - "learning_rate": 1.415978124771116e-05, - "loss": 2.3053, - "step": 411040 - }, - { - "epoch": 0.72, - "learning_rate": 1.4158909307784331e-05, - "loss": 2.2106, - "step": 411050 - }, - { - "epoch": 0.72, - "learning_rate": 1.4158037367857505e-05, - "loss": 2.2077, - "step": 411060 - }, - { - "epoch": 0.72, - "learning_rate": 1.4157165427930677e-05, - "loss": 2.2859, - "step": 411070 - }, - { - "epoch": 0.72, - "learning_rate": 1.4156293488003853e-05, - "loss": 2.2369, - "step": 411080 - }, - { - "epoch": 0.72, - "learning_rate": 1.4155421548077025e-05, - "loss": 2.2612, - "step": 411090 - }, - { - "epoch": 0.72, - "learning_rate": 1.4154549608150197e-05, - "loss": 2.3571, - "step": 411100 - }, - { - "epoch": 0.72, - "learning_rate": 1.4153677668223369e-05, - "loss": 2.3135, - "step": 411110 - }, - { - "epoch": 0.72, - "learning_rate": 1.4152805728296544e-05, - "loss": 2.2471, - "step": 411120 - }, - { - "epoch": 0.72, - "learning_rate": 1.4151933788369716e-05, - "loss": 2.2927, - "step": 411130 - }, - { - "epoch": 0.72, - "learning_rate": 1.415106184844289e-05, - "loss": 2.2429, - "step": 411140 - }, - { - "epoch": 0.72, - "learning_rate": 1.4150189908516062e-05, - "loss": 2.2638, - "step": 411150 - }, - { - "epoch": 0.72, - "learning_rate": 1.4149317968589238e-05, - "loss": 2.2694, - "step": 411160 - }, - { - "epoch": 0.72, - "learning_rate": 1.414844602866241e-05, - "loss": 2.2855, - "step": 411170 - }, - { - "epoch": 0.72, - "learning_rate": 1.4147574088735582e-05, - "loss": 2.1992, - "step": 411180 - }, - { - "epoch": 0.72, - "learning_rate": 1.4146702148808757e-05, - "loss": 2.3424, - "step": 411190 - }, - { - "epoch": 0.72, - "learning_rate": 1.414583020888193e-05, - "loss": 2.3068, - "step": 411200 - }, - { - "epoch": 0.72, - "learning_rate": 1.4144958268955103e-05, - "loss": 2.3015, - "step": 411210 - }, - { - "epoch": 0.72, - "learning_rate": 1.4144086329028275e-05, - "loss": 2.3471, - "step": 411220 - }, - { - "epoch": 0.72, - "learning_rate": 1.414321438910145e-05, - "loss": 2.3288, - "step": 411230 - }, - { - "epoch": 0.72, - "learning_rate": 1.4142342449174623e-05, - "loss": 2.2587, - "step": 411240 - }, - { - "epoch": 0.72, - "learning_rate": 1.4141470509247795e-05, - "loss": 2.2313, - "step": 411250 - }, - { - "epoch": 0.72, - "learning_rate": 1.4140598569320967e-05, - "loss": 2.3767, - "step": 411260 - }, - { - "epoch": 0.72, - "learning_rate": 1.4139726629394142e-05, - "loss": 2.4077, - "step": 411270 - }, - { - "epoch": 0.72, - "learning_rate": 1.4138854689467315e-05, - "loss": 2.3059, - "step": 411280 - }, - { - "epoch": 0.72, - "learning_rate": 1.4137982749540488e-05, - "loss": 2.1935, - "step": 411290 - }, - { - "epoch": 0.72, - "learning_rate": 1.4137110809613662e-05, - "loss": 2.1945, - "step": 411300 - }, - { - "epoch": 0.72, - "learning_rate": 1.4136238869686836e-05, - "loss": 2.2649, - "step": 411310 - }, - { - "epoch": 0.72, - "learning_rate": 1.4135366929760008e-05, - "loss": 2.3038, - "step": 411320 - }, - { - "epoch": 0.72, - "learning_rate": 1.413449498983318e-05, - "loss": 2.283, - "step": 411330 - }, - { - "epoch": 0.72, - "learning_rate": 1.4133623049906355e-05, - "loss": 2.2982, - "step": 411340 - }, - { - "epoch": 0.72, - "learning_rate": 1.4132751109979528e-05, - "loss": 2.2654, - "step": 411350 - }, - { - "epoch": 0.72, - "learning_rate": 1.41318791700527e-05, - "loss": 2.3029, - "step": 411360 - }, - { - "epoch": 0.72, - "learning_rate": 1.4131007230125873e-05, - "loss": 2.3711, - "step": 411370 - }, - { - "epoch": 0.72, - "learning_rate": 1.4130135290199049e-05, - "loss": 2.2894, - "step": 411380 - }, - { - "epoch": 0.72, - "learning_rate": 1.4129263350272221e-05, - "loss": 2.2583, - "step": 411390 - }, - { - "epoch": 0.72, - "learning_rate": 1.4128391410345393e-05, - "loss": 2.2525, - "step": 411400 - }, - { - "epoch": 0.72, - "learning_rate": 1.4127519470418565e-05, - "loss": 2.2661, - "step": 411410 - }, - { - "epoch": 0.72, - "learning_rate": 1.412664753049174e-05, - "loss": 2.3401, - "step": 411420 - }, - { - "epoch": 0.72, - "learning_rate": 1.4125775590564913e-05, - "loss": 2.3056, - "step": 411430 - }, - { - "epoch": 0.72, - "learning_rate": 1.4124903650638085e-05, - "loss": 2.2859, - "step": 411440 - }, - { - "epoch": 0.72, - "learning_rate": 1.412403171071126e-05, - "loss": 2.427, - "step": 411450 - }, - { - "epoch": 0.72, - "learning_rate": 1.4123159770784434e-05, - "loss": 2.2951, - "step": 411460 - }, - { - "epoch": 0.72, - "learning_rate": 1.4122287830857606e-05, - "loss": 2.2207, - "step": 411470 - }, - { - "epoch": 0.72, - "learning_rate": 1.4121415890930778e-05, - "loss": 2.2846, - "step": 411480 - }, - { - "epoch": 0.72, - "learning_rate": 1.4120543951003954e-05, - "loss": 2.4013, - "step": 411490 - }, - { - "epoch": 0.72, - "learning_rate": 1.4119672011077126e-05, - "loss": 2.2701, - "step": 411500 - }, - { - "epoch": 0.72, - "learning_rate": 1.4118800071150298e-05, - "loss": 2.4111, - "step": 411510 - }, - { - "epoch": 0.72, - "learning_rate": 1.4117928131223471e-05, - "loss": 2.2296, - "step": 411520 - }, - { - "epoch": 0.72, - "learning_rate": 1.4117056191296645e-05, - "loss": 2.3165, - "step": 411530 - }, - { - "epoch": 0.72, - "learning_rate": 1.4116184251369819e-05, - "loss": 2.2996, - "step": 411540 - }, - { - "epoch": 0.72, - "learning_rate": 1.4115312311442991e-05, - "loss": 2.2728, - "step": 411550 - }, - { - "epoch": 0.72, - "learning_rate": 1.4114440371516167e-05, - "loss": 2.345, - "step": 411560 - }, - { - "epoch": 0.72, - "learning_rate": 1.4113568431589339e-05, - "loss": 2.2952, - "step": 411570 - }, - { - "epoch": 0.72, - "learning_rate": 1.411269649166251e-05, - "loss": 2.3407, - "step": 411580 - }, - { - "epoch": 0.72, - "learning_rate": 1.4111824551735683e-05, - "loss": 2.3325, - "step": 411590 - }, - { - "epoch": 0.72, - "learning_rate": 1.4110952611808858e-05, - "loss": 2.3098, - "step": 411600 - }, - { - "epoch": 0.72, - "learning_rate": 1.411008067188203e-05, - "loss": 2.2148, - "step": 411610 - }, - { - "epoch": 0.72, - "learning_rate": 1.4109208731955204e-05, - "loss": 2.3238, - "step": 411620 - }, - { - "epoch": 0.72, - "learning_rate": 1.4108336792028376e-05, - "loss": 2.4254, - "step": 411630 - }, - { - "epoch": 0.72, - "learning_rate": 1.4107464852101552e-05, - "loss": 2.2651, - "step": 411640 - }, - { - "epoch": 0.72, - "learning_rate": 1.4106592912174724e-05, - "loss": 2.283, - "step": 411650 - }, - { - "epoch": 0.72, - "learning_rate": 1.4105720972247896e-05, - "loss": 2.3913, - "step": 411660 - }, - { - "epoch": 0.72, - "learning_rate": 1.4104849032321068e-05, - "loss": 2.1865, - "step": 411670 - }, - { - "epoch": 0.72, - "learning_rate": 1.4103977092394243e-05, - "loss": 2.309, - "step": 411680 - }, - { - "epoch": 0.72, - "learning_rate": 1.4103105152467417e-05, - "loss": 2.2547, - "step": 411690 - }, - { - "epoch": 0.72, - "learning_rate": 1.410223321254059e-05, - "loss": 2.3469, - "step": 411700 - }, - { - "epoch": 0.72, - "learning_rate": 1.4101361272613765e-05, - "loss": 2.3642, - "step": 411710 - }, - { - "epoch": 0.72, - "learning_rate": 1.4100489332686937e-05, - "loss": 2.215, - "step": 411720 - }, - { - "epoch": 0.72, - "learning_rate": 1.4099617392760109e-05, - "loss": 2.2612, - "step": 411730 - }, - { - "epoch": 0.72, - "learning_rate": 1.4098745452833281e-05, - "loss": 2.1988, - "step": 411740 - }, - { - "epoch": 0.72, - "learning_rate": 1.4097873512906456e-05, - "loss": 2.2863, - "step": 411750 - }, - { - "epoch": 0.72, - "learning_rate": 1.4097001572979628e-05, - "loss": 2.2704, - "step": 411760 - }, - { - "epoch": 0.72, - "learning_rate": 1.4096129633052802e-05, - "loss": 2.3557, - "step": 411770 - }, - { - "epoch": 0.72, - "learning_rate": 1.4095257693125974e-05, - "loss": 2.2288, - "step": 411780 - }, - { - "epoch": 0.72, - "learning_rate": 1.409438575319915e-05, - "loss": 2.2656, - "step": 411790 - }, - { - "epoch": 0.72, - "learning_rate": 1.4093513813272322e-05, - "loss": 2.3459, - "step": 411800 - }, - { - "epoch": 0.72, - "learning_rate": 1.4092641873345494e-05, - "loss": 2.1948, - "step": 411810 - }, - { - "epoch": 0.72, - "learning_rate": 1.409176993341867e-05, - "loss": 2.3969, - "step": 411820 - }, - { - "epoch": 0.72, - "learning_rate": 1.4090897993491841e-05, - "loss": 2.2622, - "step": 411830 - }, - { - "epoch": 0.72, - "learning_rate": 1.4090026053565013e-05, - "loss": 2.3233, - "step": 411840 - }, - { - "epoch": 0.72, - "learning_rate": 1.4089154113638187e-05, - "loss": 2.2456, - "step": 411850 - }, - { - "epoch": 0.72, - "learning_rate": 1.4088282173711361e-05, - "loss": 2.3021, - "step": 411860 - }, - { - "epoch": 0.72, - "learning_rate": 1.4087410233784535e-05, - "loss": 2.2741, - "step": 411870 - }, - { - "epoch": 0.72, - "learning_rate": 1.4086538293857707e-05, - "loss": 2.1965, - "step": 411880 - }, - { - "epoch": 0.72, - "learning_rate": 1.4085666353930879e-05, - "loss": 2.3674, - "step": 411890 - }, - { - "epoch": 0.72, - "learning_rate": 1.4084794414004054e-05, - "loss": 2.2483, - "step": 411900 - }, - { - "epoch": 0.72, - "learning_rate": 1.4083922474077226e-05, - "loss": 2.219, - "step": 411910 - }, - { - "epoch": 0.72, - "learning_rate": 1.4083050534150399e-05, - "loss": 2.313, - "step": 411920 - }, - { - "epoch": 0.72, - "learning_rate": 1.4082178594223572e-05, - "loss": 2.2417, - "step": 411930 - }, - { - "epoch": 0.72, - "learning_rate": 1.4081306654296748e-05, - "loss": 2.3373, - "step": 411940 - }, - { - "epoch": 0.72, - "learning_rate": 1.408043471436992e-05, - "loss": 2.365, - "step": 411950 - }, - { - "epoch": 0.72, - "learning_rate": 1.4079562774443092e-05, - "loss": 2.3641, - "step": 411960 - }, - { - "epoch": 0.72, - "learning_rate": 1.4078690834516267e-05, - "loss": 2.2961, - "step": 411970 - }, - { - "epoch": 0.72, - "learning_rate": 1.407781889458944e-05, - "loss": 2.3343, - "step": 411980 - }, - { - "epoch": 0.72, - "learning_rate": 1.4076946954662612e-05, - "loss": 2.267, - "step": 411990 - }, - { - "epoch": 0.72, - "learning_rate": 1.4076075014735785e-05, - "loss": 2.1972, - "step": 412000 - }, - { - "epoch": 0.72, - "learning_rate": 1.4075203074808959e-05, - "loss": 2.2664, - "step": 412010 - }, - { - "epoch": 0.72, - "learning_rate": 1.4074331134882133e-05, - "loss": 2.3482, - "step": 412020 - }, - { - "epoch": 0.72, - "learning_rate": 1.4073459194955305e-05, - "loss": 2.2937, - "step": 412030 - }, - { - "epoch": 0.72, - "learning_rate": 1.4072587255028477e-05, - "loss": 2.4094, - "step": 412040 - }, - { - "epoch": 0.72, - "learning_rate": 1.4071715315101652e-05, - "loss": 2.279, - "step": 412050 - }, - { - "epoch": 0.72, - "learning_rate": 1.4070843375174825e-05, - "loss": 2.3856, - "step": 412060 - }, - { - "epoch": 0.72, - "learning_rate": 1.4069971435247997e-05, - "loss": 2.2145, - "step": 412070 - }, - { - "epoch": 0.72, - "learning_rate": 1.406909949532117e-05, - "loss": 2.2984, - "step": 412080 - }, - { - "epoch": 0.72, - "learning_rate": 1.4068227555394344e-05, - "loss": 2.3559, - "step": 412090 - }, - { - "epoch": 0.72, - "learning_rate": 1.4067355615467518e-05, - "loss": 2.4158, - "step": 412100 - }, - { - "epoch": 0.72, - "learning_rate": 1.406648367554069e-05, - "loss": 2.3435, - "step": 412110 - }, - { - "epoch": 0.72, - "learning_rate": 1.4065611735613865e-05, - "loss": 2.2828, - "step": 412120 - }, - { - "epoch": 0.72, - "learning_rate": 1.4064739795687038e-05, - "loss": 2.3059, - "step": 412130 - }, - { - "epoch": 0.72, - "learning_rate": 1.406386785576021e-05, - "loss": 2.3188, - "step": 412140 - }, - { - "epoch": 0.72, - "learning_rate": 1.4062995915833382e-05, - "loss": 2.42, - "step": 412150 - }, - { - "epoch": 0.72, - "learning_rate": 1.4062123975906557e-05, - "loss": 2.364, - "step": 412160 - }, - { - "epoch": 0.72, - "learning_rate": 1.406125203597973e-05, - "loss": 2.3518, - "step": 412170 - }, - { - "epoch": 0.72, - "learning_rate": 1.4060380096052903e-05, - "loss": 2.2879, - "step": 412180 - }, - { - "epoch": 0.72, - "learning_rate": 1.4059508156126075e-05, - "loss": 2.3535, - "step": 412190 - }, - { - "epoch": 0.72, - "learning_rate": 1.405863621619925e-05, - "loss": 2.3537, - "step": 412200 - }, - { - "epoch": 0.72, - "learning_rate": 1.4057764276272423e-05, - "loss": 2.3015, - "step": 412210 - }, - { - "epoch": 0.72, - "learning_rate": 1.4056892336345595e-05, - "loss": 2.3915, - "step": 412220 - }, - { - "epoch": 0.72, - "learning_rate": 1.405602039641877e-05, - "loss": 2.1822, - "step": 412230 - }, - { - "epoch": 0.72, - "learning_rate": 1.4055148456491942e-05, - "loss": 2.277, - "step": 412240 - }, - { - "epoch": 0.72, - "learning_rate": 1.4054276516565116e-05, - "loss": 2.2915, - "step": 412250 - }, - { - "epoch": 0.72, - "learning_rate": 1.4053404576638288e-05, - "loss": 2.1519, - "step": 412260 - }, - { - "epoch": 0.72, - "learning_rate": 1.4052532636711464e-05, - "loss": 2.3618, - "step": 412270 - }, - { - "epoch": 0.72, - "learning_rate": 1.4051660696784636e-05, - "loss": 2.2291, - "step": 412280 - }, - { - "epoch": 0.72, - "learning_rate": 1.4050788756857808e-05, - "loss": 2.2488, - "step": 412290 - }, - { - "epoch": 0.72, - "learning_rate": 1.404991681693098e-05, - "loss": 2.2491, - "step": 412300 - }, - { - "epoch": 0.72, - "learning_rate": 1.4049044877004155e-05, - "loss": 2.3874, - "step": 412310 - }, - { - "epoch": 0.72, - "learning_rate": 1.4048172937077327e-05, - "loss": 2.3904, - "step": 412320 - }, - { - "epoch": 0.72, - "learning_rate": 1.4047300997150501e-05, - "loss": 2.3105, - "step": 412330 - }, - { - "epoch": 0.72, - "learning_rate": 1.4046429057223673e-05, - "loss": 2.2731, - "step": 412340 - }, - { - "epoch": 0.72, - "learning_rate": 1.4045557117296849e-05, - "loss": 2.3477, - "step": 412350 - }, - { - "epoch": 0.72, - "learning_rate": 1.404468517737002e-05, - "loss": 2.3943, - "step": 412360 - }, - { - "epoch": 0.72, - "learning_rate": 1.4043813237443193e-05, - "loss": 2.223, - "step": 412370 - }, - { - "epoch": 0.72, - "learning_rate": 1.4042941297516368e-05, - "loss": 2.25, - "step": 412380 - }, - { - "epoch": 0.72, - "learning_rate": 1.404206935758954e-05, - "loss": 2.3839, - "step": 412390 - }, - { - "epoch": 0.72, - "learning_rate": 1.4041197417662712e-05, - "loss": 2.4107, - "step": 412400 - }, - { - "epoch": 0.72, - "learning_rate": 1.4040325477735886e-05, - "loss": 2.2539, - "step": 412410 - }, - { - "epoch": 0.72, - "learning_rate": 1.4039453537809062e-05, - "loss": 2.3523, - "step": 412420 - }, - { - "epoch": 0.72, - "learning_rate": 1.4038581597882234e-05, - "loss": 2.3442, - "step": 412430 - }, - { - "epoch": 0.72, - "learning_rate": 1.4037709657955406e-05, - "loss": 2.3334, - "step": 412440 - }, - { - "epoch": 0.72, - "learning_rate": 1.4036837718028578e-05, - "loss": 2.2176, - "step": 412450 - }, - { - "epoch": 0.72, - "learning_rate": 1.4035965778101753e-05, - "loss": 2.2637, - "step": 412460 - }, - { - "epoch": 0.72, - "learning_rate": 1.4035093838174925e-05, - "loss": 2.2419, - "step": 412470 - }, - { - "epoch": 0.72, - "learning_rate": 1.4034221898248097e-05, - "loss": 2.2325, - "step": 412480 - }, - { - "epoch": 0.72, - "learning_rate": 1.4033349958321273e-05, - "loss": 2.3481, - "step": 412490 - }, - { - "epoch": 0.72, - "learning_rate": 1.4032478018394447e-05, - "loss": 2.3503, - "step": 412500 - }, - { - "epoch": 0.72, - "learning_rate": 1.4031606078467619e-05, - "loss": 2.2608, - "step": 412510 - }, - { - "epoch": 0.72, - "learning_rate": 1.4030734138540791e-05, - "loss": 2.2371, - "step": 412520 - }, - { - "epoch": 0.72, - "learning_rate": 1.4029862198613966e-05, - "loss": 2.2422, - "step": 412530 - }, - { - "epoch": 0.72, - "learning_rate": 1.4028990258687138e-05, - "loss": 2.1695, - "step": 412540 - }, - { - "epoch": 0.72, - "learning_rate": 1.402811831876031e-05, - "loss": 2.3628, - "step": 412550 - }, - { - "epoch": 0.72, - "learning_rate": 1.4027246378833484e-05, - "loss": 2.2547, - "step": 412560 - }, - { - "epoch": 0.72, - "learning_rate": 1.4026374438906658e-05, - "loss": 2.2338, - "step": 412570 - }, - { - "epoch": 0.72, - "learning_rate": 1.4025502498979832e-05, - "loss": 2.3372, - "step": 412580 - }, - { - "epoch": 0.72, - "learning_rate": 1.4024630559053004e-05, - "loss": 2.3338, - "step": 412590 - }, - { - "epoch": 0.72, - "learning_rate": 1.4023758619126176e-05, - "loss": 2.292, - "step": 412600 - }, - { - "epoch": 0.72, - "learning_rate": 1.4022886679199351e-05, - "loss": 2.1934, - "step": 412610 - }, - { - "epoch": 0.72, - "learning_rate": 1.4022014739272523e-05, - "loss": 2.3415, - "step": 412620 - }, - { - "epoch": 0.72, - "learning_rate": 1.4021142799345696e-05, - "loss": 2.4619, - "step": 412630 - }, - { - "epoch": 0.72, - "learning_rate": 1.4020270859418871e-05, - "loss": 2.2732, - "step": 412640 - }, - { - "epoch": 0.72, - "learning_rate": 1.4019398919492043e-05, - "loss": 2.3118, - "step": 412650 - }, - { - "epoch": 0.72, - "learning_rate": 1.4018526979565217e-05, - "loss": 2.3868, - "step": 412660 - }, - { - "epoch": 0.72, - "learning_rate": 1.4017655039638389e-05, - "loss": 2.3708, - "step": 412670 - }, - { - "epoch": 0.72, - "learning_rate": 1.4016783099711564e-05, - "loss": 2.2847, - "step": 412680 - }, - { - "epoch": 0.72, - "learning_rate": 1.4015911159784736e-05, - "loss": 2.1828, - "step": 412690 - }, - { - "epoch": 0.72, - "learning_rate": 1.4015039219857909e-05, - "loss": 2.4773, - "step": 412700 - }, - { - "epoch": 0.72, - "learning_rate": 1.401416727993108e-05, - "loss": 2.3921, - "step": 412710 - }, - { - "epoch": 0.72, - "learning_rate": 1.4013295340004256e-05, - "loss": 2.1711, - "step": 412720 - }, - { - "epoch": 0.72, - "learning_rate": 1.401242340007743e-05, - "loss": 2.2785, - "step": 412730 - }, - { - "epoch": 0.72, - "learning_rate": 1.4011551460150602e-05, - "loss": 2.3721, - "step": 412740 - }, - { - "epoch": 0.72, - "learning_rate": 1.4010679520223774e-05, - "loss": 2.2685, - "step": 412750 - }, - { - "epoch": 0.72, - "learning_rate": 1.400980758029695e-05, - "loss": 2.36, - "step": 412760 - }, - { - "epoch": 0.72, - "learning_rate": 1.4008935640370122e-05, - "loss": 2.3122, - "step": 412770 - }, - { - "epoch": 0.72, - "learning_rate": 1.4008063700443294e-05, - "loss": 2.2705, - "step": 412780 - }, - { - "epoch": 0.72, - "learning_rate": 1.4007191760516469e-05, - "loss": 2.3748, - "step": 412790 - }, - { - "epoch": 0.72, - "learning_rate": 1.4006319820589641e-05, - "loss": 2.4002, - "step": 412800 - }, - { - "epoch": 0.72, - "learning_rate": 1.4005447880662815e-05, - "loss": 2.2831, - "step": 412810 - }, - { - "epoch": 0.72, - "learning_rate": 1.4004575940735987e-05, - "loss": 2.2681, - "step": 412820 - }, - { - "epoch": 0.72, - "learning_rate": 1.4003704000809162e-05, - "loss": 2.3096, - "step": 412830 - }, - { - "epoch": 0.72, - "learning_rate": 1.4002832060882335e-05, - "loss": 2.2949, - "step": 412840 - }, - { - "epoch": 0.72, - "learning_rate": 1.4001960120955507e-05, - "loss": 2.2591, - "step": 412850 - }, - { - "epoch": 0.72, - "learning_rate": 1.4001088181028679e-05, - "loss": 2.278, - "step": 412860 - }, - { - "epoch": 0.72, - "learning_rate": 1.4000216241101854e-05, - "loss": 2.2874, - "step": 412870 - }, - { - "epoch": 0.72, - "learning_rate": 1.3999344301175026e-05, - "loss": 2.3639, - "step": 412880 - }, - { - "epoch": 0.72, - "learning_rate": 1.39984723612482e-05, - "loss": 2.327, - "step": 412890 - }, - { - "epoch": 0.72, - "learning_rate": 1.3997600421321374e-05, - "loss": 2.2791, - "step": 412900 - }, - { - "epoch": 0.72, - "learning_rate": 1.3996728481394548e-05, - "loss": 2.3977, - "step": 412910 - }, - { - "epoch": 0.72, - "learning_rate": 1.399585654146772e-05, - "loss": 2.2388, - "step": 412920 - }, - { - "epoch": 0.72, - "learning_rate": 1.3994984601540892e-05, - "loss": 2.3345, - "step": 412930 - }, - { - "epoch": 0.72, - "learning_rate": 1.3994112661614067e-05, - "loss": 2.315, - "step": 412940 - }, - { - "epoch": 0.72, - "learning_rate": 1.399324072168724e-05, - "loss": 2.2887, - "step": 412950 - }, - { - "epoch": 0.72, - "learning_rate": 1.3992368781760411e-05, - "loss": 2.3151, - "step": 412960 - }, - { - "epoch": 0.72, - "learning_rate": 1.3991496841833585e-05, - "loss": 2.4646, - "step": 412970 - }, - { - "epoch": 0.72, - "learning_rate": 1.399062490190676e-05, - "loss": 2.2717, - "step": 412980 - }, - { - "epoch": 0.72, - "learning_rate": 1.3989752961979933e-05, - "loss": 2.3367, - "step": 412990 - }, - { - "epoch": 0.72, - "learning_rate": 1.3988881022053105e-05, - "loss": 2.3176, - "step": 413000 - }, - { - "epoch": 0.72, - "learning_rate": 1.3988009082126277e-05, - "loss": 2.3394, - "step": 413010 - }, - { - "epoch": 0.72, - "learning_rate": 1.3987137142199452e-05, - "loss": 2.3453, - "step": 413020 - }, - { - "epoch": 0.72, - "learning_rate": 1.3986265202272624e-05, - "loss": 2.2606, - "step": 413030 - }, - { - "epoch": 0.72, - "learning_rate": 1.3985393262345798e-05, - "loss": 2.2967, - "step": 413040 - }, - { - "epoch": 0.72, - "learning_rate": 1.3984521322418972e-05, - "loss": 2.3233, - "step": 413050 - }, - { - "epoch": 0.72, - "learning_rate": 1.3983649382492146e-05, - "loss": 2.3533, - "step": 413060 - }, - { - "epoch": 0.72, - "learning_rate": 1.3982777442565318e-05, - "loss": 2.2431, - "step": 413070 - }, - { - "epoch": 0.72, - "learning_rate": 1.398190550263849e-05, - "loss": 2.4271, - "step": 413080 - }, - { - "epoch": 0.72, - "learning_rate": 1.3981033562711665e-05, - "loss": 2.3302, - "step": 413090 - }, - { - "epoch": 0.72, - "learning_rate": 1.3980161622784837e-05, - "loss": 2.2829, - "step": 413100 - }, - { - "epoch": 0.72, - "learning_rate": 1.397928968285801e-05, - "loss": 2.2974, - "step": 413110 - }, - { - "epoch": 0.72, - "learning_rate": 1.3978417742931183e-05, - "loss": 2.2764, - "step": 413120 - }, - { - "epoch": 0.72, - "learning_rate": 1.3977545803004357e-05, - "loss": 2.3293, - "step": 413130 - }, - { - "epoch": 0.72, - "learning_rate": 1.397667386307753e-05, - "loss": 2.3089, - "step": 413140 - }, - { - "epoch": 0.72, - "learning_rate": 1.3975801923150703e-05, - "loss": 2.3142, - "step": 413150 - }, - { - "epoch": 0.72, - "learning_rate": 1.3974929983223878e-05, - "loss": 2.3383, - "step": 413160 - }, - { - "epoch": 0.72, - "learning_rate": 1.397405804329705e-05, - "loss": 2.3274, - "step": 413170 - }, - { - "epoch": 0.72, - "learning_rate": 1.3973186103370222e-05, - "loss": 2.371, - "step": 413180 - }, - { - "epoch": 0.72, - "learning_rate": 1.3972314163443394e-05, - "loss": 2.2662, - "step": 413190 - }, - { - "epoch": 0.72, - "learning_rate": 1.397144222351657e-05, - "loss": 2.3364, - "step": 413200 - }, - { - "epoch": 0.72, - "learning_rate": 1.3970570283589742e-05, - "loss": 2.3185, - "step": 413210 - }, - { - "epoch": 0.72, - "learning_rate": 1.3969698343662916e-05, - "loss": 2.2819, - "step": 413220 - }, - { - "epoch": 0.72, - "learning_rate": 1.3968826403736088e-05, - "loss": 2.2856, - "step": 413230 - }, - { - "epoch": 0.72, - "learning_rate": 1.3967954463809263e-05, - "loss": 2.3645, - "step": 413240 - }, - { - "epoch": 0.72, - "learning_rate": 1.3967082523882435e-05, - "loss": 2.3464, - "step": 413250 - }, - { - "epoch": 0.72, - "learning_rate": 1.3966210583955607e-05, - "loss": 2.3727, - "step": 413260 - }, - { - "epoch": 0.72, - "learning_rate": 1.396533864402878e-05, - "loss": 2.2689, - "step": 413270 - }, - { - "epoch": 0.72, - "learning_rate": 1.3964466704101955e-05, - "loss": 2.4352, - "step": 413280 - }, - { - "epoch": 0.72, - "learning_rate": 1.3963594764175129e-05, - "loss": 2.3032, - "step": 413290 - }, - { - "epoch": 0.72, - "learning_rate": 1.3962722824248301e-05, - "loss": 2.2381, - "step": 413300 - }, - { - "epoch": 0.72, - "learning_rate": 1.3961850884321476e-05, - "loss": 2.3282, - "step": 413310 - }, - { - "epoch": 0.72, - "learning_rate": 1.3960978944394648e-05, - "loss": 2.2147, - "step": 413320 - }, - { - "epoch": 0.72, - "learning_rate": 1.396010700446782e-05, - "loss": 2.4243, - "step": 413330 - }, - { - "epoch": 0.72, - "learning_rate": 1.3959235064540993e-05, - "loss": 2.206, - "step": 413340 - }, - { - "epoch": 0.72, - "learning_rate": 1.3958363124614168e-05, - "loss": 2.2412, - "step": 413350 - }, - { - "epoch": 0.72, - "learning_rate": 1.395749118468734e-05, - "loss": 2.4255, - "step": 413360 - }, - { - "epoch": 0.72, - "learning_rate": 1.3956619244760514e-05, - "loss": 2.2955, - "step": 413370 - }, - { - "epoch": 0.72, - "learning_rate": 1.3955747304833686e-05, - "loss": 2.3742, - "step": 413380 - }, - { - "epoch": 0.72, - "learning_rate": 1.3954875364906861e-05, - "loss": 2.3123, - "step": 413390 - }, - { - "epoch": 0.72, - "learning_rate": 1.3954003424980033e-05, - "loss": 2.3239, - "step": 413400 - }, - { - "epoch": 0.72, - "learning_rate": 1.3953131485053206e-05, - "loss": 2.2314, - "step": 413410 - }, - { - "epoch": 0.72, - "learning_rate": 1.3952259545126381e-05, - "loss": 2.335, - "step": 413420 - }, - { - "epoch": 0.72, - "learning_rate": 1.3951387605199553e-05, - "loss": 2.2558, - "step": 413430 - }, - { - "epoch": 0.72, - "learning_rate": 1.3950515665272725e-05, - "loss": 2.3397, - "step": 413440 - }, - { - "epoch": 0.72, - "learning_rate": 1.3949643725345899e-05, - "loss": 2.3072, - "step": 413450 - }, - { - "epoch": 0.72, - "learning_rate": 1.3948771785419074e-05, - "loss": 2.1826, - "step": 413460 - }, - { - "epoch": 0.72, - "learning_rate": 1.3947899845492246e-05, - "loss": 2.435, - "step": 413470 - }, - { - "epoch": 0.72, - "learning_rate": 1.3947027905565419e-05, - "loss": 2.3543, - "step": 413480 - }, - { - "epoch": 0.72, - "learning_rate": 1.394615596563859e-05, - "loss": 2.3236, - "step": 413490 - }, - { - "epoch": 0.72, - "learning_rate": 1.3945284025711766e-05, - "loss": 2.347, - "step": 413500 - }, - { - "epoch": 0.72, - "learning_rate": 1.3944412085784938e-05, - "loss": 2.2568, - "step": 413510 - }, - { - "epoch": 0.72, - "learning_rate": 1.394354014585811e-05, - "loss": 2.3404, - "step": 413520 - }, - { - "epoch": 0.72, - "learning_rate": 1.3942668205931284e-05, - "loss": 2.3346, - "step": 413530 - }, - { - "epoch": 0.72, - "learning_rate": 1.394179626600446e-05, - "loss": 2.2398, - "step": 413540 - }, - { - "epoch": 0.72, - "learning_rate": 1.3940924326077632e-05, - "loss": 2.2857, - "step": 413550 - }, - { - "epoch": 0.72, - "learning_rate": 1.3940052386150804e-05, - "loss": 2.1688, - "step": 413560 - }, - { - "epoch": 0.72, - "learning_rate": 1.3939180446223979e-05, - "loss": 2.3378, - "step": 413570 - }, - { - "epoch": 0.72, - "learning_rate": 1.3938308506297151e-05, - "loss": 2.2542, - "step": 413580 - }, - { - "epoch": 0.72, - "learning_rate": 1.3937436566370323e-05, - "loss": 2.2833, - "step": 413590 - }, - { - "epoch": 0.72, - "learning_rate": 1.3936564626443497e-05, - "loss": 2.3578, - "step": 413600 - }, - { - "epoch": 0.72, - "learning_rate": 1.393569268651667e-05, - "loss": 2.3295, - "step": 413610 - }, - { - "epoch": 0.72, - "learning_rate": 1.3934820746589845e-05, - "loss": 2.2849, - "step": 413620 - }, - { - "epoch": 0.72, - "learning_rate": 1.3933948806663017e-05, - "loss": 2.3786, - "step": 413630 - }, - { - "epoch": 0.72, - "learning_rate": 1.3933076866736189e-05, - "loss": 2.3338, - "step": 413640 - }, - { - "epoch": 0.72, - "learning_rate": 1.3932204926809364e-05, - "loss": 2.3075, - "step": 413650 - }, - { - "epoch": 0.72, - "learning_rate": 1.3931332986882536e-05, - "loss": 2.2543, - "step": 413660 - }, - { - "epoch": 0.72, - "learning_rate": 1.3930461046955708e-05, - "loss": 2.3831, - "step": 413670 - }, - { - "epoch": 0.72, - "learning_rate": 1.3929589107028882e-05, - "loss": 2.3333, - "step": 413680 - }, - { - "epoch": 0.72, - "learning_rate": 1.3928717167102056e-05, - "loss": 2.2634, - "step": 413690 - }, - { - "epoch": 0.72, - "learning_rate": 1.392784522717523e-05, - "loss": 2.2454, - "step": 413700 - }, - { - "epoch": 0.72, - "learning_rate": 1.3926973287248402e-05, - "loss": 2.2685, - "step": 413710 - }, - { - "epoch": 0.72, - "learning_rate": 1.3926101347321577e-05, - "loss": 2.2409, - "step": 413720 - }, - { - "epoch": 0.72, - "learning_rate": 1.392522940739475e-05, - "loss": 2.4206, - "step": 413730 - }, - { - "epoch": 0.72, - "learning_rate": 1.3924357467467921e-05, - "loss": 2.3922, - "step": 413740 - }, - { - "epoch": 0.72, - "learning_rate": 1.3923485527541093e-05, - "loss": 2.1995, - "step": 413750 - }, - { - "epoch": 0.72, - "learning_rate": 1.3922613587614269e-05, - "loss": 2.2769, - "step": 413760 - }, - { - "epoch": 0.72, - "learning_rate": 1.3921741647687443e-05, - "loss": 2.4169, - "step": 413770 - }, - { - "epoch": 0.72, - "learning_rate": 1.3920869707760615e-05, - "loss": 2.267, - "step": 413780 - }, - { - "epoch": 0.72, - "learning_rate": 1.3919997767833787e-05, - "loss": 2.2818, - "step": 413790 - }, - { - "epoch": 0.72, - "learning_rate": 1.3919125827906962e-05, - "loss": 2.1798, - "step": 413800 - }, - { - "epoch": 0.72, - "learning_rate": 1.3918253887980134e-05, - "loss": 2.3588, - "step": 413810 - }, - { - "epoch": 0.72, - "learning_rate": 1.3917381948053306e-05, - "loss": 2.1618, - "step": 413820 - }, - { - "epoch": 0.72, - "learning_rate": 1.3916510008126482e-05, - "loss": 2.4103, - "step": 413830 - }, - { - "epoch": 0.72, - "learning_rate": 1.3915638068199654e-05, - "loss": 2.3578, - "step": 413840 - }, - { - "epoch": 0.72, - "learning_rate": 1.3914766128272828e-05, - "loss": 2.306, - "step": 413850 - }, - { - "epoch": 0.72, - "learning_rate": 1.3913894188346e-05, - "loss": 2.324, - "step": 413860 - }, - { - "epoch": 0.72, - "learning_rate": 1.3913022248419175e-05, - "loss": 2.2739, - "step": 413870 - }, - { - "epoch": 0.72, - "learning_rate": 1.3912150308492347e-05, - "loss": 2.4021, - "step": 413880 - }, - { - "epoch": 0.72, - "learning_rate": 1.391127836856552e-05, - "loss": 2.3038, - "step": 413890 - }, - { - "epoch": 0.72, - "learning_rate": 1.3910406428638692e-05, - "loss": 2.2743, - "step": 413900 - }, - { - "epoch": 0.72, - "learning_rate": 1.3909534488711867e-05, - "loss": 2.37, - "step": 413910 - }, - { - "epoch": 0.72, - "learning_rate": 1.3908662548785039e-05, - "loss": 2.2735, - "step": 413920 - }, - { - "epoch": 0.72, - "learning_rate": 1.3907790608858213e-05, - "loss": 2.2985, - "step": 413930 - }, - { - "epoch": 0.72, - "learning_rate": 1.3906918668931385e-05, - "loss": 2.2921, - "step": 413940 - }, - { - "epoch": 0.72, - "learning_rate": 1.390604672900456e-05, - "loss": 2.2775, - "step": 413950 - }, - { - "epoch": 0.72, - "learning_rate": 1.3905174789077732e-05, - "loss": 2.1681, - "step": 413960 - }, - { - "epoch": 0.72, - "learning_rate": 1.3904302849150905e-05, - "loss": 2.423, - "step": 413970 - }, - { - "epoch": 0.72, - "learning_rate": 1.390343090922408e-05, - "loss": 2.186, - "step": 413980 - }, - { - "epoch": 0.72, - "learning_rate": 1.3902558969297252e-05, - "loss": 2.2277, - "step": 413990 - }, - { - "epoch": 0.72, - "learning_rate": 1.3901687029370424e-05, - "loss": 2.1995, - "step": 414000 - }, - { - "epoch": 0.72, - "learning_rate": 1.3900815089443598e-05, - "loss": 2.3167, - "step": 414010 - }, - { - "epoch": 0.72, - "learning_rate": 1.3899943149516773e-05, - "loss": 2.3119, - "step": 414020 - }, - { - "epoch": 0.72, - "learning_rate": 1.3899071209589945e-05, - "loss": 2.3705, - "step": 414030 - }, - { - "epoch": 0.72, - "learning_rate": 1.3898199269663118e-05, - "loss": 2.3055, - "step": 414040 - }, - { - "epoch": 0.72, - "learning_rate": 1.389732732973629e-05, - "loss": 2.3548, - "step": 414050 - }, - { - "epoch": 0.72, - "learning_rate": 1.3896455389809465e-05, - "loss": 2.2253, - "step": 414060 - }, - { - "epoch": 0.72, - "learning_rate": 1.3895583449882637e-05, - "loss": 2.419, - "step": 414070 - }, - { - "epoch": 0.72, - "learning_rate": 1.3894711509955811e-05, - "loss": 2.4399, - "step": 414080 - }, - { - "epoch": 0.72, - "learning_rate": 1.3893839570028985e-05, - "loss": 2.2303, - "step": 414090 - }, - { - "epoch": 0.72, - "learning_rate": 1.3892967630102158e-05, - "loss": 2.3062, - "step": 414100 - }, - { - "epoch": 0.72, - "learning_rate": 1.389209569017533e-05, - "loss": 2.3316, - "step": 414110 - }, - { - "epoch": 0.72, - "learning_rate": 1.3891223750248503e-05, - "loss": 2.3971, - "step": 414120 - }, - { - "epoch": 0.72, - "learning_rate": 1.3890351810321678e-05, - "loss": 2.2045, - "step": 414130 - }, - { - "epoch": 0.72, - "learning_rate": 1.388947987039485e-05, - "loss": 2.2341, - "step": 414140 - }, - { - "epoch": 0.72, - "learning_rate": 1.3888607930468022e-05, - "loss": 2.3123, - "step": 414150 - }, - { - "epoch": 0.72, - "learning_rate": 1.3887735990541196e-05, - "loss": 2.3413, - "step": 414160 - }, - { - "epoch": 0.72, - "learning_rate": 1.388686405061437e-05, - "loss": 2.4197, - "step": 414170 - }, - { - "epoch": 0.72, - "learning_rate": 1.3885992110687544e-05, - "loss": 2.2643, - "step": 414180 - }, - { - "epoch": 0.72, - "learning_rate": 1.3885120170760716e-05, - "loss": 2.339, - "step": 414190 - }, - { - "epoch": 0.72, - "learning_rate": 1.3884248230833888e-05, - "loss": 2.3222, - "step": 414200 - }, - { - "epoch": 0.72, - "learning_rate": 1.3883376290907063e-05, - "loss": 2.2482, - "step": 414210 - }, - { - "epoch": 0.72, - "learning_rate": 1.3882504350980235e-05, - "loss": 2.2677, - "step": 414220 - }, - { - "epoch": 0.72, - "learning_rate": 1.3881632411053407e-05, - "loss": 2.387, - "step": 414230 - }, - { - "epoch": 0.72, - "learning_rate": 1.3880760471126583e-05, - "loss": 2.1745, - "step": 414240 - }, - { - "epoch": 0.72, - "learning_rate": 1.3879888531199755e-05, - "loss": 2.2621, - "step": 414250 - }, - { - "epoch": 0.72, - "learning_rate": 1.3879016591272929e-05, - "loss": 2.3648, - "step": 414260 - }, - { - "epoch": 0.72, - "learning_rate": 1.38781446513461e-05, - "loss": 2.2902, - "step": 414270 - }, - { - "epoch": 0.72, - "learning_rate": 1.3877272711419276e-05, - "loss": 2.326, - "step": 414280 - }, - { - "epoch": 0.72, - "learning_rate": 1.3876400771492448e-05, - "loss": 2.2604, - "step": 414290 - }, - { - "epoch": 0.72, - "learning_rate": 1.387552883156562e-05, - "loss": 2.3448, - "step": 414300 - }, - { - "epoch": 0.72, - "learning_rate": 1.3874656891638792e-05, - "loss": 2.313, - "step": 414310 - }, - { - "epoch": 0.72, - "learning_rate": 1.3873784951711968e-05, - "loss": 2.241, - "step": 414320 - }, - { - "epoch": 0.72, - "learning_rate": 1.3872913011785142e-05, - "loss": 2.2767, - "step": 414330 - }, - { - "epoch": 0.72, - "learning_rate": 1.3872041071858314e-05, - "loss": 2.2855, - "step": 414340 - }, - { - "epoch": 0.72, - "learning_rate": 1.3871169131931489e-05, - "loss": 2.3112, - "step": 414350 - }, - { - "epoch": 0.72, - "learning_rate": 1.3870297192004661e-05, - "loss": 2.2428, - "step": 414360 - }, - { - "epoch": 0.72, - "learning_rate": 1.3869425252077833e-05, - "loss": 2.3461, - "step": 414370 - }, - { - "epoch": 0.72, - "learning_rate": 1.3868553312151005e-05, - "loss": 2.2923, - "step": 414380 - }, - { - "epoch": 0.72, - "learning_rate": 1.386768137222418e-05, - "loss": 2.4235, - "step": 414390 - }, - { - "epoch": 0.72, - "learning_rate": 1.3866809432297353e-05, - "loss": 2.367, - "step": 414400 - }, - { - "epoch": 0.72, - "learning_rate": 1.3865937492370527e-05, - "loss": 2.3201, - "step": 414410 - }, - { - "epoch": 0.72, - "learning_rate": 1.3865065552443699e-05, - "loss": 2.3549, - "step": 414420 - }, - { - "epoch": 0.72, - "learning_rate": 1.3864193612516874e-05, - "loss": 2.3569, - "step": 414430 - }, - { - "epoch": 0.72, - "learning_rate": 1.3863321672590046e-05, - "loss": 2.2674, - "step": 414440 - }, - { - "epoch": 0.72, - "learning_rate": 1.3862449732663218e-05, - "loss": 2.3099, - "step": 414450 - }, - { - "epoch": 0.72, - "learning_rate": 1.386157779273639e-05, - "loss": 2.2065, - "step": 414460 - }, - { - "epoch": 0.72, - "learning_rate": 1.3860705852809566e-05, - "loss": 2.3429, - "step": 414470 - }, - { - "epoch": 0.72, - "learning_rate": 1.3859833912882738e-05, - "loss": 2.3444, - "step": 414480 - }, - { - "epoch": 0.72, - "learning_rate": 1.3858961972955912e-05, - "loss": 2.2147, - "step": 414490 - }, - { - "epoch": 0.72, - "learning_rate": 1.3858090033029087e-05, - "loss": 2.1707, - "step": 414500 - }, - { - "epoch": 0.72, - "learning_rate": 1.385721809310226e-05, - "loss": 2.2482, - "step": 414510 - }, - { - "epoch": 0.72, - "learning_rate": 1.3856346153175431e-05, - "loss": 2.3438, - "step": 414520 - }, - { - "epoch": 0.72, - "learning_rate": 1.3855474213248603e-05, - "loss": 2.2063, - "step": 414530 - }, - { - "epoch": 0.72, - "learning_rate": 1.3854602273321779e-05, - "loss": 2.3334, - "step": 414540 - }, - { - "epoch": 0.72, - "learning_rate": 1.3853730333394951e-05, - "loss": 2.2479, - "step": 414550 - }, - { - "epoch": 0.72, - "learning_rate": 1.3852858393468123e-05, - "loss": 2.2696, - "step": 414560 - }, - { - "epoch": 0.72, - "learning_rate": 1.3851986453541297e-05, - "loss": 2.2955, - "step": 414570 - }, - { - "epoch": 0.72, - "learning_rate": 1.3851114513614472e-05, - "loss": 2.3569, - "step": 414580 - }, - { - "epoch": 0.72, - "learning_rate": 1.3850242573687644e-05, - "loss": 2.3954, - "step": 414590 - }, - { - "epoch": 0.72, - "learning_rate": 1.3849370633760816e-05, - "loss": 2.2585, - "step": 414600 - }, - { - "epoch": 0.72, - "learning_rate": 1.3848498693833989e-05, - "loss": 2.2515, - "step": 414610 - }, - { - "epoch": 0.72, - "learning_rate": 1.3847626753907164e-05, - "loss": 2.1645, - "step": 414620 - }, - { - "epoch": 0.72, - "learning_rate": 1.3846754813980336e-05, - "loss": 2.4385, - "step": 414630 - }, - { - "epoch": 0.72, - "learning_rate": 1.384588287405351e-05, - "loss": 2.2504, - "step": 414640 - }, - { - "epoch": 0.72, - "learning_rate": 1.3845010934126684e-05, - "loss": 2.2776, - "step": 414650 - }, - { - "epoch": 0.72, - "learning_rate": 1.3844138994199857e-05, - "loss": 2.3911, - "step": 414660 - }, - { - "epoch": 0.72, - "learning_rate": 1.384326705427303e-05, - "loss": 2.3224, - "step": 414670 - }, - { - "epoch": 0.72, - "learning_rate": 1.3842395114346202e-05, - "loss": 2.2692, - "step": 414680 - }, - { - "epoch": 0.72, - "learning_rate": 1.3841523174419377e-05, - "loss": 2.3327, - "step": 414690 - }, - { - "epoch": 0.72, - "learning_rate": 1.3840651234492549e-05, - "loss": 2.3016, - "step": 414700 - }, - { - "epoch": 0.72, - "learning_rate": 1.3839779294565721e-05, - "loss": 2.3463, - "step": 414710 - }, - { - "epoch": 0.72, - "learning_rate": 1.3838907354638895e-05, - "loss": 2.4561, - "step": 414720 - }, - { - "epoch": 0.72, - "learning_rate": 1.3838035414712069e-05, - "loss": 2.4446, - "step": 414730 - }, - { - "epoch": 0.72, - "learning_rate": 1.3837163474785242e-05, - "loss": 2.2725, - "step": 414740 - }, - { - "epoch": 0.72, - "learning_rate": 1.3836291534858415e-05, - "loss": 2.2771, - "step": 414750 - }, - { - "epoch": 0.72, - "learning_rate": 1.383541959493159e-05, - "loss": 2.2986, - "step": 414760 - }, - { - "epoch": 0.72, - "learning_rate": 1.3834547655004762e-05, - "loss": 2.3167, - "step": 414770 - }, - { - "epoch": 0.72, - "learning_rate": 1.3833675715077934e-05, - "loss": 2.2509, - "step": 414780 - }, - { - "epoch": 0.72, - "learning_rate": 1.3832803775151106e-05, - "loss": 2.3449, - "step": 414790 - }, - { - "epoch": 0.72, - "learning_rate": 1.3831931835224282e-05, - "loss": 2.4386, - "step": 414800 - }, - { - "epoch": 0.72, - "learning_rate": 1.3831059895297455e-05, - "loss": 2.3438, - "step": 414810 - }, - { - "epoch": 0.72, - "learning_rate": 1.3830187955370628e-05, - "loss": 2.2938, - "step": 414820 - }, - { - "epoch": 0.72, - "learning_rate": 1.38293160154438e-05, - "loss": 2.2716, - "step": 414830 - }, - { - "epoch": 0.72, - "learning_rate": 1.3828444075516975e-05, - "loss": 2.2715, - "step": 414840 - }, - { - "epoch": 0.72, - "learning_rate": 1.3827572135590147e-05, - "loss": 2.2669, - "step": 414850 - }, - { - "epoch": 0.72, - "learning_rate": 1.382670019566332e-05, - "loss": 2.3747, - "step": 414860 - }, - { - "epoch": 0.72, - "learning_rate": 1.3825828255736491e-05, - "loss": 2.2399, - "step": 414870 - }, - { - "epoch": 0.72, - "learning_rate": 1.3824956315809667e-05, - "loss": 2.3042, - "step": 414880 - }, - { - "epoch": 0.72, - "learning_rate": 1.382408437588284e-05, - "loss": 2.3847, - "step": 414890 - }, - { - "epoch": 0.72, - "learning_rate": 1.3823212435956013e-05, - "loss": 2.2952, - "step": 414900 - }, - { - "epoch": 0.72, - "learning_rate": 1.3822340496029188e-05, - "loss": 2.2372, - "step": 414910 - }, - { - "epoch": 0.72, - "learning_rate": 1.382146855610236e-05, - "loss": 2.3008, - "step": 414920 - }, - { - "epoch": 0.72, - "learning_rate": 1.3820596616175532e-05, - "loss": 2.3054, - "step": 414930 - }, - { - "epoch": 0.72, - "learning_rate": 1.3819724676248704e-05, - "loss": 2.2928, - "step": 414940 - }, - { - "epoch": 0.72, - "learning_rate": 1.381885273632188e-05, - "loss": 2.3654, - "step": 414950 - }, - { - "epoch": 0.72, - "learning_rate": 1.3817980796395052e-05, - "loss": 2.3344, - "step": 414960 - }, - { - "epoch": 0.72, - "learning_rate": 1.3817108856468226e-05, - "loss": 2.2504, - "step": 414970 - }, - { - "epoch": 0.72, - "learning_rate": 1.3816236916541398e-05, - "loss": 2.2951, - "step": 414980 - }, - { - "epoch": 0.72, - "learning_rate": 1.3815364976614573e-05, - "loss": 2.2982, - "step": 414990 - }, - { - "epoch": 0.72, - "learning_rate": 1.3814493036687745e-05, - "loss": 2.3187, - "step": 415000 - }, - { - "epoch": 0.72, - "learning_rate": 1.3813621096760917e-05, - "loss": 2.1673, - "step": 415010 - }, - { - "epoch": 0.72, - "learning_rate": 1.3812749156834093e-05, - "loss": 2.2943, - "step": 415020 - }, - { - "epoch": 0.72, - "learning_rate": 1.3811877216907265e-05, - "loss": 2.2697, - "step": 415030 - }, - { - "epoch": 0.72, - "learning_rate": 1.3811005276980437e-05, - "loss": 2.2958, - "step": 415040 - }, - { - "epoch": 0.72, - "learning_rate": 1.381013333705361e-05, - "loss": 2.3928, - "step": 415050 - }, - { - "epoch": 0.72, - "learning_rate": 1.3809261397126786e-05, - "loss": 2.3803, - "step": 415060 - }, - { - "epoch": 0.72, - "learning_rate": 1.3808389457199958e-05, - "loss": 2.2644, - "step": 415070 - }, - { - "epoch": 0.72, - "learning_rate": 1.380751751727313e-05, - "loss": 2.3381, - "step": 415080 - }, - { - "epoch": 0.72, - "learning_rate": 1.3806645577346302e-05, - "loss": 2.2467, - "step": 415090 - }, - { - "epoch": 0.72, - "learning_rate": 1.3805773637419478e-05, - "loss": 2.3133, - "step": 415100 - }, - { - "epoch": 0.72, - "learning_rate": 1.380490169749265e-05, - "loss": 2.3648, - "step": 415110 - }, - { - "epoch": 0.72, - "learning_rate": 1.3804029757565824e-05, - "loss": 2.3277, - "step": 415120 - }, - { - "epoch": 0.72, - "learning_rate": 1.3803157817638996e-05, - "loss": 2.4418, - "step": 415130 - }, - { - "epoch": 0.72, - "learning_rate": 1.3802285877712171e-05, - "loss": 2.281, - "step": 415140 - }, - { - "epoch": 0.72, - "learning_rate": 1.3801413937785343e-05, - "loss": 2.3323, - "step": 415150 - }, - { - "epoch": 0.72, - "learning_rate": 1.3800541997858515e-05, - "loss": 2.396, - "step": 415160 - }, - { - "epoch": 0.72, - "learning_rate": 1.379967005793169e-05, - "loss": 2.3894, - "step": 415170 - }, - { - "epoch": 0.72, - "learning_rate": 1.3798798118004863e-05, - "loss": 2.3257, - "step": 415180 - }, - { - "epoch": 0.72, - "learning_rate": 1.3797926178078035e-05, - "loss": 2.4242, - "step": 415190 - }, - { - "epoch": 0.72, - "learning_rate": 1.3797054238151209e-05, - "loss": 2.3415, - "step": 415200 - }, - { - "epoch": 0.72, - "learning_rate": 1.3796182298224383e-05, - "loss": 2.363, - "step": 415210 - }, - { - "epoch": 0.72, - "learning_rate": 1.3795310358297556e-05, - "loss": 2.1792, - "step": 415220 - }, - { - "epoch": 0.72, - "learning_rate": 1.3794438418370728e-05, - "loss": 2.4018, - "step": 415230 - }, - { - "epoch": 0.72, - "learning_rate": 1.37935664784439e-05, - "loss": 2.3227, - "step": 415240 - }, - { - "epoch": 0.72, - "learning_rate": 1.3792694538517076e-05, - "loss": 2.2331, - "step": 415250 - }, - { - "epoch": 0.72, - "learning_rate": 1.3791822598590248e-05, - "loss": 2.2625, - "step": 415260 - }, - { - "epoch": 0.72, - "learning_rate": 1.379095065866342e-05, - "loss": 2.3046, - "step": 415270 - }, - { - "epoch": 0.72, - "learning_rate": 1.3790078718736596e-05, - "loss": 2.2263, - "step": 415280 - }, - { - "epoch": 0.72, - "learning_rate": 1.3789206778809768e-05, - "loss": 2.3363, - "step": 415290 - }, - { - "epoch": 0.72, - "learning_rate": 1.3788334838882941e-05, - "loss": 2.2121, - "step": 415300 - }, - { - "epoch": 0.72, - "learning_rate": 1.3787462898956113e-05, - "loss": 2.2303, - "step": 415310 - }, - { - "epoch": 0.72, - "learning_rate": 1.3786590959029289e-05, - "loss": 2.2469, - "step": 415320 - }, - { - "epoch": 0.72, - "learning_rate": 1.3785719019102461e-05, - "loss": 2.346, - "step": 415330 - }, - { - "epoch": 0.72, - "learning_rate": 1.3784847079175633e-05, - "loss": 2.3428, - "step": 415340 - }, - { - "epoch": 0.72, - "learning_rate": 1.3783975139248805e-05, - "loss": 2.2102, - "step": 415350 - }, - { - "epoch": 0.72, - "learning_rate": 1.378310319932198e-05, - "loss": 2.2586, - "step": 415360 - }, - { - "epoch": 0.72, - "learning_rate": 1.3782231259395154e-05, - "loss": 2.3218, - "step": 415370 - }, - { - "epoch": 0.72, - "learning_rate": 1.3781359319468326e-05, - "loss": 2.3062, - "step": 415380 - }, - { - "epoch": 0.72, - "learning_rate": 1.3780487379541499e-05, - "loss": 2.2311, - "step": 415390 - }, - { - "epoch": 0.72, - "learning_rate": 1.3779615439614674e-05, - "loss": 2.2892, - "step": 415400 - }, - { - "epoch": 0.72, - "learning_rate": 1.3778743499687846e-05, - "loss": 2.3313, - "step": 415410 - }, - { - "epoch": 0.72, - "learning_rate": 1.3777871559761018e-05, - "loss": 2.3319, - "step": 415420 - }, - { - "epoch": 0.72, - "learning_rate": 1.3776999619834194e-05, - "loss": 2.3042, - "step": 415430 - }, - { - "epoch": 0.72, - "learning_rate": 1.3776127679907366e-05, - "loss": 2.2327, - "step": 415440 - }, - { - "epoch": 0.72, - "learning_rate": 1.377525573998054e-05, - "loss": 2.2598, - "step": 415450 - }, - { - "epoch": 0.72, - "learning_rate": 1.3774383800053712e-05, - "loss": 2.3284, - "step": 415460 - }, - { - "epoch": 0.72, - "learning_rate": 1.3773511860126887e-05, - "loss": 2.3569, - "step": 415470 - }, - { - "epoch": 0.72, - "learning_rate": 1.3772639920200059e-05, - "loss": 2.4733, - "step": 415480 - }, - { - "epoch": 0.72, - "learning_rate": 1.3771767980273231e-05, - "loss": 2.2941, - "step": 415490 - }, - { - "epoch": 0.72, - "learning_rate": 1.3770896040346403e-05, - "loss": 2.3917, - "step": 415500 - }, - { - "epoch": 0.72, - "learning_rate": 1.3770024100419579e-05, - "loss": 2.313, - "step": 415510 - }, - { - "epoch": 0.72, - "learning_rate": 1.376915216049275e-05, - "loss": 2.3749, - "step": 415520 - }, - { - "epoch": 0.72, - "learning_rate": 1.3768280220565925e-05, - "loss": 2.2921, - "step": 415530 - }, - { - "epoch": 0.72, - "learning_rate": 1.3767408280639097e-05, - "loss": 2.4631, - "step": 415540 - }, - { - "epoch": 0.72, - "learning_rate": 1.3766536340712272e-05, - "loss": 2.4096, - "step": 415550 - }, - { - "epoch": 0.72, - "learning_rate": 1.3765664400785444e-05, - "loss": 2.2456, - "step": 415560 - }, - { - "epoch": 0.72, - "learning_rate": 1.3764792460858616e-05, - "loss": 2.3864, - "step": 415570 - }, - { - "epoch": 0.72, - "learning_rate": 1.3763920520931792e-05, - "loss": 2.3681, - "step": 415580 - }, - { - "epoch": 0.72, - "learning_rate": 1.3763048581004964e-05, - "loss": 2.352, - "step": 415590 - }, - { - "epoch": 0.72, - "learning_rate": 1.3762176641078136e-05, - "loss": 2.2698, - "step": 415600 - }, - { - "epoch": 0.72, - "learning_rate": 1.376130470115131e-05, - "loss": 2.2555, - "step": 415610 - }, - { - "epoch": 0.72, - "learning_rate": 1.3760432761224485e-05, - "loss": 2.3244, - "step": 415620 - }, - { - "epoch": 0.72, - "learning_rate": 1.3759560821297657e-05, - "loss": 2.3977, - "step": 415630 - }, - { - "epoch": 0.72, - "learning_rate": 1.375868888137083e-05, - "loss": 2.2446, - "step": 415640 - }, - { - "epoch": 0.72, - "learning_rate": 1.3757816941444001e-05, - "loss": 2.2767, - "step": 415650 - }, - { - "epoch": 0.72, - "learning_rate": 1.3756945001517177e-05, - "loss": 2.2732, - "step": 415660 - }, - { - "epoch": 0.72, - "learning_rate": 1.3756073061590349e-05, - "loss": 2.1919, - "step": 415670 - }, - { - "epoch": 0.72, - "learning_rate": 1.3755201121663523e-05, - "loss": 2.2464, - "step": 415680 - }, - { - "epoch": 0.72, - "learning_rate": 1.3754329181736696e-05, - "loss": 2.3936, - "step": 415690 - }, - { - "epoch": 0.72, - "learning_rate": 1.375345724180987e-05, - "loss": 2.3093, - "step": 415700 - }, - { - "epoch": 0.72, - "learning_rate": 1.3752585301883042e-05, - "loss": 2.2678, - "step": 415710 - }, - { - "epoch": 0.72, - "learning_rate": 1.3751713361956214e-05, - "loss": 2.2637, - "step": 415720 - }, - { - "epoch": 0.72, - "learning_rate": 1.375084142202939e-05, - "loss": 2.3827, - "step": 415730 - }, - { - "epoch": 0.73, - "learning_rate": 1.3749969482102562e-05, - "loss": 2.2377, - "step": 415740 - }, - { - "epoch": 0.73, - "learning_rate": 1.3749097542175734e-05, - "loss": 2.212, - "step": 415750 - }, - { - "epoch": 0.73, - "learning_rate": 1.3748225602248908e-05, - "loss": 2.3252, - "step": 415760 - }, - { - "epoch": 0.73, - "learning_rate": 1.3747353662322081e-05, - "loss": 2.4124, - "step": 415770 - }, - { - "epoch": 0.73, - "learning_rate": 1.3746481722395255e-05, - "loss": 2.4405, - "step": 415780 - }, - { - "epoch": 0.73, - "learning_rate": 1.3745609782468427e-05, - "loss": 2.2972, - "step": 415790 - }, - { - "epoch": 0.73, - "learning_rate": 1.37447378425416e-05, - "loss": 2.2554, - "step": 415800 - }, - { - "epoch": 0.73, - "learning_rate": 1.3743865902614775e-05, - "loss": 2.3053, - "step": 415810 - }, - { - "epoch": 0.73, - "learning_rate": 1.3742993962687947e-05, - "loss": 2.2841, - "step": 415820 - }, - { - "epoch": 0.73, - "learning_rate": 1.3742122022761119e-05, - "loss": 2.2694, - "step": 415830 - }, - { - "epoch": 0.73, - "learning_rate": 1.3741250082834294e-05, - "loss": 2.2948, - "step": 415840 - }, - { - "epoch": 0.73, - "learning_rate": 1.3740378142907468e-05, - "loss": 2.3977, - "step": 415850 - }, - { - "epoch": 0.73, - "learning_rate": 1.373950620298064e-05, - "loss": 2.3165, - "step": 415860 - }, - { - "epoch": 0.73, - "learning_rate": 1.3738634263053812e-05, - "loss": 2.348, - "step": 415870 - }, - { - "epoch": 0.73, - "learning_rate": 1.3737762323126988e-05, - "loss": 2.3273, - "step": 415880 - }, - { - "epoch": 0.73, - "learning_rate": 1.373689038320016e-05, - "loss": 2.3053, - "step": 415890 - }, - { - "epoch": 0.73, - "learning_rate": 1.3736018443273332e-05, - "loss": 2.2154, - "step": 415900 - }, - { - "epoch": 0.73, - "learning_rate": 1.3735146503346504e-05, - "loss": 2.3529, - "step": 415910 - }, - { - "epoch": 0.73, - "learning_rate": 1.373427456341968e-05, - "loss": 2.3012, - "step": 415920 - }, - { - "epoch": 0.73, - "learning_rate": 1.3733402623492853e-05, - "loss": 2.204, - "step": 415930 - }, - { - "epoch": 0.73, - "learning_rate": 1.3732530683566025e-05, - "loss": 2.4152, - "step": 415940 - }, - { - "epoch": 0.73, - "learning_rate": 1.37316587436392e-05, - "loss": 2.4046, - "step": 415950 - }, - { - "epoch": 0.73, - "learning_rate": 1.3730786803712373e-05, - "loss": 2.251, - "step": 415960 - }, - { - "epoch": 0.73, - "learning_rate": 1.3729914863785545e-05, - "loss": 2.2198, - "step": 415970 - }, - { - "epoch": 0.73, - "learning_rate": 1.3729042923858717e-05, - "loss": 2.2971, - "step": 415980 - }, - { - "epoch": 0.73, - "learning_rate": 1.3728170983931893e-05, - "loss": 2.242, - "step": 415990 - }, - { - "epoch": 0.73, - "learning_rate": 1.3727299044005065e-05, - "loss": 2.3331, - "step": 416000 - }, - { - "epoch": 0.73, - "learning_rate": 1.3726427104078238e-05, - "loss": 2.2637, - "step": 416010 - }, - { - "epoch": 0.73, - "learning_rate": 1.372555516415141e-05, - "loss": 2.3179, - "step": 416020 - }, - { - "epoch": 0.73, - "learning_rate": 1.3724683224224586e-05, - "loss": 2.2886, - "step": 416030 - }, - { - "epoch": 0.73, - "learning_rate": 1.3723811284297758e-05, - "loss": 2.3137, - "step": 416040 - }, - { - "epoch": 0.73, - "learning_rate": 1.372293934437093e-05, - "loss": 2.2073, - "step": 416050 - }, - { - "epoch": 0.73, - "learning_rate": 1.3722067404444102e-05, - "loss": 2.323, - "step": 416060 - }, - { - "epoch": 0.73, - "learning_rate": 1.3721195464517278e-05, - "loss": 2.3172, - "step": 416070 - }, - { - "epoch": 0.73, - "learning_rate": 1.372032352459045e-05, - "loss": 2.3427, - "step": 416080 - }, - { - "epoch": 0.73, - "learning_rate": 1.3719451584663623e-05, - "loss": 2.38, - "step": 416090 - }, - { - "epoch": 0.73, - "learning_rate": 1.3718579644736799e-05, - "loss": 2.2764, - "step": 416100 - }, - { - "epoch": 0.73, - "learning_rate": 1.3717707704809971e-05, - "loss": 2.2975, - "step": 416110 - }, - { - "epoch": 0.73, - "learning_rate": 1.3716835764883143e-05, - "loss": 2.2867, - "step": 416120 - }, - { - "epoch": 0.73, - "learning_rate": 1.3715963824956315e-05, - "loss": 2.2478, - "step": 416130 - }, - { - "epoch": 0.73, - "learning_rate": 1.371509188502949e-05, - "loss": 2.2668, - "step": 416140 - }, - { - "epoch": 0.73, - "learning_rate": 1.3714219945102663e-05, - "loss": 2.3715, - "step": 416150 - }, - { - "epoch": 0.73, - "learning_rate": 1.3713348005175836e-05, - "loss": 2.4052, - "step": 416160 - }, - { - "epoch": 0.73, - "learning_rate": 1.3712476065249009e-05, - "loss": 2.4084, - "step": 416170 - }, - { - "epoch": 0.73, - "learning_rate": 1.3711604125322184e-05, - "loss": 2.2185, - "step": 416180 - }, - { - "epoch": 0.73, - "learning_rate": 1.3710732185395356e-05, - "loss": 2.2235, - "step": 416190 - }, - { - "epoch": 0.73, - "learning_rate": 1.3709860245468528e-05, - "loss": 2.2532, - "step": 416200 - }, - { - "epoch": 0.73, - "learning_rate": 1.3708988305541704e-05, - "loss": 2.2648, - "step": 416210 - }, - { - "epoch": 0.73, - "learning_rate": 1.3708116365614876e-05, - "loss": 2.3271, - "step": 416220 - }, - { - "epoch": 0.73, - "learning_rate": 1.3707244425688048e-05, - "loss": 2.3384, - "step": 416230 - }, - { - "epoch": 0.73, - "learning_rate": 1.3706372485761222e-05, - "loss": 2.2476, - "step": 416240 - }, - { - "epoch": 0.73, - "learning_rate": 1.3705500545834395e-05, - "loss": 2.3799, - "step": 416250 - }, - { - "epoch": 0.73, - "learning_rate": 1.3704628605907569e-05, - "loss": 2.3403, - "step": 416260 - }, - { - "epoch": 0.73, - "learning_rate": 1.3703756665980741e-05, - "loss": 2.2183, - "step": 416270 - }, - { - "epoch": 0.73, - "learning_rate": 1.3702884726053913e-05, - "loss": 2.3017, - "step": 416280 - }, - { - "epoch": 0.73, - "learning_rate": 1.3702012786127089e-05, - "loss": 2.2375, - "step": 416290 - }, - { - "epoch": 0.73, - "learning_rate": 1.370114084620026e-05, - "loss": 2.3493, - "step": 416300 - }, - { - "epoch": 0.73, - "learning_rate": 1.3700268906273433e-05, - "loss": 2.1701, - "step": 416310 - }, - { - "epoch": 0.73, - "learning_rate": 1.3699396966346607e-05, - "loss": 2.2827, - "step": 416320 - }, - { - "epoch": 0.73, - "learning_rate": 1.369852502641978e-05, - "loss": 2.3042, - "step": 416330 - }, - { - "epoch": 0.73, - "learning_rate": 1.3697653086492954e-05, - "loss": 2.2023, - "step": 416340 - }, - { - "epoch": 0.73, - "learning_rate": 1.3696781146566126e-05, - "loss": 2.2578, - "step": 416350 - }, - { - "epoch": 0.73, - "learning_rate": 1.3695909206639302e-05, - "loss": 2.3252, - "step": 416360 - }, - { - "epoch": 0.73, - "learning_rate": 1.3695037266712474e-05, - "loss": 2.39, - "step": 416370 - }, - { - "epoch": 0.73, - "learning_rate": 1.3694165326785646e-05, - "loss": 2.3404, - "step": 416380 - }, - { - "epoch": 0.73, - "learning_rate": 1.3693293386858818e-05, - "loss": 2.242, - "step": 416390 - }, - { - "epoch": 0.73, - "learning_rate": 1.3692421446931993e-05, - "loss": 2.2445, - "step": 416400 - }, - { - "epoch": 0.73, - "learning_rate": 1.3691549507005167e-05, - "loss": 2.3567, - "step": 416410 - }, - { - "epoch": 0.73, - "learning_rate": 1.369067756707834e-05, - "loss": 2.2374, - "step": 416420 - }, - { - "epoch": 0.73, - "learning_rate": 1.3689805627151511e-05, - "loss": 2.312, - "step": 416430 - }, - { - "epoch": 0.73, - "learning_rate": 1.3688933687224687e-05, - "loss": 2.2894, - "step": 416440 - }, - { - "epoch": 0.73, - "learning_rate": 1.3688061747297859e-05, - "loss": 2.2745, - "step": 416450 - }, - { - "epoch": 0.73, - "learning_rate": 1.3687189807371031e-05, - "loss": 2.1889, - "step": 416460 - }, - { - "epoch": 0.73, - "learning_rate": 1.3686317867444205e-05, - "loss": 2.3292, - "step": 416470 - }, - { - "epoch": 0.73, - "learning_rate": 1.3685445927517378e-05, - "loss": 2.2992, - "step": 416480 - }, - { - "epoch": 0.73, - "learning_rate": 1.3684573987590552e-05, - "loss": 2.3431, - "step": 416490 - }, - { - "epoch": 0.73, - "learning_rate": 1.3683702047663724e-05, - "loss": 2.2276, - "step": 416500 - }, - { - "epoch": 0.73, - "learning_rate": 1.36828301077369e-05, - "loss": 2.3711, - "step": 416510 - }, - { - "epoch": 0.73, - "learning_rate": 1.3681958167810072e-05, - "loss": 2.3049, - "step": 416520 - }, - { - "epoch": 0.73, - "learning_rate": 1.3681086227883244e-05, - "loss": 2.3162, - "step": 416530 - }, - { - "epoch": 0.73, - "learning_rate": 1.3680214287956416e-05, - "loss": 2.2607, - "step": 416540 - }, - { - "epoch": 0.73, - "learning_rate": 1.3679342348029591e-05, - "loss": 2.2634, - "step": 416550 - }, - { - "epoch": 0.73, - "learning_rate": 1.3678470408102764e-05, - "loss": 2.183, - "step": 416560 - }, - { - "epoch": 0.73, - "learning_rate": 1.3677598468175937e-05, - "loss": 2.249, - "step": 416570 - }, - { - "epoch": 0.73, - "learning_rate": 1.367672652824911e-05, - "loss": 2.2464, - "step": 416580 - }, - { - "epoch": 0.73, - "learning_rate": 1.3675854588322285e-05, - "loss": 2.2819, - "step": 416590 - }, - { - "epoch": 0.73, - "learning_rate": 1.3674982648395457e-05, - "loss": 2.3333, - "step": 416600 - }, - { - "epoch": 0.73, - "learning_rate": 1.3674110708468629e-05, - "loss": 2.4057, - "step": 416610 - }, - { - "epoch": 0.73, - "learning_rate": 1.3673238768541804e-05, - "loss": 2.2897, - "step": 416620 - }, - { - "epoch": 0.73, - "learning_rate": 1.3672366828614977e-05, - "loss": 2.5331, - "step": 416630 - }, - { - "epoch": 0.73, - "learning_rate": 1.3671494888688149e-05, - "loss": 2.1556, - "step": 416640 - }, - { - "epoch": 0.73, - "learning_rate": 1.3670622948761322e-05, - "loss": 2.2206, - "step": 416650 - }, - { - "epoch": 0.73, - "learning_rate": 1.3669751008834498e-05, - "loss": 2.2526, - "step": 416660 - }, - { - "epoch": 0.73, - "learning_rate": 1.366887906890767e-05, - "loss": 2.1602, - "step": 416670 - }, - { - "epoch": 0.73, - "learning_rate": 1.3668007128980842e-05, - "loss": 2.3447, - "step": 416680 - }, - { - "epoch": 0.73, - "learning_rate": 1.3667135189054014e-05, - "loss": 2.2904, - "step": 416690 - }, - { - "epoch": 0.73, - "learning_rate": 1.366626324912719e-05, - "loss": 2.3485, - "step": 416700 - }, - { - "epoch": 0.73, - "learning_rate": 1.3665391309200362e-05, - "loss": 2.3504, - "step": 416710 - }, - { - "epoch": 0.73, - "learning_rate": 1.3664519369273535e-05, - "loss": 2.2875, - "step": 416720 - }, - { - "epoch": 0.73, - "learning_rate": 1.3663647429346707e-05, - "loss": 2.3026, - "step": 416730 - }, - { - "epoch": 0.73, - "learning_rate": 1.3662775489419883e-05, - "loss": 2.284, - "step": 416740 - }, - { - "epoch": 0.73, - "learning_rate": 1.3661903549493055e-05, - "loss": 2.1687, - "step": 416750 - }, - { - "epoch": 0.73, - "learning_rate": 1.3661031609566227e-05, - "loss": 2.3942, - "step": 416760 - }, - { - "epoch": 0.73, - "learning_rate": 1.3660159669639403e-05, - "loss": 2.2521, - "step": 416770 - }, - { - "epoch": 0.73, - "learning_rate": 1.3659287729712575e-05, - "loss": 2.2618, - "step": 416780 - }, - { - "epoch": 0.73, - "learning_rate": 1.3658415789785747e-05, - "loss": 2.2331, - "step": 416790 - }, - { - "epoch": 0.73, - "learning_rate": 1.365754384985892e-05, - "loss": 2.4094, - "step": 416800 - }, - { - "epoch": 0.73, - "learning_rate": 1.3656671909932094e-05, - "loss": 2.2192, - "step": 416810 - }, - { - "epoch": 0.73, - "learning_rate": 1.3655799970005268e-05, - "loss": 2.2283, - "step": 416820 - }, - { - "epoch": 0.73, - "learning_rate": 1.365492803007844e-05, - "loss": 2.2816, - "step": 416830 - }, - { - "epoch": 0.73, - "learning_rate": 1.3654056090151612e-05, - "loss": 2.3655, - "step": 416840 - }, - { - "epoch": 0.73, - "learning_rate": 1.3653184150224788e-05, - "loss": 2.4086, - "step": 416850 - }, - { - "epoch": 0.73, - "learning_rate": 1.365231221029796e-05, - "loss": 2.3266, - "step": 416860 - }, - { - "epoch": 0.73, - "learning_rate": 1.3651440270371132e-05, - "loss": 2.2237, - "step": 416870 - }, - { - "epoch": 0.73, - "learning_rate": 1.3650568330444307e-05, - "loss": 2.3258, - "step": 416880 - }, - { - "epoch": 0.73, - "learning_rate": 1.3649696390517481e-05, - "loss": 2.2466, - "step": 416890 - }, - { - "epoch": 0.73, - "learning_rate": 1.3648824450590653e-05, - "loss": 2.3124, - "step": 416900 - }, - { - "epoch": 0.73, - "learning_rate": 1.3647952510663825e-05, - "loss": 2.3215, - "step": 416910 - }, - { - "epoch": 0.73, - "learning_rate": 1.3647080570737e-05, - "loss": 2.2597, - "step": 416920 - }, - { - "epoch": 0.73, - "learning_rate": 1.3646208630810173e-05, - "loss": 2.2232, - "step": 416930 - }, - { - "epoch": 0.73, - "learning_rate": 1.3645336690883345e-05, - "loss": 2.2931, - "step": 416940 - }, - { - "epoch": 0.73, - "learning_rate": 1.3644464750956517e-05, - "loss": 2.2262, - "step": 416950 - }, - { - "epoch": 0.73, - "learning_rate": 1.3643592811029692e-05, - "loss": 2.3286, - "step": 416960 - }, - { - "epoch": 0.73, - "learning_rate": 1.3642720871102866e-05, - "loss": 2.2995, - "step": 416970 - }, - { - "epoch": 0.73, - "learning_rate": 1.3641848931176038e-05, - "loss": 2.3532, - "step": 416980 - }, - { - "epoch": 0.73, - "learning_rate": 1.364097699124921e-05, - "loss": 2.3452, - "step": 416990 - }, - { - "epoch": 0.73, - "learning_rate": 1.3640105051322386e-05, - "loss": 2.3576, - "step": 417000 - }, - { - "epoch": 0.73, - "learning_rate": 1.3639233111395558e-05, - "loss": 2.2491, - "step": 417010 - }, - { - "epoch": 0.73, - "learning_rate": 1.363836117146873e-05, - "loss": 2.2604, - "step": 417020 - }, - { - "epoch": 0.73, - "learning_rate": 1.3637489231541905e-05, - "loss": 2.3354, - "step": 417030 - }, - { - "epoch": 0.73, - "learning_rate": 1.3636617291615077e-05, - "loss": 2.4027, - "step": 417040 - }, - { - "epoch": 0.73, - "learning_rate": 1.3635745351688251e-05, - "loss": 2.347, - "step": 417050 - }, - { - "epoch": 0.73, - "learning_rate": 1.3634873411761423e-05, - "loss": 2.2956, - "step": 417060 - }, - { - "epoch": 0.73, - "learning_rate": 1.3634001471834599e-05, - "loss": 2.2713, - "step": 417070 - }, - { - "epoch": 0.73, - "learning_rate": 1.363312953190777e-05, - "loss": 2.4122, - "step": 417080 - }, - { - "epoch": 0.73, - "learning_rate": 1.3632257591980943e-05, - "loss": 2.2683, - "step": 417090 - }, - { - "epoch": 0.73, - "learning_rate": 1.3631385652054115e-05, - "loss": 2.3061, - "step": 417100 - }, - { - "epoch": 0.73, - "learning_rate": 1.363051371212729e-05, - "loss": 2.3531, - "step": 417110 - }, - { - "epoch": 0.73, - "learning_rate": 1.3629641772200462e-05, - "loss": 2.2371, - "step": 417120 - }, - { - "epoch": 0.73, - "learning_rate": 1.3628769832273636e-05, - "loss": 2.2433, - "step": 417130 - }, - { - "epoch": 0.73, - "learning_rate": 1.3627897892346812e-05, - "loss": 2.3503, - "step": 417140 - }, - { - "epoch": 0.73, - "learning_rate": 1.3627025952419984e-05, - "loss": 2.3751, - "step": 417150 - }, - { - "epoch": 0.73, - "learning_rate": 1.3626154012493156e-05, - "loss": 2.4177, - "step": 417160 - }, - { - "epoch": 0.73, - "learning_rate": 1.3625282072566328e-05, - "loss": 2.2331, - "step": 417170 - }, - { - "epoch": 0.73, - "learning_rate": 1.3624410132639503e-05, - "loss": 2.3158, - "step": 417180 - }, - { - "epoch": 0.73, - "learning_rate": 1.3623538192712675e-05, - "loss": 2.2693, - "step": 417190 - }, - { - "epoch": 0.73, - "learning_rate": 1.362266625278585e-05, - "loss": 2.2509, - "step": 417200 - }, - { - "epoch": 0.73, - "learning_rate": 1.3621794312859021e-05, - "loss": 2.3535, - "step": 417210 - }, - { - "epoch": 0.73, - "learning_rate": 1.3620922372932197e-05, - "loss": 2.1126, - "step": 417220 - }, - { - "epoch": 0.73, - "learning_rate": 1.3620050433005369e-05, - "loss": 2.2329, - "step": 417230 - }, - { - "epoch": 0.73, - "learning_rate": 1.3619178493078541e-05, - "loss": 2.3545, - "step": 417240 - }, - { - "epoch": 0.73, - "learning_rate": 1.3618306553151713e-05, - "loss": 2.3174, - "step": 417250 - }, - { - "epoch": 0.73, - "learning_rate": 1.3617434613224888e-05, - "loss": 2.398, - "step": 417260 - }, - { - "epoch": 0.73, - "learning_rate": 1.361656267329806e-05, - "loss": 2.2931, - "step": 417270 - }, - { - "epoch": 0.73, - "learning_rate": 1.3615690733371234e-05, - "loss": 2.3376, - "step": 417280 - }, - { - "epoch": 0.73, - "learning_rate": 1.3614818793444408e-05, - "loss": 2.3066, - "step": 417290 - }, - { - "epoch": 0.73, - "learning_rate": 1.3613946853517582e-05, - "loss": 2.272, - "step": 417300 - }, - { - "epoch": 0.73, - "learning_rate": 1.3613074913590754e-05, - "loss": 2.2418, - "step": 417310 - }, - { - "epoch": 0.73, - "learning_rate": 1.3612202973663926e-05, - "loss": 2.2475, - "step": 417320 - }, - { - "epoch": 0.73, - "learning_rate": 1.3611331033737101e-05, - "loss": 2.3597, - "step": 417330 - }, - { - "epoch": 0.73, - "learning_rate": 1.3610459093810274e-05, - "loss": 2.3456, - "step": 417340 - }, - { - "epoch": 0.73, - "learning_rate": 1.3609587153883446e-05, - "loss": 2.3253, - "step": 417350 - }, - { - "epoch": 0.73, - "learning_rate": 1.360871521395662e-05, - "loss": 2.2684, - "step": 417360 - }, - { - "epoch": 0.73, - "learning_rate": 1.3607843274029793e-05, - "loss": 2.1416, - "step": 417370 - }, - { - "epoch": 0.73, - "learning_rate": 1.3606971334102967e-05, - "loss": 2.2806, - "step": 417380 - }, - { - "epoch": 0.73, - "learning_rate": 1.3606099394176139e-05, - "loss": 2.2749, - "step": 417390 - }, - { - "epoch": 0.73, - "learning_rate": 1.3605227454249311e-05, - "loss": 2.1783, - "step": 417400 - }, - { - "epoch": 0.73, - "learning_rate": 1.3604355514322487e-05, - "loss": 2.2531, - "step": 417410 - }, - { - "epoch": 0.73, - "learning_rate": 1.3603483574395659e-05, - "loss": 2.2885, - "step": 417420 - }, - { - "epoch": 0.73, - "learning_rate": 1.360261163446883e-05, - "loss": 2.35, - "step": 417430 - }, - { - "epoch": 0.73, - "learning_rate": 1.3601739694542006e-05, - "loss": 2.3246, - "step": 417440 - }, - { - "epoch": 0.73, - "learning_rate": 1.360086775461518e-05, - "loss": 2.2607, - "step": 417450 - }, - { - "epoch": 0.73, - "learning_rate": 1.3599995814688352e-05, - "loss": 2.2877, - "step": 417460 - }, - { - "epoch": 0.73, - "learning_rate": 1.3599123874761524e-05, - "loss": 2.3139, - "step": 417470 - }, - { - "epoch": 0.73, - "learning_rate": 1.35982519348347e-05, - "loss": 2.3194, - "step": 417480 - }, - { - "epoch": 0.73, - "learning_rate": 1.3597379994907872e-05, - "loss": 2.3143, - "step": 417490 - }, - { - "epoch": 0.73, - "learning_rate": 1.3596508054981044e-05, - "loss": 2.2805, - "step": 417500 - }, - { - "epoch": 0.73, - "learning_rate": 1.3595636115054217e-05, - "loss": 2.3386, - "step": 417510 - }, - { - "epoch": 0.73, - "learning_rate": 1.3594764175127391e-05, - "loss": 2.3469, - "step": 417520 - }, - { - "epoch": 0.73, - "learning_rate": 1.3593892235200565e-05, - "loss": 2.2471, - "step": 417530 - }, - { - "epoch": 0.73, - "learning_rate": 1.3593020295273737e-05, - "loss": 2.2355, - "step": 417540 - }, - { - "epoch": 0.73, - "learning_rate": 1.3592148355346913e-05, - "loss": 2.3021, - "step": 417550 - }, - { - "epoch": 0.73, - "learning_rate": 1.3591276415420085e-05, - "loss": 2.2892, - "step": 417560 - }, - { - "epoch": 0.73, - "learning_rate": 1.3590404475493257e-05, - "loss": 2.345, - "step": 417570 - }, - { - "epoch": 0.73, - "learning_rate": 1.3589532535566429e-05, - "loss": 2.3835, - "step": 417580 - }, - { - "epoch": 0.73, - "learning_rate": 1.3588660595639604e-05, - "loss": 2.2152, - "step": 417590 - }, - { - "epoch": 0.73, - "learning_rate": 1.3587788655712776e-05, - "loss": 2.3859, - "step": 417600 - }, - { - "epoch": 0.73, - "learning_rate": 1.358691671578595e-05, - "loss": 2.209, - "step": 417610 - }, - { - "epoch": 0.73, - "learning_rate": 1.3586044775859122e-05, - "loss": 2.3836, - "step": 417620 - }, - { - "epoch": 0.73, - "learning_rate": 1.3585172835932298e-05, - "loss": 2.1868, - "step": 417630 - }, - { - "epoch": 0.73, - "learning_rate": 1.358430089600547e-05, - "loss": 2.2373, - "step": 417640 - }, - { - "epoch": 0.73, - "learning_rate": 1.3583428956078642e-05, - "loss": 2.2997, - "step": 417650 - }, - { - "epoch": 0.73, - "learning_rate": 1.3582557016151814e-05, - "loss": 2.2485, - "step": 417660 - }, - { - "epoch": 0.73, - "learning_rate": 1.358168507622499e-05, - "loss": 2.3846, - "step": 417670 - }, - { - "epoch": 0.73, - "learning_rate": 1.3580813136298161e-05, - "loss": 2.2668, - "step": 417680 - }, - { - "epoch": 0.73, - "learning_rate": 1.3579941196371335e-05, - "loss": 2.2747, - "step": 417690 - }, - { - "epoch": 0.73, - "learning_rate": 1.357906925644451e-05, - "loss": 2.3108, - "step": 417700 - }, - { - "epoch": 0.73, - "learning_rate": 1.3578197316517683e-05, - "loss": 2.3239, - "step": 417710 - }, - { - "epoch": 0.73, - "learning_rate": 1.3577325376590855e-05, - "loss": 2.2243, - "step": 417720 - }, - { - "epoch": 0.73, - "learning_rate": 1.3576453436664027e-05, - "loss": 2.3318, - "step": 417730 - }, - { - "epoch": 0.73, - "learning_rate": 1.3575581496737202e-05, - "loss": 2.2744, - "step": 417740 - }, - { - "epoch": 0.73, - "learning_rate": 1.3574709556810374e-05, - "loss": 2.3492, - "step": 417750 - }, - { - "epoch": 0.73, - "learning_rate": 1.3573837616883548e-05, - "loss": 2.2395, - "step": 417760 - }, - { - "epoch": 0.73, - "learning_rate": 1.357296567695672e-05, - "loss": 2.2008, - "step": 417770 - }, - { - "epoch": 0.73, - "learning_rate": 1.3572093737029896e-05, - "loss": 2.318, - "step": 417780 - }, - { - "epoch": 0.73, - "learning_rate": 1.3571221797103068e-05, - "loss": 2.2754, - "step": 417790 - }, - { - "epoch": 0.73, - "learning_rate": 1.357034985717624e-05, - "loss": 2.2343, - "step": 417800 - }, - { - "epoch": 0.73, - "learning_rate": 1.3569477917249415e-05, - "loss": 2.4031, - "step": 417810 - }, - { - "epoch": 0.73, - "learning_rate": 1.3568605977322587e-05, - "loss": 2.2712, - "step": 417820 - }, - { - "epoch": 0.73, - "learning_rate": 1.356773403739576e-05, - "loss": 2.342, - "step": 417830 - }, - { - "epoch": 0.73, - "learning_rate": 1.3566862097468933e-05, - "loss": 2.1214, - "step": 417840 - }, - { - "epoch": 0.73, - "learning_rate": 1.3565990157542107e-05, - "loss": 2.42, - "step": 417850 - }, - { - "epoch": 0.73, - "learning_rate": 1.356511821761528e-05, - "loss": 2.3674, - "step": 417860 - }, - { - "epoch": 0.73, - "learning_rate": 1.3564246277688453e-05, - "loss": 2.3021, - "step": 417870 - }, - { - "epoch": 0.73, - "learning_rate": 1.3563374337761625e-05, - "loss": 2.2857, - "step": 417880 - }, - { - "epoch": 0.73, - "learning_rate": 1.35625023978348e-05, - "loss": 2.2938, - "step": 417890 - }, - { - "epoch": 0.73, - "learning_rate": 1.3561630457907972e-05, - "loss": 2.372, - "step": 417900 - }, - { - "epoch": 0.73, - "learning_rate": 1.3560758517981145e-05, - "loss": 2.3559, - "step": 417910 - }, - { - "epoch": 0.73, - "learning_rate": 1.3559886578054318e-05, - "loss": 2.2885, - "step": 417920 - }, - { - "epoch": 0.73, - "learning_rate": 1.3559014638127494e-05, - "loss": 2.3257, - "step": 417930 - }, - { - "epoch": 0.73, - "learning_rate": 1.3558142698200666e-05, - "loss": 2.4316, - "step": 417940 - }, - { - "epoch": 0.73, - "learning_rate": 1.3557270758273838e-05, - "loss": 2.2101, - "step": 417950 - }, - { - "epoch": 0.73, - "learning_rate": 1.3556398818347013e-05, - "loss": 2.267, - "step": 417960 - }, - { - "epoch": 0.73, - "learning_rate": 1.3555526878420185e-05, - "loss": 2.2868, - "step": 417970 - }, - { - "epoch": 0.73, - "learning_rate": 1.3554654938493358e-05, - "loss": 2.2608, - "step": 417980 - }, - { - "epoch": 0.73, - "learning_rate": 1.355378299856653e-05, - "loss": 2.3093, - "step": 417990 - }, - { - "epoch": 0.73, - "learning_rate": 1.3552911058639705e-05, - "loss": 2.385, - "step": 418000 - }, - { - "epoch": 0.73, - "learning_rate": 1.3552039118712879e-05, - "loss": 2.1781, - "step": 418010 - }, - { - "epoch": 0.73, - "learning_rate": 1.3551167178786051e-05, - "loss": 2.3077, - "step": 418020 - }, - { - "epoch": 0.73, - "learning_rate": 1.3550295238859223e-05, - "loss": 2.2559, - "step": 418030 - }, - { - "epoch": 0.73, - "learning_rate": 1.3549423298932398e-05, - "loss": 2.2391, - "step": 418040 - }, - { - "epoch": 0.73, - "learning_rate": 1.354855135900557e-05, - "loss": 2.3124, - "step": 418050 - }, - { - "epoch": 0.73, - "learning_rate": 1.3547679419078743e-05, - "loss": 2.2327, - "step": 418060 - }, - { - "epoch": 0.73, - "learning_rate": 1.3546807479151916e-05, - "loss": 2.2829, - "step": 418070 - }, - { - "epoch": 0.73, - "learning_rate": 1.354593553922509e-05, - "loss": 2.304, - "step": 418080 - }, - { - "epoch": 0.73, - "learning_rate": 1.3545063599298264e-05, - "loss": 2.1539, - "step": 418090 - }, - { - "epoch": 0.73, - "learning_rate": 1.3544191659371436e-05, - "loss": 2.3014, - "step": 418100 - }, - { - "epoch": 0.73, - "learning_rate": 1.3543319719444611e-05, - "loss": 2.2661, - "step": 418110 - }, - { - "epoch": 0.73, - "learning_rate": 1.3542447779517784e-05, - "loss": 2.3855, - "step": 418120 - }, - { - "epoch": 0.73, - "learning_rate": 1.3541575839590956e-05, - "loss": 2.1942, - "step": 418130 - }, - { - "epoch": 0.73, - "learning_rate": 1.3540703899664128e-05, - "loss": 2.2382, - "step": 418140 - }, - { - "epoch": 0.73, - "learning_rate": 1.3539831959737303e-05, - "loss": 2.3085, - "step": 418150 - }, - { - "epoch": 0.73, - "learning_rate": 1.3538960019810475e-05, - "loss": 2.2115, - "step": 418160 - }, - { - "epoch": 0.73, - "learning_rate": 1.3538088079883649e-05, - "loss": 2.25, - "step": 418170 - }, - { - "epoch": 0.73, - "learning_rate": 1.3537216139956821e-05, - "loss": 2.3442, - "step": 418180 - }, - { - "epoch": 0.73, - "learning_rate": 1.3536344200029997e-05, - "loss": 2.3919, - "step": 418190 - }, - { - "epoch": 0.73, - "learning_rate": 1.3535472260103169e-05, - "loss": 2.286, - "step": 418200 - }, - { - "epoch": 0.73, - "learning_rate": 1.353460032017634e-05, - "loss": 2.2831, - "step": 418210 - }, - { - "epoch": 0.73, - "learning_rate": 1.3533728380249516e-05, - "loss": 2.3463, - "step": 418220 - }, - { - "epoch": 0.73, - "learning_rate": 1.3532856440322688e-05, - "loss": 2.2816, - "step": 418230 - }, - { - "epoch": 0.73, - "learning_rate": 1.3531984500395862e-05, - "loss": 2.3523, - "step": 418240 - }, - { - "epoch": 0.73, - "learning_rate": 1.3531112560469034e-05, - "loss": 2.3225, - "step": 418250 - }, - { - "epoch": 0.73, - "learning_rate": 1.353024062054221e-05, - "loss": 2.3031, - "step": 418260 - }, - { - "epoch": 0.73, - "learning_rate": 1.3529368680615382e-05, - "loss": 2.3694, - "step": 418270 - }, - { - "epoch": 0.73, - "learning_rate": 1.3528496740688554e-05, - "loss": 2.2337, - "step": 418280 - }, - { - "epoch": 0.73, - "learning_rate": 1.3527624800761726e-05, - "loss": 2.3211, - "step": 418290 - }, - { - "epoch": 0.73, - "learning_rate": 1.3526752860834901e-05, - "loss": 2.2969, - "step": 418300 - }, - { - "epoch": 0.73, - "learning_rate": 1.3525880920908073e-05, - "loss": 2.2001, - "step": 418310 - }, - { - "epoch": 0.73, - "learning_rate": 1.3525008980981247e-05, - "loss": 2.3489, - "step": 418320 - }, - { - "epoch": 0.73, - "learning_rate": 1.352413704105442e-05, - "loss": 2.2031, - "step": 418330 - }, - { - "epoch": 0.73, - "learning_rate": 1.3523265101127595e-05, - "loss": 2.2642, - "step": 418340 - }, - { - "epoch": 0.73, - "learning_rate": 1.3522393161200767e-05, - "loss": 2.3519, - "step": 418350 - }, - { - "epoch": 0.73, - "learning_rate": 1.3521521221273939e-05, - "loss": 2.3785, - "step": 418360 - }, - { - "epoch": 0.73, - "learning_rate": 1.3520649281347114e-05, - "loss": 2.2885, - "step": 418370 - }, - { - "epoch": 0.73, - "learning_rate": 1.3519777341420286e-05, - "loss": 2.3186, - "step": 418380 - }, - { - "epoch": 0.73, - "learning_rate": 1.3518905401493458e-05, - "loss": 2.317, - "step": 418390 - }, - { - "epoch": 0.73, - "learning_rate": 1.3518033461566632e-05, - "loss": 2.3424, - "step": 418400 - }, - { - "epoch": 0.73, - "learning_rate": 1.3517161521639806e-05, - "loss": 2.2718, - "step": 418410 - }, - { - "epoch": 0.73, - "learning_rate": 1.351628958171298e-05, - "loss": 2.3517, - "step": 418420 - }, - { - "epoch": 0.73, - "learning_rate": 1.3515417641786152e-05, - "loss": 2.3412, - "step": 418430 - }, - { - "epoch": 0.73, - "learning_rate": 1.3514545701859324e-05, - "loss": 2.2488, - "step": 418440 - }, - { - "epoch": 0.73, - "learning_rate": 1.35136737619325e-05, - "loss": 2.2626, - "step": 418450 - }, - { - "epoch": 0.73, - "learning_rate": 1.3512801822005671e-05, - "loss": 2.3271, - "step": 418460 - }, - { - "epoch": 0.73, - "learning_rate": 1.3511929882078843e-05, - "loss": 2.3205, - "step": 418470 - }, - { - "epoch": 0.73, - "learning_rate": 1.3511057942152019e-05, - "loss": 2.2643, - "step": 418480 - }, - { - "epoch": 0.73, - "learning_rate": 1.3510186002225193e-05, - "loss": 2.4347, - "step": 418490 - }, - { - "epoch": 0.73, - "learning_rate": 1.3509314062298365e-05, - "loss": 2.3743, - "step": 418500 - }, - { - "epoch": 0.73, - "learning_rate": 1.3508442122371537e-05, - "loss": 2.3112, - "step": 418510 - }, - { - "epoch": 0.73, - "learning_rate": 1.3507570182444712e-05, - "loss": 2.3003, - "step": 418520 - }, - { - "epoch": 0.73, - "learning_rate": 1.3506698242517884e-05, - "loss": 2.2942, - "step": 418530 - }, - { - "epoch": 0.73, - "learning_rate": 1.3505826302591056e-05, - "loss": 2.1884, - "step": 418540 - }, - { - "epoch": 0.73, - "learning_rate": 1.350495436266423e-05, - "loss": 2.3018, - "step": 418550 - }, - { - "epoch": 0.73, - "learning_rate": 1.3504082422737404e-05, - "loss": 2.3428, - "step": 418560 - }, - { - "epoch": 0.73, - "learning_rate": 1.3503210482810578e-05, - "loss": 2.2792, - "step": 418570 - }, - { - "epoch": 0.73, - "learning_rate": 1.350233854288375e-05, - "loss": 2.2512, - "step": 418580 - }, - { - "epoch": 0.73, - "learning_rate": 1.3501466602956922e-05, - "loss": 2.3593, - "step": 418590 - }, - { - "epoch": 0.73, - "learning_rate": 1.3500594663030097e-05, - "loss": 2.3193, - "step": 418600 - }, - { - "epoch": 0.73, - "learning_rate": 1.349972272310327e-05, - "loss": 2.2961, - "step": 418610 - }, - { - "epoch": 0.73, - "learning_rate": 1.3498850783176442e-05, - "loss": 2.3159, - "step": 418620 - }, - { - "epoch": 0.73, - "learning_rate": 1.3497978843249617e-05, - "loss": 2.301, - "step": 418630 - }, - { - "epoch": 0.73, - "learning_rate": 1.3497106903322789e-05, - "loss": 2.2751, - "step": 418640 - }, - { - "epoch": 0.73, - "learning_rate": 1.3496234963395963e-05, - "loss": 2.3962, - "step": 418650 - }, - { - "epoch": 0.73, - "learning_rate": 1.3495363023469135e-05, - "loss": 2.1987, - "step": 418660 - }, - { - "epoch": 0.73, - "learning_rate": 1.349449108354231e-05, - "loss": 2.3869, - "step": 418670 - }, - { - "epoch": 0.73, - "learning_rate": 1.3493619143615482e-05, - "loss": 2.5269, - "step": 418680 - }, - { - "epoch": 0.73, - "learning_rate": 1.3492747203688655e-05, - "loss": 2.2525, - "step": 418690 - }, - { - "epoch": 0.73, - "learning_rate": 1.3491875263761827e-05, - "loss": 2.3175, - "step": 418700 - }, - { - "epoch": 0.73, - "learning_rate": 1.3491003323835002e-05, - "loss": 2.2034, - "step": 418710 - }, - { - "epoch": 0.73, - "learning_rate": 1.3490131383908174e-05, - "loss": 2.2852, - "step": 418720 - }, - { - "epoch": 0.73, - "learning_rate": 1.3489259443981348e-05, - "loss": 2.3553, - "step": 418730 - }, - { - "epoch": 0.73, - "learning_rate": 1.3488387504054523e-05, - "loss": 2.2309, - "step": 418740 - }, - { - "epoch": 0.73, - "learning_rate": 1.3487515564127695e-05, - "loss": 2.3706, - "step": 418750 - }, - { - "epoch": 0.73, - "learning_rate": 1.3486643624200868e-05, - "loss": 2.238, - "step": 418760 - }, - { - "epoch": 0.73, - "learning_rate": 1.348577168427404e-05, - "loss": 2.298, - "step": 418770 - }, - { - "epoch": 0.73, - "learning_rate": 1.3484899744347215e-05, - "loss": 2.1199, - "step": 418780 - }, - { - "epoch": 0.73, - "learning_rate": 1.3484027804420387e-05, - "loss": 2.2998, - "step": 418790 - }, - { - "epoch": 0.73, - "learning_rate": 1.3483155864493561e-05, - "loss": 2.3394, - "step": 418800 - }, - { - "epoch": 0.73, - "learning_rate": 1.3482283924566733e-05, - "loss": 2.1951, - "step": 418810 - }, - { - "epoch": 0.73, - "learning_rate": 1.3481411984639908e-05, - "loss": 2.277, - "step": 418820 - }, - { - "epoch": 0.73, - "learning_rate": 1.348054004471308e-05, - "loss": 2.3071, - "step": 418830 - }, - { - "epoch": 0.73, - "learning_rate": 1.3479668104786253e-05, - "loss": 2.3567, - "step": 418840 - }, - { - "epoch": 0.73, - "learning_rate": 1.3478796164859425e-05, - "loss": 2.3295, - "step": 418850 - }, - { - "epoch": 0.73, - "learning_rate": 1.34779242249326e-05, - "loss": 2.3164, - "step": 418860 - }, - { - "epoch": 0.73, - "learning_rate": 1.3477052285005772e-05, - "loss": 2.314, - "step": 418870 - }, - { - "epoch": 0.73, - "learning_rate": 1.3476180345078946e-05, - "loss": 2.3359, - "step": 418880 - }, - { - "epoch": 0.73, - "learning_rate": 1.347530840515212e-05, - "loss": 2.2242, - "step": 418890 - }, - { - "epoch": 0.73, - "learning_rate": 1.3474436465225294e-05, - "loss": 2.4067, - "step": 418900 - }, - { - "epoch": 0.73, - "learning_rate": 1.3473564525298466e-05, - "loss": 2.2243, - "step": 418910 - }, - { - "epoch": 0.73, - "learning_rate": 1.3472692585371638e-05, - "loss": 2.3696, - "step": 418920 - }, - { - "epoch": 0.73, - "learning_rate": 1.3471820645444813e-05, - "loss": 2.2341, - "step": 418930 - }, - { - "epoch": 0.73, - "learning_rate": 1.3470948705517985e-05, - "loss": 2.2334, - "step": 418940 - }, - { - "epoch": 0.73, - "learning_rate": 1.3470076765591157e-05, - "loss": 2.3161, - "step": 418950 - }, - { - "epoch": 0.73, - "learning_rate": 1.3469204825664331e-05, - "loss": 2.2967, - "step": 418960 - }, - { - "epoch": 0.73, - "learning_rate": 1.3468332885737507e-05, - "loss": 2.2895, - "step": 418970 - }, - { - "epoch": 0.73, - "learning_rate": 1.3467460945810679e-05, - "loss": 2.2899, - "step": 418980 - }, - { - "epoch": 0.73, - "learning_rate": 1.346658900588385e-05, - "loss": 2.4693, - "step": 418990 - }, - { - "epoch": 0.73, - "learning_rate": 1.3465717065957023e-05, - "loss": 2.2732, - "step": 419000 - }, - { - "epoch": 0.73, - "learning_rate": 1.3464845126030198e-05, - "loss": 2.3354, - "step": 419010 - }, - { - "epoch": 0.73, - "learning_rate": 1.346397318610337e-05, - "loss": 2.2988, - "step": 419020 - }, - { - "epoch": 0.73, - "learning_rate": 1.3463101246176542e-05, - "loss": 2.2794, - "step": 419030 - }, - { - "epoch": 0.73, - "learning_rate": 1.3462229306249718e-05, - "loss": 2.2539, - "step": 419040 - }, - { - "epoch": 0.73, - "learning_rate": 1.3461357366322892e-05, - "loss": 2.2423, - "step": 419050 - }, - { - "epoch": 0.73, - "learning_rate": 1.3460485426396064e-05, - "loss": 2.4104, - "step": 419060 - }, - { - "epoch": 0.73, - "learning_rate": 1.3459613486469236e-05, - "loss": 2.4023, - "step": 419070 - }, - { - "epoch": 0.73, - "learning_rate": 1.3458741546542411e-05, - "loss": 2.2893, - "step": 419080 - }, - { - "epoch": 0.73, - "learning_rate": 1.3457869606615583e-05, - "loss": 2.2153, - "step": 419090 - }, - { - "epoch": 0.73, - "learning_rate": 1.3456997666688755e-05, - "loss": 2.3248, - "step": 419100 - }, - { - "epoch": 0.73, - "learning_rate": 1.345612572676193e-05, - "loss": 2.2657, - "step": 419110 - }, - { - "epoch": 0.73, - "learning_rate": 1.3455253786835103e-05, - "loss": 2.3943, - "step": 419120 - }, - { - "epoch": 0.73, - "learning_rate": 1.3454381846908277e-05, - "loss": 2.2825, - "step": 419130 - }, - { - "epoch": 0.73, - "learning_rate": 1.3453509906981449e-05, - "loss": 2.2875, - "step": 419140 - }, - { - "epoch": 0.73, - "learning_rate": 1.3452637967054624e-05, - "loss": 2.2919, - "step": 419150 - }, - { - "epoch": 0.73, - "learning_rate": 1.3451766027127796e-05, - "loss": 2.3901, - "step": 419160 - }, - { - "epoch": 0.73, - "learning_rate": 1.3450894087200968e-05, - "loss": 2.4297, - "step": 419170 - }, - { - "epoch": 0.73, - "learning_rate": 1.345002214727414e-05, - "loss": 2.3257, - "step": 419180 - }, - { - "epoch": 0.73, - "learning_rate": 1.3449150207347316e-05, - "loss": 2.2771, - "step": 419190 - }, - { - "epoch": 0.73, - "learning_rate": 1.3448278267420488e-05, - "loss": 2.2397, - "step": 419200 - }, - { - "epoch": 0.73, - "learning_rate": 1.3447406327493662e-05, - "loss": 2.318, - "step": 419210 - }, - { - "epoch": 0.73, - "learning_rate": 1.3446534387566834e-05, - "loss": 2.3274, - "step": 419220 - }, - { - "epoch": 0.73, - "learning_rate": 1.344566244764001e-05, - "loss": 2.3646, - "step": 419230 - }, - { - "epoch": 0.73, - "learning_rate": 1.3444790507713181e-05, - "loss": 2.2777, - "step": 419240 - }, - { - "epoch": 0.73, - "learning_rate": 1.3443918567786353e-05, - "loss": 2.216, - "step": 419250 - }, - { - "epoch": 0.73, - "learning_rate": 1.3443046627859526e-05, - "loss": 2.2637, - "step": 419260 - }, - { - "epoch": 0.73, - "learning_rate": 1.3442174687932701e-05, - "loss": 2.312, - "step": 419270 - }, - { - "epoch": 0.73, - "learning_rate": 1.3441302748005875e-05, - "loss": 2.2541, - "step": 419280 - }, - { - "epoch": 0.73, - "learning_rate": 1.3440430808079047e-05, - "loss": 2.2653, - "step": 419290 - }, - { - "epoch": 0.73, - "learning_rate": 1.3439558868152222e-05, - "loss": 2.3765, - "step": 419300 - }, - { - "epoch": 0.73, - "learning_rate": 1.3438686928225394e-05, - "loss": 2.3301, - "step": 419310 - }, - { - "epoch": 0.73, - "learning_rate": 1.3437814988298566e-05, - "loss": 2.3232, - "step": 419320 - }, - { - "epoch": 0.73, - "learning_rate": 1.3436943048371739e-05, - "loss": 2.2866, - "step": 419330 - }, - { - "epoch": 0.73, - "learning_rate": 1.3436071108444914e-05, - "loss": 2.2342, - "step": 419340 - }, - { - "epoch": 0.73, - "learning_rate": 1.3435199168518086e-05, - "loss": 2.2373, - "step": 419350 - }, - { - "epoch": 0.73, - "learning_rate": 1.343432722859126e-05, - "loss": 2.1894, - "step": 419360 - }, - { - "epoch": 0.73, - "learning_rate": 1.3433455288664432e-05, - "loss": 2.304, - "step": 419370 - }, - { - "epoch": 0.73, - "learning_rate": 1.3432583348737607e-05, - "loss": 2.2607, - "step": 419380 - }, - { - "epoch": 0.73, - "learning_rate": 1.343171140881078e-05, - "loss": 2.4156, - "step": 419390 - }, - { - "epoch": 0.73, - "learning_rate": 1.3430839468883952e-05, - "loss": 2.3406, - "step": 419400 - }, - { - "epoch": 0.73, - "learning_rate": 1.3429967528957127e-05, - "loss": 2.1864, - "step": 419410 - }, - { - "epoch": 0.73, - "learning_rate": 1.3429095589030299e-05, - "loss": 2.32, - "step": 419420 - }, - { - "epoch": 0.73, - "learning_rate": 1.3428223649103471e-05, - "loss": 2.3745, - "step": 419430 - }, - { - "epoch": 0.73, - "learning_rate": 1.3427351709176645e-05, - "loss": 2.4009, - "step": 419440 - }, - { - "epoch": 0.73, - "learning_rate": 1.3426479769249819e-05, - "loss": 2.3478, - "step": 419450 - }, - { - "epoch": 0.73, - "learning_rate": 1.3425607829322992e-05, - "loss": 2.4416, - "step": 419460 - }, - { - "epoch": 0.73, - "learning_rate": 1.3424735889396165e-05, - "loss": 2.2345, - "step": 419470 - }, - { - "epoch": 0.73, - "learning_rate": 1.3423863949469337e-05, - "loss": 2.2333, - "step": 419480 - }, - { - "epoch": 0.73, - "learning_rate": 1.3422992009542512e-05, - "loss": 2.2059, - "step": 419490 - }, - { - "epoch": 0.73, - "learning_rate": 1.3422120069615684e-05, - "loss": 2.3351, - "step": 419500 - }, - { - "epoch": 0.73, - "learning_rate": 1.3421248129688856e-05, - "loss": 2.3632, - "step": 419510 - }, - { - "epoch": 0.73, - "learning_rate": 1.342037618976203e-05, - "loss": 2.4774, - "step": 419520 - }, - { - "epoch": 0.73, - "learning_rate": 1.3419504249835205e-05, - "loss": 2.3384, - "step": 419530 - }, - { - "epoch": 0.73, - "learning_rate": 1.3418632309908378e-05, - "loss": 2.3412, - "step": 419540 - }, - { - "epoch": 0.73, - "learning_rate": 1.341776036998155e-05, - "loss": 2.3627, - "step": 419550 - }, - { - "epoch": 0.73, - "learning_rate": 1.3416888430054725e-05, - "loss": 2.2951, - "step": 419560 - }, - { - "epoch": 0.73, - "learning_rate": 1.3416016490127897e-05, - "loss": 2.3522, - "step": 419570 - }, - { - "epoch": 0.73, - "learning_rate": 1.341514455020107e-05, - "loss": 2.318, - "step": 419580 - }, - { - "epoch": 0.73, - "learning_rate": 1.3414272610274243e-05, - "loss": 2.341, - "step": 419590 - }, - { - "epoch": 0.73, - "learning_rate": 1.3413400670347417e-05, - "loss": 2.3369, - "step": 419600 - }, - { - "epoch": 0.73, - "learning_rate": 1.341252873042059e-05, - "loss": 2.3403, - "step": 419610 - }, - { - "epoch": 0.73, - "learning_rate": 1.3411656790493763e-05, - "loss": 2.2692, - "step": 419620 - }, - { - "epoch": 0.73, - "learning_rate": 1.3410784850566935e-05, - "loss": 2.3267, - "step": 419630 - }, - { - "epoch": 0.73, - "learning_rate": 1.340991291064011e-05, - "loss": 2.3309, - "step": 419640 - }, - { - "epoch": 0.73, - "learning_rate": 1.3409040970713282e-05, - "loss": 2.2546, - "step": 419650 - }, - { - "epoch": 0.73, - "learning_rate": 1.3408169030786454e-05, - "loss": 2.4044, - "step": 419660 - }, - { - "epoch": 0.73, - "learning_rate": 1.340729709085963e-05, - "loss": 2.3011, - "step": 419670 - }, - { - "epoch": 0.73, - "learning_rate": 1.3406425150932802e-05, - "loss": 2.2142, - "step": 419680 - }, - { - "epoch": 0.73, - "learning_rate": 1.3405553211005976e-05, - "loss": 2.3042, - "step": 419690 - }, - { - "epoch": 0.73, - "learning_rate": 1.3404681271079148e-05, - "loss": 2.2825, - "step": 419700 - }, - { - "epoch": 0.73, - "learning_rate": 1.3403809331152323e-05, - "loss": 2.2919, - "step": 419710 - }, - { - "epoch": 0.73, - "learning_rate": 1.3402937391225495e-05, - "loss": 2.2368, - "step": 419720 - }, - { - "epoch": 0.73, - "learning_rate": 1.3402065451298667e-05, - "loss": 2.2282, - "step": 419730 - }, - { - "epoch": 0.73, - "learning_rate": 1.340119351137184e-05, - "loss": 2.1846, - "step": 419740 - }, - { - "epoch": 0.73, - "learning_rate": 1.3400321571445015e-05, - "loss": 2.3716, - "step": 419750 - }, - { - "epoch": 0.73, - "learning_rate": 1.3399449631518187e-05, - "loss": 2.419, - "step": 419760 - }, - { - "epoch": 0.73, - "learning_rate": 1.339857769159136e-05, - "loss": 2.327, - "step": 419770 - }, - { - "epoch": 0.73, - "learning_rate": 1.3397705751664533e-05, - "loss": 2.257, - "step": 419780 - }, - { - "epoch": 0.73, - "learning_rate": 1.3396833811737708e-05, - "loss": 2.3252, - "step": 419790 - }, - { - "epoch": 0.73, - "learning_rate": 1.339596187181088e-05, - "loss": 2.3032, - "step": 419800 - }, - { - "epoch": 0.73, - "learning_rate": 1.3395089931884052e-05, - "loss": 2.3351, - "step": 419810 - }, - { - "epoch": 0.73, - "learning_rate": 1.3394217991957228e-05, - "loss": 2.2626, - "step": 419820 - }, - { - "epoch": 0.73, - "learning_rate": 1.33933460520304e-05, - "loss": 2.3233, - "step": 419830 - }, - { - "epoch": 0.73, - "learning_rate": 1.3392474112103574e-05, - "loss": 2.3005, - "step": 419840 - }, - { - "epoch": 0.73, - "learning_rate": 1.3391602172176746e-05, - "loss": 2.2732, - "step": 419850 - }, - { - "epoch": 0.73, - "learning_rate": 1.3390730232249921e-05, - "loss": 2.3799, - "step": 419860 - }, - { - "epoch": 0.73, - "learning_rate": 1.3389858292323093e-05, - "loss": 2.302, - "step": 419870 - }, - { - "epoch": 0.73, - "learning_rate": 1.3388986352396265e-05, - "loss": 2.2836, - "step": 419880 - }, - { - "epoch": 0.73, - "learning_rate": 1.3388114412469437e-05, - "loss": 2.3709, - "step": 419890 - }, - { - "epoch": 0.73, - "learning_rate": 1.3387242472542613e-05, - "loss": 2.2988, - "step": 419900 - }, - { - "epoch": 0.73, - "learning_rate": 1.3386370532615785e-05, - "loss": 2.3428, - "step": 419910 - }, - { - "epoch": 0.73, - "learning_rate": 1.3385498592688959e-05, - "loss": 2.2796, - "step": 419920 - }, - { - "epoch": 0.73, - "learning_rate": 1.3384626652762131e-05, - "loss": 2.2488, - "step": 419930 - }, - { - "epoch": 0.73, - "learning_rate": 1.3383754712835306e-05, - "loss": 2.369, - "step": 419940 - }, - { - "epoch": 0.73, - "learning_rate": 1.3382882772908478e-05, - "loss": 2.3355, - "step": 419950 - }, - { - "epoch": 0.73, - "learning_rate": 1.338201083298165e-05, - "loss": 2.3078, - "step": 419960 - }, - { - "epoch": 0.73, - "learning_rate": 1.3381138893054826e-05, - "loss": 2.3567, - "step": 419970 - }, - { - "epoch": 0.73, - "learning_rate": 1.3380266953127998e-05, - "loss": 2.3313, - "step": 419980 - }, - { - "epoch": 0.73, - "learning_rate": 1.337939501320117e-05, - "loss": 2.2741, - "step": 419990 - }, - { - "epoch": 0.73, - "learning_rate": 1.3378523073274344e-05, - "loss": 2.1983, - "step": 420000 - }, - { - "epoch": 0.73, - "learning_rate": 1.337765113334752e-05, - "loss": 2.3719, - "step": 420010 - }, - { - "epoch": 0.73, - "learning_rate": 1.3376779193420691e-05, - "loss": 2.2092, - "step": 420020 - }, - { - "epoch": 0.73, - "learning_rate": 1.3375907253493863e-05, - "loss": 2.3106, - "step": 420030 - }, - { - "epoch": 0.73, - "learning_rate": 1.3375035313567036e-05, - "loss": 2.209, - "step": 420040 - }, - { - "epoch": 0.73, - "learning_rate": 1.3374163373640211e-05, - "loss": 2.2517, - "step": 420050 - }, - { - "epoch": 0.73, - "learning_rate": 1.3373291433713383e-05, - "loss": 2.3326, - "step": 420060 - }, - { - "epoch": 0.73, - "learning_rate": 1.3372419493786555e-05, - "loss": 2.3495, - "step": 420070 - }, - { - "epoch": 0.73, - "learning_rate": 1.337154755385973e-05, - "loss": 2.3323, - "step": 420080 - }, - { - "epoch": 0.73, - "learning_rate": 1.3370675613932904e-05, - "loss": 2.3206, - "step": 420090 - }, - { - "epoch": 0.73, - "learning_rate": 1.3369803674006076e-05, - "loss": 2.3255, - "step": 420100 - }, - { - "epoch": 0.73, - "learning_rate": 1.3368931734079249e-05, - "loss": 2.3134, - "step": 420110 - }, - { - "epoch": 0.73, - "learning_rate": 1.3368059794152424e-05, - "loss": 2.2942, - "step": 420120 - }, - { - "epoch": 0.73, - "learning_rate": 1.3367187854225596e-05, - "loss": 2.2401, - "step": 420130 - }, - { - "epoch": 0.73, - "learning_rate": 1.3366315914298768e-05, - "loss": 2.1778, - "step": 420140 - }, - { - "epoch": 0.73, - "learning_rate": 1.3365443974371942e-05, - "loss": 2.3361, - "step": 420150 - }, - { - "epoch": 0.73, - "learning_rate": 1.3364572034445116e-05, - "loss": 2.2803, - "step": 420160 - }, - { - "epoch": 0.73, - "learning_rate": 1.336370009451829e-05, - "loss": 2.3977, - "step": 420170 - }, - { - "epoch": 0.73, - "learning_rate": 1.3362828154591462e-05, - "loss": 2.3316, - "step": 420180 - }, - { - "epoch": 0.73, - "learning_rate": 1.3361956214664634e-05, - "loss": 2.269, - "step": 420190 - }, - { - "epoch": 0.73, - "learning_rate": 1.3361084274737809e-05, - "loss": 2.258, - "step": 420200 - }, - { - "epoch": 0.73, - "learning_rate": 1.3360212334810981e-05, - "loss": 2.2815, - "step": 420210 - }, - { - "epoch": 0.73, - "learning_rate": 1.3359340394884153e-05, - "loss": 2.2818, - "step": 420220 - }, - { - "epoch": 0.73, - "learning_rate": 1.3358468454957329e-05, - "loss": 2.354, - "step": 420230 - }, - { - "epoch": 0.73, - "learning_rate": 1.33575965150305e-05, - "loss": 2.3283, - "step": 420240 - }, - { - "epoch": 0.73, - "learning_rate": 1.3356724575103675e-05, - "loss": 2.334, - "step": 420250 - }, - { - "epoch": 0.73, - "learning_rate": 1.3355852635176847e-05, - "loss": 2.2664, - "step": 420260 - }, - { - "epoch": 0.73, - "learning_rate": 1.3354980695250022e-05, - "loss": 2.3265, - "step": 420270 - }, - { - "epoch": 0.73, - "learning_rate": 1.3354108755323194e-05, - "loss": 2.292, - "step": 420280 - }, - { - "epoch": 0.73, - "learning_rate": 1.3353236815396366e-05, - "loss": 2.2486, - "step": 420290 - }, - { - "epoch": 0.73, - "learning_rate": 1.3352364875469538e-05, - "loss": 2.2262, - "step": 420300 - }, - { - "epoch": 0.73, - "learning_rate": 1.3351492935542714e-05, - "loss": 2.2857, - "step": 420310 - }, - { - "epoch": 0.73, - "learning_rate": 1.3350620995615888e-05, - "loss": 2.2857, - "step": 420320 - }, - { - "epoch": 0.73, - "learning_rate": 1.334974905568906e-05, - "loss": 2.2519, - "step": 420330 - }, - { - "epoch": 0.73, - "learning_rate": 1.3348877115762235e-05, - "loss": 2.3539, - "step": 420340 - }, - { - "epoch": 0.73, - "learning_rate": 1.3348005175835407e-05, - "loss": 2.3118, - "step": 420350 - }, - { - "epoch": 0.73, - "learning_rate": 1.334713323590858e-05, - "loss": 2.3123, - "step": 420360 - }, - { - "epoch": 0.73, - "learning_rate": 1.3346261295981751e-05, - "loss": 2.294, - "step": 420370 - }, - { - "epoch": 0.73, - "learning_rate": 1.3345389356054927e-05, - "loss": 2.3204, - "step": 420380 - }, - { - "epoch": 0.73, - "learning_rate": 1.3344517416128099e-05, - "loss": 2.3168, - "step": 420390 - }, - { - "epoch": 0.73, - "learning_rate": 1.3343645476201273e-05, - "loss": 2.3578, - "step": 420400 - }, - { - "epoch": 0.73, - "learning_rate": 1.3342773536274445e-05, - "loss": 2.2471, - "step": 420410 - }, - { - "epoch": 0.73, - "learning_rate": 1.334190159634762e-05, - "loss": 2.2203, - "step": 420420 - }, - { - "epoch": 0.73, - "learning_rate": 1.3341029656420792e-05, - "loss": 2.3289, - "step": 420430 - }, - { - "epoch": 0.73, - "learning_rate": 1.3340157716493964e-05, - "loss": 2.408, - "step": 420440 - }, - { - "epoch": 0.73, - "learning_rate": 1.3339285776567136e-05, - "loss": 2.2996, - "step": 420450 - }, - { - "epoch": 0.73, - "learning_rate": 1.3338413836640312e-05, - "loss": 2.19, - "step": 420460 - }, - { - "epoch": 0.73, - "learning_rate": 1.3337541896713484e-05, - "loss": 2.2586, - "step": 420470 - }, - { - "epoch": 0.73, - "learning_rate": 1.3336669956786658e-05, - "loss": 2.2825, - "step": 420480 - }, - { - "epoch": 0.73, - "learning_rate": 1.3335798016859831e-05, - "loss": 2.2668, - "step": 420490 - }, - { - "epoch": 0.73, - "learning_rate": 1.3334926076933005e-05, - "loss": 2.1933, - "step": 420500 - }, - { - "epoch": 0.73, - "learning_rate": 1.3334054137006177e-05, - "loss": 2.2524, - "step": 420510 - }, - { - "epoch": 0.73, - "learning_rate": 1.333318219707935e-05, - "loss": 2.3034, - "step": 420520 - }, - { - "epoch": 0.73, - "learning_rate": 1.3332310257152525e-05, - "loss": 2.3051, - "step": 420530 - }, - { - "epoch": 0.73, - "learning_rate": 1.3331438317225697e-05, - "loss": 2.3938, - "step": 420540 - }, - { - "epoch": 0.73, - "learning_rate": 1.3330566377298869e-05, - "loss": 2.3587, - "step": 420550 - }, - { - "epoch": 0.73, - "learning_rate": 1.3329694437372043e-05, - "loss": 2.2774, - "step": 420560 - }, - { - "epoch": 0.73, - "learning_rate": 1.3328822497445218e-05, - "loss": 2.3643, - "step": 420570 - }, - { - "epoch": 0.73, - "learning_rate": 1.332795055751839e-05, - "loss": 2.4041, - "step": 420580 - }, - { - "epoch": 0.73, - "learning_rate": 1.3327078617591562e-05, - "loss": 2.2453, - "step": 420590 - }, - { - "epoch": 0.73, - "learning_rate": 1.3326206677664738e-05, - "loss": 2.3723, - "step": 420600 - }, - { - "epoch": 0.73, - "learning_rate": 1.332533473773791e-05, - "loss": 2.2709, - "step": 420610 - }, - { - "epoch": 0.73, - "learning_rate": 1.3324462797811082e-05, - "loss": 2.2045, - "step": 420620 - }, - { - "epoch": 0.73, - "learning_rate": 1.3323590857884256e-05, - "loss": 2.3138, - "step": 420630 - }, - { - "epoch": 0.73, - "learning_rate": 1.332271891795743e-05, - "loss": 2.2719, - "step": 420640 - }, - { - "epoch": 0.73, - "learning_rate": 1.3321846978030603e-05, - "loss": 2.2564, - "step": 420650 - }, - { - "epoch": 0.73, - "learning_rate": 1.3320975038103775e-05, - "loss": 2.2643, - "step": 420660 - }, - { - "epoch": 0.73, - "learning_rate": 1.3320103098176947e-05, - "loss": 2.3099, - "step": 420670 - }, - { - "epoch": 0.73, - "learning_rate": 1.3319231158250123e-05, - "loss": 2.3017, - "step": 420680 - }, - { - "epoch": 0.73, - "learning_rate": 1.3318359218323295e-05, - "loss": 2.2662, - "step": 420690 - }, - { - "epoch": 0.73, - "learning_rate": 1.3317487278396467e-05, - "loss": 2.3207, - "step": 420700 - }, - { - "epoch": 0.73, - "learning_rate": 1.3316615338469641e-05, - "loss": 2.3639, - "step": 420710 - }, - { - "epoch": 0.73, - "learning_rate": 1.3315743398542815e-05, - "loss": 2.274, - "step": 420720 - }, - { - "epoch": 0.73, - "learning_rate": 1.3314871458615988e-05, - "loss": 2.3666, - "step": 420730 - }, - { - "epoch": 0.73, - "learning_rate": 1.331399951868916e-05, - "loss": 2.3078, - "step": 420740 - }, - { - "epoch": 0.73, - "learning_rate": 1.3313127578762336e-05, - "loss": 2.2575, - "step": 420750 - }, - { - "epoch": 0.73, - "learning_rate": 1.3312255638835508e-05, - "loss": 2.3083, - "step": 420760 - }, - { - "epoch": 0.73, - "learning_rate": 1.331138369890868e-05, - "loss": 2.3179, - "step": 420770 - }, - { - "epoch": 0.73, - "learning_rate": 1.3310511758981852e-05, - "loss": 2.2606, - "step": 420780 - }, - { - "epoch": 0.73, - "learning_rate": 1.3309639819055028e-05, - "loss": 2.2789, - "step": 420790 - }, - { - "epoch": 0.73, - "learning_rate": 1.33087678791282e-05, - "loss": 2.3664, - "step": 420800 - }, - { - "epoch": 0.73, - "learning_rate": 1.3307895939201373e-05, - "loss": 2.3067, - "step": 420810 - }, - { - "epoch": 0.73, - "learning_rate": 1.3307023999274546e-05, - "loss": 2.3043, - "step": 420820 - }, - { - "epoch": 0.73, - "learning_rate": 1.3306152059347721e-05, - "loss": 2.4116, - "step": 420830 - }, - { - "epoch": 0.73, - "learning_rate": 1.3305280119420893e-05, - "loss": 2.424, - "step": 420840 - }, - { - "epoch": 0.73, - "learning_rate": 1.3304408179494065e-05, - "loss": 2.2678, - "step": 420850 - }, - { - "epoch": 0.73, - "learning_rate": 1.3303536239567237e-05, - "loss": 2.3222, - "step": 420860 - }, - { - "epoch": 0.73, - "learning_rate": 1.3302664299640413e-05, - "loss": 2.3846, - "step": 420870 - }, - { - "epoch": 0.73, - "learning_rate": 1.3301792359713586e-05, - "loss": 2.2511, - "step": 420880 - }, - { - "epoch": 0.73, - "learning_rate": 1.3300920419786759e-05, - "loss": 2.3339, - "step": 420890 - }, - { - "epoch": 0.73, - "learning_rate": 1.3300048479859934e-05, - "loss": 2.3908, - "step": 420900 - }, - { - "epoch": 0.73, - "learning_rate": 1.3299176539933106e-05, - "loss": 2.2713, - "step": 420910 - }, - { - "epoch": 0.73, - "learning_rate": 1.3298304600006278e-05, - "loss": 2.1764, - "step": 420920 - }, - { - "epoch": 0.73, - "learning_rate": 1.329743266007945e-05, - "loss": 2.3631, - "step": 420930 - }, - { - "epoch": 0.73, - "learning_rate": 1.3296560720152626e-05, - "loss": 2.1162, - "step": 420940 - }, - { - "epoch": 0.73, - "learning_rate": 1.3295688780225798e-05, - "loss": 2.2668, - "step": 420950 - }, - { - "epoch": 0.73, - "learning_rate": 1.3294816840298972e-05, - "loss": 2.1941, - "step": 420960 - }, - { - "epoch": 0.73, - "learning_rate": 1.3293944900372144e-05, - "loss": 2.2673, - "step": 420970 - }, - { - "epoch": 0.73, - "learning_rate": 1.3293072960445319e-05, - "loss": 2.3067, - "step": 420980 - }, - { - "epoch": 0.73, - "learning_rate": 1.3292201020518491e-05, - "loss": 2.1884, - "step": 420990 - }, - { - "epoch": 0.73, - "learning_rate": 1.3291329080591663e-05, - "loss": 2.364, - "step": 421000 - }, - { - "epoch": 0.73, - "learning_rate": 1.3290457140664839e-05, - "loss": 2.2583, - "step": 421010 - }, - { - "epoch": 0.73, - "learning_rate": 1.328958520073801e-05, - "loss": 2.3157, - "step": 421020 - }, - { - "epoch": 0.73, - "learning_rate": 1.3288713260811183e-05, - "loss": 2.2997, - "step": 421030 - }, - { - "epoch": 0.73, - "learning_rate": 1.3287841320884357e-05, - "loss": 2.1537, - "step": 421040 - }, - { - "epoch": 0.73, - "learning_rate": 1.3286969380957532e-05, - "loss": 2.3772, - "step": 421050 - }, - { - "epoch": 0.73, - "learning_rate": 1.3286097441030704e-05, - "loss": 2.4154, - "step": 421060 - }, - { - "epoch": 0.73, - "learning_rate": 1.3285225501103876e-05, - "loss": 2.2937, - "step": 421070 - }, - { - "epoch": 0.73, - "learning_rate": 1.3284353561177048e-05, - "loss": 2.2822, - "step": 421080 - }, - { - "epoch": 0.73, - "learning_rate": 1.3283481621250224e-05, - "loss": 2.3942, - "step": 421090 - }, - { - "epoch": 0.73, - "learning_rate": 1.3282609681323396e-05, - "loss": 2.2964, - "step": 421100 - }, - { - "epoch": 0.73, - "learning_rate": 1.3281737741396568e-05, - "loss": 2.2444, - "step": 421110 - }, - { - "epoch": 0.73, - "learning_rate": 1.3280865801469742e-05, - "loss": 2.2997, - "step": 421120 - }, - { - "epoch": 0.73, - "learning_rate": 1.3279993861542917e-05, - "loss": 2.308, - "step": 421130 - }, - { - "epoch": 0.73, - "learning_rate": 1.327912192161609e-05, - "loss": 2.2362, - "step": 421140 - }, - { - "epoch": 0.73, - "learning_rate": 1.3278249981689261e-05, - "loss": 2.2838, - "step": 421150 - }, - { - "epoch": 0.73, - "learning_rate": 1.3277378041762437e-05, - "loss": 2.2861, - "step": 421160 - }, - { - "epoch": 0.73, - "learning_rate": 1.3276506101835609e-05, - "loss": 2.295, - "step": 421170 - }, - { - "epoch": 0.73, - "learning_rate": 1.3275634161908781e-05, - "loss": 2.3885, - "step": 421180 - }, - { - "epoch": 0.73, - "learning_rate": 1.3274762221981955e-05, - "loss": 2.3695, - "step": 421190 - }, - { - "epoch": 0.73, - "learning_rate": 1.3273890282055128e-05, - "loss": 2.1641, - "step": 421200 - }, - { - "epoch": 0.73, - "learning_rate": 1.3273018342128302e-05, - "loss": 2.255, - "step": 421210 - }, - { - "epoch": 0.73, - "learning_rate": 1.3272146402201474e-05, - "loss": 2.2954, - "step": 421220 - }, - { - "epoch": 0.73, - "learning_rate": 1.3271274462274646e-05, - "loss": 2.3818, - "step": 421230 - }, - { - "epoch": 0.73, - "learning_rate": 1.3270402522347822e-05, - "loss": 2.3168, - "step": 421240 - }, - { - "epoch": 0.73, - "learning_rate": 1.3269530582420994e-05, - "loss": 2.3023, - "step": 421250 - }, - { - "epoch": 0.73, - "learning_rate": 1.3268658642494166e-05, - "loss": 2.3412, - "step": 421260 - }, - { - "epoch": 0.73, - "learning_rate": 1.3267786702567341e-05, - "loss": 2.2924, - "step": 421270 - }, - { - "epoch": 0.73, - "learning_rate": 1.3266914762640514e-05, - "loss": 2.2213, - "step": 421280 - }, - { - "epoch": 0.73, - "learning_rate": 1.3266042822713687e-05, - "loss": 2.3757, - "step": 421290 - }, - { - "epoch": 0.73, - "learning_rate": 1.326517088278686e-05, - "loss": 2.348, - "step": 421300 - }, - { - "epoch": 0.73, - "learning_rate": 1.3264298942860035e-05, - "loss": 2.3966, - "step": 421310 - }, - { - "epoch": 0.73, - "learning_rate": 1.3263427002933207e-05, - "loss": 2.3589, - "step": 421320 - }, - { - "epoch": 0.73, - "learning_rate": 1.3262555063006379e-05, - "loss": 2.2015, - "step": 421330 - }, - { - "epoch": 0.73, - "learning_rate": 1.3261683123079551e-05, - "loss": 2.392, - "step": 421340 - }, - { - "epoch": 0.73, - "learning_rate": 1.3260811183152727e-05, - "loss": 2.2767, - "step": 421350 - }, - { - "epoch": 0.73, - "learning_rate": 1.32599392432259e-05, - "loss": 2.2801, - "step": 421360 - }, - { - "epoch": 0.73, - "learning_rate": 1.3259067303299072e-05, - "loss": 2.3068, - "step": 421370 - }, - { - "epoch": 0.73, - "learning_rate": 1.3258195363372244e-05, - "loss": 2.2075, - "step": 421380 - }, - { - "epoch": 0.73, - "learning_rate": 1.325732342344542e-05, - "loss": 2.1862, - "step": 421390 - }, - { - "epoch": 0.73, - "learning_rate": 1.3256451483518592e-05, - "loss": 2.316, - "step": 421400 - }, - { - "epoch": 0.73, - "learning_rate": 1.3255579543591764e-05, - "loss": 2.1855, - "step": 421410 - }, - { - "epoch": 0.73, - "learning_rate": 1.325470760366494e-05, - "loss": 2.2711, - "step": 421420 - }, - { - "epoch": 0.73, - "learning_rate": 1.3253835663738112e-05, - "loss": 2.3044, - "step": 421430 - }, - { - "epoch": 0.73, - "learning_rate": 1.3252963723811285e-05, - "loss": 2.3692, - "step": 421440 - }, - { - "epoch": 0.73, - "learning_rate": 1.3252091783884457e-05, - "loss": 2.4838, - "step": 421450 - }, - { - "epoch": 0.73, - "learning_rate": 1.3251219843957633e-05, - "loss": 2.2339, - "step": 421460 - }, - { - "epoch": 0.73, - "learning_rate": 1.3250347904030805e-05, - "loss": 2.3488, - "step": 421470 - }, - { - "epoch": 0.74, - "learning_rate": 1.3249475964103977e-05, - "loss": 2.2971, - "step": 421480 - }, - { - "epoch": 0.74, - "learning_rate": 1.324860402417715e-05, - "loss": 2.4036, - "step": 421490 - }, - { - "epoch": 0.74, - "learning_rate": 1.3247732084250325e-05, - "loss": 2.3149, - "step": 421500 - }, - { - "epoch": 0.74, - "learning_rate": 1.3246860144323497e-05, - "loss": 2.3874, - "step": 421510 - }, - { - "epoch": 0.74, - "learning_rate": 1.324598820439667e-05, - "loss": 2.4423, - "step": 421520 - }, - { - "epoch": 0.74, - "learning_rate": 1.3245116264469844e-05, - "loss": 2.1739, - "step": 421530 - }, - { - "epoch": 0.74, - "learning_rate": 1.3244244324543018e-05, - "loss": 2.2703, - "step": 421540 - }, - { - "epoch": 0.74, - "learning_rate": 1.324337238461619e-05, - "loss": 2.375, - "step": 421550 - }, - { - "epoch": 0.74, - "learning_rate": 1.3242500444689362e-05, - "loss": 2.4143, - "step": 421560 - }, - { - "epoch": 0.74, - "learning_rate": 1.3241628504762538e-05, - "loss": 2.2857, - "step": 421570 - }, - { - "epoch": 0.74, - "learning_rate": 1.324075656483571e-05, - "loss": 2.3682, - "step": 421580 - }, - { - "epoch": 0.74, - "learning_rate": 1.3239884624908882e-05, - "loss": 2.2951, - "step": 421590 - }, - { - "epoch": 0.74, - "learning_rate": 1.3239012684982056e-05, - "loss": 2.4426, - "step": 421600 - }, - { - "epoch": 0.74, - "learning_rate": 1.3238140745055231e-05, - "loss": 2.3634, - "step": 421610 - }, - { - "epoch": 0.74, - "learning_rate": 1.3237268805128403e-05, - "loss": 2.3668, - "step": 421620 - }, - { - "epoch": 0.74, - "learning_rate": 1.3236396865201575e-05, - "loss": 2.298, - "step": 421630 - }, - { - "epoch": 0.74, - "learning_rate": 1.3235524925274747e-05, - "loss": 2.357, - "step": 421640 - }, - { - "epoch": 0.74, - "learning_rate": 1.3234652985347923e-05, - "loss": 2.3762, - "step": 421650 - }, - { - "epoch": 0.74, - "learning_rate": 1.3233781045421095e-05, - "loss": 2.2381, - "step": 421660 - }, - { - "epoch": 0.74, - "learning_rate": 1.3232909105494269e-05, - "loss": 2.3573, - "step": 421670 - }, - { - "epoch": 0.74, - "learning_rate": 1.3232037165567442e-05, - "loss": 2.3007, - "step": 421680 - }, - { - "epoch": 0.74, - "learning_rate": 1.3231165225640616e-05, - "loss": 2.3537, - "step": 421690 - }, - { - "epoch": 0.74, - "learning_rate": 1.3230293285713788e-05, - "loss": 2.199, - "step": 421700 - }, - { - "epoch": 0.74, - "learning_rate": 1.322942134578696e-05, - "loss": 2.2983, - "step": 421710 - }, - { - "epoch": 0.74, - "learning_rate": 1.3228549405860136e-05, - "loss": 2.2604, - "step": 421720 - }, - { - "epoch": 0.74, - "learning_rate": 1.3227677465933308e-05, - "loss": 2.3329, - "step": 421730 - }, - { - "epoch": 0.74, - "learning_rate": 1.322680552600648e-05, - "loss": 2.3127, - "step": 421740 - }, - { - "epoch": 0.74, - "learning_rate": 1.3225933586079654e-05, - "loss": 2.2861, - "step": 421750 - }, - { - "epoch": 0.74, - "learning_rate": 1.3225061646152827e-05, - "loss": 2.2756, - "step": 421760 - }, - { - "epoch": 0.74, - "learning_rate": 1.3224189706226001e-05, - "loss": 2.2775, - "step": 421770 - }, - { - "epoch": 0.74, - "learning_rate": 1.3223317766299173e-05, - "loss": 2.4184, - "step": 421780 - }, - { - "epoch": 0.74, - "learning_rate": 1.3222445826372345e-05, - "loss": 2.1973, - "step": 421790 - }, - { - "epoch": 0.74, - "learning_rate": 1.322157388644552e-05, - "loss": 2.3695, - "step": 421800 - }, - { - "epoch": 0.74, - "learning_rate": 1.3220701946518693e-05, - "loss": 2.2757, - "step": 421810 - }, - { - "epoch": 0.74, - "learning_rate": 1.3219830006591865e-05, - "loss": 2.2944, - "step": 421820 - }, - { - "epoch": 0.74, - "learning_rate": 1.321895806666504e-05, - "loss": 2.2724, - "step": 421830 - }, - { - "epoch": 0.74, - "learning_rate": 1.3218086126738212e-05, - "loss": 2.2973, - "step": 421840 - }, - { - "epoch": 0.74, - "learning_rate": 1.3217214186811386e-05, - "loss": 2.2987, - "step": 421850 - }, - { - "epoch": 0.74, - "learning_rate": 1.3216342246884558e-05, - "loss": 2.3569, - "step": 421860 - }, - { - "epoch": 0.74, - "learning_rate": 1.3215470306957734e-05, - "loss": 2.3422, - "step": 421870 - }, - { - "epoch": 0.74, - "learning_rate": 1.3214598367030906e-05, - "loss": 2.2916, - "step": 421880 - }, - { - "epoch": 0.74, - "learning_rate": 1.3213726427104078e-05, - "loss": 2.25, - "step": 421890 - }, - { - "epoch": 0.74, - "learning_rate": 1.321285448717725e-05, - "loss": 2.3152, - "step": 421900 - }, - { - "epoch": 0.74, - "learning_rate": 1.3211982547250425e-05, - "loss": 2.3392, - "step": 421910 - }, - { - "epoch": 0.74, - "learning_rate": 1.32111106073236e-05, - "loss": 2.3393, - "step": 421920 - }, - { - "epoch": 0.74, - "learning_rate": 1.3210238667396771e-05, - "loss": 2.3616, - "step": 421930 - }, - { - "epoch": 0.74, - "learning_rate": 1.3209366727469947e-05, - "loss": 2.4351, - "step": 421940 - }, - { - "epoch": 0.74, - "learning_rate": 1.3208494787543119e-05, - "loss": 2.2922, - "step": 421950 - }, - { - "epoch": 0.74, - "learning_rate": 1.3207622847616291e-05, - "loss": 2.2986, - "step": 421960 - }, - { - "epoch": 0.74, - "learning_rate": 1.3206750907689463e-05, - "loss": 2.3535, - "step": 421970 - }, - { - "epoch": 0.74, - "learning_rate": 1.3205878967762638e-05, - "loss": 2.2853, - "step": 421980 - }, - { - "epoch": 0.74, - "learning_rate": 1.320500702783581e-05, - "loss": 2.2718, - "step": 421990 - }, - { - "epoch": 0.74, - "learning_rate": 1.3204135087908984e-05, - "loss": 2.3634, - "step": 422000 - }, - { - "epoch": 0.74, - "learning_rate": 1.3203263147982156e-05, - "loss": 2.2764, - "step": 422010 - }, - { - "epoch": 0.74, - "learning_rate": 1.3202391208055332e-05, - "loss": 2.3229, - "step": 422020 - }, - { - "epoch": 0.74, - "learning_rate": 1.3201519268128504e-05, - "loss": 2.2125, - "step": 422030 - }, - { - "epoch": 0.74, - "learning_rate": 1.3200647328201676e-05, - "loss": 2.3127, - "step": 422040 - }, - { - "epoch": 0.74, - "learning_rate": 1.3199775388274848e-05, - "loss": 2.2561, - "step": 422050 - }, - { - "epoch": 0.74, - "learning_rate": 1.3198903448348024e-05, - "loss": 2.301, - "step": 422060 - }, - { - "epoch": 0.74, - "learning_rate": 1.3198031508421196e-05, - "loss": 2.2302, - "step": 422070 - }, - { - "epoch": 0.74, - "learning_rate": 1.319715956849437e-05, - "loss": 2.2025, - "step": 422080 - }, - { - "epoch": 0.74, - "learning_rate": 1.3196287628567545e-05, - "loss": 2.3185, - "step": 422090 - }, - { - "epoch": 0.74, - "learning_rate": 1.3195415688640717e-05, - "loss": 2.3748, - "step": 422100 - }, - { - "epoch": 0.74, - "learning_rate": 1.3194543748713889e-05, - "loss": 2.3925, - "step": 422110 - }, - { - "epoch": 0.74, - "learning_rate": 1.3193671808787061e-05, - "loss": 2.2504, - "step": 422120 - }, - { - "epoch": 0.74, - "learning_rate": 1.3192799868860237e-05, - "loss": 2.4084, - "step": 422130 - }, - { - "epoch": 0.74, - "learning_rate": 1.3191927928933409e-05, - "loss": 2.3568, - "step": 422140 - }, - { - "epoch": 0.74, - "learning_rate": 1.319105598900658e-05, - "loss": 2.2569, - "step": 422150 - }, - { - "epoch": 0.74, - "learning_rate": 1.3190184049079754e-05, - "loss": 2.4299, - "step": 422160 - }, - { - "epoch": 0.74, - "learning_rate": 1.318931210915293e-05, - "loss": 2.2504, - "step": 422170 - }, - { - "epoch": 0.74, - "learning_rate": 1.3188440169226102e-05, - "loss": 2.3937, - "step": 422180 - }, - { - "epoch": 0.74, - "learning_rate": 1.3187568229299274e-05, - "loss": 2.4045, - "step": 422190 - }, - { - "epoch": 0.74, - "learning_rate": 1.318669628937245e-05, - "loss": 2.2578, - "step": 422200 - }, - { - "epoch": 0.74, - "learning_rate": 1.3185824349445622e-05, - "loss": 2.2869, - "step": 422210 - }, - { - "epoch": 0.74, - "learning_rate": 1.3184952409518794e-05, - "loss": 2.2881, - "step": 422220 - }, - { - "epoch": 0.74, - "learning_rate": 1.3184080469591967e-05, - "loss": 2.275, - "step": 422230 - }, - { - "epoch": 0.74, - "learning_rate": 1.3183208529665141e-05, - "loss": 2.3379, - "step": 422240 - }, - { - "epoch": 0.74, - "learning_rate": 1.3182336589738315e-05, - "loss": 2.2107, - "step": 422250 - }, - { - "epoch": 0.74, - "learning_rate": 1.3181464649811487e-05, - "loss": 2.3251, - "step": 422260 - }, - { - "epoch": 0.74, - "learning_rate": 1.318059270988466e-05, - "loss": 2.3077, - "step": 422270 - }, - { - "epoch": 0.74, - "learning_rate": 1.3179720769957835e-05, - "loss": 2.1784, - "step": 422280 - }, - { - "epoch": 0.74, - "learning_rate": 1.3178848830031007e-05, - "loss": 2.3484, - "step": 422290 - }, - { - "epoch": 0.74, - "learning_rate": 1.3177976890104179e-05, - "loss": 2.2851, - "step": 422300 - }, - { - "epoch": 0.74, - "learning_rate": 1.3177104950177353e-05, - "loss": 2.3913, - "step": 422310 - }, - { - "epoch": 0.74, - "learning_rate": 1.3176233010250526e-05, - "loss": 2.3338, - "step": 422320 - }, - { - "epoch": 0.74, - "learning_rate": 1.31753610703237e-05, - "loss": 2.3193, - "step": 422330 - }, - { - "epoch": 0.74, - "learning_rate": 1.3174489130396872e-05, - "loss": 2.3092, - "step": 422340 - }, - { - "epoch": 0.74, - "learning_rate": 1.3173617190470048e-05, - "loss": 2.4006, - "step": 422350 - }, - { - "epoch": 0.74, - "learning_rate": 1.317274525054322e-05, - "loss": 2.3484, - "step": 422360 - }, - { - "epoch": 0.74, - "learning_rate": 1.3171873310616392e-05, - "loss": 2.4023, - "step": 422370 - }, - { - "epoch": 0.74, - "learning_rate": 1.3171001370689564e-05, - "loss": 2.2273, - "step": 422380 - }, - { - "epoch": 0.74, - "learning_rate": 1.317012943076274e-05, - "loss": 2.1958, - "step": 422390 - }, - { - "epoch": 0.74, - "learning_rate": 1.3169257490835913e-05, - "loss": 2.3093, - "step": 422400 - }, - { - "epoch": 0.74, - "learning_rate": 1.3168385550909085e-05, - "loss": 2.3737, - "step": 422410 - }, - { - "epoch": 0.74, - "learning_rate": 1.3167513610982257e-05, - "loss": 2.1521, - "step": 422420 - }, - { - "epoch": 0.74, - "learning_rate": 1.3166641671055433e-05, - "loss": 2.1514, - "step": 422430 - }, - { - "epoch": 0.74, - "learning_rate": 1.3165769731128605e-05, - "loss": 2.3051, - "step": 422440 - }, - { - "epoch": 0.74, - "learning_rate": 1.3164897791201777e-05, - "loss": 2.4599, - "step": 422450 - }, - { - "epoch": 0.74, - "learning_rate": 1.316402585127495e-05, - "loss": 2.3126, - "step": 422460 - }, - { - "epoch": 0.74, - "learning_rate": 1.3163153911348124e-05, - "loss": 2.3017, - "step": 422470 - }, - { - "epoch": 0.74, - "learning_rate": 1.3162281971421298e-05, - "loss": 2.2048, - "step": 422480 - }, - { - "epoch": 0.74, - "learning_rate": 1.316141003149447e-05, - "loss": 2.4562, - "step": 422490 - }, - { - "epoch": 0.74, - "learning_rate": 1.3160538091567646e-05, - "loss": 2.2126, - "step": 422500 - }, - { - "epoch": 0.74, - "learning_rate": 1.3159666151640818e-05, - "loss": 2.1914, - "step": 422510 - }, - { - "epoch": 0.74, - "learning_rate": 1.315879421171399e-05, - "loss": 2.2986, - "step": 422520 - }, - { - "epoch": 0.74, - "learning_rate": 1.3157922271787162e-05, - "loss": 2.3506, - "step": 422530 - }, - { - "epoch": 0.74, - "learning_rate": 1.3157050331860337e-05, - "loss": 2.4304, - "step": 422540 - }, - { - "epoch": 0.74, - "learning_rate": 1.315617839193351e-05, - "loss": 2.2895, - "step": 422550 - }, - { - "epoch": 0.74, - "learning_rate": 1.3155306452006683e-05, - "loss": 2.3035, - "step": 422560 - }, - { - "epoch": 0.74, - "learning_rate": 1.3154434512079855e-05, - "loss": 2.2396, - "step": 422570 - }, - { - "epoch": 0.74, - "learning_rate": 1.315356257215303e-05, - "loss": 2.3022, - "step": 422580 - }, - { - "epoch": 0.74, - "learning_rate": 1.3152690632226203e-05, - "loss": 2.1777, - "step": 422590 - }, - { - "epoch": 0.74, - "learning_rate": 1.3151818692299375e-05, - "loss": 2.1674, - "step": 422600 - }, - { - "epoch": 0.74, - "learning_rate": 1.315094675237255e-05, - "loss": 2.2545, - "step": 422610 - }, - { - "epoch": 0.74, - "learning_rate": 1.3150074812445723e-05, - "loss": 2.2442, - "step": 422620 - }, - { - "epoch": 0.74, - "learning_rate": 1.3149202872518895e-05, - "loss": 2.3141, - "step": 422630 - }, - { - "epoch": 0.74, - "learning_rate": 1.3148330932592068e-05, - "loss": 2.3717, - "step": 422640 - }, - { - "epoch": 0.74, - "learning_rate": 1.3147458992665244e-05, - "loss": 2.2798, - "step": 422650 - }, - { - "epoch": 0.74, - "learning_rate": 1.3146587052738416e-05, - "loss": 2.2973, - "step": 422660 - }, - { - "epoch": 0.74, - "learning_rate": 1.3145715112811588e-05, - "loss": 2.3426, - "step": 422670 - }, - { - "epoch": 0.74, - "learning_rate": 1.314484317288476e-05, - "loss": 2.3374, - "step": 422680 - }, - { - "epoch": 0.74, - "learning_rate": 1.3143971232957936e-05, - "loss": 2.2601, - "step": 422690 - }, - { - "epoch": 0.74, - "learning_rate": 1.3143099293031108e-05, - "loss": 2.3095, - "step": 422700 - }, - { - "epoch": 0.74, - "learning_rate": 1.3142227353104281e-05, - "loss": 2.2143, - "step": 422710 - }, - { - "epoch": 0.74, - "learning_rate": 1.3141355413177453e-05, - "loss": 2.2194, - "step": 422720 - }, - { - "epoch": 0.74, - "learning_rate": 1.3140483473250629e-05, - "loss": 2.3312, - "step": 422730 - }, - { - "epoch": 0.74, - "learning_rate": 1.3139611533323801e-05, - "loss": 2.242, - "step": 422740 - }, - { - "epoch": 0.74, - "learning_rate": 1.3138739593396973e-05, - "loss": 2.3138, - "step": 422750 - }, - { - "epoch": 0.74, - "learning_rate": 1.3137867653470149e-05, - "loss": 2.3001, - "step": 422760 - }, - { - "epoch": 0.74, - "learning_rate": 1.313699571354332e-05, - "loss": 2.3024, - "step": 422770 - }, - { - "epoch": 0.74, - "learning_rate": 1.3136123773616493e-05, - "loss": 2.2874, - "step": 422780 - }, - { - "epoch": 0.74, - "learning_rate": 1.3135251833689666e-05, - "loss": 2.3442, - "step": 422790 - }, - { - "epoch": 0.74, - "learning_rate": 1.313437989376284e-05, - "loss": 2.2803, - "step": 422800 - }, - { - "epoch": 0.74, - "learning_rate": 1.3133507953836014e-05, - "loss": 2.2651, - "step": 422810 - }, - { - "epoch": 0.74, - "learning_rate": 1.3132636013909186e-05, - "loss": 2.4126, - "step": 422820 - }, - { - "epoch": 0.74, - "learning_rate": 1.3131764073982358e-05, - "loss": 2.415, - "step": 422830 - }, - { - "epoch": 0.74, - "learning_rate": 1.3130892134055534e-05, - "loss": 2.1327, - "step": 422840 - }, - { - "epoch": 0.74, - "learning_rate": 1.3130020194128706e-05, - "loss": 2.3068, - "step": 422850 - }, - { - "epoch": 0.74, - "learning_rate": 1.3129148254201878e-05, - "loss": 2.246, - "step": 422860 - }, - { - "epoch": 0.74, - "learning_rate": 1.3128276314275053e-05, - "loss": 2.3617, - "step": 422870 - }, - { - "epoch": 0.74, - "learning_rate": 1.3127404374348227e-05, - "loss": 2.3211, - "step": 422880 - }, - { - "epoch": 0.74, - "learning_rate": 1.3126532434421399e-05, - "loss": 2.4197, - "step": 422890 - }, - { - "epoch": 0.74, - "learning_rate": 1.3125660494494571e-05, - "loss": 2.1742, - "step": 422900 - }, - { - "epoch": 0.74, - "learning_rate": 1.3124788554567747e-05, - "loss": 2.3276, - "step": 422910 - }, - { - "epoch": 0.74, - "learning_rate": 1.3123916614640919e-05, - "loss": 2.2675, - "step": 422920 - }, - { - "epoch": 0.74, - "learning_rate": 1.312304467471409e-05, - "loss": 2.2098, - "step": 422930 - }, - { - "epoch": 0.74, - "learning_rate": 1.3122172734787263e-05, - "loss": 2.3089, - "step": 422940 - }, - { - "epoch": 0.74, - "learning_rate": 1.3121300794860438e-05, - "loss": 2.4355, - "step": 422950 - }, - { - "epoch": 0.74, - "learning_rate": 1.3120428854933612e-05, - "loss": 2.396, - "step": 422960 - }, - { - "epoch": 0.74, - "learning_rate": 1.3119556915006784e-05, - "loss": 2.3966, - "step": 422970 - }, - { - "epoch": 0.74, - "learning_rate": 1.3118684975079956e-05, - "loss": 2.2654, - "step": 422980 - }, - { - "epoch": 0.74, - "learning_rate": 1.3117813035153132e-05, - "loss": 2.3095, - "step": 422990 - }, - { - "epoch": 0.74, - "learning_rate": 1.3116941095226304e-05, - "loss": 2.2646, - "step": 423000 - }, - { - "epoch": 0.74, - "learning_rate": 1.3116069155299476e-05, - "loss": 2.2137, - "step": 423010 - }, - { - "epoch": 0.74, - "learning_rate": 1.3115197215372651e-05, - "loss": 2.4599, - "step": 423020 - }, - { - "epoch": 0.74, - "learning_rate": 1.3114325275445823e-05, - "loss": 2.2618, - "step": 423030 - }, - { - "epoch": 0.74, - "learning_rate": 1.3113453335518997e-05, - "loss": 2.3388, - "step": 423040 - }, - { - "epoch": 0.74, - "learning_rate": 1.311258139559217e-05, - "loss": 2.339, - "step": 423050 - }, - { - "epoch": 0.74, - "learning_rate": 1.3111709455665345e-05, - "loss": 2.2821, - "step": 423060 - }, - { - "epoch": 0.74, - "learning_rate": 1.3110837515738517e-05, - "loss": 2.3103, - "step": 423070 - }, - { - "epoch": 0.74, - "learning_rate": 1.3109965575811689e-05, - "loss": 2.2327, - "step": 423080 - }, - { - "epoch": 0.74, - "learning_rate": 1.3109093635884861e-05, - "loss": 2.3603, - "step": 423090 - }, - { - "epoch": 0.74, - "learning_rate": 1.3108221695958036e-05, - "loss": 2.2072, - "step": 423100 - }, - { - "epoch": 0.74, - "learning_rate": 1.3107349756031208e-05, - "loss": 2.4111, - "step": 423110 - }, - { - "epoch": 0.74, - "learning_rate": 1.3106477816104382e-05, - "loss": 2.2768, - "step": 423120 - }, - { - "epoch": 0.74, - "learning_rate": 1.3105605876177558e-05, - "loss": 2.1458, - "step": 423130 - }, - { - "epoch": 0.74, - "learning_rate": 1.310473393625073e-05, - "loss": 2.3063, - "step": 423140 - }, - { - "epoch": 0.74, - "learning_rate": 1.3103861996323902e-05, - "loss": 2.321, - "step": 423150 - }, - { - "epoch": 0.74, - "learning_rate": 1.3102990056397074e-05, - "loss": 2.2542, - "step": 423160 - }, - { - "epoch": 0.74, - "learning_rate": 1.310211811647025e-05, - "loss": 2.2871, - "step": 423170 - }, - { - "epoch": 0.74, - "learning_rate": 1.3101246176543421e-05, - "loss": 2.2685, - "step": 423180 - }, - { - "epoch": 0.74, - "learning_rate": 1.3100374236616595e-05, - "loss": 2.3032, - "step": 423190 - }, - { - "epoch": 0.74, - "learning_rate": 1.3099502296689767e-05, - "loss": 2.4071, - "step": 423200 - }, - { - "epoch": 0.74, - "learning_rate": 1.3098630356762943e-05, - "loss": 2.283, - "step": 423210 - }, - { - "epoch": 0.74, - "learning_rate": 1.3097758416836115e-05, - "loss": 2.273, - "step": 423220 - }, - { - "epoch": 0.74, - "learning_rate": 1.3096886476909287e-05, - "loss": 2.2937, - "step": 423230 - }, - { - "epoch": 0.74, - "learning_rate": 1.3096014536982459e-05, - "loss": 2.28, - "step": 423240 - }, - { - "epoch": 0.74, - "learning_rate": 1.3095142597055634e-05, - "loss": 2.2466, - "step": 423250 - }, - { - "epoch": 0.74, - "learning_rate": 1.3094270657128807e-05, - "loss": 2.1375, - "step": 423260 - }, - { - "epoch": 0.74, - "learning_rate": 1.309339871720198e-05, - "loss": 2.1914, - "step": 423270 - }, - { - "epoch": 0.74, - "learning_rate": 1.3092526777275154e-05, - "loss": 2.3435, - "step": 423280 - }, - { - "epoch": 0.74, - "learning_rate": 1.3091654837348328e-05, - "loss": 2.299, - "step": 423290 - }, - { - "epoch": 0.74, - "learning_rate": 1.30907828974215e-05, - "loss": 2.2157, - "step": 423300 - }, - { - "epoch": 0.74, - "learning_rate": 1.3089910957494672e-05, - "loss": 2.2674, - "step": 423310 - }, - { - "epoch": 0.74, - "learning_rate": 1.3089039017567847e-05, - "loss": 2.3856, - "step": 423320 - }, - { - "epoch": 0.74, - "learning_rate": 1.308816707764102e-05, - "loss": 2.3597, - "step": 423330 - }, - { - "epoch": 0.74, - "learning_rate": 1.3087295137714192e-05, - "loss": 2.3412, - "step": 423340 - }, - { - "epoch": 0.74, - "learning_rate": 1.3086423197787365e-05, - "loss": 2.2645, - "step": 423350 - }, - { - "epoch": 0.74, - "learning_rate": 1.3085551257860539e-05, - "loss": 2.2724, - "step": 423360 - }, - { - "epoch": 0.74, - "learning_rate": 1.3084679317933713e-05, - "loss": 2.2903, - "step": 423370 - }, - { - "epoch": 0.74, - "learning_rate": 1.3083807378006885e-05, - "loss": 2.2896, - "step": 423380 - }, - { - "epoch": 0.74, - "learning_rate": 1.3082935438080057e-05, - "loss": 2.444, - "step": 423390 - }, - { - "epoch": 0.74, - "learning_rate": 1.3082063498153233e-05, - "loss": 2.2987, - "step": 423400 - }, - { - "epoch": 0.74, - "learning_rate": 1.3081191558226405e-05, - "loss": 2.3328, - "step": 423410 - }, - { - "epoch": 0.74, - "learning_rate": 1.3080319618299577e-05, - "loss": 2.218, - "step": 423420 - }, - { - "epoch": 0.74, - "learning_rate": 1.3079447678372752e-05, - "loss": 2.2922, - "step": 423430 - }, - { - "epoch": 0.74, - "learning_rate": 1.3078575738445926e-05, - "loss": 2.2677, - "step": 423440 - }, - { - "epoch": 0.74, - "learning_rate": 1.3077703798519098e-05, - "loss": 2.2752, - "step": 423450 - }, - { - "epoch": 0.74, - "learning_rate": 1.307683185859227e-05, - "loss": 2.2689, - "step": 423460 - }, - { - "epoch": 0.74, - "learning_rate": 1.3075959918665446e-05, - "loss": 2.4626, - "step": 423470 - }, - { - "epoch": 0.74, - "learning_rate": 1.3075087978738618e-05, - "loss": 2.4144, - "step": 423480 - }, - { - "epoch": 0.74, - "learning_rate": 1.307421603881179e-05, - "loss": 2.2629, - "step": 423490 - }, - { - "epoch": 0.74, - "learning_rate": 1.3073344098884963e-05, - "loss": 2.3403, - "step": 423500 - }, - { - "epoch": 0.74, - "learning_rate": 1.3072472158958137e-05, - "loss": 2.3025, - "step": 423510 - }, - { - "epoch": 0.74, - "learning_rate": 1.3071600219031311e-05, - "loss": 2.3532, - "step": 423520 - }, - { - "epoch": 0.74, - "learning_rate": 1.3070728279104483e-05, - "loss": 2.3511, - "step": 423530 - }, - { - "epoch": 0.74, - "learning_rate": 1.3069856339177659e-05, - "loss": 2.3071, - "step": 423540 - }, - { - "epoch": 0.74, - "learning_rate": 1.306898439925083e-05, - "loss": 2.3016, - "step": 423550 - }, - { - "epoch": 0.74, - "learning_rate": 1.3068112459324003e-05, - "loss": 2.34, - "step": 423560 - }, - { - "epoch": 0.74, - "learning_rate": 1.3067240519397175e-05, - "loss": 2.3066, - "step": 423570 - }, - { - "epoch": 0.74, - "learning_rate": 1.306636857947035e-05, - "loss": 2.2354, - "step": 423580 - }, - { - "epoch": 0.74, - "learning_rate": 1.3065496639543522e-05, - "loss": 2.3129, - "step": 423590 - }, - { - "epoch": 0.74, - "learning_rate": 1.3064624699616696e-05, - "loss": 2.2307, - "step": 423600 - }, - { - "epoch": 0.74, - "learning_rate": 1.3063752759689868e-05, - "loss": 2.2669, - "step": 423610 - }, - { - "epoch": 0.74, - "learning_rate": 1.3062880819763044e-05, - "loss": 2.2807, - "step": 423620 - }, - { - "epoch": 0.74, - "learning_rate": 1.3062008879836216e-05, - "loss": 2.378, - "step": 423630 - }, - { - "epoch": 0.74, - "learning_rate": 1.3061136939909388e-05, - "loss": 2.406, - "step": 423640 - }, - { - "epoch": 0.74, - "learning_rate": 1.306026499998256e-05, - "loss": 2.2688, - "step": 423650 - }, - { - "epoch": 0.74, - "learning_rate": 1.3059393060055735e-05, - "loss": 2.2208, - "step": 423660 - }, - { - "epoch": 0.74, - "learning_rate": 1.3058521120128907e-05, - "loss": 2.2605, - "step": 423670 - }, - { - "epoch": 0.74, - "learning_rate": 1.3057649180202081e-05, - "loss": 2.2844, - "step": 423680 - }, - { - "epoch": 0.74, - "learning_rate": 1.3056777240275257e-05, - "loss": 2.2764, - "step": 423690 - }, - { - "epoch": 0.74, - "learning_rate": 1.3055905300348429e-05, - "loss": 2.3216, - "step": 423700 - }, - { - "epoch": 0.74, - "learning_rate": 1.30550333604216e-05, - "loss": 2.2684, - "step": 423710 - }, - { - "epoch": 0.74, - "learning_rate": 1.3054161420494773e-05, - "loss": 2.258, - "step": 423720 - }, - { - "epoch": 0.74, - "learning_rate": 1.3053289480567948e-05, - "loss": 2.2599, - "step": 423730 - }, - { - "epoch": 0.74, - "learning_rate": 1.305241754064112e-05, - "loss": 2.3126, - "step": 423740 - }, - { - "epoch": 0.74, - "learning_rate": 1.3051545600714294e-05, - "loss": 2.313, - "step": 423750 - }, - { - "epoch": 0.74, - "learning_rate": 1.3050673660787466e-05, - "loss": 2.292, - "step": 423760 - }, - { - "epoch": 0.74, - "learning_rate": 1.3049801720860642e-05, - "loss": 2.233, - "step": 423770 - }, - { - "epoch": 0.74, - "learning_rate": 1.3048929780933814e-05, - "loss": 2.3019, - "step": 423780 - }, - { - "epoch": 0.74, - "learning_rate": 1.3048057841006986e-05, - "loss": 2.3358, - "step": 423790 - }, - { - "epoch": 0.74, - "learning_rate": 1.3047185901080161e-05, - "loss": 2.3216, - "step": 423800 - }, - { - "epoch": 0.74, - "learning_rate": 1.3046313961153333e-05, - "loss": 2.413, - "step": 423810 - }, - { - "epoch": 0.74, - "learning_rate": 1.3045442021226505e-05, - "loss": 2.3645, - "step": 423820 - }, - { - "epoch": 0.74, - "learning_rate": 1.304457008129968e-05, - "loss": 2.2903, - "step": 423830 - }, - { - "epoch": 0.74, - "learning_rate": 1.3043698141372853e-05, - "loss": 2.4125, - "step": 423840 - }, - { - "epoch": 0.74, - "learning_rate": 1.3042826201446027e-05, - "loss": 2.3314, - "step": 423850 - }, - { - "epoch": 0.74, - "learning_rate": 1.3041954261519199e-05, - "loss": 2.3749, - "step": 423860 - }, - { - "epoch": 0.74, - "learning_rate": 1.3041082321592371e-05, - "loss": 2.1941, - "step": 423870 - }, - { - "epoch": 0.74, - "learning_rate": 1.3040210381665546e-05, - "loss": 2.287, - "step": 423880 - }, - { - "epoch": 0.74, - "learning_rate": 1.3039338441738718e-05, - "loss": 2.3887, - "step": 423890 - }, - { - "epoch": 0.74, - "learning_rate": 1.303846650181189e-05, - "loss": 2.311, - "step": 423900 - }, - { - "epoch": 0.74, - "learning_rate": 1.3037594561885064e-05, - "loss": 2.3866, - "step": 423910 - }, - { - "epoch": 0.74, - "learning_rate": 1.303672262195824e-05, - "loss": 2.4264, - "step": 423920 - }, - { - "epoch": 0.74, - "learning_rate": 1.3035850682031412e-05, - "loss": 2.3246, - "step": 423930 - }, - { - "epoch": 0.74, - "learning_rate": 1.3034978742104584e-05, - "loss": 2.3345, - "step": 423940 - }, - { - "epoch": 0.74, - "learning_rate": 1.303410680217776e-05, - "loss": 2.3408, - "step": 423950 - }, - { - "epoch": 0.74, - "learning_rate": 1.3033234862250931e-05, - "loss": 2.3533, - "step": 423960 - }, - { - "epoch": 0.74, - "learning_rate": 1.3032362922324104e-05, - "loss": 2.398, - "step": 423970 - }, - { - "epoch": 0.74, - "learning_rate": 1.3031490982397276e-05, - "loss": 2.2287, - "step": 423980 - }, - { - "epoch": 0.74, - "learning_rate": 1.3030619042470451e-05, - "loss": 2.3555, - "step": 423990 - }, - { - "epoch": 0.74, - "learning_rate": 1.3029747102543625e-05, - "loss": 2.2868, - "step": 424000 - }, - { - "epoch": 0.74, - "learning_rate": 1.3028875162616797e-05, - "loss": 2.3162, - "step": 424010 - }, - { - "epoch": 0.74, - "learning_rate": 1.3028003222689969e-05, - "loss": 2.2895, - "step": 424020 - }, - { - "epoch": 0.74, - "learning_rate": 1.3027131282763144e-05, - "loss": 2.2424, - "step": 424030 - }, - { - "epoch": 0.74, - "learning_rate": 1.3026259342836317e-05, - "loss": 2.2555, - "step": 424040 - }, - { - "epoch": 0.74, - "learning_rate": 1.3025387402909489e-05, - "loss": 2.2236, - "step": 424050 - }, - { - "epoch": 0.74, - "learning_rate": 1.3024515462982664e-05, - "loss": 2.3055, - "step": 424060 - }, - { - "epoch": 0.74, - "learning_rate": 1.3023643523055836e-05, - "loss": 2.242, - "step": 424070 - }, - { - "epoch": 0.74, - "learning_rate": 1.302277158312901e-05, - "loss": 2.2157, - "step": 424080 - }, - { - "epoch": 0.74, - "learning_rate": 1.3021899643202182e-05, - "loss": 2.3133, - "step": 424090 - }, - { - "epoch": 0.74, - "learning_rate": 1.3021027703275357e-05, - "loss": 2.2935, - "step": 424100 - }, - { - "epoch": 0.74, - "learning_rate": 1.302015576334853e-05, - "loss": 2.3229, - "step": 424110 - }, - { - "epoch": 0.74, - "learning_rate": 1.3019283823421702e-05, - "loss": 2.2146, - "step": 424120 - }, - { - "epoch": 0.74, - "learning_rate": 1.3018411883494874e-05, - "loss": 2.2858, - "step": 424130 - }, - { - "epoch": 0.74, - "learning_rate": 1.3017539943568049e-05, - "loss": 2.2677, - "step": 424140 - }, - { - "epoch": 0.74, - "learning_rate": 1.3016668003641221e-05, - "loss": 2.2931, - "step": 424150 - }, - { - "epoch": 0.74, - "learning_rate": 1.3015796063714395e-05, - "loss": 2.2373, - "step": 424160 - }, - { - "epoch": 0.74, - "learning_rate": 1.3014924123787567e-05, - "loss": 2.2684, - "step": 424170 - }, - { - "epoch": 0.74, - "learning_rate": 1.3014052183860743e-05, - "loss": 2.2891, - "step": 424180 - }, - { - "epoch": 0.74, - "learning_rate": 1.3013180243933915e-05, - "loss": 2.2579, - "step": 424190 - }, - { - "epoch": 0.74, - "learning_rate": 1.3012308304007087e-05, - "loss": 2.2638, - "step": 424200 - }, - { - "epoch": 0.74, - "learning_rate": 1.3011436364080262e-05, - "loss": 2.4067, - "step": 424210 - }, - { - "epoch": 0.74, - "learning_rate": 1.3010564424153434e-05, - "loss": 2.3492, - "step": 424220 - }, - { - "epoch": 0.74, - "learning_rate": 1.3009692484226608e-05, - "loss": 2.2458, - "step": 424230 - }, - { - "epoch": 0.74, - "learning_rate": 1.300882054429978e-05, - "loss": 2.345, - "step": 424240 - }, - { - "epoch": 0.74, - "learning_rate": 1.3007948604372956e-05, - "loss": 2.308, - "step": 424250 - }, - { - "epoch": 0.74, - "learning_rate": 1.3007076664446128e-05, - "loss": 2.2263, - "step": 424260 - }, - { - "epoch": 0.74, - "learning_rate": 1.30062047245193e-05, - "loss": 2.2953, - "step": 424270 - }, - { - "epoch": 0.74, - "learning_rate": 1.3005332784592472e-05, - "loss": 2.3069, - "step": 424280 - }, - { - "epoch": 0.74, - "learning_rate": 1.3004460844665647e-05, - "loss": 2.2515, - "step": 424290 - }, - { - "epoch": 0.74, - "learning_rate": 1.300358890473882e-05, - "loss": 2.346, - "step": 424300 - }, - { - "epoch": 0.74, - "learning_rate": 1.3002716964811993e-05, - "loss": 2.3555, - "step": 424310 - }, - { - "epoch": 0.74, - "learning_rate": 1.3001845024885165e-05, - "loss": 2.1906, - "step": 424320 - }, - { - "epoch": 0.74, - "learning_rate": 1.300097308495834e-05, - "loss": 2.2148, - "step": 424330 - }, - { - "epoch": 0.74, - "learning_rate": 1.3000101145031513e-05, - "loss": 2.255, - "step": 424340 - }, - { - "epoch": 0.74, - "learning_rate": 1.2999229205104685e-05, - "loss": 2.2056, - "step": 424350 - }, - { - "epoch": 0.74, - "learning_rate": 1.299835726517786e-05, - "loss": 2.3169, - "step": 424360 - }, - { - "epoch": 0.74, - "learning_rate": 1.2997485325251032e-05, - "loss": 2.3075, - "step": 424370 - }, - { - "epoch": 0.74, - "learning_rate": 1.2996613385324204e-05, - "loss": 2.3292, - "step": 424380 - }, - { - "epoch": 0.74, - "learning_rate": 1.2995741445397378e-05, - "loss": 2.4528, - "step": 424390 - }, - { - "epoch": 0.74, - "learning_rate": 1.2994869505470552e-05, - "loss": 2.279, - "step": 424400 - }, - { - "epoch": 0.74, - "learning_rate": 1.2993997565543726e-05, - "loss": 2.3482, - "step": 424410 - }, - { - "epoch": 0.74, - "learning_rate": 1.2993125625616898e-05, - "loss": 2.1972, - "step": 424420 - }, - { - "epoch": 0.74, - "learning_rate": 1.299225368569007e-05, - "loss": 2.3324, - "step": 424430 - }, - { - "epoch": 0.74, - "learning_rate": 1.2991381745763245e-05, - "loss": 2.1826, - "step": 424440 - }, - { - "epoch": 0.74, - "learning_rate": 1.2990509805836417e-05, - "loss": 2.3573, - "step": 424450 - }, - { - "epoch": 0.74, - "learning_rate": 1.298963786590959e-05, - "loss": 2.3239, - "step": 424460 - }, - { - "epoch": 0.74, - "learning_rate": 1.2988765925982765e-05, - "loss": 2.2044, - "step": 424470 - }, - { - "epoch": 0.74, - "learning_rate": 1.2987893986055939e-05, - "loss": 2.3965, - "step": 424480 - }, - { - "epoch": 0.74, - "learning_rate": 1.298702204612911e-05, - "loss": 2.3034, - "step": 424490 - }, - { - "epoch": 0.74, - "learning_rate": 1.2986150106202283e-05, - "loss": 2.3175, - "step": 424500 - }, - { - "epoch": 0.74, - "learning_rate": 1.2985278166275458e-05, - "loss": 2.2037, - "step": 424510 - }, - { - "epoch": 0.74, - "learning_rate": 1.298440622634863e-05, - "loss": 2.4287, - "step": 424520 - }, - { - "epoch": 0.74, - "learning_rate": 1.2983534286421802e-05, - "loss": 2.2594, - "step": 424530 - }, - { - "epoch": 0.74, - "learning_rate": 1.2982662346494976e-05, - "loss": 2.193, - "step": 424540 - }, - { - "epoch": 0.74, - "learning_rate": 1.298179040656815e-05, - "loss": 2.3404, - "step": 424550 - }, - { - "epoch": 0.74, - "learning_rate": 1.2980918466641324e-05, - "loss": 2.3511, - "step": 424560 - }, - { - "epoch": 0.74, - "learning_rate": 1.2980046526714496e-05, - "loss": 2.2279, - "step": 424570 - }, - { - "epoch": 0.74, - "learning_rate": 1.2979174586787668e-05, - "loss": 2.3629, - "step": 424580 - }, - { - "epoch": 0.74, - "learning_rate": 1.2978302646860843e-05, - "loss": 2.3818, - "step": 424590 - }, - { - "epoch": 0.74, - "learning_rate": 1.2977430706934015e-05, - "loss": 2.4654, - "step": 424600 - }, - { - "epoch": 0.74, - "learning_rate": 1.2976558767007188e-05, - "loss": 2.2323, - "step": 424610 - }, - { - "epoch": 0.74, - "learning_rate": 1.2975686827080363e-05, - "loss": 2.3387, - "step": 424620 - }, - { - "epoch": 0.74, - "learning_rate": 1.2974814887153535e-05, - "loss": 2.2153, - "step": 424630 - }, - { - "epoch": 0.74, - "learning_rate": 1.2973942947226709e-05, - "loss": 2.3062, - "step": 424640 - }, - { - "epoch": 0.74, - "learning_rate": 1.2973071007299881e-05, - "loss": 2.2875, - "step": 424650 - }, - { - "epoch": 0.74, - "learning_rate": 1.2972199067373056e-05, - "loss": 2.3532, - "step": 424660 - }, - { - "epoch": 0.74, - "learning_rate": 1.2971327127446228e-05, - "loss": 2.277, - "step": 424670 - }, - { - "epoch": 0.74, - "learning_rate": 1.29704551875194e-05, - "loss": 2.2467, - "step": 424680 - }, - { - "epoch": 0.74, - "learning_rate": 1.2969583247592573e-05, - "loss": 2.258, - "step": 424690 - }, - { - "epoch": 0.74, - "learning_rate": 1.2968711307665748e-05, - "loss": 2.3057, - "step": 424700 - }, - { - "epoch": 0.74, - "learning_rate": 1.296783936773892e-05, - "loss": 2.3182, - "step": 424710 - }, - { - "epoch": 0.74, - "learning_rate": 1.2966967427812094e-05, - "loss": 2.2796, - "step": 424720 - }, - { - "epoch": 0.74, - "learning_rate": 1.296609548788527e-05, - "loss": 2.2052, - "step": 424730 - }, - { - "epoch": 0.74, - "learning_rate": 1.2965223547958441e-05, - "loss": 2.2478, - "step": 424740 - }, - { - "epoch": 0.74, - "learning_rate": 1.2964351608031614e-05, - "loss": 2.3472, - "step": 424750 - }, - { - "epoch": 0.74, - "learning_rate": 1.2963479668104786e-05, - "loss": 2.351, - "step": 424760 - }, - { - "epoch": 0.74, - "learning_rate": 1.2962607728177961e-05, - "loss": 2.2938, - "step": 424770 - }, - { - "epoch": 0.74, - "learning_rate": 1.2961735788251133e-05, - "loss": 2.3623, - "step": 424780 - }, - { - "epoch": 0.74, - "learning_rate": 1.2960863848324307e-05, - "loss": 2.3099, - "step": 424790 - }, - { - "epoch": 0.74, - "learning_rate": 1.2959991908397479e-05, - "loss": 2.3868, - "step": 424800 - }, - { - "epoch": 0.74, - "learning_rate": 1.2959119968470654e-05, - "loss": 2.2602, - "step": 424810 - }, - { - "epoch": 0.74, - "learning_rate": 1.2958248028543827e-05, - "loss": 2.3175, - "step": 424820 - }, - { - "epoch": 0.74, - "learning_rate": 1.2957376088616999e-05, - "loss": 2.2707, - "step": 424830 - }, - { - "epoch": 0.74, - "learning_rate": 1.295650414869017e-05, - "loss": 2.4049, - "step": 424840 - }, - { - "epoch": 0.74, - "learning_rate": 1.2955632208763346e-05, - "loss": 2.2962, - "step": 424850 - }, - { - "epoch": 0.74, - "learning_rate": 1.2954760268836518e-05, - "loss": 2.3117, - "step": 424860 - }, - { - "epoch": 0.74, - "learning_rate": 1.2953888328909692e-05, - "loss": 2.2402, - "step": 424870 - }, - { - "epoch": 0.74, - "learning_rate": 1.2953016388982866e-05, - "loss": 2.2246, - "step": 424880 - }, - { - "epoch": 0.74, - "learning_rate": 1.295214444905604e-05, - "loss": 2.232, - "step": 424890 - }, - { - "epoch": 0.74, - "learning_rate": 1.2951272509129212e-05, - "loss": 2.298, - "step": 424900 - }, - { - "epoch": 0.74, - "learning_rate": 1.2950400569202384e-05, - "loss": 2.2286, - "step": 424910 - }, - { - "epoch": 0.74, - "learning_rate": 1.2949528629275559e-05, - "loss": 2.2773, - "step": 424920 - }, - { - "epoch": 0.74, - "learning_rate": 1.2948656689348731e-05, - "loss": 2.2504, - "step": 424930 - }, - { - "epoch": 0.74, - "learning_rate": 1.2947784749421903e-05, - "loss": 2.202, - "step": 424940 - }, - { - "epoch": 0.74, - "learning_rate": 1.2946912809495077e-05, - "loss": 2.2346, - "step": 424950 - }, - { - "epoch": 0.74, - "learning_rate": 1.2946040869568253e-05, - "loss": 2.315, - "step": 424960 - }, - { - "epoch": 0.74, - "learning_rate": 1.2945168929641425e-05, - "loss": 2.3666, - "step": 424970 - }, - { - "epoch": 0.74, - "learning_rate": 1.2944296989714597e-05, - "loss": 2.4372, - "step": 424980 - }, - { - "epoch": 0.74, - "learning_rate": 1.2943425049787772e-05, - "loss": 2.296, - "step": 424990 - }, - { - "epoch": 0.74, - "learning_rate": 1.2942553109860944e-05, - "loss": 2.3503, - "step": 425000 - }, - { - "epoch": 0.74, - "learning_rate": 1.2941681169934116e-05, - "loss": 2.3558, - "step": 425010 - }, - { - "epoch": 0.74, - "learning_rate": 1.2940809230007288e-05, - "loss": 2.3423, - "step": 425020 - }, - { - "epoch": 0.74, - "learning_rate": 1.2939937290080464e-05, - "loss": 2.3436, - "step": 425030 - }, - { - "epoch": 0.74, - "learning_rate": 1.2939065350153638e-05, - "loss": 2.3237, - "step": 425040 - }, - { - "epoch": 0.74, - "learning_rate": 1.293819341022681e-05, - "loss": 2.3037, - "step": 425050 - }, - { - "epoch": 0.74, - "learning_rate": 1.2937321470299982e-05, - "loss": 2.2948, - "step": 425060 - }, - { - "epoch": 0.74, - "learning_rate": 1.2936449530373157e-05, - "loss": 2.266, - "step": 425070 - }, - { - "epoch": 0.74, - "learning_rate": 1.293557759044633e-05, - "loss": 2.3544, - "step": 425080 - }, - { - "epoch": 0.74, - "learning_rate": 1.2934705650519501e-05, - "loss": 2.2751, - "step": 425090 - }, - { - "epoch": 0.74, - "learning_rate": 1.2933833710592675e-05, - "loss": 2.2929, - "step": 425100 - }, - { - "epoch": 0.74, - "learning_rate": 1.2932961770665849e-05, - "loss": 2.3326, - "step": 425110 - }, - { - "epoch": 0.74, - "learning_rate": 1.2932089830739023e-05, - "loss": 2.314, - "step": 425120 - }, - { - "epoch": 0.74, - "learning_rate": 1.2931217890812195e-05, - "loss": 2.3144, - "step": 425130 - }, - { - "epoch": 0.74, - "learning_rate": 1.293034595088537e-05, - "loss": 2.2934, - "step": 425140 - }, - { - "epoch": 0.74, - "learning_rate": 1.2929474010958542e-05, - "loss": 2.3552, - "step": 425150 - }, - { - "epoch": 0.74, - "learning_rate": 1.2928602071031714e-05, - "loss": 2.37, - "step": 425160 - }, - { - "epoch": 0.74, - "learning_rate": 1.2927730131104886e-05, - "loss": 2.3498, - "step": 425170 - }, - { - "epoch": 0.74, - "learning_rate": 1.2926858191178062e-05, - "loss": 2.3065, - "step": 425180 - }, - { - "epoch": 0.74, - "learning_rate": 1.2925986251251234e-05, - "loss": 2.3282, - "step": 425190 - }, - { - "epoch": 0.74, - "learning_rate": 1.2925114311324408e-05, - "loss": 2.2815, - "step": 425200 - }, - { - "epoch": 0.74, - "learning_rate": 1.292424237139758e-05, - "loss": 2.385, - "step": 425210 - }, - { - "epoch": 0.74, - "learning_rate": 1.2923370431470755e-05, - "loss": 2.3553, - "step": 425220 - }, - { - "epoch": 0.74, - "learning_rate": 1.2922498491543927e-05, - "loss": 2.2366, - "step": 425230 - }, - { - "epoch": 0.74, - "learning_rate": 1.29216265516171e-05, - "loss": 2.187, - "step": 425240 - }, - { - "epoch": 0.74, - "learning_rate": 1.2920754611690272e-05, - "loss": 2.1891, - "step": 425250 - }, - { - "epoch": 0.74, - "learning_rate": 1.2919882671763447e-05, - "loss": 2.2118, - "step": 425260 - }, - { - "epoch": 0.74, - "learning_rate": 1.291901073183662e-05, - "loss": 2.1524, - "step": 425270 - }, - { - "epoch": 0.74, - "learning_rate": 1.2918138791909793e-05, - "loss": 2.2495, - "step": 425280 - }, - { - "epoch": 0.74, - "learning_rate": 1.2917266851982968e-05, - "loss": 2.3346, - "step": 425290 - }, - { - "epoch": 0.74, - "learning_rate": 1.291639491205614e-05, - "loss": 2.2317, - "step": 425300 - }, - { - "epoch": 0.74, - "learning_rate": 1.2915522972129312e-05, - "loss": 2.3541, - "step": 425310 - }, - { - "epoch": 0.74, - "learning_rate": 1.2914651032202485e-05, - "loss": 2.1646, - "step": 425320 - }, - { - "epoch": 0.74, - "learning_rate": 1.291377909227566e-05, - "loss": 2.3818, - "step": 425330 - }, - { - "epoch": 0.74, - "learning_rate": 1.2912907152348832e-05, - "loss": 2.3045, - "step": 425340 - }, - { - "epoch": 0.74, - "learning_rate": 1.2912035212422006e-05, - "loss": 2.2115, - "step": 425350 - }, - { - "epoch": 0.74, - "learning_rate": 1.2911163272495178e-05, - "loss": 2.2539, - "step": 425360 - }, - { - "epoch": 0.74, - "learning_rate": 1.2910291332568353e-05, - "loss": 2.3765, - "step": 425370 - }, - { - "epoch": 0.74, - "learning_rate": 1.2909419392641525e-05, - "loss": 2.1783, - "step": 425380 - }, - { - "epoch": 0.74, - "learning_rate": 1.2908547452714698e-05, - "loss": 2.3033, - "step": 425390 - }, - { - "epoch": 0.74, - "learning_rate": 1.2907675512787873e-05, - "loss": 2.314, - "step": 425400 - }, - { - "epoch": 0.74, - "learning_rate": 1.2906803572861045e-05, - "loss": 2.3091, - "step": 425410 - }, - { - "epoch": 0.74, - "learning_rate": 1.2905931632934217e-05, - "loss": 2.2542, - "step": 425420 - }, - { - "epoch": 0.74, - "learning_rate": 1.2905059693007391e-05, - "loss": 2.2323, - "step": 425430 - }, - { - "epoch": 0.74, - "learning_rate": 1.2904187753080565e-05, - "loss": 2.265, - "step": 425440 - }, - { - "epoch": 0.74, - "learning_rate": 1.2903315813153738e-05, - "loss": 2.288, - "step": 425450 - }, - { - "epoch": 0.74, - "learning_rate": 1.290244387322691e-05, - "loss": 2.4525, - "step": 425460 - }, - { - "epoch": 0.74, - "learning_rate": 1.2901571933300083e-05, - "loss": 2.2632, - "step": 425470 - }, - { - "epoch": 0.74, - "learning_rate": 1.2900699993373258e-05, - "loss": 2.2992, - "step": 425480 - }, - { - "epoch": 0.74, - "learning_rate": 1.289982805344643e-05, - "loss": 2.3668, - "step": 425490 - }, - { - "epoch": 0.74, - "learning_rate": 1.2898956113519602e-05, - "loss": 2.3134, - "step": 425500 - }, - { - "epoch": 0.74, - "learning_rate": 1.2898084173592776e-05, - "loss": 2.3688, - "step": 425510 - }, - { - "epoch": 0.74, - "learning_rate": 1.2897212233665951e-05, - "loss": 2.3327, - "step": 425520 - }, - { - "epoch": 0.74, - "learning_rate": 1.2896340293739124e-05, - "loss": 2.3018, - "step": 425530 - }, - { - "epoch": 0.74, - "learning_rate": 1.2895468353812296e-05, - "loss": 2.3049, - "step": 425540 - }, - { - "epoch": 0.74, - "learning_rate": 1.2894596413885471e-05, - "loss": 2.3639, - "step": 425550 - }, - { - "epoch": 0.74, - "learning_rate": 1.2893724473958643e-05, - "loss": 2.3315, - "step": 425560 - }, - { - "epoch": 0.74, - "learning_rate": 1.2892852534031815e-05, - "loss": 2.1887, - "step": 425570 - }, - { - "epoch": 0.74, - "learning_rate": 1.2891980594104989e-05, - "loss": 2.2305, - "step": 425580 - }, - { - "epoch": 0.74, - "learning_rate": 1.2891108654178163e-05, - "loss": 2.3333, - "step": 425590 - }, - { - "epoch": 0.74, - "learning_rate": 1.2890236714251337e-05, - "loss": 2.2267, - "step": 425600 - }, - { - "epoch": 0.74, - "learning_rate": 1.2889364774324509e-05, - "loss": 2.2995, - "step": 425610 - }, - { - "epoch": 0.74, - "learning_rate": 1.288849283439768e-05, - "loss": 2.3094, - "step": 425620 - }, - { - "epoch": 0.74, - "learning_rate": 1.2887620894470856e-05, - "loss": 2.4354, - "step": 425630 - }, - { - "epoch": 0.74, - "learning_rate": 1.2886748954544028e-05, - "loss": 2.4238, - "step": 425640 - }, - { - "epoch": 0.74, - "learning_rate": 1.28858770146172e-05, - "loss": 2.3473, - "step": 425650 - }, - { - "epoch": 0.74, - "learning_rate": 1.2885005074690376e-05, - "loss": 2.1976, - "step": 425660 - }, - { - "epoch": 0.74, - "learning_rate": 1.2884133134763548e-05, - "loss": 2.4744, - "step": 425670 - }, - { - "epoch": 0.74, - "learning_rate": 1.2883261194836722e-05, - "loss": 2.2807, - "step": 425680 - }, - { - "epoch": 0.74, - "learning_rate": 1.2882389254909894e-05, - "loss": 2.2764, - "step": 425690 - }, - { - "epoch": 0.74, - "learning_rate": 1.2881517314983069e-05, - "loss": 2.3103, - "step": 425700 - }, - { - "epoch": 0.74, - "learning_rate": 1.2880645375056241e-05, - "loss": 2.2309, - "step": 425710 - }, - { - "epoch": 0.74, - "learning_rate": 1.2879773435129413e-05, - "loss": 2.2823, - "step": 425720 - }, - { - "epoch": 0.74, - "learning_rate": 1.2878901495202585e-05, - "loss": 2.2578, - "step": 425730 - }, - { - "epoch": 0.74, - "learning_rate": 1.287802955527576e-05, - "loss": 2.2483, - "step": 425740 - }, - { - "epoch": 0.74, - "learning_rate": 1.2877157615348933e-05, - "loss": 2.3581, - "step": 425750 - }, - { - "epoch": 0.74, - "learning_rate": 1.2876285675422107e-05, - "loss": 2.3155, - "step": 425760 - }, - { - "epoch": 0.74, - "learning_rate": 1.2875413735495279e-05, - "loss": 2.3715, - "step": 425770 - }, - { - "epoch": 0.74, - "learning_rate": 1.2874541795568454e-05, - "loss": 2.2605, - "step": 425780 - }, - { - "epoch": 0.74, - "learning_rate": 1.2873669855641626e-05, - "loss": 2.2693, - "step": 425790 - }, - { - "epoch": 0.74, - "learning_rate": 1.2872797915714798e-05, - "loss": 2.2966, - "step": 425800 - }, - { - "epoch": 0.74, - "learning_rate": 1.2871925975787974e-05, - "loss": 2.393, - "step": 425810 - }, - { - "epoch": 0.74, - "learning_rate": 1.2871054035861146e-05, - "loss": 2.2953, - "step": 425820 - }, - { - "epoch": 0.74, - "learning_rate": 1.287018209593432e-05, - "loss": 2.2692, - "step": 425830 - }, - { - "epoch": 0.74, - "learning_rate": 1.2869310156007492e-05, - "loss": 2.3418, - "step": 425840 - }, - { - "epoch": 0.74, - "learning_rate": 1.2868438216080667e-05, - "loss": 2.4206, - "step": 425850 - }, - { - "epoch": 0.74, - "learning_rate": 1.286756627615384e-05, - "loss": 2.2242, - "step": 425860 - }, - { - "epoch": 0.74, - "learning_rate": 1.2866694336227011e-05, - "loss": 2.4132, - "step": 425870 - }, - { - "epoch": 0.74, - "learning_rate": 1.2865822396300183e-05, - "loss": 2.275, - "step": 425880 - }, - { - "epoch": 0.74, - "learning_rate": 1.2864950456373359e-05, - "loss": 2.2273, - "step": 425890 - }, - { - "epoch": 0.74, - "learning_rate": 1.2864078516446531e-05, - "loss": 2.2501, - "step": 425900 - }, - { - "epoch": 0.74, - "learning_rate": 1.2863206576519705e-05, - "loss": 2.3736, - "step": 425910 - }, - { - "epoch": 0.74, - "learning_rate": 1.2862334636592879e-05, - "loss": 2.2369, - "step": 425920 - }, - { - "epoch": 0.74, - "learning_rate": 1.2861462696666052e-05, - "loss": 2.3492, - "step": 425930 - }, - { - "epoch": 0.74, - "learning_rate": 1.2860590756739224e-05, - "loss": 2.2936, - "step": 425940 - }, - { - "epoch": 0.74, - "learning_rate": 1.2859718816812396e-05, - "loss": 2.3347, - "step": 425950 - }, - { - "epoch": 0.74, - "learning_rate": 1.2858846876885572e-05, - "loss": 2.3164, - "step": 425960 - }, - { - "epoch": 0.74, - "learning_rate": 1.2857974936958744e-05, - "loss": 2.2924, - "step": 425970 - }, - { - "epoch": 0.74, - "learning_rate": 1.2857102997031916e-05, - "loss": 2.2932, - "step": 425980 - }, - { - "epoch": 0.74, - "learning_rate": 1.285623105710509e-05, - "loss": 2.2052, - "step": 425990 - }, - { - "epoch": 0.74, - "learning_rate": 1.2855359117178265e-05, - "loss": 2.2564, - "step": 426000 - }, - { - "epoch": 0.74, - "learning_rate": 1.2854487177251437e-05, - "loss": 2.2621, - "step": 426010 - }, - { - "epoch": 0.74, - "learning_rate": 1.285361523732461e-05, - "loss": 2.3652, - "step": 426020 - }, - { - "epoch": 0.74, - "learning_rate": 1.2852743297397782e-05, - "loss": 2.2714, - "step": 426030 - }, - { - "epoch": 0.74, - "learning_rate": 1.2851871357470957e-05, - "loss": 2.2578, - "step": 426040 - }, - { - "epoch": 0.74, - "learning_rate": 1.2850999417544129e-05, - "loss": 2.2461, - "step": 426050 - }, - { - "epoch": 0.74, - "learning_rate": 1.2850127477617301e-05, - "loss": 2.1916, - "step": 426060 - }, - { - "epoch": 0.74, - "learning_rate": 1.2849255537690477e-05, - "loss": 2.2427, - "step": 426070 - }, - { - "epoch": 0.74, - "learning_rate": 1.284838359776365e-05, - "loss": 2.1682, - "step": 426080 - }, - { - "epoch": 0.74, - "learning_rate": 1.2847511657836822e-05, - "loss": 2.3149, - "step": 426090 - }, - { - "epoch": 0.74, - "learning_rate": 1.2846639717909995e-05, - "loss": 2.3221, - "step": 426100 - }, - { - "epoch": 0.74, - "learning_rate": 1.284576777798317e-05, - "loss": 2.2231, - "step": 426110 - }, - { - "epoch": 0.74, - "learning_rate": 1.2844895838056342e-05, - "loss": 2.3239, - "step": 426120 - }, - { - "epoch": 0.74, - "learning_rate": 1.2844023898129514e-05, - "loss": 2.2734, - "step": 426130 - }, - { - "epoch": 0.74, - "learning_rate": 1.2843151958202688e-05, - "loss": 2.3867, - "step": 426140 - }, - { - "epoch": 0.74, - "learning_rate": 1.2842280018275862e-05, - "loss": 2.3155, - "step": 426150 - }, - { - "epoch": 0.74, - "learning_rate": 1.2841408078349035e-05, - "loss": 2.3511, - "step": 426160 - }, - { - "epoch": 0.74, - "learning_rate": 1.2840536138422208e-05, - "loss": 2.2868, - "step": 426170 - }, - { - "epoch": 0.74, - "learning_rate": 1.283966419849538e-05, - "loss": 2.4232, - "step": 426180 - }, - { - "epoch": 0.74, - "learning_rate": 1.2838792258568555e-05, - "loss": 2.2564, - "step": 426190 - }, - { - "epoch": 0.74, - "learning_rate": 1.2837920318641727e-05, - "loss": 2.251, - "step": 426200 - }, - { - "epoch": 0.74, - "learning_rate": 1.28370483787149e-05, - "loss": 2.3695, - "step": 426210 - }, - { - "epoch": 0.74, - "learning_rate": 1.2836176438788075e-05, - "loss": 2.1671, - "step": 426220 - }, - { - "epoch": 0.74, - "learning_rate": 1.2835304498861247e-05, - "loss": 2.2722, - "step": 426230 - }, - { - "epoch": 0.74, - "learning_rate": 1.283443255893442e-05, - "loss": 2.381, - "step": 426240 - }, - { - "epoch": 0.74, - "learning_rate": 1.2833560619007593e-05, - "loss": 2.1946, - "step": 426250 - }, - { - "epoch": 0.74, - "learning_rate": 1.2832688679080768e-05, - "loss": 2.2892, - "step": 426260 - }, - { - "epoch": 0.74, - "learning_rate": 1.283181673915394e-05, - "loss": 2.2314, - "step": 426270 - }, - { - "epoch": 0.74, - "learning_rate": 1.2830944799227112e-05, - "loss": 2.2315, - "step": 426280 - }, - { - "epoch": 0.74, - "learning_rate": 1.2830072859300284e-05, - "loss": 2.2994, - "step": 426290 - }, - { - "epoch": 0.74, - "learning_rate": 1.282920091937346e-05, - "loss": 2.2716, - "step": 426300 - }, - { - "epoch": 0.74, - "learning_rate": 1.2828328979446634e-05, - "loss": 2.3445, - "step": 426310 - }, - { - "epoch": 0.74, - "learning_rate": 1.2827457039519806e-05, - "loss": 2.26, - "step": 426320 - }, - { - "epoch": 0.74, - "learning_rate": 1.2826585099592981e-05, - "loss": 2.2979, - "step": 426330 - }, - { - "epoch": 0.74, - "learning_rate": 1.2825713159666153e-05, - "loss": 2.3045, - "step": 426340 - }, - { - "epoch": 0.74, - "learning_rate": 1.2824841219739325e-05, - "loss": 2.3063, - "step": 426350 - }, - { - "epoch": 0.74, - "learning_rate": 1.2823969279812497e-05, - "loss": 2.2174, - "step": 426360 - }, - { - "epoch": 0.74, - "learning_rate": 1.2823097339885673e-05, - "loss": 2.3775, - "step": 426370 - }, - { - "epoch": 0.74, - "learning_rate": 1.2822225399958845e-05, - "loss": 2.3425, - "step": 426380 - }, - { - "epoch": 0.74, - "learning_rate": 1.2821353460032019e-05, - "loss": 2.2955, - "step": 426390 - }, - { - "epoch": 0.74, - "learning_rate": 1.282048152010519e-05, - "loss": 2.3067, - "step": 426400 - }, - { - "epoch": 0.74, - "learning_rate": 1.2819609580178366e-05, - "loss": 2.328, - "step": 426410 - }, - { - "epoch": 0.74, - "learning_rate": 1.2818737640251538e-05, - "loss": 2.4774, - "step": 426420 - }, - { - "epoch": 0.74, - "learning_rate": 1.281786570032471e-05, - "loss": 2.3169, - "step": 426430 - }, - { - "epoch": 0.74, - "learning_rate": 1.2816993760397882e-05, - "loss": 2.2383, - "step": 426440 - }, - { - "epoch": 0.74, - "learning_rate": 1.2816121820471058e-05, - "loss": 2.3168, - "step": 426450 - }, - { - "epoch": 0.74, - "learning_rate": 1.281524988054423e-05, - "loss": 2.3179, - "step": 426460 - }, - { - "epoch": 0.74, - "learning_rate": 1.2814377940617404e-05, - "loss": 2.4369, - "step": 426470 - }, - { - "epoch": 0.74, - "learning_rate": 1.2813506000690577e-05, - "loss": 2.3934, - "step": 426480 - }, - { - "epoch": 0.74, - "learning_rate": 1.2812634060763751e-05, - "loss": 2.2677, - "step": 426490 - }, - { - "epoch": 0.74, - "learning_rate": 1.2811762120836923e-05, - "loss": 2.2514, - "step": 426500 - }, - { - "epoch": 0.74, - "learning_rate": 1.2810890180910095e-05, - "loss": 2.3554, - "step": 426510 - }, - { - "epoch": 0.74, - "learning_rate": 1.281001824098327e-05, - "loss": 2.2198, - "step": 426520 - }, - { - "epoch": 0.74, - "learning_rate": 1.2809146301056443e-05, - "loss": 2.2334, - "step": 426530 - }, - { - "epoch": 0.74, - "learning_rate": 1.2808274361129615e-05, - "loss": 2.3271, - "step": 426540 - }, - { - "epoch": 0.74, - "learning_rate": 1.2807402421202789e-05, - "loss": 2.396, - "step": 426550 - }, - { - "epoch": 0.74, - "learning_rate": 1.2806530481275964e-05, - "loss": 2.1531, - "step": 426560 - }, - { - "epoch": 0.74, - "learning_rate": 1.2805658541349136e-05, - "loss": 2.3516, - "step": 426570 - }, - { - "epoch": 0.74, - "learning_rate": 1.2804786601422308e-05, - "loss": 2.3483, - "step": 426580 - }, - { - "epoch": 0.74, - "learning_rate": 1.2803914661495484e-05, - "loss": 2.4123, - "step": 426590 - }, - { - "epoch": 0.74, - "learning_rate": 1.2803042721568656e-05, - "loss": 2.2762, - "step": 426600 - }, - { - "epoch": 0.74, - "learning_rate": 1.2802170781641828e-05, - "loss": 2.3533, - "step": 426610 - }, - { - "epoch": 0.74, - "learning_rate": 1.2801298841715002e-05, - "loss": 2.3854, - "step": 426620 - }, - { - "epoch": 0.74, - "learning_rate": 1.2800426901788176e-05, - "loss": 2.245, - "step": 426630 - }, - { - "epoch": 0.74, - "learning_rate": 1.279955496186135e-05, - "loss": 2.2645, - "step": 426640 - }, - { - "epoch": 0.74, - "learning_rate": 1.2798683021934521e-05, - "loss": 2.3054, - "step": 426650 - }, - { - "epoch": 0.74, - "learning_rate": 1.2797811082007693e-05, - "loss": 2.3399, - "step": 426660 - }, - { - "epoch": 0.74, - "learning_rate": 1.2796939142080869e-05, - "loss": 2.2052, - "step": 426670 - }, - { - "epoch": 0.74, - "learning_rate": 1.2796067202154041e-05, - "loss": 2.2664, - "step": 426680 - }, - { - "epoch": 0.74, - "learning_rate": 1.2795195262227213e-05, - "loss": 2.2544, - "step": 426690 - }, - { - "epoch": 0.74, - "learning_rate": 1.2794323322300387e-05, - "loss": 2.2523, - "step": 426700 - }, - { - "epoch": 0.74, - "learning_rate": 1.279345138237356e-05, - "loss": 2.2167, - "step": 426710 - }, - { - "epoch": 0.74, - "learning_rate": 1.2792579442446734e-05, - "loss": 2.3599, - "step": 426720 - }, - { - "epoch": 0.74, - "learning_rate": 1.2791707502519906e-05, - "loss": 2.3374, - "step": 426730 - }, - { - "epoch": 0.74, - "learning_rate": 1.2790835562593082e-05, - "loss": 2.2787, - "step": 426740 - }, - { - "epoch": 0.74, - "learning_rate": 1.2789963622666254e-05, - "loss": 2.297, - "step": 426750 - }, - { - "epoch": 0.74, - "learning_rate": 1.2789091682739426e-05, - "loss": 2.2318, - "step": 426760 - }, - { - "epoch": 0.74, - "learning_rate": 1.2788219742812598e-05, - "loss": 2.1947, - "step": 426770 - }, - { - "epoch": 0.74, - "learning_rate": 1.2787347802885774e-05, - "loss": 2.2497, - "step": 426780 - }, - { - "epoch": 0.74, - "learning_rate": 1.2786475862958946e-05, - "loss": 2.3655, - "step": 426790 - }, - { - "epoch": 0.74, - "learning_rate": 1.278560392303212e-05, - "loss": 2.3224, - "step": 426800 - }, - { - "epoch": 0.74, - "learning_rate": 1.2784731983105292e-05, - "loss": 2.3529, - "step": 426810 - }, - { - "epoch": 0.74, - "learning_rate": 1.2783860043178467e-05, - "loss": 2.3054, - "step": 426820 - }, - { - "epoch": 0.74, - "learning_rate": 1.2782988103251639e-05, - "loss": 2.1812, - "step": 426830 - }, - { - "epoch": 0.74, - "learning_rate": 1.2782116163324811e-05, - "loss": 2.1832, - "step": 426840 - }, - { - "epoch": 0.74, - "learning_rate": 1.2781244223397987e-05, - "loss": 2.2471, - "step": 426850 - }, - { - "epoch": 0.74, - "learning_rate": 1.2780372283471159e-05, - "loss": 2.2926, - "step": 426860 - }, - { - "epoch": 0.74, - "learning_rate": 1.2779500343544332e-05, - "loss": 2.2486, - "step": 426870 - }, - { - "epoch": 0.74, - "learning_rate": 1.2778628403617505e-05, - "loss": 2.382, - "step": 426880 - }, - { - "epoch": 0.74, - "learning_rate": 1.277775646369068e-05, - "loss": 2.3627, - "step": 426890 - }, - { - "epoch": 0.74, - "learning_rate": 1.2776884523763852e-05, - "loss": 2.3608, - "step": 426900 - }, - { - "epoch": 0.74, - "learning_rate": 1.2776012583837024e-05, - "loss": 2.2485, - "step": 426910 - }, - { - "epoch": 0.74, - "learning_rate": 1.2775140643910196e-05, - "loss": 2.3219, - "step": 426920 - }, - { - "epoch": 0.74, - "learning_rate": 1.2774268703983372e-05, - "loss": 2.2409, - "step": 426930 - }, - { - "epoch": 0.74, - "learning_rate": 1.2773396764056544e-05, - "loss": 2.3138, - "step": 426940 - }, - { - "epoch": 0.74, - "learning_rate": 1.2772524824129718e-05, - "loss": 2.2372, - "step": 426950 - }, - { - "epoch": 0.74, - "learning_rate": 1.277165288420289e-05, - "loss": 2.3694, - "step": 426960 - }, - { - "epoch": 0.74, - "learning_rate": 1.2770780944276065e-05, - "loss": 2.3195, - "step": 426970 - }, - { - "epoch": 0.74, - "learning_rate": 1.2769909004349237e-05, - "loss": 2.299, - "step": 426980 - }, - { - "epoch": 0.74, - "learning_rate": 1.276903706442241e-05, - "loss": 2.2719, - "step": 426990 - }, - { - "epoch": 0.74, - "learning_rate": 1.2768165124495585e-05, - "loss": 2.3227, - "step": 427000 - }, - { - "epoch": 0.74, - "learning_rate": 1.2767293184568757e-05, - "loss": 2.3344, - "step": 427010 - }, - { - "epoch": 0.74, - "learning_rate": 1.2766421244641929e-05, - "loss": 2.3043, - "step": 427020 - }, - { - "epoch": 0.74, - "learning_rate": 1.2765549304715103e-05, - "loss": 2.2727, - "step": 427030 - }, - { - "epoch": 0.74, - "learning_rate": 1.2764677364788278e-05, - "loss": 2.2267, - "step": 427040 - }, - { - "epoch": 0.74, - "learning_rate": 1.276380542486145e-05, - "loss": 2.292, - "step": 427050 - }, - { - "epoch": 0.74, - "learning_rate": 1.2762933484934622e-05, - "loss": 2.2526, - "step": 427060 - }, - { - "epoch": 0.74, - "learning_rate": 1.2762061545007794e-05, - "loss": 2.32, - "step": 427070 - }, - { - "epoch": 0.74, - "learning_rate": 1.276118960508097e-05, - "loss": 2.3542, - "step": 427080 - }, - { - "epoch": 0.74, - "learning_rate": 1.2760317665154142e-05, - "loss": 2.2609, - "step": 427090 - }, - { - "epoch": 0.74, - "learning_rate": 1.2759445725227314e-05, - "loss": 2.2753, - "step": 427100 - }, - { - "epoch": 0.74, - "learning_rate": 1.2758573785300488e-05, - "loss": 2.2078, - "step": 427110 - }, - { - "epoch": 0.74, - "learning_rate": 1.2757701845373663e-05, - "loss": 2.353, - "step": 427120 - }, - { - "epoch": 0.74, - "learning_rate": 1.2756829905446835e-05, - "loss": 2.3686, - "step": 427130 - }, - { - "epoch": 0.74, - "learning_rate": 1.2755957965520007e-05, - "loss": 2.3508, - "step": 427140 - }, - { - "epoch": 0.74, - "learning_rate": 1.2755086025593183e-05, - "loss": 2.3317, - "step": 427150 - }, - { - "epoch": 0.74, - "learning_rate": 1.2754214085666355e-05, - "loss": 2.2903, - "step": 427160 - }, - { - "epoch": 0.74, - "learning_rate": 1.2753342145739527e-05, - "loss": 2.344, - "step": 427170 - }, - { - "epoch": 0.74, - "learning_rate": 1.27524702058127e-05, - "loss": 2.2762, - "step": 427180 - }, - { - "epoch": 0.74, - "learning_rate": 1.2751598265885874e-05, - "loss": 2.3019, - "step": 427190 - }, - { - "epoch": 0.74, - "learning_rate": 1.2750726325959048e-05, - "loss": 2.3484, - "step": 427200 - }, - { - "epoch": 0.75, - "learning_rate": 1.274985438603222e-05, - "loss": 2.2539, - "step": 427210 - }, - { - "epoch": 0.75, - "learning_rate": 1.2748982446105392e-05, - "loss": 2.2996, - "step": 427220 - }, - { - "epoch": 0.75, - "learning_rate": 1.2748110506178568e-05, - "loss": 2.3495, - "step": 427230 - }, - { - "epoch": 0.75, - "learning_rate": 1.274723856625174e-05, - "loss": 2.3103, - "step": 427240 - }, - { - "epoch": 0.75, - "learning_rate": 1.2746366626324912e-05, - "loss": 2.3337, - "step": 427250 - }, - { - "epoch": 0.75, - "learning_rate": 1.2745494686398087e-05, - "loss": 2.3735, - "step": 427260 - }, - { - "epoch": 0.75, - "learning_rate": 1.274462274647126e-05, - "loss": 2.3138, - "step": 427270 - }, - { - "epoch": 0.75, - "learning_rate": 1.2743750806544433e-05, - "loss": 2.3854, - "step": 427280 - }, - { - "epoch": 0.75, - "learning_rate": 1.2742878866617605e-05, - "loss": 2.2414, - "step": 427290 - }, - { - "epoch": 0.75, - "learning_rate": 1.2742006926690781e-05, - "loss": 2.2411, - "step": 427300 - }, - { - "epoch": 0.75, - "learning_rate": 1.2741134986763953e-05, - "loss": 2.328, - "step": 427310 - }, - { - "epoch": 0.75, - "learning_rate": 1.2740263046837125e-05, - "loss": 2.3118, - "step": 427320 - }, - { - "epoch": 0.75, - "learning_rate": 1.2739391106910297e-05, - "loss": 2.2028, - "step": 427330 - }, - { - "epoch": 0.75, - "learning_rate": 1.2738519166983473e-05, - "loss": 2.2871, - "step": 427340 - }, - { - "epoch": 0.75, - "learning_rate": 1.2737647227056646e-05, - "loss": 2.2957, - "step": 427350 - }, - { - "epoch": 0.75, - "learning_rate": 1.2736775287129818e-05, - "loss": 2.3161, - "step": 427360 - }, - { - "epoch": 0.75, - "learning_rate": 1.273590334720299e-05, - "loss": 2.3104, - "step": 427370 - }, - { - "epoch": 0.75, - "learning_rate": 1.2735031407276166e-05, - "loss": 2.1806, - "step": 427380 - }, - { - "epoch": 0.75, - "learning_rate": 1.2734159467349338e-05, - "loss": 2.1583, - "step": 427390 - }, - { - "epoch": 0.75, - "learning_rate": 1.273328752742251e-05, - "loss": 2.2891, - "step": 427400 - }, - { - "epoch": 0.75, - "learning_rate": 1.2732415587495686e-05, - "loss": 2.2192, - "step": 427410 - }, - { - "epoch": 0.75, - "learning_rate": 1.2731543647568858e-05, - "loss": 2.198, - "step": 427420 - }, - { - "epoch": 0.75, - "learning_rate": 1.2730671707642031e-05, - "loss": 2.2498, - "step": 427430 - }, - { - "epoch": 0.75, - "learning_rate": 1.2729799767715203e-05, - "loss": 2.3343, - "step": 427440 - }, - { - "epoch": 0.75, - "learning_rate": 1.2728927827788379e-05, - "loss": 2.2685, - "step": 427450 - }, - { - "epoch": 0.75, - "learning_rate": 1.2728055887861551e-05, - "loss": 2.3365, - "step": 427460 - }, - { - "epoch": 0.75, - "learning_rate": 1.2727183947934723e-05, - "loss": 2.2553, - "step": 427470 - }, - { - "epoch": 0.75, - "learning_rate": 1.2726312008007895e-05, - "loss": 2.3586, - "step": 427480 - }, - { - "epoch": 0.75, - "learning_rate": 1.272544006808107e-05, - "loss": 2.3864, - "step": 427490 - }, - { - "epoch": 0.75, - "learning_rate": 1.2724568128154243e-05, - "loss": 2.3961, - "step": 427500 - }, - { - "epoch": 0.75, - "learning_rate": 1.2723696188227416e-05, - "loss": 2.3577, - "step": 427510 - }, - { - "epoch": 0.75, - "learning_rate": 1.272282424830059e-05, - "loss": 2.4164, - "step": 427520 - }, - { - "epoch": 0.75, - "learning_rate": 1.2721952308373764e-05, - "loss": 2.2949, - "step": 427530 - }, - { - "epoch": 0.75, - "learning_rate": 1.2721080368446936e-05, - "loss": 2.3114, - "step": 427540 - }, - { - "epoch": 0.75, - "learning_rate": 1.2720208428520108e-05, - "loss": 2.2914, - "step": 427550 - }, - { - "epoch": 0.75, - "learning_rate": 1.2719336488593284e-05, - "loss": 2.3349, - "step": 427560 - }, - { - "epoch": 0.75, - "learning_rate": 1.2718464548666456e-05, - "loss": 2.1842, - "step": 427570 - }, - { - "epoch": 0.75, - "learning_rate": 1.2717592608739628e-05, - "loss": 2.3024, - "step": 427580 - }, - { - "epoch": 0.75, - "learning_rate": 1.2716720668812802e-05, - "loss": 2.3439, - "step": 427590 - }, - { - "epoch": 0.75, - "learning_rate": 1.2715848728885977e-05, - "loss": 2.4224, - "step": 427600 - }, - { - "epoch": 0.75, - "learning_rate": 1.2714976788959149e-05, - "loss": 2.2835, - "step": 427610 - }, - { - "epoch": 0.75, - "learning_rate": 1.2714104849032321e-05, - "loss": 2.4283, - "step": 427620 - }, - { - "epoch": 0.75, - "learning_rate": 1.2713232909105493e-05, - "loss": 2.3624, - "step": 427630 - }, - { - "epoch": 0.75, - "learning_rate": 1.2712360969178669e-05, - "loss": 2.291, - "step": 427640 - }, - { - "epoch": 0.75, - "learning_rate": 1.271148902925184e-05, - "loss": 2.338, - "step": 427650 - }, - { - "epoch": 0.75, - "learning_rate": 1.2710617089325015e-05, - "loss": 2.137, - "step": 427660 - }, - { - "epoch": 0.75, - "learning_rate": 1.2709745149398188e-05, - "loss": 2.3319, - "step": 427670 - }, - { - "epoch": 0.75, - "learning_rate": 1.2708873209471362e-05, - "loss": 2.358, - "step": 427680 - }, - { - "epoch": 0.75, - "learning_rate": 1.2708001269544534e-05, - "loss": 2.1922, - "step": 427690 - }, - { - "epoch": 0.75, - "learning_rate": 1.2707129329617706e-05, - "loss": 2.3485, - "step": 427700 - }, - { - "epoch": 0.75, - "learning_rate": 1.2706257389690882e-05, - "loss": 2.3436, - "step": 427710 - }, - { - "epoch": 0.75, - "learning_rate": 1.2705385449764054e-05, - "loss": 2.2881, - "step": 427720 - }, - { - "epoch": 0.75, - "learning_rate": 1.2704513509837226e-05, - "loss": 2.2323, - "step": 427730 - }, - { - "epoch": 0.75, - "learning_rate": 1.27036415699104e-05, - "loss": 2.2931, - "step": 427740 - }, - { - "epoch": 0.75, - "learning_rate": 1.2702769629983573e-05, - "loss": 2.3473, - "step": 427750 - }, - { - "epoch": 0.75, - "learning_rate": 1.2701897690056747e-05, - "loss": 2.238, - "step": 427760 - }, - { - "epoch": 0.75, - "learning_rate": 1.270102575012992e-05, - "loss": 2.3562, - "step": 427770 - }, - { - "epoch": 0.75, - "learning_rate": 1.2700153810203091e-05, - "loss": 2.2953, - "step": 427780 - }, - { - "epoch": 0.75, - "learning_rate": 1.2699281870276267e-05, - "loss": 2.3623, - "step": 427790 - }, - { - "epoch": 0.75, - "learning_rate": 1.2698409930349439e-05, - "loss": 2.4194, - "step": 427800 - }, - { - "epoch": 0.75, - "learning_rate": 1.2697537990422611e-05, - "loss": 2.2922, - "step": 427810 - }, - { - "epoch": 0.75, - "learning_rate": 1.2696666050495786e-05, - "loss": 2.3996, - "step": 427820 - }, - { - "epoch": 0.75, - "learning_rate": 1.2695794110568958e-05, - "loss": 2.3309, - "step": 427830 - }, - { - "epoch": 0.75, - "learning_rate": 1.2694922170642132e-05, - "loss": 2.2257, - "step": 427840 - }, - { - "epoch": 0.75, - "learning_rate": 1.2694050230715304e-05, - "loss": 2.3211, - "step": 427850 - }, - { - "epoch": 0.75, - "learning_rate": 1.269317829078848e-05, - "loss": 2.3007, - "step": 427860 - }, - { - "epoch": 0.75, - "learning_rate": 1.2692306350861652e-05, - "loss": 2.2854, - "step": 427870 - }, - { - "epoch": 0.75, - "learning_rate": 1.2691434410934824e-05, - "loss": 2.3506, - "step": 427880 - }, - { - "epoch": 0.75, - "learning_rate": 1.2690562471007996e-05, - "loss": 2.3264, - "step": 427890 - }, - { - "epoch": 0.75, - "learning_rate": 1.2689690531081171e-05, - "loss": 2.2475, - "step": 427900 - }, - { - "epoch": 0.75, - "learning_rate": 1.2688818591154345e-05, - "loss": 2.3421, - "step": 427910 - }, - { - "epoch": 0.75, - "learning_rate": 1.2687946651227517e-05, - "loss": 2.2825, - "step": 427920 - }, - { - "epoch": 0.75, - "learning_rate": 1.2687074711300693e-05, - "loss": 2.3102, - "step": 427930 - }, - { - "epoch": 0.75, - "learning_rate": 1.2686202771373865e-05, - "loss": 2.2546, - "step": 427940 - }, - { - "epoch": 0.75, - "learning_rate": 1.2685330831447037e-05, - "loss": 2.2659, - "step": 427950 - }, - { - "epoch": 0.75, - "learning_rate": 1.2684458891520209e-05, - "loss": 2.2774, - "step": 427960 - }, - { - "epoch": 0.75, - "learning_rate": 1.2683586951593384e-05, - "loss": 2.2001, - "step": 427970 - }, - { - "epoch": 0.75, - "learning_rate": 1.2682715011666557e-05, - "loss": 2.2541, - "step": 427980 - }, - { - "epoch": 0.75, - "learning_rate": 1.268184307173973e-05, - "loss": 2.3907, - "step": 427990 - }, - { - "epoch": 0.75, - "learning_rate": 1.2680971131812902e-05, - "loss": 2.3241, - "step": 428000 - }, - { - "epoch": 0.75, - "learning_rate": 1.2680099191886078e-05, - "loss": 2.3213, - "step": 428010 - }, - { - "epoch": 0.75, - "learning_rate": 1.267922725195925e-05, - "loss": 2.3483, - "step": 428020 - }, - { - "epoch": 0.75, - "learning_rate": 1.2678355312032422e-05, - "loss": 2.3835, - "step": 428030 - }, - { - "epoch": 0.75, - "learning_rate": 1.2677483372105594e-05, - "loss": 2.3446, - "step": 428040 - }, - { - "epoch": 0.75, - "learning_rate": 1.267661143217877e-05, - "loss": 2.3246, - "step": 428050 - }, - { - "epoch": 0.75, - "learning_rate": 1.2675739492251942e-05, - "loss": 2.2427, - "step": 428060 - }, - { - "epoch": 0.75, - "learning_rate": 1.2674867552325115e-05, - "loss": 2.2901, - "step": 428070 - }, - { - "epoch": 0.75, - "learning_rate": 1.2673995612398291e-05, - "loss": 2.0889, - "step": 428080 - }, - { - "epoch": 0.75, - "learning_rate": 1.2673123672471463e-05, - "loss": 2.2811, - "step": 428090 - }, - { - "epoch": 0.75, - "learning_rate": 1.2672251732544635e-05, - "loss": 2.3438, - "step": 428100 - }, - { - "epoch": 0.75, - "learning_rate": 1.2671379792617807e-05, - "loss": 2.2951, - "step": 428110 - }, - { - "epoch": 0.75, - "learning_rate": 1.2670507852690983e-05, - "loss": 2.2885, - "step": 428120 - }, - { - "epoch": 0.75, - "learning_rate": 1.2669635912764155e-05, - "loss": 2.3522, - "step": 428130 - }, - { - "epoch": 0.75, - "learning_rate": 1.2668763972837327e-05, - "loss": 2.3224, - "step": 428140 - }, - { - "epoch": 0.75, - "learning_rate": 1.26678920329105e-05, - "loss": 2.3119, - "step": 428150 - }, - { - "epoch": 0.75, - "learning_rate": 1.2667020092983676e-05, - "loss": 2.2574, - "step": 428160 - }, - { - "epoch": 0.75, - "learning_rate": 1.2666148153056848e-05, - "loss": 2.2948, - "step": 428170 - }, - { - "epoch": 0.75, - "learning_rate": 1.266527621313002e-05, - "loss": 2.4124, - "step": 428180 - }, - { - "epoch": 0.75, - "learning_rate": 1.2664404273203196e-05, - "loss": 2.2785, - "step": 428190 - }, - { - "epoch": 0.75, - "learning_rate": 1.2663532333276368e-05, - "loss": 2.2787, - "step": 428200 - }, - { - "epoch": 0.75, - "learning_rate": 1.266266039334954e-05, - "loss": 2.336, - "step": 428210 - }, - { - "epoch": 0.75, - "learning_rate": 1.2661788453422713e-05, - "loss": 2.2911, - "step": 428220 - }, - { - "epoch": 0.75, - "learning_rate": 1.2660916513495887e-05, - "loss": 2.3358, - "step": 428230 - }, - { - "epoch": 0.75, - "learning_rate": 1.2660044573569061e-05, - "loss": 2.3435, - "step": 428240 - }, - { - "epoch": 0.75, - "learning_rate": 1.2659172633642233e-05, - "loss": 2.3094, - "step": 428250 - }, - { - "epoch": 0.75, - "learning_rate": 1.2658300693715405e-05, - "loss": 2.2371, - "step": 428260 - }, - { - "epoch": 0.75, - "learning_rate": 1.265742875378858e-05, - "loss": 2.149, - "step": 428270 - }, - { - "epoch": 0.75, - "learning_rate": 1.2656556813861753e-05, - "loss": 2.3117, - "step": 428280 - }, - { - "epoch": 0.75, - "learning_rate": 1.2655684873934925e-05, - "loss": 2.3452, - "step": 428290 - }, - { - "epoch": 0.75, - "learning_rate": 1.2654812934008099e-05, - "loss": 2.4521, - "step": 428300 - }, - { - "epoch": 0.75, - "learning_rate": 1.2653940994081272e-05, - "loss": 2.3157, - "step": 428310 - }, - { - "epoch": 0.75, - "learning_rate": 1.2653069054154446e-05, - "loss": 2.3468, - "step": 428320 - }, - { - "epoch": 0.75, - "learning_rate": 1.2652197114227618e-05, - "loss": 2.2541, - "step": 428330 - }, - { - "epoch": 0.75, - "learning_rate": 1.2651325174300794e-05, - "loss": 2.3085, - "step": 428340 - }, - { - "epoch": 0.75, - "learning_rate": 1.2650453234373966e-05, - "loss": 2.3485, - "step": 428350 - }, - { - "epoch": 0.75, - "learning_rate": 1.2649581294447138e-05, - "loss": 2.3203, - "step": 428360 - }, - { - "epoch": 0.75, - "learning_rate": 1.264870935452031e-05, - "loss": 2.2292, - "step": 428370 - }, - { - "epoch": 0.75, - "learning_rate": 1.2647837414593485e-05, - "loss": 2.3703, - "step": 428380 - }, - { - "epoch": 0.75, - "learning_rate": 1.2646965474666659e-05, - "loss": 2.3596, - "step": 428390 - }, - { - "epoch": 0.75, - "learning_rate": 1.2646093534739831e-05, - "loss": 2.2557, - "step": 428400 - }, - { - "epoch": 0.75, - "learning_rate": 1.2645221594813003e-05, - "loss": 2.2273, - "step": 428410 - }, - { - "epoch": 0.75, - "learning_rate": 1.2644349654886179e-05, - "loss": 2.2813, - "step": 428420 - }, - { - "epoch": 0.75, - "learning_rate": 1.264347771495935e-05, - "loss": 2.3938, - "step": 428430 - }, - { - "epoch": 0.75, - "learning_rate": 1.2642605775032523e-05, - "loss": 2.2174, - "step": 428440 - }, - { - "epoch": 0.75, - "learning_rate": 1.2641733835105698e-05, - "loss": 2.3638, - "step": 428450 - }, - { - "epoch": 0.75, - "learning_rate": 1.264086189517887e-05, - "loss": 2.2816, - "step": 428460 - }, - { - "epoch": 0.75, - "learning_rate": 1.2639989955252044e-05, - "loss": 2.2666, - "step": 428470 - }, - { - "epoch": 0.75, - "learning_rate": 1.2639118015325216e-05, - "loss": 2.424, - "step": 428480 - }, - { - "epoch": 0.75, - "learning_rate": 1.2638246075398392e-05, - "loss": 2.2251, - "step": 428490 - }, - { - "epoch": 0.75, - "learning_rate": 1.2637374135471564e-05, - "loss": 2.2485, - "step": 428500 - }, - { - "epoch": 0.75, - "learning_rate": 1.2636502195544736e-05, - "loss": 2.2797, - "step": 428510 - }, - { - "epoch": 0.75, - "learning_rate": 1.2635630255617908e-05, - "loss": 2.2738, - "step": 428520 - }, - { - "epoch": 0.75, - "learning_rate": 1.2634758315691083e-05, - "loss": 2.2671, - "step": 428530 - }, - { - "epoch": 0.75, - "learning_rate": 1.2633886375764255e-05, - "loss": 2.2411, - "step": 428540 - }, - { - "epoch": 0.75, - "learning_rate": 1.263301443583743e-05, - "loss": 2.3489, - "step": 428550 - }, - { - "epoch": 0.75, - "learning_rate": 1.2632142495910601e-05, - "loss": 2.3603, - "step": 428560 - }, - { - "epoch": 0.75, - "learning_rate": 1.2631270555983777e-05, - "loss": 2.2538, - "step": 428570 - }, - { - "epoch": 0.75, - "learning_rate": 1.2630398616056949e-05, - "loss": 2.2398, - "step": 428580 - }, - { - "epoch": 0.75, - "learning_rate": 1.2629526676130121e-05, - "loss": 2.3871, - "step": 428590 - }, - { - "epoch": 0.75, - "learning_rate": 1.2628654736203296e-05, - "loss": 2.3093, - "step": 428600 - }, - { - "epoch": 0.75, - "learning_rate": 1.2627782796276468e-05, - "loss": 2.3077, - "step": 428610 - }, - { - "epoch": 0.75, - "learning_rate": 1.262691085634964e-05, - "loss": 2.3587, - "step": 428620 - }, - { - "epoch": 0.75, - "learning_rate": 1.2626038916422814e-05, - "loss": 2.2906, - "step": 428630 - }, - { - "epoch": 0.75, - "learning_rate": 1.262516697649599e-05, - "loss": 2.2076, - "step": 428640 - }, - { - "epoch": 0.75, - "learning_rate": 1.2624295036569162e-05, - "loss": 2.1888, - "step": 428650 - }, - { - "epoch": 0.75, - "learning_rate": 1.2623423096642334e-05, - "loss": 2.299, - "step": 428660 - }, - { - "epoch": 0.75, - "learning_rate": 1.2622551156715506e-05, - "loss": 2.3576, - "step": 428670 - }, - { - "epoch": 0.75, - "learning_rate": 1.2621679216788681e-05, - "loss": 2.1995, - "step": 428680 - }, - { - "epoch": 0.75, - "learning_rate": 1.2620807276861854e-05, - "loss": 2.3016, - "step": 428690 - }, - { - "epoch": 0.75, - "learning_rate": 1.2619935336935027e-05, - "loss": 2.1625, - "step": 428700 - }, - { - "epoch": 0.75, - "learning_rate": 1.26190633970082e-05, - "loss": 2.3626, - "step": 428710 - }, - { - "epoch": 0.75, - "learning_rate": 1.2618191457081375e-05, - "loss": 2.3414, - "step": 428720 - }, - { - "epoch": 0.75, - "learning_rate": 1.2617319517154547e-05, - "loss": 2.3943, - "step": 428730 - }, - { - "epoch": 0.75, - "learning_rate": 1.2616447577227719e-05, - "loss": 2.2171, - "step": 428740 - }, - { - "epoch": 0.75, - "learning_rate": 1.2615575637300894e-05, - "loss": 2.2017, - "step": 428750 - }, - { - "epoch": 0.75, - "learning_rate": 1.2614703697374067e-05, - "loss": 2.2874, - "step": 428760 - }, - { - "epoch": 0.75, - "learning_rate": 1.2613831757447239e-05, - "loss": 2.3699, - "step": 428770 - }, - { - "epoch": 0.75, - "learning_rate": 1.2612959817520412e-05, - "loss": 2.3567, - "step": 428780 - }, - { - "epoch": 0.75, - "learning_rate": 1.2612087877593586e-05, - "loss": 2.3365, - "step": 428790 - }, - { - "epoch": 0.75, - "learning_rate": 1.261121593766676e-05, - "loss": 2.2256, - "step": 428800 - }, - { - "epoch": 0.75, - "learning_rate": 1.2610343997739932e-05, - "loss": 2.263, - "step": 428810 - }, - { - "epoch": 0.75, - "learning_rate": 1.2609472057813104e-05, - "loss": 2.1801, - "step": 428820 - }, - { - "epoch": 0.75, - "learning_rate": 1.260860011788628e-05, - "loss": 2.3598, - "step": 428830 - }, - { - "epoch": 0.75, - "learning_rate": 1.2607728177959452e-05, - "loss": 2.18, - "step": 428840 - }, - { - "epoch": 0.75, - "learning_rate": 1.2606856238032624e-05, - "loss": 2.2425, - "step": 428850 - }, - { - "epoch": 0.75, - "learning_rate": 1.26059842981058e-05, - "loss": 2.2818, - "step": 428860 - }, - { - "epoch": 0.75, - "learning_rate": 1.2605112358178971e-05, - "loss": 2.2217, - "step": 428870 - }, - { - "epoch": 0.75, - "learning_rate": 1.2604240418252145e-05, - "loss": 2.3881, - "step": 428880 - }, - { - "epoch": 0.75, - "learning_rate": 1.2603368478325317e-05, - "loss": 2.3546, - "step": 428890 - }, - { - "epoch": 0.75, - "learning_rate": 1.2602496538398493e-05, - "loss": 2.38, - "step": 428900 - }, - { - "epoch": 0.75, - "learning_rate": 1.2601624598471665e-05, - "loss": 2.2649, - "step": 428910 - }, - { - "epoch": 0.75, - "learning_rate": 1.2600752658544837e-05, - "loss": 2.2933, - "step": 428920 - }, - { - "epoch": 0.75, - "learning_rate": 1.2599880718618009e-05, - "loss": 2.2862, - "step": 428930 - }, - { - "epoch": 0.75, - "learning_rate": 1.2599008778691184e-05, - "loss": 2.207, - "step": 428940 - }, - { - "epoch": 0.75, - "learning_rate": 1.2598136838764358e-05, - "loss": 2.1495, - "step": 428950 - }, - { - "epoch": 0.75, - "learning_rate": 1.259726489883753e-05, - "loss": 2.2837, - "step": 428960 - }, - { - "epoch": 0.75, - "learning_rate": 1.2596392958910702e-05, - "loss": 2.1271, - "step": 428970 - }, - { - "epoch": 0.75, - "learning_rate": 1.2595521018983878e-05, - "loss": 2.3183, - "step": 428980 - }, - { - "epoch": 0.75, - "learning_rate": 1.259464907905705e-05, - "loss": 2.2, - "step": 428990 - }, - { - "epoch": 0.75, - "learning_rate": 1.2593777139130222e-05, - "loss": 2.2845, - "step": 429000 - }, - { - "epoch": 0.75, - "learning_rate": 1.2592905199203397e-05, - "loss": 2.255, - "step": 429010 - }, - { - "epoch": 0.75, - "learning_rate": 1.259203325927657e-05, - "loss": 2.2112, - "step": 429020 - }, - { - "epoch": 0.75, - "learning_rate": 1.2591161319349743e-05, - "loss": 2.3706, - "step": 429030 - }, - { - "epoch": 0.75, - "learning_rate": 1.2590289379422915e-05, - "loss": 2.3109, - "step": 429040 - }, - { - "epoch": 0.75, - "learning_rate": 1.258941743949609e-05, - "loss": 2.3016, - "step": 429050 - }, - { - "epoch": 0.75, - "learning_rate": 1.2588545499569263e-05, - "loss": 2.2403, - "step": 429060 - }, - { - "epoch": 0.75, - "learning_rate": 1.2587673559642435e-05, - "loss": 2.3567, - "step": 429070 - }, - { - "epoch": 0.75, - "learning_rate": 1.2586801619715607e-05, - "loss": 2.2794, - "step": 429080 - }, - { - "epoch": 0.75, - "learning_rate": 1.2585929679788782e-05, - "loss": 2.2749, - "step": 429090 - }, - { - "epoch": 0.75, - "learning_rate": 1.2585057739861954e-05, - "loss": 2.3986, - "step": 429100 - }, - { - "epoch": 0.75, - "learning_rate": 1.2584185799935128e-05, - "loss": 2.3954, - "step": 429110 - }, - { - "epoch": 0.75, - "learning_rate": 1.2583313860008304e-05, - "loss": 2.3538, - "step": 429120 - }, - { - "epoch": 0.75, - "learning_rate": 1.2582441920081476e-05, - "loss": 2.2754, - "step": 429130 - }, - { - "epoch": 0.75, - "learning_rate": 1.2581569980154648e-05, - "loss": 2.2697, - "step": 429140 - }, - { - "epoch": 0.75, - "learning_rate": 1.258069804022782e-05, - "loss": 2.3046, - "step": 429150 - }, - { - "epoch": 0.75, - "learning_rate": 1.2579826100300995e-05, - "loss": 2.2519, - "step": 429160 - }, - { - "epoch": 0.75, - "learning_rate": 1.2578954160374167e-05, - "loss": 2.2765, - "step": 429170 - }, - { - "epoch": 0.75, - "learning_rate": 1.257808222044734e-05, - "loss": 2.2253, - "step": 429180 - }, - { - "epoch": 0.75, - "learning_rate": 1.2577210280520513e-05, - "loss": 2.3191, - "step": 429190 - }, - { - "epoch": 0.75, - "learning_rate": 1.2576338340593689e-05, - "loss": 2.1579, - "step": 429200 - }, - { - "epoch": 0.75, - "learning_rate": 1.257546640066686e-05, - "loss": 2.2884, - "step": 429210 - }, - { - "epoch": 0.75, - "learning_rate": 1.2574594460740033e-05, - "loss": 2.3666, - "step": 429220 - }, - { - "epoch": 0.75, - "learning_rate": 1.2573722520813205e-05, - "loss": 2.3003, - "step": 429230 - }, - { - "epoch": 0.75, - "learning_rate": 1.257285058088638e-05, - "loss": 2.3723, - "step": 429240 - }, - { - "epoch": 0.75, - "learning_rate": 1.2571978640959552e-05, - "loss": 2.3006, - "step": 429250 - }, - { - "epoch": 0.75, - "learning_rate": 1.2571106701032726e-05, - "loss": 2.3629, - "step": 429260 - }, - { - "epoch": 0.75, - "learning_rate": 1.25702347611059e-05, - "loss": 2.2096, - "step": 429270 - }, - { - "epoch": 0.75, - "learning_rate": 1.2569362821179074e-05, - "loss": 2.3598, - "step": 429280 - }, - { - "epoch": 0.75, - "learning_rate": 1.2568490881252246e-05, - "loss": 2.3131, - "step": 429290 - }, - { - "epoch": 0.75, - "learning_rate": 1.2567618941325418e-05, - "loss": 2.2707, - "step": 429300 - }, - { - "epoch": 0.75, - "learning_rate": 1.2566747001398593e-05, - "loss": 2.2118, - "step": 429310 - }, - { - "epoch": 0.75, - "learning_rate": 1.2565875061471765e-05, - "loss": 2.2013, - "step": 429320 - }, - { - "epoch": 0.75, - "learning_rate": 1.2565003121544938e-05, - "loss": 2.3399, - "step": 429330 - }, - { - "epoch": 0.75, - "learning_rate": 1.2564131181618111e-05, - "loss": 2.3324, - "step": 429340 - }, - { - "epoch": 0.75, - "learning_rate": 1.2563259241691285e-05, - "loss": 2.3219, - "step": 429350 - }, - { - "epoch": 0.75, - "learning_rate": 1.2562387301764459e-05, - "loss": 2.338, - "step": 429360 - }, - { - "epoch": 0.75, - "learning_rate": 1.2561515361837631e-05, - "loss": 2.2719, - "step": 429370 - }, - { - "epoch": 0.75, - "learning_rate": 1.2560643421910806e-05, - "loss": 2.3537, - "step": 429380 - }, - { - "epoch": 0.75, - "learning_rate": 1.2559771481983978e-05, - "loss": 2.344, - "step": 429390 - }, - { - "epoch": 0.75, - "learning_rate": 1.255889954205715e-05, - "loss": 2.3254, - "step": 429400 - }, - { - "epoch": 0.75, - "learning_rate": 1.2558027602130323e-05, - "loss": 2.2969, - "step": 429410 - }, - { - "epoch": 0.75, - "learning_rate": 1.2557155662203498e-05, - "loss": 2.3201, - "step": 429420 - }, - { - "epoch": 0.75, - "learning_rate": 1.2556283722276672e-05, - "loss": 2.2946, - "step": 429430 - }, - { - "epoch": 0.75, - "learning_rate": 1.2555411782349844e-05, - "loss": 2.311, - "step": 429440 - }, - { - "epoch": 0.75, - "learning_rate": 1.2554539842423016e-05, - "loss": 2.3764, - "step": 429450 - }, - { - "epoch": 0.75, - "learning_rate": 1.2553667902496191e-05, - "loss": 2.2321, - "step": 429460 - }, - { - "epoch": 0.75, - "learning_rate": 1.2552795962569364e-05, - "loss": 2.2953, - "step": 429470 - }, - { - "epoch": 0.75, - "learning_rate": 1.2551924022642536e-05, - "loss": 2.2417, - "step": 429480 - }, - { - "epoch": 0.75, - "learning_rate": 1.2551052082715708e-05, - "loss": 2.2974, - "step": 429490 - }, - { - "epoch": 0.75, - "learning_rate": 1.2550180142788883e-05, - "loss": 2.3408, - "step": 429500 - }, - { - "epoch": 0.75, - "learning_rate": 1.2549308202862057e-05, - "loss": 2.221, - "step": 429510 - }, - { - "epoch": 0.75, - "learning_rate": 1.2548436262935229e-05, - "loss": 2.3572, - "step": 429520 - }, - { - "epoch": 0.75, - "learning_rate": 1.2547564323008404e-05, - "loss": 2.4, - "step": 429530 - }, - { - "epoch": 0.75, - "learning_rate": 1.2546692383081577e-05, - "loss": 2.1124, - "step": 429540 - }, - { - "epoch": 0.75, - "learning_rate": 1.2545820443154749e-05, - "loss": 2.321, - "step": 429550 - }, - { - "epoch": 0.75, - "learning_rate": 1.254494850322792e-05, - "loss": 2.3177, - "step": 429560 - }, - { - "epoch": 0.75, - "learning_rate": 1.2544076563301096e-05, - "loss": 2.4005, - "step": 429570 - }, - { - "epoch": 0.75, - "learning_rate": 1.2543204623374268e-05, - "loss": 2.32, - "step": 429580 - }, - { - "epoch": 0.75, - "learning_rate": 1.2542332683447442e-05, - "loss": 2.2283, - "step": 429590 - }, - { - "epoch": 0.75, - "learning_rate": 1.2541460743520614e-05, - "loss": 2.4201, - "step": 429600 - }, - { - "epoch": 0.75, - "learning_rate": 1.254058880359379e-05, - "loss": 2.3056, - "step": 429610 - }, - { - "epoch": 0.75, - "learning_rate": 1.2539716863666962e-05, - "loss": 2.2576, - "step": 429620 - }, - { - "epoch": 0.75, - "learning_rate": 1.2538844923740134e-05, - "loss": 2.4192, - "step": 429630 - }, - { - "epoch": 0.75, - "learning_rate": 1.2537972983813306e-05, - "loss": 2.3112, - "step": 429640 - }, - { - "epoch": 0.75, - "learning_rate": 1.2537101043886481e-05, - "loss": 2.2509, - "step": 429650 - }, - { - "epoch": 0.75, - "learning_rate": 1.2536229103959653e-05, - "loss": 2.2446, - "step": 429660 - }, - { - "epoch": 0.75, - "learning_rate": 1.2535357164032827e-05, - "loss": 2.2774, - "step": 429670 - }, - { - "epoch": 0.75, - "learning_rate": 1.2534485224106003e-05, - "loss": 2.2675, - "step": 429680 - }, - { - "epoch": 0.75, - "learning_rate": 1.2533613284179175e-05, - "loss": 2.2531, - "step": 429690 - }, - { - "epoch": 0.75, - "learning_rate": 1.2532741344252347e-05, - "loss": 2.3141, - "step": 429700 - }, - { - "epoch": 0.75, - "learning_rate": 1.2531869404325519e-05, - "loss": 2.3724, - "step": 429710 - }, - { - "epoch": 0.75, - "learning_rate": 1.2530997464398694e-05, - "loss": 2.4073, - "step": 429720 - }, - { - "epoch": 0.75, - "learning_rate": 1.2530125524471866e-05, - "loss": 2.2659, - "step": 429730 - }, - { - "epoch": 0.75, - "learning_rate": 1.252925358454504e-05, - "loss": 2.335, - "step": 429740 - }, - { - "epoch": 0.75, - "learning_rate": 1.2528381644618212e-05, - "loss": 2.3803, - "step": 429750 - }, - { - "epoch": 0.75, - "learning_rate": 1.2527509704691388e-05, - "loss": 2.3049, - "step": 429760 - }, - { - "epoch": 0.75, - "learning_rate": 1.252663776476456e-05, - "loss": 2.44, - "step": 429770 - }, - { - "epoch": 0.75, - "learning_rate": 1.2525765824837732e-05, - "loss": 2.3378, - "step": 429780 - }, - { - "epoch": 0.75, - "learning_rate": 1.2524893884910907e-05, - "loss": 2.3233, - "step": 429790 - }, - { - "epoch": 0.75, - "learning_rate": 1.252402194498408e-05, - "loss": 2.2883, - "step": 429800 - }, - { - "epoch": 0.75, - "learning_rate": 1.2523150005057251e-05, - "loss": 2.2993, - "step": 429810 - }, - { - "epoch": 0.75, - "learning_rate": 1.2522278065130425e-05, - "loss": 2.286, - "step": 429820 - }, - { - "epoch": 0.75, - "learning_rate": 1.2521406125203599e-05, - "loss": 2.3248, - "step": 429830 - }, - { - "epoch": 0.75, - "learning_rate": 1.2520534185276773e-05, - "loss": 2.3474, - "step": 429840 - }, - { - "epoch": 0.75, - "learning_rate": 1.2519662245349945e-05, - "loss": 2.353, - "step": 429850 - }, - { - "epoch": 0.75, - "learning_rate": 1.2518790305423117e-05, - "loss": 2.2929, - "step": 429860 - }, - { - "epoch": 0.75, - "learning_rate": 1.2517918365496292e-05, - "loss": 2.2918, - "step": 429870 - }, - { - "epoch": 0.75, - "learning_rate": 1.2517046425569464e-05, - "loss": 2.1749, - "step": 429880 - }, - { - "epoch": 0.75, - "learning_rate": 1.2516174485642636e-05, - "loss": 2.3313, - "step": 429890 - }, - { - "epoch": 0.75, - "learning_rate": 1.251530254571581e-05, - "loss": 2.3798, - "step": 429900 - }, - { - "epoch": 0.75, - "learning_rate": 1.2514430605788984e-05, - "loss": 2.3129, - "step": 429910 - }, - { - "epoch": 0.75, - "learning_rate": 1.2513558665862158e-05, - "loss": 2.3621, - "step": 429920 - }, - { - "epoch": 0.75, - "learning_rate": 1.251268672593533e-05, - "loss": 2.3206, - "step": 429930 - }, - { - "epoch": 0.75, - "learning_rate": 1.2511814786008505e-05, - "loss": 2.3201, - "step": 429940 - }, - { - "epoch": 0.75, - "learning_rate": 1.2510942846081677e-05, - "loss": 2.2501, - "step": 429950 - }, - { - "epoch": 0.75, - "learning_rate": 1.251007090615485e-05, - "loss": 2.3295, - "step": 429960 - }, - { - "epoch": 0.75, - "learning_rate": 1.2509198966228022e-05, - "loss": 2.2833, - "step": 429970 - }, - { - "epoch": 0.75, - "learning_rate": 1.2508327026301197e-05, - "loss": 2.307, - "step": 429980 - }, - { - "epoch": 0.75, - "learning_rate": 1.250745508637437e-05, - "loss": 2.1906, - "step": 429990 - }, - { - "epoch": 0.75, - "learning_rate": 1.2506583146447543e-05, - "loss": 2.3406, - "step": 430000 - }, - { - "epoch": 0.75, - "learning_rate": 1.2505711206520715e-05, - "loss": 2.2772, - "step": 430010 - }, - { - "epoch": 0.75, - "learning_rate": 1.250483926659389e-05, - "loss": 2.2328, - "step": 430020 - }, - { - "epoch": 0.75, - "learning_rate": 1.2503967326667062e-05, - "loss": 2.3465, - "step": 430030 - }, - { - "epoch": 0.75, - "learning_rate": 1.2503095386740235e-05, - "loss": 2.204, - "step": 430040 - }, - { - "epoch": 0.75, - "learning_rate": 1.250222344681341e-05, - "loss": 2.2941, - "step": 430050 - }, - { - "epoch": 0.75, - "learning_rate": 1.2501351506886582e-05, - "loss": 2.291, - "step": 430060 - }, - { - "epoch": 0.75, - "learning_rate": 1.2500479566959756e-05, - "loss": 2.302, - "step": 430070 - }, - { - "epoch": 0.75, - "learning_rate": 1.249960762703293e-05, - "loss": 2.3651, - "step": 430080 - }, - { - "epoch": 0.75, - "learning_rate": 1.2498735687106102e-05, - "loss": 2.2469, - "step": 430090 - }, - { - "epoch": 0.75, - "learning_rate": 1.2497863747179275e-05, - "loss": 2.2324, - "step": 430100 - }, - { - "epoch": 0.75, - "learning_rate": 1.2496991807252448e-05, - "loss": 2.3362, - "step": 430110 - }, - { - "epoch": 0.75, - "learning_rate": 1.2496119867325621e-05, - "loss": 2.1829, - "step": 430120 - }, - { - "epoch": 0.75, - "learning_rate": 1.2495247927398793e-05, - "loss": 2.338, - "step": 430130 - }, - { - "epoch": 0.75, - "learning_rate": 1.2494375987471967e-05, - "loss": 2.1362, - "step": 430140 - }, - { - "epoch": 0.75, - "learning_rate": 1.2493504047545141e-05, - "loss": 2.1693, - "step": 430150 - }, - { - "epoch": 0.75, - "learning_rate": 1.2492632107618315e-05, - "loss": 2.3345, - "step": 430160 - }, - { - "epoch": 0.75, - "learning_rate": 1.2491760167691487e-05, - "loss": 2.31, - "step": 430170 - }, - { - "epoch": 0.75, - "learning_rate": 1.249088822776466e-05, - "loss": 2.1956, - "step": 430180 - }, - { - "epoch": 0.75, - "learning_rate": 1.2490016287837834e-05, - "loss": 2.2792, - "step": 430190 - }, - { - "epoch": 0.75, - "learning_rate": 1.2489144347911006e-05, - "loss": 2.277, - "step": 430200 - }, - { - "epoch": 0.75, - "learning_rate": 1.248827240798418e-05, - "loss": 2.2261, - "step": 430210 - }, - { - "epoch": 0.75, - "learning_rate": 1.2487400468057352e-05, - "loss": 2.3165, - "step": 430220 - }, - { - "epoch": 0.75, - "learning_rate": 1.2486528528130528e-05, - "loss": 2.2603, - "step": 430230 - }, - { - "epoch": 0.75, - "learning_rate": 1.24856565882037e-05, - "loss": 2.2627, - "step": 430240 - }, - { - "epoch": 0.75, - "learning_rate": 1.2484784648276874e-05, - "loss": 2.2724, - "step": 430250 - }, - { - "epoch": 0.75, - "learning_rate": 1.2483912708350046e-05, - "loss": 2.326, - "step": 430260 - }, - { - "epoch": 0.75, - "learning_rate": 1.248304076842322e-05, - "loss": 2.3078, - "step": 430270 - }, - { - "epoch": 0.75, - "learning_rate": 1.2482168828496391e-05, - "loss": 2.2616, - "step": 430280 - }, - { - "epoch": 0.75, - "learning_rate": 1.2481296888569565e-05, - "loss": 2.3336, - "step": 430290 - }, - { - "epoch": 0.75, - "learning_rate": 1.2480424948642739e-05, - "loss": 2.2896, - "step": 430300 - }, - { - "epoch": 0.75, - "learning_rate": 1.2479553008715913e-05, - "loss": 2.2755, - "step": 430310 - }, - { - "epoch": 0.75, - "learning_rate": 1.2478681068789087e-05, - "loss": 2.3078, - "step": 430320 - }, - { - "epoch": 0.75, - "learning_rate": 1.2477809128862259e-05, - "loss": 2.4001, - "step": 430330 - }, - { - "epoch": 0.75, - "learning_rate": 1.2476937188935432e-05, - "loss": 2.3428, - "step": 430340 - }, - { - "epoch": 0.75, - "learning_rate": 1.2476065249008604e-05, - "loss": 2.4513, - "step": 430350 - }, - { - "epoch": 0.75, - "learning_rate": 1.2475193309081778e-05, - "loss": 2.2398, - "step": 430360 - }, - { - "epoch": 0.75, - "learning_rate": 1.247432136915495e-05, - "loss": 2.3023, - "step": 430370 - }, - { - "epoch": 0.75, - "learning_rate": 1.2473449429228124e-05, - "loss": 2.2842, - "step": 430380 - }, - { - "epoch": 0.75, - "learning_rate": 1.2472577489301298e-05, - "loss": 2.3243, - "step": 430390 - }, - { - "epoch": 0.75, - "learning_rate": 1.2471705549374472e-05, - "loss": 2.1835, - "step": 430400 - }, - { - "epoch": 0.75, - "learning_rate": 1.2470833609447644e-05, - "loss": 2.2384, - "step": 430410 - }, - { - "epoch": 0.75, - "learning_rate": 1.2469961669520817e-05, - "loss": 2.2934, - "step": 430420 - }, - { - "epoch": 0.75, - "learning_rate": 1.246908972959399e-05, - "loss": 2.2791, - "step": 430430 - }, - { - "epoch": 0.75, - "learning_rate": 1.2468217789667163e-05, - "loss": 2.3289, - "step": 430440 - }, - { - "epoch": 0.75, - "learning_rate": 1.2467345849740337e-05, - "loss": 2.2266, - "step": 430450 - }, - { - "epoch": 0.75, - "learning_rate": 1.246647390981351e-05, - "loss": 2.283, - "step": 430460 - }, - { - "epoch": 0.75, - "learning_rate": 1.2465601969886685e-05, - "loss": 2.2633, - "step": 430470 - }, - { - "epoch": 0.75, - "learning_rate": 1.2464730029959857e-05, - "loss": 2.2677, - "step": 430480 - }, - { - "epoch": 0.75, - "learning_rate": 1.246385809003303e-05, - "loss": 2.35, - "step": 430490 - }, - { - "epoch": 0.75, - "learning_rate": 1.2462986150106203e-05, - "loss": 2.2852, - "step": 430500 - }, - { - "epoch": 0.75, - "learning_rate": 1.2462114210179376e-05, - "loss": 2.2767, - "step": 430510 - }, - { - "epoch": 0.75, - "learning_rate": 1.2461242270252548e-05, - "loss": 2.1912, - "step": 430520 - }, - { - "epoch": 0.75, - "learning_rate": 1.2460370330325722e-05, - "loss": 2.23, - "step": 430530 - }, - { - "epoch": 0.75, - "learning_rate": 1.2459498390398896e-05, - "loss": 2.3149, - "step": 430540 - }, - { - "epoch": 0.75, - "learning_rate": 1.245862645047207e-05, - "loss": 2.3125, - "step": 430550 - }, - { - "epoch": 0.75, - "learning_rate": 1.2457754510545242e-05, - "loss": 2.2934, - "step": 430560 - }, - { - "epoch": 0.75, - "learning_rate": 1.2456882570618416e-05, - "loss": 2.3053, - "step": 430570 - }, - { - "epoch": 0.75, - "learning_rate": 1.245601063069159e-05, - "loss": 2.3255, - "step": 430580 - }, - { - "epoch": 0.75, - "learning_rate": 1.2455138690764761e-05, - "loss": 2.2165, - "step": 430590 - }, - { - "epoch": 0.75, - "learning_rate": 1.2454266750837935e-05, - "loss": 2.3666, - "step": 430600 - }, - { - "epoch": 0.75, - "learning_rate": 1.2453394810911107e-05, - "loss": 2.2977, - "step": 430610 - }, - { - "epoch": 0.75, - "learning_rate": 1.2452522870984281e-05, - "loss": 2.2188, - "step": 430620 - }, - { - "epoch": 0.75, - "learning_rate": 1.2451650931057455e-05, - "loss": 2.2685, - "step": 430630 - }, - { - "epoch": 0.75, - "learning_rate": 1.2450778991130629e-05, - "loss": 2.2936, - "step": 430640 - }, - { - "epoch": 0.75, - "learning_rate": 1.24499070512038e-05, - "loss": 2.3253, - "step": 430650 - }, - { - "epoch": 0.75, - "learning_rate": 1.2449035111276974e-05, - "loss": 2.2544, - "step": 430660 - }, - { - "epoch": 0.75, - "learning_rate": 1.2448163171350146e-05, - "loss": 2.213, - "step": 430670 - }, - { - "epoch": 0.75, - "learning_rate": 1.244729123142332e-05, - "loss": 2.2439, - "step": 430680 - }, - { - "epoch": 0.75, - "learning_rate": 1.2446419291496492e-05, - "loss": 2.2306, - "step": 430690 - }, - { - "epoch": 0.75, - "learning_rate": 1.2445547351569666e-05, - "loss": 2.3207, - "step": 430700 - }, - { - "epoch": 0.75, - "learning_rate": 1.2444675411642842e-05, - "loss": 2.1876, - "step": 430710 - }, - { - "epoch": 0.75, - "learning_rate": 1.2443803471716014e-05, - "loss": 2.3452, - "step": 430720 - }, - { - "epoch": 0.75, - "learning_rate": 1.2442931531789187e-05, - "loss": 2.2607, - "step": 430730 - }, - { - "epoch": 0.75, - "learning_rate": 1.244205959186236e-05, - "loss": 2.3531, - "step": 430740 - }, - { - "epoch": 0.75, - "learning_rate": 1.2441187651935533e-05, - "loss": 2.253, - "step": 430750 - }, - { - "epoch": 0.75, - "learning_rate": 1.2440315712008705e-05, - "loss": 2.2587, - "step": 430760 - }, - { - "epoch": 0.75, - "learning_rate": 1.2439443772081879e-05, - "loss": 2.3564, - "step": 430770 - }, - { - "epoch": 0.75, - "learning_rate": 1.2438571832155053e-05, - "loss": 2.26, - "step": 430780 - }, - { - "epoch": 0.75, - "learning_rate": 1.2437699892228227e-05, - "loss": 2.3151, - "step": 430790 - }, - { - "epoch": 0.75, - "learning_rate": 1.2436827952301399e-05, - "loss": 2.3336, - "step": 430800 - }, - { - "epoch": 0.75, - "learning_rate": 1.2435956012374572e-05, - "loss": 2.4097, - "step": 430810 - }, - { - "epoch": 0.75, - "learning_rate": 1.2435084072447745e-05, - "loss": 2.3263, - "step": 430820 - }, - { - "epoch": 0.75, - "learning_rate": 1.2434212132520918e-05, - "loss": 2.2847, - "step": 430830 - }, - { - "epoch": 0.75, - "learning_rate": 1.243334019259409e-05, - "loss": 2.2821, - "step": 430840 - }, - { - "epoch": 0.75, - "learning_rate": 1.2432468252667264e-05, - "loss": 2.2294, - "step": 430850 - }, - { - "epoch": 0.75, - "learning_rate": 1.2431596312740438e-05, - "loss": 2.2835, - "step": 430860 - }, - { - "epoch": 0.75, - "learning_rate": 1.2430724372813612e-05, - "loss": 2.3482, - "step": 430870 - }, - { - "epoch": 0.75, - "learning_rate": 1.2429852432886785e-05, - "loss": 2.2268, - "step": 430880 - }, - { - "epoch": 0.75, - "learning_rate": 1.2428980492959958e-05, - "loss": 2.3767, - "step": 430890 - }, - { - "epoch": 0.75, - "learning_rate": 1.2428108553033131e-05, - "loss": 2.3723, - "step": 430900 - }, - { - "epoch": 0.75, - "learning_rate": 1.2427236613106303e-05, - "loss": 2.2646, - "step": 430910 - }, - { - "epoch": 0.75, - "learning_rate": 1.2426364673179477e-05, - "loss": 2.1816, - "step": 430920 - }, - { - "epoch": 0.75, - "learning_rate": 1.242549273325265e-05, - "loss": 2.2341, - "step": 430930 - }, - { - "epoch": 0.75, - "learning_rate": 1.2424620793325823e-05, - "loss": 2.4105, - "step": 430940 - }, - { - "epoch": 0.75, - "learning_rate": 1.2423748853398997e-05, - "loss": 2.3706, - "step": 430950 - }, - { - "epoch": 0.75, - "learning_rate": 1.242287691347217e-05, - "loss": 2.2288, - "step": 430960 - }, - { - "epoch": 0.75, - "learning_rate": 1.2422004973545343e-05, - "loss": 2.1493, - "step": 430970 - }, - { - "epoch": 0.75, - "learning_rate": 1.2421133033618516e-05, - "loss": 2.3942, - "step": 430980 - }, - { - "epoch": 0.75, - "learning_rate": 1.242026109369169e-05, - "loss": 2.3133, - "step": 430990 - }, - { - "epoch": 0.75, - "learning_rate": 1.2419389153764862e-05, - "loss": 2.3313, - "step": 431000 - }, - { - "epoch": 0.75, - "learning_rate": 1.2418517213838036e-05, - "loss": 2.2344, - "step": 431010 - }, - { - "epoch": 0.75, - "learning_rate": 1.241764527391121e-05, - "loss": 2.2585, - "step": 431020 - }, - { - "epoch": 0.75, - "learning_rate": 1.2416773333984384e-05, - "loss": 2.3969, - "step": 431030 - }, - { - "epoch": 0.75, - "learning_rate": 1.2415901394057556e-05, - "loss": 2.3141, - "step": 431040 - }, - { - "epoch": 0.75, - "learning_rate": 1.241502945413073e-05, - "loss": 2.1783, - "step": 431050 - }, - { - "epoch": 0.75, - "learning_rate": 1.2414157514203901e-05, - "loss": 2.337, - "step": 431060 - }, - { - "epoch": 0.75, - "learning_rate": 1.2413285574277075e-05, - "loss": 2.1364, - "step": 431070 - }, - { - "epoch": 0.75, - "learning_rate": 1.2412413634350247e-05, - "loss": 2.3021, - "step": 431080 - }, - { - "epoch": 0.75, - "learning_rate": 1.2411541694423421e-05, - "loss": 2.3385, - "step": 431090 - }, - { - "epoch": 0.75, - "learning_rate": 1.2410669754496595e-05, - "loss": 2.218, - "step": 431100 - }, - { - "epoch": 0.75, - "learning_rate": 1.2409797814569769e-05, - "loss": 2.1744, - "step": 431110 - }, - { - "epoch": 0.75, - "learning_rate": 1.2408925874642942e-05, - "loss": 2.1865, - "step": 431120 - }, - { - "epoch": 0.75, - "learning_rate": 1.2408053934716114e-05, - "loss": 2.2268, - "step": 431130 - }, - { - "epoch": 0.75, - "learning_rate": 1.2407181994789288e-05, - "loss": 2.3231, - "step": 431140 - }, - { - "epoch": 0.75, - "learning_rate": 1.240631005486246e-05, - "loss": 2.3173, - "step": 431150 - }, - { - "epoch": 0.75, - "learning_rate": 1.2405438114935634e-05, - "loss": 2.3424, - "step": 431160 - }, - { - "epoch": 0.75, - "learning_rate": 1.2404566175008806e-05, - "loss": 2.3555, - "step": 431170 - }, - { - "epoch": 0.75, - "learning_rate": 1.240369423508198e-05, - "loss": 2.3902, - "step": 431180 - }, - { - "epoch": 0.75, - "learning_rate": 1.2402822295155154e-05, - "loss": 2.2431, - "step": 431190 - }, - { - "epoch": 0.75, - "learning_rate": 1.2401950355228327e-05, - "loss": 2.2839, - "step": 431200 - }, - { - "epoch": 0.75, - "learning_rate": 1.24010784153015e-05, - "loss": 2.4037, - "step": 431210 - }, - { - "epoch": 0.75, - "learning_rate": 1.2400206475374673e-05, - "loss": 2.2102, - "step": 431220 - }, - { - "epoch": 0.75, - "learning_rate": 1.2399334535447845e-05, - "loss": 2.2618, - "step": 431230 - }, - { - "epoch": 0.75, - "learning_rate": 1.239846259552102e-05, - "loss": 2.3489, - "step": 431240 - }, - { - "epoch": 0.75, - "learning_rate": 1.2397590655594193e-05, - "loss": 2.3412, - "step": 431250 - }, - { - "epoch": 0.75, - "learning_rate": 1.2396718715667365e-05, - "loss": 2.3083, - "step": 431260 - }, - { - "epoch": 0.75, - "learning_rate": 1.239584677574054e-05, - "loss": 2.325, - "step": 431270 - }, - { - "epoch": 0.75, - "learning_rate": 1.2394974835813713e-05, - "loss": 2.2436, - "step": 431280 - }, - { - "epoch": 0.75, - "learning_rate": 1.2394102895886886e-05, - "loss": 2.2675, - "step": 431290 - }, - { - "epoch": 0.75, - "learning_rate": 1.2393230955960058e-05, - "loss": 2.2711, - "step": 431300 - }, - { - "epoch": 0.75, - "learning_rate": 1.2392359016033232e-05, - "loss": 2.2689, - "step": 431310 - }, - { - "epoch": 0.75, - "learning_rate": 1.2391487076106404e-05, - "loss": 2.2739, - "step": 431320 - }, - { - "epoch": 0.75, - "learning_rate": 1.2390615136179578e-05, - "loss": 2.2429, - "step": 431330 - }, - { - "epoch": 0.75, - "learning_rate": 1.2389743196252752e-05, - "loss": 2.1971, - "step": 431340 - }, - { - "epoch": 0.75, - "learning_rate": 1.2388871256325926e-05, - "loss": 2.2773, - "step": 431350 - }, - { - "epoch": 0.75, - "learning_rate": 1.2387999316399098e-05, - "loss": 2.2624, - "step": 431360 - }, - { - "epoch": 0.75, - "learning_rate": 1.2387127376472271e-05, - "loss": 2.3473, - "step": 431370 - }, - { - "epoch": 0.75, - "learning_rate": 1.2386255436545445e-05, - "loss": 2.3948, - "step": 431380 - }, - { - "epoch": 0.75, - "learning_rate": 1.2385383496618617e-05, - "loss": 2.2383, - "step": 431390 - }, - { - "epoch": 0.75, - "learning_rate": 1.2384511556691791e-05, - "loss": 2.1901, - "step": 431400 - }, - { - "epoch": 0.75, - "learning_rate": 1.2383639616764963e-05, - "loss": 2.2535, - "step": 431410 - }, - { - "epoch": 0.75, - "learning_rate": 1.2382767676838137e-05, - "loss": 2.4933, - "step": 431420 - }, - { - "epoch": 0.75, - "learning_rate": 1.238189573691131e-05, - "loss": 2.2502, - "step": 431430 - }, - { - "epoch": 0.75, - "learning_rate": 1.2381023796984484e-05, - "loss": 2.2589, - "step": 431440 - }, - { - "epoch": 0.75, - "learning_rate": 1.2380151857057656e-05, - "loss": 2.2068, - "step": 431450 - }, - { - "epoch": 0.75, - "learning_rate": 1.237927991713083e-05, - "loss": 2.347, - "step": 431460 - }, - { - "epoch": 0.75, - "learning_rate": 1.2378407977204002e-05, - "loss": 2.2005, - "step": 431470 - }, - { - "epoch": 0.75, - "learning_rate": 1.2377536037277176e-05, - "loss": 2.3444, - "step": 431480 - }, - { - "epoch": 0.75, - "learning_rate": 1.2376664097350348e-05, - "loss": 2.4076, - "step": 431490 - }, - { - "epoch": 0.75, - "learning_rate": 1.2375792157423522e-05, - "loss": 2.2486, - "step": 431500 - }, - { - "epoch": 0.75, - "learning_rate": 1.2374920217496697e-05, - "loss": 2.3379, - "step": 431510 - }, - { - "epoch": 0.75, - "learning_rate": 1.237404827756987e-05, - "loss": 2.3295, - "step": 431520 - }, - { - "epoch": 0.75, - "learning_rate": 1.2373176337643043e-05, - "loss": 2.3363, - "step": 431530 - }, - { - "epoch": 0.75, - "learning_rate": 1.2372304397716215e-05, - "loss": 2.327, - "step": 431540 - }, - { - "epoch": 0.75, - "learning_rate": 1.2371432457789389e-05, - "loss": 2.2871, - "step": 431550 - }, - { - "epoch": 0.75, - "learning_rate": 1.2370560517862561e-05, - "loss": 2.3273, - "step": 431560 - }, - { - "epoch": 0.75, - "learning_rate": 1.2369688577935735e-05, - "loss": 2.3299, - "step": 431570 - }, - { - "epoch": 0.75, - "learning_rate": 1.2368816638008909e-05, - "loss": 2.2492, - "step": 431580 - }, - { - "epoch": 0.75, - "learning_rate": 1.2367944698082083e-05, - "loss": 2.2303, - "step": 431590 - }, - { - "epoch": 0.75, - "learning_rate": 1.2367072758155255e-05, - "loss": 2.1952, - "step": 431600 - }, - { - "epoch": 0.75, - "learning_rate": 1.2366200818228428e-05, - "loss": 2.2524, - "step": 431610 - }, - { - "epoch": 0.75, - "learning_rate": 1.23653288783016e-05, - "loss": 2.253, - "step": 431620 - }, - { - "epoch": 0.75, - "learning_rate": 1.2364456938374774e-05, - "loss": 2.1553, - "step": 431630 - }, - { - "epoch": 0.75, - "learning_rate": 1.2363584998447948e-05, - "loss": 2.2896, - "step": 431640 - }, - { - "epoch": 0.75, - "learning_rate": 1.236271305852112e-05, - "loss": 2.362, - "step": 431650 - }, - { - "epoch": 0.75, - "learning_rate": 1.2361841118594294e-05, - "loss": 2.2717, - "step": 431660 - }, - { - "epoch": 0.75, - "learning_rate": 1.2360969178667468e-05, - "loss": 2.2061, - "step": 431670 - }, - { - "epoch": 0.75, - "learning_rate": 1.2360097238740641e-05, - "loss": 2.2638, - "step": 431680 - }, - { - "epoch": 0.75, - "learning_rate": 1.2359225298813813e-05, - "loss": 2.3124, - "step": 431690 - }, - { - "epoch": 0.75, - "learning_rate": 1.2358353358886987e-05, - "loss": 2.2623, - "step": 431700 - }, - { - "epoch": 0.75, - "learning_rate": 1.235748141896016e-05, - "loss": 2.257, - "step": 431710 - }, - { - "epoch": 0.75, - "learning_rate": 1.2356609479033333e-05, - "loss": 2.2747, - "step": 431720 - }, - { - "epoch": 0.75, - "learning_rate": 1.2355737539106505e-05, - "loss": 2.3743, - "step": 431730 - }, - { - "epoch": 0.75, - "learning_rate": 1.2354865599179679e-05, - "loss": 2.2992, - "step": 431740 - }, - { - "epoch": 0.75, - "learning_rate": 1.2353993659252853e-05, - "loss": 2.3413, - "step": 431750 - }, - { - "epoch": 0.75, - "learning_rate": 1.2353121719326026e-05, - "loss": 2.2194, - "step": 431760 - }, - { - "epoch": 0.75, - "learning_rate": 1.2352249779399199e-05, - "loss": 2.445, - "step": 431770 - }, - { - "epoch": 0.75, - "learning_rate": 1.2351377839472372e-05, - "loss": 2.3065, - "step": 431780 - }, - { - "epoch": 0.75, - "learning_rate": 1.2350505899545546e-05, - "loss": 2.3713, - "step": 431790 - }, - { - "epoch": 0.75, - "learning_rate": 1.2349633959618718e-05, - "loss": 2.3308, - "step": 431800 - }, - { - "epoch": 0.75, - "learning_rate": 1.2348762019691892e-05, - "loss": 2.1941, - "step": 431810 - }, - { - "epoch": 0.75, - "learning_rate": 1.2347890079765066e-05, - "loss": 2.439, - "step": 431820 - }, - { - "epoch": 0.75, - "learning_rate": 1.234701813983824e-05, - "loss": 2.1827, - "step": 431830 - }, - { - "epoch": 0.75, - "learning_rate": 1.2346146199911412e-05, - "loss": 2.1707, - "step": 431840 - }, - { - "epoch": 0.75, - "learning_rate": 1.2345274259984585e-05, - "loss": 2.2451, - "step": 431850 - }, - { - "epoch": 0.75, - "learning_rate": 1.2344402320057757e-05, - "loss": 2.3095, - "step": 431860 - }, - { - "epoch": 0.75, - "learning_rate": 1.2343530380130931e-05, - "loss": 2.4196, - "step": 431870 - }, - { - "epoch": 0.75, - "learning_rate": 1.2342658440204103e-05, - "loss": 2.3124, - "step": 431880 - }, - { - "epoch": 0.75, - "learning_rate": 1.2341786500277277e-05, - "loss": 2.1628, - "step": 431890 - }, - { - "epoch": 0.75, - "learning_rate": 1.234091456035045e-05, - "loss": 2.2246, - "step": 431900 - }, - { - "epoch": 0.75, - "learning_rate": 1.2340042620423625e-05, - "loss": 2.3087, - "step": 431910 - }, - { - "epoch": 0.75, - "learning_rate": 1.2339170680496798e-05, - "loss": 2.2268, - "step": 431920 - }, - { - "epoch": 0.75, - "learning_rate": 1.233829874056997e-05, - "loss": 2.2193, - "step": 431930 - }, - { - "epoch": 0.75, - "learning_rate": 1.2337426800643144e-05, - "loss": 2.2155, - "step": 431940 - }, - { - "epoch": 0.75, - "learning_rate": 1.2336554860716316e-05, - "loss": 2.2813, - "step": 431950 - }, - { - "epoch": 0.75, - "learning_rate": 1.233568292078949e-05, - "loss": 2.217, - "step": 431960 - }, - { - "epoch": 0.75, - "learning_rate": 1.2334810980862662e-05, - "loss": 2.3602, - "step": 431970 - }, - { - "epoch": 0.75, - "learning_rate": 1.2333939040935836e-05, - "loss": 2.3269, - "step": 431980 - }, - { - "epoch": 0.75, - "learning_rate": 1.233306710100901e-05, - "loss": 2.3882, - "step": 431990 - }, - { - "epoch": 0.75, - "learning_rate": 1.2332195161082183e-05, - "loss": 2.1942, - "step": 432000 - }, - { - "epoch": 0.75, - "learning_rate": 1.2331323221155355e-05, - "loss": 2.2282, - "step": 432010 - }, - { - "epoch": 0.75, - "learning_rate": 1.233045128122853e-05, - "loss": 2.2575, - "step": 432020 - }, - { - "epoch": 0.75, - "learning_rate": 1.2329579341301701e-05, - "loss": 2.1454, - "step": 432030 - }, - { - "epoch": 0.75, - "learning_rate": 1.2328707401374875e-05, - "loss": 2.3605, - "step": 432040 - }, - { - "epoch": 0.75, - "learning_rate": 1.2327835461448049e-05, - "loss": 2.339, - "step": 432050 - }, - { - "epoch": 0.75, - "learning_rate": 1.2326963521521223e-05, - "loss": 2.2501, - "step": 432060 - }, - { - "epoch": 0.75, - "learning_rate": 1.2326091581594396e-05, - "loss": 2.3426, - "step": 432070 - }, - { - "epoch": 0.75, - "learning_rate": 1.2325219641667568e-05, - "loss": 2.2078, - "step": 432080 - }, - { - "epoch": 0.75, - "learning_rate": 1.2324347701740742e-05, - "loss": 2.2359, - "step": 432090 - }, - { - "epoch": 0.75, - "learning_rate": 1.2323475761813914e-05, - "loss": 2.316, - "step": 432100 - }, - { - "epoch": 0.75, - "learning_rate": 1.2322603821887088e-05, - "loss": 2.3265, - "step": 432110 - }, - { - "epoch": 0.75, - "learning_rate": 1.232173188196026e-05, - "loss": 2.3798, - "step": 432120 - }, - { - "epoch": 0.75, - "learning_rate": 1.2320859942033434e-05, - "loss": 2.2483, - "step": 432130 - }, - { - "epoch": 0.75, - "learning_rate": 1.2319988002106608e-05, - "loss": 2.2666, - "step": 432140 - }, - { - "epoch": 0.75, - "learning_rate": 1.2319116062179781e-05, - "loss": 2.268, - "step": 432150 - }, - { - "epoch": 0.75, - "learning_rate": 1.2318244122252954e-05, - "loss": 2.3563, - "step": 432160 - }, - { - "epoch": 0.75, - "learning_rate": 1.2317372182326127e-05, - "loss": 2.3811, - "step": 432170 - }, - { - "epoch": 0.75, - "learning_rate": 1.2316500242399301e-05, - "loss": 2.3372, - "step": 432180 - }, - { - "epoch": 0.75, - "learning_rate": 1.2315628302472473e-05, - "loss": 2.2457, - "step": 432190 - }, - { - "epoch": 0.75, - "learning_rate": 1.2314756362545647e-05, - "loss": 2.3501, - "step": 432200 - }, - { - "epoch": 0.75, - "learning_rate": 1.2313884422618819e-05, - "loss": 2.2886, - "step": 432210 - }, - { - "epoch": 0.75, - "learning_rate": 1.2313012482691993e-05, - "loss": 2.3366, - "step": 432220 - }, - { - "epoch": 0.75, - "learning_rate": 1.2312140542765167e-05, - "loss": 2.3237, - "step": 432230 - }, - { - "epoch": 0.75, - "learning_rate": 1.231126860283834e-05, - "loss": 2.2527, - "step": 432240 - }, - { - "epoch": 0.75, - "learning_rate": 1.2310396662911512e-05, - "loss": 2.1979, - "step": 432250 - }, - { - "epoch": 0.75, - "learning_rate": 1.2309524722984686e-05, - "loss": 2.3028, - "step": 432260 - }, - { - "epoch": 0.75, - "learning_rate": 1.2308652783057858e-05, - "loss": 2.3212, - "step": 432270 - }, - { - "epoch": 0.75, - "learning_rate": 1.2307780843131032e-05, - "loss": 2.277, - "step": 432280 - }, - { - "epoch": 0.75, - "learning_rate": 1.2306908903204204e-05, - "loss": 2.2678, - "step": 432290 - }, - { - "epoch": 0.75, - "learning_rate": 1.2306036963277378e-05, - "loss": 2.172, - "step": 432300 - }, - { - "epoch": 0.75, - "learning_rate": 1.2305165023350553e-05, - "loss": 2.1756, - "step": 432310 - }, - { - "epoch": 0.75, - "learning_rate": 1.2304293083423725e-05, - "loss": 2.2474, - "step": 432320 - }, - { - "epoch": 0.75, - "learning_rate": 1.2303421143496899e-05, - "loss": 2.2323, - "step": 432330 - }, - { - "epoch": 0.75, - "learning_rate": 1.2302549203570071e-05, - "loss": 2.3816, - "step": 432340 - }, - { - "epoch": 0.75, - "learning_rate": 1.2301677263643245e-05, - "loss": 2.2799, - "step": 432350 - }, - { - "epoch": 0.75, - "learning_rate": 1.2300805323716417e-05, - "loss": 2.2751, - "step": 432360 - }, - { - "epoch": 0.75, - "learning_rate": 1.229993338378959e-05, - "loss": 2.2545, - "step": 432370 - }, - { - "epoch": 0.75, - "learning_rate": 1.2299061443862765e-05, - "loss": 2.3215, - "step": 432380 - }, - { - "epoch": 0.75, - "learning_rate": 1.2298189503935938e-05, - "loss": 2.2608, - "step": 432390 - }, - { - "epoch": 0.75, - "learning_rate": 1.229731756400911e-05, - "loss": 2.2394, - "step": 432400 - }, - { - "epoch": 0.75, - "learning_rate": 1.2296445624082284e-05, - "loss": 2.3429, - "step": 432410 - }, - { - "epoch": 0.75, - "learning_rate": 1.2295573684155456e-05, - "loss": 2.3905, - "step": 432420 - }, - { - "epoch": 0.75, - "learning_rate": 1.229470174422863e-05, - "loss": 2.309, - "step": 432430 - }, - { - "epoch": 0.75, - "learning_rate": 1.2293829804301804e-05, - "loss": 2.2944, - "step": 432440 - }, - { - "epoch": 0.75, - "learning_rate": 1.2292957864374976e-05, - "loss": 2.217, - "step": 432450 - }, - { - "epoch": 0.75, - "learning_rate": 1.229208592444815e-05, - "loss": 2.3549, - "step": 432460 - }, - { - "epoch": 0.75, - "learning_rate": 1.2291213984521323e-05, - "loss": 2.2179, - "step": 432470 - }, - { - "epoch": 0.75, - "learning_rate": 1.2290342044594497e-05, - "loss": 2.2638, - "step": 432480 - }, - { - "epoch": 0.75, - "learning_rate": 1.228947010466767e-05, - "loss": 2.2747, - "step": 432490 - }, - { - "epoch": 0.75, - "learning_rate": 1.2288598164740843e-05, - "loss": 2.2716, - "step": 432500 - }, - { - "epoch": 0.75, - "learning_rate": 1.2287726224814015e-05, - "loss": 2.2474, - "step": 432510 - }, - { - "epoch": 0.75, - "learning_rate": 1.2286854284887189e-05, - "loss": 2.2574, - "step": 432520 - }, - { - "epoch": 0.75, - "learning_rate": 1.2285982344960361e-05, - "loss": 2.2848, - "step": 432530 - }, - { - "epoch": 0.75, - "learning_rate": 1.2285110405033535e-05, - "loss": 2.3045, - "step": 432540 - }, - { - "epoch": 0.75, - "learning_rate": 1.2284238465106709e-05, - "loss": 2.2349, - "step": 432550 - }, - { - "epoch": 0.75, - "learning_rate": 1.2283366525179882e-05, - "loss": 2.2166, - "step": 432560 - }, - { - "epoch": 0.75, - "learning_rate": 1.2282494585253056e-05, - "loss": 2.3255, - "step": 432570 - }, - { - "epoch": 0.75, - "learning_rate": 1.2281622645326228e-05, - "loss": 2.2917, - "step": 432580 - }, - { - "epoch": 0.75, - "learning_rate": 1.2280750705399402e-05, - "loss": 2.1825, - "step": 432590 - }, - { - "epoch": 0.75, - "learning_rate": 1.2279878765472574e-05, - "loss": 2.4541, - "step": 432600 - }, - { - "epoch": 0.75, - "learning_rate": 1.2279006825545748e-05, - "loss": 2.4021, - "step": 432610 - }, - { - "epoch": 0.75, - "learning_rate": 1.2278134885618922e-05, - "loss": 2.2482, - "step": 432620 - }, - { - "epoch": 0.75, - "learning_rate": 1.2277262945692095e-05, - "loss": 2.3189, - "step": 432630 - }, - { - "epoch": 0.75, - "learning_rate": 1.2276391005765267e-05, - "loss": 2.2188, - "step": 432640 - }, - { - "epoch": 0.75, - "learning_rate": 1.2275519065838441e-05, - "loss": 2.382, - "step": 432650 - }, - { - "epoch": 0.75, - "learning_rate": 1.2274647125911613e-05, - "loss": 2.2912, - "step": 432660 - }, - { - "epoch": 0.75, - "learning_rate": 1.2273775185984787e-05, - "loss": 2.1922, - "step": 432670 - }, - { - "epoch": 0.75, - "learning_rate": 1.2272903246057959e-05, - "loss": 2.3746, - "step": 432680 - }, - { - "epoch": 0.75, - "learning_rate": 1.2272031306131133e-05, - "loss": 2.2201, - "step": 432690 - }, - { - "epoch": 0.75, - "learning_rate": 1.2271159366204307e-05, - "loss": 2.2845, - "step": 432700 - }, - { - "epoch": 0.75, - "learning_rate": 1.227028742627748e-05, - "loss": 2.3539, - "step": 432710 - }, - { - "epoch": 0.75, - "learning_rate": 1.2269415486350654e-05, - "loss": 2.3064, - "step": 432720 - }, - { - "epoch": 0.75, - "learning_rate": 1.2268543546423826e-05, - "loss": 2.29, - "step": 432730 - }, - { - "epoch": 0.75, - "learning_rate": 1.2267671606497e-05, - "loss": 2.2329, - "step": 432740 - }, - { - "epoch": 0.75, - "learning_rate": 1.2266799666570172e-05, - "loss": 2.3186, - "step": 432750 - }, - { - "epoch": 0.75, - "learning_rate": 1.2265927726643346e-05, - "loss": 2.3822, - "step": 432760 - }, - { - "epoch": 0.75, - "learning_rate": 1.2265055786716518e-05, - "loss": 2.2437, - "step": 432770 - }, - { - "epoch": 0.75, - "learning_rate": 1.2264183846789692e-05, - "loss": 2.1741, - "step": 432780 - }, - { - "epoch": 0.75, - "learning_rate": 1.2263311906862865e-05, - "loss": 2.3217, - "step": 432790 - }, - { - "epoch": 0.75, - "learning_rate": 1.226243996693604e-05, - "loss": 2.3937, - "step": 432800 - }, - { - "epoch": 0.75, - "learning_rate": 1.2261568027009211e-05, - "loss": 2.2544, - "step": 432810 - }, - { - "epoch": 0.75, - "learning_rate": 1.2260696087082385e-05, - "loss": 2.1612, - "step": 432820 - }, - { - "epoch": 0.75, - "learning_rate": 1.2259824147155557e-05, - "loss": 2.2168, - "step": 432830 - }, - { - "epoch": 0.75, - "learning_rate": 1.2258952207228731e-05, - "loss": 2.3348, - "step": 432840 - }, - { - "epoch": 0.75, - "learning_rate": 1.2258080267301905e-05, - "loss": 2.3217, - "step": 432850 - }, - { - "epoch": 0.75, - "learning_rate": 1.2257208327375078e-05, - "loss": 2.2607, - "step": 432860 - }, - { - "epoch": 0.75, - "learning_rate": 1.2256336387448252e-05, - "loss": 2.2428, - "step": 432870 - }, - { - "epoch": 0.75, - "learning_rate": 1.2255464447521424e-05, - "loss": 2.2038, - "step": 432880 - }, - { - "epoch": 0.75, - "learning_rate": 1.2254592507594598e-05, - "loss": 2.276, - "step": 432890 - }, - { - "epoch": 0.75, - "learning_rate": 1.225372056766777e-05, - "loss": 2.3743, - "step": 432900 - }, - { - "epoch": 0.75, - "learning_rate": 1.2252848627740944e-05, - "loss": 2.3315, - "step": 432910 - }, - { - "epoch": 0.75, - "learning_rate": 1.2251976687814116e-05, - "loss": 2.2787, - "step": 432920 - }, - { - "epoch": 0.75, - "learning_rate": 1.225110474788729e-05, - "loss": 2.2751, - "step": 432930 - }, - { - "epoch": 0.75, - "learning_rate": 1.2250232807960464e-05, - "loss": 2.3161, - "step": 432940 - }, - { - "epoch": 0.76, - "learning_rate": 1.2249360868033637e-05, - "loss": 2.2476, - "step": 432950 - }, - { - "epoch": 0.76, - "learning_rate": 1.224848892810681e-05, - "loss": 2.3039, - "step": 432960 - }, - { - "epoch": 0.76, - "learning_rate": 1.2247616988179983e-05, - "loss": 2.2871, - "step": 432970 - }, - { - "epoch": 0.76, - "learning_rate": 1.2246745048253157e-05, - "loss": 2.3461, - "step": 432980 - }, - { - "epoch": 0.76, - "learning_rate": 1.2245873108326329e-05, - "loss": 2.1529, - "step": 432990 - }, - { - "epoch": 0.76, - "learning_rate": 1.2245001168399503e-05, - "loss": 2.3567, - "step": 433000 - }, - { - "epoch": 0.76, - "learning_rate": 1.2244129228472675e-05, - "loss": 2.3715, - "step": 433010 - }, - { - "epoch": 0.76, - "learning_rate": 1.2243257288545849e-05, - "loss": 2.2445, - "step": 433020 - }, - { - "epoch": 0.76, - "learning_rate": 1.2242385348619022e-05, - "loss": 2.301, - "step": 433030 - }, - { - "epoch": 0.76, - "learning_rate": 1.2241513408692196e-05, - "loss": 2.2616, - "step": 433040 - }, - { - "epoch": 0.76, - "learning_rate": 1.2240641468765368e-05, - "loss": 2.2741, - "step": 433050 - }, - { - "epoch": 0.76, - "learning_rate": 1.2239769528838542e-05, - "loss": 2.3001, - "step": 433060 - }, - { - "epoch": 0.76, - "learning_rate": 1.2238897588911714e-05, - "loss": 2.288, - "step": 433070 - }, - { - "epoch": 0.76, - "learning_rate": 1.2238025648984888e-05, - "loss": 2.1951, - "step": 433080 - }, - { - "epoch": 0.76, - "learning_rate": 1.223715370905806e-05, - "loss": 2.3228, - "step": 433090 - }, - { - "epoch": 0.76, - "learning_rate": 1.2236281769131235e-05, - "loss": 2.3128, - "step": 433100 - }, - { - "epoch": 0.76, - "learning_rate": 1.2235409829204409e-05, - "loss": 2.2805, - "step": 433110 - }, - { - "epoch": 0.76, - "learning_rate": 1.2234537889277581e-05, - "loss": 2.2675, - "step": 433120 - }, - { - "epoch": 0.76, - "learning_rate": 1.2233665949350755e-05, - "loss": 2.3546, - "step": 433130 - }, - { - "epoch": 0.76, - "learning_rate": 1.2232794009423927e-05, - "loss": 2.2527, - "step": 433140 - }, - { - "epoch": 0.76, - "learning_rate": 1.22319220694971e-05, - "loss": 2.3533, - "step": 433150 - }, - { - "epoch": 0.76, - "learning_rate": 1.2231050129570273e-05, - "loss": 2.2791, - "step": 433160 - }, - { - "epoch": 0.76, - "learning_rate": 1.2230178189643447e-05, - "loss": 2.3351, - "step": 433170 - }, - { - "epoch": 0.76, - "learning_rate": 1.222930624971662e-05, - "loss": 2.323, - "step": 433180 - }, - { - "epoch": 0.76, - "learning_rate": 1.2228434309789794e-05, - "loss": 2.3258, - "step": 433190 - }, - { - "epoch": 0.76, - "learning_rate": 1.2227562369862966e-05, - "loss": 2.3105, - "step": 433200 - }, - { - "epoch": 0.76, - "learning_rate": 1.222669042993614e-05, - "loss": 2.2381, - "step": 433210 - }, - { - "epoch": 0.76, - "learning_rate": 1.2225818490009312e-05, - "loss": 2.2836, - "step": 433220 - }, - { - "epoch": 0.76, - "learning_rate": 1.2224946550082486e-05, - "loss": 2.2295, - "step": 433230 - }, - { - "epoch": 0.76, - "learning_rate": 1.222407461015566e-05, - "loss": 2.394, - "step": 433240 - }, - { - "epoch": 0.76, - "learning_rate": 1.2223202670228832e-05, - "loss": 2.3541, - "step": 433250 - }, - { - "epoch": 0.76, - "learning_rate": 1.2222330730302006e-05, - "loss": 2.3361, - "step": 433260 - }, - { - "epoch": 0.76, - "learning_rate": 1.222145879037518e-05, - "loss": 2.3056, - "step": 433270 - }, - { - "epoch": 0.76, - "learning_rate": 1.2220586850448353e-05, - "loss": 2.3278, - "step": 433280 - }, - { - "epoch": 0.76, - "learning_rate": 1.2219714910521525e-05, - "loss": 2.3015, - "step": 433290 - }, - { - "epoch": 0.76, - "learning_rate": 1.2218842970594699e-05, - "loss": 2.3064, - "step": 433300 - }, - { - "epoch": 0.76, - "learning_rate": 1.2217971030667871e-05, - "loss": 2.337, - "step": 433310 - }, - { - "epoch": 0.76, - "learning_rate": 1.2217099090741045e-05, - "loss": 2.2979, - "step": 433320 - }, - { - "epoch": 0.76, - "learning_rate": 1.2216227150814217e-05, - "loss": 2.3166, - "step": 433330 - }, - { - "epoch": 0.76, - "learning_rate": 1.221535521088739e-05, - "loss": 2.2371, - "step": 433340 - }, - { - "epoch": 0.76, - "learning_rate": 1.2214483270960564e-05, - "loss": 2.2954, - "step": 433350 - }, - { - "epoch": 0.76, - "learning_rate": 1.2213611331033738e-05, - "loss": 2.2702, - "step": 433360 - }, - { - "epoch": 0.76, - "learning_rate": 1.2212739391106912e-05, - "loss": 2.3288, - "step": 433370 - }, - { - "epoch": 0.76, - "learning_rate": 1.2211867451180084e-05, - "loss": 2.1678, - "step": 433380 - }, - { - "epoch": 0.76, - "learning_rate": 1.2210995511253258e-05, - "loss": 2.4486, - "step": 433390 - }, - { - "epoch": 0.76, - "learning_rate": 1.221012357132643e-05, - "loss": 2.391, - "step": 433400 - }, - { - "epoch": 0.76, - "learning_rate": 1.2209251631399604e-05, - "loss": 2.2991, - "step": 433410 - }, - { - "epoch": 0.76, - "learning_rate": 1.2208379691472777e-05, - "loss": 2.3054, - "step": 433420 - }, - { - "epoch": 0.76, - "learning_rate": 1.2207507751545951e-05, - "loss": 2.2189, - "step": 433430 - }, - { - "epoch": 0.76, - "learning_rate": 1.2206635811619123e-05, - "loss": 2.1663, - "step": 433440 - }, - { - "epoch": 0.76, - "learning_rate": 1.2205763871692297e-05, - "loss": 2.3414, - "step": 433450 - }, - { - "epoch": 0.76, - "learning_rate": 1.2204891931765469e-05, - "loss": 2.1358, - "step": 433460 - }, - { - "epoch": 0.76, - "learning_rate": 1.2204019991838643e-05, - "loss": 2.3007, - "step": 433470 - }, - { - "epoch": 0.76, - "learning_rate": 1.2203148051911815e-05, - "loss": 2.3154, - "step": 433480 - }, - { - "epoch": 0.76, - "learning_rate": 1.2202276111984989e-05, - "loss": 2.2839, - "step": 433490 - }, - { - "epoch": 0.76, - "learning_rate": 1.2201404172058162e-05, - "loss": 2.3322, - "step": 433500 - }, - { - "epoch": 0.76, - "learning_rate": 1.2200532232131336e-05, - "loss": 2.4088, - "step": 433510 - }, - { - "epoch": 0.76, - "learning_rate": 1.219966029220451e-05, - "loss": 2.1762, - "step": 433520 - }, - { - "epoch": 0.76, - "learning_rate": 1.2198788352277682e-05, - "loss": 2.2413, - "step": 433530 - }, - { - "epoch": 0.76, - "learning_rate": 1.2197916412350856e-05, - "loss": 2.3604, - "step": 433540 - }, - { - "epoch": 0.76, - "learning_rate": 1.2197044472424028e-05, - "loss": 2.2466, - "step": 433550 - }, - { - "epoch": 0.76, - "learning_rate": 1.2196172532497202e-05, - "loss": 2.3996, - "step": 433560 - }, - { - "epoch": 0.76, - "learning_rate": 1.2195300592570374e-05, - "loss": 2.2444, - "step": 433570 - }, - { - "epoch": 0.76, - "learning_rate": 1.2194428652643548e-05, - "loss": 2.303, - "step": 433580 - }, - { - "epoch": 0.76, - "learning_rate": 1.2193556712716721e-05, - "loss": 2.2899, - "step": 433590 - }, - { - "epoch": 0.76, - "learning_rate": 1.2192684772789895e-05, - "loss": 2.2272, - "step": 433600 - }, - { - "epoch": 0.76, - "learning_rate": 1.2191812832863067e-05, - "loss": 2.1924, - "step": 433610 - }, - { - "epoch": 0.76, - "learning_rate": 1.2190940892936241e-05, - "loss": 2.3394, - "step": 433620 - }, - { - "epoch": 0.76, - "learning_rate": 1.2190068953009413e-05, - "loss": 2.2221, - "step": 433630 - }, - { - "epoch": 0.76, - "learning_rate": 1.2189197013082587e-05, - "loss": 2.2687, - "step": 433640 - }, - { - "epoch": 0.76, - "learning_rate": 1.218832507315576e-05, - "loss": 2.3711, - "step": 433650 - }, - { - "epoch": 0.76, - "learning_rate": 1.2187453133228934e-05, - "loss": 2.3461, - "step": 433660 - }, - { - "epoch": 0.76, - "learning_rate": 1.2186581193302108e-05, - "loss": 2.2049, - "step": 433670 - }, - { - "epoch": 0.76, - "learning_rate": 1.218570925337528e-05, - "loss": 2.2887, - "step": 433680 - }, - { - "epoch": 0.76, - "learning_rate": 1.2184837313448454e-05, - "loss": 2.29, - "step": 433690 - }, - { - "epoch": 0.76, - "learning_rate": 1.2183965373521626e-05, - "loss": 2.3307, - "step": 433700 - }, - { - "epoch": 0.76, - "learning_rate": 1.21830934335948e-05, - "loss": 2.2696, - "step": 433710 - }, - { - "epoch": 0.76, - "learning_rate": 1.2182221493667972e-05, - "loss": 2.223, - "step": 433720 - }, - { - "epoch": 0.76, - "learning_rate": 1.2181349553741146e-05, - "loss": 2.2038, - "step": 433730 - }, - { - "epoch": 0.76, - "learning_rate": 1.218047761381432e-05, - "loss": 2.3218, - "step": 433740 - }, - { - "epoch": 0.76, - "learning_rate": 1.2179605673887493e-05, - "loss": 2.2946, - "step": 433750 - }, - { - "epoch": 0.76, - "learning_rate": 1.2178733733960665e-05, - "loss": 2.3072, - "step": 433760 - }, - { - "epoch": 0.76, - "learning_rate": 1.2177861794033839e-05, - "loss": 2.2707, - "step": 433770 - }, - { - "epoch": 0.76, - "learning_rate": 1.2176989854107013e-05, - "loss": 2.2303, - "step": 433780 - }, - { - "epoch": 0.76, - "learning_rate": 1.2176117914180185e-05, - "loss": 2.3097, - "step": 433790 - }, - { - "epoch": 0.76, - "learning_rate": 1.2175245974253359e-05, - "loss": 2.1335, - "step": 433800 - }, - { - "epoch": 0.76, - "learning_rate": 1.217437403432653e-05, - "loss": 2.2695, - "step": 433810 - }, - { - "epoch": 0.76, - "learning_rate": 1.2173502094399704e-05, - "loss": 2.3014, - "step": 433820 - }, - { - "epoch": 0.76, - "learning_rate": 1.2172630154472878e-05, - "loss": 2.2408, - "step": 433830 - }, - { - "epoch": 0.76, - "learning_rate": 1.2171758214546052e-05, - "loss": 2.2663, - "step": 433840 - }, - { - "epoch": 0.76, - "learning_rate": 1.2170886274619224e-05, - "loss": 2.2492, - "step": 433850 - }, - { - "epoch": 0.76, - "learning_rate": 1.2170014334692398e-05, - "loss": 2.3336, - "step": 433860 - }, - { - "epoch": 0.76, - "learning_rate": 1.216914239476557e-05, - "loss": 2.3229, - "step": 433870 - }, - { - "epoch": 0.76, - "learning_rate": 1.2168270454838744e-05, - "loss": 2.3273, - "step": 433880 - }, - { - "epoch": 0.76, - "learning_rate": 1.2167398514911916e-05, - "loss": 2.3287, - "step": 433890 - }, - { - "epoch": 0.76, - "learning_rate": 1.2166526574985091e-05, - "loss": 2.1744, - "step": 433900 - }, - { - "epoch": 0.76, - "learning_rate": 1.2165654635058265e-05, - "loss": 2.2443, - "step": 433910 - }, - { - "epoch": 0.76, - "learning_rate": 1.2164782695131437e-05, - "loss": 2.3509, - "step": 433920 - }, - { - "epoch": 0.76, - "learning_rate": 1.216391075520461e-05, - "loss": 2.1948, - "step": 433930 - }, - { - "epoch": 0.76, - "learning_rate": 1.2163038815277783e-05, - "loss": 2.2224, - "step": 433940 - }, - { - "epoch": 0.76, - "learning_rate": 1.2162166875350957e-05, - "loss": 2.2941, - "step": 433950 - }, - { - "epoch": 0.76, - "learning_rate": 1.2161294935424129e-05, - "loss": 2.3805, - "step": 433960 - }, - { - "epoch": 0.76, - "learning_rate": 1.2160422995497303e-05, - "loss": 2.3235, - "step": 433970 - }, - { - "epoch": 0.76, - "learning_rate": 1.2159551055570476e-05, - "loss": 2.3223, - "step": 433980 - }, - { - "epoch": 0.76, - "learning_rate": 1.215867911564365e-05, - "loss": 2.2689, - "step": 433990 - }, - { - "epoch": 0.76, - "learning_rate": 1.2157807175716822e-05, - "loss": 2.2087, - "step": 434000 - }, - { - "epoch": 0.76, - "learning_rate": 1.2156935235789996e-05, - "loss": 2.3336, - "step": 434010 - }, - { - "epoch": 0.76, - "learning_rate": 1.2156063295863168e-05, - "loss": 2.3619, - "step": 434020 - }, - { - "epoch": 0.76, - "learning_rate": 1.2155191355936342e-05, - "loss": 2.2452, - "step": 434030 - }, - { - "epoch": 0.76, - "learning_rate": 1.2154319416009516e-05, - "loss": 2.3374, - "step": 434040 - }, - { - "epoch": 0.76, - "learning_rate": 1.2153447476082688e-05, - "loss": 2.2307, - "step": 434050 - }, - { - "epoch": 0.76, - "learning_rate": 1.2152575536155861e-05, - "loss": 2.258, - "step": 434060 - }, - { - "epoch": 0.76, - "learning_rate": 1.2151703596229035e-05, - "loss": 2.2428, - "step": 434070 - }, - { - "epoch": 0.76, - "learning_rate": 1.2150831656302209e-05, - "loss": 2.2406, - "step": 434080 - }, - { - "epoch": 0.76, - "learning_rate": 1.2149959716375381e-05, - "loss": 2.1973, - "step": 434090 - }, - { - "epoch": 0.76, - "learning_rate": 1.2149087776448555e-05, - "loss": 2.2102, - "step": 434100 - }, - { - "epoch": 0.76, - "learning_rate": 1.2148215836521727e-05, - "loss": 2.2985, - "step": 434110 - }, - { - "epoch": 0.76, - "learning_rate": 1.21473438965949e-05, - "loss": 2.2877, - "step": 434120 - }, - { - "epoch": 0.76, - "learning_rate": 1.2146471956668073e-05, - "loss": 2.3153, - "step": 434130 - }, - { - "epoch": 0.76, - "learning_rate": 1.2145600016741248e-05, - "loss": 2.3168, - "step": 434140 - }, - { - "epoch": 0.76, - "learning_rate": 1.214472807681442e-05, - "loss": 2.3024, - "step": 434150 - }, - { - "epoch": 0.76, - "learning_rate": 1.2143856136887594e-05, - "loss": 2.3861, - "step": 434160 - }, - { - "epoch": 0.76, - "learning_rate": 1.2142984196960768e-05, - "loss": 2.2474, - "step": 434170 - }, - { - "epoch": 0.76, - "learning_rate": 1.214211225703394e-05, - "loss": 2.3182, - "step": 434180 - }, - { - "epoch": 0.76, - "learning_rate": 1.2141240317107114e-05, - "loss": 2.2311, - "step": 434190 - }, - { - "epoch": 0.76, - "learning_rate": 1.2140368377180286e-05, - "loss": 2.1735, - "step": 434200 - }, - { - "epoch": 0.76, - "learning_rate": 1.213949643725346e-05, - "loss": 2.3278, - "step": 434210 - }, - { - "epoch": 0.76, - "learning_rate": 1.2138624497326633e-05, - "loss": 2.2257, - "step": 434220 - }, - { - "epoch": 0.76, - "learning_rate": 1.2137752557399807e-05, - "loss": 2.2758, - "step": 434230 - }, - { - "epoch": 0.76, - "learning_rate": 1.2136880617472979e-05, - "loss": 2.2629, - "step": 434240 - }, - { - "epoch": 0.76, - "learning_rate": 1.2136008677546153e-05, - "loss": 2.3442, - "step": 434250 - }, - { - "epoch": 0.76, - "learning_rate": 1.2135136737619325e-05, - "loss": 2.3744, - "step": 434260 - }, - { - "epoch": 0.76, - "learning_rate": 1.2134264797692499e-05, - "loss": 2.2936, - "step": 434270 - }, - { - "epoch": 0.76, - "learning_rate": 1.213339285776567e-05, - "loss": 2.2281, - "step": 434280 - }, - { - "epoch": 0.76, - "learning_rate": 1.2132520917838845e-05, - "loss": 2.3654, - "step": 434290 - }, - { - "epoch": 0.76, - "learning_rate": 1.2131648977912018e-05, - "loss": 2.2773, - "step": 434300 - }, - { - "epoch": 0.76, - "learning_rate": 1.2130777037985192e-05, - "loss": 2.3002, - "step": 434310 - }, - { - "epoch": 0.76, - "learning_rate": 1.2129905098058366e-05, - "loss": 2.1493, - "step": 434320 - }, - { - "epoch": 0.76, - "learning_rate": 1.2129033158131538e-05, - "loss": 2.2955, - "step": 434330 - }, - { - "epoch": 0.76, - "learning_rate": 1.2128161218204712e-05, - "loss": 2.3985, - "step": 434340 - }, - { - "epoch": 0.76, - "learning_rate": 1.2127289278277884e-05, - "loss": 2.2304, - "step": 434350 - }, - { - "epoch": 0.76, - "learning_rate": 1.2126417338351058e-05, - "loss": 2.3558, - "step": 434360 - }, - { - "epoch": 0.76, - "learning_rate": 1.212554539842423e-05, - "loss": 2.2084, - "step": 434370 - }, - { - "epoch": 0.76, - "learning_rate": 1.2124673458497403e-05, - "loss": 2.4218, - "step": 434380 - }, - { - "epoch": 0.76, - "learning_rate": 1.2123801518570577e-05, - "loss": 2.2544, - "step": 434390 - }, - { - "epoch": 0.76, - "learning_rate": 1.2122929578643751e-05, - "loss": 2.3, - "step": 434400 - }, - { - "epoch": 0.76, - "learning_rate": 1.2122057638716923e-05, - "loss": 2.2691, - "step": 434410 - }, - { - "epoch": 0.76, - "learning_rate": 1.2121185698790097e-05, - "loss": 2.2578, - "step": 434420 - }, - { - "epoch": 0.76, - "learning_rate": 1.2120313758863269e-05, - "loss": 2.3645, - "step": 434430 - }, - { - "epoch": 0.76, - "learning_rate": 1.2119441818936443e-05, - "loss": 2.2347, - "step": 434440 - }, - { - "epoch": 0.76, - "learning_rate": 1.2118569879009616e-05, - "loss": 2.27, - "step": 434450 - }, - { - "epoch": 0.76, - "learning_rate": 1.211769793908279e-05, - "loss": 2.2927, - "step": 434460 - }, - { - "epoch": 0.76, - "learning_rate": 1.2116825999155964e-05, - "loss": 2.2392, - "step": 434470 - }, - { - "epoch": 0.76, - "learning_rate": 1.2115954059229136e-05, - "loss": 2.2985, - "step": 434480 - }, - { - "epoch": 0.76, - "learning_rate": 1.211508211930231e-05, - "loss": 2.3113, - "step": 434490 - }, - { - "epoch": 0.76, - "learning_rate": 1.2114210179375482e-05, - "loss": 2.4351, - "step": 434500 - }, - { - "epoch": 0.76, - "learning_rate": 1.2113338239448656e-05, - "loss": 2.2837, - "step": 434510 - }, - { - "epoch": 0.76, - "learning_rate": 1.2112466299521828e-05, - "loss": 2.3278, - "step": 434520 - }, - { - "epoch": 0.76, - "learning_rate": 1.2111594359595001e-05, - "loss": 2.3032, - "step": 434530 - }, - { - "epoch": 0.76, - "learning_rate": 1.2110722419668175e-05, - "loss": 2.3435, - "step": 434540 - }, - { - "epoch": 0.76, - "learning_rate": 1.2109850479741349e-05, - "loss": 2.4171, - "step": 434550 - }, - { - "epoch": 0.76, - "learning_rate": 1.2108978539814521e-05, - "loss": 2.1678, - "step": 434560 - }, - { - "epoch": 0.76, - "learning_rate": 1.2108106599887695e-05, - "loss": 2.2568, - "step": 434570 - }, - { - "epoch": 0.76, - "learning_rate": 1.2107234659960869e-05, - "loss": 2.3171, - "step": 434580 - }, - { - "epoch": 0.76, - "learning_rate": 1.210636272003404e-05, - "loss": 2.3063, - "step": 434590 - }, - { - "epoch": 0.76, - "learning_rate": 1.2105490780107214e-05, - "loss": 2.2913, - "step": 434600 - }, - { - "epoch": 0.76, - "learning_rate": 1.2104618840180387e-05, - "loss": 2.2838, - "step": 434610 - }, - { - "epoch": 0.76, - "learning_rate": 1.210374690025356e-05, - "loss": 2.2443, - "step": 434620 - }, - { - "epoch": 0.76, - "learning_rate": 1.2102874960326734e-05, - "loss": 2.314, - "step": 434630 - }, - { - "epoch": 0.76, - "learning_rate": 1.2102003020399908e-05, - "loss": 2.292, - "step": 434640 - }, - { - "epoch": 0.76, - "learning_rate": 1.210113108047308e-05, - "loss": 2.2669, - "step": 434650 - }, - { - "epoch": 0.76, - "learning_rate": 1.2100259140546254e-05, - "loss": 2.2929, - "step": 434660 - }, - { - "epoch": 0.76, - "learning_rate": 1.2099387200619426e-05, - "loss": 2.1524, - "step": 434670 - }, - { - "epoch": 0.76, - "learning_rate": 1.20985152606926e-05, - "loss": 2.2483, - "step": 434680 - }, - { - "epoch": 0.76, - "learning_rate": 1.2097643320765772e-05, - "loss": 2.349, - "step": 434690 - }, - { - "epoch": 0.76, - "learning_rate": 1.2096771380838947e-05, - "loss": 2.3567, - "step": 434700 - }, - { - "epoch": 0.76, - "learning_rate": 1.209589944091212e-05, - "loss": 2.1778, - "step": 434710 - }, - { - "epoch": 0.76, - "learning_rate": 1.2095027500985293e-05, - "loss": 2.3361, - "step": 434720 - }, - { - "epoch": 0.76, - "learning_rate": 1.2094155561058467e-05, - "loss": 2.2951, - "step": 434730 - }, - { - "epoch": 0.76, - "learning_rate": 1.2093283621131639e-05, - "loss": 2.3174, - "step": 434740 - }, - { - "epoch": 0.76, - "learning_rate": 1.2092411681204813e-05, - "loss": 2.2889, - "step": 434750 - }, - { - "epoch": 0.76, - "learning_rate": 1.2091539741277985e-05, - "loss": 2.4059, - "step": 434760 - }, - { - "epoch": 0.76, - "learning_rate": 1.2090667801351158e-05, - "loss": 2.2874, - "step": 434770 - }, - { - "epoch": 0.76, - "learning_rate": 1.2089795861424332e-05, - "loss": 2.2742, - "step": 434780 - }, - { - "epoch": 0.76, - "learning_rate": 1.2088923921497506e-05, - "loss": 2.2326, - "step": 434790 - }, - { - "epoch": 0.76, - "learning_rate": 1.2088051981570678e-05, - "loss": 2.2288, - "step": 434800 - }, - { - "epoch": 0.76, - "learning_rate": 1.2087180041643852e-05, - "loss": 2.2833, - "step": 434810 - }, - { - "epoch": 0.76, - "learning_rate": 1.2086308101717024e-05, - "loss": 2.3285, - "step": 434820 - }, - { - "epoch": 0.76, - "learning_rate": 1.2085436161790198e-05, - "loss": 2.2895, - "step": 434830 - }, - { - "epoch": 0.76, - "learning_rate": 1.2084564221863371e-05, - "loss": 2.273, - "step": 434840 - }, - { - "epoch": 0.76, - "learning_rate": 1.2083692281936543e-05, - "loss": 2.2998, - "step": 434850 - }, - { - "epoch": 0.76, - "learning_rate": 1.2082820342009717e-05, - "loss": 2.3696, - "step": 434860 - }, - { - "epoch": 0.76, - "learning_rate": 1.2081948402082891e-05, - "loss": 2.2377, - "step": 434870 - }, - { - "epoch": 0.76, - "learning_rate": 1.2081076462156065e-05, - "loss": 2.2346, - "step": 434880 - }, - { - "epoch": 0.76, - "learning_rate": 1.2080204522229237e-05, - "loss": 2.2638, - "step": 434890 - }, - { - "epoch": 0.76, - "learning_rate": 1.207933258230241e-05, - "loss": 2.2955, - "step": 434900 - }, - { - "epoch": 0.76, - "learning_rate": 1.2078460642375583e-05, - "loss": 2.3776, - "step": 434910 - }, - { - "epoch": 0.76, - "learning_rate": 1.2077588702448756e-05, - "loss": 2.3274, - "step": 434920 - }, - { - "epoch": 0.76, - "learning_rate": 1.2076716762521929e-05, - "loss": 2.2582, - "step": 434930 - }, - { - "epoch": 0.76, - "learning_rate": 1.2075844822595104e-05, - "loss": 2.3308, - "step": 434940 - }, - { - "epoch": 0.76, - "learning_rate": 1.2074972882668276e-05, - "loss": 2.3247, - "step": 434950 - }, - { - "epoch": 0.76, - "learning_rate": 1.207410094274145e-05, - "loss": 2.2948, - "step": 434960 - }, - { - "epoch": 0.76, - "learning_rate": 1.2073229002814624e-05, - "loss": 2.3518, - "step": 434970 - }, - { - "epoch": 0.76, - "learning_rate": 1.2072357062887796e-05, - "loss": 2.3521, - "step": 434980 - }, - { - "epoch": 0.76, - "learning_rate": 1.207148512296097e-05, - "loss": 2.2491, - "step": 434990 - }, - { - "epoch": 0.76, - "learning_rate": 1.2070613183034142e-05, - "loss": 2.143, - "step": 435000 - }, - { - "epoch": 0.76, - "learning_rate": 1.2069741243107315e-05, - "loss": 2.3631, - "step": 435010 - }, - { - "epoch": 0.76, - "learning_rate": 1.2068869303180489e-05, - "loss": 2.2669, - "step": 435020 - }, - { - "epoch": 0.76, - "learning_rate": 1.2067997363253663e-05, - "loss": 2.3158, - "step": 435030 - }, - { - "epoch": 0.76, - "learning_rate": 1.2067125423326835e-05, - "loss": 2.2045, - "step": 435040 - }, - { - "epoch": 0.76, - "learning_rate": 1.2066253483400009e-05, - "loss": 2.1861, - "step": 435050 - }, - { - "epoch": 0.76, - "learning_rate": 1.206538154347318e-05, - "loss": 2.3619, - "step": 435060 - }, - { - "epoch": 0.76, - "learning_rate": 1.2064509603546355e-05, - "loss": 2.3582, - "step": 435070 - }, - { - "epoch": 0.76, - "learning_rate": 1.2063637663619527e-05, - "loss": 2.2134, - "step": 435080 - }, - { - "epoch": 0.76, - "learning_rate": 1.20627657236927e-05, - "loss": 2.2489, - "step": 435090 - }, - { - "epoch": 0.76, - "learning_rate": 1.2061893783765874e-05, - "loss": 2.2232, - "step": 435100 - }, - { - "epoch": 0.76, - "learning_rate": 1.2061021843839048e-05, - "loss": 2.3629, - "step": 435110 - }, - { - "epoch": 0.76, - "learning_rate": 1.2060149903912222e-05, - "loss": 2.2823, - "step": 435120 - }, - { - "epoch": 0.76, - "learning_rate": 1.2059277963985394e-05, - "loss": 2.1805, - "step": 435130 - }, - { - "epoch": 0.76, - "learning_rate": 1.2058406024058568e-05, - "loss": 2.1763, - "step": 435140 - }, - { - "epoch": 0.76, - "learning_rate": 1.205753408413174e-05, - "loss": 2.2928, - "step": 435150 - }, - { - "epoch": 0.76, - "learning_rate": 1.2056662144204913e-05, - "loss": 2.206, - "step": 435160 - }, - { - "epoch": 0.76, - "learning_rate": 1.2055790204278085e-05, - "loss": 2.2718, - "step": 435170 - }, - { - "epoch": 0.76, - "learning_rate": 1.2054918264351261e-05, - "loss": 2.3268, - "step": 435180 - }, - { - "epoch": 0.76, - "learning_rate": 1.2054046324424433e-05, - "loss": 2.3362, - "step": 435190 - }, - { - "epoch": 0.76, - "learning_rate": 1.2053174384497607e-05, - "loss": 2.1401, - "step": 435200 - }, - { - "epoch": 0.76, - "learning_rate": 1.2052302444570779e-05, - "loss": 2.3287, - "step": 435210 - }, - { - "epoch": 0.76, - "learning_rate": 1.2051430504643953e-05, - "loss": 2.2279, - "step": 435220 - }, - { - "epoch": 0.76, - "learning_rate": 1.2050558564717126e-05, - "loss": 2.2728, - "step": 435230 - }, - { - "epoch": 0.76, - "learning_rate": 1.2049686624790298e-05, - "loss": 2.327, - "step": 435240 - }, - { - "epoch": 0.76, - "learning_rate": 1.2048814684863472e-05, - "loss": 2.2526, - "step": 435250 - }, - { - "epoch": 0.76, - "learning_rate": 1.2047942744936646e-05, - "loss": 2.2893, - "step": 435260 - }, - { - "epoch": 0.76, - "learning_rate": 1.204707080500982e-05, - "loss": 2.2525, - "step": 435270 - }, - { - "epoch": 0.76, - "learning_rate": 1.2046198865082992e-05, - "loss": 2.2365, - "step": 435280 - }, - { - "epoch": 0.76, - "learning_rate": 1.2045326925156166e-05, - "loss": 2.3474, - "step": 435290 - }, - { - "epoch": 0.76, - "learning_rate": 1.2044454985229338e-05, - "loss": 2.3316, - "step": 435300 - }, - { - "epoch": 0.76, - "learning_rate": 1.2043583045302511e-05, - "loss": 2.3184, - "step": 435310 - }, - { - "epoch": 0.76, - "learning_rate": 1.2042711105375684e-05, - "loss": 2.3553, - "step": 435320 - }, - { - "epoch": 0.76, - "learning_rate": 1.2041839165448857e-05, - "loss": 2.2137, - "step": 435330 - }, - { - "epoch": 0.76, - "learning_rate": 1.2040967225522031e-05, - "loss": 2.2568, - "step": 435340 - }, - { - "epoch": 0.76, - "learning_rate": 1.2040095285595205e-05, - "loss": 2.4449, - "step": 435350 - }, - { - "epoch": 0.76, - "learning_rate": 1.2039223345668377e-05, - "loss": 2.1973, - "step": 435360 - }, - { - "epoch": 0.76, - "learning_rate": 1.203835140574155e-05, - "loss": 2.2499, - "step": 435370 - }, - { - "epoch": 0.76, - "learning_rate": 1.2037479465814724e-05, - "loss": 2.1725, - "step": 435380 - }, - { - "epoch": 0.76, - "learning_rate": 1.2036607525887897e-05, - "loss": 2.3479, - "step": 435390 - }, - { - "epoch": 0.76, - "learning_rate": 1.203573558596107e-05, - "loss": 2.2611, - "step": 435400 - }, - { - "epoch": 0.76, - "learning_rate": 1.2034863646034242e-05, - "loss": 2.3087, - "step": 435410 - }, - { - "epoch": 0.76, - "learning_rate": 1.2033991706107418e-05, - "loss": 2.2493, - "step": 435420 - }, - { - "epoch": 0.76, - "learning_rate": 1.203311976618059e-05, - "loss": 2.2386, - "step": 435430 - }, - { - "epoch": 0.76, - "learning_rate": 1.2032247826253764e-05, - "loss": 2.3229, - "step": 435440 - }, - { - "epoch": 0.76, - "learning_rate": 1.2031375886326936e-05, - "loss": 2.2988, - "step": 435450 - }, - { - "epoch": 0.76, - "learning_rate": 1.203050394640011e-05, - "loss": 2.3215, - "step": 435460 - }, - { - "epoch": 0.76, - "learning_rate": 1.2029632006473282e-05, - "loss": 2.3625, - "step": 435470 - }, - { - "epoch": 0.76, - "learning_rate": 1.2028760066546455e-05, - "loss": 2.2332, - "step": 435480 - }, - { - "epoch": 0.76, - "learning_rate": 1.2027888126619629e-05, - "loss": 2.2513, - "step": 435490 - }, - { - "epoch": 0.76, - "learning_rate": 1.2027016186692803e-05, - "loss": 2.2617, - "step": 435500 - }, - { - "epoch": 0.76, - "learning_rate": 1.2026144246765977e-05, - "loss": 2.3146, - "step": 435510 - }, - { - "epoch": 0.76, - "learning_rate": 1.2025272306839149e-05, - "loss": 2.195, - "step": 435520 - }, - { - "epoch": 0.76, - "learning_rate": 1.2024400366912323e-05, - "loss": 2.2957, - "step": 435530 - }, - { - "epoch": 0.76, - "learning_rate": 1.2023528426985495e-05, - "loss": 2.2153, - "step": 435540 - }, - { - "epoch": 0.76, - "learning_rate": 1.2022656487058668e-05, - "loss": 2.2859, - "step": 435550 - }, - { - "epoch": 0.76, - "learning_rate": 1.202178454713184e-05, - "loss": 2.3039, - "step": 435560 - }, - { - "epoch": 0.76, - "learning_rate": 1.2020912607205014e-05, - "loss": 2.4033, - "step": 435570 - }, - { - "epoch": 0.76, - "learning_rate": 1.2020040667278188e-05, - "loss": 2.2287, - "step": 435580 - }, - { - "epoch": 0.76, - "learning_rate": 1.2019168727351362e-05, - "loss": 2.3503, - "step": 435590 - }, - { - "epoch": 0.76, - "learning_rate": 1.2018296787424534e-05, - "loss": 2.4052, - "step": 435600 - }, - { - "epoch": 0.76, - "learning_rate": 1.2017424847497708e-05, - "loss": 2.3102, - "step": 435610 - }, - { - "epoch": 0.76, - "learning_rate": 1.201655290757088e-05, - "loss": 2.3511, - "step": 435620 - }, - { - "epoch": 0.76, - "learning_rate": 1.2015680967644053e-05, - "loss": 2.3118, - "step": 435630 - }, - { - "epoch": 0.76, - "learning_rate": 1.2014809027717227e-05, - "loss": 2.3303, - "step": 435640 - }, - { - "epoch": 0.76, - "learning_rate": 1.20139370877904e-05, - "loss": 2.249, - "step": 435650 - }, - { - "epoch": 0.76, - "learning_rate": 1.2013065147863573e-05, - "loss": 2.3284, - "step": 435660 - }, - { - "epoch": 0.76, - "learning_rate": 1.2012193207936747e-05, - "loss": 2.2634, - "step": 435670 - }, - { - "epoch": 0.76, - "learning_rate": 1.201132126800992e-05, - "loss": 2.3045, - "step": 435680 - }, - { - "epoch": 0.76, - "learning_rate": 1.2010449328083093e-05, - "loss": 2.2956, - "step": 435690 - }, - { - "epoch": 0.76, - "learning_rate": 1.2009577388156266e-05, - "loss": 2.3301, - "step": 435700 - }, - { - "epoch": 0.76, - "learning_rate": 1.2008705448229439e-05, - "loss": 2.277, - "step": 435710 - }, - { - "epoch": 0.76, - "learning_rate": 1.2007833508302612e-05, - "loss": 2.2494, - "step": 435720 - }, - { - "epoch": 0.76, - "learning_rate": 1.2006961568375786e-05, - "loss": 2.3249, - "step": 435730 - }, - { - "epoch": 0.76, - "learning_rate": 1.200608962844896e-05, - "loss": 2.2809, - "step": 435740 - }, - { - "epoch": 0.76, - "learning_rate": 1.2005217688522132e-05, - "loss": 2.1963, - "step": 435750 - }, - { - "epoch": 0.76, - "learning_rate": 1.2004345748595306e-05, - "loss": 2.2939, - "step": 435760 - }, - { - "epoch": 0.76, - "learning_rate": 1.200347380866848e-05, - "loss": 2.3309, - "step": 435770 - }, - { - "epoch": 0.76, - "learning_rate": 1.2002601868741652e-05, - "loss": 2.2723, - "step": 435780 - }, - { - "epoch": 0.76, - "learning_rate": 1.2001729928814825e-05, - "loss": 2.2678, - "step": 435790 - }, - { - "epoch": 0.76, - "learning_rate": 1.2000857988887997e-05, - "loss": 2.2241, - "step": 435800 - }, - { - "epoch": 0.76, - "learning_rate": 1.1999986048961171e-05, - "loss": 2.2807, - "step": 435810 - }, - { - "epoch": 0.76, - "learning_rate": 1.1999114109034345e-05, - "loss": 2.2729, - "step": 435820 - }, - { - "epoch": 0.76, - "learning_rate": 1.1998242169107519e-05, - "loss": 2.2196, - "step": 435830 - }, - { - "epoch": 0.76, - "learning_rate": 1.199737022918069e-05, - "loss": 2.3225, - "step": 435840 - }, - { - "epoch": 0.76, - "learning_rate": 1.1996498289253865e-05, - "loss": 2.3192, - "step": 435850 - }, - { - "epoch": 0.76, - "learning_rate": 1.1995626349327037e-05, - "loss": 2.2917, - "step": 435860 - }, - { - "epoch": 0.76, - "learning_rate": 1.199475440940021e-05, - "loss": 2.263, - "step": 435870 - }, - { - "epoch": 0.76, - "learning_rate": 1.1993882469473382e-05, - "loss": 2.2684, - "step": 435880 - }, - { - "epoch": 0.76, - "learning_rate": 1.1993010529546556e-05, - "loss": 2.3755, - "step": 435890 - }, - { - "epoch": 0.76, - "learning_rate": 1.199213858961973e-05, - "loss": 2.2566, - "step": 435900 - }, - { - "epoch": 0.76, - "learning_rate": 1.1991266649692904e-05, - "loss": 2.2614, - "step": 435910 - }, - { - "epoch": 0.76, - "learning_rate": 1.1990394709766078e-05, - "loss": 2.3387, - "step": 435920 - }, - { - "epoch": 0.76, - "learning_rate": 1.198952276983925e-05, - "loss": 2.343, - "step": 435930 - }, - { - "epoch": 0.76, - "learning_rate": 1.1988650829912423e-05, - "loss": 2.277, - "step": 435940 - }, - { - "epoch": 0.76, - "learning_rate": 1.1987778889985595e-05, - "loss": 2.2908, - "step": 435950 - }, - { - "epoch": 0.76, - "learning_rate": 1.198690695005877e-05, - "loss": 2.2535, - "step": 435960 - }, - { - "epoch": 0.76, - "learning_rate": 1.1986035010131941e-05, - "loss": 2.2077, - "step": 435970 - }, - { - "epoch": 0.76, - "learning_rate": 1.1985163070205117e-05, - "loss": 2.3141, - "step": 435980 - }, - { - "epoch": 0.76, - "learning_rate": 1.1984291130278289e-05, - "loss": 2.3001, - "step": 435990 - }, - { - "epoch": 0.76, - "learning_rate": 1.1983419190351463e-05, - "loss": 2.3169, - "step": 436000 - }, - { - "epoch": 0.76, - "learning_rate": 1.1982547250424635e-05, - "loss": 2.3274, - "step": 436010 - }, - { - "epoch": 0.76, - "learning_rate": 1.1981675310497808e-05, - "loss": 2.2395, - "step": 436020 - }, - { - "epoch": 0.76, - "learning_rate": 1.1980803370570982e-05, - "loss": 2.263, - "step": 436030 - }, - { - "epoch": 0.76, - "learning_rate": 1.1979931430644154e-05, - "loss": 2.2891, - "step": 436040 - }, - { - "epoch": 0.76, - "learning_rate": 1.1979059490717328e-05, - "loss": 2.1914, - "step": 436050 - }, - { - "epoch": 0.76, - "learning_rate": 1.1978187550790502e-05, - "loss": 2.2523, - "step": 436060 - }, - { - "epoch": 0.76, - "learning_rate": 1.1977315610863676e-05, - "loss": 2.3598, - "step": 436070 - }, - { - "epoch": 0.76, - "learning_rate": 1.1976443670936848e-05, - "loss": 2.1507, - "step": 436080 - }, - { - "epoch": 0.76, - "learning_rate": 1.1975571731010021e-05, - "loss": 2.2127, - "step": 436090 - }, - { - "epoch": 0.76, - "learning_rate": 1.1974699791083194e-05, - "loss": 2.3488, - "step": 436100 - }, - { - "epoch": 0.76, - "learning_rate": 1.1973827851156367e-05, - "loss": 2.4749, - "step": 436110 - }, - { - "epoch": 0.76, - "learning_rate": 1.197295591122954e-05, - "loss": 2.4008, - "step": 436120 - }, - { - "epoch": 0.76, - "learning_rate": 1.1972083971302713e-05, - "loss": 2.3095, - "step": 436130 - }, - { - "epoch": 0.76, - "learning_rate": 1.1971212031375887e-05, - "loss": 2.2396, - "step": 436140 - }, - { - "epoch": 0.76, - "learning_rate": 1.197034009144906e-05, - "loss": 2.3284, - "step": 436150 - }, - { - "epoch": 0.76, - "learning_rate": 1.1969468151522233e-05, - "loss": 2.2921, - "step": 436160 - }, - { - "epoch": 0.76, - "learning_rate": 1.1968596211595407e-05, - "loss": 2.1272, - "step": 436170 - }, - { - "epoch": 0.76, - "learning_rate": 1.196772427166858e-05, - "loss": 2.2505, - "step": 436180 - }, - { - "epoch": 0.76, - "learning_rate": 1.1966852331741752e-05, - "loss": 2.4698, - "step": 436190 - }, - { - "epoch": 0.76, - "learning_rate": 1.1965980391814926e-05, - "loss": 2.2598, - "step": 436200 - }, - { - "epoch": 0.76, - "learning_rate": 1.1965108451888098e-05, - "loss": 2.2108, - "step": 436210 - }, - { - "epoch": 0.76, - "learning_rate": 1.1964236511961274e-05, - "loss": 2.2687, - "step": 436220 - }, - { - "epoch": 0.76, - "learning_rate": 1.1963364572034446e-05, - "loss": 2.3736, - "step": 436230 - }, - { - "epoch": 0.76, - "learning_rate": 1.196249263210762e-05, - "loss": 2.2154, - "step": 436240 - }, - { - "epoch": 0.76, - "learning_rate": 1.1961620692180792e-05, - "loss": 2.3473, - "step": 436250 - }, - { - "epoch": 0.76, - "learning_rate": 1.1960748752253965e-05, - "loss": 2.3345, - "step": 436260 - }, - { - "epoch": 0.76, - "learning_rate": 1.1959876812327137e-05, - "loss": 2.3999, - "step": 436270 - }, - { - "epoch": 0.76, - "learning_rate": 1.1959004872400311e-05, - "loss": 2.3477, - "step": 436280 - }, - { - "epoch": 0.76, - "learning_rate": 1.1958132932473485e-05, - "loss": 2.2641, - "step": 436290 - }, - { - "epoch": 0.76, - "learning_rate": 1.1957260992546659e-05, - "loss": 2.2217, - "step": 436300 - }, - { - "epoch": 0.76, - "learning_rate": 1.1956389052619833e-05, - "loss": 2.279, - "step": 436310 - }, - { - "epoch": 0.76, - "learning_rate": 1.1955517112693005e-05, - "loss": 2.2767, - "step": 436320 - }, - { - "epoch": 0.76, - "learning_rate": 1.1954645172766178e-05, - "loss": 2.3269, - "step": 436330 - }, - { - "epoch": 0.76, - "learning_rate": 1.195377323283935e-05, - "loss": 2.329, - "step": 436340 - }, - { - "epoch": 0.76, - "learning_rate": 1.1952901292912524e-05, - "loss": 2.35, - "step": 436350 - }, - { - "epoch": 0.76, - "learning_rate": 1.1952029352985696e-05, - "loss": 2.3343, - "step": 436360 - }, - { - "epoch": 0.76, - "learning_rate": 1.195115741305887e-05, - "loss": 2.305, - "step": 436370 - }, - { - "epoch": 0.76, - "learning_rate": 1.1950285473132044e-05, - "loss": 2.3208, - "step": 436380 - }, - { - "epoch": 0.76, - "learning_rate": 1.1949413533205218e-05, - "loss": 2.1747, - "step": 436390 - }, - { - "epoch": 0.76, - "learning_rate": 1.194854159327839e-05, - "loss": 2.2471, - "step": 436400 - }, - { - "epoch": 0.76, - "learning_rate": 1.1947669653351563e-05, - "loss": 2.2062, - "step": 436410 - }, - { - "epoch": 0.76, - "learning_rate": 1.1946797713424736e-05, - "loss": 2.293, - "step": 436420 - }, - { - "epoch": 0.76, - "learning_rate": 1.194592577349791e-05, - "loss": 2.3584, - "step": 436430 - }, - { - "epoch": 0.76, - "learning_rate": 1.1945053833571083e-05, - "loss": 2.2629, - "step": 436440 - }, - { - "epoch": 0.76, - "learning_rate": 1.1944181893644255e-05, - "loss": 2.2457, - "step": 436450 - }, - { - "epoch": 0.76, - "learning_rate": 1.194330995371743e-05, - "loss": 2.233, - "step": 436460 - }, - { - "epoch": 0.76, - "learning_rate": 1.1942438013790603e-05, - "loss": 2.2983, - "step": 436470 - }, - { - "epoch": 0.76, - "learning_rate": 1.1941566073863776e-05, - "loss": 2.2692, - "step": 436480 - }, - { - "epoch": 0.76, - "learning_rate": 1.1940694133936949e-05, - "loss": 2.3063, - "step": 436490 - }, - { - "epoch": 0.76, - "learning_rate": 1.1939822194010122e-05, - "loss": 2.2382, - "step": 436500 - }, - { - "epoch": 0.76, - "learning_rate": 1.1938950254083294e-05, - "loss": 2.1981, - "step": 436510 - }, - { - "epoch": 0.76, - "learning_rate": 1.1938078314156468e-05, - "loss": 2.3661, - "step": 436520 - }, - { - "epoch": 0.76, - "learning_rate": 1.1937206374229642e-05, - "loss": 2.2696, - "step": 436530 - }, - { - "epoch": 0.76, - "learning_rate": 1.1936334434302816e-05, - "loss": 2.1254, - "step": 436540 - }, - { - "epoch": 0.76, - "learning_rate": 1.1935462494375988e-05, - "loss": 2.3049, - "step": 436550 - }, - { - "epoch": 0.76, - "learning_rate": 1.1934590554449162e-05, - "loss": 2.2027, - "step": 436560 - }, - { - "epoch": 0.76, - "learning_rate": 1.1933718614522335e-05, - "loss": 2.2369, - "step": 436570 - }, - { - "epoch": 0.76, - "learning_rate": 1.1932846674595507e-05, - "loss": 2.288, - "step": 436580 - }, - { - "epoch": 0.76, - "learning_rate": 1.1931974734668681e-05, - "loss": 2.2328, - "step": 436590 - }, - { - "epoch": 0.76, - "learning_rate": 1.1931102794741853e-05, - "loss": 2.2589, - "step": 436600 - }, - { - "epoch": 0.76, - "learning_rate": 1.1930230854815027e-05, - "loss": 2.2404, - "step": 436610 - }, - { - "epoch": 0.76, - "learning_rate": 1.19293589148882e-05, - "loss": 2.3324, - "step": 436620 - }, - { - "epoch": 0.76, - "learning_rate": 1.1928486974961375e-05, - "loss": 2.3032, - "step": 436630 - }, - { - "epoch": 0.76, - "learning_rate": 1.1927615035034547e-05, - "loss": 2.264, - "step": 436640 - }, - { - "epoch": 0.76, - "learning_rate": 1.192674309510772e-05, - "loss": 2.2035, - "step": 436650 - }, - { - "epoch": 0.76, - "learning_rate": 1.1925871155180892e-05, - "loss": 2.3162, - "step": 436660 - }, - { - "epoch": 0.76, - "learning_rate": 1.1924999215254066e-05, - "loss": 2.3383, - "step": 436670 - }, - { - "epoch": 0.76, - "learning_rate": 1.1924127275327238e-05, - "loss": 2.14, - "step": 436680 - }, - { - "epoch": 0.76, - "learning_rate": 1.1923255335400412e-05, - "loss": 2.3076, - "step": 436690 - }, - { - "epoch": 0.76, - "learning_rate": 1.1922383395473586e-05, - "loss": 2.3565, - "step": 436700 - }, - { - "epoch": 0.76, - "learning_rate": 1.192151145554676e-05, - "loss": 2.2616, - "step": 436710 - }, - { - "epoch": 0.76, - "learning_rate": 1.1920639515619933e-05, - "loss": 2.1697, - "step": 436720 - }, - { - "epoch": 0.76, - "learning_rate": 1.1919767575693105e-05, - "loss": 2.2209, - "step": 436730 - }, - { - "epoch": 0.76, - "learning_rate": 1.191889563576628e-05, - "loss": 2.3401, - "step": 436740 - }, - { - "epoch": 0.76, - "learning_rate": 1.1918023695839451e-05, - "loss": 2.2343, - "step": 436750 - }, - { - "epoch": 0.76, - "learning_rate": 1.1917151755912625e-05, - "loss": 2.2252, - "step": 436760 - }, - { - "epoch": 0.76, - "learning_rate": 1.1916279815985799e-05, - "loss": 2.3167, - "step": 436770 - }, - { - "epoch": 0.76, - "learning_rate": 1.1915407876058973e-05, - "loss": 2.3346, - "step": 436780 - }, - { - "epoch": 0.76, - "learning_rate": 1.1914535936132145e-05, - "loss": 2.305, - "step": 436790 - }, - { - "epoch": 0.76, - "learning_rate": 1.1913663996205318e-05, - "loss": 2.385, - "step": 436800 - }, - { - "epoch": 0.76, - "learning_rate": 1.191279205627849e-05, - "loss": 2.4493, - "step": 436810 - }, - { - "epoch": 0.76, - "learning_rate": 1.1911920116351664e-05, - "loss": 2.2704, - "step": 436820 - }, - { - "epoch": 0.76, - "learning_rate": 1.1911048176424838e-05, - "loss": 2.4191, - "step": 436830 - }, - { - "epoch": 0.76, - "learning_rate": 1.191017623649801e-05, - "loss": 2.2549, - "step": 436840 - }, - { - "epoch": 0.76, - "learning_rate": 1.1909304296571184e-05, - "loss": 2.3122, - "step": 436850 - }, - { - "epoch": 0.76, - "learning_rate": 1.1908432356644358e-05, - "loss": 2.49, - "step": 436860 - }, - { - "epoch": 0.76, - "learning_rate": 1.1907560416717531e-05, - "loss": 2.3083, - "step": 436870 - }, - { - "epoch": 0.76, - "learning_rate": 1.1906688476790704e-05, - "loss": 2.2988, - "step": 436880 - }, - { - "epoch": 0.76, - "learning_rate": 1.1905816536863877e-05, - "loss": 2.2913, - "step": 436890 - }, - { - "epoch": 0.76, - "learning_rate": 1.190494459693705e-05, - "loss": 2.3435, - "step": 436900 - }, - { - "epoch": 0.76, - "learning_rate": 1.1904072657010223e-05, - "loss": 2.1962, - "step": 436910 - }, - { - "epoch": 0.76, - "learning_rate": 1.1903200717083395e-05, - "loss": 2.2966, - "step": 436920 - }, - { - "epoch": 0.76, - "learning_rate": 1.1902328777156569e-05, - "loss": 2.266, - "step": 436930 - }, - { - "epoch": 0.76, - "learning_rate": 1.1901456837229743e-05, - "loss": 2.1955, - "step": 436940 - }, - { - "epoch": 0.76, - "learning_rate": 1.1900584897302917e-05, - "loss": 2.289, - "step": 436950 - }, - { - "epoch": 0.76, - "learning_rate": 1.189971295737609e-05, - "loss": 2.1969, - "step": 436960 - }, - { - "epoch": 0.76, - "learning_rate": 1.1898841017449262e-05, - "loss": 2.2713, - "step": 436970 - }, - { - "epoch": 0.76, - "learning_rate": 1.1897969077522436e-05, - "loss": 2.2985, - "step": 436980 - }, - { - "epoch": 0.76, - "learning_rate": 1.1897097137595608e-05, - "loss": 2.4081, - "step": 436990 - }, - { - "epoch": 0.76, - "learning_rate": 1.1896225197668782e-05, - "loss": 2.2888, - "step": 437000 - }, - { - "epoch": 0.76, - "learning_rate": 1.1895353257741954e-05, - "loss": 2.2729, - "step": 437010 - }, - { - "epoch": 0.76, - "learning_rate": 1.189448131781513e-05, - "loss": 2.2797, - "step": 437020 - }, - { - "epoch": 0.76, - "learning_rate": 1.1893609377888302e-05, - "loss": 2.3011, - "step": 437030 - }, - { - "epoch": 0.76, - "learning_rate": 1.1892737437961475e-05, - "loss": 2.2451, - "step": 437040 - }, - { - "epoch": 0.76, - "learning_rate": 1.1891865498034647e-05, - "loss": 2.1881, - "step": 437050 - }, - { - "epoch": 0.76, - "learning_rate": 1.1890993558107821e-05, - "loss": 2.0864, - "step": 437060 - }, - { - "epoch": 0.76, - "learning_rate": 1.1890121618180993e-05, - "loss": 2.2867, - "step": 437070 - }, - { - "epoch": 0.76, - "learning_rate": 1.1889249678254167e-05, - "loss": 2.3077, - "step": 437080 - }, - { - "epoch": 0.76, - "learning_rate": 1.1888377738327341e-05, - "loss": 2.2078, - "step": 437090 - }, - { - "epoch": 0.76, - "learning_rate": 1.1887505798400515e-05, - "loss": 2.3033, - "step": 437100 - }, - { - "epoch": 0.76, - "learning_rate": 1.1886633858473688e-05, - "loss": 2.453, - "step": 437110 - }, - { - "epoch": 0.76, - "learning_rate": 1.188576191854686e-05, - "loss": 2.2234, - "step": 437120 - }, - { - "epoch": 0.76, - "learning_rate": 1.1884889978620034e-05, - "loss": 2.2932, - "step": 437130 - }, - { - "epoch": 0.76, - "learning_rate": 1.1884018038693206e-05, - "loss": 2.1201, - "step": 437140 - }, - { - "epoch": 0.76, - "learning_rate": 1.188314609876638e-05, - "loss": 2.259, - "step": 437150 - }, - { - "epoch": 0.76, - "learning_rate": 1.1882274158839552e-05, - "loss": 2.2026, - "step": 437160 - }, - { - "epoch": 0.76, - "learning_rate": 1.1881402218912726e-05, - "loss": 2.3185, - "step": 437170 - }, - { - "epoch": 0.76, - "learning_rate": 1.18805302789859e-05, - "loss": 2.3925, - "step": 437180 - }, - { - "epoch": 0.76, - "learning_rate": 1.1879658339059073e-05, - "loss": 2.3445, - "step": 437190 - }, - { - "epoch": 0.76, - "learning_rate": 1.1878786399132246e-05, - "loss": 2.3259, - "step": 437200 - }, - { - "epoch": 0.76, - "learning_rate": 1.187791445920542e-05, - "loss": 2.2819, - "step": 437210 - }, - { - "epoch": 0.76, - "learning_rate": 1.1877042519278591e-05, - "loss": 2.3233, - "step": 437220 - }, - { - "epoch": 0.76, - "learning_rate": 1.1876170579351765e-05, - "loss": 2.325, - "step": 437230 - }, - { - "epoch": 0.76, - "learning_rate": 1.1875298639424939e-05, - "loss": 2.3831, - "step": 437240 - }, - { - "epoch": 0.76, - "learning_rate": 1.1874426699498111e-05, - "loss": 2.2647, - "step": 437250 - }, - { - "epoch": 0.76, - "learning_rate": 1.1873554759571286e-05, - "loss": 2.2267, - "step": 437260 - }, - { - "epoch": 0.76, - "learning_rate": 1.1872682819644459e-05, - "loss": 2.2798, - "step": 437270 - }, - { - "epoch": 0.76, - "learning_rate": 1.1871810879717632e-05, - "loss": 2.2716, - "step": 437280 - }, - { - "epoch": 0.76, - "learning_rate": 1.1870938939790804e-05, - "loss": 2.3968, - "step": 437290 - }, - { - "epoch": 0.76, - "learning_rate": 1.1870066999863978e-05, - "loss": 2.2871, - "step": 437300 - }, - { - "epoch": 0.76, - "learning_rate": 1.186919505993715e-05, - "loss": 2.2939, - "step": 437310 - }, - { - "epoch": 0.76, - "learning_rate": 1.1868323120010324e-05, - "loss": 2.1815, - "step": 437320 - }, - { - "epoch": 0.76, - "learning_rate": 1.1867451180083498e-05, - "loss": 2.336, - "step": 437330 - }, - { - "epoch": 0.76, - "learning_rate": 1.1866579240156672e-05, - "loss": 2.2191, - "step": 437340 - }, - { - "epoch": 0.76, - "learning_rate": 1.1865707300229844e-05, - "loss": 2.3454, - "step": 437350 - }, - { - "epoch": 0.76, - "learning_rate": 1.1864835360303017e-05, - "loss": 2.4072, - "step": 437360 - }, - { - "epoch": 0.76, - "learning_rate": 1.1863963420376191e-05, - "loss": 2.2659, - "step": 437370 - }, - { - "epoch": 0.76, - "learning_rate": 1.1863091480449363e-05, - "loss": 2.2704, - "step": 437380 - }, - { - "epoch": 0.76, - "learning_rate": 1.1862219540522537e-05, - "loss": 2.1928, - "step": 437390 - }, - { - "epoch": 0.76, - "learning_rate": 1.1861347600595709e-05, - "loss": 2.3157, - "step": 437400 - }, - { - "epoch": 0.76, - "learning_rate": 1.1860475660668883e-05, - "loss": 2.1856, - "step": 437410 - }, - { - "epoch": 0.76, - "learning_rate": 1.1859603720742057e-05, - "loss": 2.3807, - "step": 437420 - }, - { - "epoch": 0.76, - "learning_rate": 1.185873178081523e-05, - "loss": 2.3126, - "step": 437430 - }, - { - "epoch": 0.76, - "learning_rate": 1.1857859840888402e-05, - "loss": 2.2362, - "step": 437440 - }, - { - "epoch": 0.76, - "learning_rate": 1.1856987900961576e-05, - "loss": 2.3099, - "step": 437450 - }, - { - "epoch": 0.76, - "learning_rate": 1.1856115961034748e-05, - "loss": 2.2985, - "step": 437460 - }, - { - "epoch": 0.76, - "learning_rate": 1.1855244021107922e-05, - "loss": 2.3315, - "step": 437470 - }, - { - "epoch": 0.76, - "learning_rate": 1.1854372081181094e-05, - "loss": 2.2503, - "step": 437480 - }, - { - "epoch": 0.76, - "learning_rate": 1.1853500141254268e-05, - "loss": 2.3502, - "step": 437490 - }, - { - "epoch": 0.76, - "learning_rate": 1.1852628201327443e-05, - "loss": 2.2484, - "step": 437500 - }, - { - "epoch": 0.76, - "learning_rate": 1.1851756261400615e-05, - "loss": 2.3198, - "step": 437510 - }, - { - "epoch": 0.76, - "learning_rate": 1.185088432147379e-05, - "loss": 2.3559, - "step": 437520 - }, - { - "epoch": 0.76, - "learning_rate": 1.1850012381546961e-05, - "loss": 2.2279, - "step": 437530 - }, - { - "epoch": 0.76, - "learning_rate": 1.1849140441620135e-05, - "loss": 2.2293, - "step": 437540 - }, - { - "epoch": 0.76, - "learning_rate": 1.1848268501693307e-05, - "loss": 2.3317, - "step": 437550 - }, - { - "epoch": 0.76, - "learning_rate": 1.1847396561766481e-05, - "loss": 2.3056, - "step": 437560 - }, - { - "epoch": 0.76, - "learning_rate": 1.1846524621839655e-05, - "loss": 2.3609, - "step": 437570 - }, - { - "epoch": 0.76, - "learning_rate": 1.1845652681912828e-05, - "loss": 2.2955, - "step": 437580 - }, - { - "epoch": 0.76, - "learning_rate": 1.1844780741986e-05, - "loss": 2.2439, - "step": 437590 - }, - { - "epoch": 0.76, - "learning_rate": 1.1843908802059174e-05, - "loss": 2.2649, - "step": 437600 - }, - { - "epoch": 0.76, - "learning_rate": 1.1843036862132346e-05, - "loss": 2.2604, - "step": 437610 - }, - { - "epoch": 0.76, - "learning_rate": 1.184216492220552e-05, - "loss": 2.2809, - "step": 437620 - }, - { - "epoch": 0.76, - "learning_rate": 1.1841292982278694e-05, - "loss": 2.2751, - "step": 437630 - }, - { - "epoch": 0.76, - "learning_rate": 1.1840421042351866e-05, - "loss": 2.3787, - "step": 437640 - }, - { - "epoch": 0.76, - "learning_rate": 1.183954910242504e-05, - "loss": 2.368, - "step": 437650 - }, - { - "epoch": 0.76, - "learning_rate": 1.1838677162498214e-05, - "loss": 2.2282, - "step": 437660 - }, - { - "epoch": 0.76, - "learning_rate": 1.1837805222571387e-05, - "loss": 2.2739, - "step": 437670 - }, - { - "epoch": 0.76, - "learning_rate": 1.183693328264456e-05, - "loss": 2.3552, - "step": 437680 - }, - { - "epoch": 0.76, - "learning_rate": 1.1836061342717733e-05, - "loss": 2.0246, - "step": 437690 - }, - { - "epoch": 0.76, - "learning_rate": 1.1835189402790905e-05, - "loss": 2.241, - "step": 437700 - }, - { - "epoch": 0.76, - "learning_rate": 1.1834317462864079e-05, - "loss": 2.3704, - "step": 437710 - }, - { - "epoch": 0.76, - "learning_rate": 1.1833445522937251e-05, - "loss": 2.1794, - "step": 437720 - }, - { - "epoch": 0.76, - "learning_rate": 1.1832573583010425e-05, - "loss": 2.1826, - "step": 437730 - }, - { - "epoch": 0.76, - "learning_rate": 1.1831701643083599e-05, - "loss": 2.3267, - "step": 437740 - }, - { - "epoch": 0.76, - "learning_rate": 1.1830829703156772e-05, - "loss": 2.2485, - "step": 437750 - }, - { - "epoch": 0.76, - "learning_rate": 1.1829957763229946e-05, - "loss": 2.3579, - "step": 437760 - }, - { - "epoch": 0.76, - "learning_rate": 1.1829085823303118e-05, - "loss": 2.1757, - "step": 437770 - }, - { - "epoch": 0.76, - "learning_rate": 1.1828213883376292e-05, - "loss": 2.3029, - "step": 437780 - }, - { - "epoch": 0.76, - "learning_rate": 1.1827341943449464e-05, - "loss": 2.2348, - "step": 437790 - }, - { - "epoch": 0.76, - "learning_rate": 1.1826470003522638e-05, - "loss": 2.3018, - "step": 437800 - }, - { - "epoch": 0.76, - "learning_rate": 1.1825598063595812e-05, - "loss": 2.2963, - "step": 437810 - }, - { - "epoch": 0.76, - "learning_rate": 1.1824726123668985e-05, - "loss": 2.3649, - "step": 437820 - }, - { - "epoch": 0.76, - "learning_rate": 1.1823854183742157e-05, - "loss": 2.2898, - "step": 437830 - }, - { - "epoch": 0.76, - "learning_rate": 1.1822982243815331e-05, - "loss": 2.2651, - "step": 437840 - }, - { - "epoch": 0.76, - "learning_rate": 1.1822110303888503e-05, - "loss": 2.2584, - "step": 437850 - }, - { - "epoch": 0.76, - "learning_rate": 1.1821238363961677e-05, - "loss": 2.328, - "step": 437860 - }, - { - "epoch": 0.76, - "learning_rate": 1.182036642403485e-05, - "loss": 2.2122, - "step": 437870 - }, - { - "epoch": 0.76, - "learning_rate": 1.1819494484108023e-05, - "loss": 2.1238, - "step": 437880 - }, - { - "epoch": 0.76, - "learning_rate": 1.1818622544181197e-05, - "loss": 2.2369, - "step": 437890 - }, - { - "epoch": 0.76, - "learning_rate": 1.181775060425437e-05, - "loss": 2.2601, - "step": 437900 - }, - { - "epoch": 0.76, - "learning_rate": 1.1816878664327544e-05, - "loss": 2.3041, - "step": 437910 - }, - { - "epoch": 0.76, - "learning_rate": 1.1816006724400716e-05, - "loss": 2.2176, - "step": 437920 - }, - { - "epoch": 0.76, - "learning_rate": 1.181513478447389e-05, - "loss": 2.2778, - "step": 437930 - }, - { - "epoch": 0.76, - "learning_rate": 1.1814262844547062e-05, - "loss": 2.2285, - "step": 437940 - }, - { - "epoch": 0.76, - "learning_rate": 1.1813390904620236e-05, - "loss": 2.267, - "step": 437950 - }, - { - "epoch": 0.76, - "learning_rate": 1.1812518964693408e-05, - "loss": 2.2607, - "step": 437960 - }, - { - "epoch": 0.76, - "learning_rate": 1.1811647024766582e-05, - "loss": 2.3241, - "step": 437970 - }, - { - "epoch": 0.76, - "learning_rate": 1.1810775084839756e-05, - "loss": 2.2849, - "step": 437980 - }, - { - "epoch": 0.76, - "learning_rate": 1.180990314491293e-05, - "loss": 2.3362, - "step": 437990 - }, - { - "epoch": 0.76, - "learning_rate": 1.1809031204986101e-05, - "loss": 2.3062, - "step": 438000 - }, - { - "epoch": 0.76, - "learning_rate": 1.1808159265059275e-05, - "loss": 2.195, - "step": 438010 - }, - { - "epoch": 0.76, - "learning_rate": 1.1807287325132447e-05, - "loss": 2.3272, - "step": 438020 - }, - { - "epoch": 0.76, - "learning_rate": 1.1806415385205621e-05, - "loss": 2.3001, - "step": 438030 - }, - { - "epoch": 0.76, - "learning_rate": 1.1805543445278795e-05, - "loss": 2.315, - "step": 438040 - }, - { - "epoch": 0.76, - "learning_rate": 1.1804671505351967e-05, - "loss": 2.1472, - "step": 438050 - }, - { - "epoch": 0.76, - "learning_rate": 1.1803799565425142e-05, - "loss": 2.2429, - "step": 438060 - }, - { - "epoch": 0.76, - "learning_rate": 1.1802927625498314e-05, - "loss": 2.2475, - "step": 438070 - }, - { - "epoch": 0.76, - "learning_rate": 1.1802055685571488e-05, - "loss": 2.2943, - "step": 438080 - }, - { - "epoch": 0.76, - "learning_rate": 1.180118374564466e-05, - "loss": 2.3692, - "step": 438090 - }, - { - "epoch": 0.76, - "learning_rate": 1.1800311805717834e-05, - "loss": 2.327, - "step": 438100 - }, - { - "epoch": 0.76, - "learning_rate": 1.1799439865791006e-05, - "loss": 2.2793, - "step": 438110 - }, - { - "epoch": 0.76, - "learning_rate": 1.179856792586418e-05, - "loss": 2.1828, - "step": 438120 - }, - { - "epoch": 0.76, - "learning_rate": 1.1797695985937354e-05, - "loss": 2.4025, - "step": 438130 - }, - { - "epoch": 0.76, - "learning_rate": 1.1796824046010527e-05, - "loss": 2.3, - "step": 438140 - }, - { - "epoch": 0.76, - "learning_rate": 1.17959521060837e-05, - "loss": 2.2573, - "step": 438150 - }, - { - "epoch": 0.76, - "learning_rate": 1.1795080166156873e-05, - "loss": 2.19, - "step": 438160 - }, - { - "epoch": 0.76, - "learning_rate": 1.1794208226230047e-05, - "loss": 2.274, - "step": 438170 - }, - { - "epoch": 0.76, - "learning_rate": 1.1793336286303219e-05, - "loss": 2.3055, - "step": 438180 - }, - { - "epoch": 0.76, - "learning_rate": 1.1792464346376393e-05, - "loss": 2.3269, - "step": 438190 - }, - { - "epoch": 0.76, - "learning_rate": 1.1791592406449565e-05, - "loss": 2.268, - "step": 438200 - }, - { - "epoch": 0.76, - "learning_rate": 1.1790720466522739e-05, - "loss": 2.2477, - "step": 438210 - }, - { - "epoch": 0.76, - "learning_rate": 1.1789848526595912e-05, - "loss": 2.2705, - "step": 438220 - }, - { - "epoch": 0.76, - "learning_rate": 1.1788976586669086e-05, - "loss": 2.2868, - "step": 438230 - }, - { - "epoch": 0.76, - "learning_rate": 1.1788104646742258e-05, - "loss": 2.2267, - "step": 438240 - }, - { - "epoch": 0.76, - "learning_rate": 1.1787232706815432e-05, - "loss": 2.264, - "step": 438250 - }, - { - "epoch": 0.76, - "learning_rate": 1.1786360766888604e-05, - "loss": 2.2902, - "step": 438260 - }, - { - "epoch": 0.76, - "learning_rate": 1.1785488826961778e-05, - "loss": 2.3549, - "step": 438270 - }, - { - "epoch": 0.76, - "learning_rate": 1.178461688703495e-05, - "loss": 2.2446, - "step": 438280 - }, - { - "epoch": 0.76, - "learning_rate": 1.1783744947108124e-05, - "loss": 2.3461, - "step": 438290 - }, - { - "epoch": 0.76, - "learning_rate": 1.17828730071813e-05, - "loss": 2.4054, - "step": 438300 - }, - { - "epoch": 0.76, - "learning_rate": 1.1782001067254471e-05, - "loss": 2.3446, - "step": 438310 - }, - { - "epoch": 0.76, - "learning_rate": 1.1781129127327645e-05, - "loss": 2.1767, - "step": 438320 - }, - { - "epoch": 0.76, - "learning_rate": 1.1780257187400817e-05, - "loss": 2.1974, - "step": 438330 - }, - { - "epoch": 0.76, - "learning_rate": 1.1779385247473991e-05, - "loss": 2.3541, - "step": 438340 - }, - { - "epoch": 0.76, - "learning_rate": 1.1778513307547163e-05, - "loss": 2.4266, - "step": 438350 - }, - { - "epoch": 0.76, - "learning_rate": 1.1777641367620337e-05, - "loss": 2.3797, - "step": 438360 - }, - { - "epoch": 0.76, - "learning_rate": 1.177676942769351e-05, - "loss": 2.3331, - "step": 438370 - }, - { - "epoch": 0.76, - "learning_rate": 1.1775897487766684e-05, - "loss": 2.3934, - "step": 438380 - }, - { - "epoch": 0.76, - "learning_rate": 1.1775025547839856e-05, - "loss": 2.2746, - "step": 438390 - }, - { - "epoch": 0.76, - "learning_rate": 1.177415360791303e-05, - "loss": 2.4004, - "step": 438400 - }, - { - "epoch": 0.76, - "learning_rate": 1.1773281667986202e-05, - "loss": 2.3522, - "step": 438410 - }, - { - "epoch": 0.76, - "learning_rate": 1.1772409728059376e-05, - "loss": 2.2364, - "step": 438420 - }, - { - "epoch": 0.76, - "learning_rate": 1.177153778813255e-05, - "loss": 2.1708, - "step": 438430 - }, - { - "epoch": 0.76, - "learning_rate": 1.1770665848205722e-05, - "loss": 2.2358, - "step": 438440 - }, - { - "epoch": 0.76, - "learning_rate": 1.1769793908278896e-05, - "loss": 2.2252, - "step": 438450 - }, - { - "epoch": 0.76, - "learning_rate": 1.176892196835207e-05, - "loss": 2.4012, - "step": 438460 - }, - { - "epoch": 0.76, - "learning_rate": 1.1768050028425243e-05, - "loss": 2.317, - "step": 438470 - }, - { - "epoch": 0.76, - "learning_rate": 1.1767178088498415e-05, - "loss": 2.3128, - "step": 438480 - }, - { - "epoch": 0.76, - "learning_rate": 1.1766306148571589e-05, - "loss": 2.415, - "step": 438490 - }, - { - "epoch": 0.76, - "learning_rate": 1.1765434208644761e-05, - "loss": 2.2636, - "step": 438500 - }, - { - "epoch": 0.76, - "learning_rate": 1.1764562268717935e-05, - "loss": 2.3215, - "step": 438510 - }, - { - "epoch": 0.76, - "learning_rate": 1.1763690328791107e-05, - "loss": 2.2097, - "step": 438520 - }, - { - "epoch": 0.76, - "learning_rate": 1.176281838886428e-05, - "loss": 2.1438, - "step": 438530 - }, - { - "epoch": 0.76, - "learning_rate": 1.1761946448937454e-05, - "loss": 2.265, - "step": 438540 - }, - { - "epoch": 0.76, - "learning_rate": 1.1761074509010628e-05, - "loss": 2.2696, - "step": 438550 - }, - { - "epoch": 0.76, - "learning_rate": 1.1760202569083802e-05, - "loss": 2.4999, - "step": 438560 - }, - { - "epoch": 0.76, - "learning_rate": 1.1759330629156974e-05, - "loss": 2.371, - "step": 438570 - }, - { - "epoch": 0.76, - "learning_rate": 1.1758458689230148e-05, - "loss": 2.2285, - "step": 438580 - }, - { - "epoch": 0.76, - "learning_rate": 1.175758674930332e-05, - "loss": 2.2791, - "step": 438590 - }, - { - "epoch": 0.76, - "learning_rate": 1.1756714809376494e-05, - "loss": 2.3049, - "step": 438600 - }, - { - "epoch": 0.76, - "learning_rate": 1.1755842869449667e-05, - "loss": 2.2164, - "step": 438610 - }, - { - "epoch": 0.76, - "learning_rate": 1.1754970929522841e-05, - "loss": 2.2926, - "step": 438620 - }, - { - "epoch": 0.76, - "learning_rate": 1.1754098989596013e-05, - "loss": 2.2853, - "step": 438630 - }, - { - "epoch": 0.76, - "learning_rate": 1.1753227049669187e-05, - "loss": 2.3771, - "step": 438640 - }, - { - "epoch": 0.76, - "learning_rate": 1.175235510974236e-05, - "loss": 2.3758, - "step": 438650 - }, - { - "epoch": 0.76, - "learning_rate": 1.1751483169815533e-05, - "loss": 2.3044, - "step": 438660 - }, - { - "epoch": 0.76, - "learning_rate": 1.1750611229888705e-05, - "loss": 2.1976, - "step": 438670 - }, - { - "epoch": 0.77, - "learning_rate": 1.1749739289961879e-05, - "loss": 2.2946, - "step": 438680 - }, - { - "epoch": 0.77, - "learning_rate": 1.1748867350035053e-05, - "loss": 2.1538, - "step": 438690 - }, - { - "epoch": 0.77, - "learning_rate": 1.1747995410108226e-05, - "loss": 2.2845, - "step": 438700 - }, - { - "epoch": 0.77, - "learning_rate": 1.17471234701814e-05, - "loss": 2.2547, - "step": 438710 - }, - { - "epoch": 0.77, - "learning_rate": 1.1746251530254572e-05, - "loss": 2.3169, - "step": 438720 - }, - { - "epoch": 0.77, - "learning_rate": 1.1745379590327746e-05, - "loss": 2.2718, - "step": 438730 - }, - { - "epoch": 0.77, - "learning_rate": 1.1744507650400918e-05, - "loss": 2.2979, - "step": 438740 - }, - { - "epoch": 0.77, - "learning_rate": 1.1743635710474092e-05, - "loss": 2.1868, - "step": 438750 - }, - { - "epoch": 0.77, - "learning_rate": 1.1742763770547264e-05, - "loss": 2.2695, - "step": 438760 - }, - { - "epoch": 0.77, - "learning_rate": 1.1741891830620438e-05, - "loss": 2.2908, - "step": 438770 - }, - { - "epoch": 0.77, - "learning_rate": 1.1741019890693611e-05, - "loss": 2.2445, - "step": 438780 - }, - { - "epoch": 0.77, - "learning_rate": 1.1740147950766785e-05, - "loss": 2.4076, - "step": 438790 - }, - { - "epoch": 0.77, - "learning_rate": 1.1739276010839957e-05, - "loss": 2.3065, - "step": 438800 - }, - { - "epoch": 0.77, - "learning_rate": 1.1738404070913131e-05, - "loss": 2.3337, - "step": 438810 - }, - { - "epoch": 0.77, - "learning_rate": 1.1737532130986303e-05, - "loss": 2.2239, - "step": 438820 - }, - { - "epoch": 0.77, - "learning_rate": 1.1736660191059477e-05, - "loss": 2.3039, - "step": 438830 - }, - { - "epoch": 0.77, - "learning_rate": 1.173578825113265e-05, - "loss": 2.3793, - "step": 438840 - }, - { - "epoch": 0.77, - "learning_rate": 1.1734916311205824e-05, - "loss": 2.239, - "step": 438850 - }, - { - "epoch": 0.77, - "learning_rate": 1.1734044371278998e-05, - "loss": 2.2663, - "step": 438860 - }, - { - "epoch": 0.77, - "learning_rate": 1.173317243135217e-05, - "loss": 2.1068, - "step": 438870 - }, - { - "epoch": 0.77, - "learning_rate": 1.1732300491425344e-05, - "loss": 2.1901, - "step": 438880 - }, - { - "epoch": 0.77, - "learning_rate": 1.1731428551498516e-05, - "loss": 2.229, - "step": 438890 - }, - { - "epoch": 0.77, - "learning_rate": 1.173055661157169e-05, - "loss": 2.2318, - "step": 438900 - }, - { - "epoch": 0.77, - "learning_rate": 1.1729684671644862e-05, - "loss": 2.1943, - "step": 438910 - }, - { - "epoch": 0.77, - "learning_rate": 1.1728812731718036e-05, - "loss": 2.2803, - "step": 438920 - }, - { - "epoch": 0.77, - "learning_rate": 1.172794079179121e-05, - "loss": 2.2416, - "step": 438930 - }, - { - "epoch": 0.77, - "learning_rate": 1.1727068851864383e-05, - "loss": 2.2278, - "step": 438940 - }, - { - "epoch": 0.77, - "learning_rate": 1.1726196911937555e-05, - "loss": 2.2074, - "step": 438950 - }, - { - "epoch": 0.77, - "learning_rate": 1.1725324972010729e-05, - "loss": 2.182, - "step": 438960 - }, - { - "epoch": 0.77, - "learning_rate": 1.1724453032083903e-05, - "loss": 2.2698, - "step": 438970 - }, - { - "epoch": 0.77, - "learning_rate": 1.1723581092157075e-05, - "loss": 2.2911, - "step": 438980 - }, - { - "epoch": 0.77, - "learning_rate": 1.1722709152230249e-05, - "loss": 2.3819, - "step": 438990 - }, - { - "epoch": 0.77, - "learning_rate": 1.172183721230342e-05, - "loss": 2.2482, - "step": 439000 - }, - { - "epoch": 0.77, - "learning_rate": 1.1720965272376595e-05, - "loss": 2.1293, - "step": 439010 - }, - { - "epoch": 0.77, - "learning_rate": 1.1720093332449768e-05, - "loss": 2.2876, - "step": 439020 - }, - { - "epoch": 0.77, - "learning_rate": 1.1719221392522942e-05, - "loss": 2.2393, - "step": 439030 - }, - { - "epoch": 0.77, - "learning_rate": 1.1718349452596114e-05, - "loss": 2.2584, - "step": 439040 - }, - { - "epoch": 0.77, - "learning_rate": 1.1717477512669288e-05, - "loss": 2.3677, - "step": 439050 - }, - { - "epoch": 0.77, - "learning_rate": 1.171660557274246e-05, - "loss": 2.2718, - "step": 439060 - }, - { - "epoch": 0.77, - "learning_rate": 1.1715733632815634e-05, - "loss": 2.2359, - "step": 439070 - }, - { - "epoch": 0.77, - "learning_rate": 1.1714861692888806e-05, - "loss": 2.2136, - "step": 439080 - }, - { - "epoch": 0.77, - "learning_rate": 1.171398975296198e-05, - "loss": 2.2367, - "step": 439090 - }, - { - "epoch": 0.77, - "learning_rate": 1.1713117813035155e-05, - "loss": 2.3731, - "step": 439100 - }, - { - "epoch": 0.77, - "learning_rate": 1.1712245873108327e-05, - "loss": 2.2727, - "step": 439110 - }, - { - "epoch": 0.77, - "learning_rate": 1.1711373933181501e-05, - "loss": 2.2035, - "step": 439120 - }, - { - "epoch": 0.77, - "learning_rate": 1.1710501993254673e-05, - "loss": 2.3439, - "step": 439130 - }, - { - "epoch": 0.77, - "learning_rate": 1.1709630053327847e-05, - "loss": 2.3064, - "step": 439140 - }, - { - "epoch": 0.77, - "learning_rate": 1.1708758113401019e-05, - "loss": 2.3385, - "step": 439150 - }, - { - "epoch": 0.77, - "learning_rate": 1.1707886173474193e-05, - "loss": 2.2957, - "step": 439160 - }, - { - "epoch": 0.77, - "learning_rate": 1.1707014233547366e-05, - "loss": 2.3467, - "step": 439170 - }, - { - "epoch": 0.77, - "learning_rate": 1.170614229362054e-05, - "loss": 2.3405, - "step": 439180 - }, - { - "epoch": 0.77, - "learning_rate": 1.1705270353693712e-05, - "loss": 2.3456, - "step": 439190 - }, - { - "epoch": 0.77, - "learning_rate": 1.1704398413766886e-05, - "loss": 2.3471, - "step": 439200 - }, - { - "epoch": 0.77, - "learning_rate": 1.1703526473840058e-05, - "loss": 2.3141, - "step": 439210 - }, - { - "epoch": 0.77, - "learning_rate": 1.1702654533913232e-05, - "loss": 2.3868, - "step": 439220 - }, - { - "epoch": 0.77, - "learning_rate": 1.1701782593986406e-05, - "loss": 2.2235, - "step": 439230 - }, - { - "epoch": 0.77, - "learning_rate": 1.1700910654059578e-05, - "loss": 2.189, - "step": 439240 - }, - { - "epoch": 0.77, - "learning_rate": 1.1700038714132751e-05, - "loss": 2.2305, - "step": 439250 - }, - { - "epoch": 0.77, - "learning_rate": 1.1699166774205925e-05, - "loss": 2.3076, - "step": 439260 - }, - { - "epoch": 0.77, - "learning_rate": 1.1698294834279099e-05, - "loss": 2.365, - "step": 439270 - }, - { - "epoch": 0.77, - "learning_rate": 1.1697422894352271e-05, - "loss": 2.3477, - "step": 439280 - }, - { - "epoch": 0.77, - "learning_rate": 1.1696550954425445e-05, - "loss": 2.3484, - "step": 439290 - }, - { - "epoch": 0.77, - "learning_rate": 1.1695679014498617e-05, - "loss": 2.2972, - "step": 439300 - }, - { - "epoch": 0.77, - "learning_rate": 1.169480707457179e-05, - "loss": 2.2838, - "step": 439310 - }, - { - "epoch": 0.77, - "learning_rate": 1.1693935134644963e-05, - "loss": 2.2388, - "step": 439320 - }, - { - "epoch": 0.77, - "learning_rate": 1.1693063194718137e-05, - "loss": 2.3089, - "step": 439330 - }, - { - "epoch": 0.77, - "learning_rate": 1.169219125479131e-05, - "loss": 2.2813, - "step": 439340 - }, - { - "epoch": 0.77, - "learning_rate": 1.1691319314864484e-05, - "loss": 2.4205, - "step": 439350 - }, - { - "epoch": 0.77, - "learning_rate": 1.1690447374937658e-05, - "loss": 2.3515, - "step": 439360 - }, - { - "epoch": 0.77, - "learning_rate": 1.168957543501083e-05, - "loss": 2.3287, - "step": 439370 - }, - { - "epoch": 0.77, - "learning_rate": 1.1688703495084004e-05, - "loss": 2.3202, - "step": 439380 - }, - { - "epoch": 0.77, - "learning_rate": 1.1687831555157176e-05, - "loss": 2.3228, - "step": 439390 - }, - { - "epoch": 0.77, - "learning_rate": 1.168695961523035e-05, - "loss": 2.265, - "step": 439400 - }, - { - "epoch": 0.77, - "learning_rate": 1.1686087675303523e-05, - "loss": 2.2284, - "step": 439410 - }, - { - "epoch": 0.77, - "learning_rate": 1.1685215735376697e-05, - "loss": 2.4191, - "step": 439420 - }, - { - "epoch": 0.77, - "learning_rate": 1.168434379544987e-05, - "loss": 2.3629, - "step": 439430 - }, - { - "epoch": 0.77, - "learning_rate": 1.1683471855523043e-05, - "loss": 2.3072, - "step": 439440 - }, - { - "epoch": 0.77, - "learning_rate": 1.1682599915596215e-05, - "loss": 2.2466, - "step": 439450 - }, - { - "epoch": 0.77, - "learning_rate": 1.1681727975669389e-05, - "loss": 2.3138, - "step": 439460 - }, - { - "epoch": 0.77, - "learning_rate": 1.1680856035742561e-05, - "loss": 2.285, - "step": 439470 - }, - { - "epoch": 0.77, - "learning_rate": 1.1679984095815735e-05, - "loss": 2.3356, - "step": 439480 - }, - { - "epoch": 0.77, - "learning_rate": 1.1679112155888908e-05, - "loss": 2.2668, - "step": 439490 - }, - { - "epoch": 0.77, - "learning_rate": 1.1678240215962082e-05, - "loss": 2.3318, - "step": 439500 - }, - { - "epoch": 0.77, - "learning_rate": 1.1677368276035256e-05, - "loss": 2.276, - "step": 439510 - }, - { - "epoch": 0.77, - "learning_rate": 1.1676496336108428e-05, - "loss": 2.2518, - "step": 439520 - }, - { - "epoch": 0.77, - "learning_rate": 1.1675624396181602e-05, - "loss": 2.3168, - "step": 439530 - }, - { - "epoch": 0.77, - "learning_rate": 1.1674752456254774e-05, - "loss": 2.3134, - "step": 439540 - }, - { - "epoch": 0.77, - "learning_rate": 1.1673880516327948e-05, - "loss": 2.3527, - "step": 439550 - }, - { - "epoch": 0.77, - "learning_rate": 1.167300857640112e-05, - "loss": 2.4295, - "step": 439560 - }, - { - "epoch": 0.77, - "learning_rate": 1.1672136636474293e-05, - "loss": 2.3475, - "step": 439570 - }, - { - "epoch": 0.77, - "learning_rate": 1.1671264696547467e-05, - "loss": 2.1997, - "step": 439580 - }, - { - "epoch": 0.77, - "learning_rate": 1.1670392756620641e-05, - "loss": 2.2278, - "step": 439590 - }, - { - "epoch": 0.77, - "learning_rate": 1.1669520816693813e-05, - "loss": 2.204, - "step": 439600 - }, - { - "epoch": 0.77, - "learning_rate": 1.1668648876766987e-05, - "loss": 2.3062, - "step": 439610 - }, - { - "epoch": 0.77, - "learning_rate": 1.166777693684016e-05, - "loss": 2.2507, - "step": 439620 - }, - { - "epoch": 0.77, - "learning_rate": 1.1666904996913333e-05, - "loss": 2.3325, - "step": 439630 - }, - { - "epoch": 0.77, - "learning_rate": 1.1666033056986506e-05, - "loss": 2.2483, - "step": 439640 - }, - { - "epoch": 0.77, - "learning_rate": 1.166516111705968e-05, - "loss": 2.3445, - "step": 439650 - }, - { - "epoch": 0.77, - "learning_rate": 1.1664289177132854e-05, - "loss": 2.1863, - "step": 439660 - }, - { - "epoch": 0.77, - "learning_rate": 1.1663417237206026e-05, - "loss": 2.283, - "step": 439670 - }, - { - "epoch": 0.77, - "learning_rate": 1.16625452972792e-05, - "loss": 2.2978, - "step": 439680 - }, - { - "epoch": 0.77, - "learning_rate": 1.1661673357352372e-05, - "loss": 2.2829, - "step": 439690 - }, - { - "epoch": 0.77, - "learning_rate": 1.1660801417425546e-05, - "loss": 2.3124, - "step": 439700 - }, - { - "epoch": 0.77, - "learning_rate": 1.1659929477498718e-05, - "loss": 2.3278, - "step": 439710 - }, - { - "epoch": 0.77, - "learning_rate": 1.1659057537571892e-05, - "loss": 2.2392, - "step": 439720 - }, - { - "epoch": 0.77, - "learning_rate": 1.1658185597645065e-05, - "loss": 2.344, - "step": 439730 - }, - { - "epoch": 0.77, - "learning_rate": 1.1657313657718239e-05, - "loss": 2.165, - "step": 439740 - }, - { - "epoch": 0.77, - "learning_rate": 1.1656441717791411e-05, - "loss": 2.3424, - "step": 439750 - }, - { - "epoch": 0.77, - "learning_rate": 1.1655569777864585e-05, - "loss": 2.3458, - "step": 439760 - }, - { - "epoch": 0.77, - "learning_rate": 1.1654697837937759e-05, - "loss": 2.3166, - "step": 439770 - }, - { - "epoch": 0.77, - "learning_rate": 1.165382589801093e-05, - "loss": 2.256, - "step": 439780 - }, - { - "epoch": 0.77, - "learning_rate": 1.1652953958084105e-05, - "loss": 2.2272, - "step": 439790 - }, - { - "epoch": 0.77, - "learning_rate": 1.1652082018157277e-05, - "loss": 2.322, - "step": 439800 - }, - { - "epoch": 0.77, - "learning_rate": 1.165121007823045e-05, - "loss": 2.2766, - "step": 439810 - }, - { - "epoch": 0.77, - "learning_rate": 1.1650338138303624e-05, - "loss": 2.3352, - "step": 439820 - }, - { - "epoch": 0.77, - "learning_rate": 1.1649466198376798e-05, - "loss": 2.4012, - "step": 439830 - }, - { - "epoch": 0.77, - "learning_rate": 1.164859425844997e-05, - "loss": 2.3911, - "step": 439840 - }, - { - "epoch": 0.77, - "learning_rate": 1.1647722318523144e-05, - "loss": 2.3384, - "step": 439850 - }, - { - "epoch": 0.77, - "learning_rate": 1.1646850378596316e-05, - "loss": 2.2549, - "step": 439860 - }, - { - "epoch": 0.77, - "learning_rate": 1.164597843866949e-05, - "loss": 2.3206, - "step": 439870 - }, - { - "epoch": 0.77, - "learning_rate": 1.1645106498742662e-05, - "loss": 2.353, - "step": 439880 - }, - { - "epoch": 0.77, - "learning_rate": 1.1644234558815837e-05, - "loss": 2.2649, - "step": 439890 - }, - { - "epoch": 0.77, - "learning_rate": 1.1643362618889011e-05, - "loss": 2.239, - "step": 439900 - }, - { - "epoch": 0.77, - "learning_rate": 1.1642490678962183e-05, - "loss": 2.1971, - "step": 439910 - }, - { - "epoch": 0.77, - "learning_rate": 1.1641618739035357e-05, - "loss": 2.3096, - "step": 439920 - }, - { - "epoch": 0.77, - "learning_rate": 1.1640746799108529e-05, - "loss": 2.3334, - "step": 439930 - }, - { - "epoch": 0.77, - "learning_rate": 1.1639874859181703e-05, - "loss": 2.374, - "step": 439940 - }, - { - "epoch": 0.77, - "learning_rate": 1.1639002919254875e-05, - "loss": 2.3248, - "step": 439950 - }, - { - "epoch": 0.77, - "learning_rate": 1.1638130979328048e-05, - "loss": 2.3077, - "step": 439960 - }, - { - "epoch": 0.77, - "learning_rate": 1.1637259039401222e-05, - "loss": 2.3445, - "step": 439970 - }, - { - "epoch": 0.77, - "learning_rate": 1.1636387099474396e-05, - "loss": 2.2927, - "step": 439980 - }, - { - "epoch": 0.77, - "learning_rate": 1.1635515159547568e-05, - "loss": 2.2255, - "step": 439990 - }, - { - "epoch": 0.77, - "learning_rate": 1.1634643219620742e-05, - "loss": 2.344, - "step": 440000 - }, - { - "epoch": 0.77, - "learning_rate": 1.1633771279693914e-05, - "loss": 2.2819, - "step": 440010 - }, - { - "epoch": 0.77, - "learning_rate": 1.1632899339767088e-05, - "loss": 2.2565, - "step": 440020 - }, - { - "epoch": 0.77, - "learning_rate": 1.1632027399840261e-05, - "loss": 2.2535, - "step": 440030 - }, - { - "epoch": 0.77, - "learning_rate": 1.1631155459913434e-05, - "loss": 2.3199, - "step": 440040 - }, - { - "epoch": 0.77, - "learning_rate": 1.1630283519986607e-05, - "loss": 2.2195, - "step": 440050 - }, - { - "epoch": 0.77, - "learning_rate": 1.1629411580059781e-05, - "loss": 2.2199, - "step": 440060 - }, - { - "epoch": 0.77, - "learning_rate": 1.1628539640132955e-05, - "loss": 2.2482, - "step": 440070 - }, - { - "epoch": 0.77, - "learning_rate": 1.1627667700206127e-05, - "loss": 2.2641, - "step": 440080 - }, - { - "epoch": 0.77, - "learning_rate": 1.16267957602793e-05, - "loss": 2.2342, - "step": 440090 - }, - { - "epoch": 0.77, - "learning_rate": 1.1625923820352473e-05, - "loss": 2.3322, - "step": 440100 - }, - { - "epoch": 0.77, - "learning_rate": 1.1625051880425647e-05, - "loss": 2.3296, - "step": 440110 - }, - { - "epoch": 0.77, - "learning_rate": 1.1624179940498819e-05, - "loss": 2.3057, - "step": 440120 - }, - { - "epoch": 0.77, - "learning_rate": 1.1623308000571992e-05, - "loss": 2.3281, - "step": 440130 - }, - { - "epoch": 0.77, - "learning_rate": 1.1622436060645166e-05, - "loss": 2.2251, - "step": 440140 - }, - { - "epoch": 0.77, - "learning_rate": 1.162156412071834e-05, - "loss": 2.138, - "step": 440150 - }, - { - "epoch": 0.77, - "learning_rate": 1.1620692180791514e-05, - "loss": 2.2566, - "step": 440160 - }, - { - "epoch": 0.77, - "learning_rate": 1.1619820240864686e-05, - "loss": 2.3324, - "step": 440170 - }, - { - "epoch": 0.77, - "learning_rate": 1.161894830093786e-05, - "loss": 2.3647, - "step": 440180 - }, - { - "epoch": 0.77, - "learning_rate": 1.1618076361011032e-05, - "loss": 2.2662, - "step": 440190 - }, - { - "epoch": 0.77, - "learning_rate": 1.1617204421084205e-05, - "loss": 2.3397, - "step": 440200 - }, - { - "epoch": 0.77, - "learning_rate": 1.161633248115738e-05, - "loss": 2.1374, - "step": 440210 - }, - { - "epoch": 0.77, - "learning_rate": 1.1615460541230553e-05, - "loss": 2.3566, - "step": 440220 - }, - { - "epoch": 0.77, - "learning_rate": 1.1614588601303725e-05, - "loss": 2.3496, - "step": 440230 - }, - { - "epoch": 0.77, - "learning_rate": 1.1613716661376899e-05, - "loss": 2.3534, - "step": 440240 - }, - { - "epoch": 0.77, - "learning_rate": 1.1612844721450071e-05, - "loss": 2.2905, - "step": 440250 - }, - { - "epoch": 0.77, - "learning_rate": 1.1611972781523245e-05, - "loss": 2.2326, - "step": 440260 - }, - { - "epoch": 0.77, - "learning_rate": 1.1611100841596417e-05, - "loss": 2.3108, - "step": 440270 - }, - { - "epoch": 0.77, - "learning_rate": 1.161022890166959e-05, - "loss": 2.2599, - "step": 440280 - }, - { - "epoch": 0.77, - "learning_rate": 1.1609356961742764e-05, - "loss": 2.3368, - "step": 440290 - }, - { - "epoch": 0.77, - "learning_rate": 1.1608485021815938e-05, - "loss": 2.372, - "step": 440300 - }, - { - "epoch": 0.77, - "learning_rate": 1.1607613081889112e-05, - "loss": 2.3474, - "step": 440310 - }, - { - "epoch": 0.77, - "learning_rate": 1.1606741141962284e-05, - "loss": 2.2903, - "step": 440320 - }, - { - "epoch": 0.77, - "learning_rate": 1.1605869202035458e-05, - "loss": 2.3847, - "step": 440330 - }, - { - "epoch": 0.77, - "learning_rate": 1.160499726210863e-05, - "loss": 2.3456, - "step": 440340 - }, - { - "epoch": 0.77, - "learning_rate": 1.1604125322181803e-05, - "loss": 2.1777, - "step": 440350 - }, - { - "epoch": 0.77, - "learning_rate": 1.1603253382254976e-05, - "loss": 2.3557, - "step": 440360 - }, - { - "epoch": 0.77, - "learning_rate": 1.160238144232815e-05, - "loss": 2.3247, - "step": 440370 - }, - { - "epoch": 0.77, - "learning_rate": 1.1601509502401323e-05, - "loss": 2.3388, - "step": 440380 - }, - { - "epoch": 0.77, - "learning_rate": 1.1600637562474497e-05, - "loss": 2.2179, - "step": 440390 - }, - { - "epoch": 0.77, - "learning_rate": 1.1599765622547669e-05, - "loss": 2.2306, - "step": 440400 - }, - { - "epoch": 0.77, - "learning_rate": 1.1598893682620843e-05, - "loss": 2.277, - "step": 440410 - }, - { - "epoch": 0.77, - "learning_rate": 1.1598021742694017e-05, - "loss": 2.2958, - "step": 440420 - }, - { - "epoch": 0.77, - "learning_rate": 1.1597149802767189e-05, - "loss": 2.2306, - "step": 440430 - }, - { - "epoch": 0.77, - "learning_rate": 1.1596277862840362e-05, - "loss": 2.1943, - "step": 440440 - }, - { - "epoch": 0.77, - "learning_rate": 1.1595405922913536e-05, - "loss": 2.3639, - "step": 440450 - }, - { - "epoch": 0.77, - "learning_rate": 1.159453398298671e-05, - "loss": 2.2936, - "step": 440460 - }, - { - "epoch": 0.77, - "learning_rate": 1.1593662043059882e-05, - "loss": 2.176, - "step": 440470 - }, - { - "epoch": 0.77, - "learning_rate": 1.1592790103133056e-05, - "loss": 2.1451, - "step": 440480 - }, - { - "epoch": 0.77, - "learning_rate": 1.1591918163206228e-05, - "loss": 2.3523, - "step": 440490 - }, - { - "epoch": 0.77, - "learning_rate": 1.1591046223279402e-05, - "loss": 2.3878, - "step": 440500 - }, - { - "epoch": 0.77, - "learning_rate": 1.1590174283352574e-05, - "loss": 2.3117, - "step": 440510 - }, - { - "epoch": 0.77, - "learning_rate": 1.1589302343425747e-05, - "loss": 2.4163, - "step": 440520 - }, - { - "epoch": 0.77, - "learning_rate": 1.1588430403498921e-05, - "loss": 2.3461, - "step": 440530 - }, - { - "epoch": 0.77, - "learning_rate": 1.1587558463572095e-05, - "loss": 2.2792, - "step": 440540 - }, - { - "epoch": 0.77, - "learning_rate": 1.1586686523645267e-05, - "loss": 2.3513, - "step": 440550 - }, - { - "epoch": 0.77, - "learning_rate": 1.158581458371844e-05, - "loss": 2.3076, - "step": 440560 - }, - { - "epoch": 0.77, - "learning_rate": 1.1584942643791615e-05, - "loss": 2.1899, - "step": 440570 - }, - { - "epoch": 0.77, - "learning_rate": 1.1584070703864787e-05, - "loss": 2.1465, - "step": 440580 - }, - { - "epoch": 0.77, - "learning_rate": 1.158319876393796e-05, - "loss": 2.2403, - "step": 440590 - }, - { - "epoch": 0.77, - "learning_rate": 1.1582326824011133e-05, - "loss": 2.2381, - "step": 440600 - }, - { - "epoch": 0.77, - "learning_rate": 1.1581454884084306e-05, - "loss": 2.2999, - "step": 440610 - }, - { - "epoch": 0.77, - "learning_rate": 1.158058294415748e-05, - "loss": 2.3578, - "step": 440620 - }, - { - "epoch": 0.77, - "learning_rate": 1.1579711004230654e-05, - "loss": 2.3703, - "step": 440630 - }, - { - "epoch": 0.77, - "learning_rate": 1.1578839064303826e-05, - "loss": 2.2819, - "step": 440640 - }, - { - "epoch": 0.77, - "learning_rate": 1.1577967124377e-05, - "loss": 2.3156, - "step": 440650 - }, - { - "epoch": 0.77, - "learning_rate": 1.1577095184450172e-05, - "loss": 2.3167, - "step": 440660 - }, - { - "epoch": 0.77, - "learning_rate": 1.1576223244523346e-05, - "loss": 2.2281, - "step": 440670 - }, - { - "epoch": 0.77, - "learning_rate": 1.1575351304596518e-05, - "loss": 2.2529, - "step": 440680 - }, - { - "epoch": 0.77, - "learning_rate": 1.1574479364669693e-05, - "loss": 2.3718, - "step": 440690 - }, - { - "epoch": 0.77, - "learning_rate": 1.1573607424742867e-05, - "loss": 2.3906, - "step": 440700 - }, - { - "epoch": 0.77, - "learning_rate": 1.1572735484816039e-05, - "loss": 2.3601, - "step": 440710 - }, - { - "epoch": 0.77, - "learning_rate": 1.1571863544889213e-05, - "loss": 2.2727, - "step": 440720 - }, - { - "epoch": 0.77, - "learning_rate": 1.1570991604962385e-05, - "loss": 2.2464, - "step": 440730 - }, - { - "epoch": 0.77, - "learning_rate": 1.1570119665035559e-05, - "loss": 2.2479, - "step": 440740 - }, - { - "epoch": 0.77, - "learning_rate": 1.156924772510873e-05, - "loss": 2.1991, - "step": 440750 - }, - { - "epoch": 0.77, - "learning_rate": 1.1568375785181904e-05, - "loss": 2.2424, - "step": 440760 - }, - { - "epoch": 0.77, - "learning_rate": 1.1567503845255078e-05, - "loss": 2.2998, - "step": 440770 - }, - { - "epoch": 0.77, - "learning_rate": 1.1566631905328252e-05, - "loss": 2.2732, - "step": 440780 - }, - { - "epoch": 0.77, - "learning_rate": 1.1565759965401424e-05, - "loss": 2.2798, - "step": 440790 - }, - { - "epoch": 0.77, - "learning_rate": 1.1564888025474598e-05, - "loss": 2.3549, - "step": 440800 - }, - { - "epoch": 0.77, - "learning_rate": 1.156401608554777e-05, - "loss": 2.385, - "step": 440810 - }, - { - "epoch": 0.77, - "learning_rate": 1.1563144145620944e-05, - "loss": 2.23, - "step": 440820 - }, - { - "epoch": 0.77, - "learning_rate": 1.1562272205694117e-05, - "loss": 2.2472, - "step": 440830 - }, - { - "epoch": 0.77, - "learning_rate": 1.156140026576729e-05, - "loss": 2.3045, - "step": 440840 - }, - { - "epoch": 0.77, - "learning_rate": 1.1560528325840463e-05, - "loss": 2.2812, - "step": 440850 - }, - { - "epoch": 0.77, - "learning_rate": 1.1559656385913637e-05, - "loss": 2.3309, - "step": 440860 - }, - { - "epoch": 0.77, - "learning_rate": 1.155878444598681e-05, - "loss": 2.3459, - "step": 440870 - }, - { - "epoch": 0.77, - "learning_rate": 1.1557912506059983e-05, - "loss": 2.3818, - "step": 440880 - }, - { - "epoch": 0.77, - "learning_rate": 1.1557040566133157e-05, - "loss": 2.3476, - "step": 440890 - }, - { - "epoch": 0.77, - "learning_rate": 1.1556168626206329e-05, - "loss": 2.2308, - "step": 440900 - }, - { - "epoch": 0.77, - "learning_rate": 1.1555296686279502e-05, - "loss": 2.2354, - "step": 440910 - }, - { - "epoch": 0.77, - "learning_rate": 1.1554424746352675e-05, - "loss": 2.2878, - "step": 440920 - }, - { - "epoch": 0.77, - "learning_rate": 1.155355280642585e-05, - "loss": 2.291, - "step": 440930 - }, - { - "epoch": 0.77, - "learning_rate": 1.1552680866499022e-05, - "loss": 2.2726, - "step": 440940 - }, - { - "epoch": 0.77, - "learning_rate": 1.1551808926572196e-05, - "loss": 2.3957, - "step": 440950 - }, - { - "epoch": 0.77, - "learning_rate": 1.155093698664537e-05, - "loss": 2.3692, - "step": 440960 - }, - { - "epoch": 0.77, - "learning_rate": 1.1550065046718542e-05, - "loss": 2.252, - "step": 440970 - }, - { - "epoch": 0.77, - "learning_rate": 1.1549193106791715e-05, - "loss": 2.4021, - "step": 440980 - }, - { - "epoch": 0.77, - "learning_rate": 1.1548321166864888e-05, - "loss": 2.2444, - "step": 440990 - }, - { - "epoch": 0.77, - "learning_rate": 1.1547449226938061e-05, - "loss": 2.2714, - "step": 441000 - }, - { - "epoch": 0.77, - "learning_rate": 1.1546577287011235e-05, - "loss": 2.2246, - "step": 441010 - }, - { - "epoch": 0.77, - "learning_rate": 1.1545705347084409e-05, - "loss": 2.3502, - "step": 441020 - }, - { - "epoch": 0.77, - "learning_rate": 1.1544833407157581e-05, - "loss": 2.3964, - "step": 441030 - }, - { - "epoch": 0.77, - "learning_rate": 1.1543961467230755e-05, - "loss": 2.2211, - "step": 441040 - }, - { - "epoch": 0.77, - "learning_rate": 1.1543089527303927e-05, - "loss": 2.3345, - "step": 441050 - }, - { - "epoch": 0.77, - "learning_rate": 1.15422175873771e-05, - "loss": 2.23, - "step": 441060 - }, - { - "epoch": 0.77, - "learning_rate": 1.1541345647450273e-05, - "loss": 2.3012, - "step": 441070 - }, - { - "epoch": 0.77, - "learning_rate": 1.1540473707523446e-05, - "loss": 2.3837, - "step": 441080 - }, - { - "epoch": 0.77, - "learning_rate": 1.153960176759662e-05, - "loss": 2.2867, - "step": 441090 - }, - { - "epoch": 0.77, - "learning_rate": 1.1538729827669794e-05, - "loss": 2.3403, - "step": 441100 - }, - { - "epoch": 0.77, - "learning_rate": 1.1537857887742968e-05, - "loss": 2.4245, - "step": 441110 - }, - { - "epoch": 0.77, - "learning_rate": 1.153698594781614e-05, - "loss": 2.2826, - "step": 441120 - }, - { - "epoch": 0.77, - "learning_rate": 1.1536114007889314e-05, - "loss": 2.1886, - "step": 441130 - }, - { - "epoch": 0.77, - "learning_rate": 1.1535242067962486e-05, - "loss": 2.1808, - "step": 441140 - }, - { - "epoch": 0.77, - "learning_rate": 1.153437012803566e-05, - "loss": 2.2924, - "step": 441150 - }, - { - "epoch": 0.77, - "learning_rate": 1.1533498188108831e-05, - "loss": 2.2438, - "step": 441160 - }, - { - "epoch": 0.77, - "learning_rate": 1.1532626248182005e-05, - "loss": 2.275, - "step": 441170 - }, - { - "epoch": 0.77, - "learning_rate": 1.1531754308255179e-05, - "loss": 2.333, - "step": 441180 - }, - { - "epoch": 0.77, - "learning_rate": 1.1530882368328353e-05, - "loss": 2.3186, - "step": 441190 - }, - { - "epoch": 0.77, - "learning_rate": 1.1530010428401525e-05, - "loss": 2.3236, - "step": 441200 - }, - { - "epoch": 0.77, - "learning_rate": 1.1529138488474699e-05, - "loss": 2.2094, - "step": 441210 - }, - { - "epoch": 0.77, - "learning_rate": 1.1528266548547872e-05, - "loss": 2.3318, - "step": 441220 - }, - { - "epoch": 0.77, - "learning_rate": 1.1527394608621044e-05, - "loss": 2.2167, - "step": 441230 - }, - { - "epoch": 0.77, - "learning_rate": 1.1526522668694218e-05, - "loss": 2.2774, - "step": 441240 - }, - { - "epoch": 0.77, - "learning_rate": 1.1525650728767392e-05, - "loss": 2.2971, - "step": 441250 - }, - { - "epoch": 0.77, - "learning_rate": 1.1524778788840566e-05, - "loss": 2.4035, - "step": 441260 - }, - { - "epoch": 0.77, - "learning_rate": 1.1523906848913738e-05, - "loss": 2.3331, - "step": 441270 - }, - { - "epoch": 0.77, - "learning_rate": 1.1523034908986912e-05, - "loss": 2.3294, - "step": 441280 - }, - { - "epoch": 0.77, - "learning_rate": 1.1522162969060084e-05, - "loss": 2.3198, - "step": 441290 - }, - { - "epoch": 0.77, - "learning_rate": 1.1521291029133257e-05, - "loss": 2.3225, - "step": 441300 - }, - { - "epoch": 0.77, - "learning_rate": 1.152041908920643e-05, - "loss": 2.1802, - "step": 441310 - }, - { - "epoch": 0.77, - "learning_rate": 1.1519547149279603e-05, - "loss": 2.3921, - "step": 441320 - }, - { - "epoch": 0.77, - "learning_rate": 1.1518675209352777e-05, - "loss": 2.3137, - "step": 441330 - }, - { - "epoch": 0.77, - "learning_rate": 1.151780326942595e-05, - "loss": 2.4577, - "step": 441340 - }, - { - "epoch": 0.77, - "learning_rate": 1.1516931329499125e-05, - "loss": 2.2941, - "step": 441350 - }, - { - "epoch": 0.77, - "learning_rate": 1.1516059389572297e-05, - "loss": 2.3541, - "step": 441360 - }, - { - "epoch": 0.77, - "learning_rate": 1.151518744964547e-05, - "loss": 2.2608, - "step": 441370 - }, - { - "epoch": 0.77, - "learning_rate": 1.1514315509718643e-05, - "loss": 2.2543, - "step": 441380 - }, - { - "epoch": 0.77, - "learning_rate": 1.1513443569791816e-05, - "loss": 2.2413, - "step": 441390 - }, - { - "epoch": 0.77, - "learning_rate": 1.1512571629864988e-05, - "loss": 2.2585, - "step": 441400 - }, - { - "epoch": 0.77, - "learning_rate": 1.1511699689938162e-05, - "loss": 2.2774, - "step": 441410 - }, - { - "epoch": 0.77, - "learning_rate": 1.1510827750011336e-05, - "loss": 2.3072, - "step": 441420 - }, - { - "epoch": 0.77, - "learning_rate": 1.150995581008451e-05, - "loss": 2.202, - "step": 441430 - }, - { - "epoch": 0.77, - "learning_rate": 1.1509083870157682e-05, - "loss": 2.2669, - "step": 441440 - }, - { - "epoch": 0.77, - "learning_rate": 1.1508211930230856e-05, - "loss": 2.2946, - "step": 441450 - }, - { - "epoch": 0.77, - "learning_rate": 1.1507339990304028e-05, - "loss": 2.2571, - "step": 441460 - }, - { - "epoch": 0.77, - "learning_rate": 1.1506468050377201e-05, - "loss": 2.2855, - "step": 441470 - }, - { - "epoch": 0.77, - "learning_rate": 1.1505596110450373e-05, - "loss": 2.1909, - "step": 441480 - }, - { - "epoch": 0.77, - "learning_rate": 1.1504724170523549e-05, - "loss": 2.1876, - "step": 441490 - }, - { - "epoch": 0.77, - "learning_rate": 1.1503852230596723e-05, - "loss": 2.3172, - "step": 441500 - }, - { - "epoch": 0.77, - "learning_rate": 1.1502980290669895e-05, - "loss": 2.2001, - "step": 441510 - }, - { - "epoch": 0.77, - "learning_rate": 1.1502108350743069e-05, - "loss": 2.3835, - "step": 441520 - }, - { - "epoch": 0.77, - "learning_rate": 1.150123641081624e-05, - "loss": 2.2911, - "step": 441530 - }, - { - "epoch": 0.77, - "learning_rate": 1.1500364470889414e-05, - "loss": 2.3556, - "step": 441540 - }, - { - "epoch": 0.77, - "learning_rate": 1.1499492530962586e-05, - "loss": 2.202, - "step": 441550 - }, - { - "epoch": 0.77, - "learning_rate": 1.149862059103576e-05, - "loss": 2.3068, - "step": 441560 - }, - { - "epoch": 0.77, - "learning_rate": 1.1497748651108934e-05, - "loss": 2.2696, - "step": 441570 - }, - { - "epoch": 0.77, - "learning_rate": 1.1496876711182108e-05, - "loss": 2.3124, - "step": 441580 - }, - { - "epoch": 0.77, - "learning_rate": 1.149600477125528e-05, - "loss": 2.3974, - "step": 441590 - }, - { - "epoch": 0.77, - "learning_rate": 1.1495132831328454e-05, - "loss": 2.2354, - "step": 441600 - }, - { - "epoch": 0.77, - "learning_rate": 1.1494260891401626e-05, - "loss": 2.3868, - "step": 441610 - }, - { - "epoch": 0.77, - "learning_rate": 1.14933889514748e-05, - "loss": 2.4555, - "step": 441620 - }, - { - "epoch": 0.77, - "learning_rate": 1.1492517011547973e-05, - "loss": 2.3575, - "step": 441630 - }, - { - "epoch": 0.77, - "learning_rate": 1.1491645071621145e-05, - "loss": 2.2476, - "step": 441640 - }, - { - "epoch": 0.77, - "learning_rate": 1.1490773131694319e-05, - "loss": 2.3353, - "step": 441650 - }, - { - "epoch": 0.77, - "learning_rate": 1.1489901191767493e-05, - "loss": 2.3245, - "step": 441660 - }, - { - "epoch": 0.77, - "learning_rate": 1.1489029251840667e-05, - "loss": 2.3207, - "step": 441670 - }, - { - "epoch": 0.77, - "learning_rate": 1.1488157311913839e-05, - "loss": 2.1932, - "step": 441680 - }, - { - "epoch": 0.77, - "learning_rate": 1.1487285371987012e-05, - "loss": 2.2192, - "step": 441690 - }, - { - "epoch": 0.77, - "learning_rate": 1.1486413432060185e-05, - "loss": 2.3155, - "step": 441700 - }, - { - "epoch": 0.77, - "learning_rate": 1.1485541492133358e-05, - "loss": 2.352, - "step": 441710 - }, - { - "epoch": 0.77, - "learning_rate": 1.148466955220653e-05, - "loss": 2.3711, - "step": 441720 - }, - { - "epoch": 0.77, - "learning_rate": 1.1483797612279706e-05, - "loss": 2.2626, - "step": 441730 - }, - { - "epoch": 0.77, - "learning_rate": 1.1482925672352878e-05, - "loss": 2.1487, - "step": 441740 - }, - { - "epoch": 0.77, - "learning_rate": 1.1482053732426052e-05, - "loss": 2.2826, - "step": 441750 - }, - { - "epoch": 0.77, - "learning_rate": 1.1481181792499225e-05, - "loss": 2.2136, - "step": 441760 - }, - { - "epoch": 0.77, - "learning_rate": 1.1480309852572398e-05, - "loss": 2.3015, - "step": 441770 - }, - { - "epoch": 0.77, - "learning_rate": 1.1479437912645571e-05, - "loss": 2.1912, - "step": 441780 - }, - { - "epoch": 0.77, - "learning_rate": 1.1478565972718743e-05, - "loss": 2.2176, - "step": 441790 - }, - { - "epoch": 0.77, - "learning_rate": 1.1477694032791917e-05, - "loss": 2.3106, - "step": 441800 - }, - { - "epoch": 0.77, - "learning_rate": 1.1476822092865091e-05, - "loss": 2.2558, - "step": 441810 - }, - { - "epoch": 0.77, - "learning_rate": 1.1475950152938265e-05, - "loss": 2.2964, - "step": 441820 - }, - { - "epoch": 0.77, - "learning_rate": 1.1475078213011437e-05, - "loss": 2.2797, - "step": 441830 - }, - { - "epoch": 0.77, - "learning_rate": 1.147420627308461e-05, - "loss": 2.2214, - "step": 441840 - }, - { - "epoch": 0.77, - "learning_rate": 1.1473334333157783e-05, - "loss": 2.4091, - "step": 441850 - }, - { - "epoch": 0.77, - "learning_rate": 1.1472462393230956e-05, - "loss": 2.2337, - "step": 441860 - }, - { - "epoch": 0.77, - "learning_rate": 1.1471590453304128e-05, - "loss": 2.3971, - "step": 441870 - }, - { - "epoch": 0.77, - "learning_rate": 1.1470718513377302e-05, - "loss": 2.359, - "step": 441880 - }, - { - "epoch": 0.77, - "learning_rate": 1.1469846573450476e-05, - "loss": 2.3386, - "step": 441890 - }, - { - "epoch": 0.77, - "learning_rate": 1.146897463352365e-05, - "loss": 2.3293, - "step": 441900 - }, - { - "epoch": 0.77, - "learning_rate": 1.1468102693596824e-05, - "loss": 2.2993, - "step": 441910 - }, - { - "epoch": 0.77, - "learning_rate": 1.1467230753669996e-05, - "loss": 2.2495, - "step": 441920 - }, - { - "epoch": 0.77, - "learning_rate": 1.146635881374317e-05, - "loss": 2.2235, - "step": 441930 - }, - { - "epoch": 0.77, - "learning_rate": 1.1465486873816341e-05, - "loss": 2.2756, - "step": 441940 - }, - { - "epoch": 0.77, - "learning_rate": 1.1464614933889515e-05, - "loss": 2.361, - "step": 441950 - }, - { - "epoch": 0.77, - "learning_rate": 1.1463742993962687e-05, - "loss": 2.2701, - "step": 441960 - }, - { - "epoch": 0.77, - "learning_rate": 1.1462871054035863e-05, - "loss": 2.3264, - "step": 441970 - }, - { - "epoch": 0.77, - "learning_rate": 1.1461999114109035e-05, - "loss": 2.3145, - "step": 441980 - }, - { - "epoch": 0.77, - "learning_rate": 1.1461127174182209e-05, - "loss": 2.2411, - "step": 441990 - }, - { - "epoch": 0.77, - "learning_rate": 1.146025523425538e-05, - "loss": 2.3803, - "step": 442000 - }, - { - "epoch": 0.77, - "learning_rate": 1.1459383294328554e-05, - "loss": 2.3105, - "step": 442010 - }, - { - "epoch": 0.77, - "learning_rate": 1.1458511354401728e-05, - "loss": 2.2808, - "step": 442020 - }, - { - "epoch": 0.77, - "learning_rate": 1.14576394144749e-05, - "loss": 2.3209, - "step": 442030 - }, - { - "epoch": 0.77, - "learning_rate": 1.1456767474548074e-05, - "loss": 2.2561, - "step": 442040 - }, - { - "epoch": 0.77, - "learning_rate": 1.1455895534621248e-05, - "loss": 2.4107, - "step": 442050 - }, - { - "epoch": 0.77, - "learning_rate": 1.1455023594694422e-05, - "loss": 2.215, - "step": 442060 - }, - { - "epoch": 0.77, - "learning_rate": 1.1454151654767594e-05, - "loss": 2.3042, - "step": 442070 - }, - { - "epoch": 0.77, - "learning_rate": 1.1453279714840767e-05, - "loss": 2.3641, - "step": 442080 - }, - { - "epoch": 0.77, - "learning_rate": 1.145240777491394e-05, - "loss": 2.2658, - "step": 442090 - }, - { - "epoch": 0.77, - "learning_rate": 1.1451535834987113e-05, - "loss": 2.3063, - "step": 442100 - }, - { - "epoch": 0.77, - "learning_rate": 1.1450663895060285e-05, - "loss": 2.2094, - "step": 442110 - }, - { - "epoch": 0.77, - "learning_rate": 1.1449791955133459e-05, - "loss": 2.3612, - "step": 442120 - }, - { - "epoch": 0.77, - "learning_rate": 1.1448920015206633e-05, - "loss": 2.2046, - "step": 442130 - }, - { - "epoch": 0.77, - "learning_rate": 1.1448048075279807e-05, - "loss": 2.2141, - "step": 442140 - }, - { - "epoch": 0.77, - "learning_rate": 1.144717613535298e-05, - "loss": 2.2333, - "step": 442150 - }, - { - "epoch": 0.77, - "learning_rate": 1.1446304195426153e-05, - "loss": 2.178, - "step": 442160 - }, - { - "epoch": 0.77, - "learning_rate": 1.1445432255499326e-05, - "loss": 2.283, - "step": 442170 - }, - { - "epoch": 0.77, - "learning_rate": 1.1444560315572498e-05, - "loss": 2.2878, - "step": 442180 - }, - { - "epoch": 0.77, - "learning_rate": 1.1443688375645672e-05, - "loss": 2.302, - "step": 442190 - }, - { - "epoch": 0.77, - "learning_rate": 1.1442816435718844e-05, - "loss": 2.372, - "step": 442200 - }, - { - "epoch": 0.77, - "learning_rate": 1.144194449579202e-05, - "loss": 2.2427, - "step": 442210 - }, - { - "epoch": 0.77, - "learning_rate": 1.1441072555865192e-05, - "loss": 2.2689, - "step": 442220 - }, - { - "epoch": 0.77, - "learning_rate": 1.1440200615938366e-05, - "loss": 2.297, - "step": 442230 - }, - { - "epoch": 0.77, - "learning_rate": 1.1439328676011538e-05, - "loss": 2.1606, - "step": 442240 - }, - { - "epoch": 0.77, - "learning_rate": 1.1438456736084711e-05, - "loss": 2.2629, - "step": 442250 - }, - { - "epoch": 0.77, - "learning_rate": 1.1437584796157883e-05, - "loss": 2.2376, - "step": 442260 - }, - { - "epoch": 0.77, - "learning_rate": 1.1436712856231057e-05, - "loss": 2.3667, - "step": 442270 - }, - { - "epoch": 0.77, - "learning_rate": 1.1435840916304231e-05, - "loss": 2.2862, - "step": 442280 - }, - { - "epoch": 0.77, - "learning_rate": 1.1434968976377405e-05, - "loss": 2.2437, - "step": 442290 - }, - { - "epoch": 0.77, - "learning_rate": 1.1434097036450579e-05, - "loss": 2.4049, - "step": 442300 - }, - { - "epoch": 0.77, - "learning_rate": 1.143322509652375e-05, - "loss": 2.1968, - "step": 442310 - }, - { - "epoch": 0.77, - "learning_rate": 1.1432353156596924e-05, - "loss": 2.324, - "step": 442320 - }, - { - "epoch": 0.77, - "learning_rate": 1.1431481216670096e-05, - "loss": 2.2881, - "step": 442330 - }, - { - "epoch": 0.77, - "learning_rate": 1.143060927674327e-05, - "loss": 2.2988, - "step": 442340 - }, - { - "epoch": 0.77, - "learning_rate": 1.1429737336816442e-05, - "loss": 2.3386, - "step": 442350 - }, - { - "epoch": 0.77, - "learning_rate": 1.1428865396889616e-05, - "loss": 2.2011, - "step": 442360 - }, - { - "epoch": 0.77, - "learning_rate": 1.142799345696279e-05, - "loss": 2.402, - "step": 442370 - }, - { - "epoch": 0.77, - "learning_rate": 1.1427121517035964e-05, - "loss": 2.181, - "step": 442380 - }, - { - "epoch": 0.77, - "learning_rate": 1.1426249577109136e-05, - "loss": 2.1969, - "step": 442390 - }, - { - "epoch": 0.77, - "learning_rate": 1.142537763718231e-05, - "loss": 2.3544, - "step": 442400 - }, - { - "epoch": 0.77, - "learning_rate": 1.1424505697255482e-05, - "loss": 2.3886, - "step": 442410 - }, - { - "epoch": 0.77, - "learning_rate": 1.1423633757328655e-05, - "loss": 2.3261, - "step": 442420 - }, - { - "epoch": 0.77, - "learning_rate": 1.1422761817401829e-05, - "loss": 2.3483, - "step": 442430 - }, - { - "epoch": 0.77, - "learning_rate": 1.1421889877475001e-05, - "loss": 2.3505, - "step": 442440 - }, - { - "epoch": 0.77, - "learning_rate": 1.1421017937548175e-05, - "loss": 2.2604, - "step": 442450 - }, - { - "epoch": 0.77, - "learning_rate": 1.1420145997621349e-05, - "loss": 2.3345, - "step": 442460 - }, - { - "epoch": 0.77, - "learning_rate": 1.1419274057694522e-05, - "loss": 2.3471, - "step": 442470 - }, - { - "epoch": 0.77, - "learning_rate": 1.1418402117767695e-05, - "loss": 2.3064, - "step": 442480 - }, - { - "epoch": 0.77, - "learning_rate": 1.1417530177840868e-05, - "loss": 2.3729, - "step": 442490 - }, - { - "epoch": 0.77, - "learning_rate": 1.141665823791404e-05, - "loss": 2.3103, - "step": 442500 - }, - { - "epoch": 0.77, - "learning_rate": 1.1415786297987214e-05, - "loss": 2.1957, - "step": 442510 - }, - { - "epoch": 0.77, - "learning_rate": 1.1414914358060388e-05, - "loss": 2.3828, - "step": 442520 - }, - { - "epoch": 0.77, - "learning_rate": 1.1414042418133562e-05, - "loss": 2.3158, - "step": 442530 - }, - { - "epoch": 0.77, - "learning_rate": 1.1413170478206734e-05, - "loss": 2.3615, - "step": 442540 - }, - { - "epoch": 0.77, - "learning_rate": 1.1412298538279908e-05, - "loss": 2.3379, - "step": 442550 - }, - { - "epoch": 0.77, - "learning_rate": 1.1411426598353081e-05, - "loss": 2.2441, - "step": 442560 - }, - { - "epoch": 0.77, - "learning_rate": 1.1410554658426253e-05, - "loss": 2.2827, - "step": 442570 - }, - { - "epoch": 0.77, - "learning_rate": 1.1409682718499427e-05, - "loss": 2.2765, - "step": 442580 - }, - { - "epoch": 0.77, - "learning_rate": 1.14088107785726e-05, - "loss": 2.3964, - "step": 442590 - }, - { - "epoch": 0.77, - "learning_rate": 1.1407938838645773e-05, - "loss": 2.3709, - "step": 442600 - }, - { - "epoch": 0.77, - "learning_rate": 1.1407066898718947e-05, - "loss": 2.2688, - "step": 442610 - }, - { - "epoch": 0.77, - "learning_rate": 1.140619495879212e-05, - "loss": 2.3644, - "step": 442620 - }, - { - "epoch": 0.77, - "learning_rate": 1.1405323018865293e-05, - "loss": 2.3784, - "step": 442630 - }, - { - "epoch": 0.77, - "learning_rate": 1.1404451078938466e-05, - "loss": 2.3041, - "step": 442640 - }, - { - "epoch": 0.77, - "learning_rate": 1.1403579139011638e-05, - "loss": 2.3006, - "step": 442650 - }, - { - "epoch": 0.77, - "learning_rate": 1.1402707199084812e-05, - "loss": 2.3316, - "step": 442660 - }, - { - "epoch": 0.77, - "learning_rate": 1.1401835259157984e-05, - "loss": 2.2732, - "step": 442670 - }, - { - "epoch": 0.77, - "learning_rate": 1.1400963319231158e-05, - "loss": 2.2693, - "step": 442680 - }, - { - "epoch": 0.77, - "learning_rate": 1.1400091379304332e-05, - "loss": 2.3554, - "step": 442690 - }, - { - "epoch": 0.77, - "learning_rate": 1.1399219439377506e-05, - "loss": 2.3022, - "step": 442700 - }, - { - "epoch": 0.77, - "learning_rate": 1.139834749945068e-05, - "loss": 2.2779, - "step": 442710 - }, - { - "epoch": 0.77, - "learning_rate": 1.1397475559523851e-05, - "loss": 2.1976, - "step": 442720 - }, - { - "epoch": 0.77, - "learning_rate": 1.1396603619597025e-05, - "loss": 2.2241, - "step": 442730 - }, - { - "epoch": 0.77, - "learning_rate": 1.1395731679670197e-05, - "loss": 2.1747, - "step": 442740 - }, - { - "epoch": 0.77, - "learning_rate": 1.1394859739743371e-05, - "loss": 2.2242, - "step": 442750 - }, - { - "epoch": 0.77, - "learning_rate": 1.1393987799816543e-05, - "loss": 2.2127, - "step": 442760 - }, - { - "epoch": 0.77, - "learning_rate": 1.1393115859889719e-05, - "loss": 2.25, - "step": 442770 - }, - { - "epoch": 0.77, - "learning_rate": 1.139224391996289e-05, - "loss": 2.304, - "step": 442780 - }, - { - "epoch": 0.77, - "learning_rate": 1.1391371980036064e-05, - "loss": 2.3174, - "step": 442790 - }, - { - "epoch": 0.77, - "learning_rate": 1.1390500040109237e-05, - "loss": 2.3089, - "step": 442800 - }, - { - "epoch": 0.77, - "learning_rate": 1.138962810018241e-05, - "loss": 2.2301, - "step": 442810 - }, - { - "epoch": 0.77, - "learning_rate": 1.1388756160255584e-05, - "loss": 2.1689, - "step": 442820 - }, - { - "epoch": 0.77, - "learning_rate": 1.1387884220328756e-05, - "loss": 2.1705, - "step": 442830 - }, - { - "epoch": 0.77, - "learning_rate": 1.138701228040193e-05, - "loss": 2.3199, - "step": 442840 - }, - { - "epoch": 0.77, - "learning_rate": 1.1386140340475104e-05, - "loss": 2.2517, - "step": 442850 - }, - { - "epoch": 0.77, - "learning_rate": 1.1385268400548277e-05, - "loss": 2.2468, - "step": 442860 - }, - { - "epoch": 0.77, - "learning_rate": 1.138439646062145e-05, - "loss": 2.1731, - "step": 442870 - }, - { - "epoch": 0.77, - "learning_rate": 1.1383524520694623e-05, - "loss": 2.3136, - "step": 442880 - }, - { - "epoch": 0.77, - "learning_rate": 1.1382652580767795e-05, - "loss": 2.36, - "step": 442890 - }, - { - "epoch": 0.77, - "learning_rate": 1.1381780640840969e-05, - "loss": 2.2493, - "step": 442900 - }, - { - "epoch": 0.77, - "learning_rate": 1.1380908700914141e-05, - "loss": 2.2718, - "step": 442910 - }, - { - "epoch": 0.77, - "learning_rate": 1.1380036760987315e-05, - "loss": 2.3636, - "step": 442920 - }, - { - "epoch": 0.77, - "learning_rate": 1.1379164821060489e-05, - "loss": 2.2011, - "step": 442930 - }, - { - "epoch": 0.77, - "learning_rate": 1.1378292881133663e-05, - "loss": 2.2611, - "step": 442940 - }, - { - "epoch": 0.77, - "learning_rate": 1.1377420941206836e-05, - "loss": 2.2703, - "step": 442950 - }, - { - "epoch": 0.77, - "learning_rate": 1.1376549001280008e-05, - "loss": 2.2762, - "step": 442960 - }, - { - "epoch": 0.77, - "learning_rate": 1.1375677061353182e-05, - "loss": 2.2718, - "step": 442970 - }, - { - "epoch": 0.77, - "learning_rate": 1.1374805121426354e-05, - "loss": 2.2008, - "step": 442980 - }, - { - "epoch": 0.77, - "learning_rate": 1.1373933181499528e-05, - "loss": 2.2625, - "step": 442990 - }, - { - "epoch": 0.77, - "learning_rate": 1.13730612415727e-05, - "loss": 2.2905, - "step": 443000 - }, - { - "epoch": 0.77, - "learning_rate": 1.1372189301645876e-05, - "loss": 2.2955, - "step": 443010 - }, - { - "epoch": 0.77, - "learning_rate": 1.1371317361719048e-05, - "loss": 2.4221, - "step": 443020 - }, - { - "epoch": 0.77, - "learning_rate": 1.1370445421792221e-05, - "loss": 2.2002, - "step": 443030 - }, - { - "epoch": 0.77, - "learning_rate": 1.1369573481865393e-05, - "loss": 2.2964, - "step": 443040 - }, - { - "epoch": 0.77, - "learning_rate": 1.1368701541938567e-05, - "loss": 2.2398, - "step": 443050 - }, - { - "epoch": 0.77, - "learning_rate": 1.136782960201174e-05, - "loss": 2.3681, - "step": 443060 - }, - { - "epoch": 0.77, - "learning_rate": 1.1366957662084913e-05, - "loss": 2.3536, - "step": 443070 - }, - { - "epoch": 0.77, - "learning_rate": 1.1366085722158087e-05, - "loss": 2.3502, - "step": 443080 - }, - { - "epoch": 0.77, - "learning_rate": 1.136521378223126e-05, - "loss": 2.2787, - "step": 443090 - }, - { - "epoch": 0.77, - "learning_rate": 1.1364341842304434e-05, - "loss": 2.1749, - "step": 443100 - }, - { - "epoch": 0.77, - "learning_rate": 1.1363469902377606e-05, - "loss": 2.2683, - "step": 443110 - }, - { - "epoch": 0.77, - "learning_rate": 1.136259796245078e-05, - "loss": 2.3503, - "step": 443120 - }, - { - "epoch": 0.77, - "learning_rate": 1.1361726022523952e-05, - "loss": 2.2559, - "step": 443130 - }, - { - "epoch": 0.77, - "learning_rate": 1.1360854082597126e-05, - "loss": 2.3696, - "step": 443140 - }, - { - "epoch": 0.77, - "learning_rate": 1.1359982142670298e-05, - "loss": 2.3032, - "step": 443150 - }, - { - "epoch": 0.77, - "learning_rate": 1.1359110202743472e-05, - "loss": 2.331, - "step": 443160 - }, - { - "epoch": 0.77, - "learning_rate": 1.1358238262816646e-05, - "loss": 2.1705, - "step": 443170 - }, - { - "epoch": 0.77, - "learning_rate": 1.135736632288982e-05, - "loss": 2.3288, - "step": 443180 - }, - { - "epoch": 0.77, - "learning_rate": 1.1356494382962992e-05, - "loss": 2.3141, - "step": 443190 - }, - { - "epoch": 0.77, - "learning_rate": 1.1355622443036165e-05, - "loss": 2.2466, - "step": 443200 - }, - { - "epoch": 0.77, - "learning_rate": 1.1354750503109337e-05, - "loss": 2.3888, - "step": 443210 - }, - { - "epoch": 0.77, - "learning_rate": 1.1353878563182511e-05, - "loss": 2.3667, - "step": 443220 - }, - { - "epoch": 0.77, - "learning_rate": 1.1353006623255685e-05, - "loss": 2.2648, - "step": 443230 - }, - { - "epoch": 0.77, - "learning_rate": 1.1352134683328857e-05, - "loss": 2.2556, - "step": 443240 - }, - { - "epoch": 0.77, - "learning_rate": 1.1351262743402032e-05, - "loss": 2.3124, - "step": 443250 - }, - { - "epoch": 0.77, - "learning_rate": 1.1350390803475205e-05, - "loss": 2.2525, - "step": 443260 - }, - { - "epoch": 0.77, - "learning_rate": 1.1349518863548378e-05, - "loss": 2.1357, - "step": 443270 - }, - { - "epoch": 0.77, - "learning_rate": 1.134864692362155e-05, - "loss": 2.3506, - "step": 443280 - }, - { - "epoch": 0.77, - "learning_rate": 1.1347774983694724e-05, - "loss": 2.2727, - "step": 443290 - }, - { - "epoch": 0.77, - "learning_rate": 1.1346903043767896e-05, - "loss": 2.3041, - "step": 443300 - }, - { - "epoch": 0.77, - "learning_rate": 1.134603110384107e-05, - "loss": 2.2606, - "step": 443310 - }, - { - "epoch": 0.77, - "learning_rate": 1.1345159163914244e-05, - "loss": 2.2527, - "step": 443320 - }, - { - "epoch": 0.77, - "learning_rate": 1.1344287223987418e-05, - "loss": 2.2761, - "step": 443330 - }, - { - "epoch": 0.77, - "learning_rate": 1.134341528406059e-05, - "loss": 2.207, - "step": 443340 - }, - { - "epoch": 0.77, - "learning_rate": 1.1342543344133763e-05, - "loss": 2.2462, - "step": 443350 - }, - { - "epoch": 0.77, - "learning_rate": 1.1341671404206937e-05, - "loss": 2.2754, - "step": 443360 - }, - { - "epoch": 0.77, - "learning_rate": 1.134079946428011e-05, - "loss": 2.2876, - "step": 443370 - }, - { - "epoch": 0.77, - "learning_rate": 1.1339927524353283e-05, - "loss": 2.2097, - "step": 443380 - }, - { - "epoch": 0.77, - "learning_rate": 1.1339055584426455e-05, - "loss": 2.2854, - "step": 443390 - }, - { - "epoch": 0.77, - "learning_rate": 1.1338183644499629e-05, - "loss": 2.3233, - "step": 443400 - }, - { - "epoch": 0.77, - "learning_rate": 1.1337311704572803e-05, - "loss": 2.2621, - "step": 443410 - }, - { - "epoch": 0.77, - "learning_rate": 1.1336439764645976e-05, - "loss": 2.2674, - "step": 443420 - }, - { - "epoch": 0.77, - "learning_rate": 1.1335567824719148e-05, - "loss": 2.2612, - "step": 443430 - }, - { - "epoch": 0.77, - "learning_rate": 1.1334695884792322e-05, - "loss": 2.3003, - "step": 443440 - }, - { - "epoch": 0.77, - "learning_rate": 1.1333823944865494e-05, - "loss": 2.3331, - "step": 443450 - }, - { - "epoch": 0.77, - "learning_rate": 1.1332952004938668e-05, - "loss": 2.3157, - "step": 443460 - }, - { - "epoch": 0.77, - "learning_rate": 1.133208006501184e-05, - "loss": 2.3107, - "step": 443470 - }, - { - "epoch": 0.77, - "learning_rate": 1.1331208125085014e-05, - "loss": 2.2727, - "step": 443480 - }, - { - "epoch": 0.77, - "learning_rate": 1.1330336185158188e-05, - "loss": 2.1937, - "step": 443490 - }, - { - "epoch": 0.77, - "learning_rate": 1.1329464245231361e-05, - "loss": 2.2603, - "step": 443500 - }, - { - "epoch": 0.77, - "learning_rate": 1.1328592305304535e-05, - "loss": 2.3079, - "step": 443510 - }, - { - "epoch": 0.77, - "learning_rate": 1.1327720365377707e-05, - "loss": 2.2434, - "step": 443520 - }, - { - "epoch": 0.77, - "learning_rate": 1.1326848425450881e-05, - "loss": 2.4682, - "step": 443530 - }, - { - "epoch": 0.77, - "learning_rate": 1.1325976485524053e-05, - "loss": 2.3533, - "step": 443540 - }, - { - "epoch": 0.77, - "learning_rate": 1.1325104545597227e-05, - "loss": 2.3551, - "step": 443550 - }, - { - "epoch": 0.77, - "learning_rate": 1.13242326056704e-05, - "loss": 2.2796, - "step": 443560 - }, - { - "epoch": 0.77, - "learning_rate": 1.1323360665743574e-05, - "loss": 2.3481, - "step": 443570 - }, - { - "epoch": 0.77, - "learning_rate": 1.1322488725816747e-05, - "loss": 2.3078, - "step": 443580 - }, - { - "epoch": 0.77, - "learning_rate": 1.132161678588992e-05, - "loss": 2.3236, - "step": 443590 - }, - { - "epoch": 0.77, - "learning_rate": 1.1320744845963092e-05, - "loss": 2.2767, - "step": 443600 - }, - { - "epoch": 0.77, - "learning_rate": 1.1319872906036266e-05, - "loss": 2.2666, - "step": 443610 - }, - { - "epoch": 0.77, - "learning_rate": 1.131900096610944e-05, - "loss": 2.1927, - "step": 443620 - }, - { - "epoch": 0.77, - "learning_rate": 1.1318129026182612e-05, - "loss": 2.4212, - "step": 443630 - }, - { - "epoch": 0.77, - "learning_rate": 1.1317257086255786e-05, - "loss": 2.2373, - "step": 443640 - }, - { - "epoch": 0.77, - "learning_rate": 1.131638514632896e-05, - "loss": 2.3863, - "step": 443650 - }, - { - "epoch": 0.77, - "learning_rate": 1.1315513206402133e-05, - "loss": 2.3001, - "step": 443660 - }, - { - "epoch": 0.77, - "learning_rate": 1.1314641266475305e-05, - "loss": 2.4255, - "step": 443670 - }, - { - "epoch": 0.77, - "learning_rate": 1.1313769326548479e-05, - "loss": 2.2708, - "step": 443680 - }, - { - "epoch": 0.77, - "learning_rate": 1.1312897386621651e-05, - "loss": 2.3324, - "step": 443690 - }, - { - "epoch": 0.77, - "learning_rate": 1.1312025446694825e-05, - "loss": 2.264, - "step": 443700 - }, - { - "epoch": 0.77, - "learning_rate": 1.1311153506767997e-05, - "loss": 2.3868, - "step": 443710 - }, - { - "epoch": 0.77, - "learning_rate": 1.131028156684117e-05, - "loss": 2.3644, - "step": 443720 - }, - { - "epoch": 0.77, - "learning_rate": 1.1309409626914345e-05, - "loss": 2.274, - "step": 443730 - }, - { - "epoch": 0.77, - "learning_rate": 1.1308537686987518e-05, - "loss": 2.3552, - "step": 443740 - }, - { - "epoch": 0.77, - "learning_rate": 1.1307665747060692e-05, - "loss": 2.3022, - "step": 443750 - }, - { - "epoch": 0.77, - "learning_rate": 1.1306793807133864e-05, - "loss": 2.2444, - "step": 443760 - }, - { - "epoch": 0.77, - "learning_rate": 1.1305921867207038e-05, - "loss": 2.2508, - "step": 443770 - }, - { - "epoch": 0.77, - "learning_rate": 1.130504992728021e-05, - "loss": 2.321, - "step": 443780 - }, - { - "epoch": 0.77, - "learning_rate": 1.1304177987353384e-05, - "loss": 2.3016, - "step": 443790 - }, - { - "epoch": 0.77, - "learning_rate": 1.1303306047426556e-05, - "loss": 2.3187, - "step": 443800 - }, - { - "epoch": 0.77, - "learning_rate": 1.1302434107499731e-05, - "loss": 2.0915, - "step": 443810 - }, - { - "epoch": 0.77, - "learning_rate": 1.1301562167572903e-05, - "loss": 2.2583, - "step": 443820 - }, - { - "epoch": 0.77, - "learning_rate": 1.1300690227646077e-05, - "loss": 2.099, - "step": 443830 - }, - { - "epoch": 0.77, - "learning_rate": 1.129981828771925e-05, - "loss": 2.2144, - "step": 443840 - }, - { - "epoch": 0.77, - "learning_rate": 1.1298946347792423e-05, - "loss": 2.2657, - "step": 443850 - }, - { - "epoch": 0.77, - "learning_rate": 1.1298074407865595e-05, - "loss": 2.2708, - "step": 443860 - }, - { - "epoch": 0.77, - "learning_rate": 1.1297202467938769e-05, - "loss": 2.2895, - "step": 443870 - }, - { - "epoch": 0.77, - "learning_rate": 1.1296330528011943e-05, - "loss": 2.2475, - "step": 443880 - }, - { - "epoch": 0.77, - "learning_rate": 1.1295458588085116e-05, - "loss": 2.362, - "step": 443890 - }, - { - "epoch": 0.77, - "learning_rate": 1.129458664815829e-05, - "loss": 2.2924, - "step": 443900 - }, - { - "epoch": 0.77, - "learning_rate": 1.1293714708231462e-05, - "loss": 2.2876, - "step": 443910 - }, - { - "epoch": 0.77, - "learning_rate": 1.1292842768304636e-05, - "loss": 2.2846, - "step": 443920 - }, - { - "epoch": 0.77, - "learning_rate": 1.1291970828377808e-05, - "loss": 2.281, - "step": 443930 - }, - { - "epoch": 0.77, - "learning_rate": 1.1291098888450982e-05, - "loss": 2.2607, - "step": 443940 - }, - { - "epoch": 0.77, - "learning_rate": 1.1290226948524154e-05, - "loss": 2.2328, - "step": 443950 - }, - { - "epoch": 0.77, - "learning_rate": 1.1289355008597328e-05, - "loss": 2.3527, - "step": 443960 - }, - { - "epoch": 0.77, - "learning_rate": 1.1288483068670502e-05, - "loss": 2.2653, - "step": 443970 - }, - { - "epoch": 0.77, - "learning_rate": 1.1287611128743675e-05, - "loss": 2.2704, - "step": 443980 - }, - { - "epoch": 0.77, - "learning_rate": 1.1286739188816847e-05, - "loss": 2.2154, - "step": 443990 - }, - { - "epoch": 0.77, - "learning_rate": 1.1285867248890021e-05, - "loss": 2.4098, - "step": 444000 - }, - { - "epoch": 0.77, - "learning_rate": 1.1284995308963195e-05, - "loss": 2.1601, - "step": 444010 - }, - { - "epoch": 0.77, - "learning_rate": 1.1284123369036367e-05, - "loss": 2.2257, - "step": 444020 - }, - { - "epoch": 0.77, - "learning_rate": 1.128325142910954e-05, - "loss": 2.3907, - "step": 444030 - }, - { - "epoch": 0.77, - "learning_rate": 1.1282379489182713e-05, - "loss": 2.3331, - "step": 444040 - }, - { - "epoch": 0.77, - "learning_rate": 1.1281507549255888e-05, - "loss": 2.2241, - "step": 444050 - }, - { - "epoch": 0.77, - "learning_rate": 1.128063560932906e-05, - "loss": 2.2878, - "step": 444060 - }, - { - "epoch": 0.77, - "learning_rate": 1.1279763669402234e-05, - "loss": 2.1922, - "step": 444070 - }, - { - "epoch": 0.77, - "learning_rate": 1.1278891729475406e-05, - "loss": 2.1935, - "step": 444080 - }, - { - "epoch": 0.77, - "learning_rate": 1.127801978954858e-05, - "loss": 2.257, - "step": 444090 - }, - { - "epoch": 0.77, - "learning_rate": 1.1277147849621752e-05, - "loss": 2.2388, - "step": 444100 - }, - { - "epoch": 0.77, - "learning_rate": 1.1276275909694926e-05, - "loss": 2.3457, - "step": 444110 - }, - { - "epoch": 0.77, - "learning_rate": 1.12754039697681e-05, - "loss": 2.3185, - "step": 444120 - }, - { - "epoch": 0.77, - "learning_rate": 1.1274532029841273e-05, - "loss": 2.2908, - "step": 444130 - }, - { - "epoch": 0.77, - "learning_rate": 1.1273660089914445e-05, - "loss": 2.3729, - "step": 444140 - }, - { - "epoch": 0.77, - "learning_rate": 1.127278814998762e-05, - "loss": 2.295, - "step": 444150 - }, - { - "epoch": 0.77, - "learning_rate": 1.1271916210060793e-05, - "loss": 2.3062, - "step": 444160 - }, - { - "epoch": 0.77, - "learning_rate": 1.1271044270133965e-05, - "loss": 2.3516, - "step": 444170 - }, - { - "epoch": 0.77, - "learning_rate": 1.1270172330207139e-05, - "loss": 2.1769, - "step": 444180 - }, - { - "epoch": 0.77, - "learning_rate": 1.1269300390280311e-05, - "loss": 2.2359, - "step": 444190 - }, - { - "epoch": 0.77, - "learning_rate": 1.1268428450353485e-05, - "loss": 2.3965, - "step": 444200 - }, - { - "epoch": 0.77, - "learning_rate": 1.1267556510426658e-05, - "loss": 2.2488, - "step": 444210 - }, - { - "epoch": 0.77, - "learning_rate": 1.1266684570499832e-05, - "loss": 2.2517, - "step": 444220 - }, - { - "epoch": 0.77, - "learning_rate": 1.1265812630573004e-05, - "loss": 2.1965, - "step": 444230 - }, - { - "epoch": 0.77, - "learning_rate": 1.1264940690646178e-05, - "loss": 2.2403, - "step": 444240 - }, - { - "epoch": 0.77, - "learning_rate": 1.126406875071935e-05, - "loss": 2.2833, - "step": 444250 - }, - { - "epoch": 0.77, - "learning_rate": 1.1263196810792524e-05, - "loss": 2.2581, - "step": 444260 - }, - { - "epoch": 0.77, - "learning_rate": 1.1262324870865696e-05, - "loss": 2.291, - "step": 444270 - }, - { - "epoch": 0.77, - "learning_rate": 1.126145293093887e-05, - "loss": 2.2796, - "step": 444280 - }, - { - "epoch": 0.77, - "learning_rate": 1.1260580991012045e-05, - "loss": 2.2586, - "step": 444290 - }, - { - "epoch": 0.77, - "learning_rate": 1.1259709051085217e-05, - "loss": 2.325, - "step": 444300 - }, - { - "epoch": 0.77, - "learning_rate": 1.1258837111158391e-05, - "loss": 2.3854, - "step": 444310 - }, - { - "epoch": 0.77, - "learning_rate": 1.1257965171231563e-05, - "loss": 2.5011, - "step": 444320 - }, - { - "epoch": 0.77, - "learning_rate": 1.1257093231304737e-05, - "loss": 2.2575, - "step": 444330 - }, - { - "epoch": 0.77, - "learning_rate": 1.1256221291377909e-05, - "loss": 2.1858, - "step": 444340 - }, - { - "epoch": 0.77, - "learning_rate": 1.1255349351451083e-05, - "loss": 2.329, - "step": 444350 - }, - { - "epoch": 0.77, - "learning_rate": 1.1254477411524257e-05, - "loss": 2.3247, - "step": 444360 - }, - { - "epoch": 0.77, - "learning_rate": 1.125360547159743e-05, - "loss": 2.1808, - "step": 444370 - }, - { - "epoch": 0.77, - "learning_rate": 1.1252733531670602e-05, - "loss": 2.2999, - "step": 444380 - }, - { - "epoch": 0.77, - "learning_rate": 1.1251861591743776e-05, - "loss": 2.3184, - "step": 444390 - }, - { - "epoch": 0.77, - "learning_rate": 1.1250989651816948e-05, - "loss": 2.0871, - "step": 444400 - }, - { - "epoch": 0.77, - "learning_rate": 1.1250117711890122e-05, - "loss": 2.3079, - "step": 444410 - }, - { - "epoch": 0.78, - "learning_rate": 1.1249245771963296e-05, - "loss": 2.218, - "step": 444420 - }, - { - "epoch": 0.78, - "learning_rate": 1.1248373832036468e-05, - "loss": 2.2505, - "step": 444430 - }, - { - "epoch": 0.78, - "learning_rate": 1.1247501892109642e-05, - "loss": 2.2965, - "step": 444440 - }, - { - "epoch": 0.78, - "learning_rate": 1.1246629952182815e-05, - "loss": 2.2786, - "step": 444450 - }, - { - "epoch": 0.78, - "learning_rate": 1.1245758012255989e-05, - "loss": 2.2333, - "step": 444460 - }, - { - "epoch": 0.78, - "learning_rate": 1.1244886072329161e-05, - "loss": 2.2494, - "step": 444470 - }, - { - "epoch": 0.78, - "learning_rate": 1.1244014132402335e-05, - "loss": 2.3123, - "step": 444480 - }, - { - "epoch": 0.78, - "learning_rate": 1.1243142192475507e-05, - "loss": 2.1919, - "step": 444490 - }, - { - "epoch": 0.78, - "learning_rate": 1.124227025254868e-05, - "loss": 2.3422, - "step": 444500 - }, - { - "epoch": 0.78, - "learning_rate": 1.1241398312621853e-05, - "loss": 2.1733, - "step": 444510 - }, - { - "epoch": 0.78, - "learning_rate": 1.1240526372695027e-05, - "loss": 2.2518, - "step": 444520 - }, - { - "epoch": 0.78, - "learning_rate": 1.12396544327682e-05, - "loss": 2.3716, - "step": 444530 - }, - { - "epoch": 0.78, - "learning_rate": 1.1238782492841374e-05, - "loss": 2.2074, - "step": 444540 - }, - { - "epoch": 0.78, - "learning_rate": 1.1237910552914548e-05, - "loss": 2.2585, - "step": 444550 - }, - { - "epoch": 0.78, - "learning_rate": 1.123703861298772e-05, - "loss": 2.3049, - "step": 444560 - }, - { - "epoch": 0.78, - "learning_rate": 1.1236166673060894e-05, - "loss": 2.2581, - "step": 444570 - }, - { - "epoch": 0.78, - "learning_rate": 1.1235294733134066e-05, - "loss": 2.379, - "step": 444580 - }, - { - "epoch": 0.78, - "learning_rate": 1.123442279320724e-05, - "loss": 2.3974, - "step": 444590 - }, - { - "epoch": 0.78, - "learning_rate": 1.1233550853280413e-05, - "loss": 2.3748, - "step": 444600 - }, - { - "epoch": 0.78, - "learning_rate": 1.1232678913353587e-05, - "loss": 2.4447, - "step": 444610 - }, - { - "epoch": 0.78, - "learning_rate": 1.123180697342676e-05, - "loss": 2.4431, - "step": 444620 - }, - { - "epoch": 0.78, - "learning_rate": 1.1230935033499933e-05, - "loss": 2.4242, - "step": 444630 - }, - { - "epoch": 0.78, - "learning_rate": 1.1230063093573105e-05, - "loss": 2.2831, - "step": 444640 - }, - { - "epoch": 0.78, - "learning_rate": 1.1229191153646279e-05, - "loss": 2.2753, - "step": 444650 - }, - { - "epoch": 0.78, - "learning_rate": 1.1228319213719451e-05, - "loss": 2.2655, - "step": 444660 - }, - { - "epoch": 0.78, - "learning_rate": 1.1227447273792625e-05, - "loss": 2.2909, - "step": 444670 - }, - { - "epoch": 0.78, - "learning_rate": 1.1226575333865799e-05, - "loss": 2.2935, - "step": 444680 - }, - { - "epoch": 0.78, - "learning_rate": 1.1225703393938972e-05, - "loss": 2.2303, - "step": 444690 - }, - { - "epoch": 0.78, - "learning_rate": 1.1224831454012146e-05, - "loss": 2.2456, - "step": 444700 - }, - { - "epoch": 0.78, - "learning_rate": 1.1223959514085318e-05, - "loss": 2.2644, - "step": 444710 - }, - { - "epoch": 0.78, - "learning_rate": 1.1223087574158492e-05, - "loss": 2.2878, - "step": 444720 - }, - { - "epoch": 0.78, - "learning_rate": 1.1222215634231664e-05, - "loss": 2.3468, - "step": 444730 - }, - { - "epoch": 0.78, - "learning_rate": 1.1221343694304838e-05, - "loss": 2.3988, - "step": 444740 - }, - { - "epoch": 0.78, - "learning_rate": 1.122047175437801e-05, - "loss": 2.2817, - "step": 444750 - }, - { - "epoch": 0.78, - "learning_rate": 1.1219599814451184e-05, - "loss": 2.2633, - "step": 444760 - }, - { - "epoch": 0.78, - "learning_rate": 1.1218727874524357e-05, - "loss": 2.3469, - "step": 444770 - }, - { - "epoch": 0.78, - "learning_rate": 1.1217855934597531e-05, - "loss": 2.2329, - "step": 444780 - }, - { - "epoch": 0.78, - "learning_rate": 1.1216983994670703e-05, - "loss": 2.311, - "step": 444790 - }, - { - "epoch": 0.78, - "learning_rate": 1.1216112054743877e-05, - "loss": 2.2568, - "step": 444800 - }, - { - "epoch": 0.78, - "learning_rate": 1.121524011481705e-05, - "loss": 2.2154, - "step": 444810 - }, - { - "epoch": 0.78, - "learning_rate": 1.1214368174890223e-05, - "loss": 2.2415, - "step": 444820 - }, - { - "epoch": 0.78, - "learning_rate": 1.1213496234963397e-05, - "loss": 2.3039, - "step": 444830 - }, - { - "epoch": 0.78, - "learning_rate": 1.1212624295036569e-05, - "loss": 2.3384, - "step": 444840 - }, - { - "epoch": 0.78, - "learning_rate": 1.1211752355109744e-05, - "loss": 2.3308, - "step": 444850 - }, - { - "epoch": 0.78, - "learning_rate": 1.1210880415182916e-05, - "loss": 2.3205, - "step": 444860 - }, - { - "epoch": 0.78, - "learning_rate": 1.121000847525609e-05, - "loss": 2.2237, - "step": 444870 - }, - { - "epoch": 0.78, - "learning_rate": 1.1209136535329262e-05, - "loss": 2.2971, - "step": 444880 - }, - { - "epoch": 0.78, - "learning_rate": 1.1208264595402436e-05, - "loss": 2.3601, - "step": 444890 - }, - { - "epoch": 0.78, - "learning_rate": 1.1207392655475608e-05, - "loss": 2.2509, - "step": 444900 - }, - { - "epoch": 0.78, - "learning_rate": 1.1206520715548782e-05, - "loss": 2.2498, - "step": 444910 - }, - { - "epoch": 0.78, - "learning_rate": 1.1205648775621955e-05, - "loss": 2.2865, - "step": 444920 - }, - { - "epoch": 0.78, - "learning_rate": 1.120477683569513e-05, - "loss": 2.3177, - "step": 444930 - }, - { - "epoch": 0.78, - "learning_rate": 1.1203904895768301e-05, - "loss": 2.322, - "step": 444940 - }, - { - "epoch": 0.78, - "learning_rate": 1.1203032955841475e-05, - "loss": 2.3145, - "step": 444950 - }, - { - "epoch": 0.78, - "learning_rate": 1.1202161015914649e-05, - "loss": 2.0987, - "step": 444960 - }, - { - "epoch": 0.78, - "learning_rate": 1.1201289075987821e-05, - "loss": 2.2856, - "step": 444970 - }, - { - "epoch": 0.78, - "learning_rate": 1.1200417136060995e-05, - "loss": 2.237, - "step": 444980 - }, - { - "epoch": 0.78, - "learning_rate": 1.1199545196134167e-05, - "loss": 2.2878, - "step": 444990 - }, - { - "epoch": 0.78, - "learning_rate": 1.119867325620734e-05, - "loss": 2.323, - "step": 445000 - }, - { - "epoch": 0.78, - "learning_rate": 1.1197801316280514e-05, - "loss": 2.4189, - "step": 445010 - }, - { - "epoch": 0.78, - "learning_rate": 1.1196929376353688e-05, - "loss": 2.3263, - "step": 445020 - }, - { - "epoch": 0.78, - "learning_rate": 1.119605743642686e-05, - "loss": 2.2098, - "step": 445030 - }, - { - "epoch": 0.78, - "learning_rate": 1.1195185496500034e-05, - "loss": 2.2601, - "step": 445040 - }, - { - "epoch": 0.78, - "learning_rate": 1.1194313556573206e-05, - "loss": 2.2623, - "step": 445050 - }, - { - "epoch": 0.78, - "learning_rate": 1.119344161664638e-05, - "loss": 2.2819, - "step": 445060 - }, - { - "epoch": 0.78, - "learning_rate": 1.1192569676719552e-05, - "loss": 2.3501, - "step": 445070 - }, - { - "epoch": 0.78, - "learning_rate": 1.1191697736792726e-05, - "loss": 2.2116, - "step": 445080 - }, - { - "epoch": 0.78, - "learning_rate": 1.1190825796865901e-05, - "loss": 2.403, - "step": 445090 - }, - { - "epoch": 0.78, - "learning_rate": 1.1189953856939073e-05, - "loss": 2.2098, - "step": 445100 - }, - { - "epoch": 0.78, - "learning_rate": 1.1189081917012247e-05, - "loss": 2.1387, - "step": 445110 - }, - { - "epoch": 0.78, - "learning_rate": 1.1188209977085419e-05, - "loss": 2.2139, - "step": 445120 - }, - { - "epoch": 0.78, - "learning_rate": 1.1187338037158593e-05, - "loss": 2.2802, - "step": 445130 - }, - { - "epoch": 0.78, - "learning_rate": 1.1186466097231765e-05, - "loss": 2.3202, - "step": 445140 - }, - { - "epoch": 0.78, - "learning_rate": 1.1185594157304939e-05, - "loss": 2.2726, - "step": 445150 - }, - { - "epoch": 0.78, - "learning_rate": 1.1184722217378112e-05, - "loss": 2.2588, - "step": 445160 - }, - { - "epoch": 0.78, - "learning_rate": 1.1183850277451286e-05, - "loss": 2.3647, - "step": 445170 - }, - { - "epoch": 0.78, - "learning_rate": 1.1182978337524458e-05, - "loss": 2.4024, - "step": 445180 - }, - { - "epoch": 0.78, - "learning_rate": 1.1182106397597632e-05, - "loss": 2.1812, - "step": 445190 - }, - { - "epoch": 0.78, - "learning_rate": 1.1181234457670804e-05, - "loss": 2.4287, - "step": 445200 - }, - { - "epoch": 0.78, - "learning_rate": 1.1180362517743978e-05, - "loss": 2.2527, - "step": 445210 - }, - { - "epoch": 0.78, - "learning_rate": 1.1179490577817152e-05, - "loss": 2.2525, - "step": 445220 - }, - { - "epoch": 0.78, - "learning_rate": 1.1178618637890324e-05, - "loss": 2.345, - "step": 445230 - }, - { - "epoch": 0.78, - "learning_rate": 1.1177746697963497e-05, - "loss": 2.3535, - "step": 445240 - }, - { - "epoch": 0.78, - "learning_rate": 1.1176874758036671e-05, - "loss": 2.2037, - "step": 445250 - }, - { - "epoch": 0.78, - "learning_rate": 1.1176002818109845e-05, - "loss": 2.2121, - "step": 445260 - }, - { - "epoch": 0.78, - "learning_rate": 1.1175130878183017e-05, - "loss": 2.2654, - "step": 445270 - }, - { - "epoch": 0.78, - "learning_rate": 1.1174258938256191e-05, - "loss": 2.2105, - "step": 445280 - }, - { - "epoch": 0.78, - "learning_rate": 1.1173386998329363e-05, - "loss": 2.2731, - "step": 445290 - }, - { - "epoch": 0.78, - "learning_rate": 1.1172515058402537e-05, - "loss": 2.3115, - "step": 445300 - }, - { - "epoch": 0.78, - "learning_rate": 1.1171643118475709e-05, - "loss": 2.2629, - "step": 445310 - }, - { - "epoch": 0.78, - "learning_rate": 1.1170771178548883e-05, - "loss": 2.2872, - "step": 445320 - }, - { - "epoch": 0.78, - "learning_rate": 1.1169899238622056e-05, - "loss": 2.3385, - "step": 445330 - }, - { - "epoch": 0.78, - "learning_rate": 1.116902729869523e-05, - "loss": 2.1549, - "step": 445340 - }, - { - "epoch": 0.78, - "learning_rate": 1.1168155358768404e-05, - "loss": 2.2786, - "step": 445350 - }, - { - "epoch": 0.78, - "learning_rate": 1.1167283418841576e-05, - "loss": 2.3616, - "step": 445360 - }, - { - "epoch": 0.78, - "learning_rate": 1.116641147891475e-05, - "loss": 2.3212, - "step": 445370 - }, - { - "epoch": 0.78, - "learning_rate": 1.1165539538987922e-05, - "loss": 2.2334, - "step": 445380 - }, - { - "epoch": 0.78, - "learning_rate": 1.1164667599061096e-05, - "loss": 2.2739, - "step": 445390 - }, - { - "epoch": 0.78, - "learning_rate": 1.116379565913427e-05, - "loss": 2.176, - "step": 445400 - }, - { - "epoch": 0.78, - "learning_rate": 1.1162923719207443e-05, - "loss": 2.3715, - "step": 445410 - }, - { - "epoch": 0.78, - "learning_rate": 1.1162051779280615e-05, - "loss": 2.3533, - "step": 445420 - }, - { - "epoch": 0.78, - "learning_rate": 1.1161179839353789e-05, - "loss": 2.3252, - "step": 445430 - }, - { - "epoch": 0.78, - "learning_rate": 1.1160307899426961e-05, - "loss": 2.3687, - "step": 445440 - }, - { - "epoch": 0.78, - "learning_rate": 1.1159435959500135e-05, - "loss": 2.1664, - "step": 445450 - }, - { - "epoch": 0.78, - "learning_rate": 1.1158564019573307e-05, - "loss": 2.3211, - "step": 445460 - }, - { - "epoch": 0.78, - "learning_rate": 1.115769207964648e-05, - "loss": 2.3419, - "step": 445470 - }, - { - "epoch": 0.78, - "learning_rate": 1.1156820139719654e-05, - "loss": 2.1386, - "step": 445480 - }, - { - "epoch": 0.78, - "learning_rate": 1.1155948199792828e-05, - "loss": 2.2662, - "step": 445490 - }, - { - "epoch": 0.78, - "learning_rate": 1.1155076259866002e-05, - "loss": 2.2983, - "step": 445500 - }, - { - "epoch": 0.78, - "learning_rate": 1.1154204319939174e-05, - "loss": 2.3353, - "step": 445510 - }, - { - "epoch": 0.78, - "learning_rate": 1.1153332380012348e-05, - "loss": 2.2877, - "step": 445520 - }, - { - "epoch": 0.78, - "learning_rate": 1.115246044008552e-05, - "loss": 2.2556, - "step": 445530 - }, - { - "epoch": 0.78, - "learning_rate": 1.1151588500158694e-05, - "loss": 2.3652, - "step": 445540 - }, - { - "epoch": 0.78, - "learning_rate": 1.1150716560231866e-05, - "loss": 2.2252, - "step": 445550 - }, - { - "epoch": 0.78, - "learning_rate": 1.114984462030504e-05, - "loss": 2.2733, - "step": 445560 - }, - { - "epoch": 0.78, - "learning_rate": 1.1148972680378213e-05, - "loss": 2.2063, - "step": 445570 - }, - { - "epoch": 0.78, - "learning_rate": 1.1148100740451387e-05, - "loss": 2.3213, - "step": 445580 - }, - { - "epoch": 0.78, - "learning_rate": 1.1147228800524559e-05, - "loss": 2.31, - "step": 445590 - }, - { - "epoch": 0.78, - "learning_rate": 1.1146356860597733e-05, - "loss": 2.238, - "step": 445600 - }, - { - "epoch": 0.78, - "learning_rate": 1.1145484920670907e-05, - "loss": 2.3359, - "step": 445610 - }, - { - "epoch": 0.78, - "learning_rate": 1.1144612980744079e-05, - "loss": 2.2639, - "step": 445620 - }, - { - "epoch": 0.78, - "learning_rate": 1.1143741040817252e-05, - "loss": 2.3284, - "step": 445630 - }, - { - "epoch": 0.78, - "learning_rate": 1.1142869100890426e-05, - "loss": 2.2822, - "step": 445640 - }, - { - "epoch": 0.78, - "learning_rate": 1.11419971609636e-05, - "loss": 2.2232, - "step": 445650 - }, - { - "epoch": 0.78, - "learning_rate": 1.1141125221036772e-05, - "loss": 2.244, - "step": 445660 - }, - { - "epoch": 0.78, - "learning_rate": 1.1140253281109946e-05, - "loss": 2.2085, - "step": 445670 - }, - { - "epoch": 0.78, - "learning_rate": 1.1139381341183118e-05, - "loss": 2.2299, - "step": 445680 - }, - { - "epoch": 0.78, - "learning_rate": 1.1138509401256292e-05, - "loss": 2.339, - "step": 445690 - }, - { - "epoch": 0.78, - "learning_rate": 1.1137637461329464e-05, - "loss": 2.3712, - "step": 445700 - }, - { - "epoch": 0.78, - "learning_rate": 1.1136765521402638e-05, - "loss": 2.35, - "step": 445710 - }, - { - "epoch": 0.78, - "learning_rate": 1.1135893581475811e-05, - "loss": 2.3036, - "step": 445720 - }, - { - "epoch": 0.78, - "learning_rate": 1.1135021641548985e-05, - "loss": 2.2134, - "step": 445730 - }, - { - "epoch": 0.78, - "learning_rate": 1.1134149701622159e-05, - "loss": 2.3258, - "step": 445740 - }, - { - "epoch": 0.78, - "learning_rate": 1.1133277761695331e-05, - "loss": 2.3676, - "step": 445750 - }, - { - "epoch": 0.78, - "learning_rate": 1.1132405821768505e-05, - "loss": 2.3372, - "step": 445760 - }, - { - "epoch": 0.78, - "learning_rate": 1.1131533881841677e-05, - "loss": 2.2774, - "step": 445770 - }, - { - "epoch": 0.78, - "learning_rate": 1.113066194191485e-05, - "loss": 2.2449, - "step": 445780 - }, - { - "epoch": 0.78, - "learning_rate": 1.1129790001988023e-05, - "loss": 2.334, - "step": 445790 - }, - { - "epoch": 0.78, - "learning_rate": 1.1128918062061196e-05, - "loss": 2.355, - "step": 445800 - }, - { - "epoch": 0.78, - "learning_rate": 1.112804612213437e-05, - "loss": 2.3197, - "step": 445810 - }, - { - "epoch": 0.78, - "learning_rate": 1.1127174182207544e-05, - "loss": 2.2316, - "step": 445820 - }, - { - "epoch": 0.78, - "learning_rate": 1.1126302242280716e-05, - "loss": 2.4049, - "step": 445830 - }, - { - "epoch": 0.78, - "learning_rate": 1.112543030235389e-05, - "loss": 2.2272, - "step": 445840 - }, - { - "epoch": 0.78, - "learning_rate": 1.1124558362427062e-05, - "loss": 2.2697, - "step": 445850 - }, - { - "epoch": 0.78, - "learning_rate": 1.1123686422500236e-05, - "loss": 2.29, - "step": 445860 - }, - { - "epoch": 0.78, - "learning_rate": 1.1122814482573408e-05, - "loss": 2.239, - "step": 445870 - }, - { - "epoch": 0.78, - "learning_rate": 1.1121942542646581e-05, - "loss": 2.403, - "step": 445880 - }, - { - "epoch": 0.78, - "learning_rate": 1.1121070602719757e-05, - "loss": 2.167, - "step": 445890 - }, - { - "epoch": 0.78, - "learning_rate": 1.1120198662792929e-05, - "loss": 2.2898, - "step": 445900 - }, - { - "epoch": 0.78, - "learning_rate": 1.1119326722866103e-05, - "loss": 2.2417, - "step": 445910 - }, - { - "epoch": 0.78, - "learning_rate": 1.1118454782939275e-05, - "loss": 2.3041, - "step": 445920 - }, - { - "epoch": 0.78, - "learning_rate": 1.1117582843012449e-05, - "loss": 2.2393, - "step": 445930 - }, - { - "epoch": 0.78, - "learning_rate": 1.111671090308562e-05, - "loss": 2.1993, - "step": 445940 - }, - { - "epoch": 0.78, - "learning_rate": 1.1115838963158794e-05, - "loss": 2.2735, - "step": 445950 - }, - { - "epoch": 0.78, - "learning_rate": 1.1114967023231968e-05, - "loss": 2.2793, - "step": 445960 - }, - { - "epoch": 0.78, - "learning_rate": 1.1114095083305142e-05, - "loss": 2.2112, - "step": 445970 - }, - { - "epoch": 0.78, - "learning_rate": 1.1113223143378314e-05, - "loss": 2.2422, - "step": 445980 - }, - { - "epoch": 0.78, - "learning_rate": 1.1112351203451488e-05, - "loss": 2.3416, - "step": 445990 - }, - { - "epoch": 0.78, - "learning_rate": 1.111147926352466e-05, - "loss": 2.3276, - "step": 446000 - }, - { - "epoch": 0.78, - "learning_rate": 1.1110607323597834e-05, - "loss": 2.2889, - "step": 446010 - }, - { - "epoch": 0.78, - "learning_rate": 1.1109735383671007e-05, - "loss": 2.3087, - "step": 446020 - }, - { - "epoch": 0.78, - "learning_rate": 1.110886344374418e-05, - "loss": 2.2605, - "step": 446030 - }, - { - "epoch": 0.78, - "learning_rate": 1.1107991503817353e-05, - "loss": 2.1994, - "step": 446040 - }, - { - "epoch": 0.78, - "learning_rate": 1.1107119563890527e-05, - "loss": 2.3569, - "step": 446050 - }, - { - "epoch": 0.78, - "learning_rate": 1.1106247623963701e-05, - "loss": 2.254, - "step": 446060 - }, - { - "epoch": 0.78, - "learning_rate": 1.1105375684036873e-05, - "loss": 2.2616, - "step": 446070 - }, - { - "epoch": 0.78, - "learning_rate": 1.1104503744110047e-05, - "loss": 2.2765, - "step": 446080 - }, - { - "epoch": 0.78, - "learning_rate": 1.1103631804183219e-05, - "loss": 2.2048, - "step": 446090 - }, - { - "epoch": 0.78, - "learning_rate": 1.1102759864256393e-05, - "loss": 2.3075, - "step": 446100 - }, - { - "epoch": 0.78, - "learning_rate": 1.1101887924329565e-05, - "loss": 2.3581, - "step": 446110 - }, - { - "epoch": 0.78, - "learning_rate": 1.1101015984402738e-05, - "loss": 2.3565, - "step": 446120 - }, - { - "epoch": 0.78, - "learning_rate": 1.1100144044475912e-05, - "loss": 2.2526, - "step": 446130 - }, - { - "epoch": 0.78, - "learning_rate": 1.1099272104549086e-05, - "loss": 2.2316, - "step": 446140 - }, - { - "epoch": 0.78, - "learning_rate": 1.109840016462226e-05, - "loss": 2.2508, - "step": 446150 - }, - { - "epoch": 0.78, - "learning_rate": 1.1097528224695432e-05, - "loss": 2.237, - "step": 446160 - }, - { - "epoch": 0.78, - "learning_rate": 1.1096656284768606e-05, - "loss": 2.3562, - "step": 446170 - }, - { - "epoch": 0.78, - "learning_rate": 1.1095784344841778e-05, - "loss": 2.2726, - "step": 446180 - }, - { - "epoch": 0.78, - "learning_rate": 1.1094912404914951e-05, - "loss": 2.2558, - "step": 446190 - }, - { - "epoch": 0.78, - "learning_rate": 1.1094040464988125e-05, - "loss": 2.3041, - "step": 446200 - }, - { - "epoch": 0.78, - "learning_rate": 1.1093168525061299e-05, - "loss": 2.3083, - "step": 446210 - }, - { - "epoch": 0.78, - "learning_rate": 1.1092296585134471e-05, - "loss": 2.2715, - "step": 446220 - }, - { - "epoch": 0.78, - "learning_rate": 1.1091424645207645e-05, - "loss": 2.1642, - "step": 446230 - }, - { - "epoch": 0.78, - "learning_rate": 1.1090552705280817e-05, - "loss": 2.2833, - "step": 446240 - }, - { - "epoch": 0.78, - "learning_rate": 1.108968076535399e-05, - "loss": 2.2689, - "step": 446250 - }, - { - "epoch": 0.78, - "learning_rate": 1.1088808825427163e-05, - "loss": 2.2884, - "step": 446260 - }, - { - "epoch": 0.78, - "learning_rate": 1.1087936885500336e-05, - "loss": 2.2104, - "step": 446270 - }, - { - "epoch": 0.78, - "learning_rate": 1.108706494557351e-05, - "loss": 2.2287, - "step": 446280 - }, - { - "epoch": 0.78, - "learning_rate": 1.1086193005646684e-05, - "loss": 2.3536, - "step": 446290 - }, - { - "epoch": 0.78, - "learning_rate": 1.1085321065719858e-05, - "loss": 2.1844, - "step": 446300 - }, - { - "epoch": 0.78, - "learning_rate": 1.108444912579303e-05, - "loss": 2.3056, - "step": 446310 - }, - { - "epoch": 0.78, - "learning_rate": 1.1083577185866204e-05, - "loss": 2.2632, - "step": 446320 - }, - { - "epoch": 0.78, - "learning_rate": 1.1082705245939376e-05, - "loss": 2.334, - "step": 446330 - }, - { - "epoch": 0.78, - "learning_rate": 1.108183330601255e-05, - "loss": 2.2087, - "step": 446340 - }, - { - "epoch": 0.78, - "learning_rate": 1.1080961366085722e-05, - "loss": 2.2475, - "step": 446350 - }, - { - "epoch": 0.78, - "learning_rate": 1.1080089426158895e-05, - "loss": 2.3455, - "step": 446360 - }, - { - "epoch": 0.78, - "learning_rate": 1.1079217486232069e-05, - "loss": 2.2522, - "step": 446370 - }, - { - "epoch": 0.78, - "learning_rate": 1.1078345546305243e-05, - "loss": 2.2919, - "step": 446380 - }, - { - "epoch": 0.78, - "learning_rate": 1.1077473606378415e-05, - "loss": 2.2653, - "step": 446390 - }, - { - "epoch": 0.78, - "learning_rate": 1.1076601666451589e-05, - "loss": 2.3586, - "step": 446400 - }, - { - "epoch": 0.78, - "learning_rate": 1.1075729726524762e-05, - "loss": 2.1692, - "step": 446410 - }, - { - "epoch": 0.78, - "learning_rate": 1.1074857786597935e-05, - "loss": 2.2088, - "step": 446420 - }, - { - "epoch": 0.78, - "learning_rate": 1.1073985846671108e-05, - "loss": 2.2327, - "step": 446430 - }, - { - "epoch": 0.78, - "learning_rate": 1.1073113906744282e-05, - "loss": 2.3086, - "step": 446440 - }, - { - "epoch": 0.78, - "learning_rate": 1.1072241966817456e-05, - "loss": 2.3474, - "step": 446450 - }, - { - "epoch": 0.78, - "learning_rate": 1.1071370026890628e-05, - "loss": 2.3636, - "step": 446460 - }, - { - "epoch": 0.78, - "learning_rate": 1.1070498086963802e-05, - "loss": 2.2901, - "step": 446470 - }, - { - "epoch": 0.78, - "learning_rate": 1.1069626147036974e-05, - "loss": 2.3037, - "step": 446480 - }, - { - "epoch": 0.78, - "learning_rate": 1.1068754207110148e-05, - "loss": 2.229, - "step": 446490 - }, - { - "epoch": 0.78, - "learning_rate": 1.106788226718332e-05, - "loss": 2.2816, - "step": 446500 - }, - { - "epoch": 0.78, - "learning_rate": 1.1067010327256493e-05, - "loss": 2.1807, - "step": 446510 - }, - { - "epoch": 0.78, - "learning_rate": 1.1066138387329667e-05, - "loss": 2.2818, - "step": 446520 - }, - { - "epoch": 0.78, - "learning_rate": 1.1065266447402841e-05, - "loss": 2.3987, - "step": 446530 - }, - { - "epoch": 0.78, - "learning_rate": 1.1064394507476015e-05, - "loss": 2.2472, - "step": 446540 - }, - { - "epoch": 0.78, - "learning_rate": 1.1063522567549187e-05, - "loss": 2.2862, - "step": 446550 - }, - { - "epoch": 0.78, - "learning_rate": 1.106265062762236e-05, - "loss": 2.3113, - "step": 446560 - }, - { - "epoch": 0.78, - "learning_rate": 1.1061778687695533e-05, - "loss": 2.2414, - "step": 446570 - }, - { - "epoch": 0.78, - "learning_rate": 1.1060906747768706e-05, - "loss": 2.3419, - "step": 446580 - }, - { - "epoch": 0.78, - "learning_rate": 1.1060034807841878e-05, - "loss": 2.1414, - "step": 446590 - }, - { - "epoch": 0.78, - "learning_rate": 1.1059162867915052e-05, - "loss": 2.3085, - "step": 446600 - }, - { - "epoch": 0.78, - "learning_rate": 1.1058290927988226e-05, - "loss": 2.1271, - "step": 446610 - }, - { - "epoch": 0.78, - "learning_rate": 1.10574189880614e-05, - "loss": 2.0722, - "step": 446620 - }, - { - "epoch": 0.78, - "learning_rate": 1.1056547048134572e-05, - "loss": 2.2798, - "step": 446630 - }, - { - "epoch": 0.78, - "learning_rate": 1.1055675108207746e-05, - "loss": 2.2962, - "step": 446640 - }, - { - "epoch": 0.78, - "learning_rate": 1.1054803168280918e-05, - "loss": 2.2891, - "step": 446650 - }, - { - "epoch": 0.78, - "learning_rate": 1.1053931228354091e-05, - "loss": 2.2241, - "step": 446660 - }, - { - "epoch": 0.78, - "learning_rate": 1.1053059288427265e-05, - "loss": 2.191, - "step": 446670 - }, - { - "epoch": 0.78, - "learning_rate": 1.1052187348500439e-05, - "loss": 2.2935, - "step": 446680 - }, - { - "epoch": 0.78, - "learning_rate": 1.1051315408573613e-05, - "loss": 2.4007, - "step": 446690 - }, - { - "epoch": 0.78, - "learning_rate": 1.1050443468646785e-05, - "loss": 2.3889, - "step": 446700 - }, - { - "epoch": 0.78, - "learning_rate": 1.1049571528719959e-05, - "loss": 2.3619, - "step": 446710 - }, - { - "epoch": 0.78, - "learning_rate": 1.104869958879313e-05, - "loss": 2.3061, - "step": 446720 - }, - { - "epoch": 0.78, - "learning_rate": 1.1047827648866304e-05, - "loss": 2.3259, - "step": 446730 - }, - { - "epoch": 0.78, - "learning_rate": 1.1046955708939477e-05, - "loss": 2.3453, - "step": 446740 - }, - { - "epoch": 0.78, - "learning_rate": 1.104608376901265e-05, - "loss": 2.3418, - "step": 446750 - }, - { - "epoch": 0.78, - "learning_rate": 1.1045211829085824e-05, - "loss": 2.2666, - "step": 446760 - }, - { - "epoch": 0.78, - "learning_rate": 1.1044339889158998e-05, - "loss": 2.351, - "step": 446770 - }, - { - "epoch": 0.78, - "learning_rate": 1.104346794923217e-05, - "loss": 2.2604, - "step": 446780 - }, - { - "epoch": 0.78, - "learning_rate": 1.1042596009305344e-05, - "loss": 2.1564, - "step": 446790 - }, - { - "epoch": 0.78, - "learning_rate": 1.1041724069378516e-05, - "loss": 2.3085, - "step": 446800 - }, - { - "epoch": 0.78, - "learning_rate": 1.104085212945169e-05, - "loss": 2.332, - "step": 446810 - }, - { - "epoch": 0.78, - "learning_rate": 1.1039980189524863e-05, - "loss": 2.2855, - "step": 446820 - }, - { - "epoch": 0.78, - "learning_rate": 1.1039108249598035e-05, - "loss": 2.4223, - "step": 446830 - }, - { - "epoch": 0.78, - "learning_rate": 1.103823630967121e-05, - "loss": 2.2385, - "step": 446840 - }, - { - "epoch": 0.78, - "learning_rate": 1.1037364369744383e-05, - "loss": 2.1582, - "step": 446850 - }, - { - "epoch": 0.78, - "learning_rate": 1.1036492429817557e-05, - "loss": 2.3146, - "step": 446860 - }, - { - "epoch": 0.78, - "learning_rate": 1.1035620489890729e-05, - "loss": 2.3067, - "step": 446870 - }, - { - "epoch": 0.78, - "learning_rate": 1.1034748549963903e-05, - "loss": 2.2691, - "step": 446880 - }, - { - "epoch": 0.78, - "learning_rate": 1.1033876610037075e-05, - "loss": 2.349, - "step": 446890 - }, - { - "epoch": 0.78, - "learning_rate": 1.1033004670110248e-05, - "loss": 2.4146, - "step": 446900 - }, - { - "epoch": 0.78, - "learning_rate": 1.103213273018342e-05, - "loss": 2.2405, - "step": 446910 - }, - { - "epoch": 0.78, - "learning_rate": 1.1031260790256594e-05, - "loss": 2.2862, - "step": 446920 - }, - { - "epoch": 0.78, - "learning_rate": 1.1030388850329768e-05, - "loss": 2.3093, - "step": 446930 - }, - { - "epoch": 0.78, - "learning_rate": 1.1029516910402942e-05, - "loss": 2.3189, - "step": 446940 - }, - { - "epoch": 0.78, - "learning_rate": 1.1028644970476116e-05, - "loss": 2.2441, - "step": 446950 - }, - { - "epoch": 0.78, - "learning_rate": 1.1027773030549288e-05, - "loss": 2.2554, - "step": 446960 - }, - { - "epoch": 0.78, - "learning_rate": 1.1026901090622461e-05, - "loss": 2.3194, - "step": 446970 - }, - { - "epoch": 0.78, - "learning_rate": 1.1026029150695633e-05, - "loss": 2.2225, - "step": 446980 - }, - { - "epoch": 0.78, - "learning_rate": 1.1025157210768807e-05, - "loss": 2.214, - "step": 446990 - }, - { - "epoch": 0.78, - "learning_rate": 1.1024285270841981e-05, - "loss": 2.3019, - "step": 447000 - }, - { - "epoch": 0.78, - "learning_rate": 1.1023413330915155e-05, - "loss": 2.3267, - "step": 447010 - }, - { - "epoch": 0.78, - "learning_rate": 1.1022541390988327e-05, - "loss": 2.3323, - "step": 447020 - }, - { - "epoch": 0.78, - "learning_rate": 1.10216694510615e-05, - "loss": 2.433, - "step": 447030 - }, - { - "epoch": 0.78, - "learning_rate": 1.1020797511134673e-05, - "loss": 2.3244, - "step": 447040 - }, - { - "epoch": 0.78, - "learning_rate": 1.1019925571207846e-05, - "loss": 2.3029, - "step": 447050 - }, - { - "epoch": 0.78, - "learning_rate": 1.1019053631281019e-05, - "loss": 2.2674, - "step": 447060 - }, - { - "epoch": 0.78, - "learning_rate": 1.1018181691354192e-05, - "loss": 2.2632, - "step": 447070 - }, - { - "epoch": 0.78, - "learning_rate": 1.1017309751427366e-05, - "loss": 2.2927, - "step": 447080 - }, - { - "epoch": 0.78, - "learning_rate": 1.101643781150054e-05, - "loss": 2.2025, - "step": 447090 - }, - { - "epoch": 0.78, - "learning_rate": 1.1015565871573714e-05, - "loss": 2.1706, - "step": 447100 - }, - { - "epoch": 0.78, - "learning_rate": 1.1014693931646886e-05, - "loss": 2.2141, - "step": 447110 - }, - { - "epoch": 0.78, - "learning_rate": 1.101382199172006e-05, - "loss": 2.3135, - "step": 447120 - }, - { - "epoch": 0.78, - "learning_rate": 1.1012950051793232e-05, - "loss": 2.2779, - "step": 447130 - }, - { - "epoch": 0.78, - "learning_rate": 1.1012078111866405e-05, - "loss": 2.359, - "step": 447140 - }, - { - "epoch": 0.78, - "learning_rate": 1.1011206171939577e-05, - "loss": 2.2618, - "step": 447150 - }, - { - "epoch": 0.78, - "learning_rate": 1.1010334232012751e-05, - "loss": 2.2528, - "step": 447160 - }, - { - "epoch": 0.78, - "learning_rate": 1.1009462292085925e-05, - "loss": 2.36, - "step": 447170 - }, - { - "epoch": 0.78, - "learning_rate": 1.1008590352159099e-05, - "loss": 2.278, - "step": 447180 - }, - { - "epoch": 0.78, - "learning_rate": 1.100771841223227e-05, - "loss": 2.2808, - "step": 447190 - }, - { - "epoch": 0.78, - "learning_rate": 1.1006846472305445e-05, - "loss": 2.4314, - "step": 447200 - }, - { - "epoch": 0.78, - "learning_rate": 1.1005974532378618e-05, - "loss": 2.2784, - "step": 447210 - }, - { - "epoch": 0.78, - "learning_rate": 1.100510259245179e-05, - "loss": 2.2529, - "step": 447220 - }, - { - "epoch": 0.78, - "learning_rate": 1.1004230652524964e-05, - "loss": 2.2777, - "step": 447230 - }, - { - "epoch": 0.78, - "learning_rate": 1.1003358712598138e-05, - "loss": 2.3169, - "step": 447240 - }, - { - "epoch": 0.78, - "learning_rate": 1.1002486772671312e-05, - "loss": 2.2251, - "step": 447250 - }, - { - "epoch": 0.78, - "learning_rate": 1.1001614832744484e-05, - "loss": 2.3217, - "step": 447260 - }, - { - "epoch": 0.78, - "learning_rate": 1.1000742892817658e-05, - "loss": 2.268, - "step": 447270 - }, - { - "epoch": 0.78, - "learning_rate": 1.099987095289083e-05, - "loss": 2.307, - "step": 447280 - }, - { - "epoch": 0.78, - "learning_rate": 1.0998999012964003e-05, - "loss": 2.2134, - "step": 447290 - }, - { - "epoch": 0.78, - "learning_rate": 1.0998127073037175e-05, - "loss": 2.2463, - "step": 447300 - }, - { - "epoch": 0.78, - "learning_rate": 1.099725513311035e-05, - "loss": 2.279, - "step": 447310 - }, - { - "epoch": 0.78, - "learning_rate": 1.0996383193183523e-05, - "loss": 2.3445, - "step": 447320 - }, - { - "epoch": 0.78, - "learning_rate": 1.0995511253256697e-05, - "loss": 2.3498, - "step": 447330 - }, - { - "epoch": 0.78, - "learning_rate": 1.099463931332987e-05, - "loss": 2.2694, - "step": 447340 - }, - { - "epoch": 0.78, - "learning_rate": 1.0993767373403043e-05, - "loss": 2.3334, - "step": 447350 - }, - { - "epoch": 0.78, - "learning_rate": 1.0992895433476216e-05, - "loss": 2.2519, - "step": 447360 - }, - { - "epoch": 0.78, - "learning_rate": 1.0992023493549388e-05, - "loss": 2.3013, - "step": 447370 - }, - { - "epoch": 0.78, - "learning_rate": 1.0991151553622562e-05, - "loss": 2.2051, - "step": 447380 - }, - { - "epoch": 0.78, - "learning_rate": 1.0990279613695734e-05, - "loss": 2.2646, - "step": 447390 - }, - { - "epoch": 0.78, - "learning_rate": 1.0989407673768908e-05, - "loss": 2.1417, - "step": 447400 - }, - { - "epoch": 0.78, - "learning_rate": 1.0988535733842082e-05, - "loss": 2.335, - "step": 447410 - }, - { - "epoch": 0.78, - "learning_rate": 1.0987663793915256e-05, - "loss": 2.2486, - "step": 447420 - }, - { - "epoch": 0.78, - "learning_rate": 1.0986791853988428e-05, - "loss": 2.3027, - "step": 447430 - }, - { - "epoch": 0.78, - "learning_rate": 1.0985919914061601e-05, - "loss": 2.2399, - "step": 447440 - }, - { - "epoch": 0.78, - "learning_rate": 1.0985047974134774e-05, - "loss": 2.3594, - "step": 447450 - }, - { - "epoch": 0.78, - "learning_rate": 1.0984176034207947e-05, - "loss": 2.358, - "step": 447460 - }, - { - "epoch": 0.78, - "learning_rate": 1.0983304094281121e-05, - "loss": 2.2909, - "step": 447470 - }, - { - "epoch": 0.78, - "learning_rate": 1.0982432154354295e-05, - "loss": 2.2096, - "step": 447480 - }, - { - "epoch": 0.78, - "learning_rate": 1.0981560214427469e-05, - "loss": 2.2437, - "step": 447490 - }, - { - "epoch": 0.78, - "learning_rate": 1.098068827450064e-05, - "loss": 2.2955, - "step": 447500 - }, - { - "epoch": 0.78, - "learning_rate": 1.0979816334573814e-05, - "loss": 2.2038, - "step": 447510 - }, - { - "epoch": 0.78, - "learning_rate": 1.0978944394646987e-05, - "loss": 2.3192, - "step": 447520 - }, - { - "epoch": 0.78, - "learning_rate": 1.097807245472016e-05, - "loss": 2.3408, - "step": 447530 - }, - { - "epoch": 0.78, - "learning_rate": 1.0977200514793332e-05, - "loss": 2.2949, - "step": 447540 - }, - { - "epoch": 0.78, - "learning_rate": 1.0976328574866506e-05, - "loss": 2.2573, - "step": 447550 - }, - { - "epoch": 0.78, - "learning_rate": 1.097545663493968e-05, - "loss": 2.2396, - "step": 447560 - }, - { - "epoch": 0.78, - "learning_rate": 1.0974584695012854e-05, - "loss": 2.2342, - "step": 447570 - }, - { - "epoch": 0.78, - "learning_rate": 1.0973712755086026e-05, - "loss": 2.2065, - "step": 447580 - }, - { - "epoch": 0.78, - "learning_rate": 1.09728408151592e-05, - "loss": 2.1327, - "step": 447590 - }, - { - "epoch": 0.78, - "learning_rate": 1.0971968875232372e-05, - "loss": 2.2753, - "step": 447600 - }, - { - "epoch": 0.78, - "learning_rate": 1.0971096935305545e-05, - "loss": 2.4205, - "step": 447610 - }, - { - "epoch": 0.78, - "learning_rate": 1.097022499537872e-05, - "loss": 2.2626, - "step": 447620 - }, - { - "epoch": 0.78, - "learning_rate": 1.0969353055451891e-05, - "loss": 2.2871, - "step": 447630 - }, - { - "epoch": 0.78, - "learning_rate": 1.0968481115525065e-05, - "loss": 2.2328, - "step": 447640 - }, - { - "epoch": 0.78, - "learning_rate": 1.0967609175598239e-05, - "loss": 2.3665, - "step": 447650 - }, - { - "epoch": 0.78, - "learning_rate": 1.0966737235671413e-05, - "loss": 2.3321, - "step": 447660 - }, - { - "epoch": 0.78, - "learning_rate": 1.0965865295744585e-05, - "loss": 2.2465, - "step": 447670 - }, - { - "epoch": 0.78, - "learning_rate": 1.0964993355817758e-05, - "loss": 2.3034, - "step": 447680 - }, - { - "epoch": 0.78, - "learning_rate": 1.096412141589093e-05, - "loss": 2.2495, - "step": 447690 - }, - { - "epoch": 0.78, - "learning_rate": 1.0963249475964104e-05, - "loss": 2.3279, - "step": 447700 - }, - { - "epoch": 0.78, - "learning_rate": 1.0962377536037276e-05, - "loss": 2.153, - "step": 447710 - }, - { - "epoch": 0.78, - "learning_rate": 1.0961505596110452e-05, - "loss": 2.3023, - "step": 447720 - }, - { - "epoch": 0.78, - "learning_rate": 1.0960633656183624e-05, - "loss": 2.4085, - "step": 447730 - }, - { - "epoch": 0.78, - "learning_rate": 1.0959761716256798e-05, - "loss": 2.2664, - "step": 447740 - }, - { - "epoch": 0.78, - "learning_rate": 1.0958889776329971e-05, - "loss": 2.3539, - "step": 447750 - }, - { - "epoch": 0.78, - "learning_rate": 1.0958017836403143e-05, - "loss": 2.2912, - "step": 447760 - }, - { - "epoch": 0.78, - "learning_rate": 1.0957145896476317e-05, - "loss": 2.3172, - "step": 447770 - }, - { - "epoch": 0.78, - "learning_rate": 1.095627395654949e-05, - "loss": 2.1588, - "step": 447780 - }, - { - "epoch": 0.78, - "learning_rate": 1.0955402016622663e-05, - "loss": 2.29, - "step": 447790 - }, - { - "epoch": 0.78, - "learning_rate": 1.0954530076695837e-05, - "loss": 2.2013, - "step": 447800 - }, - { - "epoch": 0.78, - "learning_rate": 1.095365813676901e-05, - "loss": 2.3078, - "step": 447810 - }, - { - "epoch": 0.78, - "learning_rate": 1.0952786196842183e-05, - "loss": 2.3843, - "step": 447820 - }, - { - "epoch": 0.78, - "learning_rate": 1.0951914256915356e-05, - "loss": 2.263, - "step": 447830 - }, - { - "epoch": 0.78, - "learning_rate": 1.0951042316988529e-05, - "loss": 2.3343, - "step": 447840 - }, - { - "epoch": 0.78, - "learning_rate": 1.0950170377061702e-05, - "loss": 2.2634, - "step": 447850 - }, - { - "epoch": 0.78, - "learning_rate": 1.0949298437134874e-05, - "loss": 2.1757, - "step": 447860 - }, - { - "epoch": 0.78, - "learning_rate": 1.0948426497208048e-05, - "loss": 2.2699, - "step": 447870 - }, - { - "epoch": 0.78, - "learning_rate": 1.0947554557281222e-05, - "loss": 2.3486, - "step": 447880 - }, - { - "epoch": 0.78, - "learning_rate": 1.0946682617354396e-05, - "loss": 2.1854, - "step": 447890 - }, - { - "epoch": 0.78, - "learning_rate": 1.094581067742757e-05, - "loss": 2.241, - "step": 447900 - }, - { - "epoch": 0.78, - "learning_rate": 1.0944938737500742e-05, - "loss": 2.1979, - "step": 447910 - }, - { - "epoch": 0.78, - "learning_rate": 1.0944066797573915e-05, - "loss": 2.3076, - "step": 447920 - }, - { - "epoch": 0.78, - "learning_rate": 1.0943194857647087e-05, - "loss": 2.2866, - "step": 447930 - }, - { - "epoch": 0.78, - "learning_rate": 1.0942322917720261e-05, - "loss": 2.3123, - "step": 447940 - }, - { - "epoch": 0.78, - "learning_rate": 1.0941450977793433e-05, - "loss": 2.2125, - "step": 447950 - }, - { - "epoch": 0.78, - "learning_rate": 1.0940579037866607e-05, - "loss": 2.4053, - "step": 447960 - }, - { - "epoch": 0.78, - "learning_rate": 1.093970709793978e-05, - "loss": 2.3394, - "step": 447970 - }, - { - "epoch": 0.78, - "learning_rate": 1.0938835158012955e-05, - "loss": 2.3901, - "step": 447980 - }, - { - "epoch": 0.78, - "learning_rate": 1.0937963218086127e-05, - "loss": 2.312, - "step": 447990 - }, - { - "epoch": 0.78, - "learning_rate": 1.09370912781593e-05, - "loss": 2.3416, - "step": 448000 - }, - { - "epoch": 0.78, - "learning_rate": 1.0936219338232474e-05, - "loss": 2.2258, - "step": 448010 - }, - { - "epoch": 0.78, - "learning_rate": 1.0935347398305646e-05, - "loss": 2.3343, - "step": 448020 - }, - { - "epoch": 0.78, - "learning_rate": 1.093447545837882e-05, - "loss": 2.3504, - "step": 448030 - }, - { - "epoch": 0.78, - "learning_rate": 1.0933603518451994e-05, - "loss": 2.2995, - "step": 448040 - }, - { - "epoch": 0.78, - "learning_rate": 1.0932731578525168e-05, - "loss": 2.3014, - "step": 448050 - }, - { - "epoch": 0.78, - "learning_rate": 1.093185963859834e-05, - "loss": 2.2266, - "step": 448060 - }, - { - "epoch": 0.78, - "learning_rate": 1.0930987698671513e-05, - "loss": 2.3508, - "step": 448070 - }, - { - "epoch": 0.78, - "learning_rate": 1.0930115758744685e-05, - "loss": 2.2831, - "step": 448080 - }, - { - "epoch": 0.78, - "learning_rate": 1.092924381881786e-05, - "loss": 2.2383, - "step": 448090 - }, - { - "epoch": 0.78, - "learning_rate": 1.0928371878891031e-05, - "loss": 2.2214, - "step": 448100 - }, - { - "epoch": 0.78, - "learning_rate": 1.0927499938964205e-05, - "loss": 2.2117, - "step": 448110 - }, - { - "epoch": 0.78, - "learning_rate": 1.0926627999037379e-05, - "loss": 2.1928, - "step": 448120 - }, - { - "epoch": 0.78, - "learning_rate": 1.0925756059110553e-05, - "loss": 2.3885, - "step": 448130 - }, - { - "epoch": 0.78, - "learning_rate": 1.0924884119183726e-05, - "loss": 2.3726, - "step": 448140 - }, - { - "epoch": 0.78, - "learning_rate": 1.0924012179256898e-05, - "loss": 2.2789, - "step": 448150 - }, - { - "epoch": 0.78, - "learning_rate": 1.0923140239330072e-05, - "loss": 2.3413, - "step": 448160 - }, - { - "epoch": 0.78, - "learning_rate": 1.0922268299403244e-05, - "loss": 2.2719, - "step": 448170 - }, - { - "epoch": 0.78, - "learning_rate": 1.0921396359476418e-05, - "loss": 2.254, - "step": 448180 - }, - { - "epoch": 0.78, - "learning_rate": 1.092052441954959e-05, - "loss": 2.3938, - "step": 448190 - }, - { - "epoch": 0.78, - "learning_rate": 1.0919652479622764e-05, - "loss": 2.3804, - "step": 448200 - }, - { - "epoch": 0.78, - "learning_rate": 1.0918780539695938e-05, - "loss": 2.3806, - "step": 448210 - }, - { - "epoch": 0.78, - "learning_rate": 1.0917908599769111e-05, - "loss": 2.3337, - "step": 448220 - }, - { - "epoch": 0.78, - "learning_rate": 1.0917036659842284e-05, - "loss": 2.1988, - "step": 448230 - }, - { - "epoch": 0.78, - "learning_rate": 1.0916164719915457e-05, - "loss": 2.2141, - "step": 448240 - }, - { - "epoch": 0.78, - "learning_rate": 1.091529277998863e-05, - "loss": 2.3316, - "step": 448250 - }, - { - "epoch": 0.78, - "learning_rate": 1.0914420840061803e-05, - "loss": 2.269, - "step": 448260 - }, - { - "epoch": 0.78, - "learning_rate": 1.0913548900134977e-05, - "loss": 2.3499, - "step": 448270 - }, - { - "epoch": 0.78, - "learning_rate": 1.091267696020815e-05, - "loss": 2.333, - "step": 448280 - }, - { - "epoch": 0.78, - "learning_rate": 1.0911805020281324e-05, - "loss": 2.273, - "step": 448290 - }, - { - "epoch": 0.78, - "learning_rate": 1.0910933080354497e-05, - "loss": 2.3449, - "step": 448300 - }, - { - "epoch": 0.78, - "learning_rate": 1.091006114042767e-05, - "loss": 2.2618, - "step": 448310 - }, - { - "epoch": 0.78, - "learning_rate": 1.0909189200500842e-05, - "loss": 2.3276, - "step": 448320 - }, - { - "epoch": 0.78, - "learning_rate": 1.0908317260574016e-05, - "loss": 2.3009, - "step": 448330 - }, - { - "epoch": 0.78, - "learning_rate": 1.0907445320647188e-05, - "loss": 2.4322, - "step": 448340 - }, - { - "epoch": 0.78, - "learning_rate": 1.0906573380720362e-05, - "loss": 2.3093, - "step": 448350 - }, - { - "epoch": 0.78, - "learning_rate": 1.0905701440793536e-05, - "loss": 2.3618, - "step": 448360 - }, - { - "epoch": 0.78, - "learning_rate": 1.090482950086671e-05, - "loss": 2.2381, - "step": 448370 - }, - { - "epoch": 0.78, - "learning_rate": 1.0903957560939882e-05, - "loss": 2.298, - "step": 448380 - }, - { - "epoch": 0.78, - "learning_rate": 1.0903085621013055e-05, - "loss": 2.3223, - "step": 448390 - }, - { - "epoch": 0.78, - "learning_rate": 1.090221368108623e-05, - "loss": 2.2489, - "step": 448400 - }, - { - "epoch": 0.78, - "learning_rate": 1.0901341741159401e-05, - "loss": 2.3532, - "step": 448410 - }, - { - "epoch": 0.78, - "learning_rate": 1.0900469801232575e-05, - "loss": 2.3726, - "step": 448420 - }, - { - "epoch": 0.78, - "learning_rate": 1.0899597861305747e-05, - "loss": 2.3058, - "step": 448430 - }, - { - "epoch": 0.78, - "learning_rate": 1.0898725921378921e-05, - "loss": 2.3509, - "step": 448440 - }, - { - "epoch": 0.78, - "learning_rate": 1.0897853981452095e-05, - "loss": 2.2069, - "step": 448450 - }, - { - "epoch": 0.78, - "learning_rate": 1.0896982041525268e-05, - "loss": 2.3641, - "step": 448460 - }, - { - "epoch": 0.78, - "learning_rate": 1.089611010159844e-05, - "loss": 2.2752, - "step": 448470 - }, - { - "epoch": 0.78, - "learning_rate": 1.0895238161671614e-05, - "loss": 2.283, - "step": 448480 - }, - { - "epoch": 0.78, - "learning_rate": 1.0894366221744786e-05, - "loss": 2.2041, - "step": 448490 - }, - { - "epoch": 0.78, - "learning_rate": 1.089349428181796e-05, - "loss": 2.1738, - "step": 448500 - }, - { - "epoch": 0.78, - "learning_rate": 1.0892622341891132e-05, - "loss": 2.231, - "step": 448510 - }, - { - "epoch": 0.78, - "learning_rate": 1.0891750401964308e-05, - "loss": 2.2712, - "step": 448520 - }, - { - "epoch": 0.78, - "learning_rate": 1.089087846203748e-05, - "loss": 2.301, - "step": 448530 - }, - { - "epoch": 0.78, - "learning_rate": 1.0890006522110653e-05, - "loss": 2.3201, - "step": 448540 - }, - { - "epoch": 0.78, - "learning_rate": 1.0889134582183827e-05, - "loss": 2.3108, - "step": 448550 - }, - { - "epoch": 0.78, - "learning_rate": 1.0888262642257e-05, - "loss": 2.214, - "step": 448560 - }, - { - "epoch": 0.78, - "learning_rate": 1.0887390702330173e-05, - "loss": 2.2519, - "step": 448570 - }, - { - "epoch": 0.78, - "learning_rate": 1.0886518762403345e-05, - "loss": 2.2344, - "step": 448580 - }, - { - "epoch": 0.78, - "learning_rate": 1.0885646822476519e-05, - "loss": 2.2845, - "step": 448590 - }, - { - "epoch": 0.78, - "learning_rate": 1.0884774882549693e-05, - "loss": 2.3209, - "step": 448600 - }, - { - "epoch": 0.78, - "learning_rate": 1.0883902942622866e-05, - "loss": 2.2117, - "step": 448610 - }, - { - "epoch": 0.78, - "learning_rate": 1.0883031002696039e-05, - "loss": 2.332, - "step": 448620 - }, - { - "epoch": 0.78, - "learning_rate": 1.0882159062769212e-05, - "loss": 2.2885, - "step": 448630 - }, - { - "epoch": 0.78, - "learning_rate": 1.0881287122842384e-05, - "loss": 2.4049, - "step": 448640 - }, - { - "epoch": 0.78, - "learning_rate": 1.0880415182915558e-05, - "loss": 2.2754, - "step": 448650 - }, - { - "epoch": 0.78, - "learning_rate": 1.087954324298873e-05, - "loss": 2.2095, - "step": 448660 - }, - { - "epoch": 0.78, - "learning_rate": 1.0878671303061904e-05, - "loss": 2.3389, - "step": 448670 - }, - { - "epoch": 0.78, - "learning_rate": 1.0877799363135078e-05, - "loss": 2.3013, - "step": 448680 - }, - { - "epoch": 0.78, - "learning_rate": 1.0876927423208252e-05, - "loss": 2.3097, - "step": 448690 - }, - { - "epoch": 0.78, - "learning_rate": 1.0876055483281425e-05, - "loss": 2.3084, - "step": 448700 - }, - { - "epoch": 0.78, - "learning_rate": 1.0875183543354597e-05, - "loss": 2.1587, - "step": 448710 - }, - { - "epoch": 0.78, - "learning_rate": 1.0874311603427771e-05, - "loss": 2.2526, - "step": 448720 - }, - { - "epoch": 0.78, - "learning_rate": 1.0873439663500943e-05, - "loss": 2.3235, - "step": 448730 - }, - { - "epoch": 0.78, - "learning_rate": 1.0872567723574117e-05, - "loss": 2.1592, - "step": 448740 - }, - { - "epoch": 0.78, - "learning_rate": 1.0871695783647289e-05, - "loss": 2.265, - "step": 448750 - }, - { - "epoch": 0.78, - "learning_rate": 1.0870823843720465e-05, - "loss": 2.3007, - "step": 448760 - }, - { - "epoch": 0.78, - "learning_rate": 1.0869951903793637e-05, - "loss": 2.2539, - "step": 448770 - }, - { - "epoch": 0.78, - "learning_rate": 1.086907996386681e-05, - "loss": 2.2202, - "step": 448780 - }, - { - "epoch": 0.78, - "learning_rate": 1.0868208023939982e-05, - "loss": 2.3093, - "step": 448790 - }, - { - "epoch": 0.78, - "learning_rate": 1.0867336084013156e-05, - "loss": 2.3515, - "step": 448800 - }, - { - "epoch": 0.78, - "learning_rate": 1.086646414408633e-05, - "loss": 2.2852, - "step": 448810 - }, - { - "epoch": 0.78, - "learning_rate": 1.0865592204159502e-05, - "loss": 2.3158, - "step": 448820 - }, - { - "epoch": 0.78, - "learning_rate": 1.0864720264232676e-05, - "loss": 2.2456, - "step": 448830 - }, - { - "epoch": 0.78, - "learning_rate": 1.086384832430585e-05, - "loss": 2.2556, - "step": 448840 - }, - { - "epoch": 0.78, - "learning_rate": 1.0862976384379023e-05, - "loss": 2.2917, - "step": 448850 - }, - { - "epoch": 0.78, - "learning_rate": 1.0862104444452195e-05, - "loss": 2.1712, - "step": 448860 - }, - { - "epoch": 0.78, - "learning_rate": 1.086123250452537e-05, - "loss": 2.174, - "step": 448870 - }, - { - "epoch": 0.78, - "learning_rate": 1.0860360564598541e-05, - "loss": 2.3618, - "step": 448880 - }, - { - "epoch": 0.78, - "learning_rate": 1.0859488624671715e-05, - "loss": 2.2951, - "step": 448890 - }, - { - "epoch": 0.78, - "learning_rate": 1.0858616684744887e-05, - "loss": 2.1882, - "step": 448900 - }, - { - "epoch": 0.78, - "learning_rate": 1.0857744744818061e-05, - "loss": 2.2281, - "step": 448910 - }, - { - "epoch": 0.78, - "learning_rate": 1.0856872804891235e-05, - "loss": 2.3293, - "step": 448920 - }, - { - "epoch": 0.78, - "learning_rate": 1.0856000864964408e-05, - "loss": 2.3897, - "step": 448930 - }, - { - "epoch": 0.78, - "learning_rate": 1.0855128925037582e-05, - "loss": 2.2934, - "step": 448940 - }, - { - "epoch": 0.78, - "learning_rate": 1.0854256985110754e-05, - "loss": 2.4413, - "step": 448950 - }, - { - "epoch": 0.78, - "learning_rate": 1.0853385045183928e-05, - "loss": 2.2849, - "step": 448960 - }, - { - "epoch": 0.78, - "learning_rate": 1.08525131052571e-05, - "loss": 2.3869, - "step": 448970 - }, - { - "epoch": 0.78, - "learning_rate": 1.0851641165330274e-05, - "loss": 2.3043, - "step": 448980 - }, - { - "epoch": 0.78, - "learning_rate": 1.0850769225403446e-05, - "loss": 2.218, - "step": 448990 - }, - { - "epoch": 0.78, - "learning_rate": 1.0849897285476621e-05, - "loss": 2.2313, - "step": 449000 - }, - { - "epoch": 0.78, - "learning_rate": 1.0849025345549794e-05, - "loss": 2.2683, - "step": 449010 - }, - { - "epoch": 0.78, - "learning_rate": 1.0848153405622967e-05, - "loss": 2.3161, - "step": 449020 - }, - { - "epoch": 0.78, - "learning_rate": 1.084728146569614e-05, - "loss": 2.3097, - "step": 449030 - }, - { - "epoch": 0.78, - "learning_rate": 1.0846409525769313e-05, - "loss": 2.2864, - "step": 449040 - }, - { - "epoch": 0.78, - "learning_rate": 1.0845537585842485e-05, - "loss": 2.2166, - "step": 449050 - }, - { - "epoch": 0.78, - "learning_rate": 1.0844665645915659e-05, - "loss": 2.2431, - "step": 449060 - }, - { - "epoch": 0.78, - "learning_rate": 1.0843793705988833e-05, - "loss": 2.2889, - "step": 449070 - }, - { - "epoch": 0.78, - "learning_rate": 1.0842921766062007e-05, - "loss": 2.2386, - "step": 449080 - }, - { - "epoch": 0.78, - "learning_rate": 1.084204982613518e-05, - "loss": 2.309, - "step": 449090 - }, - { - "epoch": 0.78, - "learning_rate": 1.0841177886208352e-05, - "loss": 2.2211, - "step": 449100 - }, - { - "epoch": 0.78, - "learning_rate": 1.0840305946281526e-05, - "loss": 2.3847, - "step": 449110 - }, - { - "epoch": 0.78, - "learning_rate": 1.0839434006354698e-05, - "loss": 2.368, - "step": 449120 - }, - { - "epoch": 0.78, - "learning_rate": 1.0838562066427872e-05, - "loss": 2.2543, - "step": 449130 - }, - { - "epoch": 0.78, - "learning_rate": 1.0837690126501044e-05, - "loss": 2.1969, - "step": 449140 - }, - { - "epoch": 0.78, - "learning_rate": 1.0836818186574218e-05, - "loss": 2.3512, - "step": 449150 - }, - { - "epoch": 0.78, - "learning_rate": 1.0835946246647392e-05, - "loss": 2.2207, - "step": 449160 - }, - { - "epoch": 0.78, - "learning_rate": 1.0835074306720565e-05, - "loss": 2.2446, - "step": 449170 - }, - { - "epoch": 0.78, - "learning_rate": 1.0834202366793737e-05, - "loss": 2.2618, - "step": 449180 - }, - { - "epoch": 0.78, - "learning_rate": 1.0833330426866911e-05, - "loss": 2.3821, - "step": 449190 - }, - { - "epoch": 0.78, - "learning_rate": 1.0832458486940085e-05, - "loss": 2.2228, - "step": 449200 - }, - { - "epoch": 0.78, - "learning_rate": 1.0831586547013257e-05, - "loss": 2.3172, - "step": 449210 - }, - { - "epoch": 0.78, - "learning_rate": 1.0830714607086431e-05, - "loss": 2.3321, - "step": 449220 - }, - { - "epoch": 0.78, - "learning_rate": 1.0829842667159603e-05, - "loss": 2.3625, - "step": 449230 - }, - { - "epoch": 0.78, - "learning_rate": 1.0828970727232777e-05, - "loss": 2.2753, - "step": 449240 - }, - { - "epoch": 0.78, - "learning_rate": 1.082809878730595e-05, - "loss": 2.2643, - "step": 449250 - }, - { - "epoch": 0.78, - "learning_rate": 1.0827226847379124e-05, - "loss": 2.3571, - "step": 449260 - }, - { - "epoch": 0.78, - "learning_rate": 1.0826354907452296e-05, - "loss": 2.2732, - "step": 449270 - }, - { - "epoch": 0.78, - "learning_rate": 1.082548296752547e-05, - "loss": 2.327, - "step": 449280 - }, - { - "epoch": 0.78, - "learning_rate": 1.0824611027598642e-05, - "loss": 2.2776, - "step": 449290 - }, - { - "epoch": 0.78, - "learning_rate": 1.0823739087671816e-05, - "loss": 2.321, - "step": 449300 - }, - { - "epoch": 0.78, - "learning_rate": 1.082286714774499e-05, - "loss": 2.3378, - "step": 449310 - }, - { - "epoch": 0.78, - "learning_rate": 1.0821995207818164e-05, - "loss": 2.3567, - "step": 449320 - }, - { - "epoch": 0.78, - "learning_rate": 1.0821123267891337e-05, - "loss": 2.258, - "step": 449330 - }, - { - "epoch": 0.78, - "learning_rate": 1.082025132796451e-05, - "loss": 2.3548, - "step": 449340 - }, - { - "epoch": 0.78, - "learning_rate": 1.0819379388037683e-05, - "loss": 2.3303, - "step": 449350 - }, - { - "epoch": 0.78, - "learning_rate": 1.0818507448110855e-05, - "loss": 2.2754, - "step": 449360 - }, - { - "epoch": 0.78, - "learning_rate": 1.0817635508184029e-05, - "loss": 2.2137, - "step": 449370 - }, - { - "epoch": 0.78, - "learning_rate": 1.0816763568257201e-05, - "loss": 2.2348, - "step": 449380 - }, - { - "epoch": 0.78, - "learning_rate": 1.0815891628330375e-05, - "loss": 2.4426, - "step": 449390 - }, - { - "epoch": 0.78, - "learning_rate": 1.0815019688403549e-05, - "loss": 2.2729, - "step": 449400 - }, - { - "epoch": 0.78, - "learning_rate": 1.0814147748476722e-05, - "loss": 2.2749, - "step": 449410 - }, - { - "epoch": 0.78, - "learning_rate": 1.0813275808549894e-05, - "loss": 2.3461, - "step": 449420 - }, - { - "epoch": 0.78, - "learning_rate": 1.0812403868623068e-05, - "loss": 2.3582, - "step": 449430 - }, - { - "epoch": 0.78, - "learning_rate": 1.081153192869624e-05, - "loss": 2.3003, - "step": 449440 - }, - { - "epoch": 0.78, - "learning_rate": 1.0810659988769414e-05, - "loss": 2.3169, - "step": 449450 - }, - { - "epoch": 0.78, - "learning_rate": 1.0809788048842586e-05, - "loss": 2.2189, - "step": 449460 - }, - { - "epoch": 0.78, - "learning_rate": 1.080891610891576e-05, - "loss": 2.3281, - "step": 449470 - }, - { - "epoch": 0.78, - "learning_rate": 1.0808044168988934e-05, - "loss": 2.3016, - "step": 449480 - }, - { - "epoch": 0.78, - "learning_rate": 1.0807172229062107e-05, - "loss": 2.2522, - "step": 449490 - }, - { - "epoch": 0.78, - "learning_rate": 1.0806300289135281e-05, - "loss": 2.1331, - "step": 449500 - }, - { - "epoch": 0.78, - "learning_rate": 1.0805428349208453e-05, - "loss": 2.3617, - "step": 449510 - }, - { - "epoch": 0.78, - "learning_rate": 1.0804556409281627e-05, - "loss": 2.1801, - "step": 449520 - }, - { - "epoch": 0.78, - "learning_rate": 1.0803684469354799e-05, - "loss": 2.3151, - "step": 449530 - }, - { - "epoch": 0.78, - "learning_rate": 1.0802812529427973e-05, - "loss": 2.3262, - "step": 449540 - }, - { - "epoch": 0.78, - "learning_rate": 1.0801940589501145e-05, - "loss": 2.2605, - "step": 449550 - }, - { - "epoch": 0.78, - "learning_rate": 1.080106864957432e-05, - "loss": 2.3488, - "step": 449560 - }, - { - "epoch": 0.78, - "learning_rate": 1.0800196709647493e-05, - "loss": 2.3618, - "step": 449570 - }, - { - "epoch": 0.78, - "learning_rate": 1.0799324769720666e-05, - "loss": 2.2361, - "step": 449580 - }, - { - "epoch": 0.78, - "learning_rate": 1.0798452829793838e-05, - "loss": 2.2158, - "step": 449590 - }, - { - "epoch": 0.78, - "learning_rate": 1.0797580889867012e-05, - "loss": 2.2754, - "step": 449600 - }, - { - "epoch": 0.78, - "learning_rate": 1.0796708949940186e-05, - "loss": 2.1509, - "step": 449610 - }, - { - "epoch": 0.78, - "learning_rate": 1.0795837010013358e-05, - "loss": 2.39, - "step": 449620 - }, - { - "epoch": 0.78, - "learning_rate": 1.0794965070086532e-05, - "loss": 2.3359, - "step": 449630 - }, - { - "epoch": 0.78, - "learning_rate": 1.0794093130159706e-05, - "loss": 2.3593, - "step": 449640 - }, - { - "epoch": 0.78, - "learning_rate": 1.079322119023288e-05, - "loss": 2.3454, - "step": 449650 - }, - { - "epoch": 0.78, - "learning_rate": 1.0792349250306051e-05, - "loss": 2.2673, - "step": 449660 - }, - { - "epoch": 0.78, - "learning_rate": 1.0791477310379225e-05, - "loss": 2.2401, - "step": 449670 - }, - { - "epoch": 0.78, - "learning_rate": 1.0790605370452397e-05, - "loss": 2.2842, - "step": 449680 - }, - { - "epoch": 0.78, - "learning_rate": 1.0789733430525571e-05, - "loss": 2.2947, - "step": 449690 - }, - { - "epoch": 0.78, - "learning_rate": 1.0788861490598743e-05, - "loss": 2.2988, - "step": 449700 - }, - { - "epoch": 0.78, - "learning_rate": 1.0787989550671917e-05, - "loss": 2.3312, - "step": 449710 - }, - { - "epoch": 0.78, - "learning_rate": 1.078711761074509e-05, - "loss": 2.2716, - "step": 449720 - }, - { - "epoch": 0.78, - "learning_rate": 1.0786245670818264e-05, - "loss": 2.3822, - "step": 449730 - }, - { - "epoch": 0.78, - "learning_rate": 1.0785373730891438e-05, - "loss": 2.3064, - "step": 449740 - }, - { - "epoch": 0.78, - "learning_rate": 1.078450179096461e-05, - "loss": 2.2458, - "step": 449750 - }, - { - "epoch": 0.78, - "learning_rate": 1.0783629851037784e-05, - "loss": 2.4669, - "step": 449760 - }, - { - "epoch": 0.78, - "learning_rate": 1.0782757911110956e-05, - "loss": 2.3021, - "step": 449770 - }, - { - "epoch": 0.78, - "learning_rate": 1.078188597118413e-05, - "loss": 2.3231, - "step": 449780 - }, - { - "epoch": 0.78, - "learning_rate": 1.0781014031257302e-05, - "loss": 2.3044, - "step": 449790 - }, - { - "epoch": 0.78, - "learning_rate": 1.0780142091330477e-05, - "loss": 2.2474, - "step": 449800 - }, - { - "epoch": 0.78, - "learning_rate": 1.077927015140365e-05, - "loss": 2.3739, - "step": 449810 - }, - { - "epoch": 0.78, - "learning_rate": 1.0778398211476823e-05, - "loss": 2.3696, - "step": 449820 - }, - { - "epoch": 0.78, - "learning_rate": 1.0777526271549995e-05, - "loss": 2.2697, - "step": 449830 - }, - { - "epoch": 0.78, - "learning_rate": 1.0776654331623169e-05, - "loss": 2.3265, - "step": 449840 - }, - { - "epoch": 0.78, - "learning_rate": 1.0775782391696341e-05, - "loss": 2.2406, - "step": 449850 - }, - { - "epoch": 0.78, - "learning_rate": 1.0774910451769515e-05, - "loss": 2.2847, - "step": 449860 - }, - { - "epoch": 0.78, - "learning_rate": 1.0774038511842689e-05, - "loss": 2.3965, - "step": 449870 - }, - { - "epoch": 0.78, - "learning_rate": 1.0773166571915862e-05, - "loss": 2.3005, - "step": 449880 - }, - { - "epoch": 0.78, - "learning_rate": 1.0772294631989036e-05, - "loss": 2.3411, - "step": 449890 - }, - { - "epoch": 0.78, - "learning_rate": 1.0771422692062208e-05, - "loss": 2.3527, - "step": 449900 - }, - { - "epoch": 0.78, - "learning_rate": 1.0770550752135382e-05, - "loss": 2.371, - "step": 449910 - }, - { - "epoch": 0.78, - "learning_rate": 1.0769678812208554e-05, - "loss": 2.3902, - "step": 449920 - }, - { - "epoch": 0.78, - "learning_rate": 1.0768806872281728e-05, - "loss": 2.3924, - "step": 449930 - }, - { - "epoch": 0.78, - "learning_rate": 1.07679349323549e-05, - "loss": 2.2465, - "step": 449940 - }, - { - "epoch": 0.78, - "learning_rate": 1.0767062992428074e-05, - "loss": 2.4209, - "step": 449950 - }, - { - "epoch": 0.78, - "learning_rate": 1.0766191052501248e-05, - "loss": 2.2868, - "step": 449960 - }, - { - "epoch": 0.78, - "learning_rate": 1.0765319112574421e-05, - "loss": 2.2233, - "step": 449970 - }, - { - "epoch": 0.78, - "learning_rate": 1.0764447172647593e-05, - "loss": 2.294, - "step": 449980 - }, - { - "epoch": 0.78, - "learning_rate": 1.0763575232720767e-05, - "loss": 2.2497, - "step": 449990 - }, - { - "epoch": 0.78, - "learning_rate": 1.0762703292793941e-05, - "loss": 2.2802, - "step": 450000 - }, - { - "epoch": 0.78, - "learning_rate": 1.0761831352867113e-05, - "loss": 2.3855, - "step": 450010 - }, - { - "epoch": 0.78, - "learning_rate": 1.0760959412940287e-05, - "loss": 2.2662, - "step": 450020 - }, - { - "epoch": 0.78, - "learning_rate": 1.0760087473013459e-05, - "loss": 2.3497, - "step": 450030 - }, - { - "epoch": 0.78, - "learning_rate": 1.0759215533086634e-05, - "loss": 2.2592, - "step": 450040 - }, - { - "epoch": 0.78, - "learning_rate": 1.0758343593159806e-05, - "loss": 2.284, - "step": 450050 - }, - { - "epoch": 0.78, - "learning_rate": 1.075747165323298e-05, - "loss": 2.3896, - "step": 450060 - }, - { - "epoch": 0.78, - "learning_rate": 1.0756599713306152e-05, - "loss": 2.2608, - "step": 450070 - }, - { - "epoch": 0.78, - "learning_rate": 1.0755727773379326e-05, - "loss": 2.2361, - "step": 450080 - }, - { - "epoch": 0.78, - "learning_rate": 1.0754855833452498e-05, - "loss": 2.1684, - "step": 450090 - }, - { - "epoch": 0.78, - "learning_rate": 1.0753983893525672e-05, - "loss": 2.2717, - "step": 450100 - }, - { - "epoch": 0.78, - "learning_rate": 1.0753111953598846e-05, - "loss": 2.3537, - "step": 450110 - }, - { - "epoch": 0.78, - "learning_rate": 1.075224001367202e-05, - "loss": 2.2698, - "step": 450120 - }, - { - "epoch": 0.78, - "learning_rate": 1.0751368073745193e-05, - "loss": 2.3842, - "step": 450130 - }, - { - "epoch": 0.78, - "learning_rate": 1.0750496133818365e-05, - "loss": 2.198, - "step": 450140 - }, - { - "epoch": 0.79, - "learning_rate": 1.0749624193891539e-05, - "loss": 2.346, - "step": 450150 - }, - { - "epoch": 0.79, - "learning_rate": 1.0748752253964711e-05, - "loss": 2.3203, - "step": 450160 - }, - { - "epoch": 0.79, - "learning_rate": 1.0747880314037885e-05, - "loss": 2.2108, - "step": 450170 - }, - { - "epoch": 0.79, - "learning_rate": 1.0747008374111057e-05, - "loss": 2.2306, - "step": 450180 - }, - { - "epoch": 0.79, - "learning_rate": 1.074613643418423e-05, - "loss": 2.2754, - "step": 450190 - }, - { - "epoch": 0.79, - "learning_rate": 1.0745264494257404e-05, - "loss": 2.1815, - "step": 450200 - }, - { - "epoch": 0.79, - "learning_rate": 1.0744392554330578e-05, - "loss": 2.2219, - "step": 450210 - }, - { - "epoch": 0.79, - "learning_rate": 1.074352061440375e-05, - "loss": 2.3242, - "step": 450220 - }, - { - "epoch": 0.79, - "learning_rate": 1.0742648674476924e-05, - "loss": 2.2676, - "step": 450230 - }, - { - "epoch": 0.79, - "learning_rate": 1.0741776734550096e-05, - "loss": 2.2477, - "step": 450240 - }, - { - "epoch": 0.79, - "learning_rate": 1.074090479462327e-05, - "loss": 2.3049, - "step": 450250 - }, - { - "epoch": 0.79, - "learning_rate": 1.0740032854696442e-05, - "loss": 2.3957, - "step": 450260 - }, - { - "epoch": 0.79, - "learning_rate": 1.0739160914769616e-05, - "loss": 2.2668, - "step": 450270 - }, - { - "epoch": 0.79, - "learning_rate": 1.073828897484279e-05, - "loss": 2.3204, - "step": 450280 - }, - { - "epoch": 0.79, - "learning_rate": 1.0737417034915963e-05, - "loss": 2.1676, - "step": 450290 - }, - { - "epoch": 0.79, - "learning_rate": 1.0736545094989137e-05, - "loss": 2.1814, - "step": 450300 - }, - { - "epoch": 0.79, - "learning_rate": 1.0735673155062309e-05, - "loss": 2.3295, - "step": 450310 - }, - { - "epoch": 0.79, - "learning_rate": 1.0734801215135483e-05, - "loss": 2.2568, - "step": 450320 - }, - { - "epoch": 0.79, - "learning_rate": 1.0733929275208655e-05, - "loss": 2.2412, - "step": 450330 - }, - { - "epoch": 0.79, - "learning_rate": 1.0733057335281829e-05, - "loss": 2.2534, - "step": 450340 - }, - { - "epoch": 0.79, - "learning_rate": 1.0732185395355003e-05, - "loss": 2.2497, - "step": 450350 - }, - { - "epoch": 0.79, - "learning_rate": 1.0731313455428176e-05, - "loss": 2.2187, - "step": 450360 - }, - { - "epoch": 0.79, - "learning_rate": 1.0730441515501348e-05, - "loss": 2.1791, - "step": 450370 - }, - { - "epoch": 0.79, - "learning_rate": 1.0729569575574522e-05, - "loss": 2.2016, - "step": 450380 - }, - { - "epoch": 0.79, - "learning_rate": 1.0728697635647694e-05, - "loss": 2.2771, - "step": 450390 - }, - { - "epoch": 0.79, - "learning_rate": 1.0727825695720868e-05, - "loss": 2.4166, - "step": 450400 - }, - { - "epoch": 0.79, - "learning_rate": 1.0726953755794042e-05, - "loss": 2.3865, - "step": 450410 - }, - { - "epoch": 0.79, - "learning_rate": 1.0726081815867214e-05, - "loss": 2.2444, - "step": 450420 - }, - { - "epoch": 0.79, - "learning_rate": 1.0725209875940388e-05, - "loss": 2.2878, - "step": 450430 - }, - { - "epoch": 0.79, - "learning_rate": 1.0724337936013561e-05, - "loss": 2.3997, - "step": 450440 - }, - { - "epoch": 0.79, - "learning_rate": 1.0723465996086735e-05, - "loss": 2.2708, - "step": 450450 - }, - { - "epoch": 0.79, - "learning_rate": 1.0722594056159907e-05, - "loss": 2.3768, - "step": 450460 - }, - { - "epoch": 0.79, - "learning_rate": 1.0721722116233081e-05, - "loss": 2.2351, - "step": 450470 - }, - { - "epoch": 0.79, - "learning_rate": 1.0720850176306253e-05, - "loss": 2.3214, - "step": 450480 - }, - { - "epoch": 0.79, - "learning_rate": 1.0719978236379427e-05, - "loss": 2.1862, - "step": 450490 - }, - { - "epoch": 0.79, - "learning_rate": 1.0719106296452599e-05, - "loss": 2.1891, - "step": 450500 - }, - { - "epoch": 0.79, - "learning_rate": 1.0718234356525773e-05, - "loss": 2.3988, - "step": 450510 - }, - { - "epoch": 0.79, - "learning_rate": 1.0717362416598946e-05, - "loss": 2.2365, - "step": 450520 - }, - { - "epoch": 0.79, - "learning_rate": 1.071649047667212e-05, - "loss": 2.3106, - "step": 450530 - }, - { - "epoch": 0.79, - "learning_rate": 1.0715618536745294e-05, - "loss": 2.3045, - "step": 450540 - }, - { - "epoch": 0.79, - "learning_rate": 1.0714746596818466e-05, - "loss": 2.2453, - "step": 450550 - }, - { - "epoch": 0.79, - "learning_rate": 1.071387465689164e-05, - "loss": 2.2847, - "step": 450560 - }, - { - "epoch": 0.79, - "learning_rate": 1.0713002716964812e-05, - "loss": 2.2715, - "step": 450570 - }, - { - "epoch": 0.79, - "learning_rate": 1.0712130777037986e-05, - "loss": 2.2767, - "step": 450580 - }, - { - "epoch": 0.79, - "learning_rate": 1.0711258837111158e-05, - "loss": 2.2663, - "step": 450590 - }, - { - "epoch": 0.79, - "learning_rate": 1.0710386897184333e-05, - "loss": 2.2989, - "step": 450600 - }, - { - "epoch": 0.79, - "learning_rate": 1.0709514957257505e-05, - "loss": 2.331, - "step": 450610 - }, - { - "epoch": 0.79, - "learning_rate": 1.0708643017330679e-05, - "loss": 2.3558, - "step": 450620 - }, - { - "epoch": 0.79, - "learning_rate": 1.0707771077403851e-05, - "loss": 2.1973, - "step": 450630 - }, - { - "epoch": 0.79, - "learning_rate": 1.0706899137477025e-05, - "loss": 2.3248, - "step": 450640 - }, - { - "epoch": 0.79, - "learning_rate": 1.0706027197550197e-05, - "loss": 2.3293, - "step": 450650 - }, - { - "epoch": 0.79, - "learning_rate": 1.070515525762337e-05, - "loss": 2.3976, - "step": 450660 - }, - { - "epoch": 0.79, - "learning_rate": 1.0704283317696545e-05, - "loss": 2.3094, - "step": 450670 - }, - { - "epoch": 0.79, - "learning_rate": 1.0703411377769718e-05, - "loss": 2.3532, - "step": 450680 - }, - { - "epoch": 0.79, - "learning_rate": 1.0702539437842892e-05, - "loss": 2.3697, - "step": 450690 - }, - { - "epoch": 0.79, - "learning_rate": 1.0701667497916064e-05, - "loss": 2.4347, - "step": 450700 - }, - { - "epoch": 0.79, - "learning_rate": 1.0700795557989238e-05, - "loss": 2.3374, - "step": 450710 - }, - { - "epoch": 0.79, - "learning_rate": 1.069992361806241e-05, - "loss": 2.2787, - "step": 450720 - }, - { - "epoch": 0.79, - "learning_rate": 1.0699051678135584e-05, - "loss": 2.323, - "step": 450730 - }, - { - "epoch": 0.79, - "learning_rate": 1.0698179738208756e-05, - "loss": 2.3431, - "step": 450740 - }, - { - "epoch": 0.79, - "learning_rate": 1.069730779828193e-05, - "loss": 2.3029, - "step": 450750 - }, - { - "epoch": 0.79, - "learning_rate": 1.0696435858355103e-05, - "loss": 2.3509, - "step": 450760 - }, - { - "epoch": 0.79, - "learning_rate": 1.0695563918428277e-05, - "loss": 2.4273, - "step": 450770 - }, - { - "epoch": 0.79, - "learning_rate": 1.069469197850145e-05, - "loss": 2.2018, - "step": 450780 - }, - { - "epoch": 0.79, - "learning_rate": 1.0693820038574623e-05, - "loss": 2.1855, - "step": 450790 - }, - { - "epoch": 0.79, - "learning_rate": 1.0692948098647797e-05, - "loss": 2.2757, - "step": 450800 - }, - { - "epoch": 0.79, - "learning_rate": 1.0692076158720969e-05, - "loss": 2.2735, - "step": 450810 - }, - { - "epoch": 0.79, - "learning_rate": 1.0691204218794143e-05, - "loss": 2.4053, - "step": 450820 - }, - { - "epoch": 0.79, - "learning_rate": 1.0690332278867315e-05, - "loss": 2.2096, - "step": 450830 - }, - { - "epoch": 0.79, - "learning_rate": 1.068946033894049e-05, - "loss": 2.3292, - "step": 450840 - }, - { - "epoch": 0.79, - "learning_rate": 1.0688588399013662e-05, - "loss": 2.3046, - "step": 450850 - }, - { - "epoch": 0.79, - "learning_rate": 1.0687716459086836e-05, - "loss": 2.2382, - "step": 450860 - }, - { - "epoch": 0.79, - "learning_rate": 1.0686844519160008e-05, - "loss": 2.2304, - "step": 450870 - }, - { - "epoch": 0.79, - "learning_rate": 1.0685972579233182e-05, - "loss": 2.2396, - "step": 450880 - }, - { - "epoch": 0.79, - "learning_rate": 1.0685100639306354e-05, - "loss": 2.2996, - "step": 450890 - }, - { - "epoch": 0.79, - "learning_rate": 1.0684228699379528e-05, - "loss": 2.233, - "step": 450900 - }, - { - "epoch": 0.79, - "learning_rate": 1.0683356759452701e-05, - "loss": 2.3296, - "step": 450910 - }, - { - "epoch": 0.79, - "learning_rate": 1.0682484819525875e-05, - "loss": 2.3448, - "step": 450920 - }, - { - "epoch": 0.79, - "learning_rate": 1.0681612879599049e-05, - "loss": 2.2208, - "step": 450930 - }, - { - "epoch": 0.79, - "learning_rate": 1.0680740939672221e-05, - "loss": 2.326, - "step": 450940 - }, - { - "epoch": 0.79, - "learning_rate": 1.0679868999745395e-05, - "loss": 2.3926, - "step": 450950 - }, - { - "epoch": 0.79, - "learning_rate": 1.0678997059818567e-05, - "loss": 2.1418, - "step": 450960 - }, - { - "epoch": 0.79, - "learning_rate": 1.067812511989174e-05, - "loss": 2.3779, - "step": 450970 - }, - { - "epoch": 0.79, - "learning_rate": 1.0677253179964913e-05, - "loss": 2.307, - "step": 450980 - }, - { - "epoch": 0.79, - "learning_rate": 1.0676381240038087e-05, - "loss": 2.2993, - "step": 450990 - }, - { - "epoch": 0.79, - "learning_rate": 1.067550930011126e-05, - "loss": 2.2492, - "step": 451000 - }, - { - "epoch": 0.79, - "learning_rate": 1.0674637360184434e-05, - "loss": 2.2619, - "step": 451010 - }, - { - "epoch": 0.79, - "learning_rate": 1.0673765420257606e-05, - "loss": 2.3215, - "step": 451020 - }, - { - "epoch": 0.79, - "learning_rate": 1.067289348033078e-05, - "loss": 2.3279, - "step": 451030 - }, - { - "epoch": 0.79, - "learning_rate": 1.0672021540403952e-05, - "loss": 2.2973, - "step": 451040 - }, - { - "epoch": 0.79, - "learning_rate": 1.0671149600477126e-05, - "loss": 2.3695, - "step": 451050 - }, - { - "epoch": 0.79, - "learning_rate": 1.06702776605503e-05, - "loss": 2.367, - "step": 451060 - }, - { - "epoch": 0.79, - "learning_rate": 1.0669405720623472e-05, - "loss": 2.282, - "step": 451070 - }, - { - "epoch": 0.79, - "learning_rate": 1.0668533780696647e-05, - "loss": 2.4045, - "step": 451080 - }, - { - "epoch": 0.79, - "learning_rate": 1.0667661840769819e-05, - "loss": 2.2837, - "step": 451090 - }, - { - "epoch": 0.79, - "learning_rate": 1.0666789900842993e-05, - "loss": 2.2095, - "step": 451100 - }, - { - "epoch": 0.79, - "learning_rate": 1.0665917960916165e-05, - "loss": 2.3161, - "step": 451110 - }, - { - "epoch": 0.79, - "learning_rate": 1.0665046020989339e-05, - "loss": 2.2393, - "step": 451120 - }, - { - "epoch": 0.79, - "learning_rate": 1.066417408106251e-05, - "loss": 2.3892, - "step": 451130 - }, - { - "epoch": 0.79, - "learning_rate": 1.0663302141135685e-05, - "loss": 2.3358, - "step": 451140 - }, - { - "epoch": 0.79, - "learning_rate": 1.0662430201208858e-05, - "loss": 2.2544, - "step": 451150 - }, - { - "epoch": 0.79, - "learning_rate": 1.0661558261282032e-05, - "loss": 2.2247, - "step": 451160 - }, - { - "epoch": 0.79, - "learning_rate": 1.0660686321355204e-05, - "loss": 2.2466, - "step": 451170 - }, - { - "epoch": 0.79, - "learning_rate": 1.0659814381428378e-05, - "loss": 2.199, - "step": 451180 - }, - { - "epoch": 0.79, - "learning_rate": 1.065894244150155e-05, - "loss": 2.2166, - "step": 451190 - }, - { - "epoch": 0.79, - "learning_rate": 1.0658070501574724e-05, - "loss": 2.2486, - "step": 451200 - }, - { - "epoch": 0.79, - "learning_rate": 1.0657198561647898e-05, - "loss": 2.3837, - "step": 451210 - }, - { - "epoch": 0.79, - "learning_rate": 1.065632662172107e-05, - "loss": 2.2161, - "step": 451220 - }, - { - "epoch": 0.79, - "learning_rate": 1.0655454681794243e-05, - "loss": 2.1949, - "step": 451230 - }, - { - "epoch": 0.79, - "learning_rate": 1.0654582741867417e-05, - "loss": 2.3243, - "step": 451240 - }, - { - "epoch": 0.79, - "learning_rate": 1.0653710801940591e-05, - "loss": 2.2487, - "step": 451250 - }, - { - "epoch": 0.79, - "learning_rate": 1.0652838862013763e-05, - "loss": 2.3385, - "step": 451260 - }, - { - "epoch": 0.79, - "learning_rate": 1.0651966922086937e-05, - "loss": 2.2253, - "step": 451270 - }, - { - "epoch": 0.79, - "learning_rate": 1.0651094982160109e-05, - "loss": 2.1901, - "step": 451280 - }, - { - "epoch": 0.79, - "learning_rate": 1.0650223042233283e-05, - "loss": 2.3437, - "step": 451290 - }, - { - "epoch": 0.79, - "learning_rate": 1.0649351102306455e-05, - "loss": 2.4116, - "step": 451300 - }, - { - "epoch": 0.79, - "learning_rate": 1.0648479162379629e-05, - "loss": 2.3056, - "step": 451310 - }, - { - "epoch": 0.79, - "learning_rate": 1.0647607222452802e-05, - "loss": 2.3883, - "step": 451320 - }, - { - "epoch": 0.79, - "learning_rate": 1.0646735282525976e-05, - "loss": 2.2487, - "step": 451330 - }, - { - "epoch": 0.79, - "learning_rate": 1.064586334259915e-05, - "loss": 2.2987, - "step": 451340 - }, - { - "epoch": 0.79, - "learning_rate": 1.0644991402672322e-05, - "loss": 2.4565, - "step": 451350 - }, - { - "epoch": 0.79, - "learning_rate": 1.0644119462745496e-05, - "loss": 2.2087, - "step": 451360 - }, - { - "epoch": 0.79, - "learning_rate": 1.0643247522818668e-05, - "loss": 2.3303, - "step": 451370 - }, - { - "epoch": 0.79, - "learning_rate": 1.0642375582891842e-05, - "loss": 2.2096, - "step": 451380 - }, - { - "epoch": 0.79, - "learning_rate": 1.0641503642965015e-05, - "loss": 2.2762, - "step": 451390 - }, - { - "epoch": 0.79, - "learning_rate": 1.0640631703038189e-05, - "loss": 2.2706, - "step": 451400 - }, - { - "epoch": 0.79, - "learning_rate": 1.0639759763111361e-05, - "loss": 2.0764, - "step": 451410 - }, - { - "epoch": 0.79, - "learning_rate": 1.0638887823184535e-05, - "loss": 2.1351, - "step": 451420 - }, - { - "epoch": 0.79, - "learning_rate": 1.0638015883257707e-05, - "loss": 2.2237, - "step": 451430 - }, - { - "epoch": 0.79, - "learning_rate": 1.063714394333088e-05, - "loss": 2.2377, - "step": 451440 - }, - { - "epoch": 0.79, - "learning_rate": 1.0636272003404053e-05, - "loss": 2.3044, - "step": 451450 - }, - { - "epoch": 0.79, - "learning_rate": 1.0635400063477227e-05, - "loss": 2.3862, - "step": 451460 - }, - { - "epoch": 0.79, - "learning_rate": 1.06345281235504e-05, - "loss": 2.2312, - "step": 451470 - }, - { - "epoch": 0.79, - "learning_rate": 1.0633656183623574e-05, - "loss": 2.3081, - "step": 451480 - }, - { - "epoch": 0.79, - "learning_rate": 1.0632784243696748e-05, - "loss": 2.2366, - "step": 451490 - }, - { - "epoch": 0.79, - "learning_rate": 1.063191230376992e-05, - "loss": 2.2242, - "step": 451500 - }, - { - "epoch": 0.79, - "learning_rate": 1.0631040363843094e-05, - "loss": 2.2917, - "step": 451510 - }, - { - "epoch": 0.79, - "learning_rate": 1.0630168423916266e-05, - "loss": 2.3697, - "step": 451520 - }, - { - "epoch": 0.79, - "learning_rate": 1.062929648398944e-05, - "loss": 2.2877, - "step": 451530 - }, - { - "epoch": 0.79, - "learning_rate": 1.0628424544062612e-05, - "loss": 2.3335, - "step": 451540 - }, - { - "epoch": 0.79, - "learning_rate": 1.0627552604135785e-05, - "loss": 2.2675, - "step": 451550 - }, - { - "epoch": 0.79, - "learning_rate": 1.062668066420896e-05, - "loss": 2.3623, - "step": 451560 - }, - { - "epoch": 0.79, - "learning_rate": 1.0625808724282133e-05, - "loss": 2.2991, - "step": 451570 - }, - { - "epoch": 0.79, - "learning_rate": 1.0624936784355305e-05, - "loss": 2.286, - "step": 451580 - }, - { - "epoch": 0.79, - "learning_rate": 1.0624064844428479e-05, - "loss": 2.2107, - "step": 451590 - }, - { - "epoch": 0.79, - "learning_rate": 1.0623192904501653e-05, - "loss": 2.3226, - "step": 451600 - }, - { - "epoch": 0.79, - "learning_rate": 1.0622320964574825e-05, - "loss": 2.2885, - "step": 451610 - }, - { - "epoch": 0.79, - "learning_rate": 1.0621449024647998e-05, - "loss": 2.2379, - "step": 451620 - }, - { - "epoch": 0.79, - "learning_rate": 1.062057708472117e-05, - "loss": 2.3277, - "step": 451630 - }, - { - "epoch": 0.79, - "learning_rate": 1.0619705144794346e-05, - "loss": 2.3705, - "step": 451640 - }, - { - "epoch": 0.79, - "learning_rate": 1.0618833204867518e-05, - "loss": 2.3136, - "step": 451650 - }, - { - "epoch": 0.79, - "learning_rate": 1.0617961264940692e-05, - "loss": 2.1707, - "step": 451660 - }, - { - "epoch": 0.79, - "learning_rate": 1.0617089325013864e-05, - "loss": 2.2198, - "step": 451670 - }, - { - "epoch": 0.79, - "learning_rate": 1.0616217385087038e-05, - "loss": 2.3085, - "step": 451680 - }, - { - "epoch": 0.79, - "learning_rate": 1.061534544516021e-05, - "loss": 2.2149, - "step": 451690 - }, - { - "epoch": 0.79, - "learning_rate": 1.0614473505233384e-05, - "loss": 2.242, - "step": 451700 - }, - { - "epoch": 0.79, - "learning_rate": 1.0613601565306557e-05, - "loss": 2.3309, - "step": 451710 - }, - { - "epoch": 0.79, - "learning_rate": 1.0612729625379731e-05, - "loss": 2.223, - "step": 451720 - }, - { - "epoch": 0.79, - "learning_rate": 1.0611857685452905e-05, - "loss": 2.2953, - "step": 451730 - }, - { - "epoch": 0.79, - "learning_rate": 1.0610985745526077e-05, - "loss": 2.3243, - "step": 451740 - }, - { - "epoch": 0.79, - "learning_rate": 1.061011380559925e-05, - "loss": 2.3607, - "step": 451750 - }, - { - "epoch": 0.79, - "learning_rate": 1.0609241865672423e-05, - "loss": 2.3449, - "step": 451760 - }, - { - "epoch": 0.79, - "learning_rate": 1.0608369925745597e-05, - "loss": 2.2988, - "step": 451770 - }, - { - "epoch": 0.79, - "learning_rate": 1.0607497985818769e-05, - "loss": 2.2436, - "step": 451780 - }, - { - "epoch": 0.79, - "learning_rate": 1.0606626045891942e-05, - "loss": 2.35, - "step": 451790 - }, - { - "epoch": 0.79, - "learning_rate": 1.0605754105965116e-05, - "loss": 2.2338, - "step": 451800 - }, - { - "epoch": 0.79, - "learning_rate": 1.060488216603829e-05, - "loss": 2.2637, - "step": 451810 - }, - { - "epoch": 0.79, - "learning_rate": 1.0604010226111462e-05, - "loss": 2.247, - "step": 451820 - }, - { - "epoch": 0.79, - "learning_rate": 1.0603138286184636e-05, - "loss": 2.2722, - "step": 451830 - }, - { - "epoch": 0.79, - "learning_rate": 1.0602266346257808e-05, - "loss": 2.2879, - "step": 451840 - }, - { - "epoch": 0.79, - "learning_rate": 1.0601394406330982e-05, - "loss": 2.3636, - "step": 451850 - }, - { - "epoch": 0.79, - "learning_rate": 1.0600522466404155e-05, - "loss": 2.2544, - "step": 451860 - }, - { - "epoch": 0.79, - "learning_rate": 1.0599650526477327e-05, - "loss": 2.3306, - "step": 451870 - }, - { - "epoch": 0.79, - "learning_rate": 1.0598778586550503e-05, - "loss": 2.3093, - "step": 451880 - }, - { - "epoch": 0.79, - "learning_rate": 1.0597906646623675e-05, - "loss": 2.2767, - "step": 451890 - }, - { - "epoch": 0.79, - "learning_rate": 1.0597034706696849e-05, - "loss": 2.3309, - "step": 451900 - }, - { - "epoch": 0.79, - "learning_rate": 1.059616276677002e-05, - "loss": 2.3273, - "step": 451910 - }, - { - "epoch": 0.79, - "learning_rate": 1.0595290826843195e-05, - "loss": 2.4102, - "step": 451920 - }, - { - "epoch": 0.79, - "learning_rate": 1.0594418886916367e-05, - "loss": 2.1329, - "step": 451930 - }, - { - "epoch": 0.79, - "learning_rate": 1.059354694698954e-05, - "loss": 2.2046, - "step": 451940 - }, - { - "epoch": 0.79, - "learning_rate": 1.0592675007062714e-05, - "loss": 2.2472, - "step": 451950 - }, - { - "epoch": 0.79, - "learning_rate": 1.0591803067135888e-05, - "loss": 2.3142, - "step": 451960 - }, - { - "epoch": 0.79, - "learning_rate": 1.059093112720906e-05, - "loss": 2.3181, - "step": 451970 - }, - { - "epoch": 0.79, - "learning_rate": 1.0590059187282234e-05, - "loss": 2.2984, - "step": 451980 - }, - { - "epoch": 0.79, - "learning_rate": 1.0589187247355408e-05, - "loss": 2.2173, - "step": 451990 - }, - { - "epoch": 0.79, - "learning_rate": 1.058831530742858e-05, - "loss": 2.1415, - "step": 452000 - }, - { - "epoch": 0.79, - "learning_rate": 1.0587443367501753e-05, - "loss": 2.2295, - "step": 452010 - }, - { - "epoch": 0.79, - "learning_rate": 1.0586571427574926e-05, - "loss": 2.2254, - "step": 452020 - }, - { - "epoch": 0.79, - "learning_rate": 1.05856994876481e-05, - "loss": 2.2645, - "step": 452030 - }, - { - "epoch": 0.79, - "learning_rate": 1.0584827547721273e-05, - "loss": 2.2519, - "step": 452040 - }, - { - "epoch": 0.79, - "learning_rate": 1.0583955607794447e-05, - "loss": 2.1762, - "step": 452050 - }, - { - "epoch": 0.79, - "learning_rate": 1.0583083667867619e-05, - "loss": 2.1513, - "step": 452060 - }, - { - "epoch": 0.79, - "learning_rate": 1.0582211727940793e-05, - "loss": 2.4179, - "step": 452070 - }, - { - "epoch": 0.79, - "learning_rate": 1.0581339788013965e-05, - "loss": 2.2772, - "step": 452080 - }, - { - "epoch": 0.79, - "learning_rate": 1.0580467848087139e-05, - "loss": 2.2102, - "step": 452090 - }, - { - "epoch": 0.79, - "learning_rate": 1.057959590816031e-05, - "loss": 2.3593, - "step": 452100 - }, - { - "epoch": 0.79, - "learning_rate": 1.0578723968233484e-05, - "loss": 2.3284, - "step": 452110 - }, - { - "epoch": 0.79, - "learning_rate": 1.0577852028306658e-05, - "loss": 2.2732, - "step": 452120 - }, - { - "epoch": 0.79, - "learning_rate": 1.0576980088379832e-05, - "loss": 2.282, - "step": 452130 - }, - { - "epoch": 0.79, - "learning_rate": 1.0576108148453006e-05, - "loss": 2.2818, - "step": 452140 - }, - { - "epoch": 0.79, - "learning_rate": 1.0575236208526178e-05, - "loss": 2.2902, - "step": 452150 - }, - { - "epoch": 0.79, - "learning_rate": 1.0574364268599352e-05, - "loss": 2.2469, - "step": 452160 - }, - { - "epoch": 0.79, - "learning_rate": 1.0573492328672524e-05, - "loss": 2.2644, - "step": 452170 - }, - { - "epoch": 0.79, - "learning_rate": 1.0572620388745697e-05, - "loss": 2.309, - "step": 452180 - }, - { - "epoch": 0.79, - "learning_rate": 1.0571748448818871e-05, - "loss": 2.2679, - "step": 452190 - }, - { - "epoch": 0.79, - "learning_rate": 1.0570876508892045e-05, - "loss": 2.3388, - "step": 452200 - }, - { - "epoch": 0.79, - "learning_rate": 1.0570004568965217e-05, - "loss": 2.2145, - "step": 452210 - }, - { - "epoch": 0.79, - "learning_rate": 1.056913262903839e-05, - "loss": 2.2889, - "step": 452220 - }, - { - "epoch": 0.79, - "learning_rate": 1.0568260689111563e-05, - "loss": 2.3089, - "step": 452230 - }, - { - "epoch": 0.79, - "learning_rate": 1.0567388749184737e-05, - "loss": 2.3108, - "step": 452240 - }, - { - "epoch": 0.79, - "learning_rate": 1.0566516809257909e-05, - "loss": 2.3201, - "step": 452250 - }, - { - "epoch": 0.79, - "learning_rate": 1.0565644869331082e-05, - "loss": 2.1881, - "step": 452260 - }, - { - "epoch": 0.79, - "learning_rate": 1.0564772929404256e-05, - "loss": 2.3154, - "step": 452270 - }, - { - "epoch": 0.79, - "learning_rate": 1.056390098947743e-05, - "loss": 2.1353, - "step": 452280 - }, - { - "epoch": 0.79, - "learning_rate": 1.0563029049550604e-05, - "loss": 2.3708, - "step": 452290 - }, - { - "epoch": 0.79, - "learning_rate": 1.0562157109623776e-05, - "loss": 2.2985, - "step": 452300 - }, - { - "epoch": 0.79, - "learning_rate": 1.056128516969695e-05, - "loss": 2.3198, - "step": 452310 - }, - { - "epoch": 0.79, - "learning_rate": 1.0560413229770122e-05, - "loss": 2.2688, - "step": 452320 - }, - { - "epoch": 0.79, - "learning_rate": 1.0559541289843295e-05, - "loss": 2.4053, - "step": 452330 - }, - { - "epoch": 0.79, - "learning_rate": 1.0558669349916468e-05, - "loss": 2.245, - "step": 452340 - }, - { - "epoch": 0.79, - "learning_rate": 1.0557797409989641e-05, - "loss": 2.2403, - "step": 452350 - }, - { - "epoch": 0.79, - "learning_rate": 1.0556925470062815e-05, - "loss": 2.3639, - "step": 452360 - }, - { - "epoch": 0.79, - "learning_rate": 1.0556053530135989e-05, - "loss": 2.3416, - "step": 452370 - }, - { - "epoch": 0.79, - "learning_rate": 1.0555181590209161e-05, - "loss": 2.1843, - "step": 452380 - }, - { - "epoch": 0.79, - "learning_rate": 1.0554309650282335e-05, - "loss": 2.3293, - "step": 452390 - }, - { - "epoch": 0.79, - "learning_rate": 1.0553437710355508e-05, - "loss": 2.2337, - "step": 452400 - }, - { - "epoch": 0.79, - "learning_rate": 1.055256577042868e-05, - "loss": 2.2505, - "step": 452410 - }, - { - "epoch": 0.79, - "learning_rate": 1.0551693830501854e-05, - "loss": 2.335, - "step": 452420 - }, - { - "epoch": 0.79, - "learning_rate": 1.0550821890575028e-05, - "loss": 2.3186, - "step": 452430 - }, - { - "epoch": 0.79, - "learning_rate": 1.0549949950648202e-05, - "loss": 2.3046, - "step": 452440 - }, - { - "epoch": 0.79, - "learning_rate": 1.0549078010721374e-05, - "loss": 2.1998, - "step": 452450 - }, - { - "epoch": 0.79, - "learning_rate": 1.0548206070794548e-05, - "loss": 2.3185, - "step": 452460 - }, - { - "epoch": 0.79, - "learning_rate": 1.054733413086772e-05, - "loss": 2.3074, - "step": 452470 - }, - { - "epoch": 0.79, - "learning_rate": 1.0546462190940894e-05, - "loss": 2.2568, - "step": 452480 - }, - { - "epoch": 0.79, - "learning_rate": 1.0545590251014066e-05, - "loss": 2.2233, - "step": 452490 - }, - { - "epoch": 0.79, - "learning_rate": 1.054471831108724e-05, - "loss": 2.343, - "step": 452500 - }, - { - "epoch": 0.79, - "learning_rate": 1.0543846371160413e-05, - "loss": 2.3096, - "step": 452510 - }, - { - "epoch": 0.79, - "learning_rate": 1.0542974431233587e-05, - "loss": 2.3047, - "step": 452520 - }, - { - "epoch": 0.79, - "learning_rate": 1.054210249130676e-05, - "loss": 2.3072, - "step": 452530 - }, - { - "epoch": 0.79, - "learning_rate": 1.0541230551379933e-05, - "loss": 2.3619, - "step": 452540 - }, - { - "epoch": 0.79, - "learning_rate": 1.0540358611453107e-05, - "loss": 2.3085, - "step": 452550 - }, - { - "epoch": 0.79, - "learning_rate": 1.0539486671526279e-05, - "loss": 2.3789, - "step": 452560 - }, - { - "epoch": 0.79, - "learning_rate": 1.0538614731599452e-05, - "loss": 2.1945, - "step": 452570 - }, - { - "epoch": 0.79, - "learning_rate": 1.0537742791672624e-05, - "loss": 2.3497, - "step": 452580 - }, - { - "epoch": 0.79, - "learning_rate": 1.0536870851745798e-05, - "loss": 2.298, - "step": 452590 - }, - { - "epoch": 0.79, - "learning_rate": 1.0535998911818972e-05, - "loss": 2.4094, - "step": 452600 - }, - { - "epoch": 0.79, - "learning_rate": 1.0535126971892146e-05, - "loss": 2.3332, - "step": 452610 - }, - { - "epoch": 0.79, - "learning_rate": 1.0534255031965318e-05, - "loss": 2.2849, - "step": 452620 - }, - { - "epoch": 0.79, - "learning_rate": 1.0533383092038492e-05, - "loss": 2.2324, - "step": 452630 - }, - { - "epoch": 0.79, - "learning_rate": 1.0532511152111664e-05, - "loss": 2.1565, - "step": 452640 - }, - { - "epoch": 0.79, - "learning_rate": 1.0531639212184837e-05, - "loss": 2.276, - "step": 452650 - }, - { - "epoch": 0.79, - "learning_rate": 1.0530767272258011e-05, - "loss": 2.1321, - "step": 452660 - }, - { - "epoch": 0.79, - "learning_rate": 1.0529895332331183e-05, - "loss": 2.2902, - "step": 452670 - }, - { - "epoch": 0.79, - "learning_rate": 1.0529023392404359e-05, - "loss": 2.4007, - "step": 452680 - }, - { - "epoch": 0.79, - "learning_rate": 1.052815145247753e-05, - "loss": 2.2385, - "step": 452690 - }, - { - "epoch": 0.79, - "learning_rate": 1.0527279512550705e-05, - "loss": 2.1755, - "step": 452700 - }, - { - "epoch": 0.79, - "learning_rate": 1.0526407572623877e-05, - "loss": 2.3412, - "step": 452710 - }, - { - "epoch": 0.79, - "learning_rate": 1.052553563269705e-05, - "loss": 2.3553, - "step": 452720 - }, - { - "epoch": 0.79, - "learning_rate": 1.0524663692770223e-05, - "loss": 2.3552, - "step": 452730 - }, - { - "epoch": 0.79, - "learning_rate": 1.0523791752843396e-05, - "loss": 2.3038, - "step": 452740 - }, - { - "epoch": 0.79, - "learning_rate": 1.052291981291657e-05, - "loss": 2.2834, - "step": 452750 - }, - { - "epoch": 0.79, - "learning_rate": 1.0522047872989744e-05, - "loss": 2.3163, - "step": 452760 - }, - { - "epoch": 0.79, - "learning_rate": 1.0521175933062916e-05, - "loss": 2.4166, - "step": 452770 - }, - { - "epoch": 0.79, - "learning_rate": 1.052030399313609e-05, - "loss": 2.1991, - "step": 452780 - }, - { - "epoch": 0.79, - "learning_rate": 1.0519432053209263e-05, - "loss": 2.2902, - "step": 452790 - }, - { - "epoch": 0.79, - "learning_rate": 1.0518560113282436e-05, - "loss": 2.2797, - "step": 452800 - }, - { - "epoch": 0.79, - "learning_rate": 1.051768817335561e-05, - "loss": 2.3774, - "step": 452810 - }, - { - "epoch": 0.79, - "learning_rate": 1.0516816233428781e-05, - "loss": 2.2566, - "step": 452820 - }, - { - "epoch": 0.79, - "learning_rate": 1.0515944293501955e-05, - "loss": 2.2583, - "step": 452830 - }, - { - "epoch": 0.79, - "learning_rate": 1.0515072353575129e-05, - "loss": 2.4059, - "step": 452840 - }, - { - "epoch": 0.79, - "learning_rate": 1.0514200413648303e-05, - "loss": 2.3052, - "step": 452850 - }, - { - "epoch": 0.79, - "learning_rate": 1.0513328473721475e-05, - "loss": 2.2644, - "step": 452860 - }, - { - "epoch": 0.79, - "learning_rate": 1.0512456533794649e-05, - "loss": 2.3236, - "step": 452870 - }, - { - "epoch": 0.79, - "learning_rate": 1.051158459386782e-05, - "loss": 2.2617, - "step": 452880 - }, - { - "epoch": 0.79, - "learning_rate": 1.0510712653940994e-05, - "loss": 2.2539, - "step": 452890 - }, - { - "epoch": 0.79, - "learning_rate": 1.0509840714014166e-05, - "loss": 2.292, - "step": 452900 - }, - { - "epoch": 0.79, - "learning_rate": 1.050896877408734e-05, - "loss": 2.2064, - "step": 452910 - }, - { - "epoch": 0.79, - "learning_rate": 1.0508096834160514e-05, - "loss": 2.308, - "step": 452920 - }, - { - "epoch": 0.79, - "learning_rate": 1.0507224894233688e-05, - "loss": 2.2915, - "step": 452930 - }, - { - "epoch": 0.79, - "learning_rate": 1.0506352954306862e-05, - "loss": 2.2012, - "step": 452940 - }, - { - "epoch": 0.79, - "learning_rate": 1.0505481014380034e-05, - "loss": 2.3145, - "step": 452950 - }, - { - "epoch": 0.79, - "learning_rate": 1.0504609074453207e-05, - "loss": 2.3252, - "step": 452960 - }, - { - "epoch": 0.79, - "learning_rate": 1.050373713452638e-05, - "loss": 2.235, - "step": 452970 - }, - { - "epoch": 0.79, - "learning_rate": 1.0502865194599553e-05, - "loss": 2.2096, - "step": 452980 - }, - { - "epoch": 0.79, - "learning_rate": 1.0501993254672727e-05, - "loss": 2.2575, - "step": 452990 - }, - { - "epoch": 0.79, - "learning_rate": 1.05011213147459e-05, - "loss": 2.3625, - "step": 453000 - }, - { - "epoch": 0.79, - "learning_rate": 1.0500249374819073e-05, - "loss": 2.2595, - "step": 453010 - }, - { - "epoch": 0.79, - "learning_rate": 1.0499377434892247e-05, - "loss": 2.3905, - "step": 453020 - }, - { - "epoch": 0.79, - "learning_rate": 1.0498505494965419e-05, - "loss": 2.3253, - "step": 453030 - }, - { - "epoch": 0.79, - "learning_rate": 1.0497633555038592e-05, - "loss": 2.3007, - "step": 453040 - }, - { - "epoch": 0.79, - "learning_rate": 1.0496761615111765e-05, - "loss": 2.3192, - "step": 453050 - }, - { - "epoch": 0.79, - "learning_rate": 1.0495889675184938e-05, - "loss": 2.1549, - "step": 453060 - }, - { - "epoch": 0.79, - "learning_rate": 1.0495017735258112e-05, - "loss": 2.2492, - "step": 453070 - }, - { - "epoch": 0.79, - "learning_rate": 1.0494145795331286e-05, - "loss": 2.1885, - "step": 453080 - }, - { - "epoch": 0.79, - "learning_rate": 1.049327385540446e-05, - "loss": 2.2944, - "step": 453090 - }, - { - "epoch": 0.79, - "learning_rate": 1.0492401915477632e-05, - "loss": 2.2835, - "step": 453100 - }, - { - "epoch": 0.79, - "learning_rate": 1.0491529975550805e-05, - "loss": 2.3707, - "step": 453110 - }, - { - "epoch": 0.79, - "learning_rate": 1.0490658035623978e-05, - "loss": 2.224, - "step": 453120 - }, - { - "epoch": 0.79, - "learning_rate": 1.0489786095697151e-05, - "loss": 2.3236, - "step": 453130 - }, - { - "epoch": 0.79, - "learning_rate": 1.0488914155770323e-05, - "loss": 2.1553, - "step": 453140 - }, - { - "epoch": 0.79, - "learning_rate": 1.0488042215843497e-05, - "loss": 2.2136, - "step": 453150 - }, - { - "epoch": 0.79, - "learning_rate": 1.0487170275916671e-05, - "loss": 2.2753, - "step": 453160 - }, - { - "epoch": 0.79, - "learning_rate": 1.0486298335989845e-05, - "loss": 2.2864, - "step": 453170 - }, - { - "epoch": 0.79, - "learning_rate": 1.0485426396063017e-05, - "loss": 2.2853, - "step": 453180 - }, - { - "epoch": 0.79, - "learning_rate": 1.048455445613619e-05, - "loss": 2.3571, - "step": 453190 - }, - { - "epoch": 0.79, - "learning_rate": 1.0483682516209364e-05, - "loss": 2.2903, - "step": 453200 - }, - { - "epoch": 0.79, - "learning_rate": 1.0482810576282536e-05, - "loss": 2.2756, - "step": 453210 - }, - { - "epoch": 0.79, - "learning_rate": 1.048193863635571e-05, - "loss": 2.2264, - "step": 453220 - }, - { - "epoch": 0.79, - "learning_rate": 1.0481066696428884e-05, - "loss": 2.2601, - "step": 453230 - }, - { - "epoch": 0.79, - "learning_rate": 1.0480194756502058e-05, - "loss": 2.2023, - "step": 453240 - }, - { - "epoch": 0.79, - "learning_rate": 1.047932281657523e-05, - "loss": 2.4168, - "step": 453250 - }, - { - "epoch": 0.79, - "learning_rate": 1.0478450876648404e-05, - "loss": 2.3077, - "step": 453260 - }, - { - "epoch": 0.79, - "learning_rate": 1.0477578936721576e-05, - "loss": 2.3765, - "step": 453270 - }, - { - "epoch": 0.79, - "learning_rate": 1.047670699679475e-05, - "loss": 2.2408, - "step": 453280 - }, - { - "epoch": 0.79, - "learning_rate": 1.0475835056867921e-05, - "loss": 2.2858, - "step": 453290 - }, - { - "epoch": 0.79, - "learning_rate": 1.0474963116941095e-05, - "loss": 2.2378, - "step": 453300 - }, - { - "epoch": 0.79, - "learning_rate": 1.0474091177014269e-05, - "loss": 2.1564, - "step": 453310 - }, - { - "epoch": 0.79, - "learning_rate": 1.0473219237087443e-05, - "loss": 2.3288, - "step": 453320 - }, - { - "epoch": 0.79, - "learning_rate": 1.0472347297160617e-05, - "loss": 2.2816, - "step": 453330 - }, - { - "epoch": 0.79, - "learning_rate": 1.0471475357233789e-05, - "loss": 2.3118, - "step": 453340 - }, - { - "epoch": 0.79, - "learning_rate": 1.0470603417306962e-05, - "loss": 2.3097, - "step": 453350 - }, - { - "epoch": 0.79, - "learning_rate": 1.0469731477380134e-05, - "loss": 2.3308, - "step": 453360 - }, - { - "epoch": 0.79, - "learning_rate": 1.0468859537453308e-05, - "loss": 2.3783, - "step": 453370 - }, - { - "epoch": 0.79, - "learning_rate": 1.046798759752648e-05, - "loss": 2.2155, - "step": 453380 - }, - { - "epoch": 0.79, - "learning_rate": 1.0467115657599654e-05, - "loss": 2.3847, - "step": 453390 - }, - { - "epoch": 0.79, - "learning_rate": 1.0466243717672828e-05, - "loss": 2.2966, - "step": 453400 - }, - { - "epoch": 0.79, - "learning_rate": 1.0465371777746002e-05, - "loss": 2.2489, - "step": 453410 - }, - { - "epoch": 0.79, - "learning_rate": 1.0464499837819174e-05, - "loss": 2.3314, - "step": 453420 - }, - { - "epoch": 0.79, - "learning_rate": 1.0463627897892347e-05, - "loss": 2.3311, - "step": 453430 - }, - { - "epoch": 0.79, - "learning_rate": 1.046275595796552e-05, - "loss": 2.2792, - "step": 453440 - }, - { - "epoch": 0.79, - "learning_rate": 1.0461884018038693e-05, - "loss": 2.271, - "step": 453450 - }, - { - "epoch": 0.79, - "learning_rate": 1.0461012078111867e-05, - "loss": 2.3909, - "step": 453460 - }, - { - "epoch": 0.79, - "learning_rate": 1.046014013818504e-05, - "loss": 2.2059, - "step": 453470 - }, - { - "epoch": 0.79, - "learning_rate": 1.0459268198258215e-05, - "loss": 2.3837, - "step": 453480 - }, - { - "epoch": 0.79, - "learning_rate": 1.0458396258331387e-05, - "loss": 2.3049, - "step": 453490 - }, - { - "epoch": 0.79, - "learning_rate": 1.045752431840456e-05, - "loss": 2.1819, - "step": 453500 - }, - { - "epoch": 0.79, - "learning_rate": 1.0456652378477733e-05, - "loss": 2.315, - "step": 453510 - }, - { - "epoch": 0.79, - "learning_rate": 1.0455780438550906e-05, - "loss": 2.3159, - "step": 453520 - }, - { - "epoch": 0.79, - "learning_rate": 1.0454908498624078e-05, - "loss": 2.3121, - "step": 453530 - }, - { - "epoch": 0.79, - "learning_rate": 1.0454036558697252e-05, - "loss": 2.2927, - "step": 453540 - }, - { - "epoch": 0.79, - "learning_rate": 1.0453164618770426e-05, - "loss": 2.3073, - "step": 453550 - }, - { - "epoch": 0.79, - "learning_rate": 1.04522926788436e-05, - "loss": 2.2488, - "step": 453560 - }, - { - "epoch": 0.79, - "learning_rate": 1.0451420738916772e-05, - "loss": 2.2603, - "step": 453570 - }, - { - "epoch": 0.79, - "learning_rate": 1.0450548798989946e-05, - "loss": 2.2571, - "step": 453580 - }, - { - "epoch": 0.79, - "learning_rate": 1.044967685906312e-05, - "loss": 2.2432, - "step": 453590 - }, - { - "epoch": 0.79, - "learning_rate": 1.0448804919136291e-05, - "loss": 2.2681, - "step": 453600 - }, - { - "epoch": 0.79, - "learning_rate": 1.0447932979209465e-05, - "loss": 2.2863, - "step": 453610 - }, - { - "epoch": 0.79, - "learning_rate": 1.0447061039282637e-05, - "loss": 2.2252, - "step": 453620 - }, - { - "epoch": 0.79, - "learning_rate": 1.0446189099355811e-05, - "loss": 2.304, - "step": 453630 - }, - { - "epoch": 0.79, - "learning_rate": 1.0445317159428985e-05, - "loss": 2.2744, - "step": 453640 - }, - { - "epoch": 0.79, - "learning_rate": 1.0444445219502159e-05, - "loss": 2.3194, - "step": 453650 - }, - { - "epoch": 0.79, - "learning_rate": 1.044357327957533e-05, - "loss": 2.3457, - "step": 453660 - }, - { - "epoch": 0.79, - "learning_rate": 1.0442701339648504e-05, - "loss": 2.2564, - "step": 453670 - }, - { - "epoch": 0.79, - "learning_rate": 1.0441829399721676e-05, - "loss": 2.3639, - "step": 453680 - }, - { - "epoch": 0.79, - "learning_rate": 1.044095745979485e-05, - "loss": 2.229, - "step": 453690 - }, - { - "epoch": 0.79, - "learning_rate": 1.0440085519868022e-05, - "loss": 2.3204, - "step": 453700 - }, - { - "epoch": 0.79, - "learning_rate": 1.0439213579941196e-05, - "loss": 2.2176, - "step": 453710 - }, - { - "epoch": 0.79, - "learning_rate": 1.0438341640014372e-05, - "loss": 2.2916, - "step": 453720 - }, - { - "epoch": 0.79, - "learning_rate": 1.0437469700087544e-05, - "loss": 2.3048, - "step": 453730 - }, - { - "epoch": 0.79, - "learning_rate": 1.0436597760160717e-05, - "loss": 2.2944, - "step": 453740 - }, - { - "epoch": 0.79, - "learning_rate": 1.043572582023389e-05, - "loss": 2.2797, - "step": 453750 - }, - { - "epoch": 0.79, - "learning_rate": 1.0434853880307063e-05, - "loss": 2.3289, - "step": 453760 - }, - { - "epoch": 0.79, - "learning_rate": 1.0433981940380235e-05, - "loss": 2.2244, - "step": 453770 - }, - { - "epoch": 0.79, - "learning_rate": 1.0433110000453409e-05, - "loss": 2.2719, - "step": 453780 - }, - { - "epoch": 0.79, - "learning_rate": 1.0432238060526583e-05, - "loss": 2.3097, - "step": 453790 - }, - { - "epoch": 0.79, - "learning_rate": 1.0431366120599757e-05, - "loss": 2.2685, - "step": 453800 - }, - { - "epoch": 0.79, - "learning_rate": 1.0430494180672929e-05, - "loss": 2.2846, - "step": 453810 - }, - { - "epoch": 0.79, - "learning_rate": 1.0429622240746102e-05, - "loss": 2.2304, - "step": 453820 - }, - { - "epoch": 0.79, - "learning_rate": 1.0428750300819275e-05, - "loss": 2.3654, - "step": 453830 - }, - { - "epoch": 0.79, - "learning_rate": 1.0427878360892448e-05, - "loss": 2.4001, - "step": 453840 - }, - { - "epoch": 0.79, - "learning_rate": 1.042700642096562e-05, - "loss": 2.2937, - "step": 453850 - }, - { - "epoch": 0.79, - "learning_rate": 1.0426134481038794e-05, - "loss": 2.1865, - "step": 453860 - }, - { - "epoch": 0.79, - "learning_rate": 1.0425262541111968e-05, - "loss": 2.2469, - "step": 453870 - }, - { - "epoch": 0.79, - "learning_rate": 1.0424390601185142e-05, - "loss": 2.2711, - "step": 453880 - }, - { - "epoch": 0.79, - "learning_rate": 1.0423518661258315e-05, - "loss": 2.2986, - "step": 453890 - }, - { - "epoch": 0.79, - "learning_rate": 1.0422646721331488e-05, - "loss": 2.203, - "step": 453900 - }, - { - "epoch": 0.79, - "learning_rate": 1.0421774781404661e-05, - "loss": 2.3036, - "step": 453910 - }, - { - "epoch": 0.79, - "learning_rate": 1.0420902841477833e-05, - "loss": 2.4139, - "step": 453920 - }, - { - "epoch": 0.79, - "learning_rate": 1.0420030901551007e-05, - "loss": 2.2616, - "step": 453930 - }, - { - "epoch": 0.79, - "learning_rate": 1.041915896162418e-05, - "loss": 2.3448, - "step": 453940 - }, - { - "epoch": 0.79, - "learning_rate": 1.0418287021697353e-05, - "loss": 2.3987, - "step": 453950 - }, - { - "epoch": 0.79, - "learning_rate": 1.0417415081770527e-05, - "loss": 2.3411, - "step": 453960 - }, - { - "epoch": 0.79, - "learning_rate": 1.04165431418437e-05, - "loss": 2.1596, - "step": 453970 - }, - { - "epoch": 0.79, - "learning_rate": 1.0415671201916873e-05, - "loss": 2.2911, - "step": 453980 - }, - { - "epoch": 0.79, - "learning_rate": 1.0414799261990046e-05, - "loss": 2.27, - "step": 453990 - }, - { - "epoch": 0.79, - "learning_rate": 1.041392732206322e-05, - "loss": 2.3854, - "step": 454000 - }, - { - "epoch": 0.79, - "learning_rate": 1.0413055382136392e-05, - "loss": 2.3329, - "step": 454010 - }, - { - "epoch": 0.79, - "learning_rate": 1.0412183442209566e-05, - "loss": 2.2325, - "step": 454020 - }, - { - "epoch": 0.79, - "learning_rate": 1.041131150228274e-05, - "loss": 2.2671, - "step": 454030 - }, - { - "epoch": 0.79, - "learning_rate": 1.0410439562355914e-05, - "loss": 2.392, - "step": 454040 - }, - { - "epoch": 0.79, - "learning_rate": 1.0409567622429086e-05, - "loss": 2.0128, - "step": 454050 - }, - { - "epoch": 0.79, - "learning_rate": 1.040869568250226e-05, - "loss": 2.2458, - "step": 454060 - }, - { - "epoch": 0.79, - "learning_rate": 1.0407823742575431e-05, - "loss": 2.3026, - "step": 454070 - }, - { - "epoch": 0.79, - "learning_rate": 1.0406951802648605e-05, - "loss": 2.3298, - "step": 454080 - }, - { - "epoch": 0.79, - "learning_rate": 1.0406079862721777e-05, - "loss": 2.2624, - "step": 454090 - }, - { - "epoch": 0.79, - "learning_rate": 1.0405207922794951e-05, - "loss": 2.2841, - "step": 454100 - }, - { - "epoch": 0.79, - "learning_rate": 1.0404335982868125e-05, - "loss": 2.3559, - "step": 454110 - }, - { - "epoch": 0.79, - "learning_rate": 1.0403464042941299e-05, - "loss": 2.2938, - "step": 454120 - }, - { - "epoch": 0.79, - "learning_rate": 1.0402592103014472e-05, - "loss": 2.2563, - "step": 454130 - }, - { - "epoch": 0.79, - "learning_rate": 1.0401720163087644e-05, - "loss": 2.2391, - "step": 454140 - }, - { - "epoch": 0.79, - "learning_rate": 1.0400848223160818e-05, - "loss": 2.3401, - "step": 454150 - }, - { - "epoch": 0.79, - "learning_rate": 1.039997628323399e-05, - "loss": 2.2908, - "step": 454160 - }, - { - "epoch": 0.79, - "learning_rate": 1.0399104343307164e-05, - "loss": 2.1049, - "step": 454170 - }, - { - "epoch": 0.79, - "learning_rate": 1.0398232403380336e-05, - "loss": 2.2316, - "step": 454180 - }, - { - "epoch": 0.79, - "learning_rate": 1.039736046345351e-05, - "loss": 2.2138, - "step": 454190 - }, - { - "epoch": 0.79, - "learning_rate": 1.0396488523526684e-05, - "loss": 2.3647, - "step": 454200 - }, - { - "epoch": 0.79, - "learning_rate": 1.0395616583599857e-05, - "loss": 2.3238, - "step": 454210 - }, - { - "epoch": 0.79, - "learning_rate": 1.039474464367303e-05, - "loss": 2.2706, - "step": 454220 - }, - { - "epoch": 0.79, - "learning_rate": 1.0393872703746203e-05, - "loss": 2.3839, - "step": 454230 - }, - { - "epoch": 0.79, - "learning_rate": 1.0393000763819375e-05, - "loss": 2.2937, - "step": 454240 - }, - { - "epoch": 0.79, - "learning_rate": 1.039212882389255e-05, - "loss": 2.2041, - "step": 454250 - }, - { - "epoch": 0.79, - "learning_rate": 1.0391256883965723e-05, - "loss": 2.317, - "step": 454260 - }, - { - "epoch": 0.79, - "learning_rate": 1.0390384944038897e-05, - "loss": 2.2637, - "step": 454270 - }, - { - "epoch": 0.79, - "learning_rate": 1.038951300411207e-05, - "loss": 2.2196, - "step": 454280 - }, - { - "epoch": 0.79, - "learning_rate": 1.0388641064185243e-05, - "loss": 2.239, - "step": 454290 - }, - { - "epoch": 0.79, - "learning_rate": 1.0387769124258416e-05, - "loss": 2.2925, - "step": 454300 - }, - { - "epoch": 0.79, - "learning_rate": 1.0386897184331588e-05, - "loss": 2.1006, - "step": 454310 - }, - { - "epoch": 0.79, - "learning_rate": 1.0386025244404762e-05, - "loss": 2.4033, - "step": 454320 - }, - { - "epoch": 0.79, - "learning_rate": 1.0385153304477934e-05, - "loss": 2.307, - "step": 454330 - }, - { - "epoch": 0.79, - "learning_rate": 1.0384281364551108e-05, - "loss": 2.2598, - "step": 454340 - }, - { - "epoch": 0.79, - "learning_rate": 1.0383409424624282e-05, - "loss": 2.1797, - "step": 454350 - }, - { - "epoch": 0.79, - "learning_rate": 1.0382537484697456e-05, - "loss": 2.4317, - "step": 454360 - }, - { - "epoch": 0.79, - "learning_rate": 1.0381665544770628e-05, - "loss": 2.2899, - "step": 454370 - }, - { - "epoch": 0.79, - "learning_rate": 1.0380793604843801e-05, - "loss": 2.2194, - "step": 454380 - }, - { - "epoch": 0.79, - "learning_rate": 1.0379921664916975e-05, - "loss": 2.3406, - "step": 454390 - }, - { - "epoch": 0.79, - "learning_rate": 1.0379049724990147e-05, - "loss": 2.279, - "step": 454400 - }, - { - "epoch": 0.79, - "learning_rate": 1.0378177785063321e-05, - "loss": 2.1529, - "step": 454410 - }, - { - "epoch": 0.79, - "learning_rate": 1.0377305845136493e-05, - "loss": 2.267, - "step": 454420 - }, - { - "epoch": 0.79, - "learning_rate": 1.0376433905209667e-05, - "loss": 2.3338, - "step": 454430 - }, - { - "epoch": 0.79, - "learning_rate": 1.037556196528284e-05, - "loss": 2.296, - "step": 454440 - }, - { - "epoch": 0.79, - "learning_rate": 1.0374690025356014e-05, - "loss": 2.2688, - "step": 454450 - }, - { - "epoch": 0.79, - "learning_rate": 1.0373818085429186e-05, - "loss": 2.3013, - "step": 454460 - }, - { - "epoch": 0.79, - "learning_rate": 1.037294614550236e-05, - "loss": 2.2531, - "step": 454470 - }, - { - "epoch": 0.79, - "learning_rate": 1.0372074205575532e-05, - "loss": 2.2577, - "step": 454480 - }, - { - "epoch": 0.79, - "learning_rate": 1.0371202265648706e-05, - "loss": 2.255, - "step": 454490 - }, - { - "epoch": 0.79, - "learning_rate": 1.0370330325721878e-05, - "loss": 2.3246, - "step": 454500 - }, - { - "epoch": 0.79, - "learning_rate": 1.0369458385795054e-05, - "loss": 2.3504, - "step": 454510 - }, - { - "epoch": 0.79, - "learning_rate": 1.0368586445868227e-05, - "loss": 2.2741, - "step": 454520 - }, - { - "epoch": 0.79, - "learning_rate": 1.03677145059414e-05, - "loss": 2.3379, - "step": 454530 - }, - { - "epoch": 0.79, - "learning_rate": 1.0366842566014573e-05, - "loss": 2.2637, - "step": 454540 - }, - { - "epoch": 0.79, - "learning_rate": 1.0365970626087745e-05, - "loss": 2.3252, - "step": 454550 - }, - { - "epoch": 0.79, - "learning_rate": 1.0365098686160919e-05, - "loss": 2.2663, - "step": 454560 - }, - { - "epoch": 0.79, - "learning_rate": 1.0364226746234091e-05, - "loss": 2.2904, - "step": 454570 - }, - { - "epoch": 0.79, - "learning_rate": 1.0363354806307265e-05, - "loss": 2.1167, - "step": 454580 - }, - { - "epoch": 0.79, - "learning_rate": 1.0362482866380439e-05, - "loss": 2.1991, - "step": 454590 - }, - { - "epoch": 0.79, - "learning_rate": 1.0361610926453612e-05, - "loss": 2.3079, - "step": 454600 - }, - { - "epoch": 0.79, - "learning_rate": 1.0360738986526785e-05, - "loss": 2.2726, - "step": 454610 - }, - { - "epoch": 0.79, - "learning_rate": 1.0359867046599958e-05, - "loss": 2.2643, - "step": 454620 - }, - { - "epoch": 0.79, - "learning_rate": 1.035899510667313e-05, - "loss": 2.2773, - "step": 454630 - }, - { - "epoch": 0.79, - "learning_rate": 1.0358123166746304e-05, - "loss": 2.3584, - "step": 454640 - }, - { - "epoch": 0.79, - "learning_rate": 1.0357251226819476e-05, - "loss": 2.1178, - "step": 454650 - }, - { - "epoch": 0.79, - "learning_rate": 1.035637928689265e-05, - "loss": 2.3628, - "step": 454660 - }, - { - "epoch": 0.79, - "learning_rate": 1.0355507346965824e-05, - "loss": 2.2896, - "step": 454670 - }, - { - "epoch": 0.79, - "learning_rate": 1.0354635407038998e-05, - "loss": 2.2954, - "step": 454680 - }, - { - "epoch": 0.79, - "learning_rate": 1.0353763467112171e-05, - "loss": 2.427, - "step": 454690 - }, - { - "epoch": 0.79, - "learning_rate": 1.0352891527185343e-05, - "loss": 2.2731, - "step": 454700 - }, - { - "epoch": 0.79, - "learning_rate": 1.0352019587258517e-05, - "loss": 2.3983, - "step": 454710 - }, - { - "epoch": 0.79, - "learning_rate": 1.035114764733169e-05, - "loss": 2.2936, - "step": 454720 - }, - { - "epoch": 0.79, - "learning_rate": 1.0350275707404863e-05, - "loss": 2.385, - "step": 454730 - }, - { - "epoch": 0.79, - "learning_rate": 1.0349403767478035e-05, - "loss": 2.2529, - "step": 454740 - }, - { - "epoch": 0.79, - "learning_rate": 1.034853182755121e-05, - "loss": 2.3041, - "step": 454750 - }, - { - "epoch": 0.79, - "learning_rate": 1.0347659887624383e-05, - "loss": 2.1404, - "step": 454760 - }, - { - "epoch": 0.79, - "learning_rate": 1.0346787947697556e-05, - "loss": 2.3379, - "step": 454770 - }, - { - "epoch": 0.79, - "learning_rate": 1.0345916007770728e-05, - "loss": 2.439, - "step": 454780 - }, - { - "epoch": 0.79, - "learning_rate": 1.0345044067843902e-05, - "loss": 2.2303, - "step": 454790 - }, - { - "epoch": 0.79, - "learning_rate": 1.0344172127917076e-05, - "loss": 2.3086, - "step": 454800 - }, - { - "epoch": 0.79, - "learning_rate": 1.0343300187990248e-05, - "loss": 2.2801, - "step": 454810 - }, - { - "epoch": 0.79, - "learning_rate": 1.0342428248063422e-05, - "loss": 2.1555, - "step": 454820 - }, - { - "epoch": 0.79, - "learning_rate": 1.0341556308136596e-05, - "loss": 2.198, - "step": 454830 - }, - { - "epoch": 0.79, - "learning_rate": 1.034068436820977e-05, - "loss": 2.328, - "step": 454840 - }, - { - "epoch": 0.79, - "learning_rate": 1.0339812428282941e-05, - "loss": 2.1695, - "step": 454850 - }, - { - "epoch": 0.79, - "learning_rate": 1.0338940488356115e-05, - "loss": 2.2677, - "step": 454860 - }, - { - "epoch": 0.79, - "learning_rate": 1.0338068548429287e-05, - "loss": 2.2012, - "step": 454870 - }, - { - "epoch": 0.79, - "learning_rate": 1.0337196608502461e-05, - "loss": 2.1827, - "step": 454880 - }, - { - "epoch": 0.79, - "learning_rate": 1.0336324668575633e-05, - "loss": 2.2224, - "step": 454890 - }, - { - "epoch": 0.79, - "learning_rate": 1.0335452728648807e-05, - "loss": 2.148, - "step": 454900 - }, - { - "epoch": 0.79, - "learning_rate": 1.033458078872198e-05, - "loss": 2.3284, - "step": 454910 - }, - { - "epoch": 0.79, - "learning_rate": 1.0333708848795154e-05, - "loss": 2.1774, - "step": 454920 - }, - { - "epoch": 0.79, - "learning_rate": 1.0332836908868328e-05, - "loss": 2.149, - "step": 454930 - }, - { - "epoch": 0.79, - "learning_rate": 1.03319649689415e-05, - "loss": 2.2078, - "step": 454940 - }, - { - "epoch": 0.79, - "learning_rate": 1.0331093029014674e-05, - "loss": 2.2306, - "step": 454950 - }, - { - "epoch": 0.79, - "learning_rate": 1.0330221089087846e-05, - "loss": 2.2018, - "step": 454960 - }, - { - "epoch": 0.79, - "learning_rate": 1.032934914916102e-05, - "loss": 2.3288, - "step": 454970 - }, - { - "epoch": 0.79, - "learning_rate": 1.0328477209234192e-05, - "loss": 2.2547, - "step": 454980 - }, - { - "epoch": 0.79, - "learning_rate": 1.0327605269307366e-05, - "loss": 2.3211, - "step": 454990 - }, - { - "epoch": 0.79, - "learning_rate": 1.032673332938054e-05, - "loss": 2.2887, - "step": 455000 - }, - { - "epoch": 0.79, - "learning_rate": 1.0325861389453713e-05, - "loss": 2.3162, - "step": 455010 - }, - { - "epoch": 0.79, - "learning_rate": 1.0324989449526885e-05, - "loss": 2.2333, - "step": 455020 - }, - { - "epoch": 0.79, - "learning_rate": 1.032411750960006e-05, - "loss": 2.247, - "step": 455030 - }, - { - "epoch": 0.79, - "learning_rate": 1.0323245569673231e-05, - "loss": 2.2089, - "step": 455040 - }, - { - "epoch": 0.79, - "learning_rate": 1.0322373629746405e-05, - "loss": 2.2909, - "step": 455050 - }, - { - "epoch": 0.79, - "learning_rate": 1.0321501689819579e-05, - "loss": 2.3872, - "step": 455060 - }, - { - "epoch": 0.79, - "learning_rate": 1.0320629749892753e-05, - "loss": 2.197, - "step": 455070 - }, - { - "epoch": 0.79, - "learning_rate": 1.0319757809965926e-05, - "loss": 2.2202, - "step": 455080 - }, - { - "epoch": 0.79, - "learning_rate": 1.0318885870039098e-05, - "loss": 2.3442, - "step": 455090 - }, - { - "epoch": 0.79, - "learning_rate": 1.0318013930112272e-05, - "loss": 2.2652, - "step": 455100 - }, - { - "epoch": 0.79, - "learning_rate": 1.0317141990185444e-05, - "loss": 2.3097, - "step": 455110 - }, - { - "epoch": 0.79, - "learning_rate": 1.0316270050258618e-05, - "loss": 2.2533, - "step": 455120 - }, - { - "epoch": 0.79, - "learning_rate": 1.031539811033179e-05, - "loss": 2.2632, - "step": 455130 - }, - { - "epoch": 0.79, - "learning_rate": 1.0314526170404964e-05, - "loss": 2.2452, - "step": 455140 - }, - { - "epoch": 0.79, - "learning_rate": 1.0313654230478138e-05, - "loss": 2.3086, - "step": 455150 - }, - { - "epoch": 0.79, - "learning_rate": 1.0312782290551311e-05, - "loss": 2.1754, - "step": 455160 - }, - { - "epoch": 0.79, - "learning_rate": 1.0311910350624483e-05, - "loss": 2.3588, - "step": 455170 - }, - { - "epoch": 0.79, - "learning_rate": 1.0311038410697657e-05, - "loss": 2.2809, - "step": 455180 - }, - { - "epoch": 0.79, - "learning_rate": 1.0310166470770831e-05, - "loss": 2.453, - "step": 455190 - }, - { - "epoch": 0.79, - "learning_rate": 1.0309294530844003e-05, - "loss": 2.2489, - "step": 455200 - }, - { - "epoch": 0.79, - "learning_rate": 1.0308422590917177e-05, - "loss": 2.1281, - "step": 455210 - }, - { - "epoch": 0.79, - "learning_rate": 1.0307550650990349e-05, - "loss": 2.3183, - "step": 455220 - }, - { - "epoch": 0.79, - "learning_rate": 1.0306678711063523e-05, - "loss": 2.2488, - "step": 455230 - }, - { - "epoch": 0.79, - "learning_rate": 1.0305806771136696e-05, - "loss": 2.2858, - "step": 455240 - }, - { - "epoch": 0.79, - "learning_rate": 1.030493483120987e-05, - "loss": 2.2097, - "step": 455250 - }, - { - "epoch": 0.79, - "learning_rate": 1.0304062891283042e-05, - "loss": 2.2607, - "step": 455260 - }, - { - "epoch": 0.79, - "learning_rate": 1.0303190951356216e-05, - "loss": 2.2811, - "step": 455270 - }, - { - "epoch": 0.79, - "learning_rate": 1.0302319011429388e-05, - "loss": 2.3136, - "step": 455280 - }, - { - "epoch": 0.79, - "learning_rate": 1.0301447071502562e-05, - "loss": 2.2547, - "step": 455290 - }, - { - "epoch": 0.79, - "learning_rate": 1.0300575131575734e-05, - "loss": 2.332, - "step": 455300 - }, - { - "epoch": 0.79, - "learning_rate": 1.029970319164891e-05, - "loss": 2.3722, - "step": 455310 - }, - { - "epoch": 0.79, - "learning_rate": 1.0298831251722083e-05, - "loss": 2.365, - "step": 455320 - }, - { - "epoch": 0.79, - "learning_rate": 1.0297959311795255e-05, - "loss": 2.1628, - "step": 455330 - }, - { - "epoch": 0.79, - "learning_rate": 1.0297087371868429e-05, - "loss": 2.3057, - "step": 455340 - }, - { - "epoch": 0.79, - "learning_rate": 1.0296215431941601e-05, - "loss": 2.3358, - "step": 455350 - }, - { - "epoch": 0.79, - "learning_rate": 1.0295343492014775e-05, - "loss": 2.2987, - "step": 455360 - }, - { - "epoch": 0.79, - "learning_rate": 1.0294471552087947e-05, - "loss": 2.2985, - "step": 455370 - }, - { - "epoch": 0.79, - "learning_rate": 1.029359961216112e-05, - "loss": 2.3233, - "step": 455380 - }, - { - "epoch": 0.79, - "learning_rate": 1.0292727672234295e-05, - "loss": 2.2621, - "step": 455390 - }, - { - "epoch": 0.79, - "learning_rate": 1.0291855732307468e-05, - "loss": 2.2854, - "step": 455400 - }, - { - "epoch": 0.79, - "learning_rate": 1.029098379238064e-05, - "loss": 2.2423, - "step": 455410 - }, - { - "epoch": 0.79, - "learning_rate": 1.0290111852453814e-05, - "loss": 2.2162, - "step": 455420 - }, - { - "epoch": 0.79, - "learning_rate": 1.0289239912526986e-05, - "loss": 2.2645, - "step": 455430 - }, - { - "epoch": 0.79, - "learning_rate": 1.028836797260016e-05, - "loss": 2.2314, - "step": 455440 - }, - { - "epoch": 0.79, - "learning_rate": 1.0287496032673334e-05, - "loss": 2.2398, - "step": 455450 - }, - { - "epoch": 0.79, - "learning_rate": 1.0286624092746506e-05, - "loss": 2.3141, - "step": 455460 - }, - { - "epoch": 0.79, - "learning_rate": 1.028575215281968e-05, - "loss": 2.2874, - "step": 455470 - }, - { - "epoch": 0.79, - "learning_rate": 1.0284880212892853e-05, - "loss": 2.2639, - "step": 455480 - }, - { - "epoch": 0.79, - "learning_rate": 1.0284008272966027e-05, - "loss": 2.2938, - "step": 455490 - }, - { - "epoch": 0.79, - "learning_rate": 1.02831363330392e-05, - "loss": 2.2546, - "step": 455500 - }, - { - "epoch": 0.79, - "learning_rate": 1.0282264393112373e-05, - "loss": 2.3014, - "step": 455510 - }, - { - "epoch": 0.79, - "learning_rate": 1.0281392453185545e-05, - "loss": 2.4053, - "step": 455520 - }, - { - "epoch": 0.79, - "learning_rate": 1.0280520513258719e-05, - "loss": 2.2545, - "step": 455530 - }, - { - "epoch": 0.79, - "learning_rate": 1.0279648573331891e-05, - "loss": 2.3766, - "step": 455540 - }, - { - "epoch": 0.79, - "learning_rate": 1.0278776633405066e-05, - "loss": 2.2293, - "step": 455550 - }, - { - "epoch": 0.79, - "learning_rate": 1.0277904693478238e-05, - "loss": 2.2899, - "step": 455560 - }, - { - "epoch": 0.79, - "learning_rate": 1.0277032753551412e-05, - "loss": 2.1769, - "step": 455570 - }, - { - "epoch": 0.79, - "learning_rate": 1.0276160813624584e-05, - "loss": 2.2893, - "step": 455580 - }, - { - "epoch": 0.79, - "learning_rate": 1.0275288873697758e-05, - "loss": 2.2664, - "step": 455590 - }, - { - "epoch": 0.79, - "learning_rate": 1.0274416933770932e-05, - "loss": 2.2969, - "step": 455600 - }, - { - "epoch": 0.79, - "learning_rate": 1.0273544993844104e-05, - "loss": 2.2321, - "step": 455610 - }, - { - "epoch": 0.79, - "learning_rate": 1.0272673053917278e-05, - "loss": 2.2864, - "step": 455620 - }, - { - "epoch": 0.79, - "learning_rate": 1.0271801113990451e-05, - "loss": 2.235, - "step": 455630 - }, - { - "epoch": 0.79, - "learning_rate": 1.0270929174063625e-05, - "loss": 2.2235, - "step": 455640 - }, - { - "epoch": 0.79, - "learning_rate": 1.0270057234136797e-05, - "loss": 2.2072, - "step": 455650 - }, - { - "epoch": 0.79, - "learning_rate": 1.0269185294209971e-05, - "loss": 2.2663, - "step": 455660 - }, - { - "epoch": 0.79, - "learning_rate": 1.0268313354283143e-05, - "loss": 2.3835, - "step": 455670 - }, - { - "epoch": 0.79, - "learning_rate": 1.0267441414356317e-05, - "loss": 2.3211, - "step": 455680 - }, - { - "epoch": 0.79, - "learning_rate": 1.0266569474429489e-05, - "loss": 2.3107, - "step": 455690 - }, - { - "epoch": 0.79, - "learning_rate": 1.0265697534502663e-05, - "loss": 2.1725, - "step": 455700 - }, - { - "epoch": 0.79, - "learning_rate": 1.0264825594575837e-05, - "loss": 2.2997, - "step": 455710 - }, - { - "epoch": 0.79, - "learning_rate": 1.026395365464901e-05, - "loss": 2.2006, - "step": 455720 - }, - { - "epoch": 0.79, - "learning_rate": 1.0263081714722184e-05, - "loss": 2.2786, - "step": 455730 - }, - { - "epoch": 0.79, - "learning_rate": 1.0262209774795356e-05, - "loss": 2.2797, - "step": 455740 - }, - { - "epoch": 0.79, - "learning_rate": 1.026133783486853e-05, - "loss": 2.2773, - "step": 455750 - }, - { - "epoch": 0.79, - "learning_rate": 1.0260465894941702e-05, - "loss": 2.3626, - "step": 455760 - }, - { - "epoch": 0.79, - "learning_rate": 1.0259593955014876e-05, - "loss": 2.4114, - "step": 455770 - }, - { - "epoch": 0.79, - "learning_rate": 1.0258722015088048e-05, - "loss": 2.2432, - "step": 455780 - }, - { - "epoch": 0.79, - "learning_rate": 1.0257850075161223e-05, - "loss": 2.332, - "step": 455790 - }, - { - "epoch": 0.79, - "learning_rate": 1.0256978135234395e-05, - "loss": 2.2243, - "step": 455800 - }, - { - "epoch": 0.79, - "learning_rate": 1.025610619530757e-05, - "loss": 2.2557, - "step": 455810 - }, - { - "epoch": 0.79, - "learning_rate": 1.0255234255380741e-05, - "loss": 2.2338, - "step": 455820 - }, - { - "epoch": 0.79, - "learning_rate": 1.0254362315453915e-05, - "loss": 2.1983, - "step": 455830 - }, - { - "epoch": 0.79, - "learning_rate": 1.0253490375527087e-05, - "loss": 2.3047, - "step": 455840 - }, - { - "epoch": 0.79, - "learning_rate": 1.0252618435600261e-05, - "loss": 2.2354, - "step": 455850 - }, - { - "epoch": 0.79, - "learning_rate": 1.0251746495673435e-05, - "loss": 2.3497, - "step": 455860 - }, - { - "epoch": 0.79, - "learning_rate": 1.0250874555746608e-05, - "loss": 2.2838, - "step": 455870 - }, - { - "epoch": 0.79, - "learning_rate": 1.0250002615819782e-05, - "loss": 2.2829, - "step": 455880 - }, - { - "epoch": 0.8, - "learning_rate": 1.0249130675892954e-05, - "loss": 2.2515, - "step": 455890 - }, - { - "epoch": 0.8, - "learning_rate": 1.0248258735966128e-05, - "loss": 2.3795, - "step": 455900 - }, - { - "epoch": 0.8, - "learning_rate": 1.02473867960393e-05, - "loss": 2.3264, - "step": 455910 - }, - { - "epoch": 0.8, - "learning_rate": 1.0246514856112474e-05, - "loss": 2.3261, - "step": 455920 - }, - { - "epoch": 0.8, - "learning_rate": 1.0245642916185646e-05, - "loss": 2.2902, - "step": 455930 - }, - { - "epoch": 0.8, - "learning_rate": 1.024477097625882e-05, - "loss": 2.3128, - "step": 455940 - }, - { - "epoch": 0.8, - "learning_rate": 1.0243899036331993e-05, - "loss": 2.375, - "step": 455950 - }, - { - "epoch": 0.8, - "learning_rate": 1.0243027096405167e-05, - "loss": 2.3436, - "step": 455960 - }, - { - "epoch": 0.8, - "learning_rate": 1.024215515647834e-05, - "loss": 2.2801, - "step": 455970 - }, - { - "epoch": 0.8, - "learning_rate": 1.0241283216551513e-05, - "loss": 2.2826, - "step": 455980 - }, - { - "epoch": 0.8, - "learning_rate": 1.0240411276624687e-05, - "loss": 2.2964, - "step": 455990 - }, - { - "epoch": 0.8, - "learning_rate": 1.0239539336697859e-05, - "loss": 2.3736, - "step": 456000 - }, - { - "epoch": 0.8, - "learning_rate": 1.0238667396771033e-05, - "loss": 2.271, - "step": 456010 - }, - { - "epoch": 0.8, - "learning_rate": 1.0237795456844205e-05, - "loss": 2.3297, - "step": 456020 - }, - { - "epoch": 0.8, - "learning_rate": 1.0236923516917379e-05, - "loss": 2.404, - "step": 456030 - }, - { - "epoch": 0.8, - "learning_rate": 1.0236051576990552e-05, - "loss": 2.4018, - "step": 456040 - }, - { - "epoch": 0.8, - "learning_rate": 1.0235179637063726e-05, - "loss": 2.2696, - "step": 456050 - }, - { - "epoch": 0.8, - "learning_rate": 1.0234307697136898e-05, - "loss": 2.3234, - "step": 456060 - }, - { - "epoch": 0.8, - "learning_rate": 1.0233435757210072e-05, - "loss": 2.3017, - "step": 456070 - }, - { - "epoch": 0.8, - "learning_rate": 1.0232563817283244e-05, - "loss": 2.2849, - "step": 456080 - }, - { - "epoch": 0.8, - "learning_rate": 1.0231691877356418e-05, - "loss": 2.3493, - "step": 456090 - }, - { - "epoch": 0.8, - "learning_rate": 1.0230819937429592e-05, - "loss": 2.2633, - "step": 456100 - }, - { - "epoch": 0.8, - "learning_rate": 1.0229947997502765e-05, - "loss": 2.32, - "step": 456110 - }, - { - "epoch": 0.8, - "learning_rate": 1.0229076057575939e-05, - "loss": 2.1316, - "step": 456120 - }, - { - "epoch": 0.8, - "learning_rate": 1.0228204117649111e-05, - "loss": 2.3321, - "step": 456130 - }, - { - "epoch": 0.8, - "learning_rate": 1.0227332177722285e-05, - "loss": 2.2818, - "step": 456140 - }, - { - "epoch": 0.8, - "learning_rate": 1.0226460237795457e-05, - "loss": 2.2615, - "step": 456150 - }, - { - "epoch": 0.8, - "learning_rate": 1.022558829786863e-05, - "loss": 2.3526, - "step": 456160 - }, - { - "epoch": 0.8, - "learning_rate": 1.0224716357941803e-05, - "loss": 2.3402, - "step": 456170 - }, - { - "epoch": 0.8, - "learning_rate": 1.0223844418014977e-05, - "loss": 2.2826, - "step": 456180 - }, - { - "epoch": 0.8, - "learning_rate": 1.022297247808815e-05, - "loss": 2.3186, - "step": 456190 - }, - { - "epoch": 0.8, - "learning_rate": 1.0222100538161324e-05, - "loss": 2.2036, - "step": 456200 - }, - { - "epoch": 0.8, - "learning_rate": 1.0221228598234496e-05, - "loss": 2.2488, - "step": 456210 - }, - { - "epoch": 0.8, - "learning_rate": 1.022035665830767e-05, - "loss": 2.3437, - "step": 456220 - }, - { - "epoch": 0.8, - "learning_rate": 1.0219484718380842e-05, - "loss": 2.214, - "step": 456230 - }, - { - "epoch": 0.8, - "learning_rate": 1.0218612778454016e-05, - "loss": 2.2569, - "step": 456240 - }, - { - "epoch": 0.8, - "learning_rate": 1.021774083852719e-05, - "loss": 2.214, - "step": 456250 - }, - { - "epoch": 0.8, - "learning_rate": 1.0216868898600362e-05, - "loss": 2.4505, - "step": 456260 - }, - { - "epoch": 0.8, - "learning_rate": 1.0215996958673535e-05, - "loss": 2.3328, - "step": 456270 - }, - { - "epoch": 0.8, - "learning_rate": 1.021512501874671e-05, - "loss": 2.2238, - "step": 456280 - }, - { - "epoch": 0.8, - "learning_rate": 1.0214253078819883e-05, - "loss": 2.3256, - "step": 456290 - }, - { - "epoch": 0.8, - "learning_rate": 1.0213381138893055e-05, - "loss": 2.2977, - "step": 456300 - }, - { - "epoch": 0.8, - "learning_rate": 1.0212509198966229e-05, - "loss": 2.281, - "step": 456310 - }, - { - "epoch": 0.8, - "learning_rate": 1.0211637259039401e-05, - "loss": 2.2134, - "step": 456320 - }, - { - "epoch": 0.8, - "learning_rate": 1.0210765319112575e-05, - "loss": 2.2763, - "step": 456330 - }, - { - "epoch": 0.8, - "learning_rate": 1.0209893379185747e-05, - "loss": 2.3005, - "step": 456340 - }, - { - "epoch": 0.8, - "learning_rate": 1.0209021439258922e-05, - "loss": 2.321, - "step": 456350 - }, - { - "epoch": 0.8, - "learning_rate": 1.0208149499332094e-05, - "loss": 2.2534, - "step": 456360 - }, - { - "epoch": 0.8, - "learning_rate": 1.0207277559405268e-05, - "loss": 2.2804, - "step": 456370 - }, - { - "epoch": 0.8, - "learning_rate": 1.0206405619478442e-05, - "loss": 2.3103, - "step": 456380 - }, - { - "epoch": 0.8, - "learning_rate": 1.0205533679551614e-05, - "loss": 2.2577, - "step": 456390 - }, - { - "epoch": 0.8, - "learning_rate": 1.0204661739624788e-05, - "loss": 2.3658, - "step": 456400 - }, - { - "epoch": 0.8, - "learning_rate": 1.020378979969796e-05, - "loss": 2.3513, - "step": 456410 - }, - { - "epoch": 0.8, - "learning_rate": 1.0202917859771134e-05, - "loss": 2.3178, - "step": 456420 - }, - { - "epoch": 0.8, - "learning_rate": 1.0202045919844307e-05, - "loss": 2.3019, - "step": 456430 - }, - { - "epoch": 0.8, - "learning_rate": 1.0201173979917481e-05, - "loss": 2.2501, - "step": 456440 - }, - { - "epoch": 0.8, - "learning_rate": 1.0200302039990653e-05, - "loss": 2.2567, - "step": 456450 - }, - { - "epoch": 0.8, - "learning_rate": 1.0199430100063827e-05, - "loss": 2.339, - "step": 456460 - }, - { - "epoch": 0.8, - "learning_rate": 1.0198558160136999e-05, - "loss": 2.3375, - "step": 456470 - }, - { - "epoch": 0.8, - "learning_rate": 1.0197686220210173e-05, - "loss": 2.2499, - "step": 456480 - }, - { - "epoch": 0.8, - "learning_rate": 1.0196814280283345e-05, - "loss": 2.1961, - "step": 456490 - }, - { - "epoch": 0.8, - "learning_rate": 1.0195942340356519e-05, - "loss": 2.2849, - "step": 456500 - }, - { - "epoch": 0.8, - "learning_rate": 1.0195070400429692e-05, - "loss": 2.2554, - "step": 456510 - }, - { - "epoch": 0.8, - "learning_rate": 1.0194198460502866e-05, - "loss": 2.4108, - "step": 456520 - }, - { - "epoch": 0.8, - "learning_rate": 1.019332652057604e-05, - "loss": 2.2612, - "step": 456530 - }, - { - "epoch": 0.8, - "learning_rate": 1.0192454580649212e-05, - "loss": 2.2284, - "step": 456540 - }, - { - "epoch": 0.8, - "learning_rate": 1.0191582640722386e-05, - "loss": 2.3868, - "step": 456550 - }, - { - "epoch": 0.8, - "learning_rate": 1.0190710700795558e-05, - "loss": 2.2374, - "step": 456560 - }, - { - "epoch": 0.8, - "learning_rate": 1.0189838760868732e-05, - "loss": 2.2217, - "step": 456570 - }, - { - "epoch": 0.8, - "learning_rate": 1.0188966820941904e-05, - "loss": 2.3317, - "step": 456580 - }, - { - "epoch": 0.8, - "learning_rate": 1.018809488101508e-05, - "loss": 2.2325, - "step": 456590 - }, - { - "epoch": 0.8, - "learning_rate": 1.0187222941088251e-05, - "loss": 2.4173, - "step": 456600 - }, - { - "epoch": 0.8, - "learning_rate": 1.0186351001161425e-05, - "loss": 2.3532, - "step": 456610 - }, - { - "epoch": 0.8, - "learning_rate": 1.0185479061234597e-05, - "loss": 2.1998, - "step": 456620 - }, - { - "epoch": 0.8, - "learning_rate": 1.0184607121307771e-05, - "loss": 2.1966, - "step": 456630 - }, - { - "epoch": 0.8, - "learning_rate": 1.0183735181380943e-05, - "loss": 2.373, - "step": 456640 - }, - { - "epoch": 0.8, - "learning_rate": 1.0182863241454117e-05, - "loss": 2.2637, - "step": 456650 - }, - { - "epoch": 0.8, - "learning_rate": 1.018199130152729e-05, - "loss": 2.2134, - "step": 456660 - }, - { - "epoch": 0.8, - "learning_rate": 1.0181119361600464e-05, - "loss": 2.3778, - "step": 456670 - }, - { - "epoch": 0.8, - "learning_rate": 1.0180247421673638e-05, - "loss": 2.3773, - "step": 456680 - }, - { - "epoch": 0.8, - "learning_rate": 1.017937548174681e-05, - "loss": 2.2001, - "step": 456690 - }, - { - "epoch": 0.8, - "learning_rate": 1.0178503541819984e-05, - "loss": 2.2764, - "step": 456700 - }, - { - "epoch": 0.8, - "learning_rate": 1.0177631601893156e-05, - "loss": 2.2621, - "step": 456710 - }, - { - "epoch": 0.8, - "learning_rate": 1.017675966196633e-05, - "loss": 2.1777, - "step": 456720 - }, - { - "epoch": 0.8, - "learning_rate": 1.0175887722039502e-05, - "loss": 2.2171, - "step": 456730 - }, - { - "epoch": 0.8, - "learning_rate": 1.0175015782112676e-05, - "loss": 2.2904, - "step": 456740 - }, - { - "epoch": 0.8, - "learning_rate": 1.017414384218585e-05, - "loss": 2.4294, - "step": 456750 - }, - { - "epoch": 0.8, - "learning_rate": 1.0173271902259023e-05, - "loss": 2.3357, - "step": 456760 - }, - { - "epoch": 0.8, - "learning_rate": 1.0172399962332195e-05, - "loss": 2.2069, - "step": 456770 - }, - { - "epoch": 0.8, - "learning_rate": 1.0171528022405369e-05, - "loss": 2.3238, - "step": 456780 - }, - { - "epoch": 0.8, - "learning_rate": 1.0170656082478543e-05, - "loss": 2.2988, - "step": 456790 - }, - { - "epoch": 0.8, - "learning_rate": 1.0169784142551715e-05, - "loss": 2.1942, - "step": 456800 - }, - { - "epoch": 0.8, - "learning_rate": 1.0168912202624889e-05, - "loss": 2.2448, - "step": 456810 - }, - { - "epoch": 0.8, - "learning_rate": 1.016804026269806e-05, - "loss": 2.3814, - "step": 456820 - }, - { - "epoch": 0.8, - "learning_rate": 1.0167168322771236e-05, - "loss": 2.4019, - "step": 456830 - }, - { - "epoch": 0.8, - "learning_rate": 1.0166296382844408e-05, - "loss": 2.2615, - "step": 456840 - }, - { - "epoch": 0.8, - "learning_rate": 1.0165424442917582e-05, - "loss": 2.2266, - "step": 456850 - }, - { - "epoch": 0.8, - "learning_rate": 1.0164552502990754e-05, - "loss": 2.2027, - "step": 456860 - }, - { - "epoch": 0.8, - "learning_rate": 1.0163680563063928e-05, - "loss": 2.3064, - "step": 456870 - }, - { - "epoch": 0.8, - "learning_rate": 1.01628086231371e-05, - "loss": 2.2205, - "step": 456880 - }, - { - "epoch": 0.8, - "learning_rate": 1.0161936683210274e-05, - "loss": 2.1588, - "step": 456890 - }, - { - "epoch": 0.8, - "learning_rate": 1.0161064743283447e-05, - "loss": 2.3081, - "step": 456900 - }, - { - "epoch": 0.8, - "learning_rate": 1.0160192803356621e-05, - "loss": 2.2436, - "step": 456910 - }, - { - "epoch": 0.8, - "learning_rate": 1.0159320863429795e-05, - "loss": 2.2165, - "step": 456920 - }, - { - "epoch": 0.8, - "learning_rate": 1.0158448923502967e-05, - "loss": 2.2916, - "step": 456930 - }, - { - "epoch": 0.8, - "learning_rate": 1.015757698357614e-05, - "loss": 2.1819, - "step": 456940 - }, - { - "epoch": 0.8, - "learning_rate": 1.0156705043649313e-05, - "loss": 2.2934, - "step": 456950 - }, - { - "epoch": 0.8, - "learning_rate": 1.0155833103722487e-05, - "loss": 2.287, - "step": 456960 - }, - { - "epoch": 0.8, - "learning_rate": 1.0154961163795659e-05, - "loss": 2.278, - "step": 456970 - }, - { - "epoch": 0.8, - "learning_rate": 1.0154089223868832e-05, - "loss": 2.1921, - "step": 456980 - }, - { - "epoch": 0.8, - "learning_rate": 1.0153217283942006e-05, - "loss": 2.2831, - "step": 456990 - }, - { - "epoch": 0.8, - "learning_rate": 1.015234534401518e-05, - "loss": 2.1598, - "step": 457000 - }, - { - "epoch": 0.8, - "learning_rate": 1.0151473404088352e-05, - "loss": 2.156, - "step": 457010 - }, - { - "epoch": 0.8, - "learning_rate": 1.0150601464161526e-05, - "loss": 2.2436, - "step": 457020 - }, - { - "epoch": 0.8, - "learning_rate": 1.0149729524234698e-05, - "loss": 2.3272, - "step": 457030 - }, - { - "epoch": 0.8, - "learning_rate": 1.0148857584307872e-05, - "loss": 2.1464, - "step": 457040 - }, - { - "epoch": 0.8, - "learning_rate": 1.0147985644381045e-05, - "loss": 2.4018, - "step": 457050 - }, - { - "epoch": 0.8, - "learning_rate": 1.0147113704454218e-05, - "loss": 2.2389, - "step": 457060 - }, - { - "epoch": 0.8, - "learning_rate": 1.0146241764527391e-05, - "loss": 2.3816, - "step": 457070 - }, - { - "epoch": 0.8, - "learning_rate": 1.0145369824600565e-05, - "loss": 2.3573, - "step": 457080 - }, - { - "epoch": 0.8, - "learning_rate": 1.0144497884673739e-05, - "loss": 2.2781, - "step": 457090 - }, - { - "epoch": 0.8, - "learning_rate": 1.0143625944746911e-05, - "loss": 2.3567, - "step": 457100 - }, - { - "epoch": 0.8, - "learning_rate": 1.0142754004820085e-05, - "loss": 2.2553, - "step": 457110 - }, - { - "epoch": 0.8, - "learning_rate": 1.0141882064893257e-05, - "loss": 2.3246, - "step": 457120 - }, - { - "epoch": 0.8, - "learning_rate": 1.014101012496643e-05, - "loss": 2.3476, - "step": 457130 - }, - { - "epoch": 0.8, - "learning_rate": 1.0140138185039604e-05, - "loss": 2.3082, - "step": 457140 - }, - { - "epoch": 0.8, - "learning_rate": 1.0139266245112778e-05, - "loss": 2.2878, - "step": 457150 - }, - { - "epoch": 0.8, - "learning_rate": 1.013839430518595e-05, - "loss": 2.2959, - "step": 457160 - }, - { - "epoch": 0.8, - "learning_rate": 1.0137522365259124e-05, - "loss": 2.3426, - "step": 457170 - }, - { - "epoch": 0.8, - "learning_rate": 1.0136650425332298e-05, - "loss": 2.3728, - "step": 457180 - }, - { - "epoch": 0.8, - "learning_rate": 1.013577848540547e-05, - "loss": 2.3496, - "step": 457190 - }, - { - "epoch": 0.8, - "learning_rate": 1.0134906545478644e-05, - "loss": 2.3535, - "step": 457200 - }, - { - "epoch": 0.8, - "learning_rate": 1.0134034605551816e-05, - "loss": 2.2799, - "step": 457210 - }, - { - "epoch": 0.8, - "learning_rate": 1.013316266562499e-05, - "loss": 2.2267, - "step": 457220 - }, - { - "epoch": 0.8, - "learning_rate": 1.0132290725698163e-05, - "loss": 2.3898, - "step": 457230 - }, - { - "epoch": 0.8, - "learning_rate": 1.0131418785771337e-05, - "loss": 2.353, - "step": 457240 - }, - { - "epoch": 0.8, - "learning_rate": 1.0130546845844509e-05, - "loss": 2.1921, - "step": 457250 - }, - { - "epoch": 0.8, - "learning_rate": 1.0129674905917683e-05, - "loss": 2.1977, - "step": 457260 - }, - { - "epoch": 0.8, - "learning_rate": 1.0128802965990855e-05, - "loss": 2.2127, - "step": 457270 - }, - { - "epoch": 0.8, - "learning_rate": 1.0127931026064029e-05, - "loss": 2.2541, - "step": 457280 - }, - { - "epoch": 0.8, - "learning_rate": 1.01270590861372e-05, - "loss": 2.3327, - "step": 457290 - }, - { - "epoch": 0.8, - "learning_rate": 1.0126187146210374e-05, - "loss": 2.3581, - "step": 457300 - }, - { - "epoch": 0.8, - "learning_rate": 1.0125315206283548e-05, - "loss": 2.1413, - "step": 457310 - }, - { - "epoch": 0.8, - "learning_rate": 1.0124443266356722e-05, - "loss": 2.1325, - "step": 457320 - }, - { - "epoch": 0.8, - "learning_rate": 1.0123571326429896e-05, - "loss": 2.3, - "step": 457330 - }, - { - "epoch": 0.8, - "learning_rate": 1.0122699386503068e-05, - "loss": 2.3582, - "step": 457340 - }, - { - "epoch": 0.8, - "learning_rate": 1.0121827446576242e-05, - "loss": 2.2801, - "step": 457350 - }, - { - "epoch": 0.8, - "learning_rate": 1.0120955506649414e-05, - "loss": 2.2628, - "step": 457360 - }, - { - "epoch": 0.8, - "learning_rate": 1.0120083566722587e-05, - "loss": 2.2705, - "step": 457370 - }, - { - "epoch": 0.8, - "learning_rate": 1.011921162679576e-05, - "loss": 2.1547, - "step": 457380 - }, - { - "epoch": 0.8, - "learning_rate": 1.0118339686868935e-05, - "loss": 2.4016, - "step": 457390 - }, - { - "epoch": 0.8, - "learning_rate": 1.0117467746942107e-05, - "loss": 2.2526, - "step": 457400 - }, - { - "epoch": 0.8, - "learning_rate": 1.0116595807015281e-05, - "loss": 2.3333, - "step": 457410 - }, - { - "epoch": 0.8, - "learning_rate": 1.0115723867088453e-05, - "loss": 2.2813, - "step": 457420 - }, - { - "epoch": 0.8, - "learning_rate": 1.0114851927161627e-05, - "loss": 2.2581, - "step": 457430 - }, - { - "epoch": 0.8, - "learning_rate": 1.0113979987234799e-05, - "loss": 2.3778, - "step": 457440 - }, - { - "epoch": 0.8, - "learning_rate": 1.0113108047307973e-05, - "loss": 2.3536, - "step": 457450 - }, - { - "epoch": 0.8, - "learning_rate": 1.0112236107381146e-05, - "loss": 2.3413, - "step": 457460 - }, - { - "epoch": 0.8, - "learning_rate": 1.011136416745432e-05, - "loss": 2.2367, - "step": 457470 - }, - { - "epoch": 0.8, - "learning_rate": 1.0110492227527494e-05, - "loss": 2.2759, - "step": 457480 - }, - { - "epoch": 0.8, - "learning_rate": 1.0109620287600666e-05, - "loss": 2.3587, - "step": 457490 - }, - { - "epoch": 0.8, - "learning_rate": 1.010874834767384e-05, - "loss": 2.3707, - "step": 457500 - }, - { - "epoch": 0.8, - "learning_rate": 1.0107876407747012e-05, - "loss": 2.3099, - "step": 457510 - }, - { - "epoch": 0.8, - "learning_rate": 1.0107004467820186e-05, - "loss": 2.3616, - "step": 457520 - }, - { - "epoch": 0.8, - "learning_rate": 1.0106132527893358e-05, - "loss": 2.2816, - "step": 457530 - }, - { - "epoch": 0.8, - "learning_rate": 1.0105260587966531e-05, - "loss": 2.2066, - "step": 457540 - }, - { - "epoch": 0.8, - "learning_rate": 1.0104388648039705e-05, - "loss": 2.3049, - "step": 457550 - }, - { - "epoch": 0.8, - "learning_rate": 1.0103516708112879e-05, - "loss": 2.3138, - "step": 457560 - }, - { - "epoch": 0.8, - "learning_rate": 1.0102644768186051e-05, - "loss": 2.3393, - "step": 457570 - }, - { - "epoch": 0.8, - "learning_rate": 1.0101772828259225e-05, - "loss": 2.3993, - "step": 457580 - }, - { - "epoch": 0.8, - "learning_rate": 1.0100900888332399e-05, - "loss": 2.2408, - "step": 457590 - }, - { - "epoch": 0.8, - "learning_rate": 1.010002894840557e-05, - "loss": 2.2718, - "step": 457600 - }, - { - "epoch": 0.8, - "learning_rate": 1.0099157008478744e-05, - "loss": 2.1689, - "step": 457610 - }, - { - "epoch": 0.8, - "learning_rate": 1.0098285068551916e-05, - "loss": 2.1708, - "step": 457620 - }, - { - "epoch": 0.8, - "learning_rate": 1.0097413128625092e-05, - "loss": 2.3301, - "step": 457630 - }, - { - "epoch": 0.8, - "learning_rate": 1.0096541188698264e-05, - "loss": 2.2453, - "step": 457640 - }, - { - "epoch": 0.8, - "learning_rate": 1.0095669248771438e-05, - "loss": 2.3494, - "step": 457650 - }, - { - "epoch": 0.8, - "learning_rate": 1.009479730884461e-05, - "loss": 2.1454, - "step": 457660 - }, - { - "epoch": 0.8, - "learning_rate": 1.0093925368917784e-05, - "loss": 2.3022, - "step": 457670 - }, - { - "epoch": 0.8, - "learning_rate": 1.0093053428990956e-05, - "loss": 2.3147, - "step": 457680 - }, - { - "epoch": 0.8, - "learning_rate": 1.009218148906413e-05, - "loss": 2.2131, - "step": 457690 - }, - { - "epoch": 0.8, - "learning_rate": 1.0091309549137303e-05, - "loss": 2.2225, - "step": 457700 - }, - { - "epoch": 0.8, - "learning_rate": 1.0090437609210477e-05, - "loss": 2.19, - "step": 457710 - }, - { - "epoch": 0.8, - "learning_rate": 1.008956566928365e-05, - "loss": 2.3567, - "step": 457720 - }, - { - "epoch": 0.8, - "learning_rate": 1.0088693729356823e-05, - "loss": 2.2101, - "step": 457730 - }, - { - "epoch": 0.8, - "learning_rate": 1.0087821789429997e-05, - "loss": 2.3761, - "step": 457740 - }, - { - "epoch": 0.8, - "learning_rate": 1.0086949849503169e-05, - "loss": 2.2063, - "step": 457750 - }, - { - "epoch": 0.8, - "learning_rate": 1.0086077909576342e-05, - "loss": 2.3801, - "step": 457760 - }, - { - "epoch": 0.8, - "learning_rate": 1.0085205969649515e-05, - "loss": 2.3444, - "step": 457770 - }, - { - "epoch": 0.8, - "learning_rate": 1.0084334029722688e-05, - "loss": 2.2795, - "step": 457780 - }, - { - "epoch": 0.8, - "learning_rate": 1.0083462089795862e-05, - "loss": 2.1985, - "step": 457790 - }, - { - "epoch": 0.8, - "learning_rate": 1.0082590149869036e-05, - "loss": 2.2211, - "step": 457800 - }, - { - "epoch": 0.8, - "learning_rate": 1.0081718209942208e-05, - "loss": 2.2929, - "step": 457810 - }, - { - "epoch": 0.8, - "learning_rate": 1.0080846270015382e-05, - "loss": 2.3386, - "step": 457820 - }, - { - "epoch": 0.8, - "learning_rate": 1.0079974330088554e-05, - "loss": 2.2618, - "step": 457830 - }, - { - "epoch": 0.8, - "learning_rate": 1.0079102390161728e-05, - "loss": 2.1884, - "step": 457840 - }, - { - "epoch": 0.8, - "learning_rate": 1.0078230450234901e-05, - "loss": 2.2534, - "step": 457850 - }, - { - "epoch": 0.8, - "learning_rate": 1.0077358510308073e-05, - "loss": 2.3501, - "step": 457860 - }, - { - "epoch": 0.8, - "learning_rate": 1.0076486570381249e-05, - "loss": 2.1807, - "step": 457870 - }, - { - "epoch": 0.8, - "learning_rate": 1.0075614630454421e-05, - "loss": 2.2635, - "step": 457880 - }, - { - "epoch": 0.8, - "learning_rate": 1.0074742690527595e-05, - "loss": 2.3627, - "step": 457890 - }, - { - "epoch": 0.8, - "learning_rate": 1.0073870750600767e-05, - "loss": 2.236, - "step": 457900 - }, - { - "epoch": 0.8, - "learning_rate": 1.007299881067394e-05, - "loss": 2.1729, - "step": 457910 - }, - { - "epoch": 0.8, - "learning_rate": 1.0072126870747113e-05, - "loss": 2.2908, - "step": 457920 - }, - { - "epoch": 0.8, - "learning_rate": 1.0071254930820286e-05, - "loss": 2.3901, - "step": 457930 - }, - { - "epoch": 0.8, - "learning_rate": 1.007038299089346e-05, - "loss": 2.3614, - "step": 457940 - }, - { - "epoch": 0.8, - "learning_rate": 1.0069511050966634e-05, - "loss": 2.2896, - "step": 457950 - }, - { - "epoch": 0.8, - "learning_rate": 1.0068639111039806e-05, - "loss": 2.2317, - "step": 457960 - }, - { - "epoch": 0.8, - "learning_rate": 1.006776717111298e-05, - "loss": 2.4015, - "step": 457970 - }, - { - "epoch": 0.8, - "learning_rate": 1.0066895231186154e-05, - "loss": 2.1717, - "step": 457980 - }, - { - "epoch": 0.8, - "learning_rate": 1.0066023291259326e-05, - "loss": 2.3586, - "step": 457990 - }, - { - "epoch": 0.8, - "learning_rate": 1.00651513513325e-05, - "loss": 2.2567, - "step": 458000 - }, - { - "epoch": 0.8, - "learning_rate": 1.0064279411405671e-05, - "loss": 2.3111, - "step": 458010 - }, - { - "epoch": 0.8, - "learning_rate": 1.0063407471478845e-05, - "loss": 2.2909, - "step": 458020 - }, - { - "epoch": 0.8, - "learning_rate": 1.0062535531552019e-05, - "loss": 2.324, - "step": 458030 - }, - { - "epoch": 0.8, - "learning_rate": 1.0061663591625193e-05, - "loss": 2.2165, - "step": 458040 - }, - { - "epoch": 0.8, - "learning_rate": 1.0060791651698365e-05, - "loss": 2.267, - "step": 458050 - }, - { - "epoch": 0.8, - "learning_rate": 1.0059919711771539e-05, - "loss": 2.4236, - "step": 458060 - }, - { - "epoch": 0.8, - "learning_rate": 1.005904777184471e-05, - "loss": 2.3693, - "step": 458070 - }, - { - "epoch": 0.8, - "learning_rate": 1.0058175831917884e-05, - "loss": 2.2432, - "step": 458080 - }, - { - "epoch": 0.8, - "learning_rate": 1.0057303891991057e-05, - "loss": 2.2693, - "step": 458090 - }, - { - "epoch": 0.8, - "learning_rate": 1.005643195206423e-05, - "loss": 2.3034, - "step": 458100 - }, - { - "epoch": 0.8, - "learning_rate": 1.0055560012137404e-05, - "loss": 2.3461, - "step": 458110 - }, - { - "epoch": 0.8, - "learning_rate": 1.0054688072210578e-05, - "loss": 2.3826, - "step": 458120 - }, - { - "epoch": 0.8, - "learning_rate": 1.0053816132283752e-05, - "loss": 2.2949, - "step": 458130 - }, - { - "epoch": 0.8, - "learning_rate": 1.0052944192356924e-05, - "loss": 2.2529, - "step": 458140 - }, - { - "epoch": 0.8, - "learning_rate": 1.0052072252430097e-05, - "loss": 2.3531, - "step": 458150 - }, - { - "epoch": 0.8, - "learning_rate": 1.005120031250327e-05, - "loss": 2.1888, - "step": 458160 - }, - { - "epoch": 0.8, - "learning_rate": 1.0050328372576443e-05, - "loss": 2.2133, - "step": 458170 - }, - { - "epoch": 0.8, - "learning_rate": 1.0049456432649617e-05, - "loss": 2.2132, - "step": 458180 - }, - { - "epoch": 0.8, - "learning_rate": 1.0048584492722791e-05, - "loss": 2.2863, - "step": 458190 - }, - { - "epoch": 0.8, - "learning_rate": 1.0047712552795963e-05, - "loss": 2.1705, - "step": 458200 - }, - { - "epoch": 0.8, - "learning_rate": 1.0046840612869137e-05, - "loss": 2.3012, - "step": 458210 - }, - { - "epoch": 0.8, - "learning_rate": 1.0045968672942309e-05, - "loss": 2.2875, - "step": 458220 - }, - { - "epoch": 0.8, - "learning_rate": 1.0045096733015483e-05, - "loss": 2.3942, - "step": 458230 - }, - { - "epoch": 0.8, - "learning_rate": 1.0044224793088655e-05, - "loss": 2.2993, - "step": 458240 - }, - { - "epoch": 0.8, - "learning_rate": 1.0043352853161828e-05, - "loss": 2.3151, - "step": 458250 - }, - { - "epoch": 0.8, - "learning_rate": 1.0042480913235002e-05, - "loss": 2.231, - "step": 458260 - }, - { - "epoch": 0.8, - "learning_rate": 1.0041608973308176e-05, - "loss": 2.203, - "step": 458270 - }, - { - "epoch": 0.8, - "learning_rate": 1.004073703338135e-05, - "loss": 2.3102, - "step": 458280 - }, - { - "epoch": 0.8, - "learning_rate": 1.0039865093454522e-05, - "loss": 2.1522, - "step": 458290 - }, - { - "epoch": 0.8, - "learning_rate": 1.0038993153527696e-05, - "loss": 2.3514, - "step": 458300 - }, - { - "epoch": 0.8, - "learning_rate": 1.0038121213600868e-05, - "loss": 2.3091, - "step": 458310 - }, - { - "epoch": 0.8, - "learning_rate": 1.0037249273674041e-05, - "loss": 2.1504, - "step": 458320 - }, - { - "epoch": 0.8, - "learning_rate": 1.0036377333747213e-05, - "loss": 2.3445, - "step": 458330 - }, - { - "epoch": 0.8, - "learning_rate": 1.0035505393820387e-05, - "loss": 2.3288, - "step": 458340 - }, - { - "epoch": 0.8, - "learning_rate": 1.0034633453893561e-05, - "loss": 2.2515, - "step": 458350 - }, - { - "epoch": 0.8, - "learning_rate": 1.0033761513966735e-05, - "loss": 2.327, - "step": 458360 - }, - { - "epoch": 0.8, - "learning_rate": 1.0032889574039907e-05, - "loss": 2.3173, - "step": 458370 - }, - { - "epoch": 0.8, - "learning_rate": 1.003201763411308e-05, - "loss": 2.1925, - "step": 458380 - }, - { - "epoch": 0.8, - "learning_rate": 1.0031145694186254e-05, - "loss": 2.2726, - "step": 458390 - }, - { - "epoch": 0.8, - "learning_rate": 1.0030273754259427e-05, - "loss": 2.2427, - "step": 458400 - }, - { - "epoch": 0.8, - "learning_rate": 1.00294018143326e-05, - "loss": 2.2935, - "step": 458410 - }, - { - "epoch": 0.8, - "learning_rate": 1.0028529874405772e-05, - "loss": 2.2865, - "step": 458420 - }, - { - "epoch": 0.8, - "learning_rate": 1.0027657934478948e-05, - "loss": 2.3111, - "step": 458430 - }, - { - "epoch": 0.8, - "learning_rate": 1.002678599455212e-05, - "loss": 2.2273, - "step": 458440 - }, - { - "epoch": 0.8, - "learning_rate": 1.0025914054625294e-05, - "loss": 2.3415, - "step": 458450 - }, - { - "epoch": 0.8, - "learning_rate": 1.0025042114698466e-05, - "loss": 2.3635, - "step": 458460 - }, - { - "epoch": 0.8, - "learning_rate": 1.002417017477164e-05, - "loss": 2.3311, - "step": 458470 - }, - { - "epoch": 0.8, - "learning_rate": 1.0023298234844812e-05, - "loss": 2.2854, - "step": 458480 - }, - { - "epoch": 0.8, - "learning_rate": 1.0022426294917985e-05, - "loss": 2.3056, - "step": 458490 - }, - { - "epoch": 0.8, - "learning_rate": 1.0021554354991159e-05, - "loss": 2.241, - "step": 458500 - }, - { - "epoch": 0.8, - "learning_rate": 1.0020682415064333e-05, - "loss": 2.3025, - "step": 458510 - }, - { - "epoch": 0.8, - "learning_rate": 1.0019810475137507e-05, - "loss": 2.2092, - "step": 458520 - }, - { - "epoch": 0.8, - "learning_rate": 1.0018938535210679e-05, - "loss": 2.3765, - "step": 458530 - }, - { - "epoch": 0.8, - "learning_rate": 1.0018066595283853e-05, - "loss": 2.1046, - "step": 458540 - }, - { - "epoch": 0.8, - "learning_rate": 1.0017194655357025e-05, - "loss": 2.3204, - "step": 458550 - }, - { - "epoch": 0.8, - "learning_rate": 1.0016322715430198e-05, - "loss": 2.2965, - "step": 458560 - }, - { - "epoch": 0.8, - "learning_rate": 1.001545077550337e-05, - "loss": 2.1909, - "step": 458570 - }, - { - "epoch": 0.8, - "learning_rate": 1.0014578835576544e-05, - "loss": 2.3328, - "step": 458580 - }, - { - "epoch": 0.8, - "learning_rate": 1.0013706895649718e-05, - "loss": 2.3678, - "step": 458590 - }, - { - "epoch": 0.8, - "learning_rate": 1.0012834955722892e-05, - "loss": 2.1684, - "step": 458600 - }, - { - "epoch": 0.8, - "learning_rate": 1.0011963015796064e-05, - "loss": 2.3882, - "step": 458610 - }, - { - "epoch": 0.8, - "learning_rate": 1.0011091075869238e-05, - "loss": 2.3761, - "step": 458620 - }, - { - "epoch": 0.8, - "learning_rate": 1.001021913594241e-05, - "loss": 2.3699, - "step": 458630 - }, - { - "epoch": 0.8, - "learning_rate": 1.0009347196015583e-05, - "loss": 2.2884, - "step": 458640 - }, - { - "epoch": 0.8, - "learning_rate": 1.0008475256088757e-05, - "loss": 2.2661, - "step": 458650 - }, - { - "epoch": 0.8, - "learning_rate": 1.000760331616193e-05, - "loss": 2.2008, - "step": 458660 - }, - { - "epoch": 0.8, - "learning_rate": 1.0006731376235105e-05, - "loss": 2.387, - "step": 458670 - }, - { - "epoch": 0.8, - "learning_rate": 1.0005859436308277e-05, - "loss": 2.1805, - "step": 458680 - }, - { - "epoch": 0.8, - "learning_rate": 1.000498749638145e-05, - "loss": 2.3639, - "step": 458690 - }, - { - "epoch": 0.8, - "learning_rate": 1.0004115556454623e-05, - "loss": 2.3196, - "step": 458700 - }, - { - "epoch": 0.8, - "learning_rate": 1.0003243616527796e-05, - "loss": 2.1667, - "step": 458710 - }, - { - "epoch": 0.8, - "learning_rate": 1.0002371676600969e-05, - "loss": 2.2237, - "step": 458720 - }, - { - "epoch": 0.8, - "learning_rate": 1.0001499736674142e-05, - "loss": 2.3328, - "step": 458730 - }, - { - "epoch": 0.8, - "learning_rate": 1.0000627796747316e-05, - "loss": 2.2116, - "step": 458740 - }, - { - "epoch": 0.8, - "learning_rate": 9.99975585682049e-06, - "loss": 2.3603, - "step": 458750 - }, - { - "epoch": 0.8, - "learning_rate": 9.998883916893662e-06, - "loss": 2.2597, - "step": 458760 - }, - { - "epoch": 0.8, - "learning_rate": 9.998011976966836e-06, - "loss": 2.3841, - "step": 458770 - }, - { - "epoch": 0.8, - "learning_rate": 9.99714003704001e-06, - "loss": 2.3041, - "step": 458780 - }, - { - "epoch": 0.8, - "learning_rate": 9.996268097113182e-06, - "loss": 2.2805, - "step": 458790 - }, - { - "epoch": 0.8, - "learning_rate": 9.995396157186355e-06, - "loss": 2.1132, - "step": 458800 - }, - { - "epoch": 0.8, - "learning_rate": 9.994524217259527e-06, - "loss": 2.3801, - "step": 458810 - }, - { - "epoch": 0.8, - "learning_rate": 9.993652277332701e-06, - "loss": 2.2965, - "step": 458820 - }, - { - "epoch": 0.8, - "learning_rate": 9.992780337405875e-06, - "loss": 2.2712, - "step": 458830 - }, - { - "epoch": 0.8, - "learning_rate": 9.991908397479049e-06, - "loss": 2.2052, - "step": 458840 - }, - { - "epoch": 0.8, - "learning_rate": 9.99103645755222e-06, - "loss": 2.3493, - "step": 458850 - }, - { - "epoch": 0.8, - "learning_rate": 9.990164517625395e-06, - "loss": 2.2523, - "step": 458860 - }, - { - "epoch": 0.8, - "learning_rate": 9.989292577698567e-06, - "loss": 2.1716, - "step": 458870 - }, - { - "epoch": 0.8, - "learning_rate": 9.98842063777174e-06, - "loss": 2.2131, - "step": 458880 - }, - { - "epoch": 0.8, - "learning_rate": 9.987548697844912e-06, - "loss": 2.181, - "step": 458890 - }, - { - "epoch": 0.8, - "learning_rate": 9.986676757918086e-06, - "loss": 2.3255, - "step": 458900 - }, - { - "epoch": 0.8, - "learning_rate": 9.985804817991262e-06, - "loss": 2.2251, - "step": 458910 - }, - { - "epoch": 0.8, - "learning_rate": 9.984932878064434e-06, - "loss": 2.3024, - "step": 458920 - }, - { - "epoch": 0.8, - "learning_rate": 9.984060938137608e-06, - "loss": 2.2322, - "step": 458930 - }, - { - "epoch": 0.8, - "learning_rate": 9.98318899821078e-06, - "loss": 2.2235, - "step": 458940 - }, - { - "epoch": 0.8, - "learning_rate": 9.982317058283953e-06, - "loss": 2.3719, - "step": 458950 - }, - { - "epoch": 0.8, - "learning_rate": 9.981445118357125e-06, - "loss": 2.2881, - "step": 458960 - }, - { - "epoch": 0.8, - "learning_rate": 9.9805731784303e-06, - "loss": 2.223, - "step": 458970 - }, - { - "epoch": 0.8, - "learning_rate": 9.979701238503473e-06, - "loss": 2.2339, - "step": 458980 - }, - { - "epoch": 0.8, - "learning_rate": 9.978829298576647e-06, - "loss": 2.1285, - "step": 458990 - }, - { - "epoch": 0.8, - "learning_rate": 9.977957358649819e-06, - "loss": 2.3414, - "step": 459000 - }, - { - "epoch": 0.8, - "learning_rate": 9.977085418722993e-06, - "loss": 2.2691, - "step": 459010 - }, - { - "epoch": 0.8, - "learning_rate": 9.976213478796165e-06, - "loss": 2.3539, - "step": 459020 - }, - { - "epoch": 0.8, - "learning_rate": 9.975341538869338e-06, - "loss": 2.2187, - "step": 459030 - }, - { - "epoch": 0.8, - "learning_rate": 9.974469598942512e-06, - "loss": 2.2154, - "step": 459040 - }, - { - "epoch": 0.8, - "learning_rate": 9.973597659015684e-06, - "loss": 2.2027, - "step": 459050 - }, - { - "epoch": 0.8, - "learning_rate": 9.972725719088858e-06, - "loss": 2.289, - "step": 459060 - }, - { - "epoch": 0.8, - "learning_rate": 9.971853779162032e-06, - "loss": 2.2903, - "step": 459070 - }, - { - "epoch": 0.8, - "learning_rate": 9.970981839235206e-06, - "loss": 2.2789, - "step": 459080 - }, - { - "epoch": 0.8, - "learning_rate": 9.970109899308378e-06, - "loss": 2.1605, - "step": 459090 - }, - { - "epoch": 0.8, - "learning_rate": 9.969237959381551e-06, - "loss": 2.2421, - "step": 459100 - }, - { - "epoch": 0.8, - "learning_rate": 9.968366019454724e-06, - "loss": 2.2792, - "step": 459110 - }, - { - "epoch": 0.8, - "learning_rate": 9.967494079527897e-06, - "loss": 2.2682, - "step": 459120 - }, - { - "epoch": 0.8, - "learning_rate": 9.96662213960107e-06, - "loss": 2.4117, - "step": 459130 - }, - { - "epoch": 0.8, - "learning_rate": 9.965750199674243e-06, - "loss": 2.3045, - "step": 459140 - }, - { - "epoch": 0.8, - "learning_rate": 9.964878259747417e-06, - "loss": 2.2914, - "step": 459150 - }, - { - "epoch": 0.8, - "learning_rate": 9.96400631982059e-06, - "loss": 2.3532, - "step": 459160 - }, - { - "epoch": 0.8, - "learning_rate": 9.963134379893763e-06, - "loss": 2.2648, - "step": 459170 - }, - { - "epoch": 0.8, - "learning_rate": 9.962262439966937e-06, - "loss": 2.2499, - "step": 459180 - }, - { - "epoch": 0.8, - "learning_rate": 9.96139050004011e-06, - "loss": 2.3808, - "step": 459190 - }, - { - "epoch": 0.8, - "learning_rate": 9.960518560113282e-06, - "loss": 2.2252, - "step": 459200 - }, - { - "epoch": 0.8, - "learning_rate": 9.959646620186456e-06, - "loss": 2.3499, - "step": 459210 - }, - { - "epoch": 0.8, - "learning_rate": 9.95877468025963e-06, - "loss": 2.3076, - "step": 459220 - }, - { - "epoch": 0.8, - "learning_rate": 9.957902740332804e-06, - "loss": 2.2194, - "step": 459230 - }, - { - "epoch": 0.8, - "learning_rate": 9.957030800405976e-06, - "loss": 2.2813, - "step": 459240 - }, - { - "epoch": 0.8, - "learning_rate": 9.95615886047915e-06, - "loss": 2.2945, - "step": 459250 - }, - { - "epoch": 0.8, - "learning_rate": 9.955286920552322e-06, - "loss": 2.3421, - "step": 459260 - }, - { - "epoch": 0.8, - "learning_rate": 9.954414980625495e-06, - "loss": 2.2655, - "step": 459270 - }, - { - "epoch": 0.8, - "learning_rate": 9.953543040698667e-06, - "loss": 2.3175, - "step": 459280 - }, - { - "epoch": 0.8, - "learning_rate": 9.952671100771841e-06, - "loss": 2.3767, - "step": 459290 - }, - { - "epoch": 0.8, - "learning_rate": 9.951799160845015e-06, - "loss": 2.3178, - "step": 459300 - }, - { - "epoch": 0.8, - "learning_rate": 9.950927220918189e-06, - "loss": 2.2262, - "step": 459310 - }, - { - "epoch": 0.8, - "learning_rate": 9.950055280991363e-06, - "loss": 2.337, - "step": 459320 - }, - { - "epoch": 0.8, - "learning_rate": 9.949183341064535e-06, - "loss": 2.3416, - "step": 459330 - }, - { - "epoch": 0.8, - "learning_rate": 9.948311401137708e-06, - "loss": 2.1605, - "step": 459340 - }, - { - "epoch": 0.8, - "learning_rate": 9.94743946121088e-06, - "loss": 2.3179, - "step": 459350 - }, - { - "epoch": 0.8, - "learning_rate": 9.946567521284054e-06, - "loss": 2.3776, - "step": 459360 - }, - { - "epoch": 0.8, - "learning_rate": 9.945695581357226e-06, - "loss": 2.3356, - "step": 459370 - }, - { - "epoch": 0.8, - "learning_rate": 9.9448236414304e-06, - "loss": 2.302, - "step": 459380 - }, - { - "epoch": 0.8, - "learning_rate": 9.943951701503574e-06, - "loss": 2.2167, - "step": 459390 - }, - { - "epoch": 0.8, - "learning_rate": 9.943079761576748e-06, - "loss": 2.3249, - "step": 459400 - }, - { - "epoch": 0.8, - "learning_rate": 9.94220782164992e-06, - "loss": 2.2319, - "step": 459410 - }, - { - "epoch": 0.8, - "learning_rate": 9.941335881723093e-06, - "loss": 2.2735, - "step": 459420 - }, - { - "epoch": 0.8, - "learning_rate": 9.940463941796266e-06, - "loss": 2.369, - "step": 459430 - }, - { - "epoch": 0.8, - "learning_rate": 9.93959200186944e-06, - "loss": 2.2707, - "step": 459440 - }, - { - "epoch": 0.8, - "learning_rate": 9.938720061942613e-06, - "loss": 2.2711, - "step": 459450 - }, - { - "epoch": 0.8, - "learning_rate": 9.937848122015785e-06, - "loss": 2.3094, - "step": 459460 - }, - { - "epoch": 0.8, - "learning_rate": 9.93697618208896e-06, - "loss": 2.2569, - "step": 459470 - }, - { - "epoch": 0.8, - "learning_rate": 9.936104242162133e-06, - "loss": 2.2734, - "step": 459480 - }, - { - "epoch": 0.8, - "learning_rate": 9.935232302235306e-06, - "loss": 2.2205, - "step": 459490 - }, - { - "epoch": 0.8, - "learning_rate": 9.934360362308479e-06, - "loss": 2.2177, - "step": 459500 - }, - { - "epoch": 0.8, - "learning_rate": 9.933488422381652e-06, - "loss": 2.2526, - "step": 459510 - }, - { - "epoch": 0.8, - "learning_rate": 9.932616482454824e-06, - "loss": 2.2605, - "step": 459520 - }, - { - "epoch": 0.8, - "learning_rate": 9.931744542527998e-06, - "loss": 2.278, - "step": 459530 - }, - { - "epoch": 0.8, - "learning_rate": 9.930872602601172e-06, - "loss": 2.2297, - "step": 459540 - }, - { - "epoch": 0.8, - "learning_rate": 9.930000662674346e-06, - "loss": 2.17, - "step": 459550 - }, - { - "epoch": 0.8, - "learning_rate": 9.929128722747518e-06, - "loss": 2.2, - "step": 459560 - }, - { - "epoch": 0.8, - "learning_rate": 9.928256782820692e-06, - "loss": 2.2844, - "step": 459570 - }, - { - "epoch": 0.8, - "learning_rate": 9.927384842893865e-06, - "loss": 2.2453, - "step": 459580 - }, - { - "epoch": 0.8, - "learning_rate": 9.926512902967037e-06, - "loss": 2.3461, - "step": 459590 - }, - { - "epoch": 0.8, - "learning_rate": 9.925640963040211e-06, - "loss": 2.2285, - "step": 459600 - }, - { - "epoch": 0.8, - "learning_rate": 9.924769023113383e-06, - "loss": 2.1742, - "step": 459610 - }, - { - "epoch": 0.8, - "learning_rate": 9.923897083186557e-06, - "loss": 2.3657, - "step": 459620 - }, - { - "epoch": 0.8, - "learning_rate": 9.92302514325973e-06, - "loss": 2.3206, - "step": 459630 - }, - { - "epoch": 0.8, - "learning_rate": 9.922153203332905e-06, - "loss": 2.2691, - "step": 459640 - }, - { - "epoch": 0.8, - "learning_rate": 9.921281263406077e-06, - "loss": 2.2035, - "step": 459650 - }, - { - "epoch": 0.8, - "learning_rate": 9.92040932347925e-06, - "loss": 2.3607, - "step": 459660 - }, - { - "epoch": 0.8, - "learning_rate": 9.919537383552422e-06, - "loss": 2.2331, - "step": 459670 - }, - { - "epoch": 0.8, - "learning_rate": 9.918665443625596e-06, - "loss": 2.1333, - "step": 459680 - }, - { - "epoch": 0.8, - "learning_rate": 9.917793503698768e-06, - "loss": 2.2003, - "step": 459690 - }, - { - "epoch": 0.8, - "learning_rate": 9.916921563771942e-06, - "loss": 2.2191, - "step": 459700 - }, - { - "epoch": 0.8, - "learning_rate": 9.916049623845118e-06, - "loss": 2.4377, - "step": 459710 - }, - { - "epoch": 0.8, - "learning_rate": 9.91517768391829e-06, - "loss": 2.3826, - "step": 459720 - }, - { - "epoch": 0.8, - "learning_rate": 9.914305743991463e-06, - "loss": 2.2306, - "step": 459730 - }, - { - "epoch": 0.8, - "learning_rate": 9.913433804064635e-06, - "loss": 2.3233, - "step": 459740 - }, - { - "epoch": 0.8, - "learning_rate": 9.91256186413781e-06, - "loss": 2.259, - "step": 459750 - }, - { - "epoch": 0.8, - "learning_rate": 9.911689924210981e-06, - "loss": 2.3186, - "step": 459760 - }, - { - "epoch": 0.8, - "learning_rate": 9.910817984284155e-06, - "loss": 2.2173, - "step": 459770 - }, - { - "epoch": 0.8, - "learning_rate": 9.909946044357329e-06, - "loss": 2.2089, - "step": 459780 - }, - { - "epoch": 0.8, - "learning_rate": 9.909074104430503e-06, - "loss": 2.1254, - "step": 459790 - }, - { - "epoch": 0.8, - "learning_rate": 9.908202164503675e-06, - "loss": 2.2899, - "step": 459800 - }, - { - "epoch": 0.8, - "learning_rate": 9.907330224576848e-06, - "loss": 2.3397, - "step": 459810 - }, - { - "epoch": 0.8, - "learning_rate": 9.90645828465002e-06, - "loss": 2.3194, - "step": 459820 - }, - { - "epoch": 0.8, - "learning_rate": 9.905586344723194e-06, - "loss": 2.192, - "step": 459830 - }, - { - "epoch": 0.8, - "learning_rate": 9.904714404796368e-06, - "loss": 2.3501, - "step": 459840 - }, - { - "epoch": 0.8, - "learning_rate": 9.90384246486954e-06, - "loss": 2.2316, - "step": 459850 - }, - { - "epoch": 0.8, - "learning_rate": 9.902970524942714e-06, - "loss": 2.2887, - "step": 459860 - }, - { - "epoch": 0.8, - "learning_rate": 9.902098585015888e-06, - "loss": 2.2893, - "step": 459870 - }, - { - "epoch": 0.8, - "learning_rate": 9.901226645089061e-06, - "loss": 2.2282, - "step": 459880 - }, - { - "epoch": 0.8, - "learning_rate": 9.900354705162234e-06, - "loss": 2.264, - "step": 459890 - }, - { - "epoch": 0.8, - "learning_rate": 9.899482765235407e-06, - "loss": 2.3938, - "step": 459900 - }, - { - "epoch": 0.8, - "learning_rate": 9.89861082530858e-06, - "loss": 2.3484, - "step": 459910 - }, - { - "epoch": 0.8, - "learning_rate": 9.897738885381753e-06, - "loss": 2.2869, - "step": 459920 - }, - { - "epoch": 0.8, - "learning_rate": 9.896866945454925e-06, - "loss": 2.3862, - "step": 459930 - }, - { - "epoch": 0.8, - "learning_rate": 9.895995005528099e-06, - "loss": 2.3129, - "step": 459940 - }, - { - "epoch": 0.8, - "learning_rate": 9.895123065601273e-06, - "loss": 2.3278, - "step": 459950 - }, - { - "epoch": 0.8, - "learning_rate": 9.894251125674447e-06, - "loss": 2.3507, - "step": 459960 - }, - { - "epoch": 0.8, - "learning_rate": 9.893379185747619e-06, - "loss": 2.3797, - "step": 459970 - }, - { - "epoch": 0.8, - "learning_rate": 9.892507245820792e-06, - "loss": 2.316, - "step": 459980 - }, - { - "epoch": 0.8, - "learning_rate": 9.891635305893966e-06, - "loss": 2.2166, - "step": 459990 - }, - { - "epoch": 0.8, - "learning_rate": 9.890763365967138e-06, - "loss": 2.2996, - "step": 460000 - }, - { - "epoch": 0.8, - "learning_rate": 9.889891426040312e-06, - "loss": 2.3254, - "step": 460010 - }, - { - "epoch": 0.8, - "learning_rate": 9.889019486113486e-06, - "loss": 2.2105, - "step": 460020 - }, - { - "epoch": 0.8, - "learning_rate": 9.88814754618666e-06, - "loss": 2.2586, - "step": 460030 - }, - { - "epoch": 0.8, - "learning_rate": 9.887275606259832e-06, - "loss": 2.2783, - "step": 460040 - }, - { - "epoch": 0.8, - "learning_rate": 9.886403666333005e-06, - "loss": 2.3236, - "step": 460050 - }, - { - "epoch": 0.8, - "learning_rate": 9.885531726406177e-06, - "loss": 2.1681, - "step": 460060 - }, - { - "epoch": 0.8, - "learning_rate": 9.884659786479351e-06, - "loss": 2.2079, - "step": 460070 - }, - { - "epoch": 0.8, - "learning_rate": 9.883787846552523e-06, - "loss": 2.2531, - "step": 460080 - }, - { - "epoch": 0.8, - "learning_rate": 9.882915906625697e-06, - "loss": 2.2716, - "step": 460090 - }, - { - "epoch": 0.8, - "learning_rate": 9.88204396669887e-06, - "loss": 2.3136, - "step": 460100 - }, - { - "epoch": 0.8, - "learning_rate": 9.881172026772045e-06, - "loss": 2.3114, - "step": 460110 - }, - { - "epoch": 0.8, - "learning_rate": 9.880300086845218e-06, - "loss": 2.2314, - "step": 460120 - }, - { - "epoch": 0.8, - "learning_rate": 9.87942814691839e-06, - "loss": 2.2421, - "step": 460130 - }, - { - "epoch": 0.8, - "learning_rate": 9.878556206991564e-06, - "loss": 2.27, - "step": 460140 - }, - { - "epoch": 0.8, - "learning_rate": 9.877684267064736e-06, - "loss": 2.331, - "step": 460150 - }, - { - "epoch": 0.8, - "learning_rate": 9.87681232713791e-06, - "loss": 2.2145, - "step": 460160 - }, - { - "epoch": 0.8, - "learning_rate": 9.875940387211082e-06, - "loss": 2.2758, - "step": 460170 - }, - { - "epoch": 0.8, - "learning_rate": 9.875068447284256e-06, - "loss": 2.2945, - "step": 460180 - }, - { - "epoch": 0.8, - "learning_rate": 9.87419650735743e-06, - "loss": 2.33, - "step": 460190 - }, - { - "epoch": 0.8, - "learning_rate": 9.873324567430603e-06, - "loss": 2.1489, - "step": 460200 - }, - { - "epoch": 0.8, - "learning_rate": 9.872452627503776e-06, - "loss": 2.2552, - "step": 460210 - }, - { - "epoch": 0.8, - "learning_rate": 9.87158068757695e-06, - "loss": 2.3222, - "step": 460220 - }, - { - "epoch": 0.8, - "learning_rate": 9.870708747650121e-06, - "loss": 2.3249, - "step": 460230 - }, - { - "epoch": 0.8, - "learning_rate": 9.869836807723295e-06, - "loss": 2.2406, - "step": 460240 - }, - { - "epoch": 0.8, - "learning_rate": 9.868964867796469e-06, - "loss": 2.2769, - "step": 460250 - }, - { - "epoch": 0.8, - "learning_rate": 9.868092927869643e-06, - "loss": 2.2979, - "step": 460260 - }, - { - "epoch": 0.8, - "learning_rate": 9.867220987942816e-06, - "loss": 2.3454, - "step": 460270 - }, - { - "epoch": 0.8, - "learning_rate": 9.866349048015989e-06, - "loss": 2.2307, - "step": 460280 - }, - { - "epoch": 0.8, - "learning_rate": 9.865477108089162e-06, - "loss": 2.2042, - "step": 460290 - }, - { - "epoch": 0.8, - "learning_rate": 9.864605168162334e-06, - "loss": 2.2946, - "step": 460300 - }, - { - "epoch": 0.8, - "learning_rate": 9.863733228235508e-06, - "loss": 2.3304, - "step": 460310 - }, - { - "epoch": 0.8, - "learning_rate": 9.86286128830868e-06, - "loss": 2.3997, - "step": 460320 - }, - { - "epoch": 0.8, - "learning_rate": 9.861989348381854e-06, - "loss": 2.2052, - "step": 460330 - }, - { - "epoch": 0.8, - "learning_rate": 9.861117408455028e-06, - "loss": 2.2112, - "step": 460340 - }, - { - "epoch": 0.8, - "learning_rate": 9.860245468528202e-06, - "loss": 2.2988, - "step": 460350 - }, - { - "epoch": 0.8, - "learning_rate": 9.859373528601374e-06, - "loss": 2.1461, - "step": 460360 - }, - { - "epoch": 0.8, - "learning_rate": 9.858501588674547e-06, - "loss": 2.2437, - "step": 460370 - }, - { - "epoch": 0.8, - "learning_rate": 9.857629648747721e-06, - "loss": 2.2345, - "step": 460380 - }, - { - "epoch": 0.8, - "learning_rate": 9.856757708820893e-06, - "loss": 2.3012, - "step": 460390 - }, - { - "epoch": 0.8, - "learning_rate": 9.855885768894067e-06, - "loss": 2.2173, - "step": 460400 - }, - { - "epoch": 0.8, - "learning_rate": 9.855013828967239e-06, - "loss": 2.259, - "step": 460410 - }, - { - "epoch": 0.8, - "learning_rate": 9.854141889040413e-06, - "loss": 2.2222, - "step": 460420 - }, - { - "epoch": 0.8, - "learning_rate": 9.853269949113587e-06, - "loss": 2.216, - "step": 460430 - }, - { - "epoch": 0.8, - "learning_rate": 9.85239800918676e-06, - "loss": 2.4202, - "step": 460440 - }, - { - "epoch": 0.8, - "learning_rate": 9.851526069259932e-06, - "loss": 2.2899, - "step": 460450 - }, - { - "epoch": 0.8, - "learning_rate": 9.850654129333106e-06, - "loss": 2.2682, - "step": 460460 - }, - { - "epoch": 0.8, - "learning_rate": 9.849782189406278e-06, - "loss": 2.1516, - "step": 460470 - }, - { - "epoch": 0.8, - "learning_rate": 9.848910249479452e-06, - "loss": 2.2997, - "step": 460480 - }, - { - "epoch": 0.8, - "learning_rate": 9.848038309552624e-06, - "loss": 2.3052, - "step": 460490 - }, - { - "epoch": 0.8, - "learning_rate": 9.847166369625798e-06, - "loss": 2.3291, - "step": 460500 - }, - { - "epoch": 0.8, - "learning_rate": 9.846294429698973e-06, - "loss": 2.1916, - "step": 460510 - }, - { - "epoch": 0.8, - "learning_rate": 9.845422489772145e-06, - "loss": 2.1937, - "step": 460520 - }, - { - "epoch": 0.8, - "learning_rate": 9.84455054984532e-06, - "loss": 2.1999, - "step": 460530 - }, - { - "epoch": 0.8, - "learning_rate": 9.843678609918491e-06, - "loss": 2.2219, - "step": 460540 - }, - { - "epoch": 0.8, - "learning_rate": 9.842806669991665e-06, - "loss": 2.3913, - "step": 460550 - }, - { - "epoch": 0.8, - "learning_rate": 9.841934730064837e-06, - "loss": 2.4393, - "step": 460560 - }, - { - "epoch": 0.8, - "learning_rate": 9.841062790138011e-06, - "loss": 2.3071, - "step": 460570 - }, - { - "epoch": 0.8, - "learning_rate": 9.840190850211185e-06, - "loss": 2.3381, - "step": 460580 - }, - { - "epoch": 0.8, - "learning_rate": 9.839318910284358e-06, - "loss": 2.3493, - "step": 460590 - }, - { - "epoch": 0.8, - "learning_rate": 9.83844697035753e-06, - "loss": 2.2347, - "step": 460600 - }, - { - "epoch": 0.8, - "learning_rate": 9.837575030430704e-06, - "loss": 2.3319, - "step": 460610 - }, - { - "epoch": 0.8, - "learning_rate": 9.836703090503876e-06, - "loss": 2.2805, - "step": 460620 - }, - { - "epoch": 0.8, - "learning_rate": 9.83583115057705e-06, - "loss": 2.2221, - "step": 460630 - }, - { - "epoch": 0.8, - "learning_rate": 9.834959210650224e-06, - "loss": 2.3207, - "step": 460640 - }, - { - "epoch": 0.8, - "learning_rate": 9.834087270723396e-06, - "loss": 2.3358, - "step": 460650 - }, - { - "epoch": 0.8, - "learning_rate": 9.83321533079657e-06, - "loss": 2.449, - "step": 460660 - }, - { - "epoch": 0.8, - "learning_rate": 9.832343390869744e-06, - "loss": 2.3289, - "step": 460670 - }, - { - "epoch": 0.8, - "learning_rate": 9.831471450942917e-06, - "loss": 2.1865, - "step": 460680 - }, - { - "epoch": 0.8, - "learning_rate": 9.83059951101609e-06, - "loss": 2.2791, - "step": 460690 - }, - { - "epoch": 0.8, - "learning_rate": 9.829727571089263e-06, - "loss": 2.3125, - "step": 460700 - }, - { - "epoch": 0.8, - "learning_rate": 9.828855631162435e-06, - "loss": 2.2768, - "step": 460710 - }, - { - "epoch": 0.8, - "learning_rate": 9.827983691235609e-06, - "loss": 2.3149, - "step": 460720 - }, - { - "epoch": 0.8, - "learning_rate": 9.827111751308781e-06, - "loss": 2.2623, - "step": 460730 - }, - { - "epoch": 0.8, - "learning_rate": 9.826239811381955e-06, - "loss": 2.2918, - "step": 460740 - }, - { - "epoch": 0.8, - "learning_rate": 9.825367871455129e-06, - "loss": 2.3039, - "step": 460750 - }, - { - "epoch": 0.8, - "learning_rate": 9.824495931528302e-06, - "loss": 2.2642, - "step": 460760 - }, - { - "epoch": 0.8, - "learning_rate": 9.823623991601476e-06, - "loss": 2.3009, - "step": 460770 - }, - { - "epoch": 0.8, - "learning_rate": 9.822752051674648e-06, - "loss": 2.3608, - "step": 460780 - }, - { - "epoch": 0.8, - "learning_rate": 9.821880111747822e-06, - "loss": 2.1848, - "step": 460790 - }, - { - "epoch": 0.8, - "learning_rate": 9.821008171820994e-06, - "loss": 2.2706, - "step": 460800 - }, - { - "epoch": 0.8, - "learning_rate": 9.820136231894168e-06, - "loss": 2.4928, - "step": 460810 - }, - { - "epoch": 0.8, - "learning_rate": 9.819264291967342e-06, - "loss": 2.1858, - "step": 460820 - }, - { - "epoch": 0.8, - "learning_rate": 9.818392352040515e-06, - "loss": 2.3026, - "step": 460830 - }, - { - "epoch": 0.8, - "learning_rate": 9.817520412113687e-06, - "loss": 2.3787, - "step": 460840 - }, - { - "epoch": 0.8, - "learning_rate": 9.816648472186861e-06, - "loss": 2.229, - "step": 460850 - }, - { - "epoch": 0.8, - "learning_rate": 9.815776532260033e-06, - "loss": 2.2501, - "step": 460860 - }, - { - "epoch": 0.8, - "learning_rate": 9.814904592333207e-06, - "loss": 2.3331, - "step": 460870 - }, - { - "epoch": 0.8, - "learning_rate": 9.814032652406379e-06, - "loss": 2.2698, - "step": 460880 - }, - { - "epoch": 0.8, - "learning_rate": 9.813160712479553e-06, - "loss": 2.157, - "step": 460890 - }, - { - "epoch": 0.8, - "learning_rate": 9.812288772552727e-06, - "loss": 2.3676, - "step": 460900 - }, - { - "epoch": 0.8, - "learning_rate": 9.8114168326259e-06, - "loss": 2.3883, - "step": 460910 - }, - { - "epoch": 0.8, - "learning_rate": 9.810544892699074e-06, - "loss": 2.1903, - "step": 460920 - }, - { - "epoch": 0.8, - "learning_rate": 9.809672952772246e-06, - "loss": 2.246, - "step": 460930 - }, - { - "epoch": 0.8, - "learning_rate": 9.80880101284542e-06, - "loss": 2.3466, - "step": 460940 - }, - { - "epoch": 0.8, - "learning_rate": 9.807929072918592e-06, - "loss": 2.3384, - "step": 460950 - }, - { - "epoch": 0.8, - "learning_rate": 9.807057132991766e-06, - "loss": 2.3993, - "step": 460960 - }, - { - "epoch": 0.8, - "learning_rate": 9.806185193064938e-06, - "loss": 2.2644, - "step": 460970 - }, - { - "epoch": 0.8, - "learning_rate": 9.805313253138112e-06, - "loss": 2.2528, - "step": 460980 - }, - { - "epoch": 0.8, - "learning_rate": 9.804441313211286e-06, - "loss": 2.3014, - "step": 460990 - }, - { - "epoch": 0.8, - "learning_rate": 9.80356937328446e-06, - "loss": 2.2652, - "step": 461000 - }, - { - "epoch": 0.8, - "learning_rate": 9.802697433357631e-06, - "loss": 2.3375, - "step": 461010 - }, - { - "epoch": 0.8, - "learning_rate": 9.801825493430805e-06, - "loss": 2.2792, - "step": 461020 - }, - { - "epoch": 0.8, - "learning_rate": 9.800953553503977e-06, - "loss": 2.3274, - "step": 461030 - }, - { - "epoch": 0.8, - "learning_rate": 9.800081613577151e-06, - "loss": 2.2519, - "step": 461040 - }, - { - "epoch": 0.8, - "learning_rate": 9.799209673650325e-06, - "loss": 2.2746, - "step": 461050 - }, - { - "epoch": 0.8, - "learning_rate": 9.798337733723499e-06, - "loss": 2.2612, - "step": 461060 - }, - { - "epoch": 0.8, - "learning_rate": 9.797465793796672e-06, - "loss": 2.2038, - "step": 461070 - }, - { - "epoch": 0.8, - "learning_rate": 9.796593853869844e-06, - "loss": 2.3006, - "step": 461080 - }, - { - "epoch": 0.8, - "learning_rate": 9.795721913943018e-06, - "loss": 2.3086, - "step": 461090 - }, - { - "epoch": 0.8, - "learning_rate": 9.79484997401619e-06, - "loss": 2.2805, - "step": 461100 - }, - { - "epoch": 0.8, - "learning_rate": 9.793978034089364e-06, - "loss": 2.2433, - "step": 461110 - }, - { - "epoch": 0.8, - "learning_rate": 9.793106094162536e-06, - "loss": 2.3381, - "step": 461120 - }, - { - "epoch": 0.8, - "learning_rate": 9.79223415423571e-06, - "loss": 2.1596, - "step": 461130 - }, - { - "epoch": 0.8, - "learning_rate": 9.791362214308884e-06, - "loss": 2.164, - "step": 461140 - }, - { - "epoch": 0.8, - "learning_rate": 9.790490274382057e-06, - "loss": 2.2251, - "step": 461150 - }, - { - "epoch": 0.8, - "learning_rate": 9.78961833445523e-06, - "loss": 2.2668, - "step": 461160 - }, - { - "epoch": 0.8, - "learning_rate": 9.788746394528403e-06, - "loss": 2.243, - "step": 461170 - }, - { - "epoch": 0.8, - "learning_rate": 9.787874454601577e-06, - "loss": 2.2959, - "step": 461180 - }, - { - "epoch": 0.8, - "learning_rate": 9.787002514674749e-06, - "loss": 2.269, - "step": 461190 - }, - { - "epoch": 0.8, - "learning_rate": 9.786130574747923e-06, - "loss": 2.3094, - "step": 461200 - }, - { - "epoch": 0.8, - "learning_rate": 9.785258634821095e-06, - "loss": 2.302, - "step": 461210 - }, - { - "epoch": 0.8, - "learning_rate": 9.784386694894269e-06, - "loss": 2.161, - "step": 461220 - }, - { - "epoch": 0.8, - "learning_rate": 9.783514754967442e-06, - "loss": 2.2233, - "step": 461230 - }, - { - "epoch": 0.8, - "learning_rate": 9.782642815040616e-06, - "loss": 2.2141, - "step": 461240 - }, - { - "epoch": 0.8, - "learning_rate": 9.781770875113788e-06, - "loss": 2.2958, - "step": 461250 - }, - { - "epoch": 0.8, - "learning_rate": 9.780898935186962e-06, - "loss": 2.1967, - "step": 461260 - }, - { - "epoch": 0.8, - "learning_rate": 9.780026995260134e-06, - "loss": 2.3022, - "step": 461270 - }, - { - "epoch": 0.8, - "learning_rate": 9.779155055333308e-06, - "loss": 2.2211, - "step": 461280 - }, - { - "epoch": 0.8, - "learning_rate": 9.77828311540648e-06, - "loss": 2.2893, - "step": 461290 - }, - { - "epoch": 0.8, - "learning_rate": 9.777411175479655e-06, - "loss": 2.3421, - "step": 461300 - }, - { - "epoch": 0.8, - "learning_rate": 9.77653923555283e-06, - "loss": 2.3761, - "step": 461310 - }, - { - "epoch": 0.8, - "learning_rate": 9.775667295626001e-06, - "loss": 2.2286, - "step": 461320 - }, - { - "epoch": 0.8, - "learning_rate": 9.774795355699175e-06, - "loss": 2.2997, - "step": 461330 - }, - { - "epoch": 0.8, - "learning_rate": 9.773923415772347e-06, - "loss": 2.2914, - "step": 461340 - }, - { - "epoch": 0.8, - "learning_rate": 9.773051475845521e-06, - "loss": 2.2417, - "step": 461350 - }, - { - "epoch": 0.8, - "learning_rate": 9.772179535918693e-06, - "loss": 2.2785, - "step": 461360 - }, - { - "epoch": 0.8, - "learning_rate": 9.771307595991867e-06, - "loss": 2.3267, - "step": 461370 - }, - { - "epoch": 0.8, - "learning_rate": 9.77043565606504e-06, - "loss": 2.1927, - "step": 461380 - }, - { - "epoch": 0.8, - "learning_rate": 9.769563716138214e-06, - "loss": 2.1601, - "step": 461390 - }, - { - "epoch": 0.8, - "learning_rate": 9.768691776211386e-06, - "loss": 2.307, - "step": 461400 - }, - { - "epoch": 0.8, - "learning_rate": 9.76781983628456e-06, - "loss": 2.3399, - "step": 461410 - }, - { - "epoch": 0.8, - "learning_rate": 9.766947896357732e-06, - "loss": 2.3713, - "step": 461420 - }, - { - "epoch": 0.8, - "learning_rate": 9.766075956430906e-06, - "loss": 2.2372, - "step": 461430 - }, - { - "epoch": 0.8, - "learning_rate": 9.76520401650408e-06, - "loss": 2.2618, - "step": 461440 - }, - { - "epoch": 0.8, - "learning_rate": 9.764332076577252e-06, - "loss": 2.236, - "step": 461450 - }, - { - "epoch": 0.8, - "learning_rate": 9.763460136650426e-06, - "loss": 2.2066, - "step": 461460 - }, - { - "epoch": 0.8, - "learning_rate": 9.7625881967236e-06, - "loss": 2.263, - "step": 461470 - }, - { - "epoch": 0.8, - "learning_rate": 9.761716256796773e-06, - "loss": 2.2171, - "step": 461480 - }, - { - "epoch": 0.8, - "learning_rate": 9.760844316869945e-06, - "loss": 2.2325, - "step": 461490 - }, - { - "epoch": 0.8, - "learning_rate": 9.759972376943119e-06, - "loss": 2.3289, - "step": 461500 - }, - { - "epoch": 0.8, - "learning_rate": 9.759100437016291e-06, - "loss": 2.1298, - "step": 461510 - }, - { - "epoch": 0.8, - "learning_rate": 9.758228497089465e-06, - "loss": 2.3865, - "step": 461520 - }, - { - "epoch": 0.8, - "learning_rate": 9.757356557162637e-06, - "loss": 2.2719, - "step": 461530 - }, - { - "epoch": 0.8, - "learning_rate": 9.756484617235812e-06, - "loss": 2.1885, - "step": 461540 - }, - { - "epoch": 0.8, - "learning_rate": 9.755612677308984e-06, - "loss": 2.1713, - "step": 461550 - }, - { - "epoch": 0.8, - "learning_rate": 9.754740737382158e-06, - "loss": 2.3244, - "step": 461560 - }, - { - "epoch": 0.8, - "learning_rate": 9.753868797455332e-06, - "loss": 2.1511, - "step": 461570 - }, - { - "epoch": 0.8, - "learning_rate": 9.752996857528504e-06, - "loss": 2.2641, - "step": 461580 - }, - { - "epoch": 0.8, - "learning_rate": 9.752124917601678e-06, - "loss": 2.3371, - "step": 461590 - }, - { - "epoch": 0.8, - "learning_rate": 9.75125297767485e-06, - "loss": 2.3791, - "step": 461600 - }, - { - "epoch": 0.8, - "learning_rate": 9.750381037748024e-06, - "loss": 2.2319, - "step": 461610 - }, - { - "epoch": 0.81, - "learning_rate": 9.749509097821197e-06, - "loss": 2.2948, - "step": 461620 - }, - { - "epoch": 0.81, - "learning_rate": 9.748637157894371e-06, - "loss": 2.2818, - "step": 461630 - }, - { - "epoch": 0.81, - "learning_rate": 9.747765217967543e-06, - "loss": 2.2277, - "step": 461640 - }, - { - "epoch": 0.81, - "learning_rate": 9.746893278040717e-06, - "loss": 2.2864, - "step": 461650 - }, - { - "epoch": 0.81, - "learning_rate": 9.746021338113889e-06, - "loss": 2.2742, - "step": 461660 - }, - { - "epoch": 0.81, - "learning_rate": 9.745149398187063e-06, - "loss": 2.1785, - "step": 461670 - }, - { - "epoch": 0.81, - "learning_rate": 9.744277458260235e-06, - "loss": 2.4142, - "step": 461680 - }, - { - "epoch": 0.81, - "learning_rate": 9.743405518333409e-06, - "loss": 2.2952, - "step": 461690 - }, - { - "epoch": 0.81, - "learning_rate": 9.742533578406583e-06, - "loss": 2.281, - "step": 461700 - }, - { - "epoch": 0.81, - "learning_rate": 9.741661638479756e-06, - "loss": 2.2048, - "step": 461710 - }, - { - "epoch": 0.81, - "learning_rate": 9.74078969855293e-06, - "loss": 2.3189, - "step": 461720 - }, - { - "epoch": 0.81, - "learning_rate": 9.739917758626102e-06, - "loss": 2.3236, - "step": 461730 - }, - { - "epoch": 0.81, - "learning_rate": 9.739045818699276e-06, - "loss": 2.2812, - "step": 461740 - }, - { - "epoch": 0.81, - "learning_rate": 9.738173878772448e-06, - "loss": 2.3552, - "step": 461750 - }, - { - "epoch": 0.81, - "learning_rate": 9.737301938845622e-06, - "loss": 2.322, - "step": 461760 - }, - { - "epoch": 0.81, - "learning_rate": 9.736429998918794e-06, - "loss": 2.3071, - "step": 461770 - }, - { - "epoch": 0.81, - "learning_rate": 9.735558058991968e-06, - "loss": 2.3435, - "step": 461780 - }, - { - "epoch": 0.81, - "learning_rate": 9.734686119065141e-06, - "loss": 2.2909, - "step": 461790 - }, - { - "epoch": 0.81, - "learning_rate": 9.733814179138315e-06, - "loss": 2.3062, - "step": 461800 - }, - { - "epoch": 0.81, - "learning_rate": 9.732942239211487e-06, - "loss": 2.2117, - "step": 461810 - }, - { - "epoch": 0.81, - "learning_rate": 9.732070299284661e-06, - "loss": 2.2615, - "step": 461820 - }, - { - "epoch": 0.81, - "learning_rate": 9.731198359357833e-06, - "loss": 2.3769, - "step": 461830 - }, - { - "epoch": 0.81, - "learning_rate": 9.730326419431007e-06, - "loss": 2.2025, - "step": 461840 - }, - { - "epoch": 0.81, - "learning_rate": 9.72945447950418e-06, - "loss": 2.2856, - "step": 461850 - }, - { - "epoch": 0.81, - "learning_rate": 9.728582539577354e-06, - "loss": 2.2502, - "step": 461860 - }, - { - "epoch": 0.81, - "learning_rate": 9.727710599650528e-06, - "loss": 2.1335, - "step": 461870 - }, - { - "epoch": 0.81, - "learning_rate": 9.7268386597237e-06, - "loss": 2.2497, - "step": 461880 - }, - { - "epoch": 0.81, - "learning_rate": 9.725966719796874e-06, - "loss": 2.1398, - "step": 461890 - }, - { - "epoch": 0.81, - "learning_rate": 9.725094779870046e-06, - "loss": 2.3193, - "step": 461900 - }, - { - "epoch": 0.81, - "learning_rate": 9.72422283994322e-06, - "loss": 2.2169, - "step": 461910 - }, - { - "epoch": 0.81, - "learning_rate": 9.723350900016392e-06, - "loss": 2.2593, - "step": 461920 - }, - { - "epoch": 0.81, - "learning_rate": 9.722478960089566e-06, - "loss": 2.2068, - "step": 461930 - }, - { - "epoch": 0.81, - "learning_rate": 9.72160702016274e-06, - "loss": 2.1866, - "step": 461940 - }, - { - "epoch": 0.81, - "learning_rate": 9.720735080235913e-06, - "loss": 2.315, - "step": 461950 - }, - { - "epoch": 0.81, - "learning_rate": 9.719863140309085e-06, - "loss": 2.2587, - "step": 461960 - }, - { - "epoch": 0.81, - "learning_rate": 9.718991200382259e-06, - "loss": 2.2719, - "step": 461970 - }, - { - "epoch": 0.81, - "learning_rate": 9.718119260455433e-06, - "loss": 2.2694, - "step": 461980 - }, - { - "epoch": 0.81, - "learning_rate": 9.717247320528605e-06, - "loss": 2.0898, - "step": 461990 - }, - { - "epoch": 0.81, - "learning_rate": 9.716375380601779e-06, - "loss": 2.2857, - "step": 462000 - }, - { - "epoch": 0.81, - "learning_rate": 9.71550344067495e-06, - "loss": 2.2594, - "step": 462010 - }, - { - "epoch": 0.81, - "learning_rate": 9.714631500748125e-06, - "loss": 2.2779, - "step": 462020 - }, - { - "epoch": 0.81, - "learning_rate": 9.713759560821298e-06, - "loss": 2.2759, - "step": 462030 - }, - { - "epoch": 0.81, - "learning_rate": 9.712887620894472e-06, - "loss": 2.2726, - "step": 462040 - }, - { - "epoch": 0.81, - "learning_rate": 9.712015680967644e-06, - "loss": 2.3134, - "step": 462050 - }, - { - "epoch": 0.81, - "learning_rate": 9.711143741040818e-06, - "loss": 2.2181, - "step": 462060 - }, - { - "epoch": 0.81, - "learning_rate": 9.71027180111399e-06, - "loss": 2.315, - "step": 462070 - }, - { - "epoch": 0.81, - "learning_rate": 9.709399861187164e-06, - "loss": 2.3029, - "step": 462080 - }, - { - "epoch": 0.81, - "learning_rate": 9.708527921260336e-06, - "loss": 2.302, - "step": 462090 - }, - { - "epoch": 0.81, - "learning_rate": 9.707655981333511e-06, - "loss": 2.2265, - "step": 462100 - }, - { - "epoch": 0.81, - "learning_rate": 9.706784041406685e-06, - "loss": 2.3033, - "step": 462110 - }, - { - "epoch": 0.81, - "learning_rate": 9.705912101479857e-06, - "loss": 2.2984, - "step": 462120 - }, - { - "epoch": 0.81, - "learning_rate": 9.705040161553031e-06, - "loss": 2.2442, - "step": 462130 - }, - { - "epoch": 0.81, - "learning_rate": 9.704168221626203e-06, - "loss": 2.3654, - "step": 462140 - }, - { - "epoch": 0.81, - "learning_rate": 9.703296281699377e-06, - "loss": 2.293, - "step": 462150 - }, - { - "epoch": 0.81, - "learning_rate": 9.702424341772549e-06, - "loss": 2.3781, - "step": 462160 - }, - { - "epoch": 0.81, - "learning_rate": 9.701552401845723e-06, - "loss": 2.3354, - "step": 462170 - }, - { - "epoch": 0.81, - "learning_rate": 9.700680461918896e-06, - "loss": 2.2997, - "step": 462180 - }, - { - "epoch": 0.81, - "learning_rate": 9.69980852199207e-06, - "loss": 2.1891, - "step": 462190 - }, - { - "epoch": 0.81, - "learning_rate": 9.698936582065242e-06, - "loss": 2.1401, - "step": 462200 - }, - { - "epoch": 0.81, - "learning_rate": 9.698064642138416e-06, - "loss": 2.2428, - "step": 462210 - }, - { - "epoch": 0.81, - "learning_rate": 9.697192702211588e-06, - "loss": 2.3894, - "step": 462220 - }, - { - "epoch": 0.81, - "learning_rate": 9.696320762284762e-06, - "loss": 2.138, - "step": 462230 - }, - { - "epoch": 0.81, - "learning_rate": 9.695448822357936e-06, - "loss": 2.3338, - "step": 462240 - }, - { - "epoch": 0.81, - "learning_rate": 9.694576882431108e-06, - "loss": 2.3364, - "step": 462250 - }, - { - "epoch": 0.81, - "learning_rate": 9.693704942504281e-06, - "loss": 2.3063, - "step": 462260 - }, - { - "epoch": 0.81, - "learning_rate": 9.692833002577455e-06, - "loss": 2.3859, - "step": 462270 - }, - { - "epoch": 0.81, - "learning_rate": 9.691961062650629e-06, - "loss": 2.1622, - "step": 462280 - }, - { - "epoch": 0.81, - "learning_rate": 9.691089122723801e-06, - "loss": 2.216, - "step": 462290 - }, - { - "epoch": 0.81, - "learning_rate": 9.690217182796975e-06, - "loss": 2.2386, - "step": 462300 - }, - { - "epoch": 0.81, - "learning_rate": 9.689345242870147e-06, - "loss": 2.4427, - "step": 462310 - }, - { - "epoch": 0.81, - "learning_rate": 9.68847330294332e-06, - "loss": 2.2906, - "step": 462320 - }, - { - "epoch": 0.81, - "learning_rate": 9.687601363016493e-06, - "loss": 2.1312, - "step": 462330 - }, - { - "epoch": 0.81, - "learning_rate": 9.686729423089668e-06, - "loss": 2.3482, - "step": 462340 - }, - { - "epoch": 0.81, - "learning_rate": 9.68585748316284e-06, - "loss": 2.2903, - "step": 462350 - }, - { - "epoch": 0.81, - "learning_rate": 9.684985543236014e-06, - "loss": 2.3512, - "step": 462360 - }, - { - "epoch": 0.81, - "learning_rate": 9.684113603309188e-06, - "loss": 2.1794, - "step": 462370 - }, - { - "epoch": 0.81, - "learning_rate": 9.68324166338236e-06, - "loss": 2.2717, - "step": 462380 - }, - { - "epoch": 0.81, - "learning_rate": 9.682369723455534e-06, - "loss": 2.2021, - "step": 462390 - }, - { - "epoch": 0.81, - "learning_rate": 9.681497783528706e-06, - "loss": 2.2041, - "step": 462400 - }, - { - "epoch": 0.81, - "learning_rate": 9.68062584360188e-06, - "loss": 2.4284, - "step": 462410 - }, - { - "epoch": 0.81, - "learning_rate": 9.679753903675053e-06, - "loss": 2.2501, - "step": 462420 - }, - { - "epoch": 0.81, - "learning_rate": 9.678881963748227e-06, - "loss": 2.2783, - "step": 462430 - }, - { - "epoch": 0.81, - "learning_rate": 9.678010023821399e-06, - "loss": 2.2838, - "step": 462440 - }, - { - "epoch": 0.81, - "learning_rate": 9.677138083894573e-06, - "loss": 2.3623, - "step": 462450 - }, - { - "epoch": 0.81, - "learning_rate": 9.676266143967745e-06, - "loss": 2.1904, - "step": 462460 - }, - { - "epoch": 0.81, - "learning_rate": 9.675394204040919e-06, - "loss": 2.292, - "step": 462470 - }, - { - "epoch": 0.81, - "learning_rate": 9.67452226411409e-06, - "loss": 2.236, - "step": 462480 - }, - { - "epoch": 0.81, - "learning_rate": 9.673650324187265e-06, - "loss": 2.2622, - "step": 462490 - }, - { - "epoch": 0.81, - "learning_rate": 9.672778384260438e-06, - "loss": 2.3332, - "step": 462500 - }, - { - "epoch": 0.81, - "learning_rate": 9.671906444333612e-06, - "loss": 2.1442, - "step": 462510 - }, - { - "epoch": 0.81, - "learning_rate": 9.671034504406786e-06, - "loss": 2.181, - "step": 462520 - }, - { - "epoch": 0.81, - "learning_rate": 9.670162564479958e-06, - "loss": 2.3661, - "step": 462530 - }, - { - "epoch": 0.81, - "learning_rate": 9.669290624553132e-06, - "loss": 2.279, - "step": 462540 - }, - { - "epoch": 0.81, - "learning_rate": 9.668418684626304e-06, - "loss": 2.2246, - "step": 462550 - }, - { - "epoch": 0.81, - "learning_rate": 9.667546744699478e-06, - "loss": 2.197, - "step": 462560 - }, - { - "epoch": 0.81, - "learning_rate": 9.66667480477265e-06, - "loss": 2.2802, - "step": 462570 - }, - { - "epoch": 0.81, - "learning_rate": 9.665802864845825e-06, - "loss": 2.2604, - "step": 462580 - }, - { - "epoch": 0.81, - "learning_rate": 9.664930924918997e-06, - "loss": 2.2238, - "step": 462590 - }, - { - "epoch": 0.81, - "learning_rate": 9.664058984992171e-06, - "loss": 2.3071, - "step": 462600 - }, - { - "epoch": 0.81, - "learning_rate": 9.663187045065343e-06, - "loss": 2.2205, - "step": 462610 - }, - { - "epoch": 0.81, - "learning_rate": 9.662315105138517e-06, - "loss": 2.253, - "step": 462620 - }, - { - "epoch": 0.81, - "learning_rate": 9.661443165211689e-06, - "loss": 2.268, - "step": 462630 - }, - { - "epoch": 0.81, - "learning_rate": 9.660571225284863e-06, - "loss": 2.2242, - "step": 462640 - }, - { - "epoch": 0.81, - "learning_rate": 9.659699285358036e-06, - "loss": 2.3673, - "step": 462650 - }, - { - "epoch": 0.81, - "learning_rate": 9.65882734543121e-06, - "loss": 2.1344, - "step": 462660 - }, - { - "epoch": 0.81, - "learning_rate": 9.657955405504384e-06, - "loss": 2.2998, - "step": 462670 - }, - { - "epoch": 0.81, - "learning_rate": 9.657083465577556e-06, - "loss": 2.2733, - "step": 462680 - }, - { - "epoch": 0.81, - "learning_rate": 9.65621152565073e-06, - "loss": 2.237, - "step": 462690 - }, - { - "epoch": 0.81, - "learning_rate": 9.655339585723902e-06, - "loss": 2.2746, - "step": 462700 - }, - { - "epoch": 0.81, - "learning_rate": 9.654467645797076e-06, - "loss": 2.1696, - "step": 462710 - }, - { - "epoch": 0.81, - "learning_rate": 9.653595705870248e-06, - "loss": 2.3345, - "step": 462720 - }, - { - "epoch": 0.81, - "learning_rate": 9.652723765943422e-06, - "loss": 2.2599, - "step": 462730 - }, - { - "epoch": 0.81, - "learning_rate": 9.651851826016595e-06, - "loss": 2.2071, - "step": 462740 - }, - { - "epoch": 0.81, - "learning_rate": 9.650979886089769e-06, - "loss": 2.3071, - "step": 462750 - }, - { - "epoch": 0.81, - "learning_rate": 9.650107946162941e-06, - "loss": 2.3692, - "step": 462760 - }, - { - "epoch": 0.81, - "learning_rate": 9.649236006236115e-06, - "loss": 2.2608, - "step": 462770 - }, - { - "epoch": 0.81, - "learning_rate": 9.648364066309289e-06, - "loss": 2.2634, - "step": 462780 - }, - { - "epoch": 0.81, - "learning_rate": 9.64749212638246e-06, - "loss": 2.3703, - "step": 462790 - }, - { - "epoch": 0.81, - "learning_rate": 9.646620186455635e-06, - "loss": 2.3405, - "step": 462800 - }, - { - "epoch": 0.81, - "learning_rate": 9.645748246528807e-06, - "loss": 2.3245, - "step": 462810 - }, - { - "epoch": 0.81, - "learning_rate": 9.64487630660198e-06, - "loss": 2.2792, - "step": 462820 - }, - { - "epoch": 0.81, - "learning_rate": 9.644004366675154e-06, - "loss": 2.2008, - "step": 462830 - }, - { - "epoch": 0.81, - "learning_rate": 9.643132426748328e-06, - "loss": 2.2359, - "step": 462840 - }, - { - "epoch": 0.81, - "learning_rate": 9.6422604868215e-06, - "loss": 2.3409, - "step": 462850 - }, - { - "epoch": 0.81, - "learning_rate": 9.641388546894674e-06, - "loss": 2.3073, - "step": 462860 - }, - { - "epoch": 0.81, - "learning_rate": 9.640516606967846e-06, - "loss": 2.2467, - "step": 462870 - }, - { - "epoch": 0.81, - "learning_rate": 9.63964466704102e-06, - "loss": 2.2072, - "step": 462880 - }, - { - "epoch": 0.81, - "learning_rate": 9.638772727114193e-06, - "loss": 2.2951, - "step": 462890 - }, - { - "epoch": 0.81, - "learning_rate": 9.637900787187367e-06, - "loss": 2.206, - "step": 462900 - }, - { - "epoch": 0.81, - "learning_rate": 9.637028847260541e-06, - "loss": 2.2743, - "step": 462910 - }, - { - "epoch": 0.81, - "learning_rate": 9.636156907333713e-06, - "loss": 2.3653, - "step": 462920 - }, - { - "epoch": 0.81, - "learning_rate": 9.635284967406887e-06, - "loss": 2.1935, - "step": 462930 - }, - { - "epoch": 0.81, - "learning_rate": 9.634413027480059e-06, - "loss": 2.2169, - "step": 462940 - }, - { - "epoch": 0.81, - "learning_rate": 9.633541087553233e-06, - "loss": 2.3167, - "step": 462950 - }, - { - "epoch": 0.81, - "learning_rate": 9.632669147626405e-06, - "loss": 2.3238, - "step": 462960 - }, - { - "epoch": 0.81, - "learning_rate": 9.631797207699578e-06, - "loss": 2.3397, - "step": 462970 - }, - { - "epoch": 0.81, - "learning_rate": 9.630925267772752e-06, - "loss": 2.3194, - "step": 462980 - }, - { - "epoch": 0.81, - "learning_rate": 9.630053327845926e-06, - "loss": 2.1578, - "step": 462990 - }, - { - "epoch": 0.81, - "learning_rate": 9.629181387919098e-06, - "loss": 2.2071, - "step": 463000 - }, - { - "epoch": 0.81, - "learning_rate": 9.628309447992272e-06, - "loss": 2.1551, - "step": 463010 - }, - { - "epoch": 0.81, - "learning_rate": 9.627437508065444e-06, - "loss": 2.2401, - "step": 463020 - }, - { - "epoch": 0.81, - "learning_rate": 9.626565568138618e-06, - "loss": 2.4323, - "step": 463030 - }, - { - "epoch": 0.81, - "learning_rate": 9.625693628211791e-06, - "loss": 2.3128, - "step": 463040 - }, - { - "epoch": 0.81, - "learning_rate": 9.624821688284964e-06, - "loss": 2.305, - "step": 463050 - }, - { - "epoch": 0.81, - "learning_rate": 9.623949748358137e-06, - "loss": 2.4229, - "step": 463060 - }, - { - "epoch": 0.81, - "learning_rate": 9.623077808431311e-06, - "loss": 2.303, - "step": 463070 - }, - { - "epoch": 0.81, - "learning_rate": 9.622205868504485e-06, - "loss": 2.2435, - "step": 463080 - }, - { - "epoch": 0.81, - "learning_rate": 9.621333928577657e-06, - "loss": 2.2038, - "step": 463090 - }, - { - "epoch": 0.81, - "learning_rate": 9.62046198865083e-06, - "loss": 2.2867, - "step": 463100 - }, - { - "epoch": 0.81, - "learning_rate": 9.619590048724003e-06, - "loss": 2.2928, - "step": 463110 - }, - { - "epoch": 0.81, - "learning_rate": 9.618718108797177e-06, - "loss": 2.2329, - "step": 463120 - }, - { - "epoch": 0.81, - "learning_rate": 9.617846168870349e-06, - "loss": 2.3219, - "step": 463130 - }, - { - "epoch": 0.81, - "learning_rate": 9.616974228943524e-06, - "loss": 2.3009, - "step": 463140 - }, - { - "epoch": 0.81, - "learning_rate": 9.616102289016696e-06, - "loss": 2.3077, - "step": 463150 - }, - { - "epoch": 0.81, - "learning_rate": 9.61523034908987e-06, - "loss": 2.322, - "step": 463160 - }, - { - "epoch": 0.81, - "learning_rate": 9.614358409163044e-06, - "loss": 2.2151, - "step": 463170 - }, - { - "epoch": 0.81, - "learning_rate": 9.613486469236216e-06, - "loss": 2.3262, - "step": 463180 - }, - { - "epoch": 0.81, - "learning_rate": 9.61261452930939e-06, - "loss": 2.3037, - "step": 463190 - }, - { - "epoch": 0.81, - "learning_rate": 9.611742589382562e-06, - "loss": 2.3272, - "step": 463200 - }, - { - "epoch": 0.81, - "learning_rate": 9.610870649455735e-06, - "loss": 2.2648, - "step": 463210 - }, - { - "epoch": 0.81, - "learning_rate": 9.60999870952891e-06, - "loss": 2.3157, - "step": 463220 - }, - { - "epoch": 0.81, - "learning_rate": 9.609126769602083e-06, - "loss": 2.3418, - "step": 463230 - }, - { - "epoch": 0.81, - "learning_rate": 9.608254829675255e-06, - "loss": 2.2101, - "step": 463240 - }, - { - "epoch": 0.81, - "learning_rate": 9.607382889748429e-06, - "loss": 2.3253, - "step": 463250 - }, - { - "epoch": 0.81, - "learning_rate": 9.606510949821601e-06, - "loss": 2.2491, - "step": 463260 - }, - { - "epoch": 0.81, - "learning_rate": 9.605639009894775e-06, - "loss": 2.1893, - "step": 463270 - }, - { - "epoch": 0.81, - "learning_rate": 9.604767069967947e-06, - "loss": 2.3761, - "step": 463280 - }, - { - "epoch": 0.81, - "learning_rate": 9.60389513004112e-06, - "loss": 2.3148, - "step": 463290 - }, - { - "epoch": 0.81, - "learning_rate": 9.603023190114294e-06, - "loss": 2.253, - "step": 463300 - }, - { - "epoch": 0.81, - "learning_rate": 9.602151250187468e-06, - "loss": 2.3344, - "step": 463310 - }, - { - "epoch": 0.81, - "learning_rate": 9.601279310260642e-06, - "loss": 2.2237, - "step": 463320 - }, - { - "epoch": 0.81, - "learning_rate": 9.600407370333814e-06, - "loss": 2.2966, - "step": 463330 - }, - { - "epoch": 0.81, - "learning_rate": 9.599535430406988e-06, - "loss": 2.3825, - "step": 463340 - }, - { - "epoch": 0.81, - "learning_rate": 9.59866349048016e-06, - "loss": 2.2171, - "step": 463350 - }, - { - "epoch": 0.81, - "learning_rate": 9.597791550553333e-06, - "loss": 2.183, - "step": 463360 - }, - { - "epoch": 0.81, - "learning_rate": 9.596919610626506e-06, - "loss": 2.1944, - "step": 463370 - }, - { - "epoch": 0.81, - "learning_rate": 9.596047670699681e-06, - "loss": 2.2783, - "step": 463380 - }, - { - "epoch": 0.81, - "learning_rate": 9.595175730772853e-06, - "loss": 2.2714, - "step": 463390 - }, - { - "epoch": 0.81, - "learning_rate": 9.594303790846027e-06, - "loss": 2.3665, - "step": 463400 - }, - { - "epoch": 0.81, - "learning_rate": 9.593431850919199e-06, - "loss": 2.2259, - "step": 463410 - }, - { - "epoch": 0.81, - "learning_rate": 9.592559910992373e-06, - "loss": 2.2529, - "step": 463420 - }, - { - "epoch": 0.81, - "learning_rate": 9.591687971065546e-06, - "loss": 2.2926, - "step": 463430 - }, - { - "epoch": 0.81, - "learning_rate": 9.590816031138719e-06, - "loss": 2.3446, - "step": 463440 - }, - { - "epoch": 0.81, - "learning_rate": 9.589944091211892e-06, - "loss": 2.2161, - "step": 463450 - }, - { - "epoch": 0.81, - "learning_rate": 9.589072151285066e-06, - "loss": 2.305, - "step": 463460 - }, - { - "epoch": 0.81, - "learning_rate": 9.58820021135824e-06, - "loss": 2.2171, - "step": 463470 - }, - { - "epoch": 0.81, - "learning_rate": 9.587328271431412e-06, - "loss": 2.2229, - "step": 463480 - }, - { - "epoch": 0.81, - "learning_rate": 9.586456331504586e-06, - "loss": 2.3728, - "step": 463490 - }, - { - "epoch": 0.81, - "learning_rate": 9.585584391577758e-06, - "loss": 2.2915, - "step": 463500 - }, - { - "epoch": 0.81, - "learning_rate": 9.584712451650932e-06, - "loss": 2.2681, - "step": 463510 - }, - { - "epoch": 0.81, - "learning_rate": 9.583840511724104e-06, - "loss": 2.2537, - "step": 463520 - }, - { - "epoch": 0.81, - "learning_rate": 9.582968571797277e-06, - "loss": 2.3889, - "step": 463530 - }, - { - "epoch": 0.81, - "learning_rate": 9.582096631870451e-06, - "loss": 2.2855, - "step": 463540 - }, - { - "epoch": 0.81, - "learning_rate": 9.581224691943625e-06, - "loss": 2.2563, - "step": 463550 - }, - { - "epoch": 0.81, - "learning_rate": 9.580352752016797e-06, - "loss": 2.4538, - "step": 463560 - }, - { - "epoch": 0.81, - "learning_rate": 9.57948081208997e-06, - "loss": 2.2932, - "step": 463570 - }, - { - "epoch": 0.81, - "learning_rate": 9.578608872163145e-06, - "loss": 2.2085, - "step": 463580 - }, - { - "epoch": 0.81, - "learning_rate": 9.577736932236317e-06, - "loss": 2.3606, - "step": 463590 - }, - { - "epoch": 0.81, - "learning_rate": 9.57686499230949e-06, - "loss": 2.2438, - "step": 463600 - }, - { - "epoch": 0.81, - "learning_rate": 9.575993052382662e-06, - "loss": 2.2384, - "step": 463610 - }, - { - "epoch": 0.81, - "learning_rate": 9.575121112455838e-06, - "loss": 2.2093, - "step": 463620 - }, - { - "epoch": 0.81, - "learning_rate": 9.57424917252901e-06, - "loss": 2.3108, - "step": 463630 - }, - { - "epoch": 0.81, - "learning_rate": 9.573377232602184e-06, - "loss": 2.1545, - "step": 463640 - }, - { - "epoch": 0.81, - "learning_rate": 9.572505292675356e-06, - "loss": 2.2412, - "step": 463650 - }, - { - "epoch": 0.81, - "learning_rate": 9.57163335274853e-06, - "loss": 2.3051, - "step": 463660 - }, - { - "epoch": 0.81, - "learning_rate": 9.570761412821702e-06, - "loss": 2.3843, - "step": 463670 - }, - { - "epoch": 0.81, - "learning_rate": 9.569889472894875e-06, - "loss": 2.2068, - "step": 463680 - }, - { - "epoch": 0.81, - "learning_rate": 9.56901753296805e-06, - "loss": 2.2292, - "step": 463690 - }, - { - "epoch": 0.81, - "learning_rate": 9.568145593041223e-06, - "loss": 2.2298, - "step": 463700 - }, - { - "epoch": 0.81, - "learning_rate": 9.567273653114397e-06, - "loss": 2.2597, - "step": 463710 - }, - { - "epoch": 0.81, - "learning_rate": 9.566401713187569e-06, - "loss": 2.1824, - "step": 463720 - }, - { - "epoch": 0.81, - "learning_rate": 9.565529773260743e-06, - "loss": 2.2518, - "step": 463730 - }, - { - "epoch": 0.81, - "learning_rate": 9.564657833333915e-06, - "loss": 2.24, - "step": 463740 - }, - { - "epoch": 0.81, - "learning_rate": 9.563785893407088e-06, - "loss": 2.2089, - "step": 463750 - }, - { - "epoch": 0.81, - "learning_rate": 9.56291395348026e-06, - "loss": 2.2578, - "step": 463760 - }, - { - "epoch": 0.81, - "learning_rate": 9.562042013553434e-06, - "loss": 2.3088, - "step": 463770 - }, - { - "epoch": 0.81, - "learning_rate": 9.561170073626608e-06, - "loss": 2.3787, - "step": 463780 - }, - { - "epoch": 0.81, - "learning_rate": 9.560298133699782e-06, - "loss": 2.3584, - "step": 463790 - }, - { - "epoch": 0.81, - "learning_rate": 9.559426193772954e-06, - "loss": 2.261, - "step": 463800 - }, - { - "epoch": 0.81, - "learning_rate": 9.558554253846128e-06, - "loss": 2.1089, - "step": 463810 - }, - { - "epoch": 0.81, - "learning_rate": 9.5576823139193e-06, - "loss": 2.2588, - "step": 463820 - }, - { - "epoch": 0.81, - "learning_rate": 9.556810373992474e-06, - "loss": 2.2269, - "step": 463830 - }, - { - "epoch": 0.81, - "learning_rate": 9.555938434065647e-06, - "loss": 2.2993, - "step": 463840 - }, - { - "epoch": 0.81, - "learning_rate": 9.55506649413882e-06, - "loss": 2.324, - "step": 463850 - }, - { - "epoch": 0.81, - "learning_rate": 9.554194554211993e-06, - "loss": 2.3146, - "step": 463860 - }, - { - "epoch": 0.81, - "learning_rate": 9.553322614285167e-06, - "loss": 2.2315, - "step": 463870 - }, - { - "epoch": 0.81, - "learning_rate": 9.55245067435834e-06, - "loss": 2.4138, - "step": 463880 - }, - { - "epoch": 0.81, - "learning_rate": 9.551578734431513e-06, - "loss": 2.1568, - "step": 463890 - }, - { - "epoch": 0.81, - "learning_rate": 9.550706794504687e-06, - "loss": 2.2545, - "step": 463900 - }, - { - "epoch": 0.81, - "learning_rate": 9.549834854577859e-06, - "loss": 2.2599, - "step": 463910 - }, - { - "epoch": 0.81, - "learning_rate": 9.548962914651032e-06, - "loss": 2.1734, - "step": 463920 - }, - { - "epoch": 0.81, - "learning_rate": 9.548090974724206e-06, - "loss": 2.2852, - "step": 463930 - }, - { - "epoch": 0.81, - "learning_rate": 9.54721903479738e-06, - "loss": 2.376, - "step": 463940 - }, - { - "epoch": 0.81, - "learning_rate": 9.546347094870552e-06, - "loss": 2.3724, - "step": 463950 - }, - { - "epoch": 0.81, - "learning_rate": 9.545475154943726e-06, - "loss": 2.2832, - "step": 463960 - }, - { - "epoch": 0.81, - "learning_rate": 9.5446032150169e-06, - "loss": 2.2743, - "step": 463970 - }, - { - "epoch": 0.81, - "learning_rate": 9.543731275090072e-06, - "loss": 2.21, - "step": 463980 - }, - { - "epoch": 0.81, - "learning_rate": 9.542859335163245e-06, - "loss": 2.3196, - "step": 463990 - }, - { - "epoch": 0.81, - "learning_rate": 9.541987395236417e-06, - "loss": 2.4368, - "step": 464000 - }, - { - "epoch": 0.81, - "learning_rate": 9.541115455309591e-06, - "loss": 2.2538, - "step": 464010 - }, - { - "epoch": 0.81, - "learning_rate": 9.540243515382765e-06, - "loss": 2.2789, - "step": 464020 - }, - { - "epoch": 0.81, - "learning_rate": 9.539371575455939e-06, - "loss": 2.3362, - "step": 464030 - }, - { - "epoch": 0.81, - "learning_rate": 9.538499635529111e-06, - "loss": 2.1835, - "step": 464040 - }, - { - "epoch": 0.81, - "learning_rate": 9.537627695602285e-06, - "loss": 2.2731, - "step": 464050 - }, - { - "epoch": 0.81, - "learning_rate": 9.536755755675457e-06, - "loss": 2.2904, - "step": 464060 - }, - { - "epoch": 0.81, - "learning_rate": 9.53588381574863e-06, - "loss": 2.2062, - "step": 464070 - }, - { - "epoch": 0.81, - "learning_rate": 9.535011875821803e-06, - "loss": 2.351, - "step": 464080 - }, - { - "epoch": 0.81, - "learning_rate": 9.534139935894976e-06, - "loss": 2.3866, - "step": 464090 - }, - { - "epoch": 0.81, - "learning_rate": 9.53326799596815e-06, - "loss": 2.271, - "step": 464100 - }, - { - "epoch": 0.81, - "learning_rate": 9.532396056041324e-06, - "loss": 2.3362, - "step": 464110 - }, - { - "epoch": 0.81, - "learning_rate": 9.531524116114498e-06, - "loss": 2.3706, - "step": 464120 - }, - { - "epoch": 0.81, - "learning_rate": 9.53065217618767e-06, - "loss": 2.3248, - "step": 464130 - }, - { - "epoch": 0.81, - "learning_rate": 9.529780236260843e-06, - "loss": 2.2477, - "step": 464140 - }, - { - "epoch": 0.81, - "learning_rate": 9.528908296334016e-06, - "loss": 2.4081, - "step": 464150 - }, - { - "epoch": 0.81, - "learning_rate": 9.52803635640719e-06, - "loss": 2.218, - "step": 464160 - }, - { - "epoch": 0.81, - "learning_rate": 9.527164416480361e-06, - "loss": 2.2943, - "step": 464170 - }, - { - "epoch": 0.81, - "learning_rate": 9.526292476553537e-06, - "loss": 2.1861, - "step": 464180 - }, - { - "epoch": 0.81, - "learning_rate": 9.525420536626709e-06, - "loss": 2.1959, - "step": 464190 - }, - { - "epoch": 0.81, - "learning_rate": 9.524548596699883e-06, - "loss": 2.2726, - "step": 464200 - }, - { - "epoch": 0.81, - "learning_rate": 9.523676656773055e-06, - "loss": 2.2803, - "step": 464210 - }, - { - "epoch": 0.81, - "learning_rate": 9.522804716846229e-06, - "loss": 2.2846, - "step": 464220 - }, - { - "epoch": 0.81, - "learning_rate": 9.521932776919402e-06, - "loss": 2.3372, - "step": 464230 - }, - { - "epoch": 0.81, - "learning_rate": 9.521060836992574e-06, - "loss": 2.3138, - "step": 464240 - }, - { - "epoch": 0.81, - "learning_rate": 9.520188897065748e-06, - "loss": 2.3496, - "step": 464250 - }, - { - "epoch": 0.81, - "learning_rate": 9.519316957138922e-06, - "loss": 2.2879, - "step": 464260 - }, - { - "epoch": 0.81, - "learning_rate": 9.518445017212096e-06, - "loss": 2.287, - "step": 464270 - }, - { - "epoch": 0.81, - "learning_rate": 9.517573077285268e-06, - "loss": 2.3332, - "step": 464280 - }, - { - "epoch": 0.81, - "learning_rate": 9.516701137358442e-06, - "loss": 2.3555, - "step": 464290 - }, - { - "epoch": 0.81, - "learning_rate": 9.515829197431614e-06, - "loss": 2.2432, - "step": 464300 - }, - { - "epoch": 0.81, - "learning_rate": 9.514957257504787e-06, - "loss": 2.3096, - "step": 464310 - }, - { - "epoch": 0.81, - "learning_rate": 9.51408531757796e-06, - "loss": 2.2806, - "step": 464320 - }, - { - "epoch": 0.81, - "learning_rate": 9.513213377651133e-06, - "loss": 2.2538, - "step": 464330 - }, - { - "epoch": 0.81, - "learning_rate": 9.512341437724307e-06, - "loss": 2.2277, - "step": 464340 - }, - { - "epoch": 0.81, - "learning_rate": 9.51146949779748e-06, - "loss": 2.3631, - "step": 464350 - }, - { - "epoch": 0.81, - "learning_rate": 9.510597557870653e-06, - "loss": 2.2753, - "step": 464360 - }, - { - "epoch": 0.81, - "learning_rate": 9.509725617943827e-06, - "loss": 2.3703, - "step": 464370 - }, - { - "epoch": 0.81, - "learning_rate": 9.508853678017e-06, - "loss": 2.2804, - "step": 464380 - }, - { - "epoch": 0.81, - "learning_rate": 9.507981738090172e-06, - "loss": 2.3168, - "step": 464390 - }, - { - "epoch": 0.81, - "learning_rate": 9.507109798163346e-06, - "loss": 2.4042, - "step": 464400 - }, - { - "epoch": 0.81, - "learning_rate": 9.506237858236518e-06, - "loss": 2.2548, - "step": 464410 - }, - { - "epoch": 0.81, - "learning_rate": 9.505365918309694e-06, - "loss": 2.2664, - "step": 464420 - }, - { - "epoch": 0.81, - "learning_rate": 9.504493978382866e-06, - "loss": 2.2417, - "step": 464430 - }, - { - "epoch": 0.81, - "learning_rate": 9.50362203845604e-06, - "loss": 2.2806, - "step": 464440 - }, - { - "epoch": 0.81, - "learning_rate": 9.502750098529212e-06, - "loss": 2.3855, - "step": 464450 - }, - { - "epoch": 0.81, - "learning_rate": 9.501878158602385e-06, - "loss": 2.2366, - "step": 464460 - }, - { - "epoch": 0.81, - "learning_rate": 9.501006218675558e-06, - "loss": 2.333, - "step": 464470 - }, - { - "epoch": 0.81, - "learning_rate": 9.500134278748731e-06, - "loss": 2.3019, - "step": 464480 - }, - { - "epoch": 0.81, - "learning_rate": 9.499262338821905e-06, - "loss": 2.2844, - "step": 464490 - }, - { - "epoch": 0.81, - "learning_rate": 9.498390398895079e-06, - "loss": 2.1582, - "step": 464500 - }, - { - "epoch": 0.81, - "learning_rate": 9.497518458968253e-06, - "loss": 2.3401, - "step": 464510 - }, - { - "epoch": 0.81, - "learning_rate": 9.496646519041425e-06, - "loss": 2.3612, - "step": 464520 - }, - { - "epoch": 0.81, - "learning_rate": 9.495774579114598e-06, - "loss": 2.2959, - "step": 464530 - }, - { - "epoch": 0.81, - "learning_rate": 9.49490263918777e-06, - "loss": 2.3885, - "step": 464540 - }, - { - "epoch": 0.81, - "learning_rate": 9.494030699260944e-06, - "loss": 2.3043, - "step": 464550 - }, - { - "epoch": 0.81, - "learning_rate": 9.493158759334116e-06, - "loss": 2.3141, - "step": 464560 - }, - { - "epoch": 0.81, - "learning_rate": 9.49228681940729e-06, - "loss": 2.1647, - "step": 464570 - }, - { - "epoch": 0.81, - "learning_rate": 9.491414879480464e-06, - "loss": 2.3067, - "step": 464580 - }, - { - "epoch": 0.81, - "learning_rate": 9.490542939553638e-06, - "loss": 2.2291, - "step": 464590 - }, - { - "epoch": 0.81, - "learning_rate": 9.48967099962681e-06, - "loss": 2.3075, - "step": 464600 - }, - { - "epoch": 0.81, - "learning_rate": 9.488799059699984e-06, - "loss": 2.4187, - "step": 464610 - }, - { - "epoch": 0.81, - "learning_rate": 9.487927119773156e-06, - "loss": 2.2761, - "step": 464620 - }, - { - "epoch": 0.81, - "learning_rate": 9.48705517984633e-06, - "loss": 2.2026, - "step": 464630 - }, - { - "epoch": 0.81, - "learning_rate": 9.486183239919503e-06, - "loss": 2.2428, - "step": 464640 - }, - { - "epoch": 0.81, - "learning_rate": 9.485311299992675e-06, - "loss": 2.299, - "step": 464650 - }, - { - "epoch": 0.81, - "learning_rate": 9.48443936006585e-06, - "loss": 2.2875, - "step": 464660 - }, - { - "epoch": 0.81, - "learning_rate": 9.483567420139023e-06, - "loss": 2.4015, - "step": 464670 - }, - { - "epoch": 0.81, - "learning_rate": 9.482695480212197e-06, - "loss": 2.1658, - "step": 464680 - }, - { - "epoch": 0.81, - "learning_rate": 9.481823540285369e-06, - "loss": 2.2701, - "step": 464690 - }, - { - "epoch": 0.81, - "learning_rate": 9.480951600358542e-06, - "loss": 2.3384, - "step": 464700 - }, - { - "epoch": 0.81, - "learning_rate": 9.480079660431714e-06, - "loss": 2.2287, - "step": 464710 - }, - { - "epoch": 0.81, - "learning_rate": 9.479207720504888e-06, - "loss": 2.2202, - "step": 464720 - }, - { - "epoch": 0.81, - "learning_rate": 9.478335780578062e-06, - "loss": 2.4132, - "step": 464730 - }, - { - "epoch": 0.81, - "learning_rate": 9.477463840651236e-06, - "loss": 2.1698, - "step": 464740 - }, - { - "epoch": 0.81, - "learning_rate": 9.476591900724408e-06, - "loss": 2.2847, - "step": 464750 - }, - { - "epoch": 0.81, - "learning_rate": 9.475719960797582e-06, - "loss": 2.2116, - "step": 464760 - }, - { - "epoch": 0.81, - "learning_rate": 9.474848020870755e-06, - "loss": 2.3476, - "step": 464770 - }, - { - "epoch": 0.81, - "learning_rate": 9.473976080943927e-06, - "loss": 2.2488, - "step": 464780 - }, - { - "epoch": 0.81, - "learning_rate": 9.473104141017101e-06, - "loss": 2.2156, - "step": 464790 - }, - { - "epoch": 0.81, - "learning_rate": 9.472232201090273e-06, - "loss": 2.4621, - "step": 464800 - }, - { - "epoch": 0.81, - "learning_rate": 9.471360261163447e-06, - "loss": 2.3295, - "step": 464810 - }, - { - "epoch": 0.81, - "learning_rate": 9.470488321236621e-06, - "loss": 2.3023, - "step": 464820 - }, - { - "epoch": 0.81, - "learning_rate": 9.469616381309795e-06, - "loss": 2.2363, - "step": 464830 - }, - { - "epoch": 0.81, - "learning_rate": 9.468744441382967e-06, - "loss": 2.3424, - "step": 464840 - }, - { - "epoch": 0.81, - "learning_rate": 9.46787250145614e-06, - "loss": 2.2067, - "step": 464850 - }, - { - "epoch": 0.81, - "learning_rate": 9.467000561529313e-06, - "loss": 2.2296, - "step": 464860 - }, - { - "epoch": 0.81, - "learning_rate": 9.466128621602486e-06, - "loss": 2.244, - "step": 464870 - }, - { - "epoch": 0.81, - "learning_rate": 9.465256681675658e-06, - "loss": 2.2382, - "step": 464880 - }, - { - "epoch": 0.81, - "learning_rate": 9.464384741748832e-06, - "loss": 2.199, - "step": 464890 - }, - { - "epoch": 0.81, - "learning_rate": 9.463512801822006e-06, - "loss": 2.2164, - "step": 464900 - }, - { - "epoch": 0.81, - "learning_rate": 9.46264086189518e-06, - "loss": 2.3531, - "step": 464910 - }, - { - "epoch": 0.81, - "learning_rate": 9.461768921968353e-06, - "loss": 2.2779, - "step": 464920 - }, - { - "epoch": 0.81, - "learning_rate": 9.460896982041526e-06, - "loss": 2.2544, - "step": 464930 - }, - { - "epoch": 0.81, - "learning_rate": 9.4600250421147e-06, - "loss": 2.2201, - "step": 464940 - }, - { - "epoch": 0.81, - "learning_rate": 9.459153102187871e-06, - "loss": 2.3248, - "step": 464950 - }, - { - "epoch": 0.81, - "learning_rate": 9.458281162261045e-06, - "loss": 2.262, - "step": 464960 - }, - { - "epoch": 0.81, - "learning_rate": 9.457409222334219e-06, - "loss": 2.3265, - "step": 464970 - }, - { - "epoch": 0.81, - "learning_rate": 9.456537282407393e-06, - "loss": 2.1953, - "step": 464980 - }, - { - "epoch": 0.81, - "learning_rate": 9.455665342480565e-06, - "loss": 2.2495, - "step": 464990 - }, - { - "epoch": 0.81, - "learning_rate": 9.454793402553739e-06, - "loss": 2.2498, - "step": 465000 - }, - { - "epoch": 0.81, - "learning_rate": 9.45392146262691e-06, - "loss": 2.193, - "step": 465010 - }, - { - "epoch": 0.81, - "learning_rate": 9.453049522700084e-06, - "loss": 2.2302, - "step": 465020 - }, - { - "epoch": 0.81, - "learning_rate": 9.452177582773258e-06, - "loss": 2.3052, - "step": 465030 - }, - { - "epoch": 0.81, - "learning_rate": 9.45130564284643e-06, - "loss": 2.3187, - "step": 465040 - }, - { - "epoch": 0.81, - "learning_rate": 9.450433702919604e-06, - "loss": 2.2977, - "step": 465050 - }, - { - "epoch": 0.81, - "learning_rate": 9.449561762992778e-06, - "loss": 2.3282, - "step": 465060 - }, - { - "epoch": 0.81, - "learning_rate": 9.448689823065952e-06, - "loss": 2.2754, - "step": 465070 - }, - { - "epoch": 0.81, - "learning_rate": 9.447817883139124e-06, - "loss": 2.2461, - "step": 465080 - }, - { - "epoch": 0.81, - "learning_rate": 9.446945943212297e-06, - "loss": 2.2569, - "step": 465090 - }, - { - "epoch": 0.81, - "learning_rate": 9.44607400328547e-06, - "loss": 2.2876, - "step": 465100 - }, - { - "epoch": 0.81, - "learning_rate": 9.445202063358643e-06, - "loss": 2.3476, - "step": 465110 - }, - { - "epoch": 0.81, - "learning_rate": 9.444330123431815e-06, - "loss": 2.2372, - "step": 465120 - }, - { - "epoch": 0.81, - "learning_rate": 9.443458183504989e-06, - "loss": 2.3945, - "step": 465130 - }, - { - "epoch": 0.81, - "learning_rate": 9.442586243578163e-06, - "loss": 2.2113, - "step": 465140 - }, - { - "epoch": 0.81, - "learning_rate": 9.441714303651337e-06, - "loss": 2.209, - "step": 465150 - }, - { - "epoch": 0.81, - "learning_rate": 9.44084236372451e-06, - "loss": 2.3132, - "step": 465160 - }, - { - "epoch": 0.81, - "learning_rate": 9.439970423797682e-06, - "loss": 2.2412, - "step": 465170 - }, - { - "epoch": 0.81, - "learning_rate": 9.439098483870856e-06, - "loss": 2.3951, - "step": 465180 - }, - { - "epoch": 0.81, - "learning_rate": 9.438226543944028e-06, - "loss": 2.4415, - "step": 465190 - }, - { - "epoch": 0.81, - "learning_rate": 9.437354604017202e-06, - "loss": 2.3874, - "step": 465200 - }, - { - "epoch": 0.81, - "learning_rate": 9.436482664090374e-06, - "loss": 2.3114, - "step": 465210 - }, - { - "epoch": 0.81, - "learning_rate": 9.43561072416355e-06, - "loss": 2.3312, - "step": 465220 - }, - { - "epoch": 0.81, - "learning_rate": 9.434738784236722e-06, - "loss": 2.1296, - "step": 465230 - }, - { - "epoch": 0.81, - "learning_rate": 9.433866844309895e-06, - "loss": 2.218, - "step": 465240 - }, - { - "epoch": 0.81, - "learning_rate": 9.432994904383068e-06, - "loss": 2.3336, - "step": 465250 - }, - { - "epoch": 0.81, - "learning_rate": 9.432122964456241e-06, - "loss": 2.2695, - "step": 465260 - }, - { - "epoch": 0.81, - "learning_rate": 9.431251024529413e-06, - "loss": 2.3797, - "step": 465270 - }, - { - "epoch": 0.81, - "learning_rate": 9.430379084602587e-06, - "loss": 2.3055, - "step": 465280 - }, - { - "epoch": 0.81, - "learning_rate": 9.429507144675761e-06, - "loss": 2.354, - "step": 465290 - }, - { - "epoch": 0.81, - "learning_rate": 9.428635204748935e-06, - "loss": 2.3488, - "step": 465300 - }, - { - "epoch": 0.81, - "learning_rate": 9.427763264822108e-06, - "loss": 2.4137, - "step": 465310 - }, - { - "epoch": 0.81, - "learning_rate": 9.42689132489528e-06, - "loss": 2.1888, - "step": 465320 - }, - { - "epoch": 0.81, - "learning_rate": 9.426019384968454e-06, - "loss": 2.383, - "step": 465330 - }, - { - "epoch": 0.81, - "learning_rate": 9.425147445041626e-06, - "loss": 2.2878, - "step": 465340 - }, - { - "epoch": 0.81, - "learning_rate": 9.4242755051148e-06, - "loss": 2.2034, - "step": 465350 - }, - { - "epoch": 0.81, - "learning_rate": 9.423403565187972e-06, - "loss": 2.2333, - "step": 465360 - }, - { - "epoch": 0.81, - "learning_rate": 9.422531625261146e-06, - "loss": 2.2315, - "step": 465370 - }, - { - "epoch": 0.81, - "learning_rate": 9.42165968533432e-06, - "loss": 2.369, - "step": 465380 - }, - { - "epoch": 0.81, - "learning_rate": 9.420787745407494e-06, - "loss": 2.233, - "step": 465390 - }, - { - "epoch": 0.81, - "learning_rate": 9.419915805480666e-06, - "loss": 2.3456, - "step": 465400 - }, - { - "epoch": 0.81, - "learning_rate": 9.41904386555384e-06, - "loss": 2.164, - "step": 465410 - }, - { - "epoch": 0.81, - "learning_rate": 9.418171925627011e-06, - "loss": 2.3369, - "step": 465420 - }, - { - "epoch": 0.81, - "learning_rate": 9.417299985700185e-06, - "loss": 2.3116, - "step": 465430 - }, - { - "epoch": 0.81, - "learning_rate": 9.416428045773359e-06, - "loss": 2.1963, - "step": 465440 - }, - { - "epoch": 0.81, - "learning_rate": 9.415556105846531e-06, - "loss": 2.2613, - "step": 465450 - }, - { - "epoch": 0.81, - "learning_rate": 9.414684165919707e-06, - "loss": 2.2578, - "step": 465460 - }, - { - "epoch": 0.81, - "learning_rate": 9.413812225992879e-06, - "loss": 2.3095, - "step": 465470 - }, - { - "epoch": 0.81, - "learning_rate": 9.412940286066052e-06, - "loss": 2.3118, - "step": 465480 - }, - { - "epoch": 0.81, - "learning_rate": 9.412068346139224e-06, - "loss": 2.2322, - "step": 465490 - }, - { - "epoch": 0.81, - "learning_rate": 9.411196406212398e-06, - "loss": 2.3372, - "step": 465500 - }, - { - "epoch": 0.81, - "learning_rate": 9.41032446628557e-06, - "loss": 2.254, - "step": 465510 - }, - { - "epoch": 0.81, - "learning_rate": 9.409452526358744e-06, - "loss": 2.3581, - "step": 465520 - }, - { - "epoch": 0.81, - "learning_rate": 9.408580586431918e-06, - "loss": 2.3527, - "step": 465530 - }, - { - "epoch": 0.81, - "learning_rate": 9.407708646505092e-06, - "loss": 2.2541, - "step": 465540 - }, - { - "epoch": 0.81, - "learning_rate": 9.406836706578264e-06, - "loss": 2.3878, - "step": 465550 - }, - { - "epoch": 0.81, - "learning_rate": 9.405964766651437e-06, - "loss": 2.2432, - "step": 465560 - }, - { - "epoch": 0.81, - "learning_rate": 9.405092826724611e-06, - "loss": 2.2939, - "step": 465570 - }, - { - "epoch": 0.81, - "learning_rate": 9.404220886797783e-06, - "loss": 2.3414, - "step": 465580 - }, - { - "epoch": 0.81, - "learning_rate": 9.403348946870957e-06, - "loss": 2.3944, - "step": 465590 - }, - { - "epoch": 0.81, - "learning_rate": 9.40247700694413e-06, - "loss": 2.2318, - "step": 465600 - }, - { - "epoch": 0.81, - "learning_rate": 9.401605067017303e-06, - "loss": 2.1803, - "step": 465610 - }, - { - "epoch": 0.81, - "learning_rate": 9.400733127090477e-06, - "loss": 2.2965, - "step": 465620 - }, - { - "epoch": 0.81, - "learning_rate": 9.39986118716365e-06, - "loss": 2.3262, - "step": 465630 - }, - { - "epoch": 0.81, - "learning_rate": 9.398989247236823e-06, - "loss": 2.3602, - "step": 465640 - }, - { - "epoch": 0.81, - "learning_rate": 9.398117307309996e-06, - "loss": 2.2377, - "step": 465650 - }, - { - "epoch": 0.81, - "learning_rate": 9.397245367383168e-06, - "loss": 2.2079, - "step": 465660 - }, - { - "epoch": 0.81, - "learning_rate": 9.396373427456342e-06, - "loss": 2.2865, - "step": 465670 - }, - { - "epoch": 0.81, - "learning_rate": 9.395501487529514e-06, - "loss": 2.3769, - "step": 465680 - }, - { - "epoch": 0.81, - "learning_rate": 9.394629547602688e-06, - "loss": 2.3081, - "step": 465690 - }, - { - "epoch": 0.81, - "learning_rate": 9.393757607675863e-06, - "loss": 2.3759, - "step": 465700 - }, - { - "epoch": 0.81, - "learning_rate": 9.392885667749036e-06, - "loss": 2.2342, - "step": 465710 - }, - { - "epoch": 0.81, - "learning_rate": 9.39201372782221e-06, - "loss": 2.3388, - "step": 465720 - }, - { - "epoch": 0.81, - "learning_rate": 9.391141787895381e-06, - "loss": 2.4401, - "step": 465730 - }, - { - "epoch": 0.81, - "learning_rate": 9.390269847968555e-06, - "loss": 2.2444, - "step": 465740 - }, - { - "epoch": 0.81, - "learning_rate": 9.389397908041727e-06, - "loss": 2.2846, - "step": 465750 - }, - { - "epoch": 0.81, - "learning_rate": 9.388525968114901e-06, - "loss": 2.2863, - "step": 465760 - }, - { - "epoch": 0.81, - "learning_rate": 9.387654028188075e-06, - "loss": 2.3823, - "step": 465770 - }, - { - "epoch": 0.81, - "learning_rate": 9.386782088261249e-06, - "loss": 2.3122, - "step": 465780 - }, - { - "epoch": 0.81, - "learning_rate": 9.38591014833442e-06, - "loss": 2.2337, - "step": 465790 - }, - { - "epoch": 0.81, - "learning_rate": 9.385038208407594e-06, - "loss": 2.2701, - "step": 465800 - }, - { - "epoch": 0.81, - "learning_rate": 9.384166268480766e-06, - "loss": 2.2521, - "step": 465810 - }, - { - "epoch": 0.81, - "learning_rate": 9.38329432855394e-06, - "loss": 2.2585, - "step": 465820 - }, - { - "epoch": 0.81, - "learning_rate": 9.382422388627114e-06, - "loss": 2.3538, - "step": 465830 - }, - { - "epoch": 0.81, - "learning_rate": 9.381550448700286e-06, - "loss": 2.3531, - "step": 465840 - }, - { - "epoch": 0.81, - "learning_rate": 9.38067850877346e-06, - "loss": 2.3538, - "step": 465850 - }, - { - "epoch": 0.81, - "learning_rate": 9.379806568846634e-06, - "loss": 2.394, - "step": 465860 - }, - { - "epoch": 0.81, - "learning_rate": 9.378934628919807e-06, - "loss": 2.2953, - "step": 465870 - }, - { - "epoch": 0.81, - "learning_rate": 9.37806268899298e-06, - "loss": 2.2795, - "step": 465880 - }, - { - "epoch": 0.81, - "learning_rate": 9.377190749066153e-06, - "loss": 2.2722, - "step": 465890 - }, - { - "epoch": 0.81, - "learning_rate": 9.376318809139325e-06, - "loss": 2.2738, - "step": 465900 - }, - { - "epoch": 0.81, - "learning_rate": 9.375446869212499e-06, - "loss": 2.279, - "step": 465910 - }, - { - "epoch": 0.81, - "learning_rate": 9.374574929285671e-06, - "loss": 2.314, - "step": 465920 - }, - { - "epoch": 0.81, - "learning_rate": 9.373702989358845e-06, - "loss": 2.249, - "step": 465930 - }, - { - "epoch": 0.81, - "learning_rate": 9.372831049432019e-06, - "loss": 2.2731, - "step": 465940 - }, - { - "epoch": 0.81, - "learning_rate": 9.371959109505192e-06, - "loss": 2.31, - "step": 465950 - }, - { - "epoch": 0.81, - "learning_rate": 9.371087169578366e-06, - "loss": 2.2732, - "step": 465960 - }, - { - "epoch": 0.81, - "learning_rate": 9.370215229651538e-06, - "loss": 2.3234, - "step": 465970 - }, - { - "epoch": 0.81, - "learning_rate": 9.369343289724712e-06, - "loss": 2.2397, - "step": 465980 - }, - { - "epoch": 0.81, - "learning_rate": 9.368471349797884e-06, - "loss": 2.3734, - "step": 465990 - }, - { - "epoch": 0.81, - "learning_rate": 9.367599409871058e-06, - "loss": 2.3616, - "step": 466000 - }, - { - "epoch": 0.81, - "learning_rate": 9.366727469944232e-06, - "loss": 2.3552, - "step": 466010 - }, - { - "epoch": 0.81, - "learning_rate": 9.365855530017405e-06, - "loss": 2.3402, - "step": 466020 - }, - { - "epoch": 0.81, - "learning_rate": 9.364983590090578e-06, - "loss": 2.4025, - "step": 466030 - }, - { - "epoch": 0.81, - "learning_rate": 9.364111650163751e-06, - "loss": 2.2366, - "step": 466040 - }, - { - "epoch": 0.81, - "learning_rate": 9.363239710236923e-06, - "loss": 2.2907, - "step": 466050 - }, - { - "epoch": 0.81, - "learning_rate": 9.362367770310097e-06, - "loss": 2.2637, - "step": 466060 - }, - { - "epoch": 0.81, - "learning_rate": 9.36149583038327e-06, - "loss": 2.2147, - "step": 466070 - }, - { - "epoch": 0.81, - "learning_rate": 9.360623890456443e-06, - "loss": 2.2131, - "step": 466080 - }, - { - "epoch": 0.81, - "learning_rate": 9.359751950529617e-06, - "loss": 2.1871, - "step": 466090 - }, - { - "epoch": 0.81, - "learning_rate": 9.35888001060279e-06, - "loss": 2.3621, - "step": 466100 - }, - { - "epoch": 0.81, - "learning_rate": 9.358008070675964e-06, - "loss": 2.2101, - "step": 466110 - }, - { - "epoch": 0.81, - "learning_rate": 9.357136130749136e-06, - "loss": 2.257, - "step": 466120 - }, - { - "epoch": 0.81, - "learning_rate": 9.35626419082231e-06, - "loss": 2.2399, - "step": 466130 - }, - { - "epoch": 0.81, - "learning_rate": 9.355392250895482e-06, - "loss": 2.3785, - "step": 466140 - }, - { - "epoch": 0.81, - "learning_rate": 9.354520310968656e-06, - "loss": 2.2134, - "step": 466150 - }, - { - "epoch": 0.81, - "learning_rate": 9.353648371041828e-06, - "loss": 2.1664, - "step": 466160 - }, - { - "epoch": 0.81, - "learning_rate": 9.352776431115002e-06, - "loss": 2.2, - "step": 466170 - }, - { - "epoch": 0.81, - "learning_rate": 9.351904491188176e-06, - "loss": 2.2571, - "step": 466180 - }, - { - "epoch": 0.81, - "learning_rate": 9.35103255126135e-06, - "loss": 2.2913, - "step": 466190 - }, - { - "epoch": 0.81, - "learning_rate": 9.350160611334521e-06, - "loss": 2.2974, - "step": 466200 - }, - { - "epoch": 0.81, - "learning_rate": 9.349288671407695e-06, - "loss": 2.3152, - "step": 466210 - }, - { - "epoch": 0.81, - "learning_rate": 9.348416731480867e-06, - "loss": 2.2331, - "step": 466220 - }, - { - "epoch": 0.81, - "learning_rate": 9.347544791554041e-06, - "loss": 2.308, - "step": 466230 - }, - { - "epoch": 0.81, - "learning_rate": 9.346672851627215e-06, - "loss": 2.2191, - "step": 466240 - }, - { - "epoch": 0.81, - "learning_rate": 9.345800911700387e-06, - "loss": 2.3775, - "step": 466250 - }, - { - "epoch": 0.81, - "learning_rate": 9.344928971773562e-06, - "loss": 2.261, - "step": 466260 - }, - { - "epoch": 0.81, - "learning_rate": 9.344057031846734e-06, - "loss": 2.2567, - "step": 466270 - }, - { - "epoch": 0.81, - "learning_rate": 9.343185091919908e-06, - "loss": 2.3137, - "step": 466280 - }, - { - "epoch": 0.81, - "learning_rate": 9.34231315199308e-06, - "loss": 2.2645, - "step": 466290 - }, - { - "epoch": 0.81, - "learning_rate": 9.341441212066254e-06, - "loss": 2.3091, - "step": 466300 - }, - { - "epoch": 0.81, - "learning_rate": 9.340569272139426e-06, - "loss": 2.2773, - "step": 466310 - }, - { - "epoch": 0.81, - "learning_rate": 9.3396973322126e-06, - "loss": 2.1607, - "step": 466320 - }, - { - "epoch": 0.81, - "learning_rate": 9.338825392285774e-06, - "loss": 2.2864, - "step": 466330 - }, - { - "epoch": 0.81, - "learning_rate": 9.337953452358947e-06, - "loss": 2.3671, - "step": 466340 - }, - { - "epoch": 0.81, - "learning_rate": 9.33708151243212e-06, - "loss": 2.3358, - "step": 466350 - }, - { - "epoch": 0.81, - "learning_rate": 9.336209572505293e-06, - "loss": 2.1329, - "step": 466360 - }, - { - "epoch": 0.81, - "learning_rate": 9.335337632578467e-06, - "loss": 2.3235, - "step": 466370 - }, - { - "epoch": 0.81, - "learning_rate": 9.33446569265164e-06, - "loss": 2.2316, - "step": 466380 - }, - { - "epoch": 0.81, - "learning_rate": 9.333593752724813e-06, - "loss": 2.2176, - "step": 466390 - }, - { - "epoch": 0.81, - "learning_rate": 9.332721812797985e-06, - "loss": 2.2735, - "step": 466400 - }, - { - "epoch": 0.81, - "learning_rate": 9.331849872871159e-06, - "loss": 2.3764, - "step": 466410 - }, - { - "epoch": 0.81, - "learning_rate": 9.330977932944333e-06, - "loss": 2.2556, - "step": 466420 - }, - { - "epoch": 0.81, - "learning_rate": 9.330105993017506e-06, - "loss": 2.2701, - "step": 466430 - }, - { - "epoch": 0.81, - "learning_rate": 9.329234053090678e-06, - "loss": 2.2671, - "step": 466440 - }, - { - "epoch": 0.81, - "learning_rate": 9.328362113163852e-06, - "loss": 2.2928, - "step": 466450 - }, - { - "epoch": 0.81, - "learning_rate": 9.327490173237024e-06, - "loss": 2.2962, - "step": 466460 - }, - { - "epoch": 0.81, - "learning_rate": 9.326618233310198e-06, - "loss": 2.2354, - "step": 466470 - }, - { - "epoch": 0.81, - "learning_rate": 9.32574629338337e-06, - "loss": 2.1893, - "step": 466480 - }, - { - "epoch": 0.81, - "learning_rate": 9.324874353456544e-06, - "loss": 2.1898, - "step": 466490 - }, - { - "epoch": 0.81, - "learning_rate": 9.32400241352972e-06, - "loss": 2.2342, - "step": 466500 - }, - { - "epoch": 0.81, - "learning_rate": 9.323130473602891e-06, - "loss": 2.3733, - "step": 466510 - }, - { - "epoch": 0.81, - "learning_rate": 9.322258533676065e-06, - "loss": 2.1596, - "step": 466520 - }, - { - "epoch": 0.81, - "learning_rate": 9.321386593749237e-06, - "loss": 2.3527, - "step": 466530 - }, - { - "epoch": 0.81, - "learning_rate": 9.320514653822411e-06, - "loss": 2.2471, - "step": 466540 - }, - { - "epoch": 0.81, - "learning_rate": 9.319642713895583e-06, - "loss": 2.2877, - "step": 466550 - }, - { - "epoch": 0.81, - "learning_rate": 9.318770773968757e-06, - "loss": 2.2479, - "step": 466560 - }, - { - "epoch": 0.81, - "learning_rate": 9.31789883404193e-06, - "loss": 2.2463, - "step": 466570 - }, - { - "epoch": 0.81, - "learning_rate": 9.317026894115104e-06, - "loss": 2.2274, - "step": 466580 - }, - { - "epoch": 0.81, - "learning_rate": 9.316154954188276e-06, - "loss": 2.3215, - "step": 466590 - }, - { - "epoch": 0.81, - "learning_rate": 9.31528301426145e-06, - "loss": 2.1582, - "step": 466600 - }, - { - "epoch": 0.81, - "learning_rate": 9.314411074334622e-06, - "loss": 2.3235, - "step": 466610 - }, - { - "epoch": 0.81, - "learning_rate": 9.313539134407796e-06, - "loss": 2.1922, - "step": 466620 - }, - { - "epoch": 0.81, - "learning_rate": 9.31266719448097e-06, - "loss": 2.2843, - "step": 466630 - }, - { - "epoch": 0.81, - "learning_rate": 9.311795254554142e-06, - "loss": 2.2052, - "step": 466640 - }, - { - "epoch": 0.81, - "learning_rate": 9.310923314627316e-06, - "loss": 2.2298, - "step": 466650 - }, - { - "epoch": 0.81, - "learning_rate": 9.31005137470049e-06, - "loss": 2.1759, - "step": 466660 - }, - { - "epoch": 0.81, - "learning_rate": 9.309179434773663e-06, - "loss": 2.3576, - "step": 466670 - }, - { - "epoch": 0.81, - "learning_rate": 9.308307494846835e-06, - "loss": 2.1529, - "step": 466680 - }, - { - "epoch": 0.81, - "learning_rate": 9.307435554920009e-06, - "loss": 2.3027, - "step": 466690 - }, - { - "epoch": 0.81, - "learning_rate": 9.306563614993181e-06, - "loss": 2.2786, - "step": 466700 - }, - { - "epoch": 0.81, - "learning_rate": 9.305691675066355e-06, - "loss": 2.2102, - "step": 466710 - }, - { - "epoch": 0.81, - "learning_rate": 9.304819735139527e-06, - "loss": 2.1534, - "step": 466720 - }, - { - "epoch": 0.81, - "learning_rate": 9.3039477952127e-06, - "loss": 2.3403, - "step": 466730 - }, - { - "epoch": 0.81, - "learning_rate": 9.303075855285875e-06, - "loss": 2.2204, - "step": 466740 - }, - { - "epoch": 0.81, - "learning_rate": 9.302203915359048e-06, - "loss": 2.3151, - "step": 466750 - }, - { - "epoch": 0.81, - "learning_rate": 9.301331975432222e-06, - "loss": 2.3386, - "step": 466760 - }, - { - "epoch": 0.81, - "learning_rate": 9.300460035505394e-06, - "loss": 2.2802, - "step": 466770 - }, - { - "epoch": 0.81, - "learning_rate": 9.299588095578568e-06, - "loss": 2.296, - "step": 466780 - }, - { - "epoch": 0.81, - "learning_rate": 9.29871615565174e-06, - "loss": 2.2729, - "step": 466790 - }, - { - "epoch": 0.81, - "learning_rate": 9.297844215724914e-06, - "loss": 2.2986, - "step": 466800 - }, - { - "epoch": 0.81, - "learning_rate": 9.296972275798088e-06, - "loss": 2.3128, - "step": 466810 - }, - { - "epoch": 0.81, - "learning_rate": 9.296100335871261e-06, - "loss": 2.2972, - "step": 466820 - }, - { - "epoch": 0.81, - "learning_rate": 9.295228395944433e-06, - "loss": 2.3047, - "step": 466830 - }, - { - "epoch": 0.81, - "learning_rate": 9.294356456017607e-06, - "loss": 2.2326, - "step": 466840 - }, - { - "epoch": 0.81, - "learning_rate": 9.29348451609078e-06, - "loss": 2.3383, - "step": 466850 - }, - { - "epoch": 0.81, - "learning_rate": 9.292612576163953e-06, - "loss": 2.2055, - "step": 466860 - }, - { - "epoch": 0.81, - "learning_rate": 9.291740636237125e-06, - "loss": 2.2484, - "step": 466870 - }, - { - "epoch": 0.81, - "learning_rate": 9.290868696310299e-06, - "loss": 2.297, - "step": 466880 - }, - { - "epoch": 0.81, - "learning_rate": 9.289996756383473e-06, - "loss": 2.3011, - "step": 466890 - }, - { - "epoch": 0.81, - "learning_rate": 9.289124816456646e-06, - "loss": 2.2858, - "step": 466900 - }, - { - "epoch": 0.81, - "learning_rate": 9.28825287652982e-06, - "loss": 2.3175, - "step": 466910 - }, - { - "epoch": 0.81, - "learning_rate": 9.287380936602992e-06, - "loss": 2.277, - "step": 466920 - }, - { - "epoch": 0.81, - "learning_rate": 9.286508996676166e-06, - "loss": 2.1882, - "step": 466930 - }, - { - "epoch": 0.81, - "learning_rate": 9.285637056749338e-06, - "loss": 2.3222, - "step": 466940 - }, - { - "epoch": 0.81, - "learning_rate": 9.284765116822512e-06, - "loss": 2.3349, - "step": 466950 - }, - { - "epoch": 0.81, - "learning_rate": 9.283893176895684e-06, - "loss": 2.3449, - "step": 466960 - }, - { - "epoch": 0.81, - "learning_rate": 9.283021236968858e-06, - "loss": 2.387, - "step": 466970 - }, - { - "epoch": 0.81, - "learning_rate": 9.282149297042031e-06, - "loss": 2.2316, - "step": 466980 - }, - { - "epoch": 0.81, - "learning_rate": 9.281277357115205e-06, - "loss": 2.3111, - "step": 466990 - }, - { - "epoch": 0.81, - "learning_rate": 9.280405417188377e-06, - "loss": 2.2855, - "step": 467000 - }, - { - "epoch": 0.81, - "learning_rate": 9.279533477261551e-06, - "loss": 2.209, - "step": 467010 - }, - { - "epoch": 0.81, - "learning_rate": 9.278661537334723e-06, - "loss": 2.1707, - "step": 467020 - }, - { - "epoch": 0.81, - "learning_rate": 9.277789597407897e-06, - "loss": 2.189, - "step": 467030 - }, - { - "epoch": 0.81, - "learning_rate": 9.27691765748107e-06, - "loss": 2.3714, - "step": 467040 - }, - { - "epoch": 0.81, - "learning_rate": 9.276045717554244e-06, - "loss": 2.1723, - "step": 467050 - }, - { - "epoch": 0.81, - "learning_rate": 9.275173777627418e-06, - "loss": 2.1954, - "step": 467060 - }, - { - "epoch": 0.81, - "learning_rate": 9.27430183770059e-06, - "loss": 2.1512, - "step": 467070 - }, - { - "epoch": 0.81, - "learning_rate": 9.273429897773764e-06, - "loss": 2.2387, - "step": 467080 - }, - { - "epoch": 0.81, - "learning_rate": 9.272557957846936e-06, - "loss": 2.2259, - "step": 467090 - }, - { - "epoch": 0.81, - "learning_rate": 9.27168601792011e-06, - "loss": 2.235, - "step": 467100 - }, - { - "epoch": 0.81, - "learning_rate": 9.270814077993282e-06, - "loss": 2.344, - "step": 467110 - }, - { - "epoch": 0.81, - "learning_rate": 9.269942138066456e-06, - "loss": 2.3667, - "step": 467120 - }, - { - "epoch": 0.81, - "learning_rate": 9.26907019813963e-06, - "loss": 2.3357, - "step": 467130 - }, - { - "epoch": 0.81, - "learning_rate": 9.268198258212803e-06, - "loss": 2.2116, - "step": 467140 - }, - { - "epoch": 0.81, - "learning_rate": 9.267326318285975e-06, - "loss": 2.1586, - "step": 467150 - }, - { - "epoch": 0.81, - "learning_rate": 9.26645437835915e-06, - "loss": 2.2305, - "step": 467160 - }, - { - "epoch": 0.81, - "learning_rate": 9.265582438432323e-06, - "loss": 2.2312, - "step": 467170 - }, - { - "epoch": 0.81, - "learning_rate": 9.264710498505495e-06, - "loss": 2.3675, - "step": 467180 - }, - { - "epoch": 0.81, - "learning_rate": 9.263838558578669e-06, - "loss": 2.4337, - "step": 467190 - }, - { - "epoch": 0.81, - "learning_rate": 9.262966618651841e-06, - "loss": 2.1842, - "step": 467200 - }, - { - "epoch": 0.81, - "learning_rate": 9.262094678725015e-06, - "loss": 2.182, - "step": 467210 - }, - { - "epoch": 0.81, - "learning_rate": 9.261222738798188e-06, - "loss": 2.1124, - "step": 467220 - }, - { - "epoch": 0.81, - "learning_rate": 9.260350798871362e-06, - "loss": 2.0656, - "step": 467230 - }, - { - "epoch": 0.81, - "learning_rate": 9.259478858944534e-06, - "loss": 2.3149, - "step": 467240 - }, - { - "epoch": 0.81, - "learning_rate": 9.258606919017708e-06, - "loss": 2.2024, - "step": 467250 - }, - { - "epoch": 0.81, - "learning_rate": 9.25773497909088e-06, - "loss": 2.2931, - "step": 467260 - }, - { - "epoch": 0.81, - "learning_rate": 9.256863039164054e-06, - "loss": 2.3289, - "step": 467270 - }, - { - "epoch": 0.81, - "learning_rate": 9.255991099237226e-06, - "loss": 2.3462, - "step": 467280 - }, - { - "epoch": 0.81, - "learning_rate": 9.255119159310401e-06, - "loss": 2.1945, - "step": 467290 - }, - { - "epoch": 0.81, - "learning_rate": 9.254247219383575e-06, - "loss": 2.2288, - "step": 467300 - }, - { - "epoch": 0.81, - "learning_rate": 9.253375279456747e-06, - "loss": 2.315, - "step": 467310 - }, - { - "epoch": 0.81, - "learning_rate": 9.252503339529921e-06, - "loss": 2.3146, - "step": 467320 - }, - { - "epoch": 0.81, - "learning_rate": 9.251631399603093e-06, - "loss": 2.3032, - "step": 467330 - }, - { - "epoch": 0.81, - "learning_rate": 9.250759459676267e-06, - "loss": 2.2879, - "step": 467340 - }, - { - "epoch": 0.82, - "learning_rate": 9.249887519749439e-06, - "loss": 2.3432, - "step": 467350 - }, - { - "epoch": 0.82, - "learning_rate": 9.249015579822613e-06, - "loss": 2.2839, - "step": 467360 - }, - { - "epoch": 0.82, - "learning_rate": 9.248143639895787e-06, - "loss": 2.3281, - "step": 467370 - }, - { - "epoch": 0.82, - "learning_rate": 9.24727169996896e-06, - "loss": 2.2762, - "step": 467380 - }, - { - "epoch": 0.82, - "learning_rate": 9.246399760042132e-06, - "loss": 2.2475, - "step": 467390 - }, - { - "epoch": 0.82, - "learning_rate": 9.245527820115306e-06, - "loss": 2.3241, - "step": 467400 - }, - { - "epoch": 0.82, - "learning_rate": 9.244655880188478e-06, - "loss": 2.2361, - "step": 467410 - }, - { - "epoch": 0.82, - "learning_rate": 9.243783940261652e-06, - "loss": 2.3974, - "step": 467420 - }, - { - "epoch": 0.82, - "learning_rate": 9.242912000334826e-06, - "loss": 2.32, - "step": 467430 - }, - { - "epoch": 0.82, - "learning_rate": 9.242040060407998e-06, - "loss": 2.2903, - "step": 467440 - }, - { - "epoch": 0.82, - "learning_rate": 9.241168120481172e-06, - "loss": 2.3442, - "step": 467450 - }, - { - "epoch": 0.82, - "learning_rate": 9.240296180554345e-06, - "loss": 2.2708, - "step": 467460 - }, - { - "epoch": 0.82, - "learning_rate": 9.239424240627519e-06, - "loss": 2.2726, - "step": 467470 - }, - { - "epoch": 0.82, - "learning_rate": 9.238552300700691e-06, - "loss": 2.3186, - "step": 467480 - }, - { - "epoch": 0.82, - "learning_rate": 9.237680360773865e-06, - "loss": 2.2975, - "step": 467490 - }, - { - "epoch": 0.82, - "learning_rate": 9.236808420847037e-06, - "loss": 2.2826, - "step": 467500 - }, - { - "epoch": 0.82, - "learning_rate": 9.23593648092021e-06, - "loss": 2.2842, - "step": 467510 - }, - { - "epoch": 0.82, - "learning_rate": 9.235064540993383e-06, - "loss": 2.3007, - "step": 467520 - }, - { - "epoch": 0.82, - "learning_rate": 9.234192601066557e-06, - "loss": 2.356, - "step": 467530 - }, - { - "epoch": 0.82, - "learning_rate": 9.23332066113973e-06, - "loss": 2.2483, - "step": 467540 - }, - { - "epoch": 0.82, - "learning_rate": 9.232448721212904e-06, - "loss": 2.223, - "step": 467550 - }, - { - "epoch": 0.82, - "learning_rate": 9.231576781286078e-06, - "loss": 2.3014, - "step": 467560 - }, - { - "epoch": 0.82, - "learning_rate": 9.23070484135925e-06, - "loss": 2.3562, - "step": 467570 - }, - { - "epoch": 0.82, - "learning_rate": 9.229832901432424e-06, - "loss": 2.2077, - "step": 467580 - }, - { - "epoch": 0.82, - "learning_rate": 9.228960961505596e-06, - "loss": 2.2583, - "step": 467590 - }, - { - "epoch": 0.82, - "learning_rate": 9.22808902157877e-06, - "loss": 2.1645, - "step": 467600 - }, - { - "epoch": 0.82, - "learning_rate": 9.227217081651943e-06, - "loss": 2.241, - "step": 467610 - }, - { - "epoch": 0.82, - "learning_rate": 9.226345141725117e-06, - "loss": 2.3337, - "step": 467620 - }, - { - "epoch": 0.82, - "learning_rate": 9.22547320179829e-06, - "loss": 2.1825, - "step": 467630 - }, - { - "epoch": 0.82, - "learning_rate": 9.224601261871463e-06, - "loss": 2.233, - "step": 467640 - }, - { - "epoch": 0.82, - "learning_rate": 9.223729321944635e-06, - "loss": 2.2293, - "step": 467650 - }, - { - "epoch": 0.82, - "learning_rate": 9.222857382017809e-06, - "loss": 2.4142, - "step": 467660 - }, - { - "epoch": 0.82, - "learning_rate": 9.221985442090981e-06, - "loss": 2.1829, - "step": 467670 - }, - { - "epoch": 0.82, - "learning_rate": 9.221113502164155e-06, - "loss": 2.2704, - "step": 467680 - }, - { - "epoch": 0.82, - "learning_rate": 9.220241562237329e-06, - "loss": 2.2839, - "step": 467690 - }, - { - "epoch": 0.82, - "learning_rate": 9.219369622310502e-06, - "loss": 2.2508, - "step": 467700 - }, - { - "epoch": 0.82, - "learning_rate": 9.218497682383676e-06, - "loss": 2.2188, - "step": 467710 - }, - { - "epoch": 0.82, - "learning_rate": 9.217625742456848e-06, - "loss": 2.3241, - "step": 467720 - }, - { - "epoch": 0.82, - "learning_rate": 9.216753802530022e-06, - "loss": 2.2856, - "step": 467730 - }, - { - "epoch": 0.82, - "learning_rate": 9.215881862603194e-06, - "loss": 2.3172, - "step": 467740 - }, - { - "epoch": 0.82, - "learning_rate": 9.215009922676368e-06, - "loss": 2.2018, - "step": 467750 - }, - { - "epoch": 0.82, - "learning_rate": 9.21413798274954e-06, - "loss": 2.3564, - "step": 467760 - }, - { - "epoch": 0.82, - "learning_rate": 9.213266042822714e-06, - "loss": 2.3059, - "step": 467770 - }, - { - "epoch": 0.82, - "learning_rate": 9.212394102895887e-06, - "loss": 2.3248, - "step": 467780 - }, - { - "epoch": 0.82, - "learning_rate": 9.211522162969061e-06, - "loss": 2.2524, - "step": 467790 - }, - { - "epoch": 0.82, - "learning_rate": 9.210650223042233e-06, - "loss": 2.3678, - "step": 467800 - }, - { - "epoch": 0.82, - "learning_rate": 9.209778283115407e-06, - "loss": 2.3251, - "step": 467810 - }, - { - "epoch": 0.82, - "learning_rate": 9.20890634318858e-06, - "loss": 2.3311, - "step": 467820 - }, - { - "epoch": 0.82, - "learning_rate": 9.208034403261753e-06, - "loss": 2.2049, - "step": 467830 - }, - { - "epoch": 0.82, - "learning_rate": 9.207162463334927e-06, - "loss": 2.2403, - "step": 467840 - }, - { - "epoch": 0.82, - "learning_rate": 9.2062905234081e-06, - "loss": 2.267, - "step": 467850 - }, - { - "epoch": 0.82, - "learning_rate": 9.205418583481274e-06, - "loss": 2.3447, - "step": 467860 - }, - { - "epoch": 0.82, - "learning_rate": 9.204546643554446e-06, - "loss": 2.3002, - "step": 467870 - }, - { - "epoch": 0.82, - "learning_rate": 9.20367470362762e-06, - "loss": 2.141, - "step": 467880 - }, - { - "epoch": 0.82, - "learning_rate": 9.202802763700792e-06, - "loss": 2.313, - "step": 467890 - }, - { - "epoch": 0.82, - "learning_rate": 9.201930823773966e-06, - "loss": 2.2412, - "step": 467900 - }, - { - "epoch": 0.82, - "learning_rate": 9.201058883847138e-06, - "loss": 2.1512, - "step": 467910 - }, - { - "epoch": 0.82, - "learning_rate": 9.200186943920312e-06, - "loss": 2.1972, - "step": 467920 - }, - { - "epoch": 0.82, - "learning_rate": 9.199315003993485e-06, - "loss": 2.2759, - "step": 467930 - }, - { - "epoch": 0.82, - "learning_rate": 9.19844306406666e-06, - "loss": 2.3298, - "step": 467940 - }, - { - "epoch": 0.82, - "learning_rate": 9.197571124139831e-06, - "loss": 2.2534, - "step": 467950 - }, - { - "epoch": 0.82, - "learning_rate": 9.196699184213005e-06, - "loss": 2.3734, - "step": 467960 - }, - { - "epoch": 0.82, - "learning_rate": 9.195827244286179e-06, - "loss": 2.3367, - "step": 467970 - }, - { - "epoch": 0.82, - "learning_rate": 9.194955304359351e-06, - "loss": 2.3283, - "step": 467980 - }, - { - "epoch": 0.82, - "learning_rate": 9.194083364432525e-06, - "loss": 2.3422, - "step": 467990 - }, - { - "epoch": 0.82, - "learning_rate": 9.193211424505697e-06, - "loss": 2.2276, - "step": 468000 - }, - { - "epoch": 0.82, - "learning_rate": 9.19233948457887e-06, - "loss": 2.2684, - "step": 468010 - }, - { - "epoch": 0.82, - "learning_rate": 9.191467544652044e-06, - "loss": 2.2105, - "step": 468020 - }, - { - "epoch": 0.82, - "learning_rate": 9.190595604725218e-06, - "loss": 2.2653, - "step": 468030 - }, - { - "epoch": 0.82, - "learning_rate": 9.18972366479839e-06, - "loss": 2.1734, - "step": 468040 - }, - { - "epoch": 0.82, - "learning_rate": 9.188851724871564e-06, - "loss": 2.2813, - "step": 468050 - }, - { - "epoch": 0.82, - "learning_rate": 9.187979784944736e-06, - "loss": 2.1684, - "step": 468060 - }, - { - "epoch": 0.82, - "learning_rate": 9.18710784501791e-06, - "loss": 2.3769, - "step": 468070 - }, - { - "epoch": 0.82, - "learning_rate": 9.186235905091082e-06, - "loss": 2.3903, - "step": 468080 - }, - { - "epoch": 0.82, - "learning_rate": 9.185363965164257e-06, - "loss": 2.3361, - "step": 468090 - }, - { - "epoch": 0.82, - "learning_rate": 9.184492025237431e-06, - "loss": 2.1425, - "step": 468100 - }, - { - "epoch": 0.82, - "learning_rate": 9.183620085310603e-06, - "loss": 2.2307, - "step": 468110 - }, - { - "epoch": 0.82, - "learning_rate": 9.182748145383777e-06, - "loss": 2.2734, - "step": 468120 - }, - { - "epoch": 0.82, - "learning_rate": 9.181876205456949e-06, - "loss": 2.1466, - "step": 468130 - }, - { - "epoch": 0.82, - "learning_rate": 9.181004265530123e-06, - "loss": 2.0652, - "step": 468140 - }, - { - "epoch": 0.82, - "learning_rate": 9.180132325603295e-06, - "loss": 2.2047, - "step": 468150 - }, - { - "epoch": 0.82, - "learning_rate": 9.179260385676469e-06, - "loss": 2.271, - "step": 468160 - }, - { - "epoch": 0.82, - "learning_rate": 9.178388445749642e-06, - "loss": 2.2627, - "step": 468170 - }, - { - "epoch": 0.82, - "learning_rate": 9.177516505822816e-06, - "loss": 2.186, - "step": 468180 - }, - { - "epoch": 0.82, - "learning_rate": 9.176644565895988e-06, - "loss": 2.3584, - "step": 468190 - }, - { - "epoch": 0.82, - "learning_rate": 9.175772625969162e-06, - "loss": 2.2742, - "step": 468200 - }, - { - "epoch": 0.82, - "learning_rate": 9.174900686042334e-06, - "loss": 2.3025, - "step": 468210 - }, - { - "epoch": 0.82, - "learning_rate": 9.174028746115508e-06, - "loss": 2.3355, - "step": 468220 - }, - { - "epoch": 0.82, - "learning_rate": 9.173156806188682e-06, - "loss": 2.3216, - "step": 468230 - }, - { - "epoch": 0.82, - "learning_rate": 9.172284866261854e-06, - "loss": 2.2914, - "step": 468240 - }, - { - "epoch": 0.82, - "learning_rate": 9.171412926335027e-06, - "loss": 2.1688, - "step": 468250 - }, - { - "epoch": 0.82, - "learning_rate": 9.170540986408201e-06, - "loss": 2.2208, - "step": 468260 - }, - { - "epoch": 0.82, - "learning_rate": 9.169669046481375e-06, - "loss": 2.3006, - "step": 468270 - }, - { - "epoch": 0.82, - "learning_rate": 9.168797106554547e-06, - "loss": 2.1131, - "step": 468280 - }, - { - "epoch": 0.82, - "learning_rate": 9.16792516662772e-06, - "loss": 2.2219, - "step": 468290 - }, - { - "epoch": 0.82, - "learning_rate": 9.167053226700893e-06, - "loss": 2.2103, - "step": 468300 - }, - { - "epoch": 0.82, - "learning_rate": 9.166181286774067e-06, - "loss": 2.2508, - "step": 468310 - }, - { - "epoch": 0.82, - "learning_rate": 9.165309346847239e-06, - "loss": 2.1679, - "step": 468320 - }, - { - "epoch": 0.82, - "learning_rate": 9.164437406920414e-06, - "loss": 2.2483, - "step": 468330 - }, - { - "epoch": 0.82, - "learning_rate": 9.163565466993586e-06, - "loss": 2.2864, - "step": 468340 - }, - { - "epoch": 0.82, - "learning_rate": 9.16269352706676e-06, - "loss": 2.2955, - "step": 468350 - }, - { - "epoch": 0.82, - "learning_rate": 9.161821587139934e-06, - "loss": 2.1778, - "step": 468360 - }, - { - "epoch": 0.82, - "learning_rate": 9.160949647213106e-06, - "loss": 2.2808, - "step": 468370 - }, - { - "epoch": 0.82, - "learning_rate": 9.16007770728628e-06, - "loss": 2.4207, - "step": 468380 - }, - { - "epoch": 0.82, - "learning_rate": 9.159205767359452e-06, - "loss": 2.331, - "step": 468390 - }, - { - "epoch": 0.82, - "learning_rate": 9.158333827432626e-06, - "loss": 2.2517, - "step": 468400 - }, - { - "epoch": 0.82, - "learning_rate": 9.1574618875058e-06, - "loss": 2.2853, - "step": 468410 - }, - { - "epoch": 0.82, - "learning_rate": 9.156589947578973e-06, - "loss": 2.3439, - "step": 468420 - }, - { - "epoch": 0.82, - "learning_rate": 9.155718007652145e-06, - "loss": 2.1823, - "step": 468430 - }, - { - "epoch": 0.82, - "learning_rate": 9.154846067725319e-06, - "loss": 2.3649, - "step": 468440 - }, - { - "epoch": 0.82, - "learning_rate": 9.153974127798491e-06, - "loss": 2.3817, - "step": 468450 - }, - { - "epoch": 0.82, - "learning_rate": 9.153102187871665e-06, - "loss": 2.2466, - "step": 468460 - }, - { - "epoch": 0.82, - "learning_rate": 9.152230247944837e-06, - "loss": 2.3161, - "step": 468470 - }, - { - "epoch": 0.82, - "learning_rate": 9.15135830801801e-06, - "loss": 2.2858, - "step": 468480 - }, - { - "epoch": 0.82, - "learning_rate": 9.150486368091184e-06, - "loss": 2.3134, - "step": 468490 - }, - { - "epoch": 0.82, - "learning_rate": 9.149614428164358e-06, - "loss": 2.3862, - "step": 468500 - }, - { - "epoch": 0.82, - "learning_rate": 9.148742488237532e-06, - "loss": 2.2782, - "step": 468510 - }, - { - "epoch": 0.82, - "learning_rate": 9.147870548310704e-06, - "loss": 2.2557, - "step": 468520 - }, - { - "epoch": 0.82, - "learning_rate": 9.146998608383878e-06, - "loss": 2.3245, - "step": 468530 - }, - { - "epoch": 0.82, - "learning_rate": 9.14612666845705e-06, - "loss": 2.3153, - "step": 468540 - }, - { - "epoch": 0.82, - "learning_rate": 9.145254728530224e-06, - "loss": 2.3127, - "step": 468550 - }, - { - "epoch": 0.82, - "learning_rate": 9.144382788603396e-06, - "loss": 2.1938, - "step": 468560 - }, - { - "epoch": 0.82, - "learning_rate": 9.14351084867657e-06, - "loss": 2.4423, - "step": 468570 - }, - { - "epoch": 0.82, - "learning_rate": 9.142638908749743e-06, - "loss": 2.2886, - "step": 468580 - }, - { - "epoch": 0.82, - "learning_rate": 9.141766968822917e-06, - "loss": 2.2553, - "step": 468590 - }, - { - "epoch": 0.82, - "learning_rate": 9.140895028896089e-06, - "loss": 2.3233, - "step": 468600 - }, - { - "epoch": 0.82, - "learning_rate": 9.140023088969263e-06, - "loss": 2.1605, - "step": 468610 - }, - { - "epoch": 0.82, - "learning_rate": 9.139151149042437e-06, - "loss": 2.3378, - "step": 468620 - }, - { - "epoch": 0.82, - "learning_rate": 9.138279209115609e-06, - "loss": 2.3131, - "step": 468630 - }, - { - "epoch": 0.82, - "learning_rate": 9.137407269188782e-06, - "loss": 2.3007, - "step": 468640 - }, - { - "epoch": 0.82, - "learning_rate": 9.136535329261956e-06, - "loss": 2.2896, - "step": 468650 - }, - { - "epoch": 0.82, - "learning_rate": 9.13566338933513e-06, - "loss": 2.233, - "step": 468660 - }, - { - "epoch": 0.82, - "learning_rate": 9.134791449408302e-06, - "loss": 2.2624, - "step": 468670 - }, - { - "epoch": 0.82, - "learning_rate": 9.133919509481476e-06, - "loss": 2.262, - "step": 468680 - }, - { - "epoch": 0.82, - "learning_rate": 9.133047569554648e-06, - "loss": 2.1692, - "step": 468690 - }, - { - "epoch": 0.82, - "learning_rate": 9.132175629627822e-06, - "loss": 2.2785, - "step": 468700 - }, - { - "epoch": 0.82, - "learning_rate": 9.131303689700994e-06, - "loss": 2.3209, - "step": 468710 - }, - { - "epoch": 0.82, - "learning_rate": 9.130431749774168e-06, - "loss": 2.2886, - "step": 468720 - }, - { - "epoch": 0.82, - "learning_rate": 9.129559809847341e-06, - "loss": 2.2217, - "step": 468730 - }, - { - "epoch": 0.82, - "learning_rate": 9.128687869920515e-06, - "loss": 2.3472, - "step": 468740 - }, - { - "epoch": 0.82, - "learning_rate": 9.127815929993687e-06, - "loss": 2.3806, - "step": 468750 - }, - { - "epoch": 0.82, - "learning_rate": 9.126943990066861e-06, - "loss": 2.3404, - "step": 468760 - }, - { - "epoch": 0.82, - "learning_rate": 9.126072050140035e-06, - "loss": 2.0481, - "step": 468770 - }, - { - "epoch": 0.82, - "learning_rate": 9.125200110213207e-06, - "loss": 2.2696, - "step": 468780 - }, - { - "epoch": 0.82, - "learning_rate": 9.12432817028638e-06, - "loss": 2.2651, - "step": 468790 - }, - { - "epoch": 0.82, - "learning_rate": 9.123456230359553e-06, - "loss": 2.2784, - "step": 468800 - }, - { - "epoch": 0.82, - "learning_rate": 9.122584290432726e-06, - "loss": 2.1997, - "step": 468810 - }, - { - "epoch": 0.82, - "learning_rate": 9.1217123505059e-06, - "loss": 2.2773, - "step": 468820 - }, - { - "epoch": 0.82, - "learning_rate": 9.120840410579074e-06, - "loss": 2.3827, - "step": 468830 - }, - { - "epoch": 0.82, - "learning_rate": 9.119968470652246e-06, - "loss": 2.2225, - "step": 468840 - }, - { - "epoch": 0.82, - "learning_rate": 9.11909653072542e-06, - "loss": 2.3505, - "step": 468850 - }, - { - "epoch": 0.82, - "learning_rate": 9.118224590798592e-06, - "loss": 2.2118, - "step": 468860 - }, - { - "epoch": 0.82, - "learning_rate": 9.117352650871766e-06, - "loss": 2.2007, - "step": 468870 - }, - { - "epoch": 0.82, - "learning_rate": 9.116480710944938e-06, - "loss": 2.166, - "step": 468880 - }, - { - "epoch": 0.82, - "learning_rate": 9.115608771018113e-06, - "loss": 2.3598, - "step": 468890 - }, - { - "epoch": 0.82, - "learning_rate": 9.114736831091287e-06, - "loss": 2.3382, - "step": 468900 - }, - { - "epoch": 0.82, - "learning_rate": 9.113864891164459e-06, - "loss": 2.3267, - "step": 468910 - }, - { - "epoch": 0.82, - "learning_rate": 9.112992951237633e-06, - "loss": 2.2422, - "step": 468920 - }, - { - "epoch": 0.82, - "learning_rate": 9.112121011310805e-06, - "loss": 2.2278, - "step": 468930 - }, - { - "epoch": 0.82, - "learning_rate": 9.111249071383979e-06, - "loss": 2.2207, - "step": 468940 - }, - { - "epoch": 0.82, - "learning_rate": 9.11037713145715e-06, - "loss": 2.2949, - "step": 468950 - }, - { - "epoch": 0.82, - "learning_rate": 9.109505191530324e-06, - "loss": 2.1944, - "step": 468960 - }, - { - "epoch": 0.82, - "learning_rate": 9.108633251603498e-06, - "loss": 2.3121, - "step": 468970 - }, - { - "epoch": 0.82, - "learning_rate": 9.107761311676672e-06, - "loss": 2.3398, - "step": 468980 - }, - { - "epoch": 0.82, - "learning_rate": 9.106889371749844e-06, - "loss": 2.2927, - "step": 468990 - }, - { - "epoch": 0.82, - "learning_rate": 9.106017431823018e-06, - "loss": 2.2454, - "step": 469000 - }, - { - "epoch": 0.82, - "learning_rate": 9.10514549189619e-06, - "loss": 2.3898, - "step": 469010 - }, - { - "epoch": 0.82, - "learning_rate": 9.104273551969364e-06, - "loss": 2.2775, - "step": 469020 - }, - { - "epoch": 0.82, - "learning_rate": 9.103401612042537e-06, - "loss": 2.2213, - "step": 469030 - }, - { - "epoch": 0.82, - "learning_rate": 9.10252967211571e-06, - "loss": 2.3986, - "step": 469040 - }, - { - "epoch": 0.82, - "learning_rate": 9.101657732188883e-06, - "loss": 2.2416, - "step": 469050 - }, - { - "epoch": 0.82, - "learning_rate": 9.100785792262057e-06, - "loss": 2.2836, - "step": 469060 - }, - { - "epoch": 0.82, - "learning_rate": 9.09991385233523e-06, - "loss": 2.3326, - "step": 469070 - }, - { - "epoch": 0.82, - "learning_rate": 9.099041912408403e-06, - "loss": 2.3263, - "step": 469080 - }, - { - "epoch": 0.82, - "learning_rate": 9.098169972481577e-06, - "loss": 2.2627, - "step": 469090 - }, - { - "epoch": 0.82, - "learning_rate": 9.097298032554749e-06, - "loss": 2.3651, - "step": 469100 - }, - { - "epoch": 0.82, - "learning_rate": 9.096426092627923e-06, - "loss": 2.2397, - "step": 469110 - }, - { - "epoch": 0.82, - "learning_rate": 9.095554152701095e-06, - "loss": 2.2586, - "step": 469120 - }, - { - "epoch": 0.82, - "learning_rate": 9.09468221277427e-06, - "loss": 2.2821, - "step": 469130 - }, - { - "epoch": 0.82, - "learning_rate": 9.093810272847442e-06, - "loss": 2.2996, - "step": 469140 - }, - { - "epoch": 0.82, - "learning_rate": 9.092938332920616e-06, - "loss": 2.2071, - "step": 469150 - }, - { - "epoch": 0.82, - "learning_rate": 9.09206639299379e-06, - "loss": 2.3098, - "step": 469160 - }, - { - "epoch": 0.82, - "learning_rate": 9.091194453066962e-06, - "loss": 2.2811, - "step": 469170 - }, - { - "epoch": 0.82, - "learning_rate": 9.090322513140136e-06, - "loss": 2.2337, - "step": 469180 - }, - { - "epoch": 0.82, - "learning_rate": 9.089450573213308e-06, - "loss": 2.3442, - "step": 469190 - }, - { - "epoch": 0.82, - "learning_rate": 9.088578633286481e-06, - "loss": 2.2529, - "step": 469200 - }, - { - "epoch": 0.82, - "learning_rate": 9.087706693359655e-06, - "loss": 2.2271, - "step": 469210 - }, - { - "epoch": 0.82, - "learning_rate": 9.086834753432829e-06, - "loss": 2.3481, - "step": 469220 - }, - { - "epoch": 0.82, - "learning_rate": 9.085962813506001e-06, - "loss": 2.2435, - "step": 469230 - }, - { - "epoch": 0.82, - "learning_rate": 9.085090873579175e-06, - "loss": 2.2631, - "step": 469240 - }, - { - "epoch": 0.82, - "learning_rate": 9.084218933652347e-06, - "loss": 2.3589, - "step": 469250 - }, - { - "epoch": 0.82, - "learning_rate": 9.08334699372552e-06, - "loss": 2.3235, - "step": 469260 - }, - { - "epoch": 0.82, - "learning_rate": 9.082475053798693e-06, - "loss": 2.2593, - "step": 469270 - }, - { - "epoch": 0.82, - "learning_rate": 9.081603113871866e-06, - "loss": 2.3189, - "step": 469280 - }, - { - "epoch": 0.82, - "learning_rate": 9.08073117394504e-06, - "loss": 2.2881, - "step": 469290 - }, - { - "epoch": 0.82, - "learning_rate": 9.079859234018214e-06, - "loss": 2.2916, - "step": 469300 - }, - { - "epoch": 0.82, - "learning_rate": 9.078987294091388e-06, - "loss": 2.2616, - "step": 469310 - }, - { - "epoch": 0.82, - "learning_rate": 9.07811535416456e-06, - "loss": 2.2874, - "step": 469320 - }, - { - "epoch": 0.82, - "learning_rate": 9.077243414237734e-06, - "loss": 2.3071, - "step": 469330 - }, - { - "epoch": 0.82, - "learning_rate": 9.076371474310906e-06, - "loss": 2.3332, - "step": 469340 - }, - { - "epoch": 0.82, - "learning_rate": 9.07549953438408e-06, - "loss": 2.4219, - "step": 469350 - }, - { - "epoch": 0.82, - "learning_rate": 9.074627594457252e-06, - "loss": 2.3301, - "step": 469360 - }, - { - "epoch": 0.82, - "learning_rate": 9.073755654530427e-06, - "loss": 2.3133, - "step": 469370 - }, - { - "epoch": 0.82, - "learning_rate": 9.072883714603599e-06, - "loss": 2.1245, - "step": 469380 - }, - { - "epoch": 0.82, - "learning_rate": 9.072011774676773e-06, - "loss": 2.24, - "step": 469390 - }, - { - "epoch": 0.82, - "learning_rate": 9.071139834749945e-06, - "loss": 2.2544, - "step": 469400 - }, - { - "epoch": 0.82, - "learning_rate": 9.070267894823119e-06, - "loss": 2.2795, - "step": 469410 - }, - { - "epoch": 0.82, - "learning_rate": 9.069395954896292e-06, - "loss": 2.1665, - "step": 469420 - }, - { - "epoch": 0.82, - "learning_rate": 9.068524014969465e-06, - "loss": 2.3691, - "step": 469430 - }, - { - "epoch": 0.82, - "learning_rate": 9.067652075042638e-06, - "loss": 2.2463, - "step": 469440 - }, - { - "epoch": 0.82, - "learning_rate": 9.066780135115812e-06, - "loss": 2.292, - "step": 469450 - }, - { - "epoch": 0.82, - "learning_rate": 9.065908195188986e-06, - "loss": 2.3023, - "step": 469460 - }, - { - "epoch": 0.82, - "learning_rate": 9.065036255262158e-06, - "loss": 2.3804, - "step": 469470 - }, - { - "epoch": 0.82, - "learning_rate": 9.064164315335332e-06, - "loss": 2.1864, - "step": 469480 - }, - { - "epoch": 0.82, - "learning_rate": 9.063292375408504e-06, - "loss": 2.1579, - "step": 469490 - }, - { - "epoch": 0.82, - "learning_rate": 9.062420435481678e-06, - "loss": 2.309, - "step": 469500 - }, - { - "epoch": 0.82, - "learning_rate": 9.06154849555485e-06, - "loss": 2.3089, - "step": 469510 - }, - { - "epoch": 0.82, - "learning_rate": 9.060676555628023e-06, - "loss": 2.3672, - "step": 469520 - }, - { - "epoch": 0.82, - "learning_rate": 9.059804615701197e-06, - "loss": 2.3495, - "step": 469530 - }, - { - "epoch": 0.82, - "learning_rate": 9.058932675774371e-06, - "loss": 2.2828, - "step": 469540 - }, - { - "epoch": 0.82, - "learning_rate": 9.058060735847545e-06, - "loss": 2.1853, - "step": 469550 - }, - { - "epoch": 0.82, - "learning_rate": 9.057188795920717e-06, - "loss": 2.352, - "step": 469560 - }, - { - "epoch": 0.82, - "learning_rate": 9.05631685599389e-06, - "loss": 2.3477, - "step": 469570 - }, - { - "epoch": 0.82, - "learning_rate": 9.055444916067063e-06, - "loss": 2.233, - "step": 469580 - }, - { - "epoch": 0.82, - "learning_rate": 9.054572976140236e-06, - "loss": 2.2785, - "step": 469590 - }, - { - "epoch": 0.82, - "learning_rate": 9.053701036213408e-06, - "loss": 2.333, - "step": 469600 - }, - { - "epoch": 0.82, - "learning_rate": 9.052829096286582e-06, - "loss": 2.2848, - "step": 469610 - }, - { - "epoch": 0.82, - "learning_rate": 9.051957156359756e-06, - "loss": 2.1815, - "step": 469620 - }, - { - "epoch": 0.82, - "learning_rate": 9.05108521643293e-06, - "loss": 2.2387, - "step": 469630 - }, - { - "epoch": 0.82, - "learning_rate": 9.050213276506102e-06, - "loss": 2.3014, - "step": 469640 - }, - { - "epoch": 0.82, - "learning_rate": 9.049341336579276e-06, - "loss": 2.3718, - "step": 469650 - }, - { - "epoch": 0.82, - "learning_rate": 9.048469396652448e-06, - "loss": 2.1547, - "step": 469660 - }, - { - "epoch": 0.82, - "learning_rate": 9.047597456725621e-06, - "loss": 2.191, - "step": 469670 - }, - { - "epoch": 0.82, - "learning_rate": 9.046725516798795e-06, - "loss": 2.2652, - "step": 469680 - }, - { - "epoch": 0.82, - "learning_rate": 9.045853576871969e-06, - "loss": 2.3063, - "step": 469690 - }, - { - "epoch": 0.82, - "learning_rate": 9.044981636945143e-06, - "loss": 2.2039, - "step": 469700 - }, - { - "epoch": 0.82, - "learning_rate": 9.044109697018315e-06, - "loss": 2.2437, - "step": 469710 - }, - { - "epoch": 0.82, - "learning_rate": 9.043237757091489e-06, - "loss": 2.3204, - "step": 469720 - }, - { - "epoch": 0.82, - "learning_rate": 9.04236581716466e-06, - "loss": 2.2554, - "step": 469730 - }, - { - "epoch": 0.82, - "learning_rate": 9.041493877237834e-06, - "loss": 2.224, - "step": 469740 - }, - { - "epoch": 0.82, - "learning_rate": 9.040621937311007e-06, - "loss": 2.2728, - "step": 469750 - }, - { - "epoch": 0.82, - "learning_rate": 9.03974999738418e-06, - "loss": 2.3063, - "step": 469760 - }, - { - "epoch": 0.82, - "learning_rate": 9.038878057457354e-06, - "loss": 2.2609, - "step": 469770 - }, - { - "epoch": 0.82, - "learning_rate": 9.038006117530528e-06, - "loss": 2.2222, - "step": 469780 - }, - { - "epoch": 0.82, - "learning_rate": 9.0371341776037e-06, - "loss": 2.338, - "step": 469790 - }, - { - "epoch": 0.82, - "learning_rate": 9.036262237676874e-06, - "loss": 2.3101, - "step": 469800 - }, - { - "epoch": 0.82, - "learning_rate": 9.035390297750046e-06, - "loss": 2.2036, - "step": 469810 - }, - { - "epoch": 0.82, - "learning_rate": 9.03451835782322e-06, - "loss": 2.3274, - "step": 469820 - }, - { - "epoch": 0.82, - "learning_rate": 9.033646417896393e-06, - "loss": 2.2299, - "step": 469830 - }, - { - "epoch": 0.82, - "learning_rate": 9.032774477969565e-06, - "loss": 2.2768, - "step": 469840 - }, - { - "epoch": 0.82, - "learning_rate": 9.031902538042739e-06, - "loss": 2.2164, - "step": 469850 - }, - { - "epoch": 0.82, - "learning_rate": 9.031030598115913e-06, - "loss": 2.24, - "step": 469860 - }, - { - "epoch": 0.82, - "learning_rate": 9.030158658189087e-06, - "loss": 2.2611, - "step": 469870 - }, - { - "epoch": 0.82, - "learning_rate": 9.029286718262259e-06, - "loss": 2.3425, - "step": 469880 - }, - { - "epoch": 0.82, - "learning_rate": 9.028414778335433e-06, - "loss": 2.1837, - "step": 469890 - }, - { - "epoch": 0.82, - "learning_rate": 9.027542838408605e-06, - "loss": 2.2721, - "step": 469900 - }, - { - "epoch": 0.82, - "learning_rate": 9.026670898481778e-06, - "loss": 2.2771, - "step": 469910 - }, - { - "epoch": 0.82, - "learning_rate": 9.02579895855495e-06, - "loss": 2.3608, - "step": 469920 - }, - { - "epoch": 0.82, - "learning_rate": 9.024927018628126e-06, - "loss": 2.2734, - "step": 469930 - }, - { - "epoch": 0.82, - "learning_rate": 9.024055078701298e-06, - "loss": 2.1884, - "step": 469940 - }, - { - "epoch": 0.82, - "learning_rate": 9.023183138774472e-06, - "loss": 2.3059, - "step": 469950 - }, - { - "epoch": 0.82, - "learning_rate": 9.022311198847646e-06, - "loss": 2.2906, - "step": 469960 - }, - { - "epoch": 0.82, - "learning_rate": 9.021439258920818e-06, - "loss": 2.3393, - "step": 469970 - }, - { - "epoch": 0.82, - "learning_rate": 9.020567318993991e-06, - "loss": 2.2146, - "step": 469980 - }, - { - "epoch": 0.82, - "learning_rate": 9.019695379067163e-06, - "loss": 2.2807, - "step": 469990 - }, - { - "epoch": 0.82, - "learning_rate": 9.018823439140337e-06, - "loss": 2.1978, - "step": 470000 - }, - { - "epoch": 0.82, - "learning_rate": 9.017951499213511e-06, - "loss": 2.2935, - "step": 470010 - }, - { - "epoch": 0.82, - "learning_rate": 9.017079559286685e-06, - "loss": 2.2789, - "step": 470020 - }, - { - "epoch": 0.82, - "learning_rate": 9.016207619359857e-06, - "loss": 2.2992, - "step": 470030 - }, - { - "epoch": 0.82, - "learning_rate": 9.01533567943303e-06, - "loss": 2.1447, - "step": 470040 - }, - { - "epoch": 0.82, - "learning_rate": 9.014463739506203e-06, - "loss": 2.2367, - "step": 470050 - }, - { - "epoch": 0.82, - "learning_rate": 9.013591799579376e-06, - "loss": 2.307, - "step": 470060 - }, - { - "epoch": 0.82, - "learning_rate": 9.012719859652549e-06, - "loss": 2.3357, - "step": 470070 - }, - { - "epoch": 0.82, - "learning_rate": 9.011847919725722e-06, - "loss": 2.3171, - "step": 470080 - }, - { - "epoch": 0.82, - "learning_rate": 9.010975979798896e-06, - "loss": 2.3004, - "step": 470090 - }, - { - "epoch": 0.82, - "learning_rate": 9.01010403987207e-06, - "loss": 2.3763, - "step": 470100 - }, - { - "epoch": 0.82, - "learning_rate": 9.009232099945244e-06, - "loss": 2.2863, - "step": 470110 - }, - { - "epoch": 0.82, - "learning_rate": 9.008360160018416e-06, - "loss": 2.3619, - "step": 470120 - }, - { - "epoch": 0.82, - "learning_rate": 9.00748822009159e-06, - "loss": 2.2901, - "step": 470130 - }, - { - "epoch": 0.82, - "learning_rate": 9.006616280164762e-06, - "loss": 2.3602, - "step": 470140 - }, - { - "epoch": 0.82, - "learning_rate": 9.005744340237935e-06, - "loss": 2.2646, - "step": 470150 - }, - { - "epoch": 0.82, - "learning_rate": 9.004872400311107e-06, - "loss": 2.2879, - "step": 470160 - }, - { - "epoch": 0.82, - "learning_rate": 9.004000460384283e-06, - "loss": 2.2794, - "step": 470170 - }, - { - "epoch": 0.82, - "learning_rate": 9.003128520457455e-06, - "loss": 2.1933, - "step": 470180 - }, - { - "epoch": 0.82, - "learning_rate": 9.002256580530629e-06, - "loss": 2.3553, - "step": 470190 - }, - { - "epoch": 0.82, - "learning_rate": 9.0013846406038e-06, - "loss": 2.2722, - "step": 470200 - }, - { - "epoch": 0.82, - "learning_rate": 9.000512700676975e-06, - "loss": 2.3319, - "step": 470210 - }, - { - "epoch": 0.82, - "learning_rate": 8.999640760750148e-06, - "loss": 2.362, - "step": 470220 - }, - { - "epoch": 0.82, - "learning_rate": 8.99876882082332e-06, - "loss": 2.2248, - "step": 470230 - }, - { - "epoch": 0.82, - "learning_rate": 8.997896880896494e-06, - "loss": 2.3041, - "step": 470240 - }, - { - "epoch": 0.82, - "learning_rate": 8.997024940969668e-06, - "loss": 2.3115, - "step": 470250 - }, - { - "epoch": 0.82, - "learning_rate": 8.996153001042842e-06, - "loss": 2.2544, - "step": 470260 - }, - { - "epoch": 0.82, - "learning_rate": 8.995281061116014e-06, - "loss": 2.2256, - "step": 470270 - }, - { - "epoch": 0.82, - "learning_rate": 8.994409121189188e-06, - "loss": 2.329, - "step": 470280 - }, - { - "epoch": 0.82, - "learning_rate": 8.99353718126236e-06, - "loss": 2.2246, - "step": 470290 - }, - { - "epoch": 0.82, - "learning_rate": 8.992665241335533e-06, - "loss": 2.1667, - "step": 470300 - }, - { - "epoch": 0.82, - "learning_rate": 8.991793301408705e-06, - "loss": 2.2255, - "step": 470310 - }, - { - "epoch": 0.82, - "learning_rate": 8.99092136148188e-06, - "loss": 2.3512, - "step": 470320 - }, - { - "epoch": 0.82, - "learning_rate": 8.990049421555053e-06, - "loss": 2.3446, - "step": 470330 - }, - { - "epoch": 0.82, - "learning_rate": 8.989177481628227e-06, - "loss": 2.3352, - "step": 470340 - }, - { - "epoch": 0.82, - "learning_rate": 8.9883055417014e-06, - "loss": 2.4277, - "step": 470350 - }, - { - "epoch": 0.82, - "learning_rate": 8.987433601774573e-06, - "loss": 2.2606, - "step": 470360 - }, - { - "epoch": 0.82, - "learning_rate": 8.986561661847746e-06, - "loss": 2.3451, - "step": 470370 - }, - { - "epoch": 0.82, - "learning_rate": 8.985689721920918e-06, - "loss": 2.2084, - "step": 470380 - }, - { - "epoch": 0.82, - "learning_rate": 8.984817781994092e-06, - "loss": 2.4582, - "step": 470390 - }, - { - "epoch": 0.82, - "learning_rate": 8.983945842067264e-06, - "loss": 2.2351, - "step": 470400 - }, - { - "epoch": 0.82, - "learning_rate": 8.98307390214044e-06, - "loss": 2.2755, - "step": 470410 - }, - { - "epoch": 0.82, - "learning_rate": 8.982201962213612e-06, - "loss": 2.2769, - "step": 470420 - }, - { - "epoch": 0.82, - "learning_rate": 8.981330022286786e-06, - "loss": 2.3406, - "step": 470430 - }, - { - "epoch": 0.82, - "learning_rate": 8.980458082359958e-06, - "loss": 2.1775, - "step": 470440 - }, - { - "epoch": 0.82, - "learning_rate": 8.979586142433131e-06, - "loss": 2.2645, - "step": 470450 - }, - { - "epoch": 0.82, - "learning_rate": 8.978714202506304e-06, - "loss": 2.3645, - "step": 470460 - }, - { - "epoch": 0.82, - "learning_rate": 8.977842262579477e-06, - "loss": 2.2887, - "step": 470470 - }, - { - "epoch": 0.82, - "learning_rate": 8.976970322652651e-06, - "loss": 2.3165, - "step": 470480 - }, - { - "epoch": 0.82, - "learning_rate": 8.976098382725825e-06, - "loss": 2.3074, - "step": 470490 - }, - { - "epoch": 0.82, - "learning_rate": 8.975226442798999e-06, - "loss": 2.1606, - "step": 470500 - }, - { - "epoch": 0.82, - "learning_rate": 8.97435450287217e-06, - "loss": 2.3953, - "step": 470510 - }, - { - "epoch": 0.82, - "learning_rate": 8.973482562945344e-06, - "loss": 2.3507, - "step": 470520 - }, - { - "epoch": 0.82, - "learning_rate": 8.972610623018517e-06, - "loss": 2.3354, - "step": 470530 - }, - { - "epoch": 0.82, - "learning_rate": 8.97173868309169e-06, - "loss": 2.347, - "step": 470540 - }, - { - "epoch": 0.82, - "learning_rate": 8.970866743164862e-06, - "loss": 2.3194, - "step": 470550 - }, - { - "epoch": 0.82, - "learning_rate": 8.969994803238036e-06, - "loss": 2.2947, - "step": 470560 - }, - { - "epoch": 0.82, - "learning_rate": 8.96912286331121e-06, - "loss": 2.2447, - "step": 470570 - }, - { - "epoch": 0.82, - "learning_rate": 8.968250923384384e-06, - "loss": 2.2683, - "step": 470580 - }, - { - "epoch": 0.82, - "learning_rate": 8.967378983457556e-06, - "loss": 2.2034, - "step": 470590 - }, - { - "epoch": 0.82, - "learning_rate": 8.96650704353073e-06, - "loss": 2.1965, - "step": 470600 - }, - { - "epoch": 0.82, - "learning_rate": 8.965635103603902e-06, - "loss": 2.3429, - "step": 470610 - }, - { - "epoch": 0.82, - "learning_rate": 8.964763163677075e-06, - "loss": 2.2145, - "step": 470620 - }, - { - "epoch": 0.82, - "learning_rate": 8.963891223750249e-06, - "loss": 2.37, - "step": 470630 - }, - { - "epoch": 0.82, - "learning_rate": 8.963019283823421e-06, - "loss": 2.229, - "step": 470640 - }, - { - "epoch": 0.82, - "learning_rate": 8.962147343896595e-06, - "loss": 2.3708, - "step": 470650 - }, - { - "epoch": 0.82, - "learning_rate": 8.961275403969769e-06, - "loss": 2.3356, - "step": 470660 - }, - { - "epoch": 0.82, - "learning_rate": 8.960403464042943e-06, - "loss": 2.3393, - "step": 470670 - }, - { - "epoch": 0.82, - "learning_rate": 8.959531524116115e-06, - "loss": 2.2832, - "step": 470680 - }, - { - "epoch": 0.82, - "learning_rate": 8.958659584189288e-06, - "loss": 2.2011, - "step": 470690 - }, - { - "epoch": 0.82, - "learning_rate": 8.95778764426246e-06, - "loss": 2.233, - "step": 470700 - }, - { - "epoch": 0.82, - "learning_rate": 8.956915704335634e-06, - "loss": 2.379, - "step": 470710 - }, - { - "epoch": 0.82, - "learning_rate": 8.956043764408808e-06, - "loss": 2.2044, - "step": 470720 - }, - { - "epoch": 0.82, - "learning_rate": 8.955171824481982e-06, - "loss": 2.2273, - "step": 470730 - }, - { - "epoch": 0.82, - "learning_rate": 8.954299884555154e-06, - "loss": 2.245, - "step": 470740 - }, - { - "epoch": 0.82, - "learning_rate": 8.953427944628328e-06, - "loss": 2.3943, - "step": 470750 - }, - { - "epoch": 0.82, - "learning_rate": 8.952556004701501e-06, - "loss": 2.3144, - "step": 470760 - }, - { - "epoch": 0.82, - "learning_rate": 8.951684064774673e-06, - "loss": 2.319, - "step": 470770 - }, - { - "epoch": 0.82, - "learning_rate": 8.950812124847847e-06, - "loss": 2.3146, - "step": 470780 - }, - { - "epoch": 0.82, - "learning_rate": 8.94994018492102e-06, - "loss": 2.178, - "step": 470790 - }, - { - "epoch": 0.82, - "learning_rate": 8.949068244994193e-06, - "loss": 2.236, - "step": 470800 - }, - { - "epoch": 0.82, - "learning_rate": 8.948196305067367e-06, - "loss": 2.2978, - "step": 470810 - }, - { - "epoch": 0.82, - "learning_rate": 8.94732436514054e-06, - "loss": 2.3081, - "step": 470820 - }, - { - "epoch": 0.82, - "learning_rate": 8.946452425213713e-06, - "loss": 2.2409, - "step": 470830 - }, - { - "epoch": 0.82, - "learning_rate": 8.945580485286886e-06, - "loss": 2.2516, - "step": 470840 - }, - { - "epoch": 0.82, - "learning_rate": 8.944708545360059e-06, - "loss": 2.2637, - "step": 470850 - }, - { - "epoch": 0.82, - "learning_rate": 8.943836605433232e-06, - "loss": 2.297, - "step": 470860 - }, - { - "epoch": 0.82, - "learning_rate": 8.942964665506404e-06, - "loss": 2.3507, - "step": 470870 - }, - { - "epoch": 0.82, - "learning_rate": 8.942092725579578e-06, - "loss": 2.2601, - "step": 470880 - }, - { - "epoch": 0.82, - "learning_rate": 8.941220785652752e-06, - "loss": 2.3266, - "step": 470890 - }, - { - "epoch": 0.82, - "learning_rate": 8.940348845725926e-06, - "loss": 2.2527, - "step": 470900 - }, - { - "epoch": 0.82, - "learning_rate": 8.9394769057991e-06, - "loss": 2.3043, - "step": 470910 - }, - { - "epoch": 0.82, - "learning_rate": 8.938604965872272e-06, - "loss": 2.2606, - "step": 470920 - }, - { - "epoch": 0.82, - "learning_rate": 8.937733025945445e-06, - "loss": 2.319, - "step": 470930 - }, - { - "epoch": 0.82, - "learning_rate": 8.936861086018617e-06, - "loss": 2.2566, - "step": 470940 - }, - { - "epoch": 0.82, - "learning_rate": 8.935989146091791e-06, - "loss": 2.3097, - "step": 470950 - }, - { - "epoch": 0.82, - "learning_rate": 8.935117206164963e-06, - "loss": 2.3286, - "step": 470960 - }, - { - "epoch": 0.82, - "learning_rate": 8.934245266238139e-06, - "loss": 2.1769, - "step": 470970 - }, - { - "epoch": 0.82, - "learning_rate": 8.93337332631131e-06, - "loss": 2.3341, - "step": 470980 - }, - { - "epoch": 0.82, - "learning_rate": 8.932501386384485e-06, - "loss": 2.2833, - "step": 470990 - }, - { - "epoch": 0.82, - "learning_rate": 8.931629446457657e-06, - "loss": 2.2434, - "step": 471000 - }, - { - "epoch": 0.82, - "learning_rate": 8.93075750653083e-06, - "loss": 2.2825, - "step": 471010 - }, - { - "epoch": 0.82, - "learning_rate": 8.929885566604004e-06, - "loss": 2.4669, - "step": 471020 - }, - { - "epoch": 0.82, - "learning_rate": 8.929013626677176e-06, - "loss": 2.3058, - "step": 471030 - }, - { - "epoch": 0.82, - "learning_rate": 8.92814168675035e-06, - "loss": 2.335, - "step": 471040 - }, - { - "epoch": 0.82, - "learning_rate": 8.927269746823524e-06, - "loss": 2.2128, - "step": 471050 - }, - { - "epoch": 0.82, - "learning_rate": 8.926397806896698e-06, - "loss": 2.2126, - "step": 471060 - }, - { - "epoch": 0.82, - "learning_rate": 8.92552586696987e-06, - "loss": 2.4059, - "step": 471070 - }, - { - "epoch": 0.82, - "learning_rate": 8.924653927043043e-06, - "loss": 2.2983, - "step": 471080 - }, - { - "epoch": 0.82, - "learning_rate": 8.923781987116215e-06, - "loss": 2.2213, - "step": 471090 - }, - { - "epoch": 0.82, - "learning_rate": 8.92291004718939e-06, - "loss": 2.404, - "step": 471100 - }, - { - "epoch": 0.82, - "learning_rate": 8.922038107262561e-06, - "loss": 2.3648, - "step": 471110 - }, - { - "epoch": 0.82, - "learning_rate": 8.921166167335735e-06, - "loss": 2.4046, - "step": 471120 - }, - { - "epoch": 0.82, - "learning_rate": 8.920294227408909e-06, - "loss": 2.2552, - "step": 471130 - }, - { - "epoch": 0.82, - "learning_rate": 8.919422287482083e-06, - "loss": 2.2658, - "step": 471140 - }, - { - "epoch": 0.82, - "learning_rate": 8.918550347555256e-06, - "loss": 2.3318, - "step": 471150 - }, - { - "epoch": 0.82, - "learning_rate": 8.917678407628428e-06, - "loss": 2.3344, - "step": 471160 - }, - { - "epoch": 0.82, - "learning_rate": 8.916806467701602e-06, - "loss": 2.2483, - "step": 471170 - }, - { - "epoch": 0.82, - "learning_rate": 8.915934527774774e-06, - "loss": 2.2124, - "step": 471180 - }, - { - "epoch": 0.82, - "learning_rate": 8.915062587847948e-06, - "loss": 2.2035, - "step": 471190 - }, - { - "epoch": 0.82, - "learning_rate": 8.91419064792112e-06, - "loss": 2.273, - "step": 471200 - }, - { - "epoch": 0.82, - "learning_rate": 8.913318707994296e-06, - "loss": 2.2498, - "step": 471210 - }, - { - "epoch": 0.82, - "learning_rate": 8.912446768067468e-06, - "loss": 2.2782, - "step": 471220 - }, - { - "epoch": 0.82, - "learning_rate": 8.911574828140641e-06, - "loss": 2.2999, - "step": 471230 - }, - { - "epoch": 0.82, - "learning_rate": 8.910702888213814e-06, - "loss": 2.2641, - "step": 471240 - }, - { - "epoch": 0.82, - "learning_rate": 8.909830948286987e-06, - "loss": 2.2904, - "step": 471250 - }, - { - "epoch": 0.82, - "learning_rate": 8.90895900836016e-06, - "loss": 2.2144, - "step": 471260 - }, - { - "epoch": 0.82, - "learning_rate": 8.908087068433333e-06, - "loss": 2.3191, - "step": 471270 - }, - { - "epoch": 0.82, - "learning_rate": 8.907215128506507e-06, - "loss": 2.2279, - "step": 471280 - }, - { - "epoch": 0.82, - "learning_rate": 8.90634318857968e-06, - "loss": 2.2864, - "step": 471290 - }, - { - "epoch": 0.82, - "learning_rate": 8.905471248652854e-06, - "loss": 2.2683, - "step": 471300 - }, - { - "epoch": 0.82, - "learning_rate": 8.904599308726027e-06, - "loss": 2.3209, - "step": 471310 - }, - { - "epoch": 0.82, - "learning_rate": 8.9037273687992e-06, - "loss": 2.1913, - "step": 471320 - }, - { - "epoch": 0.82, - "learning_rate": 8.902855428872372e-06, - "loss": 2.2909, - "step": 471330 - }, - { - "epoch": 0.82, - "learning_rate": 8.901983488945546e-06, - "loss": 2.3134, - "step": 471340 - }, - { - "epoch": 0.82, - "learning_rate": 8.901111549018718e-06, - "loss": 2.3285, - "step": 471350 - }, - { - "epoch": 0.82, - "learning_rate": 8.900239609091892e-06, - "loss": 2.332, - "step": 471360 - }, - { - "epoch": 0.82, - "learning_rate": 8.899367669165066e-06, - "loss": 2.3341, - "step": 471370 - }, - { - "epoch": 0.82, - "learning_rate": 8.89849572923824e-06, - "loss": 2.3178, - "step": 471380 - }, - { - "epoch": 0.82, - "learning_rate": 8.897623789311412e-06, - "loss": 2.3041, - "step": 471390 - }, - { - "epoch": 0.82, - "learning_rate": 8.896751849384585e-06, - "loss": 2.2676, - "step": 471400 - }, - { - "epoch": 0.82, - "learning_rate": 8.895879909457757e-06, - "loss": 2.1747, - "step": 471410 - }, - { - "epoch": 0.82, - "learning_rate": 8.895007969530931e-06, - "loss": 2.2763, - "step": 471420 - }, - { - "epoch": 0.82, - "learning_rate": 8.894136029604105e-06, - "loss": 2.308, - "step": 471430 - }, - { - "epoch": 0.82, - "learning_rate": 8.893264089677277e-06, - "loss": 2.242, - "step": 471440 - }, - { - "epoch": 0.82, - "learning_rate": 8.892392149750453e-06, - "loss": 2.2644, - "step": 471450 - }, - { - "epoch": 0.82, - "learning_rate": 8.891520209823625e-06, - "loss": 2.2862, - "step": 471460 - }, - { - "epoch": 0.82, - "learning_rate": 8.890648269896798e-06, - "loss": 2.231, - "step": 471470 - }, - { - "epoch": 0.82, - "learning_rate": 8.88977632996997e-06, - "loss": 2.3539, - "step": 471480 - }, - { - "epoch": 0.82, - "learning_rate": 8.888904390043144e-06, - "loss": 2.2294, - "step": 471490 - }, - { - "epoch": 0.82, - "learning_rate": 8.888032450116316e-06, - "loss": 2.2691, - "step": 471500 - }, - { - "epoch": 0.82, - "learning_rate": 8.88716051018949e-06, - "loss": 2.2838, - "step": 471510 - }, - { - "epoch": 0.82, - "learning_rate": 8.886288570262664e-06, - "loss": 2.294, - "step": 471520 - }, - { - "epoch": 0.82, - "learning_rate": 8.885416630335838e-06, - "loss": 2.4322, - "step": 471530 - }, - { - "epoch": 0.82, - "learning_rate": 8.88454469040901e-06, - "loss": 2.2711, - "step": 471540 - }, - { - "epoch": 0.82, - "learning_rate": 8.883672750482183e-06, - "loss": 2.3326, - "step": 471550 - }, - { - "epoch": 0.82, - "learning_rate": 8.882800810555357e-06, - "loss": 2.2436, - "step": 471560 - }, - { - "epoch": 0.82, - "learning_rate": 8.88192887062853e-06, - "loss": 2.2051, - "step": 471570 - }, - { - "epoch": 0.82, - "learning_rate": 8.881056930701703e-06, - "loss": 2.2299, - "step": 471580 - }, - { - "epoch": 0.82, - "learning_rate": 8.880184990774875e-06, - "loss": 2.249, - "step": 471590 - }, - { - "epoch": 0.82, - "learning_rate": 8.879313050848049e-06, - "loss": 2.1782, - "step": 471600 - }, - { - "epoch": 0.82, - "learning_rate": 8.878441110921223e-06, - "loss": 2.2804, - "step": 471610 - }, - { - "epoch": 0.82, - "learning_rate": 8.877569170994396e-06, - "loss": 2.2128, - "step": 471620 - }, - { - "epoch": 0.82, - "learning_rate": 8.876697231067569e-06, - "loss": 2.3252, - "step": 471630 - }, - { - "epoch": 0.82, - "learning_rate": 8.875825291140742e-06, - "loss": 2.1941, - "step": 471640 - }, - { - "epoch": 0.82, - "learning_rate": 8.874953351213914e-06, - "loss": 2.2615, - "step": 471650 - }, - { - "epoch": 0.82, - "learning_rate": 8.874081411287088e-06, - "loss": 2.2403, - "step": 471660 - }, - { - "epoch": 0.82, - "learning_rate": 8.87320947136026e-06, - "loss": 2.3557, - "step": 471670 - }, - { - "epoch": 0.82, - "learning_rate": 8.872337531433434e-06, - "loss": 2.4232, - "step": 471680 - }, - { - "epoch": 0.82, - "learning_rate": 8.871465591506608e-06, - "loss": 2.2799, - "step": 471690 - }, - { - "epoch": 0.82, - "learning_rate": 8.870593651579782e-06, - "loss": 2.3174, - "step": 471700 - }, - { - "epoch": 0.82, - "learning_rate": 8.869721711652955e-06, - "loss": 2.2411, - "step": 471710 - }, - { - "epoch": 0.82, - "learning_rate": 8.868849771726127e-06, - "loss": 2.2739, - "step": 471720 - }, - { - "epoch": 0.82, - "learning_rate": 8.867977831799301e-06, - "loss": 2.3006, - "step": 471730 - }, - { - "epoch": 0.82, - "learning_rate": 8.867105891872473e-06, - "loss": 2.349, - "step": 471740 - }, - { - "epoch": 0.82, - "learning_rate": 8.866233951945647e-06, - "loss": 2.257, - "step": 471750 - }, - { - "epoch": 0.82, - "learning_rate": 8.86536201201882e-06, - "loss": 2.2719, - "step": 471760 - }, - { - "epoch": 0.82, - "learning_rate": 8.864490072091995e-06, - "loss": 2.2428, - "step": 471770 - }, - { - "epoch": 0.82, - "learning_rate": 8.863618132165167e-06, - "loss": 2.2253, - "step": 471780 - }, - { - "epoch": 0.82, - "learning_rate": 8.86274619223834e-06, - "loss": 2.2227, - "step": 471790 - }, - { - "epoch": 0.82, - "learning_rate": 8.861874252311512e-06, - "loss": 2.2898, - "step": 471800 - }, - { - "epoch": 0.82, - "learning_rate": 8.861002312384686e-06, - "loss": 2.282, - "step": 471810 - }, - { - "epoch": 0.82, - "learning_rate": 8.86013037245786e-06, - "loss": 2.2486, - "step": 471820 - }, - { - "epoch": 0.82, - "learning_rate": 8.859258432531032e-06, - "loss": 2.2055, - "step": 471830 - }, - { - "epoch": 0.82, - "learning_rate": 8.858386492604206e-06, - "loss": 2.255, - "step": 471840 - }, - { - "epoch": 0.82, - "learning_rate": 8.85751455267738e-06, - "loss": 2.3003, - "step": 471850 - }, - { - "epoch": 0.82, - "learning_rate": 8.856642612750553e-06, - "loss": 2.2249, - "step": 471860 - }, - { - "epoch": 0.82, - "learning_rate": 8.855770672823725e-06, - "loss": 2.2975, - "step": 471870 - }, - { - "epoch": 0.82, - "learning_rate": 8.8548987328969e-06, - "loss": 2.2491, - "step": 471880 - }, - { - "epoch": 0.82, - "learning_rate": 8.854026792970071e-06, - "loss": 2.2417, - "step": 471890 - }, - { - "epoch": 0.82, - "learning_rate": 8.853154853043245e-06, - "loss": 2.311, - "step": 471900 - }, - { - "epoch": 0.82, - "learning_rate": 8.852282913116417e-06, - "loss": 2.4047, - "step": 471910 - }, - { - "epoch": 0.82, - "learning_rate": 8.851410973189591e-06, - "loss": 2.1646, - "step": 471920 - }, - { - "epoch": 0.82, - "learning_rate": 8.850539033262765e-06, - "loss": 2.2263, - "step": 471930 - }, - { - "epoch": 0.82, - "learning_rate": 8.849667093335938e-06, - "loss": 2.2196, - "step": 471940 - }, - { - "epoch": 0.82, - "learning_rate": 8.848795153409112e-06, - "loss": 2.2458, - "step": 471950 - }, - { - "epoch": 0.82, - "learning_rate": 8.847923213482284e-06, - "loss": 2.2693, - "step": 471960 - }, - { - "epoch": 0.82, - "learning_rate": 8.847051273555458e-06, - "loss": 2.1565, - "step": 471970 - }, - { - "epoch": 0.82, - "learning_rate": 8.84617933362863e-06, - "loss": 2.2372, - "step": 471980 - }, - { - "epoch": 0.82, - "learning_rate": 8.845307393701804e-06, - "loss": 2.2522, - "step": 471990 - }, - { - "epoch": 0.82, - "learning_rate": 8.844435453774976e-06, - "loss": 2.2716, - "step": 472000 - }, - { - "epoch": 0.82, - "learning_rate": 8.843563513848151e-06, - "loss": 2.1835, - "step": 472010 - }, - { - "epoch": 0.82, - "learning_rate": 8.842691573921324e-06, - "loss": 2.3335, - "step": 472020 - }, - { - "epoch": 0.82, - "learning_rate": 8.841819633994497e-06, - "loss": 2.2544, - "step": 472030 - }, - { - "epoch": 0.82, - "learning_rate": 8.84094769406767e-06, - "loss": 2.0631, - "step": 472040 - }, - { - "epoch": 0.82, - "learning_rate": 8.840075754140843e-06, - "loss": 2.2578, - "step": 472050 - }, - { - "epoch": 0.82, - "learning_rate": 8.839203814214015e-06, - "loss": 2.2897, - "step": 472060 - }, - { - "epoch": 0.82, - "learning_rate": 8.838331874287189e-06, - "loss": 2.2173, - "step": 472070 - }, - { - "epoch": 0.82, - "learning_rate": 8.837459934360363e-06, - "loss": 2.3199, - "step": 472080 - }, - { - "epoch": 0.82, - "learning_rate": 8.836587994433537e-06, - "loss": 2.0896, - "step": 472090 - }, - { - "epoch": 0.82, - "learning_rate": 8.83571605450671e-06, - "loss": 2.3811, - "step": 472100 - }, - { - "epoch": 0.82, - "learning_rate": 8.834844114579882e-06, - "loss": 2.3085, - "step": 472110 - }, - { - "epoch": 0.82, - "learning_rate": 8.833972174653056e-06, - "loss": 2.1882, - "step": 472120 - }, - { - "epoch": 0.82, - "learning_rate": 8.833100234726228e-06, - "loss": 2.1766, - "step": 472130 - }, - { - "epoch": 0.82, - "learning_rate": 8.832228294799402e-06, - "loss": 2.282, - "step": 472140 - }, - { - "epoch": 0.82, - "learning_rate": 8.831356354872574e-06, - "loss": 2.2908, - "step": 472150 - }, - { - "epoch": 0.82, - "learning_rate": 8.830484414945748e-06, - "loss": 2.2969, - "step": 472160 - }, - { - "epoch": 0.82, - "learning_rate": 8.829612475018922e-06, - "loss": 2.1593, - "step": 472170 - }, - { - "epoch": 0.82, - "learning_rate": 8.828740535092095e-06, - "loss": 2.3283, - "step": 472180 - }, - { - "epoch": 0.82, - "learning_rate": 8.827868595165267e-06, - "loss": 2.2766, - "step": 472190 - }, - { - "epoch": 0.82, - "learning_rate": 8.826996655238441e-06, - "loss": 2.2491, - "step": 472200 - }, - { - "epoch": 0.82, - "learning_rate": 8.826124715311615e-06, - "loss": 2.1119, - "step": 472210 - }, - { - "epoch": 0.82, - "learning_rate": 8.825252775384787e-06, - "loss": 2.2319, - "step": 472220 - }, - { - "epoch": 0.82, - "learning_rate": 8.824380835457961e-06, - "loss": 2.2156, - "step": 472230 - }, - { - "epoch": 0.82, - "learning_rate": 8.823508895531133e-06, - "loss": 2.2734, - "step": 472240 - }, - { - "epoch": 0.82, - "learning_rate": 8.822636955604308e-06, - "loss": 2.2617, - "step": 472250 - }, - { - "epoch": 0.82, - "learning_rate": 8.82176501567748e-06, - "loss": 2.3756, - "step": 472260 - }, - { - "epoch": 0.82, - "learning_rate": 8.820893075750654e-06, - "loss": 2.2669, - "step": 472270 - }, - { - "epoch": 0.82, - "learning_rate": 8.820021135823826e-06, - "loss": 2.2141, - "step": 472280 - }, - { - "epoch": 0.82, - "learning_rate": 8.819149195897e-06, - "loss": 2.3312, - "step": 472290 - }, - { - "epoch": 0.82, - "learning_rate": 8.818277255970172e-06, - "loss": 2.236, - "step": 472300 - }, - { - "epoch": 0.82, - "learning_rate": 8.817405316043346e-06, - "loss": 2.2862, - "step": 472310 - }, - { - "epoch": 0.82, - "learning_rate": 8.81653337611652e-06, - "loss": 2.2771, - "step": 472320 - }, - { - "epoch": 0.82, - "learning_rate": 8.815661436189693e-06, - "loss": 2.3653, - "step": 472330 - }, - { - "epoch": 0.82, - "learning_rate": 8.814789496262866e-06, - "loss": 2.3246, - "step": 472340 - }, - { - "epoch": 0.82, - "learning_rate": 8.81391755633604e-06, - "loss": 2.2508, - "step": 472350 - }, - { - "epoch": 0.82, - "learning_rate": 8.813045616409213e-06, - "loss": 2.1967, - "step": 472360 - }, - { - "epoch": 0.82, - "learning_rate": 8.812173676482385e-06, - "loss": 2.295, - "step": 472370 - }, - { - "epoch": 0.82, - "learning_rate": 8.811301736555559e-06, - "loss": 2.2281, - "step": 472380 - }, - { - "epoch": 0.82, - "learning_rate": 8.810429796628731e-06, - "loss": 2.4232, - "step": 472390 - }, - { - "epoch": 0.82, - "learning_rate": 8.809557856701905e-06, - "loss": 2.3171, - "step": 472400 - }, - { - "epoch": 0.82, - "learning_rate": 8.808685916775079e-06, - "loss": 2.3097, - "step": 472410 - }, - { - "epoch": 0.82, - "learning_rate": 8.807813976848252e-06, - "loss": 2.2769, - "step": 472420 - }, - { - "epoch": 0.82, - "learning_rate": 8.806942036921424e-06, - "loss": 2.2512, - "step": 472430 - }, - { - "epoch": 0.82, - "learning_rate": 8.806070096994598e-06, - "loss": 2.1086, - "step": 472440 - }, - { - "epoch": 0.82, - "learning_rate": 8.80519815706777e-06, - "loss": 2.2715, - "step": 472450 - }, - { - "epoch": 0.82, - "learning_rate": 8.804326217140944e-06, - "loss": 2.2346, - "step": 472460 - }, - { - "epoch": 0.82, - "learning_rate": 8.803454277214116e-06, - "loss": 2.241, - "step": 472470 - }, - { - "epoch": 0.82, - "learning_rate": 8.80258233728729e-06, - "loss": 2.2152, - "step": 472480 - }, - { - "epoch": 0.82, - "learning_rate": 8.801710397360465e-06, - "loss": 2.3598, - "step": 472490 - }, - { - "epoch": 0.82, - "learning_rate": 8.800838457433637e-06, - "loss": 2.3448, - "step": 472500 - }, - { - "epoch": 0.82, - "learning_rate": 8.799966517506811e-06, - "loss": 2.2179, - "step": 472510 - }, - { - "epoch": 0.82, - "learning_rate": 8.799094577579983e-06, - "loss": 2.2606, - "step": 472520 - }, - { - "epoch": 0.82, - "learning_rate": 8.798222637653157e-06, - "loss": 2.2263, - "step": 472530 - }, - { - "epoch": 0.82, - "learning_rate": 8.797350697726329e-06, - "loss": 2.3012, - "step": 472540 - }, - { - "epoch": 0.82, - "learning_rate": 8.796478757799503e-06, - "loss": 2.3341, - "step": 472550 - }, - { - "epoch": 0.82, - "learning_rate": 8.795606817872677e-06, - "loss": 2.2671, - "step": 472560 - }, - { - "epoch": 0.82, - "learning_rate": 8.79473487794585e-06, - "loss": 2.3169, - "step": 472570 - }, - { - "epoch": 0.82, - "learning_rate": 8.793862938019022e-06, - "loss": 2.209, - "step": 472580 - }, - { - "epoch": 0.82, - "learning_rate": 8.792990998092196e-06, - "loss": 2.2451, - "step": 472590 - }, - { - "epoch": 0.82, - "learning_rate": 8.792119058165368e-06, - "loss": 2.3416, - "step": 472600 - }, - { - "epoch": 0.82, - "learning_rate": 8.791247118238542e-06, - "loss": 2.2436, - "step": 472610 - }, - { - "epoch": 0.82, - "learning_rate": 8.790375178311716e-06, - "loss": 2.2272, - "step": 472620 - }, - { - "epoch": 0.82, - "learning_rate": 8.789503238384888e-06, - "loss": 2.3204, - "step": 472630 - }, - { - "epoch": 0.82, - "learning_rate": 8.788631298458062e-06, - "loss": 2.3277, - "step": 472640 - }, - { - "epoch": 0.82, - "learning_rate": 8.787759358531235e-06, - "loss": 2.3039, - "step": 472650 - }, - { - "epoch": 0.82, - "learning_rate": 8.78688741860441e-06, - "loss": 2.3434, - "step": 472660 - }, - { - "epoch": 0.82, - "learning_rate": 8.786015478677581e-06, - "loss": 2.0666, - "step": 472670 - }, - { - "epoch": 0.82, - "learning_rate": 8.785143538750755e-06, - "loss": 2.2171, - "step": 472680 - }, - { - "epoch": 0.82, - "learning_rate": 8.784271598823927e-06, - "loss": 2.2484, - "step": 472690 - }, - { - "epoch": 0.82, - "learning_rate": 8.783399658897101e-06, - "loss": 2.2546, - "step": 472700 - }, - { - "epoch": 0.82, - "learning_rate": 8.782527718970273e-06, - "loss": 2.2835, - "step": 472710 - }, - { - "epoch": 0.82, - "learning_rate": 8.781655779043447e-06, - "loss": 2.3424, - "step": 472720 - }, - { - "epoch": 0.82, - "learning_rate": 8.78078383911662e-06, - "loss": 2.3057, - "step": 472730 - }, - { - "epoch": 0.82, - "learning_rate": 8.779911899189794e-06, - "loss": 2.3289, - "step": 472740 - }, - { - "epoch": 0.82, - "learning_rate": 8.779039959262968e-06, - "loss": 2.3475, - "step": 472750 - }, - { - "epoch": 0.82, - "learning_rate": 8.77816801933614e-06, - "loss": 2.302, - "step": 472760 - }, - { - "epoch": 0.82, - "learning_rate": 8.777296079409314e-06, - "loss": 2.1842, - "step": 472770 - }, - { - "epoch": 0.82, - "learning_rate": 8.776424139482486e-06, - "loss": 2.3026, - "step": 472780 - }, - { - "epoch": 0.82, - "learning_rate": 8.77555219955566e-06, - "loss": 2.1847, - "step": 472790 - }, - { - "epoch": 0.82, - "learning_rate": 8.774680259628834e-06, - "loss": 2.1981, - "step": 472800 - }, - { - "epoch": 0.82, - "learning_rate": 8.773808319702007e-06, - "loss": 2.2417, - "step": 472810 - }, - { - "epoch": 0.82, - "learning_rate": 8.77293637977518e-06, - "loss": 2.33, - "step": 472820 - }, - { - "epoch": 0.82, - "learning_rate": 8.772064439848353e-06, - "loss": 2.2675, - "step": 472830 - }, - { - "epoch": 0.82, - "learning_rate": 8.771192499921525e-06, - "loss": 2.3211, - "step": 472840 - }, - { - "epoch": 0.82, - "learning_rate": 8.770320559994699e-06, - "loss": 2.3442, - "step": 472850 - }, - { - "epoch": 0.82, - "learning_rate": 8.769448620067871e-06, - "loss": 2.2454, - "step": 472860 - }, - { - "epoch": 0.82, - "learning_rate": 8.768576680141045e-06, - "loss": 2.3064, - "step": 472870 - }, - { - "epoch": 0.82, - "learning_rate": 8.767704740214219e-06, - "loss": 2.2671, - "step": 472880 - }, - { - "epoch": 0.82, - "learning_rate": 8.766832800287392e-06, - "loss": 2.3659, - "step": 472890 - }, - { - "epoch": 0.82, - "learning_rate": 8.765960860360566e-06, - "loss": 2.3167, - "step": 472900 - }, - { - "epoch": 0.82, - "learning_rate": 8.765088920433738e-06, - "loss": 2.3219, - "step": 472910 - }, - { - "epoch": 0.82, - "learning_rate": 8.764216980506912e-06, - "loss": 2.3309, - "step": 472920 - }, - { - "epoch": 0.82, - "learning_rate": 8.763345040580084e-06, - "loss": 2.4069, - "step": 472930 - }, - { - "epoch": 0.82, - "learning_rate": 8.762473100653258e-06, - "loss": 2.2254, - "step": 472940 - }, - { - "epoch": 0.82, - "learning_rate": 8.76160116072643e-06, - "loss": 2.4111, - "step": 472950 - }, - { - "epoch": 0.82, - "learning_rate": 8.760729220799604e-06, - "loss": 2.0802, - "step": 472960 - }, - { - "epoch": 0.82, - "learning_rate": 8.759857280872777e-06, - "loss": 2.2118, - "step": 472970 - }, - { - "epoch": 0.82, - "learning_rate": 8.758985340945951e-06, - "loss": 2.2344, - "step": 472980 - }, - { - "epoch": 0.82, - "learning_rate": 8.758113401019123e-06, - "loss": 2.1901, - "step": 472990 - }, - { - "epoch": 0.82, - "learning_rate": 8.757241461092297e-06, - "loss": 2.348, - "step": 473000 - }, - { - "epoch": 0.82, - "learning_rate": 8.756369521165471e-06, - "loss": 2.3072, - "step": 473010 - }, - { - "epoch": 0.82, - "learning_rate": 8.755497581238643e-06, - "loss": 2.2443, - "step": 473020 - }, - { - "epoch": 0.82, - "learning_rate": 8.754625641311817e-06, - "loss": 2.198, - "step": 473030 - }, - { - "epoch": 0.82, - "learning_rate": 8.753753701384989e-06, - "loss": 2.3734, - "step": 473040 - }, - { - "epoch": 0.82, - "learning_rate": 8.752881761458164e-06, - "loss": 2.1635, - "step": 473050 - }, - { - "epoch": 0.82, - "learning_rate": 8.752009821531336e-06, - "loss": 2.2393, - "step": 473060 - }, - { - "epoch": 0.82, - "learning_rate": 8.75113788160451e-06, - "loss": 2.3384, - "step": 473070 - }, - { - "epoch": 0.82, - "learning_rate": 8.750265941677682e-06, - "loss": 2.3154, - "step": 473080 - }, - { - "epoch": 0.83, - "learning_rate": 8.749394001750856e-06, - "loss": 2.284, - "step": 473090 - }, - { - "epoch": 0.83, - "learning_rate": 8.748522061824028e-06, - "loss": 2.2767, - "step": 473100 - }, - { - "epoch": 0.83, - "learning_rate": 8.747650121897202e-06, - "loss": 2.334, - "step": 473110 - }, - { - "epoch": 0.83, - "learning_rate": 8.746778181970376e-06, - "loss": 2.3093, - "step": 473120 - }, - { - "epoch": 0.83, - "learning_rate": 8.74590624204355e-06, - "loss": 2.2224, - "step": 473130 - }, - { - "epoch": 0.83, - "learning_rate": 8.745034302116723e-06, - "loss": 2.3021, - "step": 473140 - }, - { - "epoch": 0.83, - "learning_rate": 8.744162362189895e-06, - "loss": 2.1875, - "step": 473150 - }, - { - "epoch": 0.83, - "learning_rate": 8.743290422263069e-06, - "loss": 2.4325, - "step": 473160 - }, - { - "epoch": 0.83, - "learning_rate": 8.742418482336241e-06, - "loss": 2.0798, - "step": 473170 - }, - { - "epoch": 0.83, - "learning_rate": 8.741546542409415e-06, - "loss": 2.3246, - "step": 473180 - }, - { - "epoch": 0.83, - "learning_rate": 8.740674602482587e-06, - "loss": 2.2373, - "step": 473190 - }, - { - "epoch": 0.83, - "learning_rate": 8.73980266255576e-06, - "loss": 2.3055, - "step": 473200 - }, - { - "epoch": 0.83, - "learning_rate": 8.738930722628934e-06, - "loss": 2.2463, - "step": 473210 - }, - { - "epoch": 0.83, - "learning_rate": 8.738058782702108e-06, - "loss": 2.2724, - "step": 473220 - }, - { - "epoch": 0.83, - "learning_rate": 8.73718684277528e-06, - "loss": 2.2593, - "step": 473230 - }, - { - "epoch": 0.83, - "learning_rate": 8.736314902848454e-06, - "loss": 2.3198, - "step": 473240 - }, - { - "epoch": 0.83, - "learning_rate": 8.735442962921626e-06, - "loss": 2.4139, - "step": 473250 - }, - { - "epoch": 0.83, - "learning_rate": 8.7345710229948e-06, - "loss": 2.3379, - "step": 473260 - }, - { - "epoch": 0.83, - "learning_rate": 8.733699083067972e-06, - "loss": 2.3872, - "step": 473270 - }, - { - "epoch": 0.83, - "learning_rate": 8.732827143141146e-06, - "loss": 2.3133, - "step": 473280 - }, - { - "epoch": 0.83, - "learning_rate": 8.731955203214321e-06, - "loss": 2.235, - "step": 473290 - }, - { - "epoch": 0.83, - "learning_rate": 8.731083263287493e-06, - "loss": 2.1817, - "step": 473300 - }, - { - "epoch": 0.83, - "learning_rate": 8.730211323360667e-06, - "loss": 2.3015, - "step": 473310 - }, - { - "epoch": 0.83, - "learning_rate": 8.729339383433839e-06, - "loss": 2.2643, - "step": 473320 - }, - { - "epoch": 0.83, - "learning_rate": 8.728467443507013e-06, - "loss": 2.212, - "step": 473330 - }, - { - "epoch": 0.83, - "learning_rate": 8.727595503580185e-06, - "loss": 2.2544, - "step": 473340 - }, - { - "epoch": 0.83, - "learning_rate": 8.726723563653359e-06, - "loss": 2.2347, - "step": 473350 - }, - { - "epoch": 0.83, - "learning_rate": 8.725851623726532e-06, - "loss": 2.2856, - "step": 473360 - }, - { - "epoch": 0.83, - "learning_rate": 8.724979683799706e-06, - "loss": 2.2959, - "step": 473370 - }, - { - "epoch": 0.83, - "learning_rate": 8.724107743872878e-06, - "loss": 2.2593, - "step": 473380 - }, - { - "epoch": 0.83, - "learning_rate": 8.723235803946052e-06, - "loss": 2.3605, - "step": 473390 - }, - { - "epoch": 0.83, - "learning_rate": 8.722363864019224e-06, - "loss": 2.298, - "step": 473400 - }, - { - "epoch": 0.83, - "learning_rate": 8.721491924092398e-06, - "loss": 2.2265, - "step": 473410 - }, - { - "epoch": 0.83, - "learning_rate": 8.720619984165572e-06, - "loss": 2.1581, - "step": 473420 - }, - { - "epoch": 0.83, - "learning_rate": 8.719748044238744e-06, - "loss": 2.2321, - "step": 473430 - }, - { - "epoch": 0.83, - "learning_rate": 8.718876104311918e-06, - "loss": 2.3267, - "step": 473440 - }, - { - "epoch": 0.83, - "learning_rate": 8.718004164385091e-06, - "loss": 2.126, - "step": 473450 - }, - { - "epoch": 0.83, - "learning_rate": 8.717132224458265e-06, - "loss": 2.3792, - "step": 473460 - }, - { - "epoch": 0.83, - "learning_rate": 8.716260284531437e-06, - "loss": 2.23, - "step": 473470 - }, - { - "epoch": 0.83, - "learning_rate": 8.715388344604611e-06, - "loss": 2.2308, - "step": 473480 - }, - { - "epoch": 0.83, - "learning_rate": 8.714516404677783e-06, - "loss": 2.3047, - "step": 473490 - }, - { - "epoch": 0.83, - "learning_rate": 8.713644464750957e-06, - "loss": 2.2308, - "step": 473500 - }, - { - "epoch": 0.83, - "learning_rate": 8.712772524824129e-06, - "loss": 2.2924, - "step": 473510 - }, - { - "epoch": 0.83, - "learning_rate": 8.711900584897303e-06, - "loss": 2.1755, - "step": 473520 - }, - { - "epoch": 0.83, - "learning_rate": 8.711028644970476e-06, - "loss": 2.1875, - "step": 473530 - }, - { - "epoch": 0.83, - "learning_rate": 8.71015670504365e-06, - "loss": 2.3021, - "step": 473540 - }, - { - "epoch": 0.83, - "learning_rate": 8.709284765116824e-06, - "loss": 2.4189, - "step": 473550 - }, - { - "epoch": 0.83, - "learning_rate": 8.708412825189996e-06, - "loss": 2.3308, - "step": 473560 - }, - { - "epoch": 0.83, - "learning_rate": 8.70754088526317e-06, - "loss": 2.265, - "step": 473570 - }, - { - "epoch": 0.83, - "learning_rate": 8.706668945336342e-06, - "loss": 2.341, - "step": 473580 - }, - { - "epoch": 0.83, - "learning_rate": 8.705797005409516e-06, - "loss": 2.3446, - "step": 473590 - }, - { - "epoch": 0.83, - "learning_rate": 8.70492506548269e-06, - "loss": 2.3117, - "step": 473600 - }, - { - "epoch": 0.83, - "learning_rate": 8.704053125555863e-06, - "loss": 2.3387, - "step": 473610 - }, - { - "epoch": 0.83, - "learning_rate": 8.703181185629035e-06, - "loss": 2.3223, - "step": 473620 - }, - { - "epoch": 0.83, - "learning_rate": 8.702309245702209e-06, - "loss": 2.4142, - "step": 473630 - }, - { - "epoch": 0.83, - "learning_rate": 8.701437305775381e-06, - "loss": 2.2522, - "step": 473640 - }, - { - "epoch": 0.83, - "learning_rate": 8.700565365848555e-06, - "loss": 2.3146, - "step": 473650 - }, - { - "epoch": 0.83, - "learning_rate": 8.699693425921727e-06, - "loss": 2.361, - "step": 473660 - }, - { - "epoch": 0.83, - "learning_rate": 8.6988214859949e-06, - "loss": 2.3237, - "step": 473670 - }, - { - "epoch": 0.83, - "learning_rate": 8.697949546068074e-06, - "loss": 2.2429, - "step": 473680 - }, - { - "epoch": 0.83, - "learning_rate": 8.697077606141248e-06, - "loss": 2.3159, - "step": 473690 - }, - { - "epoch": 0.83, - "learning_rate": 8.696205666214422e-06, - "loss": 2.2631, - "step": 473700 - }, - { - "epoch": 0.83, - "learning_rate": 8.695333726287594e-06, - "loss": 2.29, - "step": 473710 - }, - { - "epoch": 0.83, - "learning_rate": 8.694461786360768e-06, - "loss": 2.2799, - "step": 473720 - }, - { - "epoch": 0.83, - "learning_rate": 8.69358984643394e-06, - "loss": 2.2509, - "step": 473730 - }, - { - "epoch": 0.83, - "learning_rate": 8.692717906507114e-06, - "loss": 2.2368, - "step": 473740 - }, - { - "epoch": 0.83, - "learning_rate": 8.691845966580286e-06, - "loss": 2.2955, - "step": 473750 - }, - { - "epoch": 0.83, - "learning_rate": 8.69097402665346e-06, - "loss": 2.2577, - "step": 473760 - }, - { - "epoch": 0.83, - "learning_rate": 8.690102086726633e-06, - "loss": 2.2942, - "step": 473770 - }, - { - "epoch": 0.83, - "learning_rate": 8.689230146799807e-06, - "loss": 2.3312, - "step": 473780 - }, - { - "epoch": 0.83, - "learning_rate": 8.68835820687298e-06, - "loss": 2.3195, - "step": 473790 - }, - { - "epoch": 0.83, - "learning_rate": 8.687486266946153e-06, - "loss": 2.2619, - "step": 473800 - }, - { - "epoch": 0.83, - "learning_rate": 8.686614327019327e-06, - "loss": 2.2416, - "step": 473810 - }, - { - "epoch": 0.83, - "learning_rate": 8.685742387092499e-06, - "loss": 2.2516, - "step": 473820 - }, - { - "epoch": 0.83, - "learning_rate": 8.684870447165673e-06, - "loss": 2.2919, - "step": 473830 - }, - { - "epoch": 0.83, - "learning_rate": 8.683998507238846e-06, - "loss": 2.3816, - "step": 473840 - }, - { - "epoch": 0.83, - "learning_rate": 8.68312656731202e-06, - "loss": 2.289, - "step": 473850 - }, - { - "epoch": 0.83, - "learning_rate": 8.682254627385192e-06, - "loss": 2.0979, - "step": 473860 - }, - { - "epoch": 0.83, - "learning_rate": 8.681382687458366e-06, - "loss": 2.2731, - "step": 473870 - }, - { - "epoch": 0.83, - "learning_rate": 8.680510747531538e-06, - "loss": 2.2459, - "step": 473880 - }, - { - "epoch": 0.83, - "learning_rate": 8.679638807604712e-06, - "loss": 2.4282, - "step": 473890 - }, - { - "epoch": 0.83, - "learning_rate": 8.678766867677884e-06, - "loss": 2.2064, - "step": 473900 - }, - { - "epoch": 0.83, - "learning_rate": 8.677894927751058e-06, - "loss": 2.2929, - "step": 473910 - }, - { - "epoch": 0.83, - "learning_rate": 8.677022987824231e-06, - "loss": 2.2592, - "step": 473920 - }, - { - "epoch": 0.83, - "learning_rate": 8.676151047897405e-06, - "loss": 2.2651, - "step": 473930 - }, - { - "epoch": 0.83, - "learning_rate": 8.675279107970579e-06, - "loss": 2.4204, - "step": 473940 - }, - { - "epoch": 0.83, - "learning_rate": 8.674407168043751e-06, - "loss": 2.3052, - "step": 473950 - }, - { - "epoch": 0.83, - "learning_rate": 8.673535228116925e-06, - "loss": 2.1808, - "step": 473960 - }, - { - "epoch": 0.83, - "learning_rate": 8.672663288190097e-06, - "loss": 2.2218, - "step": 473970 - }, - { - "epoch": 0.83, - "learning_rate": 8.67179134826327e-06, - "loss": 2.2774, - "step": 473980 - }, - { - "epoch": 0.83, - "learning_rate": 8.670919408336443e-06, - "loss": 2.2504, - "step": 473990 - }, - { - "epoch": 0.83, - "learning_rate": 8.670047468409616e-06, - "loss": 2.33, - "step": 474000 - }, - { - "epoch": 0.83, - "learning_rate": 8.66917552848279e-06, - "loss": 2.2848, - "step": 474010 - }, - { - "epoch": 0.83, - "learning_rate": 8.668303588555964e-06, - "loss": 2.4561, - "step": 474020 - }, - { - "epoch": 0.83, - "learning_rate": 8.667431648629136e-06, - "loss": 2.1958, - "step": 474030 - }, - { - "epoch": 0.83, - "learning_rate": 8.66655970870231e-06, - "loss": 2.3182, - "step": 474040 - }, - { - "epoch": 0.83, - "learning_rate": 8.665687768775482e-06, - "loss": 2.2682, - "step": 474050 - }, - { - "epoch": 0.83, - "learning_rate": 8.664815828848656e-06, - "loss": 2.1698, - "step": 474060 - }, - { - "epoch": 0.83, - "learning_rate": 8.663943888921828e-06, - "loss": 2.3929, - "step": 474070 - }, - { - "epoch": 0.83, - "learning_rate": 8.663071948995003e-06, - "loss": 2.325, - "step": 474080 - }, - { - "epoch": 0.83, - "learning_rate": 8.662200009068177e-06, - "loss": 2.3225, - "step": 474090 - }, - { - "epoch": 0.83, - "learning_rate": 8.661328069141349e-06, - "loss": 2.272, - "step": 474100 - }, - { - "epoch": 0.83, - "learning_rate": 8.660456129214523e-06, - "loss": 2.3747, - "step": 474110 - }, - { - "epoch": 0.83, - "learning_rate": 8.659584189287695e-06, - "loss": 2.1435, - "step": 474120 - }, - { - "epoch": 0.83, - "learning_rate": 8.658712249360869e-06, - "loss": 2.2887, - "step": 474130 - }, - { - "epoch": 0.83, - "learning_rate": 8.65784030943404e-06, - "loss": 2.3187, - "step": 474140 - }, - { - "epoch": 0.83, - "learning_rate": 8.656968369507215e-06, - "loss": 2.3637, - "step": 474150 - }, - { - "epoch": 0.83, - "learning_rate": 8.656096429580388e-06, - "loss": 2.345, - "step": 474160 - }, - { - "epoch": 0.83, - "learning_rate": 8.655224489653562e-06, - "loss": 2.2283, - "step": 474170 - }, - { - "epoch": 0.83, - "learning_rate": 8.654352549726734e-06, - "loss": 2.3356, - "step": 474180 - }, - { - "epoch": 0.83, - "learning_rate": 8.653480609799908e-06, - "loss": 2.2574, - "step": 474190 - }, - { - "epoch": 0.83, - "learning_rate": 8.65260866987308e-06, - "loss": 2.2217, - "step": 474200 - }, - { - "epoch": 0.83, - "learning_rate": 8.651736729946254e-06, - "loss": 2.3214, - "step": 474210 - }, - { - "epoch": 0.83, - "learning_rate": 8.650864790019428e-06, - "loss": 2.0708, - "step": 474220 - }, - { - "epoch": 0.83, - "learning_rate": 8.6499928500926e-06, - "loss": 2.3049, - "step": 474230 - }, - { - "epoch": 0.83, - "learning_rate": 8.649120910165773e-06, - "loss": 2.352, - "step": 474240 - }, - { - "epoch": 0.83, - "learning_rate": 8.648248970238947e-06, - "loss": 2.2065, - "step": 474250 - }, - { - "epoch": 0.83, - "learning_rate": 8.647377030312121e-06, - "loss": 2.3317, - "step": 474260 - }, - { - "epoch": 0.83, - "learning_rate": 8.646505090385293e-06, - "loss": 2.3289, - "step": 474270 - }, - { - "epoch": 0.83, - "learning_rate": 8.645633150458467e-06, - "loss": 2.2559, - "step": 474280 - }, - { - "epoch": 0.83, - "learning_rate": 8.644761210531639e-06, - "loss": 2.2624, - "step": 474290 - }, - { - "epoch": 0.83, - "learning_rate": 8.643889270604813e-06, - "loss": 2.2222, - "step": 474300 - }, - { - "epoch": 0.83, - "learning_rate": 8.643017330677985e-06, - "loss": 2.2371, - "step": 474310 - }, - { - "epoch": 0.83, - "learning_rate": 8.642145390751158e-06, - "loss": 2.2456, - "step": 474320 - }, - { - "epoch": 0.83, - "learning_rate": 8.641273450824332e-06, - "loss": 2.3452, - "step": 474330 - }, - { - "epoch": 0.83, - "learning_rate": 8.640401510897506e-06, - "loss": 2.3426, - "step": 474340 - }, - { - "epoch": 0.83, - "learning_rate": 8.63952957097068e-06, - "loss": 2.2748, - "step": 474350 - }, - { - "epoch": 0.83, - "learning_rate": 8.638657631043852e-06, - "loss": 2.2546, - "step": 474360 - }, - { - "epoch": 0.83, - "learning_rate": 8.637785691117026e-06, - "loss": 2.343, - "step": 474370 - }, - { - "epoch": 0.83, - "learning_rate": 8.636913751190198e-06, - "loss": 2.1966, - "step": 474380 - }, - { - "epoch": 0.83, - "learning_rate": 8.636041811263371e-06, - "loss": 2.3095, - "step": 474390 - }, - { - "epoch": 0.83, - "learning_rate": 8.635169871336545e-06, - "loss": 2.3294, - "step": 474400 - }, - { - "epoch": 0.83, - "learning_rate": 8.634297931409719e-06, - "loss": 2.2324, - "step": 474410 - }, - { - "epoch": 0.83, - "learning_rate": 8.633425991482891e-06, - "loss": 2.2627, - "step": 474420 - }, - { - "epoch": 0.83, - "learning_rate": 8.632554051556065e-06, - "loss": 2.313, - "step": 474430 - }, - { - "epoch": 0.83, - "learning_rate": 8.631682111629237e-06, - "loss": 2.3272, - "step": 474440 - }, - { - "epoch": 0.83, - "learning_rate": 8.63081017170241e-06, - "loss": 2.1803, - "step": 474450 - }, - { - "epoch": 0.83, - "learning_rate": 8.629938231775583e-06, - "loss": 2.2687, - "step": 474460 - }, - { - "epoch": 0.83, - "learning_rate": 8.629066291848757e-06, - "loss": 2.4158, - "step": 474470 - }, - { - "epoch": 0.83, - "learning_rate": 8.62819435192193e-06, - "loss": 2.2124, - "step": 474480 - }, - { - "epoch": 0.83, - "learning_rate": 8.627322411995104e-06, - "loss": 2.3736, - "step": 474490 - }, - { - "epoch": 0.83, - "learning_rate": 8.626450472068278e-06, - "loss": 2.3262, - "step": 474500 - }, - { - "epoch": 0.83, - "learning_rate": 8.62557853214145e-06, - "loss": 2.2829, - "step": 474510 - }, - { - "epoch": 0.83, - "learning_rate": 8.624706592214624e-06, - "loss": 2.2813, - "step": 474520 - }, - { - "epoch": 0.83, - "learning_rate": 8.623834652287796e-06, - "loss": 2.2777, - "step": 474530 - }, - { - "epoch": 0.83, - "learning_rate": 8.62296271236097e-06, - "loss": 2.3042, - "step": 474540 - }, - { - "epoch": 0.83, - "learning_rate": 8.622090772434142e-06, - "loss": 2.3596, - "step": 474550 - }, - { - "epoch": 0.83, - "learning_rate": 8.621218832507315e-06, - "loss": 2.2862, - "step": 474560 - }, - { - "epoch": 0.83, - "learning_rate": 8.62034689258049e-06, - "loss": 2.2222, - "step": 474570 - }, - { - "epoch": 0.83, - "learning_rate": 8.619474952653663e-06, - "loss": 2.1906, - "step": 474580 - }, - { - "epoch": 0.83, - "learning_rate": 8.618603012726835e-06, - "loss": 2.2666, - "step": 474590 - }, - { - "epoch": 0.83, - "learning_rate": 8.617731072800009e-06, - "loss": 2.2868, - "step": 474600 - }, - { - "epoch": 0.83, - "learning_rate": 8.616859132873183e-06, - "loss": 2.1968, - "step": 474610 - }, - { - "epoch": 0.83, - "learning_rate": 8.615987192946355e-06, - "loss": 2.3888, - "step": 474620 - }, - { - "epoch": 0.83, - "learning_rate": 8.615115253019528e-06, - "loss": 2.3294, - "step": 474630 - }, - { - "epoch": 0.83, - "learning_rate": 8.614243313092702e-06, - "loss": 2.3118, - "step": 474640 - }, - { - "epoch": 0.83, - "learning_rate": 8.613371373165876e-06, - "loss": 2.3182, - "step": 474650 - }, - { - "epoch": 0.83, - "learning_rate": 8.612499433239048e-06, - "loss": 2.3277, - "step": 474660 - }, - { - "epoch": 0.83, - "learning_rate": 8.611627493312222e-06, - "loss": 2.2815, - "step": 474670 - }, - { - "epoch": 0.83, - "learning_rate": 8.610755553385394e-06, - "loss": 2.3162, - "step": 474680 - }, - { - "epoch": 0.83, - "learning_rate": 8.609883613458568e-06, - "loss": 2.1328, - "step": 474690 - }, - { - "epoch": 0.83, - "learning_rate": 8.60901167353174e-06, - "loss": 2.2592, - "step": 474700 - }, - { - "epoch": 0.83, - "learning_rate": 8.608139733604913e-06, - "loss": 2.2275, - "step": 474710 - }, - { - "epoch": 0.83, - "learning_rate": 8.607267793678087e-06, - "loss": 2.2518, - "step": 474720 - }, - { - "epoch": 0.83, - "learning_rate": 8.606395853751261e-06, - "loss": 2.2649, - "step": 474730 - }, - { - "epoch": 0.83, - "learning_rate": 8.605523913824435e-06, - "loss": 2.2123, - "step": 474740 - }, - { - "epoch": 0.83, - "learning_rate": 8.604651973897607e-06, - "loss": 2.164, - "step": 474750 - }, - { - "epoch": 0.83, - "learning_rate": 8.60378003397078e-06, - "loss": 2.3776, - "step": 474760 - }, - { - "epoch": 0.83, - "learning_rate": 8.602908094043953e-06, - "loss": 2.3796, - "step": 474770 - }, - { - "epoch": 0.83, - "learning_rate": 8.602036154117126e-06, - "loss": 2.298, - "step": 474780 - }, - { - "epoch": 0.83, - "learning_rate": 8.601164214190299e-06, - "loss": 2.2475, - "step": 474790 - }, - { - "epoch": 0.83, - "learning_rate": 8.600292274263472e-06, - "loss": 2.2053, - "step": 474800 - }, - { - "epoch": 0.83, - "learning_rate": 8.599420334336646e-06, - "loss": 2.2316, - "step": 474810 - }, - { - "epoch": 0.83, - "learning_rate": 8.59854839440982e-06, - "loss": 2.2286, - "step": 474820 - }, - { - "epoch": 0.83, - "learning_rate": 8.597676454482992e-06, - "loss": 2.2788, - "step": 474830 - }, - { - "epoch": 0.83, - "learning_rate": 8.596804514556166e-06, - "loss": 2.2521, - "step": 474840 - }, - { - "epoch": 0.83, - "learning_rate": 8.595932574629338e-06, - "loss": 2.2762, - "step": 474850 - }, - { - "epoch": 0.83, - "learning_rate": 8.595060634702512e-06, - "loss": 2.2473, - "step": 474860 - }, - { - "epoch": 0.83, - "learning_rate": 8.594188694775685e-06, - "loss": 2.3532, - "step": 474870 - }, - { - "epoch": 0.83, - "learning_rate": 8.593316754848859e-06, - "loss": 2.3074, - "step": 474880 - }, - { - "epoch": 0.83, - "learning_rate": 8.592444814922033e-06, - "loss": 2.1724, - "step": 474890 - }, - { - "epoch": 0.83, - "learning_rate": 8.591572874995205e-06, - "loss": 2.2228, - "step": 474900 - }, - { - "epoch": 0.83, - "learning_rate": 8.590700935068379e-06, - "loss": 2.3808, - "step": 474910 - }, - { - "epoch": 0.83, - "learning_rate": 8.58982899514155e-06, - "loss": 2.1605, - "step": 474920 - }, - { - "epoch": 0.83, - "learning_rate": 8.588957055214725e-06, - "loss": 2.2464, - "step": 474930 - }, - { - "epoch": 0.83, - "learning_rate": 8.588085115287897e-06, - "loss": 2.2621, - "step": 474940 - }, - { - "epoch": 0.83, - "learning_rate": 8.58721317536107e-06, - "loss": 2.3218, - "step": 474950 - }, - { - "epoch": 0.83, - "learning_rate": 8.586341235434244e-06, - "loss": 2.2278, - "step": 474960 - }, - { - "epoch": 0.83, - "learning_rate": 8.585469295507418e-06, - "loss": 2.1249, - "step": 474970 - }, - { - "epoch": 0.83, - "learning_rate": 8.58459735558059e-06, - "loss": 2.25, - "step": 474980 - }, - { - "epoch": 0.83, - "learning_rate": 8.583725415653764e-06, - "loss": 2.2839, - "step": 474990 - }, - { - "epoch": 0.83, - "learning_rate": 8.582853475726936e-06, - "loss": 2.2192, - "step": 475000 - }, - { - "epoch": 0.83, - "learning_rate": 8.58198153580011e-06, - "loss": 2.2431, - "step": 475010 - }, - { - "epoch": 0.83, - "learning_rate": 8.581109595873283e-06, - "loss": 2.2492, - "step": 475020 - }, - { - "epoch": 0.83, - "learning_rate": 8.580237655946455e-06, - "loss": 2.343, - "step": 475030 - }, - { - "epoch": 0.83, - "learning_rate": 8.57936571601963e-06, - "loss": 2.2648, - "step": 475040 - }, - { - "epoch": 0.83, - "learning_rate": 8.578493776092803e-06, - "loss": 2.2901, - "step": 475050 - }, - { - "epoch": 0.83, - "learning_rate": 8.577621836165977e-06, - "loss": 2.3585, - "step": 475060 - }, - { - "epoch": 0.83, - "learning_rate": 8.576749896239149e-06, - "loss": 2.3025, - "step": 475070 - }, - { - "epoch": 0.83, - "learning_rate": 8.575877956312323e-06, - "loss": 2.3053, - "step": 475080 - }, - { - "epoch": 0.83, - "learning_rate": 8.575006016385495e-06, - "loss": 2.3274, - "step": 475090 - }, - { - "epoch": 0.83, - "learning_rate": 8.574134076458668e-06, - "loss": 2.2843, - "step": 475100 - }, - { - "epoch": 0.83, - "learning_rate": 8.57326213653184e-06, - "loss": 2.3102, - "step": 475110 - }, - { - "epoch": 0.83, - "learning_rate": 8.572390196605016e-06, - "loss": 2.314, - "step": 475120 - }, - { - "epoch": 0.83, - "learning_rate": 8.571518256678188e-06, - "loss": 2.2853, - "step": 475130 - }, - { - "epoch": 0.83, - "learning_rate": 8.570646316751362e-06, - "loss": 2.2918, - "step": 475140 - }, - { - "epoch": 0.83, - "learning_rate": 8.569774376824536e-06, - "loss": 2.3212, - "step": 475150 - }, - { - "epoch": 0.83, - "learning_rate": 8.568902436897708e-06, - "loss": 2.3371, - "step": 475160 - }, - { - "epoch": 0.83, - "learning_rate": 8.568030496970881e-06, - "loss": 2.2821, - "step": 475170 - }, - { - "epoch": 0.83, - "learning_rate": 8.567158557044054e-06, - "loss": 2.3053, - "step": 475180 - }, - { - "epoch": 0.83, - "learning_rate": 8.566286617117227e-06, - "loss": 2.2189, - "step": 475190 - }, - { - "epoch": 0.83, - "learning_rate": 8.565414677190401e-06, - "loss": 2.3146, - "step": 475200 - }, - { - "epoch": 0.83, - "learning_rate": 8.564542737263575e-06, - "loss": 2.2096, - "step": 475210 - }, - { - "epoch": 0.83, - "learning_rate": 8.563670797336747e-06, - "loss": 2.2926, - "step": 475220 - }, - { - "epoch": 0.83, - "learning_rate": 8.56279885740992e-06, - "loss": 2.2773, - "step": 475230 - }, - { - "epoch": 0.83, - "learning_rate": 8.561926917483093e-06, - "loss": 2.2977, - "step": 475240 - }, - { - "epoch": 0.83, - "learning_rate": 8.561054977556267e-06, - "loss": 2.3685, - "step": 475250 - }, - { - "epoch": 0.83, - "learning_rate": 8.560183037629439e-06, - "loss": 2.2174, - "step": 475260 - }, - { - "epoch": 0.83, - "learning_rate": 8.559311097702612e-06, - "loss": 2.2946, - "step": 475270 - }, - { - "epoch": 0.83, - "learning_rate": 8.558439157775786e-06, - "loss": 2.2854, - "step": 475280 - }, - { - "epoch": 0.83, - "learning_rate": 8.55756721784896e-06, - "loss": 2.2573, - "step": 475290 - }, - { - "epoch": 0.83, - "learning_rate": 8.556695277922134e-06, - "loss": 2.2262, - "step": 475300 - }, - { - "epoch": 0.83, - "learning_rate": 8.555823337995306e-06, - "loss": 2.2961, - "step": 475310 - }, - { - "epoch": 0.83, - "learning_rate": 8.55495139806848e-06, - "loss": 2.2903, - "step": 475320 - }, - { - "epoch": 0.83, - "learning_rate": 8.554079458141652e-06, - "loss": 2.2764, - "step": 475330 - }, - { - "epoch": 0.83, - "learning_rate": 8.553207518214825e-06, - "loss": 2.1476, - "step": 475340 - }, - { - "epoch": 0.83, - "learning_rate": 8.552335578287997e-06, - "loss": 2.2114, - "step": 475350 - }, - { - "epoch": 0.83, - "learning_rate": 8.551463638361171e-06, - "loss": 2.1639, - "step": 475360 - }, - { - "epoch": 0.83, - "learning_rate": 8.550591698434345e-06, - "loss": 2.3028, - "step": 475370 - }, - { - "epoch": 0.83, - "learning_rate": 8.549719758507519e-06, - "loss": 2.3741, - "step": 475380 - }, - { - "epoch": 0.83, - "learning_rate": 8.548847818580691e-06, - "loss": 2.329, - "step": 475390 - }, - { - "epoch": 0.83, - "learning_rate": 8.547975878653865e-06, - "loss": 2.4062, - "step": 475400 - }, - { - "epoch": 0.83, - "learning_rate": 8.547103938727038e-06, - "loss": 2.367, - "step": 475410 - }, - { - "epoch": 0.83, - "learning_rate": 8.54623199880021e-06, - "loss": 2.2503, - "step": 475420 - }, - { - "epoch": 0.83, - "learning_rate": 8.545360058873384e-06, - "loss": 2.1635, - "step": 475430 - }, - { - "epoch": 0.83, - "learning_rate": 8.544488118946558e-06, - "loss": 2.183, - "step": 475440 - }, - { - "epoch": 0.83, - "learning_rate": 8.543616179019732e-06, - "loss": 2.2927, - "step": 475450 - }, - { - "epoch": 0.83, - "learning_rate": 8.542744239092904e-06, - "loss": 2.297, - "step": 475460 - }, - { - "epoch": 0.83, - "learning_rate": 8.541872299166078e-06, - "loss": 2.2784, - "step": 475470 - }, - { - "epoch": 0.83, - "learning_rate": 8.54100035923925e-06, - "loss": 2.2832, - "step": 475480 - }, - { - "epoch": 0.83, - "learning_rate": 8.540128419312423e-06, - "loss": 2.2184, - "step": 475490 - }, - { - "epoch": 0.83, - "learning_rate": 8.539256479385596e-06, - "loss": 2.3449, - "step": 475500 - }, - { - "epoch": 0.83, - "learning_rate": 8.53838453945877e-06, - "loss": 2.1972, - "step": 475510 - }, - { - "epoch": 0.83, - "learning_rate": 8.537512599531943e-06, - "loss": 2.2883, - "step": 475520 - }, - { - "epoch": 0.83, - "learning_rate": 8.536640659605117e-06, - "loss": 2.3311, - "step": 475530 - }, - { - "epoch": 0.83, - "learning_rate": 8.53576871967829e-06, - "loss": 2.2036, - "step": 475540 - }, - { - "epoch": 0.83, - "learning_rate": 8.534896779751463e-06, - "loss": 2.3853, - "step": 475550 - }, - { - "epoch": 0.83, - "learning_rate": 8.534024839824636e-06, - "loss": 2.2309, - "step": 475560 - }, - { - "epoch": 0.83, - "learning_rate": 8.533152899897809e-06, - "loss": 2.3253, - "step": 475570 - }, - { - "epoch": 0.83, - "learning_rate": 8.532280959970982e-06, - "loss": 2.2249, - "step": 475580 - }, - { - "epoch": 0.83, - "learning_rate": 8.531409020044154e-06, - "loss": 2.266, - "step": 475590 - }, - { - "epoch": 0.83, - "learning_rate": 8.530537080117328e-06, - "loss": 2.3228, - "step": 475600 - }, - { - "epoch": 0.83, - "learning_rate": 8.529665140190502e-06, - "loss": 2.2028, - "step": 475610 - }, - { - "epoch": 0.83, - "learning_rate": 8.528793200263676e-06, - "loss": 2.3141, - "step": 475620 - }, - { - "epoch": 0.83, - "learning_rate": 8.527921260336848e-06, - "loss": 2.3455, - "step": 475630 - }, - { - "epoch": 0.83, - "learning_rate": 8.527049320410022e-06, - "loss": 2.3824, - "step": 475640 - }, - { - "epoch": 0.83, - "learning_rate": 8.526177380483194e-06, - "loss": 2.235, - "step": 475650 - }, - { - "epoch": 0.83, - "learning_rate": 8.525305440556367e-06, - "loss": 2.2821, - "step": 475660 - }, - { - "epoch": 0.83, - "learning_rate": 8.524433500629541e-06, - "loss": 2.1979, - "step": 475670 - }, - { - "epoch": 0.83, - "learning_rate": 8.523561560702715e-06, - "loss": 2.2468, - "step": 475680 - }, - { - "epoch": 0.83, - "learning_rate": 8.522689620775889e-06, - "loss": 2.1379, - "step": 475690 - }, - { - "epoch": 0.83, - "learning_rate": 8.52181768084906e-06, - "loss": 2.0841, - "step": 475700 - }, - { - "epoch": 0.83, - "learning_rate": 8.520945740922235e-06, - "loss": 2.2132, - "step": 475710 - }, - { - "epoch": 0.83, - "learning_rate": 8.520073800995407e-06, - "loss": 2.3213, - "step": 475720 - }, - { - "epoch": 0.83, - "learning_rate": 8.51920186106858e-06, - "loss": 2.2611, - "step": 475730 - }, - { - "epoch": 0.83, - "learning_rate": 8.518329921141752e-06, - "loss": 2.4095, - "step": 475740 - }, - { - "epoch": 0.83, - "learning_rate": 8.517457981214926e-06, - "loss": 2.2323, - "step": 475750 - }, - { - "epoch": 0.83, - "learning_rate": 8.5165860412881e-06, - "loss": 2.2982, - "step": 475760 - }, - { - "epoch": 0.83, - "learning_rate": 8.515714101361274e-06, - "loss": 2.2656, - "step": 475770 - }, - { - "epoch": 0.83, - "learning_rate": 8.514842161434446e-06, - "loss": 2.367, - "step": 475780 - }, - { - "epoch": 0.83, - "learning_rate": 8.51397022150762e-06, - "loss": 2.2024, - "step": 475790 - }, - { - "epoch": 0.83, - "learning_rate": 8.513098281580793e-06, - "loss": 2.3517, - "step": 475800 - }, - { - "epoch": 0.83, - "learning_rate": 8.512226341653965e-06, - "loss": 2.0865, - "step": 475810 - }, - { - "epoch": 0.83, - "learning_rate": 8.51135440172714e-06, - "loss": 2.3602, - "step": 475820 - }, - { - "epoch": 0.83, - "learning_rate": 8.510482461800311e-06, - "loss": 2.2982, - "step": 475830 - }, - { - "epoch": 0.83, - "learning_rate": 8.509610521873485e-06, - "loss": 2.2435, - "step": 475840 - }, - { - "epoch": 0.83, - "learning_rate": 8.508738581946659e-06, - "loss": 2.3224, - "step": 475850 - }, - { - "epoch": 0.83, - "learning_rate": 8.507866642019833e-06, - "loss": 2.2675, - "step": 475860 - }, - { - "epoch": 0.83, - "learning_rate": 8.506994702093005e-06, - "loss": 2.2746, - "step": 475870 - }, - { - "epoch": 0.83, - "learning_rate": 8.506122762166178e-06, - "loss": 2.3232, - "step": 475880 - }, - { - "epoch": 0.83, - "learning_rate": 8.50525082223935e-06, - "loss": 2.2571, - "step": 475890 - }, - { - "epoch": 0.83, - "learning_rate": 8.504378882312524e-06, - "loss": 2.3584, - "step": 475900 - }, - { - "epoch": 0.83, - "learning_rate": 8.503506942385696e-06, - "loss": 2.3146, - "step": 475910 - }, - { - "epoch": 0.83, - "learning_rate": 8.502635002458872e-06, - "loss": 2.2274, - "step": 475920 - }, - { - "epoch": 0.83, - "learning_rate": 8.501763062532044e-06, - "loss": 2.2637, - "step": 475930 - }, - { - "epoch": 0.83, - "learning_rate": 8.500891122605218e-06, - "loss": 2.3587, - "step": 475940 - }, - { - "epoch": 0.83, - "learning_rate": 8.500019182678391e-06, - "loss": 2.3065, - "step": 475950 - }, - { - "epoch": 0.83, - "learning_rate": 8.499147242751564e-06, - "loss": 2.2198, - "step": 475960 - }, - { - "epoch": 0.83, - "learning_rate": 8.498275302824737e-06, - "loss": 2.3292, - "step": 475970 - }, - { - "epoch": 0.83, - "learning_rate": 8.49740336289791e-06, - "loss": 2.3082, - "step": 475980 - }, - { - "epoch": 0.83, - "learning_rate": 8.496531422971083e-06, - "loss": 2.2775, - "step": 475990 - }, - { - "epoch": 0.83, - "learning_rate": 8.495659483044257e-06, - "loss": 2.1142, - "step": 476000 - }, - { - "epoch": 0.83, - "learning_rate": 8.49478754311743e-06, - "loss": 2.3147, - "step": 476010 - }, - { - "epoch": 0.83, - "learning_rate": 8.493915603190603e-06, - "loss": 2.2804, - "step": 476020 - }, - { - "epoch": 0.83, - "learning_rate": 8.493043663263777e-06, - "loss": 2.3113, - "step": 476030 - }, - { - "epoch": 0.83, - "learning_rate": 8.492171723336949e-06, - "loss": 2.2689, - "step": 476040 - }, - { - "epoch": 0.83, - "learning_rate": 8.491299783410122e-06, - "loss": 2.2099, - "step": 476050 - }, - { - "epoch": 0.83, - "learning_rate": 8.490427843483294e-06, - "loss": 2.2329, - "step": 476060 - }, - { - "epoch": 0.83, - "learning_rate": 8.489555903556468e-06, - "loss": 2.3424, - "step": 476070 - }, - { - "epoch": 0.83, - "learning_rate": 8.488683963629642e-06, - "loss": 2.2372, - "step": 476080 - }, - { - "epoch": 0.83, - "learning_rate": 8.487812023702816e-06, - "loss": 2.2927, - "step": 476090 - }, - { - "epoch": 0.83, - "learning_rate": 8.48694008377599e-06, - "loss": 2.1545, - "step": 476100 - }, - { - "epoch": 0.83, - "learning_rate": 8.486068143849162e-06, - "loss": 2.4383, - "step": 476110 - }, - { - "epoch": 0.83, - "learning_rate": 8.485196203922335e-06, - "loss": 2.2859, - "step": 476120 - }, - { - "epoch": 0.83, - "learning_rate": 8.484324263995507e-06, - "loss": 2.2105, - "step": 476130 - }, - { - "epoch": 0.83, - "learning_rate": 8.483452324068681e-06, - "loss": 2.1884, - "step": 476140 - }, - { - "epoch": 0.83, - "learning_rate": 8.482580384141853e-06, - "loss": 2.2681, - "step": 476150 - }, - { - "epoch": 0.83, - "learning_rate": 8.481708444215029e-06, - "loss": 2.1991, - "step": 476160 - }, - { - "epoch": 0.83, - "learning_rate": 8.480836504288201e-06, - "loss": 2.3411, - "step": 476170 - }, - { - "epoch": 0.83, - "learning_rate": 8.479964564361375e-06, - "loss": 2.1767, - "step": 476180 - }, - { - "epoch": 0.83, - "learning_rate": 8.479092624434547e-06, - "loss": 2.2779, - "step": 476190 - }, - { - "epoch": 0.83, - "learning_rate": 8.47822068450772e-06, - "loss": 2.239, - "step": 476200 - }, - { - "epoch": 0.83, - "learning_rate": 8.477348744580894e-06, - "loss": 2.3679, - "step": 476210 - }, - { - "epoch": 0.83, - "learning_rate": 8.476476804654066e-06, - "loss": 2.3923, - "step": 476220 - }, - { - "epoch": 0.83, - "learning_rate": 8.47560486472724e-06, - "loss": 2.3147, - "step": 476230 - }, - { - "epoch": 0.83, - "learning_rate": 8.474732924800414e-06, - "loss": 2.1106, - "step": 476240 - }, - { - "epoch": 0.83, - "learning_rate": 8.473860984873588e-06, - "loss": 2.4023, - "step": 476250 - }, - { - "epoch": 0.83, - "learning_rate": 8.47298904494676e-06, - "loss": 2.0389, - "step": 476260 - }, - { - "epoch": 0.83, - "learning_rate": 8.472117105019934e-06, - "loss": 2.2389, - "step": 476270 - }, - { - "epoch": 0.83, - "learning_rate": 8.471245165093106e-06, - "loss": 2.3043, - "step": 476280 - }, - { - "epoch": 0.83, - "learning_rate": 8.47037322516628e-06, - "loss": 2.1598, - "step": 476290 - }, - { - "epoch": 0.83, - "learning_rate": 8.469501285239451e-06, - "loss": 2.3241, - "step": 476300 - }, - { - "epoch": 0.83, - "learning_rate": 8.468629345312625e-06, - "loss": 2.1615, - "step": 476310 - }, - { - "epoch": 0.83, - "learning_rate": 8.467757405385799e-06, - "loss": 2.1564, - "step": 476320 - }, - { - "epoch": 0.83, - "learning_rate": 8.466885465458973e-06, - "loss": 2.3667, - "step": 476330 - }, - { - "epoch": 0.83, - "learning_rate": 8.466013525532147e-06, - "loss": 2.2494, - "step": 476340 - }, - { - "epoch": 0.83, - "learning_rate": 8.465141585605319e-06, - "loss": 2.2708, - "step": 476350 - }, - { - "epoch": 0.83, - "learning_rate": 8.464269645678492e-06, - "loss": 2.2011, - "step": 476360 - }, - { - "epoch": 0.83, - "learning_rate": 8.463397705751664e-06, - "loss": 2.3691, - "step": 476370 - }, - { - "epoch": 0.83, - "learning_rate": 8.462525765824838e-06, - "loss": 2.2554, - "step": 476380 - }, - { - "epoch": 0.83, - "learning_rate": 8.46165382589801e-06, - "loss": 2.3102, - "step": 476390 - }, - { - "epoch": 0.83, - "learning_rate": 8.460781885971184e-06, - "loss": 2.3114, - "step": 476400 - }, - { - "epoch": 0.83, - "learning_rate": 8.459909946044358e-06, - "loss": 2.2042, - "step": 476410 - }, - { - "epoch": 0.83, - "learning_rate": 8.459038006117532e-06, - "loss": 2.3707, - "step": 476420 - }, - { - "epoch": 0.83, - "learning_rate": 8.458166066190704e-06, - "loss": 2.2274, - "step": 476430 - }, - { - "epoch": 0.83, - "learning_rate": 8.457294126263877e-06, - "loss": 2.1619, - "step": 476440 - }, - { - "epoch": 0.83, - "learning_rate": 8.45642218633705e-06, - "loss": 2.3429, - "step": 476450 - }, - { - "epoch": 0.83, - "learning_rate": 8.455550246410223e-06, - "loss": 2.2992, - "step": 476460 - }, - { - "epoch": 0.83, - "learning_rate": 8.454678306483397e-06, - "loss": 2.241, - "step": 476470 - }, - { - "epoch": 0.83, - "learning_rate": 8.45380636655657e-06, - "loss": 2.2868, - "step": 476480 - }, - { - "epoch": 0.83, - "learning_rate": 8.452934426629745e-06, - "loss": 2.3155, - "step": 476490 - }, - { - "epoch": 0.83, - "learning_rate": 8.452062486702917e-06, - "loss": 2.3955, - "step": 476500 - }, - { - "epoch": 0.83, - "learning_rate": 8.45119054677609e-06, - "loss": 2.1655, - "step": 476510 - }, - { - "epoch": 0.83, - "learning_rate": 8.450318606849263e-06, - "loss": 2.3297, - "step": 476520 - }, - { - "epoch": 0.83, - "learning_rate": 8.449446666922436e-06, - "loss": 2.329, - "step": 476530 - }, - { - "epoch": 0.83, - "learning_rate": 8.448574726995608e-06, - "loss": 2.3799, - "step": 476540 - }, - { - "epoch": 0.83, - "learning_rate": 8.447702787068782e-06, - "loss": 2.2678, - "step": 476550 - }, - { - "epoch": 0.83, - "learning_rate": 8.446830847141956e-06, - "loss": 2.2957, - "step": 476560 - }, - { - "epoch": 0.83, - "learning_rate": 8.44595890721513e-06, - "loss": 2.3845, - "step": 476570 - }, - { - "epoch": 0.83, - "learning_rate": 8.445086967288302e-06, - "loss": 2.2667, - "step": 476580 - }, - { - "epoch": 0.83, - "learning_rate": 8.444215027361476e-06, - "loss": 2.1405, - "step": 476590 - }, - { - "epoch": 0.83, - "learning_rate": 8.44334308743465e-06, - "loss": 2.2881, - "step": 476600 - }, - { - "epoch": 0.83, - "learning_rate": 8.442471147507821e-06, - "loss": 2.2162, - "step": 476610 - }, - { - "epoch": 0.83, - "learning_rate": 8.441599207580995e-06, - "loss": 2.2943, - "step": 476620 - }, - { - "epoch": 0.83, - "learning_rate": 8.440727267654167e-06, - "loss": 2.315, - "step": 476630 - }, - { - "epoch": 0.83, - "learning_rate": 8.439855327727341e-06, - "loss": 2.3693, - "step": 476640 - }, - { - "epoch": 0.83, - "learning_rate": 8.438983387800515e-06, - "loss": 2.327, - "step": 476650 - }, - { - "epoch": 0.83, - "learning_rate": 8.438111447873689e-06, - "loss": 2.1879, - "step": 476660 - }, - { - "epoch": 0.83, - "learning_rate": 8.43723950794686e-06, - "loss": 2.1753, - "step": 476670 - }, - { - "epoch": 0.83, - "learning_rate": 8.436367568020034e-06, - "loss": 2.2798, - "step": 476680 - }, - { - "epoch": 0.83, - "learning_rate": 8.435495628093206e-06, - "loss": 2.252, - "step": 476690 - }, - { - "epoch": 0.83, - "learning_rate": 8.43462368816638e-06, - "loss": 2.2499, - "step": 476700 - }, - { - "epoch": 0.83, - "learning_rate": 8.433751748239552e-06, - "loss": 2.2868, - "step": 476710 - }, - { - "epoch": 0.83, - "learning_rate": 8.432879808312728e-06, - "loss": 2.3271, - "step": 476720 - }, - { - "epoch": 0.83, - "learning_rate": 8.4320078683859e-06, - "loss": 2.2499, - "step": 476730 - }, - { - "epoch": 0.83, - "learning_rate": 8.431135928459074e-06, - "loss": 2.217, - "step": 476740 - }, - { - "epoch": 0.83, - "learning_rate": 8.430263988532247e-06, - "loss": 2.2256, - "step": 476750 - }, - { - "epoch": 0.83, - "learning_rate": 8.42939204860542e-06, - "loss": 2.3777, - "step": 476760 - }, - { - "epoch": 0.83, - "learning_rate": 8.428520108678593e-06, - "loss": 2.2723, - "step": 476770 - }, - { - "epoch": 0.83, - "learning_rate": 8.427648168751765e-06, - "loss": 2.2823, - "step": 476780 - }, - { - "epoch": 0.83, - "learning_rate": 8.426776228824939e-06, - "loss": 2.2286, - "step": 476790 - }, - { - "epoch": 0.83, - "learning_rate": 8.425904288898113e-06, - "loss": 2.3359, - "step": 476800 - }, - { - "epoch": 0.83, - "learning_rate": 8.425032348971287e-06, - "loss": 2.3407, - "step": 476810 - }, - { - "epoch": 0.83, - "learning_rate": 8.424160409044459e-06, - "loss": 2.3377, - "step": 476820 - }, - { - "epoch": 0.83, - "learning_rate": 8.423288469117632e-06, - "loss": 2.3397, - "step": 476830 - }, - { - "epoch": 0.83, - "learning_rate": 8.422416529190805e-06, - "loss": 2.278, - "step": 476840 - }, - { - "epoch": 0.83, - "learning_rate": 8.421544589263978e-06, - "loss": 2.2304, - "step": 476850 - }, - { - "epoch": 0.83, - "learning_rate": 8.42067264933715e-06, - "loss": 2.1223, - "step": 476860 - }, - { - "epoch": 0.83, - "learning_rate": 8.419800709410324e-06, - "loss": 2.3049, - "step": 476870 - }, - { - "epoch": 0.83, - "learning_rate": 8.418928769483498e-06, - "loss": 2.1612, - "step": 476880 - }, - { - "epoch": 0.83, - "learning_rate": 8.418056829556672e-06, - "loss": 2.2601, - "step": 476890 - }, - { - "epoch": 0.83, - "learning_rate": 8.417184889629845e-06, - "loss": 2.2623, - "step": 476900 - }, - { - "epoch": 0.83, - "learning_rate": 8.416312949703018e-06, - "loss": 2.2977, - "step": 476910 - }, - { - "epoch": 0.83, - "learning_rate": 8.415441009776191e-06, - "loss": 2.3041, - "step": 476920 - }, - { - "epoch": 0.83, - "learning_rate": 8.414569069849363e-06, - "loss": 2.2297, - "step": 476930 - }, - { - "epoch": 0.83, - "learning_rate": 8.413697129922537e-06, - "loss": 2.2483, - "step": 476940 - }, - { - "epoch": 0.83, - "learning_rate": 8.41282518999571e-06, - "loss": 2.244, - "step": 476950 - }, - { - "epoch": 0.83, - "learning_rate": 8.411953250068885e-06, - "loss": 2.2763, - "step": 476960 - }, - { - "epoch": 0.83, - "learning_rate": 8.411081310142057e-06, - "loss": 2.2891, - "step": 476970 - }, - { - "epoch": 0.83, - "learning_rate": 8.41020937021523e-06, - "loss": 2.1821, - "step": 476980 - }, - { - "epoch": 0.83, - "learning_rate": 8.409337430288403e-06, - "loss": 2.3662, - "step": 476990 - }, - { - "epoch": 0.83, - "learning_rate": 8.408465490361576e-06, - "loss": 2.1608, - "step": 477000 - }, - { - "epoch": 0.83, - "learning_rate": 8.40759355043475e-06, - "loss": 2.2978, - "step": 477010 - }, - { - "epoch": 0.83, - "learning_rate": 8.406721610507922e-06, - "loss": 2.3339, - "step": 477020 - }, - { - "epoch": 0.83, - "learning_rate": 8.405849670581096e-06, - "loss": 2.3014, - "step": 477030 - }, - { - "epoch": 0.83, - "learning_rate": 8.40497773065427e-06, - "loss": 2.2962, - "step": 477040 - }, - { - "epoch": 0.83, - "learning_rate": 8.404105790727444e-06, - "loss": 2.2577, - "step": 477050 - }, - { - "epoch": 0.83, - "learning_rate": 8.403233850800616e-06, - "loss": 2.3116, - "step": 477060 - }, - { - "epoch": 0.83, - "learning_rate": 8.40236191087379e-06, - "loss": 2.2159, - "step": 477070 - }, - { - "epoch": 0.83, - "learning_rate": 8.401489970946961e-06, - "loss": 2.227, - "step": 477080 - }, - { - "epoch": 0.83, - "learning_rate": 8.400618031020135e-06, - "loss": 2.2024, - "step": 477090 - }, - { - "epoch": 0.83, - "learning_rate": 8.399746091093307e-06, - "loss": 2.266, - "step": 477100 - }, - { - "epoch": 0.83, - "learning_rate": 8.398874151166481e-06, - "loss": 2.2406, - "step": 477110 - }, - { - "epoch": 0.83, - "learning_rate": 8.398002211239655e-06, - "loss": 2.3288, - "step": 477120 - }, - { - "epoch": 0.83, - "learning_rate": 8.397130271312829e-06, - "loss": 2.2521, - "step": 477130 - }, - { - "epoch": 0.83, - "learning_rate": 8.396258331386002e-06, - "loss": 2.3274, - "step": 477140 - }, - { - "epoch": 0.83, - "learning_rate": 8.395386391459174e-06, - "loss": 2.3312, - "step": 477150 - }, - { - "epoch": 0.83, - "learning_rate": 8.394514451532348e-06, - "loss": 2.2442, - "step": 477160 - }, - { - "epoch": 0.83, - "learning_rate": 8.39364251160552e-06, - "loss": 2.3883, - "step": 477170 - }, - { - "epoch": 0.83, - "learning_rate": 8.392770571678694e-06, - "loss": 2.3247, - "step": 477180 - }, - { - "epoch": 0.83, - "learning_rate": 8.391898631751866e-06, - "loss": 2.1837, - "step": 477190 - }, - { - "epoch": 0.83, - "learning_rate": 8.391026691825042e-06, - "loss": 2.238, - "step": 477200 - }, - { - "epoch": 0.83, - "learning_rate": 8.390154751898214e-06, - "loss": 2.3133, - "step": 477210 - }, - { - "epoch": 0.83, - "learning_rate": 8.389282811971387e-06, - "loss": 2.312, - "step": 477220 - }, - { - "epoch": 0.83, - "learning_rate": 8.38841087204456e-06, - "loss": 2.3578, - "step": 477230 - }, - { - "epoch": 0.83, - "learning_rate": 8.387538932117733e-06, - "loss": 2.2222, - "step": 477240 - }, - { - "epoch": 0.83, - "learning_rate": 8.386666992190905e-06, - "loss": 2.3466, - "step": 477250 - }, - { - "epoch": 0.83, - "learning_rate": 8.385795052264079e-06, - "loss": 2.3018, - "step": 477260 - }, - { - "epoch": 0.83, - "learning_rate": 8.384923112337253e-06, - "loss": 2.3521, - "step": 477270 - }, - { - "epoch": 0.83, - "learning_rate": 8.384051172410427e-06, - "loss": 2.3073, - "step": 477280 - }, - { - "epoch": 0.83, - "learning_rate": 8.3831792324836e-06, - "loss": 2.095, - "step": 477290 - }, - { - "epoch": 0.83, - "learning_rate": 8.382307292556773e-06, - "loss": 2.3211, - "step": 477300 - }, - { - "epoch": 0.83, - "learning_rate": 8.381435352629946e-06, - "loss": 2.2695, - "step": 477310 - }, - { - "epoch": 0.83, - "learning_rate": 8.380563412703118e-06, - "loss": 2.263, - "step": 477320 - }, - { - "epoch": 0.83, - "learning_rate": 8.379691472776292e-06, - "loss": 2.2529, - "step": 477330 - }, - { - "epoch": 0.83, - "learning_rate": 8.378819532849464e-06, - "loss": 2.2209, - "step": 477340 - }, - { - "epoch": 0.83, - "learning_rate": 8.377947592922638e-06, - "loss": 2.3385, - "step": 477350 - }, - { - "epoch": 0.83, - "learning_rate": 8.377075652995812e-06, - "loss": 2.3037, - "step": 477360 - }, - { - "epoch": 0.83, - "learning_rate": 8.376203713068986e-06, - "loss": 2.2043, - "step": 477370 - }, - { - "epoch": 0.83, - "learning_rate": 8.375331773142158e-06, - "loss": 2.1906, - "step": 477380 - }, - { - "epoch": 0.83, - "learning_rate": 8.374459833215331e-06, - "loss": 2.4213, - "step": 477390 - }, - { - "epoch": 0.83, - "learning_rate": 8.373587893288505e-06, - "loss": 2.2054, - "step": 477400 - }, - { - "epoch": 0.83, - "learning_rate": 8.372715953361677e-06, - "loss": 2.2274, - "step": 477410 - }, - { - "epoch": 0.83, - "learning_rate": 8.371844013434851e-06, - "loss": 2.202, - "step": 477420 - }, - { - "epoch": 0.83, - "learning_rate": 8.370972073508023e-06, - "loss": 2.2219, - "step": 477430 - }, - { - "epoch": 0.83, - "learning_rate": 8.370100133581197e-06, - "loss": 2.4246, - "step": 477440 - }, - { - "epoch": 0.83, - "learning_rate": 8.36922819365437e-06, - "loss": 2.282, - "step": 477450 - }, - { - "epoch": 0.83, - "learning_rate": 8.368356253727544e-06, - "loss": 2.269, - "step": 477460 - }, - { - "epoch": 0.83, - "learning_rate": 8.367484313800716e-06, - "loss": 2.3711, - "step": 477470 - }, - { - "epoch": 0.83, - "learning_rate": 8.36661237387389e-06, - "loss": 2.3224, - "step": 477480 - }, - { - "epoch": 0.83, - "learning_rate": 8.365740433947062e-06, - "loss": 2.2139, - "step": 477490 - }, - { - "epoch": 0.83, - "learning_rate": 8.364868494020236e-06, - "loss": 2.3459, - "step": 477500 - }, - { - "epoch": 0.83, - "learning_rate": 8.36399655409341e-06, - "loss": 2.3052, - "step": 477510 - }, - { - "epoch": 0.83, - "learning_rate": 8.363124614166584e-06, - "loss": 2.2571, - "step": 477520 - }, - { - "epoch": 0.83, - "learning_rate": 8.362252674239757e-06, - "loss": 2.2173, - "step": 477530 - }, - { - "epoch": 0.83, - "learning_rate": 8.36138073431293e-06, - "loss": 2.2988, - "step": 477540 - }, - { - "epoch": 0.83, - "learning_rate": 8.360508794386103e-06, - "loss": 2.2934, - "step": 477550 - }, - { - "epoch": 0.83, - "learning_rate": 8.359636854459275e-06, - "loss": 2.3263, - "step": 477560 - }, - { - "epoch": 0.83, - "learning_rate": 8.358764914532449e-06, - "loss": 2.2333, - "step": 477570 - }, - { - "epoch": 0.83, - "learning_rate": 8.357892974605621e-06, - "loss": 2.3021, - "step": 477580 - }, - { - "epoch": 0.83, - "learning_rate": 8.357021034678795e-06, - "loss": 2.2049, - "step": 477590 - }, - { - "epoch": 0.83, - "learning_rate": 8.356149094751969e-06, - "loss": 2.2843, - "step": 477600 - }, - { - "epoch": 0.83, - "learning_rate": 8.355277154825142e-06, - "loss": 2.3238, - "step": 477610 - }, - { - "epoch": 0.83, - "learning_rate": 8.354405214898315e-06, - "loss": 2.2355, - "step": 477620 - }, - { - "epoch": 0.83, - "learning_rate": 8.353533274971488e-06, - "loss": 2.2714, - "step": 477630 - }, - { - "epoch": 0.83, - "learning_rate": 8.35266133504466e-06, - "loss": 2.268, - "step": 477640 - }, - { - "epoch": 0.83, - "learning_rate": 8.351789395117834e-06, - "loss": 2.171, - "step": 477650 - }, - { - "epoch": 0.83, - "learning_rate": 8.350917455191006e-06, - "loss": 2.3452, - "step": 477660 - }, - { - "epoch": 0.83, - "learning_rate": 8.35004551526418e-06, - "loss": 2.2659, - "step": 477670 - }, - { - "epoch": 0.83, - "learning_rate": 8.349173575337354e-06, - "loss": 2.3044, - "step": 477680 - }, - { - "epoch": 0.83, - "learning_rate": 8.348301635410528e-06, - "loss": 2.264, - "step": 477690 - }, - { - "epoch": 0.83, - "learning_rate": 8.347429695483701e-06, - "loss": 2.257, - "step": 477700 - }, - { - "epoch": 0.83, - "learning_rate": 8.346557755556873e-06, - "loss": 2.3204, - "step": 477710 - }, - { - "epoch": 0.83, - "learning_rate": 8.345685815630047e-06, - "loss": 2.1921, - "step": 477720 - }, - { - "epoch": 0.83, - "learning_rate": 8.34481387570322e-06, - "loss": 2.2204, - "step": 477730 - }, - { - "epoch": 0.83, - "learning_rate": 8.343941935776393e-06, - "loss": 2.2447, - "step": 477740 - }, - { - "epoch": 0.83, - "learning_rate": 8.343069995849565e-06, - "loss": 2.2456, - "step": 477750 - }, - { - "epoch": 0.83, - "learning_rate": 8.34219805592274e-06, - "loss": 2.2704, - "step": 477760 - }, - { - "epoch": 0.83, - "learning_rate": 8.341326115995913e-06, - "loss": 2.3506, - "step": 477770 - }, - { - "epoch": 0.83, - "learning_rate": 8.340454176069086e-06, - "loss": 2.2343, - "step": 477780 - }, - { - "epoch": 0.83, - "learning_rate": 8.339582236142258e-06, - "loss": 2.2678, - "step": 477790 - }, - { - "epoch": 0.83, - "learning_rate": 8.338710296215432e-06, - "loss": 2.2978, - "step": 477800 - }, - { - "epoch": 0.83, - "learning_rate": 8.337838356288606e-06, - "loss": 2.3624, - "step": 477810 - }, - { - "epoch": 0.83, - "learning_rate": 8.336966416361778e-06, - "loss": 2.2187, - "step": 477820 - }, - { - "epoch": 0.83, - "learning_rate": 8.336094476434952e-06, - "loss": 2.2323, - "step": 477830 - }, - { - "epoch": 0.83, - "learning_rate": 8.335222536508126e-06, - "loss": 2.3017, - "step": 477840 - }, - { - "epoch": 0.83, - "learning_rate": 8.3343505965813e-06, - "loss": 2.3545, - "step": 477850 - }, - { - "epoch": 0.83, - "learning_rate": 8.333478656654471e-06, - "loss": 2.2586, - "step": 477860 - }, - { - "epoch": 0.83, - "learning_rate": 8.332606716727645e-06, - "loss": 2.2586, - "step": 477870 - }, - { - "epoch": 0.83, - "learning_rate": 8.331734776800817e-06, - "loss": 2.3332, - "step": 477880 - }, - { - "epoch": 0.83, - "learning_rate": 8.330862836873991e-06, - "loss": 2.3111, - "step": 477890 - }, - { - "epoch": 0.83, - "learning_rate": 8.329990896947163e-06, - "loss": 2.3492, - "step": 477900 - }, - { - "epoch": 0.83, - "learning_rate": 8.329118957020337e-06, - "loss": 2.1101, - "step": 477910 - }, - { - "epoch": 0.83, - "learning_rate": 8.32824701709351e-06, - "loss": 2.2629, - "step": 477920 - }, - { - "epoch": 0.83, - "learning_rate": 8.327375077166684e-06, - "loss": 2.2899, - "step": 477930 - }, - { - "epoch": 0.83, - "learning_rate": 8.326503137239858e-06, - "loss": 2.3297, - "step": 477940 - }, - { - "epoch": 0.83, - "learning_rate": 8.32563119731303e-06, - "loss": 2.2774, - "step": 477950 - }, - { - "epoch": 0.83, - "learning_rate": 8.324759257386204e-06, - "loss": 2.2581, - "step": 477960 - }, - { - "epoch": 0.83, - "learning_rate": 8.323887317459376e-06, - "loss": 2.2566, - "step": 477970 - }, - { - "epoch": 0.83, - "learning_rate": 8.32301537753255e-06, - "loss": 2.3819, - "step": 477980 - }, - { - "epoch": 0.83, - "learning_rate": 8.322143437605722e-06, - "loss": 2.368, - "step": 477990 - }, - { - "epoch": 0.83, - "learning_rate": 8.321271497678897e-06, - "loss": 2.2201, - "step": 478000 - }, - { - "epoch": 0.83, - "learning_rate": 8.32039955775207e-06, - "loss": 2.3603, - "step": 478010 - }, - { - "epoch": 0.83, - "learning_rate": 8.319527617825243e-06, - "loss": 2.3095, - "step": 478020 - }, - { - "epoch": 0.83, - "learning_rate": 8.318655677898415e-06, - "loss": 2.2764, - "step": 478030 - }, - { - "epoch": 0.83, - "learning_rate": 8.317783737971589e-06, - "loss": 2.309, - "step": 478040 - }, - { - "epoch": 0.83, - "learning_rate": 8.316911798044761e-06, - "loss": 2.1855, - "step": 478050 - }, - { - "epoch": 0.83, - "learning_rate": 8.316039858117935e-06, - "loss": 2.3295, - "step": 478060 - }, - { - "epoch": 0.83, - "learning_rate": 8.315167918191109e-06, - "loss": 2.3916, - "step": 478070 - }, - { - "epoch": 0.83, - "learning_rate": 8.314295978264283e-06, - "loss": 2.2818, - "step": 478080 - }, - { - "epoch": 0.83, - "learning_rate": 8.313424038337456e-06, - "loss": 2.3059, - "step": 478090 - }, - { - "epoch": 0.83, - "learning_rate": 8.312552098410628e-06, - "loss": 2.3162, - "step": 478100 - }, - { - "epoch": 0.83, - "learning_rate": 8.311680158483802e-06, - "loss": 2.1499, - "step": 478110 - }, - { - "epoch": 0.83, - "learning_rate": 8.310808218556974e-06, - "loss": 2.2111, - "step": 478120 - }, - { - "epoch": 0.83, - "learning_rate": 8.309936278630148e-06, - "loss": 2.1834, - "step": 478130 - }, - { - "epoch": 0.83, - "learning_rate": 8.30906433870332e-06, - "loss": 2.3963, - "step": 478140 - }, - { - "epoch": 0.83, - "learning_rate": 8.308192398776494e-06, - "loss": 2.1821, - "step": 478150 - }, - { - "epoch": 0.83, - "learning_rate": 8.307320458849668e-06, - "loss": 2.3194, - "step": 478160 - }, - { - "epoch": 0.83, - "learning_rate": 8.306448518922841e-06, - "loss": 2.3462, - "step": 478170 - }, - { - "epoch": 0.83, - "learning_rate": 8.305576578996013e-06, - "loss": 2.2558, - "step": 478180 - }, - { - "epoch": 0.83, - "learning_rate": 8.304704639069187e-06, - "loss": 2.2729, - "step": 478190 - }, - { - "epoch": 0.83, - "learning_rate": 8.303832699142361e-06, - "loss": 2.3035, - "step": 478200 - }, - { - "epoch": 0.83, - "learning_rate": 8.302960759215533e-06, - "loss": 2.2249, - "step": 478210 - }, - { - "epoch": 0.83, - "learning_rate": 8.302088819288707e-06, - "loss": 2.1122, - "step": 478220 - }, - { - "epoch": 0.83, - "learning_rate": 8.301216879361879e-06, - "loss": 2.218, - "step": 478230 - }, - { - "epoch": 0.83, - "learning_rate": 8.300344939435054e-06, - "loss": 2.3227, - "step": 478240 - }, - { - "epoch": 0.83, - "learning_rate": 8.299472999508226e-06, - "loss": 2.2238, - "step": 478250 - }, - { - "epoch": 0.83, - "learning_rate": 8.2986010595814e-06, - "loss": 2.2789, - "step": 478260 - }, - { - "epoch": 0.83, - "learning_rate": 8.297729119654572e-06, - "loss": 2.1639, - "step": 478270 - }, - { - "epoch": 0.83, - "learning_rate": 8.296857179727746e-06, - "loss": 2.3395, - "step": 478280 - }, - { - "epoch": 0.83, - "learning_rate": 8.295985239800918e-06, - "loss": 2.334, - "step": 478290 - }, - { - "epoch": 0.83, - "learning_rate": 8.295113299874092e-06, - "loss": 2.3162, - "step": 478300 - }, - { - "epoch": 0.83, - "learning_rate": 8.294241359947266e-06, - "loss": 2.3743, - "step": 478310 - }, - { - "epoch": 0.83, - "learning_rate": 8.29336942002044e-06, - "loss": 2.2686, - "step": 478320 - }, - { - "epoch": 0.83, - "learning_rate": 8.292497480093613e-06, - "loss": 2.3226, - "step": 478330 - }, - { - "epoch": 0.83, - "learning_rate": 8.291625540166785e-06, - "loss": 2.2775, - "step": 478340 - }, - { - "epoch": 0.83, - "learning_rate": 8.290753600239959e-06, - "loss": 2.3007, - "step": 478350 - }, - { - "epoch": 0.83, - "learning_rate": 8.289881660313131e-06, - "loss": 2.2179, - "step": 478360 - }, - { - "epoch": 0.83, - "learning_rate": 8.289009720386305e-06, - "loss": 2.3176, - "step": 478370 - }, - { - "epoch": 0.83, - "learning_rate": 8.288137780459477e-06, - "loss": 2.2457, - "step": 478380 - }, - { - "epoch": 0.83, - "learning_rate": 8.28726584053265e-06, - "loss": 2.2523, - "step": 478390 - }, - { - "epoch": 0.83, - "learning_rate": 8.286393900605825e-06, - "loss": 2.3803, - "step": 478400 - }, - { - "epoch": 0.83, - "learning_rate": 8.285521960678998e-06, - "loss": 2.1909, - "step": 478410 - }, - { - "epoch": 0.83, - "learning_rate": 8.28465002075217e-06, - "loss": 2.3869, - "step": 478420 - }, - { - "epoch": 0.83, - "learning_rate": 8.283778080825344e-06, - "loss": 2.1477, - "step": 478430 - }, - { - "epoch": 0.83, - "learning_rate": 8.282906140898516e-06, - "loss": 2.2568, - "step": 478440 - }, - { - "epoch": 0.83, - "learning_rate": 8.28203420097169e-06, - "loss": 2.1575, - "step": 478450 - }, - { - "epoch": 0.83, - "learning_rate": 8.281162261044862e-06, - "loss": 2.2908, - "step": 478460 - }, - { - "epoch": 0.83, - "learning_rate": 8.280290321118036e-06, - "loss": 2.359, - "step": 478470 - }, - { - "epoch": 0.83, - "learning_rate": 8.27941838119121e-06, - "loss": 2.3087, - "step": 478480 - }, - { - "epoch": 0.83, - "learning_rate": 8.278546441264383e-06, - "loss": 2.255, - "step": 478490 - }, - { - "epoch": 0.83, - "learning_rate": 8.277674501337557e-06, - "loss": 2.2722, - "step": 478500 - }, - { - "epoch": 0.83, - "learning_rate": 8.27680256141073e-06, - "loss": 2.2536, - "step": 478510 - }, - { - "epoch": 0.83, - "learning_rate": 8.275930621483903e-06, - "loss": 2.3924, - "step": 478520 - }, - { - "epoch": 0.83, - "learning_rate": 8.275058681557075e-06, - "loss": 2.2938, - "step": 478530 - }, - { - "epoch": 0.83, - "learning_rate": 8.274186741630249e-06, - "loss": 2.2846, - "step": 478540 - }, - { - "epoch": 0.83, - "learning_rate": 8.273314801703423e-06, - "loss": 2.3374, - "step": 478550 - }, - { - "epoch": 0.83, - "learning_rate": 8.272442861776596e-06, - "loss": 2.2356, - "step": 478560 - }, - { - "epoch": 0.83, - "learning_rate": 8.271570921849768e-06, - "loss": 2.3213, - "step": 478570 - }, - { - "epoch": 0.83, - "learning_rate": 8.270698981922942e-06, - "loss": 2.2232, - "step": 478580 - }, - { - "epoch": 0.83, - "learning_rate": 8.269827041996114e-06, - "loss": 2.3631, - "step": 478590 - }, - { - "epoch": 0.83, - "learning_rate": 8.268955102069288e-06, - "loss": 2.2902, - "step": 478600 - }, - { - "epoch": 0.83, - "learning_rate": 8.268083162142462e-06, - "loss": 2.3103, - "step": 478610 - }, - { - "epoch": 0.83, - "learning_rate": 8.267211222215634e-06, - "loss": 2.3077, - "step": 478620 - }, - { - "epoch": 0.83, - "learning_rate": 8.266339282288808e-06, - "loss": 2.2374, - "step": 478630 - }, - { - "epoch": 0.83, - "learning_rate": 8.265467342361981e-06, - "loss": 2.3171, - "step": 478640 - }, - { - "epoch": 0.83, - "learning_rate": 8.264595402435155e-06, - "loss": 2.2571, - "step": 478650 - }, - { - "epoch": 0.83, - "learning_rate": 8.263723462508327e-06, - "loss": 2.2886, - "step": 478660 - }, - { - "epoch": 0.83, - "learning_rate": 8.262851522581501e-06, - "loss": 2.2503, - "step": 478670 - }, - { - "epoch": 0.83, - "learning_rate": 8.261979582654673e-06, - "loss": 2.2269, - "step": 478680 - }, - { - "epoch": 0.83, - "learning_rate": 8.261107642727847e-06, - "loss": 2.1363, - "step": 478690 - }, - { - "epoch": 0.83, - "learning_rate": 8.260235702801019e-06, - "loss": 2.2591, - "step": 478700 - }, - { - "epoch": 0.83, - "learning_rate": 8.259363762874193e-06, - "loss": 2.2295, - "step": 478710 - }, - { - "epoch": 0.83, - "learning_rate": 8.258491822947367e-06, - "loss": 2.3495, - "step": 478720 - }, - { - "epoch": 0.83, - "learning_rate": 8.25761988302054e-06, - "loss": 2.2862, - "step": 478730 - }, - { - "epoch": 0.83, - "learning_rate": 8.256747943093714e-06, - "loss": 2.1563, - "step": 478740 - }, - { - "epoch": 0.83, - "learning_rate": 8.255876003166886e-06, - "loss": 2.1802, - "step": 478750 - }, - { - "epoch": 0.83, - "learning_rate": 8.25500406324006e-06, - "loss": 2.3687, - "step": 478760 - }, - { - "epoch": 0.83, - "learning_rate": 8.254132123313232e-06, - "loss": 2.2936, - "step": 478770 - }, - { - "epoch": 0.83, - "learning_rate": 8.253260183386406e-06, - "loss": 2.1319, - "step": 478780 - }, - { - "epoch": 0.83, - "learning_rate": 8.252388243459578e-06, - "loss": 2.3441, - "step": 478790 - }, - { - "epoch": 0.83, - "learning_rate": 8.251516303532753e-06, - "loss": 2.3238, - "step": 478800 - }, - { - "epoch": 0.83, - "learning_rate": 8.250644363605925e-06, - "loss": 2.278, - "step": 478810 - }, - { - "epoch": 0.84, - "learning_rate": 8.249772423679099e-06, - "loss": 2.1985, - "step": 478820 - }, - { - "epoch": 0.84, - "learning_rate": 8.248900483752271e-06, - "loss": 2.233, - "step": 478830 - }, - { - "epoch": 0.84, - "learning_rate": 8.248028543825445e-06, - "loss": 2.3235, - "step": 478840 - }, - { - "epoch": 0.84, - "learning_rate": 8.247156603898617e-06, - "loss": 2.1668, - "step": 478850 - }, - { - "epoch": 0.84, - "learning_rate": 8.24628466397179e-06, - "loss": 2.2312, - "step": 478860 - }, - { - "epoch": 0.84, - "learning_rate": 8.245412724044965e-06, - "loss": 2.3197, - "step": 478870 - }, - { - "epoch": 0.84, - "learning_rate": 8.244540784118138e-06, - "loss": 2.2555, - "step": 478880 - }, - { - "epoch": 0.84, - "learning_rate": 8.243668844191312e-06, - "loss": 2.3698, - "step": 478890 - }, - { - "epoch": 0.84, - "learning_rate": 8.242796904264484e-06, - "loss": 2.2259, - "step": 478900 - }, - { - "epoch": 0.84, - "learning_rate": 8.241924964337658e-06, - "loss": 2.2431, - "step": 478910 - }, - { - "epoch": 0.84, - "learning_rate": 8.24105302441083e-06, - "loss": 2.239, - "step": 478920 - }, - { - "epoch": 0.84, - "learning_rate": 8.240181084484004e-06, - "loss": 2.2925, - "step": 478930 - }, - { - "epoch": 0.84, - "learning_rate": 8.239309144557176e-06, - "loss": 2.343, - "step": 478940 - }, - { - "epoch": 0.84, - "learning_rate": 8.23843720463035e-06, - "loss": 2.3523, - "step": 478950 - }, - { - "epoch": 0.84, - "learning_rate": 8.237565264703523e-06, - "loss": 2.3002, - "step": 478960 - }, - { - "epoch": 0.84, - "learning_rate": 8.236693324776697e-06, - "loss": 2.3588, - "step": 478970 - }, - { - "epoch": 0.84, - "learning_rate": 8.23582138484987e-06, - "loss": 2.1823, - "step": 478980 - }, - { - "epoch": 0.84, - "learning_rate": 8.234949444923043e-06, - "loss": 2.2792, - "step": 478990 - }, - { - "epoch": 0.84, - "learning_rate": 8.234077504996217e-06, - "loss": 2.2282, - "step": 479000 - }, - { - "epoch": 0.84, - "learning_rate": 8.233205565069389e-06, - "loss": 2.336, - "step": 479010 - }, - { - "epoch": 0.84, - "learning_rate": 8.232333625142563e-06, - "loss": 2.2917, - "step": 479020 - }, - { - "epoch": 0.84, - "learning_rate": 8.231461685215735e-06, - "loss": 2.2895, - "step": 479030 - }, - { - "epoch": 0.84, - "learning_rate": 8.23058974528891e-06, - "loss": 2.3257, - "step": 479040 - }, - { - "epoch": 0.84, - "learning_rate": 8.229717805362082e-06, - "loss": 2.2136, - "step": 479050 - }, - { - "epoch": 0.84, - "learning_rate": 8.228845865435256e-06, - "loss": 2.2063, - "step": 479060 - }, - { - "epoch": 0.84, - "learning_rate": 8.227973925508428e-06, - "loss": 2.2674, - "step": 479070 - }, - { - "epoch": 0.84, - "learning_rate": 8.227101985581602e-06, - "loss": 2.2509, - "step": 479080 - }, - { - "epoch": 0.84, - "learning_rate": 8.226230045654774e-06, - "loss": 2.2859, - "step": 479090 - }, - { - "epoch": 0.84, - "learning_rate": 8.225358105727948e-06, - "loss": 2.2561, - "step": 479100 - }, - { - "epoch": 0.84, - "learning_rate": 8.224486165801122e-06, - "loss": 2.1093, - "step": 479110 - }, - { - "epoch": 0.84, - "learning_rate": 8.223614225874295e-06, - "loss": 2.357, - "step": 479120 - }, - { - "epoch": 0.84, - "learning_rate": 8.222742285947469e-06, - "loss": 2.2259, - "step": 479130 - }, - { - "epoch": 0.84, - "learning_rate": 8.221870346020641e-06, - "loss": 2.1955, - "step": 479140 - }, - { - "epoch": 0.84, - "learning_rate": 8.220998406093815e-06, - "loss": 2.331, - "step": 479150 - }, - { - "epoch": 0.84, - "learning_rate": 8.220126466166987e-06, - "loss": 2.2185, - "step": 479160 - }, - { - "epoch": 0.84, - "learning_rate": 8.21925452624016e-06, - "loss": 2.1674, - "step": 479170 - }, - { - "epoch": 0.84, - "learning_rate": 8.218382586313333e-06, - "loss": 2.3092, - "step": 479180 - }, - { - "epoch": 0.84, - "learning_rate": 8.217510646386507e-06, - "loss": 2.2708, - "step": 479190 - }, - { - "epoch": 0.84, - "learning_rate": 8.21663870645968e-06, - "loss": 2.1897, - "step": 479200 - }, - { - "epoch": 0.84, - "learning_rate": 8.215766766532854e-06, - "loss": 2.3107, - "step": 479210 - }, - { - "epoch": 0.84, - "learning_rate": 8.214894826606026e-06, - "loss": 2.2706, - "step": 479220 - }, - { - "epoch": 0.84, - "learning_rate": 8.2140228866792e-06, - "loss": 2.2763, - "step": 479230 - }, - { - "epoch": 0.84, - "learning_rate": 8.213150946752372e-06, - "loss": 2.3406, - "step": 479240 - }, - { - "epoch": 0.84, - "learning_rate": 8.212279006825546e-06, - "loss": 2.2266, - "step": 479250 - }, - { - "epoch": 0.84, - "learning_rate": 8.21140706689872e-06, - "loss": 2.3253, - "step": 479260 - }, - { - "epoch": 0.84, - "learning_rate": 8.210535126971892e-06, - "loss": 2.2217, - "step": 479270 - }, - { - "epoch": 0.84, - "learning_rate": 8.209663187045067e-06, - "loss": 2.402, - "step": 479280 - }, - { - "epoch": 0.84, - "learning_rate": 8.20879124711824e-06, - "loss": 2.2318, - "step": 479290 - }, - { - "epoch": 0.84, - "learning_rate": 8.207919307191413e-06, - "loss": 2.3104, - "step": 479300 - }, - { - "epoch": 0.84, - "learning_rate": 8.207047367264585e-06, - "loss": 2.3706, - "step": 479310 - }, - { - "epoch": 0.84, - "learning_rate": 8.206175427337759e-06, - "loss": 2.2574, - "step": 479320 - }, - { - "epoch": 0.84, - "learning_rate": 8.205303487410931e-06, - "loss": 2.314, - "step": 479330 - }, - { - "epoch": 0.84, - "learning_rate": 8.204431547484105e-06, - "loss": 2.3643, - "step": 479340 - }, - { - "epoch": 0.84, - "learning_rate": 8.203559607557278e-06, - "loss": 2.2655, - "step": 479350 - }, - { - "epoch": 0.84, - "learning_rate": 8.202687667630452e-06, - "loss": 2.3429, - "step": 479360 - }, - { - "epoch": 0.84, - "learning_rate": 8.201815727703624e-06, - "loss": 2.2724, - "step": 479370 - }, - { - "epoch": 0.84, - "learning_rate": 8.200943787776798e-06, - "loss": 2.2427, - "step": 479380 - }, - { - "epoch": 0.84, - "learning_rate": 8.20007184784997e-06, - "loss": 2.2363, - "step": 479390 - }, - { - "epoch": 0.84, - "learning_rate": 8.199199907923144e-06, - "loss": 2.2567, - "step": 479400 - }, - { - "epoch": 0.84, - "learning_rate": 8.198327967996318e-06, - "loss": 2.3317, - "step": 479410 - }, - { - "epoch": 0.84, - "learning_rate": 8.19745602806949e-06, - "loss": 2.2863, - "step": 479420 - }, - { - "epoch": 0.84, - "learning_rate": 8.196584088142664e-06, - "loss": 2.2565, - "step": 479430 - }, - { - "epoch": 0.84, - "learning_rate": 8.195712148215837e-06, - "loss": 2.2854, - "step": 479440 - }, - { - "epoch": 0.84, - "learning_rate": 8.194840208289011e-06, - "loss": 2.2641, - "step": 479450 - }, - { - "epoch": 0.84, - "learning_rate": 8.193968268362183e-06, - "loss": 2.1641, - "step": 479460 - }, - { - "epoch": 0.84, - "learning_rate": 8.193096328435357e-06, - "loss": 2.3432, - "step": 479470 - }, - { - "epoch": 0.84, - "learning_rate": 8.192224388508529e-06, - "loss": 2.3654, - "step": 479480 - }, - { - "epoch": 0.84, - "learning_rate": 8.191352448581703e-06, - "loss": 2.3545, - "step": 479490 - }, - { - "epoch": 0.84, - "learning_rate": 8.190480508654875e-06, - "loss": 2.2171, - "step": 479500 - }, - { - "epoch": 0.84, - "learning_rate": 8.189608568728049e-06, - "loss": 2.2121, - "step": 479510 - }, - { - "epoch": 0.84, - "learning_rate": 8.188736628801222e-06, - "loss": 2.252, - "step": 479520 - }, - { - "epoch": 0.84, - "learning_rate": 8.187864688874396e-06, - "loss": 2.2926, - "step": 479530 - }, - { - "epoch": 0.84, - "learning_rate": 8.18699274894757e-06, - "loss": 2.2659, - "step": 479540 - }, - { - "epoch": 0.84, - "learning_rate": 8.186120809020742e-06, - "loss": 2.2368, - "step": 479550 - }, - { - "epoch": 0.84, - "learning_rate": 8.185248869093916e-06, - "loss": 2.1699, - "step": 479560 - }, - { - "epoch": 0.84, - "learning_rate": 8.184376929167088e-06, - "loss": 2.1985, - "step": 479570 - }, - { - "epoch": 0.84, - "learning_rate": 8.183504989240262e-06, - "loss": 2.38, - "step": 479580 - }, - { - "epoch": 0.84, - "learning_rate": 8.182633049313435e-06, - "loss": 2.3618, - "step": 479590 - }, - { - "epoch": 0.84, - "learning_rate": 8.181761109386609e-06, - "loss": 2.1832, - "step": 479600 - }, - { - "epoch": 0.84, - "learning_rate": 8.180889169459781e-06, - "loss": 2.3349, - "step": 479610 - }, - { - "epoch": 0.84, - "learning_rate": 8.180017229532955e-06, - "loss": 2.2448, - "step": 479620 - }, - { - "epoch": 0.84, - "learning_rate": 8.179145289606127e-06, - "loss": 2.3394, - "step": 479630 - }, - { - "epoch": 0.84, - "learning_rate": 8.1782733496793e-06, - "loss": 2.1557, - "step": 479640 - }, - { - "epoch": 0.84, - "learning_rate": 8.177401409752473e-06, - "loss": 2.3075, - "step": 479650 - }, - { - "epoch": 0.84, - "learning_rate": 8.176529469825647e-06, - "loss": 2.3287, - "step": 479660 - }, - { - "epoch": 0.84, - "learning_rate": 8.17565752989882e-06, - "loss": 2.2642, - "step": 479670 - }, - { - "epoch": 0.84, - "learning_rate": 8.174785589971994e-06, - "loss": 2.2515, - "step": 479680 - }, - { - "epoch": 0.84, - "learning_rate": 8.173913650045168e-06, - "loss": 2.207, - "step": 479690 - }, - { - "epoch": 0.84, - "learning_rate": 8.17304171011834e-06, - "loss": 2.1875, - "step": 479700 - }, - { - "epoch": 0.84, - "learning_rate": 8.172169770191514e-06, - "loss": 2.2395, - "step": 479710 - }, - { - "epoch": 0.84, - "learning_rate": 8.171297830264686e-06, - "loss": 2.1905, - "step": 479720 - }, - { - "epoch": 0.84, - "learning_rate": 8.17042589033786e-06, - "loss": 2.1485, - "step": 479730 - }, - { - "epoch": 0.84, - "learning_rate": 8.169553950411032e-06, - "loss": 2.2559, - "step": 479740 - }, - { - "epoch": 0.84, - "learning_rate": 8.168682010484206e-06, - "loss": 2.2627, - "step": 479750 - }, - { - "epoch": 0.84, - "learning_rate": 8.16781007055738e-06, - "loss": 2.2057, - "step": 479760 - }, - { - "epoch": 0.84, - "learning_rate": 8.166938130630553e-06, - "loss": 2.2042, - "step": 479770 - }, - { - "epoch": 0.84, - "learning_rate": 8.166066190703725e-06, - "loss": 2.3729, - "step": 479780 - }, - { - "epoch": 0.84, - "learning_rate": 8.165194250776899e-06, - "loss": 2.2418, - "step": 479790 - }, - { - "epoch": 0.84, - "learning_rate": 8.164322310850073e-06, - "loss": 2.2083, - "step": 479800 - }, - { - "epoch": 0.84, - "learning_rate": 8.163450370923245e-06, - "loss": 2.2266, - "step": 479810 - }, - { - "epoch": 0.84, - "learning_rate": 8.162578430996419e-06, - "loss": 2.2944, - "step": 479820 - }, - { - "epoch": 0.84, - "learning_rate": 8.16170649106959e-06, - "loss": 2.3304, - "step": 479830 - }, - { - "epoch": 0.84, - "learning_rate": 8.160834551142766e-06, - "loss": 2.2266, - "step": 479840 - }, - { - "epoch": 0.84, - "learning_rate": 8.159962611215938e-06, - "loss": 2.2574, - "step": 479850 - }, - { - "epoch": 0.84, - "learning_rate": 8.159090671289112e-06, - "loss": 2.3289, - "step": 479860 - }, - { - "epoch": 0.84, - "learning_rate": 8.158218731362284e-06, - "loss": 2.1495, - "step": 479870 - }, - { - "epoch": 0.84, - "learning_rate": 8.157346791435458e-06, - "loss": 2.2967, - "step": 479880 - }, - { - "epoch": 0.84, - "learning_rate": 8.15647485150863e-06, - "loss": 2.2817, - "step": 479890 - }, - { - "epoch": 0.84, - "learning_rate": 8.155602911581804e-06, - "loss": 2.2873, - "step": 479900 - }, - { - "epoch": 0.84, - "learning_rate": 8.154730971654977e-06, - "loss": 2.3343, - "step": 479910 - }, - { - "epoch": 0.84, - "learning_rate": 8.153859031728151e-06, - "loss": 2.1899, - "step": 479920 - }, - { - "epoch": 0.84, - "learning_rate": 8.152987091801325e-06, - "loss": 2.2454, - "step": 479930 - }, - { - "epoch": 0.84, - "learning_rate": 8.152115151874497e-06, - "loss": 2.1721, - "step": 479940 - }, - { - "epoch": 0.84, - "learning_rate": 8.15124321194767e-06, - "loss": 2.2329, - "step": 479950 - }, - { - "epoch": 0.84, - "learning_rate": 8.150371272020843e-06, - "loss": 2.3818, - "step": 479960 - }, - { - "epoch": 0.84, - "learning_rate": 8.149499332094017e-06, - "loss": 2.2541, - "step": 479970 - }, - { - "epoch": 0.84, - "learning_rate": 8.148627392167189e-06, - "loss": 2.3348, - "step": 479980 - }, - { - "epoch": 0.84, - "learning_rate": 8.147755452240362e-06, - "loss": 2.2227, - "step": 479990 - }, - { - "epoch": 0.84, - "learning_rate": 8.146883512313536e-06, - "loss": 2.1823, - "step": 480000 - }, - { - "epoch": 0.84, - "learning_rate": 8.14601157238671e-06, - "loss": 2.2014, - "step": 480010 - }, - { - "epoch": 0.84, - "learning_rate": 8.145139632459882e-06, - "loss": 2.346, - "step": 480020 - }, - { - "epoch": 0.84, - "learning_rate": 8.144267692533056e-06, - "loss": 2.265, - "step": 480030 - }, - { - "epoch": 0.84, - "learning_rate": 8.143395752606228e-06, - "loss": 2.3703, - "step": 480040 - }, - { - "epoch": 0.84, - "learning_rate": 8.142523812679402e-06, - "loss": 2.1757, - "step": 480050 - }, - { - "epoch": 0.84, - "learning_rate": 8.141651872752575e-06, - "loss": 2.2442, - "step": 480060 - }, - { - "epoch": 0.84, - "learning_rate": 8.140779932825748e-06, - "loss": 2.3107, - "step": 480070 - }, - { - "epoch": 0.84, - "learning_rate": 8.139907992898923e-06, - "loss": 2.1683, - "step": 480080 - }, - { - "epoch": 0.84, - "learning_rate": 8.139036052972095e-06, - "loss": 2.3207, - "step": 480090 - }, - { - "epoch": 0.84, - "learning_rate": 8.138164113045269e-06, - "loss": 2.2354, - "step": 480100 - }, - { - "epoch": 0.84, - "learning_rate": 8.137292173118441e-06, - "loss": 2.2828, - "step": 480110 - }, - { - "epoch": 0.84, - "learning_rate": 8.136420233191615e-06, - "loss": 2.3285, - "step": 480120 - }, - { - "epoch": 0.84, - "learning_rate": 8.135548293264787e-06, - "loss": 2.2609, - "step": 480130 - }, - { - "epoch": 0.84, - "learning_rate": 8.13467635333796e-06, - "loss": 2.2757, - "step": 480140 - }, - { - "epoch": 0.84, - "learning_rate": 8.133804413411134e-06, - "loss": 2.2774, - "step": 480150 - }, - { - "epoch": 0.84, - "learning_rate": 8.132932473484308e-06, - "loss": 2.2263, - "step": 480160 - }, - { - "epoch": 0.84, - "learning_rate": 8.13206053355748e-06, - "loss": 2.2212, - "step": 480170 - }, - { - "epoch": 0.84, - "learning_rate": 8.131188593630654e-06, - "loss": 2.363, - "step": 480180 - }, - { - "epoch": 0.84, - "learning_rate": 8.130316653703828e-06, - "loss": 2.2706, - "step": 480190 - }, - { - "epoch": 0.84, - "learning_rate": 8.129444713777e-06, - "loss": 2.3416, - "step": 480200 - }, - { - "epoch": 0.84, - "learning_rate": 8.128572773850174e-06, - "loss": 2.2542, - "step": 480210 - }, - { - "epoch": 0.84, - "learning_rate": 8.127700833923346e-06, - "loss": 2.3508, - "step": 480220 - }, - { - "epoch": 0.84, - "learning_rate": 8.12682889399652e-06, - "loss": 2.2711, - "step": 480230 - }, - { - "epoch": 0.84, - "learning_rate": 8.125956954069693e-06, - "loss": 2.3115, - "step": 480240 - }, - { - "epoch": 0.84, - "learning_rate": 8.125085014142867e-06, - "loss": 2.2974, - "step": 480250 - }, - { - "epoch": 0.84, - "learning_rate": 8.124213074216039e-06, - "loss": 2.1337, - "step": 480260 - }, - { - "epoch": 0.84, - "learning_rate": 8.123341134289213e-06, - "loss": 2.3016, - "step": 480270 - }, - { - "epoch": 0.84, - "learning_rate": 8.122469194362385e-06, - "loss": 2.1987, - "step": 480280 - }, - { - "epoch": 0.84, - "learning_rate": 8.121597254435559e-06, - "loss": 2.1943, - "step": 480290 - }, - { - "epoch": 0.84, - "learning_rate": 8.12072531450873e-06, - "loss": 2.2346, - "step": 480300 - }, - { - "epoch": 0.84, - "learning_rate": 8.119853374581904e-06, - "loss": 2.2797, - "step": 480310 - }, - { - "epoch": 0.84, - "learning_rate": 8.118981434655078e-06, - "loss": 2.2062, - "step": 480320 - }, - { - "epoch": 0.84, - "learning_rate": 8.118109494728252e-06, - "loss": 2.3208, - "step": 480330 - }, - { - "epoch": 0.84, - "learning_rate": 8.117237554801426e-06, - "loss": 2.2687, - "step": 480340 - }, - { - "epoch": 0.84, - "learning_rate": 8.116365614874598e-06, - "loss": 2.292, - "step": 480350 - }, - { - "epoch": 0.84, - "learning_rate": 8.115493674947772e-06, - "loss": 2.2818, - "step": 480360 - }, - { - "epoch": 0.84, - "learning_rate": 8.114621735020944e-06, - "loss": 2.2127, - "step": 480370 - }, - { - "epoch": 0.84, - "learning_rate": 8.113749795094117e-06, - "loss": 2.329, - "step": 480380 - }, - { - "epoch": 0.84, - "learning_rate": 8.112877855167291e-06, - "loss": 2.2776, - "step": 480390 - }, - { - "epoch": 0.84, - "learning_rate": 8.112005915240465e-06, - "loss": 2.2102, - "step": 480400 - }, - { - "epoch": 0.84, - "learning_rate": 8.111133975313637e-06, - "loss": 2.2094, - "step": 480410 - }, - { - "epoch": 0.84, - "learning_rate": 8.11026203538681e-06, - "loss": 2.3016, - "step": 480420 - }, - { - "epoch": 0.84, - "learning_rate": 8.109390095459983e-06, - "loss": 2.14, - "step": 480430 - }, - { - "epoch": 0.84, - "learning_rate": 8.108518155533157e-06, - "loss": 2.3096, - "step": 480440 - }, - { - "epoch": 0.84, - "learning_rate": 8.107646215606329e-06, - "loss": 2.1247, - "step": 480450 - }, - { - "epoch": 0.84, - "learning_rate": 8.106774275679503e-06, - "loss": 2.2972, - "step": 480460 - }, - { - "epoch": 0.84, - "learning_rate": 8.105902335752676e-06, - "loss": 2.1919, - "step": 480470 - }, - { - "epoch": 0.84, - "learning_rate": 8.10503039582585e-06, - "loss": 2.2875, - "step": 480480 - }, - { - "epoch": 0.84, - "learning_rate": 8.104158455899024e-06, - "loss": 2.2854, - "step": 480490 - }, - { - "epoch": 0.84, - "learning_rate": 8.103286515972196e-06, - "loss": 2.2843, - "step": 480500 - }, - { - "epoch": 0.84, - "learning_rate": 8.10241457604537e-06, - "loss": 2.305, - "step": 480510 - }, - { - "epoch": 0.84, - "learning_rate": 8.101542636118542e-06, - "loss": 2.2146, - "step": 480520 - }, - { - "epoch": 0.84, - "learning_rate": 8.100670696191716e-06, - "loss": 2.3983, - "step": 480530 - }, - { - "epoch": 0.84, - "learning_rate": 8.099798756264888e-06, - "loss": 2.3358, - "step": 480540 - }, - { - "epoch": 0.84, - "learning_rate": 8.098926816338061e-06, - "loss": 2.3233, - "step": 480550 - }, - { - "epoch": 0.84, - "learning_rate": 8.098054876411235e-06, - "loss": 2.3578, - "step": 480560 - }, - { - "epoch": 0.84, - "learning_rate": 8.097182936484409e-06, - "loss": 2.2986, - "step": 480570 - }, - { - "epoch": 0.84, - "learning_rate": 8.096310996557581e-06, - "loss": 2.2543, - "step": 480580 - }, - { - "epoch": 0.84, - "learning_rate": 8.095439056630755e-06, - "loss": 2.3527, - "step": 480590 - }, - { - "epoch": 0.84, - "learning_rate": 8.094567116703929e-06, - "loss": 2.1944, - "step": 480600 - }, - { - "epoch": 0.84, - "learning_rate": 8.0936951767771e-06, - "loss": 2.2564, - "step": 480610 - }, - { - "epoch": 0.84, - "learning_rate": 8.092823236850274e-06, - "loss": 2.3215, - "step": 480620 - }, - { - "epoch": 0.84, - "learning_rate": 8.091951296923448e-06, - "loss": 2.4512, - "step": 480630 - }, - { - "epoch": 0.84, - "learning_rate": 8.091079356996622e-06, - "loss": 2.4279, - "step": 480640 - }, - { - "epoch": 0.84, - "learning_rate": 8.090207417069794e-06, - "loss": 2.212, - "step": 480650 - }, - { - "epoch": 0.84, - "learning_rate": 8.089335477142968e-06, - "loss": 2.2486, - "step": 480660 - }, - { - "epoch": 0.84, - "learning_rate": 8.08846353721614e-06, - "loss": 2.2339, - "step": 480670 - }, - { - "epoch": 0.84, - "learning_rate": 8.087591597289314e-06, - "loss": 2.2987, - "step": 480680 - }, - { - "epoch": 0.84, - "learning_rate": 8.086719657362486e-06, - "loss": 2.1942, - "step": 480690 - }, - { - "epoch": 0.84, - "learning_rate": 8.08584771743566e-06, - "loss": 2.3314, - "step": 480700 - }, - { - "epoch": 0.84, - "learning_rate": 8.084975777508833e-06, - "loss": 2.2799, - "step": 480710 - }, - { - "epoch": 0.84, - "learning_rate": 8.084103837582007e-06, - "loss": 2.2056, - "step": 480720 - }, - { - "epoch": 0.84, - "learning_rate": 8.08323189765518e-06, - "loss": 2.3055, - "step": 480730 - }, - { - "epoch": 0.84, - "learning_rate": 8.082359957728353e-06, - "loss": 2.3243, - "step": 480740 - }, - { - "epoch": 0.84, - "learning_rate": 8.081488017801527e-06, - "loss": 2.2711, - "step": 480750 - }, - { - "epoch": 0.84, - "learning_rate": 8.080616077874699e-06, - "loss": 2.1675, - "step": 480760 - }, - { - "epoch": 0.84, - "learning_rate": 8.079744137947872e-06, - "loss": 2.3482, - "step": 480770 - }, - { - "epoch": 0.84, - "learning_rate": 8.078872198021045e-06, - "loss": 2.3446, - "step": 480780 - }, - { - "epoch": 0.84, - "learning_rate": 8.078000258094218e-06, - "loss": 2.3303, - "step": 480790 - }, - { - "epoch": 0.84, - "learning_rate": 8.077128318167392e-06, - "loss": 1.9281, - "step": 480800 - }, - { - "epoch": 0.84, - "learning_rate": 8.076256378240566e-06, - "loss": 2.3201, - "step": 480810 - }, - { - "epoch": 0.84, - "learning_rate": 8.075384438313738e-06, - "loss": 2.2839, - "step": 480820 - }, - { - "epoch": 0.84, - "learning_rate": 8.074512498386912e-06, - "loss": 2.2934, - "step": 480830 - }, - { - "epoch": 0.84, - "learning_rate": 8.073640558460084e-06, - "loss": 2.193, - "step": 480840 - }, - { - "epoch": 0.84, - "learning_rate": 8.072768618533258e-06, - "loss": 2.3585, - "step": 480850 - }, - { - "epoch": 0.84, - "learning_rate": 8.071896678606431e-06, - "loss": 2.2978, - "step": 480860 - }, - { - "epoch": 0.84, - "learning_rate": 8.071024738679605e-06, - "loss": 2.1496, - "step": 480870 - }, - { - "epoch": 0.84, - "learning_rate": 8.070152798752779e-06, - "loss": 2.2767, - "step": 480880 - }, - { - "epoch": 0.84, - "learning_rate": 8.069280858825951e-06, - "loss": 2.2877, - "step": 480890 - }, - { - "epoch": 0.84, - "learning_rate": 8.068408918899125e-06, - "loss": 2.3053, - "step": 480900 - }, - { - "epoch": 0.84, - "learning_rate": 8.067536978972297e-06, - "loss": 2.3108, - "step": 480910 - }, - { - "epoch": 0.84, - "learning_rate": 8.06666503904547e-06, - "loss": 2.2701, - "step": 480920 - }, - { - "epoch": 0.84, - "learning_rate": 8.065793099118643e-06, - "loss": 2.311, - "step": 480930 - }, - { - "epoch": 0.84, - "learning_rate": 8.064921159191816e-06, - "loss": 2.3655, - "step": 480940 - }, - { - "epoch": 0.84, - "learning_rate": 8.06404921926499e-06, - "loss": 2.2268, - "step": 480950 - }, - { - "epoch": 0.84, - "learning_rate": 8.063177279338164e-06, - "loss": 2.2901, - "step": 480960 - }, - { - "epoch": 0.84, - "learning_rate": 8.062305339411336e-06, - "loss": 2.3973, - "step": 480970 - }, - { - "epoch": 0.84, - "learning_rate": 8.06143339948451e-06, - "loss": 2.2896, - "step": 480980 - }, - { - "epoch": 0.84, - "learning_rate": 8.060561459557684e-06, - "loss": 2.3095, - "step": 480990 - }, - { - "epoch": 0.84, - "learning_rate": 8.059689519630856e-06, - "loss": 2.2738, - "step": 481000 - }, - { - "epoch": 0.84, - "learning_rate": 8.05881757970403e-06, - "loss": 2.2752, - "step": 481010 - }, - { - "epoch": 0.84, - "learning_rate": 8.057945639777201e-06, - "loss": 2.2745, - "step": 481020 - }, - { - "epoch": 0.84, - "learning_rate": 8.057073699850375e-06, - "loss": 2.3201, - "step": 481030 - }, - { - "epoch": 0.84, - "learning_rate": 8.056201759923549e-06, - "loss": 2.2116, - "step": 481040 - }, - { - "epoch": 0.84, - "learning_rate": 8.055329819996723e-06, - "loss": 2.1865, - "step": 481050 - }, - { - "epoch": 0.84, - "learning_rate": 8.054457880069895e-06, - "loss": 2.3133, - "step": 481060 - }, - { - "epoch": 0.84, - "learning_rate": 8.053585940143069e-06, - "loss": 2.3008, - "step": 481070 - }, - { - "epoch": 0.84, - "learning_rate": 8.05271400021624e-06, - "loss": 2.2959, - "step": 481080 - }, - { - "epoch": 0.84, - "learning_rate": 8.051842060289414e-06, - "loss": 2.2652, - "step": 481090 - }, - { - "epoch": 0.84, - "learning_rate": 8.050970120362587e-06, - "loss": 2.2254, - "step": 481100 - }, - { - "epoch": 0.84, - "learning_rate": 8.05009818043576e-06, - "loss": 2.1458, - "step": 481110 - }, - { - "epoch": 0.84, - "learning_rate": 8.049226240508934e-06, - "loss": 2.2771, - "step": 481120 - }, - { - "epoch": 0.84, - "learning_rate": 8.048354300582108e-06, - "loss": 2.3495, - "step": 481130 - }, - { - "epoch": 0.84, - "learning_rate": 8.047482360655282e-06, - "loss": 2.2648, - "step": 481140 - }, - { - "epoch": 0.84, - "learning_rate": 8.046610420728454e-06, - "loss": 2.2246, - "step": 481150 - }, - { - "epoch": 0.84, - "learning_rate": 8.045738480801627e-06, - "loss": 2.3191, - "step": 481160 - }, - { - "epoch": 0.84, - "learning_rate": 8.0448665408748e-06, - "loss": 2.2598, - "step": 481170 - }, - { - "epoch": 0.84, - "learning_rate": 8.043994600947973e-06, - "loss": 2.2898, - "step": 481180 - }, - { - "epoch": 0.84, - "learning_rate": 8.043122661021147e-06, - "loss": 2.395, - "step": 481190 - }, - { - "epoch": 0.84, - "learning_rate": 8.042250721094321e-06, - "loss": 2.2812, - "step": 481200 - }, - { - "epoch": 0.84, - "learning_rate": 8.041378781167493e-06, - "loss": 2.2365, - "step": 481210 - }, - { - "epoch": 0.84, - "learning_rate": 8.040506841240667e-06, - "loss": 2.2365, - "step": 481220 - }, - { - "epoch": 0.84, - "learning_rate": 8.039634901313839e-06, - "loss": 2.2912, - "step": 481230 - }, - { - "epoch": 0.84, - "learning_rate": 8.038762961387013e-06, - "loss": 2.3764, - "step": 481240 - }, - { - "epoch": 0.84, - "learning_rate": 8.037891021460185e-06, - "loss": 2.3605, - "step": 481250 - }, - { - "epoch": 0.84, - "learning_rate": 8.037019081533358e-06, - "loss": 2.3166, - "step": 481260 - }, - { - "epoch": 0.84, - "learning_rate": 8.036147141606532e-06, - "loss": 2.1232, - "step": 481270 - }, - { - "epoch": 0.84, - "learning_rate": 8.035275201679706e-06, - "loss": 2.2318, - "step": 481280 - }, - { - "epoch": 0.84, - "learning_rate": 8.03440326175288e-06, - "loss": 2.3441, - "step": 481290 - }, - { - "epoch": 0.84, - "learning_rate": 8.033531321826052e-06, - "loss": 2.2046, - "step": 481300 - }, - { - "epoch": 0.84, - "learning_rate": 8.032659381899226e-06, - "loss": 2.367, - "step": 481310 - }, - { - "epoch": 0.84, - "learning_rate": 8.031787441972398e-06, - "loss": 2.3114, - "step": 481320 - }, - { - "epoch": 0.84, - "learning_rate": 8.030915502045571e-06, - "loss": 2.3023, - "step": 481330 - }, - { - "epoch": 0.84, - "learning_rate": 8.030043562118743e-06, - "loss": 2.4063, - "step": 481340 - }, - { - "epoch": 0.84, - "learning_rate": 8.029171622191917e-06, - "loss": 2.2693, - "step": 481350 - }, - { - "epoch": 0.84, - "learning_rate": 8.028299682265091e-06, - "loss": 2.2747, - "step": 481360 - }, - { - "epoch": 0.84, - "learning_rate": 8.027427742338265e-06, - "loss": 2.2194, - "step": 481370 - }, - { - "epoch": 0.84, - "learning_rate": 8.026555802411437e-06, - "loss": 2.2243, - "step": 481380 - }, - { - "epoch": 0.84, - "learning_rate": 8.02568386248461e-06, - "loss": 2.1601, - "step": 481390 - }, - { - "epoch": 0.84, - "learning_rate": 8.024811922557784e-06, - "loss": 2.2541, - "step": 481400 - }, - { - "epoch": 0.84, - "learning_rate": 8.023939982630956e-06, - "loss": 2.2709, - "step": 481410 - }, - { - "epoch": 0.84, - "learning_rate": 8.02306804270413e-06, - "loss": 2.3189, - "step": 481420 - }, - { - "epoch": 0.84, - "learning_rate": 8.022196102777304e-06, - "loss": 2.2071, - "step": 481430 - }, - { - "epoch": 0.84, - "learning_rate": 8.021324162850478e-06, - "loss": 2.2273, - "step": 481440 - }, - { - "epoch": 0.84, - "learning_rate": 8.02045222292365e-06, - "loss": 2.2075, - "step": 481450 - }, - { - "epoch": 0.84, - "learning_rate": 8.019580282996824e-06, - "loss": 2.2585, - "step": 481460 - }, - { - "epoch": 0.84, - "learning_rate": 8.018708343069996e-06, - "loss": 2.3204, - "step": 481470 - }, - { - "epoch": 0.84, - "learning_rate": 8.01783640314317e-06, - "loss": 2.2644, - "step": 481480 - }, - { - "epoch": 0.84, - "learning_rate": 8.016964463216342e-06, - "loss": 2.3325, - "step": 481490 - }, - { - "epoch": 0.84, - "learning_rate": 8.016092523289515e-06, - "loss": 2.2745, - "step": 481500 - }, - { - "epoch": 0.84, - "learning_rate": 8.015220583362689e-06, - "loss": 2.2637, - "step": 481510 - }, - { - "epoch": 0.84, - "learning_rate": 8.014348643435863e-06, - "loss": 2.2673, - "step": 481520 - }, - { - "epoch": 0.84, - "learning_rate": 8.013476703509037e-06, - "loss": 2.246, - "step": 481530 - }, - { - "epoch": 0.84, - "learning_rate": 8.012604763582209e-06, - "loss": 2.2795, - "step": 481540 - }, - { - "epoch": 0.84, - "learning_rate": 8.011732823655382e-06, - "loss": 2.378, - "step": 481550 - }, - { - "epoch": 0.84, - "learning_rate": 8.010860883728555e-06, - "loss": 2.2295, - "step": 481560 - }, - { - "epoch": 0.84, - "learning_rate": 8.009988943801728e-06, - "loss": 2.2412, - "step": 481570 - }, - { - "epoch": 0.84, - "learning_rate": 8.0091170038749e-06, - "loss": 2.2282, - "step": 481580 - }, - { - "epoch": 0.84, - "learning_rate": 8.008245063948074e-06, - "loss": 2.1999, - "step": 481590 - }, - { - "epoch": 0.84, - "learning_rate": 8.007373124021248e-06, - "loss": 2.3233, - "step": 481600 - }, - { - "epoch": 0.84, - "learning_rate": 8.006501184094422e-06, - "loss": 2.3583, - "step": 481610 - }, - { - "epoch": 0.84, - "learning_rate": 8.005629244167594e-06, - "loss": 2.2688, - "step": 481620 - }, - { - "epoch": 0.84, - "learning_rate": 8.004757304240768e-06, - "loss": 2.3588, - "step": 481630 - }, - { - "epoch": 0.84, - "learning_rate": 8.00388536431394e-06, - "loss": 2.2733, - "step": 481640 - }, - { - "epoch": 0.84, - "learning_rate": 8.003013424387113e-06, - "loss": 2.2679, - "step": 481650 - }, - { - "epoch": 0.84, - "learning_rate": 8.002141484460287e-06, - "loss": 2.2973, - "step": 481660 - }, - { - "epoch": 0.84, - "learning_rate": 8.001269544533461e-06, - "loss": 2.2765, - "step": 481670 - }, - { - "epoch": 0.84, - "learning_rate": 8.000397604606635e-06, - "loss": 2.2661, - "step": 481680 - }, - { - "epoch": 0.84, - "learning_rate": 7.999525664679807e-06, - "loss": 2.2016, - "step": 481690 - }, - { - "epoch": 0.84, - "learning_rate": 7.99865372475298e-06, - "loss": 2.2232, - "step": 481700 - }, - { - "epoch": 0.84, - "learning_rate": 7.997781784826153e-06, - "loss": 2.4183, - "step": 481710 - }, - { - "epoch": 0.84, - "learning_rate": 7.996909844899326e-06, - "loss": 2.3699, - "step": 481720 - }, - { - "epoch": 0.84, - "learning_rate": 7.996037904972498e-06, - "loss": 2.3149, - "step": 481730 - }, - { - "epoch": 0.84, - "learning_rate": 7.995165965045672e-06, - "loss": 2.3297, - "step": 481740 - }, - { - "epoch": 0.84, - "learning_rate": 7.994294025118846e-06, - "loss": 2.3828, - "step": 481750 - }, - { - "epoch": 0.84, - "learning_rate": 7.99342208519202e-06, - "loss": 2.2527, - "step": 481760 - }, - { - "epoch": 0.84, - "learning_rate": 7.992550145265192e-06, - "loss": 2.2882, - "step": 481770 - }, - { - "epoch": 0.84, - "learning_rate": 7.991678205338366e-06, - "loss": 2.2035, - "step": 481780 - }, - { - "epoch": 0.84, - "learning_rate": 7.99080626541154e-06, - "loss": 2.3197, - "step": 481790 - }, - { - "epoch": 0.84, - "learning_rate": 7.989934325484711e-06, - "loss": 2.471, - "step": 481800 - }, - { - "epoch": 0.84, - "learning_rate": 7.989062385557885e-06, - "loss": 2.3108, - "step": 481810 - }, - { - "epoch": 0.84, - "learning_rate": 7.988190445631057e-06, - "loss": 2.1842, - "step": 481820 - }, - { - "epoch": 0.84, - "learning_rate": 7.987318505704231e-06, - "loss": 2.1747, - "step": 481830 - }, - { - "epoch": 0.84, - "learning_rate": 7.986446565777405e-06, - "loss": 2.3858, - "step": 481840 - }, - { - "epoch": 0.84, - "learning_rate": 7.985574625850579e-06, - "loss": 2.1945, - "step": 481850 - }, - { - "epoch": 0.84, - "learning_rate": 7.98470268592375e-06, - "loss": 2.3256, - "step": 481860 - }, - { - "epoch": 0.84, - "learning_rate": 7.983830745996924e-06, - "loss": 2.4069, - "step": 481870 - }, - { - "epoch": 0.84, - "learning_rate": 7.982958806070097e-06, - "loss": 2.3141, - "step": 481880 - }, - { - "epoch": 0.84, - "learning_rate": 7.98208686614327e-06, - "loss": 2.2631, - "step": 481890 - }, - { - "epoch": 0.84, - "learning_rate": 7.981214926216442e-06, - "loss": 2.2239, - "step": 481900 - }, - { - "epoch": 0.84, - "learning_rate": 7.980342986289618e-06, - "loss": 2.2283, - "step": 481910 - }, - { - "epoch": 0.84, - "learning_rate": 7.979471046362792e-06, - "loss": 2.1656, - "step": 481920 - }, - { - "epoch": 0.84, - "learning_rate": 7.978599106435964e-06, - "loss": 2.0981, - "step": 481930 - }, - { - "epoch": 0.84, - "learning_rate": 7.977727166509137e-06, - "loss": 2.2437, - "step": 481940 - }, - { - "epoch": 0.84, - "learning_rate": 7.97685522658231e-06, - "loss": 2.2785, - "step": 481950 - }, - { - "epoch": 0.84, - "learning_rate": 7.975983286655483e-06, - "loss": 2.2361, - "step": 481960 - }, - { - "epoch": 0.84, - "learning_rate": 7.975111346728655e-06, - "loss": 2.2487, - "step": 481970 - }, - { - "epoch": 0.84, - "learning_rate": 7.97423940680183e-06, - "loss": 2.182, - "step": 481980 - }, - { - "epoch": 0.84, - "learning_rate": 7.973367466875003e-06, - "loss": 2.3306, - "step": 481990 - }, - { - "epoch": 0.84, - "learning_rate": 7.972495526948177e-06, - "loss": 2.2524, - "step": 482000 - }, - { - "epoch": 0.84, - "learning_rate": 7.971623587021349e-06, - "loss": 2.2885, - "step": 482010 - }, - { - "epoch": 0.84, - "learning_rate": 7.970751647094523e-06, - "loss": 2.3216, - "step": 482020 - }, - { - "epoch": 0.84, - "learning_rate": 7.969879707167695e-06, - "loss": 2.248, - "step": 482030 - }, - { - "epoch": 0.84, - "learning_rate": 7.969007767240868e-06, - "loss": 2.2902, - "step": 482040 - }, - { - "epoch": 0.84, - "learning_rate": 7.96813582731404e-06, - "loss": 2.2923, - "step": 482050 - }, - { - "epoch": 0.84, - "learning_rate": 7.967263887387214e-06, - "loss": 2.3319, - "step": 482060 - }, - { - "epoch": 0.84, - "learning_rate": 7.966391947460388e-06, - "loss": 2.296, - "step": 482070 - }, - { - "epoch": 0.84, - "learning_rate": 7.965520007533562e-06, - "loss": 2.2802, - "step": 482080 - }, - { - "epoch": 0.84, - "learning_rate": 7.964648067606736e-06, - "loss": 2.2231, - "step": 482090 - }, - { - "epoch": 0.84, - "learning_rate": 7.963776127679908e-06, - "loss": 2.2073, - "step": 482100 - }, - { - "epoch": 0.84, - "learning_rate": 7.962904187753081e-06, - "loss": 2.2766, - "step": 482110 - }, - { - "epoch": 0.84, - "learning_rate": 7.962032247826253e-06, - "loss": 2.2343, - "step": 482120 - }, - { - "epoch": 0.84, - "learning_rate": 7.961160307899427e-06, - "loss": 2.2984, - "step": 482130 - }, - { - "epoch": 0.84, - "learning_rate": 7.9602883679726e-06, - "loss": 2.2662, - "step": 482140 - }, - { - "epoch": 0.84, - "learning_rate": 7.959416428045773e-06, - "loss": 2.2766, - "step": 482150 - }, - { - "epoch": 0.84, - "learning_rate": 7.958544488118947e-06, - "loss": 2.344, - "step": 482160 - }, - { - "epoch": 0.84, - "learning_rate": 7.95767254819212e-06, - "loss": 2.2194, - "step": 482170 - }, - { - "epoch": 0.84, - "learning_rate": 7.956800608265293e-06, - "loss": 2.433, - "step": 482180 - }, - { - "epoch": 0.84, - "learning_rate": 7.955928668338466e-06, - "loss": 2.2975, - "step": 482190 - }, - { - "epoch": 0.84, - "learning_rate": 7.95505672841164e-06, - "loss": 2.2771, - "step": 482200 - }, - { - "epoch": 0.84, - "learning_rate": 7.954184788484812e-06, - "loss": 2.3416, - "step": 482210 - }, - { - "epoch": 0.84, - "learning_rate": 7.953312848557986e-06, - "loss": 2.2482, - "step": 482220 - }, - { - "epoch": 0.84, - "learning_rate": 7.95244090863116e-06, - "loss": 2.0661, - "step": 482230 - }, - { - "epoch": 0.84, - "learning_rate": 7.951568968704334e-06, - "loss": 2.2038, - "step": 482240 - }, - { - "epoch": 0.84, - "learning_rate": 7.950697028777506e-06, - "loss": 2.1592, - "step": 482250 - }, - { - "epoch": 0.84, - "learning_rate": 7.94982508885068e-06, - "loss": 2.2229, - "step": 482260 - }, - { - "epoch": 0.84, - "learning_rate": 7.948953148923852e-06, - "loss": 2.3125, - "step": 482270 - }, - { - "epoch": 0.84, - "learning_rate": 7.948081208997025e-06, - "loss": 2.2692, - "step": 482280 - }, - { - "epoch": 0.84, - "learning_rate": 7.947209269070197e-06, - "loss": 2.1957, - "step": 482290 - }, - { - "epoch": 0.84, - "learning_rate": 7.946337329143371e-06, - "loss": 2.3325, - "step": 482300 - }, - { - "epoch": 0.84, - "learning_rate": 7.945465389216545e-06, - "loss": 2.2306, - "step": 482310 - }, - { - "epoch": 0.84, - "learning_rate": 7.944593449289719e-06, - "loss": 2.3139, - "step": 482320 - }, - { - "epoch": 0.84, - "learning_rate": 7.943721509362892e-06, - "loss": 2.2754, - "step": 482330 - }, - { - "epoch": 0.84, - "learning_rate": 7.942849569436065e-06, - "loss": 2.3058, - "step": 482340 - }, - { - "epoch": 0.84, - "learning_rate": 7.941977629509238e-06, - "loss": 2.2409, - "step": 482350 - }, - { - "epoch": 0.84, - "learning_rate": 7.94110568958241e-06, - "loss": 2.2294, - "step": 482360 - }, - { - "epoch": 0.84, - "learning_rate": 7.940233749655584e-06, - "loss": 2.478, - "step": 482370 - }, - { - "epoch": 0.84, - "learning_rate": 7.939361809728756e-06, - "loss": 2.2894, - "step": 482380 - }, - { - "epoch": 0.84, - "learning_rate": 7.93848986980193e-06, - "loss": 2.2221, - "step": 482390 - }, - { - "epoch": 0.84, - "learning_rate": 7.937617929875104e-06, - "loss": 2.2204, - "step": 482400 - }, - { - "epoch": 0.84, - "learning_rate": 7.936745989948278e-06, - "loss": 2.4318, - "step": 482410 - }, - { - "epoch": 0.84, - "learning_rate": 7.93587405002145e-06, - "loss": 2.1651, - "step": 482420 - }, - { - "epoch": 0.84, - "learning_rate": 7.935002110094623e-06, - "loss": 2.2457, - "step": 482430 - }, - { - "epoch": 0.84, - "learning_rate": 7.934130170167795e-06, - "loss": 2.1742, - "step": 482440 - }, - { - "epoch": 0.84, - "learning_rate": 7.93325823024097e-06, - "loss": 2.3201, - "step": 482450 - }, - { - "epoch": 0.84, - "learning_rate": 7.932386290314143e-06, - "loss": 2.2146, - "step": 482460 - }, - { - "epoch": 0.84, - "learning_rate": 7.931514350387317e-06, - "loss": 2.4478, - "step": 482470 - }, - { - "epoch": 0.84, - "learning_rate": 7.93064241046049e-06, - "loss": 2.2134, - "step": 482480 - }, - { - "epoch": 0.84, - "learning_rate": 7.929770470533663e-06, - "loss": 2.2311, - "step": 482490 - }, - { - "epoch": 0.84, - "learning_rate": 7.928898530606836e-06, - "loss": 2.2453, - "step": 482500 - }, - { - "epoch": 0.84, - "learning_rate": 7.928026590680008e-06, - "loss": 2.2199, - "step": 482510 - }, - { - "epoch": 0.84, - "learning_rate": 7.927154650753182e-06, - "loss": 2.2751, - "step": 482520 - }, - { - "epoch": 0.84, - "learning_rate": 7.926282710826354e-06, - "loss": 2.249, - "step": 482530 - }, - { - "epoch": 0.84, - "learning_rate": 7.925410770899528e-06, - "loss": 2.255, - "step": 482540 - }, - { - "epoch": 0.84, - "learning_rate": 7.924538830972702e-06, - "loss": 2.2289, - "step": 482550 - }, - { - "epoch": 0.84, - "learning_rate": 7.923666891045876e-06, - "loss": 2.2173, - "step": 482560 - }, - { - "epoch": 0.84, - "learning_rate": 7.922794951119048e-06, - "loss": 2.2612, - "step": 482570 - }, - { - "epoch": 0.84, - "learning_rate": 7.921923011192221e-06, - "loss": 2.2585, - "step": 482580 - }, - { - "epoch": 0.84, - "learning_rate": 7.921051071265395e-06, - "loss": 2.2574, - "step": 482590 - }, - { - "epoch": 0.84, - "learning_rate": 7.920179131338567e-06, - "loss": 2.3683, - "step": 482600 - }, - { - "epoch": 0.84, - "learning_rate": 7.919307191411741e-06, - "loss": 2.212, - "step": 482610 - }, - { - "epoch": 0.84, - "learning_rate": 7.918435251484913e-06, - "loss": 2.3168, - "step": 482620 - }, - { - "epoch": 0.84, - "learning_rate": 7.917563311558087e-06, - "loss": 2.3799, - "step": 482630 - }, - { - "epoch": 0.84, - "learning_rate": 7.91669137163126e-06, - "loss": 2.2189, - "step": 482640 - }, - { - "epoch": 0.84, - "learning_rate": 7.915819431704434e-06, - "loss": 2.1916, - "step": 482650 - }, - { - "epoch": 0.84, - "learning_rate": 7.914947491777607e-06, - "loss": 2.3723, - "step": 482660 - }, - { - "epoch": 0.84, - "learning_rate": 7.91407555185078e-06, - "loss": 2.2485, - "step": 482670 - }, - { - "epoch": 0.84, - "learning_rate": 7.913203611923952e-06, - "loss": 2.226, - "step": 482680 - }, - { - "epoch": 0.84, - "learning_rate": 7.912331671997126e-06, - "loss": 2.3607, - "step": 482690 - }, - { - "epoch": 0.84, - "learning_rate": 7.911459732070298e-06, - "loss": 2.244, - "step": 482700 - }, - { - "epoch": 0.84, - "learning_rate": 7.910587792143474e-06, - "loss": 2.2499, - "step": 482710 - }, - { - "epoch": 0.84, - "learning_rate": 7.909715852216647e-06, - "loss": 2.296, - "step": 482720 - }, - { - "epoch": 0.84, - "learning_rate": 7.90884391228982e-06, - "loss": 2.2911, - "step": 482730 - }, - { - "epoch": 0.84, - "learning_rate": 7.907971972362993e-06, - "loss": 2.2646, - "step": 482740 - }, - { - "epoch": 0.84, - "learning_rate": 7.907100032436165e-06, - "loss": 2.2111, - "step": 482750 - }, - { - "epoch": 0.84, - "learning_rate": 7.90622809250934e-06, - "loss": 2.3213, - "step": 482760 - }, - { - "epoch": 0.84, - "learning_rate": 7.905356152582511e-06, - "loss": 2.2885, - "step": 482770 - }, - { - "epoch": 0.84, - "learning_rate": 7.904484212655685e-06, - "loss": 2.2892, - "step": 482780 - }, - { - "epoch": 0.84, - "learning_rate": 7.903612272728859e-06, - "loss": 2.3201, - "step": 482790 - }, - { - "epoch": 0.84, - "learning_rate": 7.902740332802033e-06, - "loss": 2.264, - "step": 482800 - }, - { - "epoch": 0.84, - "learning_rate": 7.901868392875205e-06, - "loss": 2.2464, - "step": 482810 - }, - { - "epoch": 0.84, - "learning_rate": 7.900996452948378e-06, - "loss": 2.2318, - "step": 482820 - }, - { - "epoch": 0.84, - "learning_rate": 7.90012451302155e-06, - "loss": 2.3049, - "step": 482830 - }, - { - "epoch": 0.84, - "learning_rate": 7.899252573094724e-06, - "loss": 2.2443, - "step": 482840 - }, - { - "epoch": 0.84, - "learning_rate": 7.898380633167898e-06, - "loss": 2.4047, - "step": 482850 - }, - { - "epoch": 0.84, - "learning_rate": 7.89750869324107e-06, - "loss": 2.147, - "step": 482860 - }, - { - "epoch": 0.84, - "learning_rate": 7.896636753314244e-06, - "loss": 2.254, - "step": 482870 - }, - { - "epoch": 0.84, - "learning_rate": 7.895764813387418e-06, - "loss": 2.2875, - "step": 482880 - }, - { - "epoch": 0.84, - "learning_rate": 7.894892873460591e-06, - "loss": 2.2995, - "step": 482890 - }, - { - "epoch": 0.84, - "learning_rate": 7.894020933533763e-06, - "loss": 2.2593, - "step": 482900 - }, - { - "epoch": 0.84, - "learning_rate": 7.893148993606937e-06, - "loss": 2.2431, - "step": 482910 - }, - { - "epoch": 0.84, - "learning_rate": 7.89227705368011e-06, - "loss": 2.2541, - "step": 482920 - }, - { - "epoch": 0.84, - "learning_rate": 7.891405113753283e-06, - "loss": 2.2544, - "step": 482930 - }, - { - "epoch": 0.84, - "learning_rate": 7.890533173826455e-06, - "loss": 2.2175, - "step": 482940 - }, - { - "epoch": 0.84, - "learning_rate": 7.88966123389963e-06, - "loss": 2.2598, - "step": 482950 - }, - { - "epoch": 0.84, - "learning_rate": 7.888789293972803e-06, - "loss": 2.3284, - "step": 482960 - }, - { - "epoch": 0.84, - "learning_rate": 7.887917354045976e-06, - "loss": 2.2877, - "step": 482970 - }, - { - "epoch": 0.84, - "learning_rate": 7.887045414119149e-06, - "loss": 2.2957, - "step": 482980 - }, - { - "epoch": 0.84, - "learning_rate": 7.886173474192322e-06, - "loss": 2.264, - "step": 482990 - }, - { - "epoch": 0.84, - "learning_rate": 7.885301534265496e-06, - "loss": 2.2385, - "step": 483000 - }, - { - "epoch": 0.84, - "learning_rate": 7.884429594338668e-06, - "loss": 2.2109, - "step": 483010 - }, - { - "epoch": 0.84, - "learning_rate": 7.883557654411842e-06, - "loss": 2.2989, - "step": 483020 - }, - { - "epoch": 0.84, - "learning_rate": 7.882685714485016e-06, - "loss": 2.3738, - "step": 483030 - }, - { - "epoch": 0.84, - "learning_rate": 7.88181377455819e-06, - "loss": 2.1926, - "step": 483040 - }, - { - "epoch": 0.84, - "learning_rate": 7.880941834631362e-06, - "loss": 2.2615, - "step": 483050 - }, - { - "epoch": 0.84, - "learning_rate": 7.880069894704535e-06, - "loss": 2.2693, - "step": 483060 - }, - { - "epoch": 0.84, - "learning_rate": 7.879197954777707e-06, - "loss": 2.3208, - "step": 483070 - }, - { - "epoch": 0.84, - "learning_rate": 7.878326014850881e-06, - "loss": 2.1845, - "step": 483080 - }, - { - "epoch": 0.84, - "learning_rate": 7.877454074924053e-06, - "loss": 2.1984, - "step": 483090 - }, - { - "epoch": 0.84, - "learning_rate": 7.876582134997227e-06, - "loss": 2.2849, - "step": 483100 - }, - { - "epoch": 0.84, - "learning_rate": 7.8757101950704e-06, - "loss": 2.3199, - "step": 483110 - }, - { - "epoch": 0.84, - "learning_rate": 7.874838255143575e-06, - "loss": 2.2457, - "step": 483120 - }, - { - "epoch": 0.84, - "learning_rate": 7.873966315216748e-06, - "loss": 2.1525, - "step": 483130 - }, - { - "epoch": 0.84, - "learning_rate": 7.87309437528992e-06, - "loss": 2.272, - "step": 483140 - }, - { - "epoch": 0.84, - "learning_rate": 7.872222435363094e-06, - "loss": 2.2595, - "step": 483150 - }, - { - "epoch": 0.84, - "learning_rate": 7.871350495436266e-06, - "loss": 2.3661, - "step": 483160 - }, - { - "epoch": 0.84, - "learning_rate": 7.87047855550944e-06, - "loss": 2.2588, - "step": 483170 - }, - { - "epoch": 0.84, - "learning_rate": 7.869606615582612e-06, - "loss": 2.2744, - "step": 483180 - }, - { - "epoch": 0.84, - "learning_rate": 7.868734675655786e-06, - "loss": 2.3081, - "step": 483190 - }, - { - "epoch": 0.84, - "learning_rate": 7.86786273572896e-06, - "loss": 2.2567, - "step": 483200 - }, - { - "epoch": 0.84, - "learning_rate": 7.866990795802133e-06, - "loss": 2.202, - "step": 483210 - }, - { - "epoch": 0.84, - "learning_rate": 7.866118855875305e-06, - "loss": 2.2736, - "step": 483220 - }, - { - "epoch": 0.84, - "learning_rate": 7.86524691594848e-06, - "loss": 2.3138, - "step": 483230 - }, - { - "epoch": 0.84, - "learning_rate": 7.864374976021651e-06, - "loss": 2.3499, - "step": 483240 - }, - { - "epoch": 0.84, - "learning_rate": 7.863503036094825e-06, - "loss": 2.2265, - "step": 483250 - }, - { - "epoch": 0.84, - "learning_rate": 7.862631096167999e-06, - "loss": 2.3471, - "step": 483260 - }, - { - "epoch": 0.84, - "learning_rate": 7.861759156241173e-06, - "loss": 2.2015, - "step": 483270 - }, - { - "epoch": 0.84, - "learning_rate": 7.860887216314346e-06, - "loss": 2.2773, - "step": 483280 - }, - { - "epoch": 0.84, - "learning_rate": 7.860015276387518e-06, - "loss": 2.2228, - "step": 483290 - }, - { - "epoch": 0.84, - "learning_rate": 7.859143336460692e-06, - "loss": 2.1926, - "step": 483300 - }, - { - "epoch": 0.84, - "learning_rate": 7.858271396533864e-06, - "loss": 2.114, - "step": 483310 - }, - { - "epoch": 0.84, - "learning_rate": 7.857399456607038e-06, - "loss": 2.2676, - "step": 483320 - }, - { - "epoch": 0.84, - "learning_rate": 7.85652751668021e-06, - "loss": 2.2615, - "step": 483330 - }, - { - "epoch": 0.84, - "learning_rate": 7.855655576753384e-06, - "loss": 2.2116, - "step": 483340 - }, - { - "epoch": 0.84, - "learning_rate": 7.854783636826558e-06, - "loss": 2.2735, - "step": 483350 - }, - { - "epoch": 0.84, - "learning_rate": 7.853911696899731e-06, - "loss": 2.2699, - "step": 483360 - }, - { - "epoch": 0.84, - "learning_rate": 7.853039756972904e-06, - "loss": 2.2821, - "step": 483370 - }, - { - "epoch": 0.84, - "learning_rate": 7.852167817046077e-06, - "loss": 2.2151, - "step": 483380 - }, - { - "epoch": 0.84, - "learning_rate": 7.851295877119251e-06, - "loss": 2.2441, - "step": 483390 - }, - { - "epoch": 0.84, - "learning_rate": 7.850423937192423e-06, - "loss": 2.2649, - "step": 483400 - }, - { - "epoch": 0.84, - "learning_rate": 7.849551997265597e-06, - "loss": 2.2314, - "step": 483410 - }, - { - "epoch": 0.84, - "learning_rate": 7.848680057338769e-06, - "loss": 2.2964, - "step": 483420 - }, - { - "epoch": 0.84, - "learning_rate": 7.847808117411943e-06, - "loss": 2.2896, - "step": 483430 - }, - { - "epoch": 0.84, - "learning_rate": 7.846936177485117e-06, - "loss": 2.3486, - "step": 483440 - }, - { - "epoch": 0.84, - "learning_rate": 7.84606423755829e-06, - "loss": 2.2638, - "step": 483450 - }, - { - "epoch": 0.84, - "learning_rate": 7.845192297631462e-06, - "loss": 2.2792, - "step": 483460 - }, - { - "epoch": 0.84, - "learning_rate": 7.844320357704636e-06, - "loss": 2.274, - "step": 483470 - }, - { - "epoch": 0.84, - "learning_rate": 7.843448417777808e-06, - "loss": 2.2456, - "step": 483480 - }, - { - "epoch": 0.84, - "learning_rate": 7.842576477850982e-06, - "loss": 2.2642, - "step": 483490 - }, - { - "epoch": 0.84, - "learning_rate": 7.841704537924154e-06, - "loss": 2.2928, - "step": 483500 - }, - { - "epoch": 0.84, - "learning_rate": 7.84083259799733e-06, - "loss": 2.1762, - "step": 483510 - }, - { - "epoch": 0.84, - "learning_rate": 7.839960658070503e-06, - "loss": 2.2726, - "step": 483520 - }, - { - "epoch": 0.84, - "learning_rate": 7.839088718143675e-06, - "loss": 2.3034, - "step": 483530 - }, - { - "epoch": 0.84, - "learning_rate": 7.83821677821685e-06, - "loss": 2.1792, - "step": 483540 - }, - { - "epoch": 0.84, - "learning_rate": 7.837344838290021e-06, - "loss": 2.2649, - "step": 483550 - }, - { - "epoch": 0.84, - "learning_rate": 7.836472898363195e-06, - "loss": 2.2118, - "step": 483560 - }, - { - "epoch": 0.84, - "learning_rate": 7.835600958436367e-06, - "loss": 2.2619, - "step": 483570 - }, - { - "epoch": 0.84, - "learning_rate": 7.834729018509541e-06, - "loss": 2.2363, - "step": 483580 - }, - { - "epoch": 0.84, - "learning_rate": 7.833857078582715e-06, - "loss": 2.2621, - "step": 483590 - }, - { - "epoch": 0.84, - "learning_rate": 7.832985138655888e-06, - "loss": 2.3381, - "step": 483600 - }, - { - "epoch": 0.84, - "learning_rate": 7.83211319872906e-06, - "loss": 2.3934, - "step": 483610 - }, - { - "epoch": 0.84, - "learning_rate": 7.831241258802234e-06, - "loss": 2.1945, - "step": 483620 - }, - { - "epoch": 0.84, - "learning_rate": 7.830369318875406e-06, - "loss": 2.2771, - "step": 483630 - }, - { - "epoch": 0.84, - "learning_rate": 7.82949737894858e-06, - "loss": 2.1999, - "step": 483640 - }, - { - "epoch": 0.84, - "learning_rate": 7.828625439021754e-06, - "loss": 2.2997, - "step": 483650 - }, - { - "epoch": 0.84, - "learning_rate": 7.827753499094926e-06, - "loss": 2.2971, - "step": 483660 - }, - { - "epoch": 0.84, - "learning_rate": 7.8268815591681e-06, - "loss": 2.2908, - "step": 483670 - }, - { - "epoch": 0.84, - "learning_rate": 7.826009619241273e-06, - "loss": 2.1961, - "step": 483680 - }, - { - "epoch": 0.84, - "learning_rate": 7.825137679314447e-06, - "loss": 2.2858, - "step": 483690 - }, - { - "epoch": 0.84, - "learning_rate": 7.82426573938762e-06, - "loss": 2.2763, - "step": 483700 - }, - { - "epoch": 0.84, - "learning_rate": 7.823393799460793e-06, - "loss": 2.0637, - "step": 483710 - }, - { - "epoch": 0.84, - "learning_rate": 7.822521859533965e-06, - "loss": 2.2635, - "step": 483720 - }, - { - "epoch": 0.84, - "learning_rate": 7.821649919607139e-06, - "loss": 2.3286, - "step": 483730 - }, - { - "epoch": 0.84, - "learning_rate": 7.820777979680311e-06, - "loss": 2.2272, - "step": 483740 - }, - { - "epoch": 0.84, - "learning_rate": 7.819906039753486e-06, - "loss": 2.4018, - "step": 483750 - }, - { - "epoch": 0.84, - "learning_rate": 7.819034099826659e-06, - "loss": 2.3264, - "step": 483760 - }, - { - "epoch": 0.84, - "learning_rate": 7.818162159899832e-06, - "loss": 2.2522, - "step": 483770 - }, - { - "epoch": 0.84, - "learning_rate": 7.817290219973004e-06, - "loss": 2.2202, - "step": 483780 - }, - { - "epoch": 0.84, - "learning_rate": 7.816418280046178e-06, - "loss": 2.2429, - "step": 483790 - }, - { - "epoch": 0.84, - "learning_rate": 7.815546340119352e-06, - "loss": 2.269, - "step": 483800 - }, - { - "epoch": 0.84, - "learning_rate": 7.814674400192524e-06, - "loss": 2.3056, - "step": 483810 - }, - { - "epoch": 0.84, - "learning_rate": 7.813802460265698e-06, - "loss": 2.271, - "step": 483820 - }, - { - "epoch": 0.84, - "learning_rate": 7.812930520338872e-06, - "loss": 2.2494, - "step": 483830 - }, - { - "epoch": 0.84, - "learning_rate": 7.812058580412045e-06, - "loss": 2.2365, - "step": 483840 - }, - { - "epoch": 0.84, - "learning_rate": 7.811186640485217e-06, - "loss": 2.2356, - "step": 483850 - }, - { - "epoch": 0.84, - "learning_rate": 7.810314700558391e-06, - "loss": 2.2075, - "step": 483860 - }, - { - "epoch": 0.84, - "learning_rate": 7.809442760631563e-06, - "loss": 2.2118, - "step": 483870 - }, - { - "epoch": 0.84, - "learning_rate": 7.808570820704737e-06, - "loss": 2.2528, - "step": 483880 - }, - { - "epoch": 0.84, - "learning_rate": 7.807698880777909e-06, - "loss": 2.345, - "step": 483890 - }, - { - "epoch": 0.84, - "learning_rate": 7.806826940851083e-06, - "loss": 2.1163, - "step": 483900 - }, - { - "epoch": 0.84, - "learning_rate": 7.805955000924257e-06, - "loss": 2.1868, - "step": 483910 - }, - { - "epoch": 0.84, - "learning_rate": 7.80508306099743e-06, - "loss": 2.2573, - "step": 483920 - }, - { - "epoch": 0.84, - "learning_rate": 7.804211121070604e-06, - "loss": 2.2434, - "step": 483930 - }, - { - "epoch": 0.84, - "learning_rate": 7.803339181143776e-06, - "loss": 2.3736, - "step": 483940 - }, - { - "epoch": 0.84, - "learning_rate": 7.80246724121695e-06, - "loss": 2.2786, - "step": 483950 - }, - { - "epoch": 0.84, - "learning_rate": 7.801595301290122e-06, - "loss": 2.2668, - "step": 483960 - }, - { - "epoch": 0.84, - "learning_rate": 7.800723361363296e-06, - "loss": 2.3071, - "step": 483970 - }, - { - "epoch": 0.84, - "learning_rate": 7.799851421436468e-06, - "loss": 2.3283, - "step": 483980 - }, - { - "epoch": 0.84, - "learning_rate": 7.798979481509643e-06, - "loss": 2.2232, - "step": 483990 - }, - { - "epoch": 0.84, - "learning_rate": 7.798107541582815e-06, - "loss": 2.2561, - "step": 484000 - }, - { - "epoch": 0.84, - "learning_rate": 7.79723560165599e-06, - "loss": 2.3272, - "step": 484010 - }, - { - "epoch": 0.84, - "learning_rate": 7.796363661729161e-06, - "loss": 2.3263, - "step": 484020 - }, - { - "epoch": 0.84, - "learning_rate": 7.795491721802335e-06, - "loss": 2.3731, - "step": 484030 - }, - { - "epoch": 0.84, - "learning_rate": 7.794619781875507e-06, - "loss": 2.2418, - "step": 484040 - }, - { - "epoch": 0.84, - "learning_rate": 7.793747841948681e-06, - "loss": 2.248, - "step": 484050 - }, - { - "epoch": 0.84, - "learning_rate": 7.792875902021855e-06, - "loss": 2.2559, - "step": 484060 - }, - { - "epoch": 0.84, - "learning_rate": 7.792003962095028e-06, - "loss": 2.2633, - "step": 484070 - }, - { - "epoch": 0.84, - "learning_rate": 7.791132022168202e-06, - "loss": 2.3486, - "step": 484080 - }, - { - "epoch": 0.84, - "learning_rate": 7.790260082241374e-06, - "loss": 2.304, - "step": 484090 - }, - { - "epoch": 0.84, - "learning_rate": 7.789388142314548e-06, - "loss": 2.2317, - "step": 484100 - }, - { - "epoch": 0.84, - "learning_rate": 7.78851620238772e-06, - "loss": 2.3637, - "step": 484110 - }, - { - "epoch": 0.84, - "learning_rate": 7.787644262460894e-06, - "loss": 2.2878, - "step": 484120 - }, - { - "epoch": 0.84, - "learning_rate": 7.786772322534066e-06, - "loss": 2.3091, - "step": 484130 - }, - { - "epoch": 0.84, - "learning_rate": 7.78590038260724e-06, - "loss": 2.2362, - "step": 484140 - }, - { - "epoch": 0.84, - "learning_rate": 7.785028442680414e-06, - "loss": 2.2733, - "step": 484150 - }, - { - "epoch": 0.84, - "learning_rate": 7.784156502753587e-06, - "loss": 2.3058, - "step": 484160 - }, - { - "epoch": 0.84, - "learning_rate": 7.78328456282676e-06, - "loss": 2.3175, - "step": 484170 - }, - { - "epoch": 0.84, - "learning_rate": 7.782412622899933e-06, - "loss": 2.3108, - "step": 484180 - }, - { - "epoch": 0.84, - "learning_rate": 7.781540682973107e-06, - "loss": 2.2391, - "step": 484190 - }, - { - "epoch": 0.84, - "learning_rate": 7.780668743046279e-06, - "loss": 2.2223, - "step": 484200 - }, - { - "epoch": 0.84, - "learning_rate": 7.779796803119453e-06, - "loss": 2.2976, - "step": 484210 - }, - { - "epoch": 0.84, - "learning_rate": 7.778924863192625e-06, - "loss": 2.3151, - "step": 484220 - }, - { - "epoch": 0.84, - "learning_rate": 7.778052923265799e-06, - "loss": 2.3548, - "step": 484230 - }, - { - "epoch": 0.84, - "learning_rate": 7.777180983338972e-06, - "loss": 2.3421, - "step": 484240 - }, - { - "epoch": 0.84, - "learning_rate": 7.776309043412146e-06, - "loss": 2.2165, - "step": 484250 - }, - { - "epoch": 0.84, - "learning_rate": 7.775437103485318e-06, - "loss": 2.2888, - "step": 484260 - }, - { - "epoch": 0.84, - "learning_rate": 7.774565163558492e-06, - "loss": 2.2736, - "step": 484270 - }, - { - "epoch": 0.84, - "learning_rate": 7.773693223631664e-06, - "loss": 2.2908, - "step": 484280 - }, - { - "epoch": 0.84, - "learning_rate": 7.772821283704838e-06, - "loss": 2.3298, - "step": 484290 - }, - { - "epoch": 0.84, - "learning_rate": 7.771949343778012e-06, - "loss": 2.2873, - "step": 484300 - }, - { - "epoch": 0.84, - "learning_rate": 7.771077403851185e-06, - "loss": 2.3299, - "step": 484310 - }, - { - "epoch": 0.84, - "learning_rate": 7.77020546392436e-06, - "loss": 2.2875, - "step": 484320 - }, - { - "epoch": 0.84, - "learning_rate": 7.769333523997531e-06, - "loss": 2.32, - "step": 484330 - }, - { - "epoch": 0.84, - "learning_rate": 7.768461584070705e-06, - "loss": 2.2955, - "step": 484340 - }, - { - "epoch": 0.84, - "learning_rate": 7.767589644143877e-06, - "loss": 2.3086, - "step": 484350 - }, - { - "epoch": 0.84, - "learning_rate": 7.766717704217051e-06, - "loss": 2.3181, - "step": 484360 - }, - { - "epoch": 0.84, - "learning_rate": 7.765845764290223e-06, - "loss": 2.323, - "step": 484370 - }, - { - "epoch": 0.84, - "learning_rate": 7.764973824363397e-06, - "loss": 2.2557, - "step": 484380 - }, - { - "epoch": 0.84, - "learning_rate": 7.76410188443657e-06, - "loss": 2.2539, - "step": 484390 - }, - { - "epoch": 0.84, - "learning_rate": 7.763229944509744e-06, - "loss": 2.2526, - "step": 484400 - }, - { - "epoch": 0.84, - "learning_rate": 7.762358004582916e-06, - "loss": 2.4283, - "step": 484410 - }, - { - "epoch": 0.84, - "learning_rate": 7.76148606465609e-06, - "loss": 2.3352, - "step": 484420 - }, - { - "epoch": 0.84, - "learning_rate": 7.760614124729262e-06, - "loss": 2.2371, - "step": 484430 - }, - { - "epoch": 0.84, - "learning_rate": 7.759742184802436e-06, - "loss": 2.2171, - "step": 484440 - }, - { - "epoch": 0.84, - "learning_rate": 7.75887024487561e-06, - "loss": 2.2623, - "step": 484450 - }, - { - "epoch": 0.84, - "learning_rate": 7.757998304948782e-06, - "loss": 2.2231, - "step": 484460 - }, - { - "epoch": 0.84, - "learning_rate": 7.757126365021956e-06, - "loss": 2.2643, - "step": 484470 - }, - { - "epoch": 0.84, - "learning_rate": 7.75625442509513e-06, - "loss": 2.268, - "step": 484480 - }, - { - "epoch": 0.84, - "learning_rate": 7.755382485168303e-06, - "loss": 2.2968, - "step": 484490 - }, - { - "epoch": 0.84, - "learning_rate": 7.754510545241475e-06, - "loss": 2.3126, - "step": 484500 - }, - { - "epoch": 0.84, - "learning_rate": 7.753638605314649e-06, - "loss": 2.334, - "step": 484510 - }, - { - "epoch": 0.84, - "learning_rate": 7.752766665387821e-06, - "loss": 2.2026, - "step": 484520 - }, - { - "epoch": 0.84, - "learning_rate": 7.751894725460995e-06, - "loss": 2.249, - "step": 484530 - }, - { - "epoch": 0.84, - "learning_rate": 7.751022785534167e-06, - "loss": 2.3138, - "step": 484540 - }, - { - "epoch": 0.84, - "learning_rate": 7.750150845607342e-06, - "loss": 2.2811, - "step": 484550 - }, - { - "epoch": 0.85, - "learning_rate": 7.749278905680514e-06, - "loss": 2.3089, - "step": 484560 - }, - { - "epoch": 0.85, - "learning_rate": 7.748406965753688e-06, - "loss": 2.3342, - "step": 484570 - }, - { - "epoch": 0.85, - "learning_rate": 7.747535025826862e-06, - "loss": 2.2926, - "step": 484580 - }, - { - "epoch": 0.85, - "learning_rate": 7.746663085900034e-06, - "loss": 2.3253, - "step": 484590 - }, - { - "epoch": 0.85, - "learning_rate": 7.745791145973208e-06, - "loss": 2.3187, - "step": 484600 - }, - { - "epoch": 0.85, - "learning_rate": 7.74491920604638e-06, - "loss": 2.2676, - "step": 484610 - }, - { - "epoch": 0.85, - "learning_rate": 7.744047266119554e-06, - "loss": 2.1997, - "step": 484620 - }, - { - "epoch": 0.85, - "learning_rate": 7.743175326192727e-06, - "loss": 2.3419, - "step": 484630 - }, - { - "epoch": 0.85, - "learning_rate": 7.742303386265901e-06, - "loss": 2.393, - "step": 484640 - }, - { - "epoch": 0.85, - "learning_rate": 7.741431446339073e-06, - "loss": 2.4141, - "step": 484650 - }, - { - "epoch": 0.85, - "learning_rate": 7.740559506412247e-06, - "loss": 2.2358, - "step": 484660 - }, - { - "epoch": 0.85, - "learning_rate": 7.739687566485419e-06, - "loss": 2.2349, - "step": 484670 - }, - { - "epoch": 0.85, - "learning_rate": 7.738815626558593e-06, - "loss": 2.1731, - "step": 484680 - }, - { - "epoch": 0.85, - "learning_rate": 7.737943686631765e-06, - "loss": 2.2725, - "step": 484690 - }, - { - "epoch": 0.85, - "learning_rate": 7.737071746704939e-06, - "loss": 2.1843, - "step": 484700 - }, - { - "epoch": 0.85, - "learning_rate": 7.736199806778112e-06, - "loss": 2.2665, - "step": 484710 - }, - { - "epoch": 0.85, - "learning_rate": 7.735327866851286e-06, - "loss": 2.2645, - "step": 484720 - }, - { - "epoch": 0.85, - "learning_rate": 7.73445592692446e-06, - "loss": 2.3645, - "step": 484730 - }, - { - "epoch": 0.85, - "learning_rate": 7.733583986997632e-06, - "loss": 2.358, - "step": 484740 - }, - { - "epoch": 0.85, - "learning_rate": 7.732712047070806e-06, - "loss": 2.2633, - "step": 484750 - }, - { - "epoch": 0.85, - "learning_rate": 7.731840107143978e-06, - "loss": 2.3653, - "step": 484760 - }, - { - "epoch": 0.85, - "learning_rate": 7.730968167217152e-06, - "loss": 2.2654, - "step": 484770 - }, - { - "epoch": 0.85, - "learning_rate": 7.730096227290324e-06, - "loss": 2.2933, - "step": 484780 - }, - { - "epoch": 0.85, - "learning_rate": 7.7292242873635e-06, - "loss": 2.1925, - "step": 484790 - }, - { - "epoch": 0.85, - "learning_rate": 7.728352347436671e-06, - "loss": 2.3759, - "step": 484800 - }, - { - "epoch": 0.85, - "learning_rate": 7.727480407509845e-06, - "loss": 2.3295, - "step": 484810 - }, - { - "epoch": 0.85, - "learning_rate": 7.726608467583017e-06, - "loss": 2.3277, - "step": 484820 - }, - { - "epoch": 0.85, - "learning_rate": 7.725736527656191e-06, - "loss": 2.2654, - "step": 484830 - }, - { - "epoch": 0.85, - "learning_rate": 7.724864587729363e-06, - "loss": 2.1662, - "step": 484840 - }, - { - "epoch": 0.85, - "learning_rate": 7.723992647802537e-06, - "loss": 2.2701, - "step": 484850 - }, - { - "epoch": 0.85, - "learning_rate": 7.72312070787571e-06, - "loss": 2.2491, - "step": 484860 - }, - { - "epoch": 0.85, - "learning_rate": 7.722248767948884e-06, - "loss": 2.4304, - "step": 484870 - }, - { - "epoch": 0.85, - "learning_rate": 7.721376828022058e-06, - "loss": 2.1588, - "step": 484880 - }, - { - "epoch": 0.85, - "learning_rate": 7.72050488809523e-06, - "loss": 2.3052, - "step": 484890 - }, - { - "epoch": 0.85, - "learning_rate": 7.719632948168404e-06, - "loss": 2.2529, - "step": 484900 - }, - { - "epoch": 0.85, - "learning_rate": 7.718761008241576e-06, - "loss": 2.3276, - "step": 484910 - }, - { - "epoch": 0.85, - "learning_rate": 7.71788906831475e-06, - "loss": 2.3165, - "step": 484920 - }, - { - "epoch": 0.85, - "learning_rate": 7.717017128387922e-06, - "loss": 2.26, - "step": 484930 - }, - { - "epoch": 0.85, - "learning_rate": 7.716145188461096e-06, - "loss": 2.1396, - "step": 484940 - }, - { - "epoch": 0.85, - "learning_rate": 7.71527324853427e-06, - "loss": 2.1313, - "step": 484950 - }, - { - "epoch": 0.85, - "learning_rate": 7.714401308607443e-06, - "loss": 2.2277, - "step": 484960 - }, - { - "epoch": 0.85, - "learning_rate": 7.713529368680615e-06, - "loss": 2.1621, - "step": 484970 - }, - { - "epoch": 0.85, - "learning_rate": 7.712657428753789e-06, - "loss": 2.2454, - "step": 484980 - }, - { - "epoch": 0.85, - "learning_rate": 7.711785488826963e-06, - "loss": 2.2467, - "step": 484990 - }, - { - "epoch": 0.85, - "learning_rate": 7.710913548900135e-06, - "loss": 2.2044, - "step": 485000 - }, - { - "epoch": 0.85, - "learning_rate": 7.710041608973309e-06, - "loss": 2.2884, - "step": 485010 - }, - { - "epoch": 0.85, - "learning_rate": 7.70916966904648e-06, - "loss": 2.2872, - "step": 485020 - }, - { - "epoch": 0.85, - "learning_rate": 7.708297729119656e-06, - "loss": 2.2723, - "step": 485030 - }, - { - "epoch": 0.85, - "learning_rate": 7.707425789192828e-06, - "loss": 2.3601, - "step": 485040 - }, - { - "epoch": 0.85, - "learning_rate": 7.706553849266002e-06, - "loss": 2.3119, - "step": 485050 - }, - { - "epoch": 0.85, - "learning_rate": 7.705681909339174e-06, - "loss": 2.2233, - "step": 485060 - }, - { - "epoch": 0.85, - "learning_rate": 7.704809969412348e-06, - "loss": 2.3079, - "step": 485070 - }, - { - "epoch": 0.85, - "learning_rate": 7.70393802948552e-06, - "loss": 2.2534, - "step": 485080 - }, - { - "epoch": 0.85, - "learning_rate": 7.703066089558694e-06, - "loss": 2.4119, - "step": 485090 - }, - { - "epoch": 0.85, - "learning_rate": 7.702194149631868e-06, - "loss": 2.2984, - "step": 485100 - }, - { - "epoch": 0.85, - "learning_rate": 7.701322209705041e-06, - "loss": 2.2289, - "step": 485110 - }, - { - "epoch": 0.85, - "learning_rate": 7.700450269778215e-06, - "loss": 2.2811, - "step": 485120 - }, - { - "epoch": 0.85, - "learning_rate": 7.699578329851387e-06, - "loss": 2.306, - "step": 485130 - }, - { - "epoch": 0.85, - "learning_rate": 7.698706389924561e-06, - "loss": 2.326, - "step": 485140 - }, - { - "epoch": 0.85, - "learning_rate": 7.697834449997733e-06, - "loss": 2.3186, - "step": 485150 - }, - { - "epoch": 0.85, - "learning_rate": 7.696962510070907e-06, - "loss": 2.2661, - "step": 485160 - }, - { - "epoch": 0.85, - "learning_rate": 7.696090570144079e-06, - "loss": 2.3287, - "step": 485170 - }, - { - "epoch": 0.85, - "learning_rate": 7.695218630217253e-06, - "loss": 2.24, - "step": 485180 - }, - { - "epoch": 0.85, - "learning_rate": 7.694346690290426e-06, - "loss": 2.3606, - "step": 485190 - }, - { - "epoch": 0.85, - "learning_rate": 7.6934747503636e-06, - "loss": 2.3171, - "step": 485200 - }, - { - "epoch": 0.85, - "learning_rate": 7.692602810436772e-06, - "loss": 2.1413, - "step": 485210 - }, - { - "epoch": 0.85, - "learning_rate": 7.691730870509946e-06, - "loss": 2.3122, - "step": 485220 - }, - { - "epoch": 0.85, - "learning_rate": 7.690858930583118e-06, - "loss": 2.3129, - "step": 485230 - }, - { - "epoch": 0.85, - "learning_rate": 7.689986990656292e-06, - "loss": 2.3033, - "step": 485240 - }, - { - "epoch": 0.85, - "learning_rate": 7.689115050729466e-06, - "loss": 2.3307, - "step": 485250 - }, - { - "epoch": 0.85, - "learning_rate": 7.688243110802638e-06, - "loss": 2.2715, - "step": 485260 - }, - { - "epoch": 0.85, - "learning_rate": 7.687371170875811e-06, - "loss": 2.159, - "step": 485270 - }, - { - "epoch": 0.85, - "learning_rate": 7.686499230948985e-06, - "loss": 2.2846, - "step": 485280 - }, - { - "epoch": 0.85, - "learning_rate": 7.685627291022159e-06, - "loss": 2.2921, - "step": 485290 - }, - { - "epoch": 0.85, - "learning_rate": 7.684755351095331e-06, - "loss": 2.2583, - "step": 485300 - }, - { - "epoch": 0.85, - "learning_rate": 7.683883411168505e-06, - "loss": 2.361, - "step": 485310 - }, - { - "epoch": 0.85, - "learning_rate": 7.683011471241677e-06, - "loss": 2.2551, - "step": 485320 - }, - { - "epoch": 0.85, - "learning_rate": 7.68213953131485e-06, - "loss": 2.2036, - "step": 485330 - }, - { - "epoch": 0.85, - "learning_rate": 7.681267591388024e-06, - "loss": 2.2307, - "step": 485340 - }, - { - "epoch": 0.85, - "learning_rate": 7.680395651461198e-06, - "loss": 2.2709, - "step": 485350 - }, - { - "epoch": 0.85, - "learning_rate": 7.67952371153437e-06, - "loss": 2.2992, - "step": 485360 - }, - { - "epoch": 0.85, - "learning_rate": 7.678651771607544e-06, - "loss": 2.2997, - "step": 485370 - }, - { - "epoch": 0.85, - "learning_rate": 7.677779831680718e-06, - "loss": 2.2777, - "step": 485380 - }, - { - "epoch": 0.85, - "learning_rate": 7.67690789175389e-06, - "loss": 2.3082, - "step": 485390 - }, - { - "epoch": 0.85, - "learning_rate": 7.676035951827064e-06, - "loss": 2.2955, - "step": 485400 - }, - { - "epoch": 0.85, - "learning_rate": 7.675164011900236e-06, - "loss": 2.335, - "step": 485410 - }, - { - "epoch": 0.85, - "learning_rate": 7.67429207197341e-06, - "loss": 2.2998, - "step": 485420 - }, - { - "epoch": 0.85, - "learning_rate": 7.673420132046583e-06, - "loss": 2.1105, - "step": 485430 - }, - { - "epoch": 0.85, - "learning_rate": 7.672548192119757e-06, - "loss": 2.3399, - "step": 485440 - }, - { - "epoch": 0.85, - "learning_rate": 7.671676252192929e-06, - "loss": 2.2472, - "step": 485450 - }, - { - "epoch": 0.85, - "learning_rate": 7.670804312266103e-06, - "loss": 2.3351, - "step": 485460 - }, - { - "epoch": 0.85, - "learning_rate": 7.669932372339275e-06, - "loss": 2.3055, - "step": 485470 - }, - { - "epoch": 0.85, - "learning_rate": 7.669060432412449e-06, - "loss": 2.32, - "step": 485480 - }, - { - "epoch": 0.85, - "learning_rate": 7.66818849248562e-06, - "loss": 2.3373, - "step": 485490 - }, - { - "epoch": 0.85, - "learning_rate": 7.667316552558795e-06, - "loss": 2.2351, - "step": 485500 - }, - { - "epoch": 0.85, - "learning_rate": 7.666444612631968e-06, - "loss": 2.2511, - "step": 485510 - }, - { - "epoch": 0.85, - "learning_rate": 7.665572672705142e-06, - "loss": 2.2039, - "step": 485520 - }, - { - "epoch": 0.85, - "learning_rate": 7.664700732778316e-06, - "loss": 2.3319, - "step": 485530 - }, - { - "epoch": 0.85, - "learning_rate": 7.663828792851488e-06, - "loss": 2.1844, - "step": 485540 - }, - { - "epoch": 0.85, - "learning_rate": 7.662956852924662e-06, - "loss": 2.3083, - "step": 485550 - }, - { - "epoch": 0.85, - "learning_rate": 7.662084912997834e-06, - "loss": 2.3512, - "step": 485560 - }, - { - "epoch": 0.85, - "learning_rate": 7.661212973071008e-06, - "loss": 2.2928, - "step": 485570 - }, - { - "epoch": 0.85, - "learning_rate": 7.66034103314418e-06, - "loss": 2.2668, - "step": 485580 - }, - { - "epoch": 0.85, - "learning_rate": 7.659469093217355e-06, - "loss": 2.3348, - "step": 485590 - }, - { - "epoch": 0.85, - "learning_rate": 7.658597153290527e-06, - "loss": 2.2456, - "step": 485600 - }, - { - "epoch": 0.85, - "learning_rate": 7.657725213363701e-06, - "loss": 2.1811, - "step": 485610 - }, - { - "epoch": 0.85, - "learning_rate": 7.656853273436873e-06, - "loss": 2.2857, - "step": 485620 - }, - { - "epoch": 0.85, - "learning_rate": 7.655981333510047e-06, - "loss": 2.2511, - "step": 485630 - }, - { - "epoch": 0.85, - "learning_rate": 7.655109393583219e-06, - "loss": 2.1977, - "step": 485640 - }, - { - "epoch": 0.85, - "learning_rate": 7.654237453656393e-06, - "loss": 2.2263, - "step": 485650 - }, - { - "epoch": 0.85, - "learning_rate": 7.653365513729566e-06, - "loss": 2.1881, - "step": 485660 - }, - { - "epoch": 0.85, - "learning_rate": 7.65249357380274e-06, - "loss": 2.2875, - "step": 485670 - }, - { - "epoch": 0.85, - "learning_rate": 7.651621633875914e-06, - "loss": 2.2482, - "step": 485680 - }, - { - "epoch": 0.85, - "learning_rate": 7.650749693949086e-06, - "loss": 2.2775, - "step": 485690 - }, - { - "epoch": 0.85, - "learning_rate": 7.64987775402226e-06, - "loss": 2.3486, - "step": 485700 - }, - { - "epoch": 0.85, - "learning_rate": 7.649005814095432e-06, - "loss": 2.2916, - "step": 485710 - }, - { - "epoch": 0.85, - "learning_rate": 7.648133874168606e-06, - "loss": 2.2437, - "step": 485720 - }, - { - "epoch": 0.85, - "learning_rate": 7.647261934241778e-06, - "loss": 2.3511, - "step": 485730 - }, - { - "epoch": 0.85, - "learning_rate": 7.646389994314952e-06, - "loss": 2.1838, - "step": 485740 - }, - { - "epoch": 0.85, - "learning_rate": 7.645518054388125e-06, - "loss": 2.3624, - "step": 485750 - }, - { - "epoch": 0.85, - "learning_rate": 7.644646114461299e-06, - "loss": 2.2629, - "step": 485760 - }, - { - "epoch": 0.85, - "learning_rate": 7.643774174534471e-06, - "loss": 2.305, - "step": 485770 - }, - { - "epoch": 0.85, - "learning_rate": 7.642902234607645e-06, - "loss": 2.1795, - "step": 485780 - }, - { - "epoch": 0.85, - "learning_rate": 7.642030294680819e-06, - "loss": 2.2297, - "step": 485790 - }, - { - "epoch": 0.85, - "learning_rate": 7.64115835475399e-06, - "loss": 2.2627, - "step": 485800 - }, - { - "epoch": 0.85, - "learning_rate": 7.640286414827165e-06, - "loss": 2.364, - "step": 485810 - }, - { - "epoch": 0.85, - "learning_rate": 7.639414474900337e-06, - "loss": 2.1962, - "step": 485820 - }, - { - "epoch": 0.85, - "learning_rate": 7.638542534973512e-06, - "loss": 2.3892, - "step": 485830 - }, - { - "epoch": 0.85, - "learning_rate": 7.637670595046684e-06, - "loss": 2.3058, - "step": 485840 - }, - { - "epoch": 0.85, - "learning_rate": 7.636798655119858e-06, - "loss": 2.3093, - "step": 485850 - }, - { - "epoch": 0.85, - "learning_rate": 7.63592671519303e-06, - "loss": 2.2722, - "step": 485860 - }, - { - "epoch": 0.85, - "learning_rate": 7.635054775266204e-06, - "loss": 2.3481, - "step": 485870 - }, - { - "epoch": 0.85, - "learning_rate": 7.634182835339376e-06, - "loss": 2.2425, - "step": 485880 - }, - { - "epoch": 0.85, - "learning_rate": 7.63331089541255e-06, - "loss": 2.2236, - "step": 485890 - }, - { - "epoch": 0.85, - "learning_rate": 7.632438955485723e-06, - "loss": 2.3177, - "step": 485900 - }, - { - "epoch": 0.85, - "learning_rate": 7.631567015558897e-06, - "loss": 2.3645, - "step": 485910 - }, - { - "epoch": 0.85, - "learning_rate": 7.630695075632071e-06, - "loss": 2.2126, - "step": 485920 - }, - { - "epoch": 0.85, - "learning_rate": 7.629823135705243e-06, - "loss": 2.2845, - "step": 485930 - }, - { - "epoch": 0.85, - "learning_rate": 7.628951195778417e-06, - "loss": 2.2769, - "step": 485940 - }, - { - "epoch": 0.85, - "learning_rate": 7.628079255851589e-06, - "loss": 2.3101, - "step": 485950 - }, - { - "epoch": 0.85, - "learning_rate": 7.627207315924763e-06, - "loss": 2.2356, - "step": 485960 - }, - { - "epoch": 0.85, - "learning_rate": 7.6263353759979355e-06, - "loss": 2.2343, - "step": 485970 - }, - { - "epoch": 0.85, - "learning_rate": 7.625463436071109e-06, - "loss": 2.2893, - "step": 485980 - }, - { - "epoch": 0.85, - "learning_rate": 7.624591496144281e-06, - "loss": 2.3034, - "step": 485990 - }, - { - "epoch": 0.85, - "learning_rate": 7.623719556217455e-06, - "loss": 2.3118, - "step": 486000 - }, - { - "epoch": 0.85, - "learning_rate": 7.622847616290628e-06, - "loss": 2.2785, - "step": 486010 - }, - { - "epoch": 0.85, - "learning_rate": 7.621975676363802e-06, - "loss": 2.3328, - "step": 486020 - }, - { - "epoch": 0.85, - "learning_rate": 7.621103736436974e-06, - "loss": 2.3455, - "step": 486030 - }, - { - "epoch": 0.85, - "learning_rate": 7.620231796510148e-06, - "loss": 2.2331, - "step": 486040 - }, - { - "epoch": 0.85, - "learning_rate": 7.6193598565833214e-06, - "loss": 2.2217, - "step": 486050 - }, - { - "epoch": 0.85, - "learning_rate": 7.618487916656494e-06, - "loss": 2.3461, - "step": 486060 - }, - { - "epoch": 0.85, - "learning_rate": 7.617615976729668e-06, - "loss": 2.3637, - "step": 486070 - }, - { - "epoch": 0.85, - "learning_rate": 7.61674403680284e-06, - "loss": 2.2669, - "step": 486080 - }, - { - "epoch": 0.85, - "learning_rate": 7.615872096876015e-06, - "loss": 2.1995, - "step": 486090 - }, - { - "epoch": 0.85, - "learning_rate": 7.615000156949187e-06, - "loss": 2.2986, - "step": 486100 - }, - { - "epoch": 0.85, - "learning_rate": 7.614128217022361e-06, - "loss": 2.3728, - "step": 486110 - }, - { - "epoch": 0.85, - "learning_rate": 7.613256277095534e-06, - "loss": 2.2571, - "step": 486120 - }, - { - "epoch": 0.85, - "learning_rate": 7.612384337168707e-06, - "loss": 2.4478, - "step": 486130 - }, - { - "epoch": 0.85, - "learning_rate": 7.6115123972418794e-06, - "loss": 2.2601, - "step": 486140 - }, - { - "epoch": 0.85, - "learning_rate": 7.610640457315053e-06, - "loss": 2.3479, - "step": 486150 - }, - { - "epoch": 0.85, - "learning_rate": 7.609768517388226e-06, - "loss": 2.1764, - "step": 486160 - }, - { - "epoch": 0.85, - "learning_rate": 7.6088965774614e-06, - "loss": 2.1565, - "step": 486170 - }, - { - "epoch": 0.85, - "learning_rate": 7.608024637534574e-06, - "loss": 2.1417, - "step": 486180 - }, - { - "epoch": 0.85, - "learning_rate": 7.607152697607746e-06, - "loss": 2.2751, - "step": 486190 - }, - { - "epoch": 0.85, - "learning_rate": 7.6062807576809195e-06, - "loss": 2.1282, - "step": 486200 - }, - { - "epoch": 0.85, - "learning_rate": 7.6054088177540924e-06, - "loss": 2.208, - "step": 486210 - }, - { - "epoch": 0.85, - "learning_rate": 7.604536877827266e-06, - "loss": 2.2577, - "step": 486220 - }, - { - "epoch": 0.85, - "learning_rate": 7.603664937900438e-06, - "loss": 2.26, - "step": 486230 - }, - { - "epoch": 0.85, - "learning_rate": 7.602792997973612e-06, - "loss": 2.4519, - "step": 486240 - }, - { - "epoch": 0.85, - "learning_rate": 7.601921058046785e-06, - "loss": 2.3063, - "step": 486250 - }, - { - "epoch": 0.85, - "learning_rate": 7.601049118119959e-06, - "loss": 2.3331, - "step": 486260 - }, - { - "epoch": 0.85, - "learning_rate": 7.600177178193131e-06, - "loss": 2.3024, - "step": 486270 - }, - { - "epoch": 0.85, - "learning_rate": 7.599305238266305e-06, - "loss": 2.1673, - "step": 486280 - }, - { - "epoch": 0.85, - "learning_rate": 7.5984332983394775e-06, - "loss": 2.2991, - "step": 486290 - }, - { - "epoch": 0.85, - "learning_rate": 7.597561358412651e-06, - "loss": 2.287, - "step": 486300 - }, - { - "epoch": 0.85, - "learning_rate": 7.596689418485825e-06, - "loss": 2.2391, - "step": 486310 - }, - { - "epoch": 0.85, - "learning_rate": 7.595817478558997e-06, - "loss": 2.3477, - "step": 486320 - }, - { - "epoch": 0.85, - "learning_rate": 7.594945538632172e-06, - "loss": 2.2136, - "step": 486330 - }, - { - "epoch": 0.85, - "learning_rate": 7.594073598705344e-06, - "loss": 2.2098, - "step": 486340 - }, - { - "epoch": 0.85, - "learning_rate": 7.593201658778518e-06, - "loss": 2.2896, - "step": 486350 - }, - { - "epoch": 0.85, - "learning_rate": 7.59232971885169e-06, - "loss": 2.3196, - "step": 486360 - }, - { - "epoch": 0.85, - "learning_rate": 7.591457778924864e-06, - "loss": 2.1714, - "step": 486370 - }, - { - "epoch": 0.85, - "learning_rate": 7.590585838998036e-06, - "loss": 2.3018, - "step": 486380 - }, - { - "epoch": 0.85, - "learning_rate": 7.58971389907121e-06, - "loss": 2.3179, - "step": 486390 - }, - { - "epoch": 0.85, - "learning_rate": 7.588841959144383e-06, - "loss": 2.3275, - "step": 486400 - }, - { - "epoch": 0.85, - "learning_rate": 7.587970019217557e-06, - "loss": 2.3279, - "step": 486410 - }, - { - "epoch": 0.85, - "learning_rate": 7.587098079290729e-06, - "loss": 2.3503, - "step": 486420 - }, - { - "epoch": 0.85, - "learning_rate": 7.586226139363903e-06, - "loss": 2.32, - "step": 486430 - }, - { - "epoch": 0.85, - "learning_rate": 7.585354199437076e-06, - "loss": 2.2832, - "step": 486440 - }, - { - "epoch": 0.85, - "learning_rate": 7.584482259510249e-06, - "loss": 2.2844, - "step": 486450 - }, - { - "epoch": 0.85, - "learning_rate": 7.583610319583423e-06, - "loss": 2.1871, - "step": 486460 - }, - { - "epoch": 0.85, - "learning_rate": 7.582738379656595e-06, - "loss": 2.3042, - "step": 486470 - }, - { - "epoch": 0.85, - "learning_rate": 7.581866439729769e-06, - "loss": 2.1921, - "step": 486480 - }, - { - "epoch": 0.85, - "learning_rate": 7.580994499802942e-06, - "loss": 2.2958, - "step": 486490 - }, - { - "epoch": 0.85, - "learning_rate": 7.580122559876116e-06, - "loss": 2.2383, - "step": 486500 - }, - { - "epoch": 0.85, - "learning_rate": 7.579250619949288e-06, - "loss": 2.3124, - "step": 486510 - }, - { - "epoch": 0.85, - "learning_rate": 7.5783786800224615e-06, - "loss": 2.3111, - "step": 486520 - }, - { - "epoch": 0.85, - "learning_rate": 7.5775067400956344e-06, - "loss": 2.2648, - "step": 486530 - }, - { - "epoch": 0.85, - "learning_rate": 7.576634800168808e-06, - "loss": 2.2464, - "step": 486540 - }, - { - "epoch": 0.85, - "learning_rate": 7.57576286024198e-06, - "loss": 2.2251, - "step": 486550 - }, - { - "epoch": 0.85, - "learning_rate": 7.574890920315154e-06, - "loss": 2.2343, - "step": 486560 - }, - { - "epoch": 0.85, - "learning_rate": 7.574018980388327e-06, - "loss": 2.1838, - "step": 486570 - }, - { - "epoch": 0.85, - "learning_rate": 7.573147040461501e-06, - "loss": 2.2262, - "step": 486580 - }, - { - "epoch": 0.85, - "learning_rate": 7.5722751005346745e-06, - "loss": 2.3549, - "step": 486590 - }, - { - "epoch": 0.85, - "learning_rate": 7.571403160607847e-06, - "loss": 2.2804, - "step": 486600 - }, - { - "epoch": 0.85, - "learning_rate": 7.570531220681021e-06, - "loss": 2.2679, - "step": 486610 - }, - { - "epoch": 0.85, - "learning_rate": 7.569659280754193e-06, - "loss": 2.2875, - "step": 486620 - }, - { - "epoch": 0.85, - "learning_rate": 7.568787340827367e-06, - "loss": 2.2383, - "step": 486630 - }, - { - "epoch": 0.85, - "learning_rate": 7.56791540090054e-06, - "loss": 2.2306, - "step": 486640 - }, - { - "epoch": 0.85, - "learning_rate": 7.567043460973714e-06, - "loss": 2.2356, - "step": 486650 - }, - { - "epoch": 0.85, - "learning_rate": 7.566171521046886e-06, - "loss": 2.384, - "step": 486660 - }, - { - "epoch": 0.85, - "learning_rate": 7.56529958112006e-06, - "loss": 2.255, - "step": 486670 - }, - { - "epoch": 0.85, - "learning_rate": 7.5644276411932325e-06, - "loss": 2.1711, - "step": 486680 - }, - { - "epoch": 0.85, - "learning_rate": 7.563555701266406e-06, - "loss": 2.1872, - "step": 486690 - }, - { - "epoch": 0.85, - "learning_rate": 7.562683761339578e-06, - "loss": 2.2562, - "step": 486700 - }, - { - "epoch": 0.85, - "learning_rate": 7.561811821412752e-06, - "loss": 2.2386, - "step": 486710 - }, - { - "epoch": 0.85, - "learning_rate": 7.560939881485926e-06, - "loss": 2.2809, - "step": 486720 - }, - { - "epoch": 0.85, - "learning_rate": 7.560067941559099e-06, - "loss": 2.3796, - "step": 486730 - }, - { - "epoch": 0.85, - "learning_rate": 7.559196001632273e-06, - "loss": 2.2968, - "step": 486740 - }, - { - "epoch": 0.85, - "learning_rate": 7.558324061705445e-06, - "loss": 2.3429, - "step": 486750 - }, - { - "epoch": 0.85, - "learning_rate": 7.5574521217786184e-06, - "loss": 2.3267, - "step": 486760 - }, - { - "epoch": 0.85, - "learning_rate": 7.556580181851791e-06, - "loss": 2.292, - "step": 486770 - }, - { - "epoch": 0.85, - "learning_rate": 7.555708241924965e-06, - "loss": 2.2791, - "step": 486780 - }, - { - "epoch": 0.85, - "learning_rate": 7.554836301998137e-06, - "loss": 2.2913, - "step": 486790 - }, - { - "epoch": 0.85, - "learning_rate": 7.553964362071311e-06, - "loss": 2.3307, - "step": 486800 - }, - { - "epoch": 0.85, - "learning_rate": 7.553092422144484e-06, - "loss": 2.2825, - "step": 486810 - }, - { - "epoch": 0.85, - "learning_rate": 7.552220482217658e-06, - "loss": 2.3192, - "step": 486820 - }, - { - "epoch": 0.85, - "learning_rate": 7.55134854229083e-06, - "loss": 2.2921, - "step": 486830 - }, - { - "epoch": 0.85, - "learning_rate": 7.5504766023640035e-06, - "loss": 2.3547, - "step": 486840 - }, - { - "epoch": 0.85, - "learning_rate": 7.549604662437178e-06, - "loss": 2.1858, - "step": 486850 - }, - { - "epoch": 0.85, - "learning_rate": 7.54873272251035e-06, - "loss": 2.2401, - "step": 486860 - }, - { - "epoch": 0.85, - "learning_rate": 7.547860782583524e-06, - "loss": 2.1303, - "step": 486870 - }, - { - "epoch": 0.85, - "learning_rate": 7.546988842656697e-06, - "loss": 2.2987, - "step": 486880 - }, - { - "epoch": 0.85, - "learning_rate": 7.546116902729871e-06, - "loss": 2.3014, - "step": 486890 - }, - { - "epoch": 0.85, - "learning_rate": 7.545244962803043e-06, - "loss": 2.284, - "step": 486900 - }, - { - "epoch": 0.85, - "learning_rate": 7.5443730228762165e-06, - "loss": 2.313, - "step": 486910 - }, - { - "epoch": 0.85, - "learning_rate": 7.5435010829493894e-06, - "loss": 2.1366, - "step": 486920 - }, - { - "epoch": 0.85, - "learning_rate": 7.542629143022563e-06, - "loss": 2.286, - "step": 486930 - }, - { - "epoch": 0.85, - "learning_rate": 7.541757203095735e-06, - "loss": 2.2323, - "step": 486940 - }, - { - "epoch": 0.85, - "learning_rate": 7.540885263168909e-06, - "loss": 2.2169, - "step": 486950 - }, - { - "epoch": 0.85, - "learning_rate": 7.540013323242082e-06, - "loss": 2.1969, - "step": 486960 - }, - { - "epoch": 0.85, - "learning_rate": 7.539141383315256e-06, - "loss": 2.2009, - "step": 486970 - }, - { - "epoch": 0.85, - "learning_rate": 7.5382694433884295e-06, - "loss": 2.2584, - "step": 486980 - }, - { - "epoch": 0.85, - "learning_rate": 7.537397503461602e-06, - "loss": 2.1687, - "step": 486990 - }, - { - "epoch": 0.85, - "learning_rate": 7.536525563534775e-06, - "loss": 2.2942, - "step": 487000 - }, - { - "epoch": 0.85, - "learning_rate": 7.535653623607948e-06, - "loss": 2.2104, - "step": 487010 - }, - { - "epoch": 0.85, - "learning_rate": 7.534781683681122e-06, - "loss": 2.2686, - "step": 487020 - }, - { - "epoch": 0.85, - "learning_rate": 7.533909743754294e-06, - "loss": 2.427, - "step": 487030 - }, - { - "epoch": 0.85, - "learning_rate": 7.533037803827468e-06, - "loss": 2.2831, - "step": 487040 - }, - { - "epoch": 0.85, - "learning_rate": 7.532165863900641e-06, - "loss": 2.2973, - "step": 487050 - }, - { - "epoch": 0.85, - "learning_rate": 7.531293923973815e-06, - "loss": 2.1598, - "step": 487060 - }, - { - "epoch": 0.85, - "learning_rate": 7.530421984046987e-06, - "loss": 2.1756, - "step": 487070 - }, - { - "epoch": 0.85, - "learning_rate": 7.5295500441201604e-06, - "loss": 2.2231, - "step": 487080 - }, - { - "epoch": 0.85, - "learning_rate": 7.528678104193333e-06, - "loss": 2.3232, - "step": 487090 - }, - { - "epoch": 0.85, - "learning_rate": 7.527806164266507e-06, - "loss": 2.2239, - "step": 487100 - }, - { - "epoch": 0.85, - "learning_rate": 7.526934224339681e-06, - "loss": 2.3334, - "step": 487110 - }, - { - "epoch": 0.85, - "learning_rate": 7.526062284412853e-06, - "loss": 2.2613, - "step": 487120 - }, - { - "epoch": 0.85, - "learning_rate": 7.525190344486028e-06, - "loss": 2.251, - "step": 487130 - }, - { - "epoch": 0.85, - "learning_rate": 7.5243184045592e-06, - "loss": 2.2604, - "step": 487140 - }, - { - "epoch": 0.85, - "learning_rate": 7.5234464646323734e-06, - "loss": 2.3849, - "step": 487150 - }, - { - "epoch": 0.85, - "learning_rate": 7.522574524705546e-06, - "loss": 2.1162, - "step": 487160 - }, - { - "epoch": 0.85, - "learning_rate": 7.52170258477872e-06, - "loss": 2.2948, - "step": 487170 - }, - { - "epoch": 0.85, - "learning_rate": 7.520830644851892e-06, - "loss": 2.3177, - "step": 487180 - }, - { - "epoch": 0.85, - "learning_rate": 7.519958704925066e-06, - "loss": 2.2022, - "step": 487190 - }, - { - "epoch": 0.85, - "learning_rate": 7.519086764998239e-06, - "loss": 2.2748, - "step": 487200 - }, - { - "epoch": 0.85, - "learning_rate": 7.518214825071413e-06, - "loss": 2.256, - "step": 487210 - }, - { - "epoch": 0.85, - "learning_rate": 7.517342885144585e-06, - "loss": 2.2879, - "step": 487220 - }, - { - "epoch": 0.85, - "learning_rate": 7.5164709452177585e-06, - "loss": 2.2262, - "step": 487230 - }, - { - "epoch": 0.85, - "learning_rate": 7.515599005290932e-06, - "loss": 2.2635, - "step": 487240 - }, - { - "epoch": 0.85, - "learning_rate": 7.514727065364105e-06, - "loss": 2.2797, - "step": 487250 - }, - { - "epoch": 0.85, - "learning_rate": 7.513855125437279e-06, - "loss": 2.1437, - "step": 487260 - }, - { - "epoch": 0.85, - "learning_rate": 7.512983185510451e-06, - "loss": 2.3121, - "step": 487270 - }, - { - "epoch": 0.85, - "learning_rate": 7.512111245583625e-06, - "loss": 2.1767, - "step": 487280 - }, - { - "epoch": 0.85, - "learning_rate": 7.511239305656798e-06, - "loss": 2.2782, - "step": 487290 - }, - { - "epoch": 0.85, - "learning_rate": 7.5103673657299715e-06, - "loss": 2.2798, - "step": 487300 - }, - { - "epoch": 0.85, - "learning_rate": 7.509495425803144e-06, - "loss": 2.2335, - "step": 487310 - }, - { - "epoch": 0.85, - "learning_rate": 7.508623485876317e-06, - "loss": 2.3635, - "step": 487320 - }, - { - "epoch": 0.85, - "learning_rate": 7.50775154594949e-06, - "loss": 2.3183, - "step": 487330 - }, - { - "epoch": 0.85, - "learning_rate": 7.506879606022664e-06, - "loss": 2.2326, - "step": 487340 - }, - { - "epoch": 0.85, - "learning_rate": 7.506007666095836e-06, - "loss": 2.2571, - "step": 487350 - }, - { - "epoch": 0.85, - "learning_rate": 7.50513572616901e-06, - "loss": 2.4077, - "step": 487360 - }, - { - "epoch": 0.85, - "learning_rate": 7.504263786242183e-06, - "loss": 2.2621, - "step": 487370 - }, - { - "epoch": 0.85, - "learning_rate": 7.503391846315357e-06, - "loss": 2.2753, - "step": 487380 - }, - { - "epoch": 0.85, - "learning_rate": 7.50251990638853e-06, - "loss": 2.3506, - "step": 487390 - }, - { - "epoch": 0.85, - "learning_rate": 7.501647966461703e-06, - "loss": 2.265, - "step": 487400 - }, - { - "epoch": 0.85, - "learning_rate": 7.500776026534877e-06, - "loss": 2.2268, - "step": 487410 - }, - { - "epoch": 0.85, - "learning_rate": 7.499904086608049e-06, - "loss": 2.3303, - "step": 487420 - }, - { - "epoch": 0.85, - "learning_rate": 7.499032146681223e-06, - "loss": 2.3319, - "step": 487430 - }, - { - "epoch": 0.85, - "learning_rate": 7.498160206754396e-06, - "loss": 2.2101, - "step": 487440 - }, - { - "epoch": 0.85, - "learning_rate": 7.49728826682757e-06, - "loss": 2.3595, - "step": 487450 - }, - { - "epoch": 0.85, - "learning_rate": 7.496416326900742e-06, - "loss": 2.2228, - "step": 487460 - }, - { - "epoch": 0.85, - "learning_rate": 7.4955443869739154e-06, - "loss": 2.2563, - "step": 487470 - }, - { - "epoch": 0.85, - "learning_rate": 7.494672447047088e-06, - "loss": 2.2504, - "step": 487480 - }, - { - "epoch": 0.85, - "learning_rate": 7.493800507120262e-06, - "loss": 2.3041, - "step": 487490 - }, - { - "epoch": 0.85, - "learning_rate": 7.492928567193434e-06, - "loss": 2.3591, - "step": 487500 - }, - { - "epoch": 0.85, - "learning_rate": 7.492056627266608e-06, - "loss": 2.346, - "step": 487510 - }, - { - "epoch": 0.85, - "learning_rate": 7.491184687339782e-06, - "loss": 2.2341, - "step": 487520 - }, - { - "epoch": 0.85, - "learning_rate": 7.490312747412955e-06, - "loss": 2.2425, - "step": 487530 - }, - { - "epoch": 0.85, - "learning_rate": 7.4894408074861284e-06, - "loss": 2.3138, - "step": 487540 - }, - { - "epoch": 0.85, - "learning_rate": 7.4885688675593005e-06, - "loss": 2.3643, - "step": 487550 - }, - { - "epoch": 0.85, - "learning_rate": 7.487696927632474e-06, - "loss": 2.2012, - "step": 487560 - }, - { - "epoch": 0.85, - "learning_rate": 7.486824987705647e-06, - "loss": 2.1722, - "step": 487570 - }, - { - "epoch": 0.85, - "learning_rate": 7.485953047778821e-06, - "loss": 2.2643, - "step": 487580 - }, - { - "epoch": 0.85, - "learning_rate": 7.485081107851993e-06, - "loss": 2.2666, - "step": 487590 - }, - { - "epoch": 0.85, - "learning_rate": 7.484209167925167e-06, - "loss": 2.2925, - "step": 487600 - }, - { - "epoch": 0.85, - "learning_rate": 7.48333722799834e-06, - "loss": 2.3562, - "step": 487610 - }, - { - "epoch": 0.85, - "learning_rate": 7.4824652880715135e-06, - "loss": 2.1808, - "step": 487620 - }, - { - "epoch": 0.85, - "learning_rate": 7.481593348144686e-06, - "loss": 2.1558, - "step": 487630 - }, - { - "epoch": 0.85, - "learning_rate": 7.480721408217859e-06, - "loss": 2.2519, - "step": 487640 - }, - { - "epoch": 0.85, - "learning_rate": 7.479849468291034e-06, - "loss": 2.2337, - "step": 487650 - }, - { - "epoch": 0.85, - "learning_rate": 7.478977528364206e-06, - "loss": 2.2949, - "step": 487660 - }, - { - "epoch": 0.85, - "learning_rate": 7.47810558843738e-06, - "loss": 2.2147, - "step": 487670 - }, - { - "epoch": 0.85, - "learning_rate": 7.477233648510553e-06, - "loss": 2.2189, - "step": 487680 - }, - { - "epoch": 0.85, - "learning_rate": 7.4763617085837265e-06, - "loss": 2.2955, - "step": 487690 - }, - { - "epoch": 0.85, - "learning_rate": 7.475489768656899e-06, - "loss": 2.2588, - "step": 487700 - }, - { - "epoch": 0.85, - "learning_rate": 7.474617828730072e-06, - "loss": 2.2907, - "step": 487710 - }, - { - "epoch": 0.85, - "learning_rate": 7.473745888803245e-06, - "loss": 2.2112, - "step": 487720 - }, - { - "epoch": 0.85, - "learning_rate": 7.472873948876419e-06, - "loss": 2.2777, - "step": 487730 - }, - { - "epoch": 0.85, - "learning_rate": 7.472002008949591e-06, - "loss": 2.1689, - "step": 487740 - }, - { - "epoch": 0.85, - "learning_rate": 7.471130069022765e-06, - "loss": 2.2749, - "step": 487750 - }, - { - "epoch": 0.85, - "learning_rate": 7.470258129095938e-06, - "loss": 2.2954, - "step": 487760 - }, - { - "epoch": 0.85, - "learning_rate": 7.469386189169112e-06, - "loss": 2.3837, - "step": 487770 - }, - { - "epoch": 0.85, - "learning_rate": 7.468514249242285e-06, - "loss": 2.3991, - "step": 487780 - }, - { - "epoch": 0.85, - "learning_rate": 7.4676423093154574e-06, - "loss": 2.2795, - "step": 487790 - }, - { - "epoch": 0.85, - "learning_rate": 7.466770369388631e-06, - "loss": 2.3496, - "step": 487800 - }, - { - "epoch": 0.85, - "learning_rate": 7.465898429461804e-06, - "loss": 2.2487, - "step": 487810 - }, - { - "epoch": 0.85, - "learning_rate": 7.465026489534978e-06, - "loss": 2.2547, - "step": 487820 - }, - { - "epoch": 0.85, - "learning_rate": 7.46415454960815e-06, - "loss": 2.256, - "step": 487830 - }, - { - "epoch": 0.85, - "learning_rate": 7.463282609681324e-06, - "loss": 2.2997, - "step": 487840 - }, - { - "epoch": 0.85, - "learning_rate": 7.462410669754497e-06, - "loss": 2.2889, - "step": 487850 - }, - { - "epoch": 0.85, - "learning_rate": 7.4615387298276704e-06, - "loss": 2.3635, - "step": 487860 - }, - { - "epoch": 0.85, - "learning_rate": 7.4606667899008425e-06, - "loss": 2.3904, - "step": 487870 - }, - { - "epoch": 0.85, - "learning_rate": 7.459794849974016e-06, - "loss": 2.3115, - "step": 487880 - }, - { - "epoch": 0.85, - "learning_rate": 7.458922910047189e-06, - "loss": 2.297, - "step": 487890 - }, - { - "epoch": 0.85, - "learning_rate": 7.458050970120363e-06, - "loss": 2.3441, - "step": 487900 - }, - { - "epoch": 0.85, - "learning_rate": 7.457179030193537e-06, - "loss": 2.2392, - "step": 487910 - }, - { - "epoch": 0.85, - "learning_rate": 7.45630709026671e-06, - "loss": 2.2215, - "step": 487920 - }, - { - "epoch": 0.85, - "learning_rate": 7.4554351503398834e-06, - "loss": 2.2784, - "step": 487930 - }, - { - "epoch": 0.85, - "learning_rate": 7.4545632104130555e-06, - "loss": 2.18, - "step": 487940 - }, - { - "epoch": 0.85, - "learning_rate": 7.453691270486229e-06, - "loss": 2.267, - "step": 487950 - }, - { - "epoch": 0.85, - "learning_rate": 7.452819330559402e-06, - "loss": 2.1743, - "step": 487960 - }, - { - "epoch": 0.85, - "learning_rate": 7.451947390632576e-06, - "loss": 2.2988, - "step": 487970 - }, - { - "epoch": 0.85, - "learning_rate": 7.451075450705748e-06, - "loss": 2.2676, - "step": 487980 - }, - { - "epoch": 0.85, - "learning_rate": 7.450203510778922e-06, - "loss": 2.1717, - "step": 487990 - }, - { - "epoch": 0.85, - "learning_rate": 7.449331570852095e-06, - "loss": 2.365, - "step": 488000 - }, - { - "epoch": 0.85, - "learning_rate": 7.4484596309252685e-06, - "loss": 2.2207, - "step": 488010 - }, - { - "epoch": 0.85, - "learning_rate": 7.447587690998441e-06, - "loss": 2.1882, - "step": 488020 - }, - { - "epoch": 0.85, - "learning_rate": 7.446715751071614e-06, - "loss": 2.3069, - "step": 488030 - }, - { - "epoch": 0.85, - "learning_rate": 7.445843811144788e-06, - "loss": 2.3327, - "step": 488040 - }, - { - "epoch": 0.85, - "learning_rate": 7.444971871217961e-06, - "loss": 2.2388, - "step": 488050 - }, - { - "epoch": 0.85, - "learning_rate": 7.444099931291135e-06, - "loss": 2.3733, - "step": 488060 - }, - { - "epoch": 0.85, - "learning_rate": 7.443227991364307e-06, - "loss": 2.1782, - "step": 488070 - }, - { - "epoch": 0.85, - "learning_rate": 7.442356051437481e-06, - "loss": 2.1468, - "step": 488080 - }, - { - "epoch": 0.85, - "learning_rate": 7.441484111510654e-06, - "loss": 2.2498, - "step": 488090 - }, - { - "epoch": 0.85, - "learning_rate": 7.440612171583827e-06, - "loss": 2.2886, - "step": 488100 - }, - { - "epoch": 0.85, - "learning_rate": 7.4397402316569994e-06, - "loss": 2.25, - "step": 488110 - }, - { - "epoch": 0.85, - "learning_rate": 7.438868291730173e-06, - "loss": 2.2192, - "step": 488120 - }, - { - "epoch": 0.85, - "learning_rate": 7.437996351803346e-06, - "loss": 2.2734, - "step": 488130 - }, - { - "epoch": 0.85, - "learning_rate": 7.43712441187652e-06, - "loss": 2.2445, - "step": 488140 - }, - { - "epoch": 0.85, - "learning_rate": 7.436252471949692e-06, - "loss": 2.3195, - "step": 488150 - }, - { - "epoch": 0.85, - "learning_rate": 7.435380532022866e-06, - "loss": 2.2516, - "step": 488160 - }, - { - "epoch": 0.85, - "learning_rate": 7.434508592096039e-06, - "loss": 2.2615, - "step": 488170 - }, - { - "epoch": 0.85, - "learning_rate": 7.4336366521692124e-06, - "loss": 2.1851, - "step": 488180 - }, - { - "epoch": 0.85, - "learning_rate": 7.432764712242386e-06, - "loss": 2.2736, - "step": 488190 - }, - { - "epoch": 0.85, - "learning_rate": 7.431892772315559e-06, - "loss": 2.2339, - "step": 488200 - }, - { - "epoch": 0.85, - "learning_rate": 7.431020832388733e-06, - "loss": 2.2734, - "step": 488210 - }, - { - "epoch": 0.85, - "learning_rate": 7.430148892461905e-06, - "loss": 2.3155, - "step": 488220 - }, - { - "epoch": 0.85, - "learning_rate": 7.429276952535079e-06, - "loss": 2.2423, - "step": 488230 - }, - { - "epoch": 0.85, - "learning_rate": 7.428405012608252e-06, - "loss": 2.1962, - "step": 488240 - }, - { - "epoch": 0.85, - "learning_rate": 7.4275330726814255e-06, - "loss": 2.2171, - "step": 488250 - }, - { - "epoch": 0.85, - "learning_rate": 7.4266611327545975e-06, - "loss": 2.2701, - "step": 488260 - }, - { - "epoch": 0.85, - "learning_rate": 7.425789192827771e-06, - "loss": 2.3245, - "step": 488270 - }, - { - "epoch": 0.85, - "learning_rate": 7.424917252900944e-06, - "loss": 2.2043, - "step": 488280 - }, - { - "epoch": 0.85, - "learning_rate": 7.424045312974118e-06, - "loss": 2.2889, - "step": 488290 - }, - { - "epoch": 0.85, - "learning_rate": 7.42317337304729e-06, - "loss": 2.2216, - "step": 488300 - }, - { - "epoch": 0.85, - "learning_rate": 7.422301433120464e-06, - "loss": 2.2641, - "step": 488310 - }, - { - "epoch": 0.85, - "learning_rate": 7.421429493193638e-06, - "loss": 2.2366, - "step": 488320 - }, - { - "epoch": 0.85, - "learning_rate": 7.4205575532668105e-06, - "loss": 2.1707, - "step": 488330 - }, - { - "epoch": 0.85, - "learning_rate": 7.419685613339984e-06, - "loss": 2.2422, - "step": 488340 - }, - { - "epoch": 0.85, - "learning_rate": 7.418813673413156e-06, - "loss": 2.2985, - "step": 488350 - }, - { - "epoch": 0.85, - "learning_rate": 7.41794173348633e-06, - "loss": 2.2492, - "step": 488360 - }, - { - "epoch": 0.85, - "learning_rate": 7.417069793559503e-06, - "loss": 2.2119, - "step": 488370 - }, - { - "epoch": 0.85, - "learning_rate": 7.416197853632677e-06, - "loss": 2.3334, - "step": 488380 - }, - { - "epoch": 0.85, - "learning_rate": 7.415325913705849e-06, - "loss": 2.2824, - "step": 488390 - }, - { - "epoch": 0.85, - "learning_rate": 7.414453973779023e-06, - "loss": 2.2591, - "step": 488400 - }, - { - "epoch": 0.85, - "learning_rate": 7.413582033852196e-06, - "loss": 2.3258, - "step": 488410 - }, - { - "epoch": 0.85, - "learning_rate": 7.412710093925369e-06, - "loss": 2.4162, - "step": 488420 - }, - { - "epoch": 0.85, - "learning_rate": 7.4118381539985415e-06, - "loss": 2.2568, - "step": 488430 - }, - { - "epoch": 0.85, - "learning_rate": 7.410966214071716e-06, - "loss": 2.2738, - "step": 488440 - }, - { - "epoch": 0.85, - "learning_rate": 7.41009427414489e-06, - "loss": 2.2146, - "step": 488450 - }, - { - "epoch": 0.85, - "learning_rate": 7.409222334218062e-06, - "loss": 2.1826, - "step": 488460 - }, - { - "epoch": 0.85, - "learning_rate": 7.408350394291236e-06, - "loss": 2.1177, - "step": 488470 - }, - { - "epoch": 0.85, - "learning_rate": 7.407478454364409e-06, - "loss": 2.2278, - "step": 488480 - }, - { - "epoch": 0.85, - "learning_rate": 7.406606514437582e-06, - "loss": 2.2778, - "step": 488490 - }, - { - "epoch": 0.85, - "learning_rate": 7.4057345745107545e-06, - "loss": 2.3045, - "step": 488500 - }, - { - "epoch": 0.85, - "learning_rate": 7.404862634583928e-06, - "loss": 2.2331, - "step": 488510 - }, - { - "epoch": 0.85, - "learning_rate": 7.403990694657101e-06, - "loss": 2.1754, - "step": 488520 - }, - { - "epoch": 0.85, - "learning_rate": 7.403118754730275e-06, - "loss": 2.2963, - "step": 488530 - }, - { - "epoch": 0.85, - "learning_rate": 7.402246814803447e-06, - "loss": 2.3209, - "step": 488540 - }, - { - "epoch": 0.85, - "learning_rate": 7.401374874876621e-06, - "loss": 2.311, - "step": 488550 - }, - { - "epoch": 0.85, - "learning_rate": 7.400502934949794e-06, - "loss": 2.3281, - "step": 488560 - }, - { - "epoch": 0.85, - "learning_rate": 7.3996309950229675e-06, - "loss": 2.3034, - "step": 488570 - }, - { - "epoch": 0.85, - "learning_rate": 7.398759055096141e-06, - "loss": 2.2344, - "step": 488580 - }, - { - "epoch": 0.85, - "learning_rate": 7.397887115169313e-06, - "loss": 2.3145, - "step": 488590 - }, - { - "epoch": 0.85, - "learning_rate": 7.397015175242487e-06, - "loss": 2.2102, - "step": 488600 - }, - { - "epoch": 0.85, - "learning_rate": 7.39614323531566e-06, - "loss": 2.3309, - "step": 488610 - }, - { - "epoch": 0.85, - "learning_rate": 7.395271295388834e-06, - "loss": 2.2908, - "step": 488620 - }, - { - "epoch": 0.85, - "learning_rate": 7.394399355462006e-06, - "loss": 2.2114, - "step": 488630 - }, - { - "epoch": 0.85, - "learning_rate": 7.39352741553518e-06, - "loss": 2.3491, - "step": 488640 - }, - { - "epoch": 0.85, - "learning_rate": 7.3926554756083525e-06, - "loss": 2.1639, - "step": 488650 - }, - { - "epoch": 0.85, - "learning_rate": 7.391783535681526e-06, - "loss": 2.2653, - "step": 488660 - }, - { - "epoch": 0.85, - "learning_rate": 7.390911595754698e-06, - "loss": 2.162, - "step": 488670 - }, - { - "epoch": 0.85, - "learning_rate": 7.390039655827872e-06, - "loss": 2.2477, - "step": 488680 - }, - { - "epoch": 0.85, - "learning_rate": 7.389167715901045e-06, - "loss": 2.1763, - "step": 488690 - }, - { - "epoch": 0.85, - "learning_rate": 7.388295775974219e-06, - "loss": 2.2065, - "step": 488700 - }, - { - "epoch": 0.85, - "learning_rate": 7.387423836047393e-06, - "loss": 2.2691, - "step": 488710 - }, - { - "epoch": 0.85, - "learning_rate": 7.3865518961205655e-06, - "loss": 2.318, - "step": 488720 - }, - { - "epoch": 0.85, - "learning_rate": 7.385679956193739e-06, - "loss": 2.2995, - "step": 488730 - }, - { - "epoch": 0.85, - "learning_rate": 7.384808016266911e-06, - "loss": 2.4208, - "step": 488740 - }, - { - "epoch": 0.85, - "learning_rate": 7.383936076340085e-06, - "loss": 2.2747, - "step": 488750 - }, - { - "epoch": 0.85, - "learning_rate": 7.383064136413258e-06, - "loss": 2.2657, - "step": 488760 - }, - { - "epoch": 0.85, - "learning_rate": 7.382192196486432e-06, - "loss": 2.3187, - "step": 488770 - }, - { - "epoch": 0.85, - "learning_rate": 7.381320256559604e-06, - "loss": 2.1994, - "step": 488780 - }, - { - "epoch": 0.85, - "learning_rate": 7.380448316632778e-06, - "loss": 2.2621, - "step": 488790 - }, - { - "epoch": 0.85, - "learning_rate": 7.379576376705951e-06, - "loss": 2.3117, - "step": 488800 - }, - { - "epoch": 0.85, - "learning_rate": 7.378704436779124e-06, - "loss": 2.341, - "step": 488810 - }, - { - "epoch": 0.85, - "learning_rate": 7.3778324968522965e-06, - "loss": 2.1714, - "step": 488820 - }, - { - "epoch": 0.85, - "learning_rate": 7.37696055692547e-06, - "loss": 2.3251, - "step": 488830 - }, - { - "epoch": 0.85, - "learning_rate": 7.376088616998644e-06, - "loss": 2.3213, - "step": 488840 - }, - { - "epoch": 0.85, - "learning_rate": 7.375216677071817e-06, - "loss": 2.3351, - "step": 488850 - }, - { - "epoch": 0.85, - "learning_rate": 7.374344737144991e-06, - "loss": 2.2161, - "step": 488860 - }, - { - "epoch": 0.85, - "learning_rate": 7.373472797218163e-06, - "loss": 2.2426, - "step": 488870 - }, - { - "epoch": 0.85, - "learning_rate": 7.3726008572913365e-06, - "loss": 2.3433, - "step": 488880 - }, - { - "epoch": 0.85, - "learning_rate": 7.3717289173645095e-06, - "loss": 2.3313, - "step": 488890 - }, - { - "epoch": 0.85, - "learning_rate": 7.370856977437683e-06, - "loss": 2.3141, - "step": 488900 - }, - { - "epoch": 0.85, - "learning_rate": 7.369985037510855e-06, - "loss": 2.296, - "step": 488910 - }, - { - "epoch": 0.85, - "learning_rate": 7.369113097584029e-06, - "loss": 2.2954, - "step": 488920 - }, - { - "epoch": 0.85, - "learning_rate": 7.368241157657202e-06, - "loss": 2.1596, - "step": 488930 - }, - { - "epoch": 0.85, - "learning_rate": 7.367369217730376e-06, - "loss": 2.0843, - "step": 488940 - }, - { - "epoch": 0.85, - "learning_rate": 7.366497277803548e-06, - "loss": 2.2865, - "step": 488950 - }, - { - "epoch": 0.85, - "learning_rate": 7.3656253378767225e-06, - "loss": 2.2038, - "step": 488960 - }, - { - "epoch": 0.85, - "learning_rate": 7.364753397949896e-06, - "loss": 2.3094, - "step": 488970 - }, - { - "epoch": 0.85, - "learning_rate": 7.363881458023068e-06, - "loss": 2.0581, - "step": 488980 - }, - { - "epoch": 0.85, - "learning_rate": 7.363009518096242e-06, - "loss": 2.273, - "step": 488990 - }, - { - "epoch": 0.85, - "learning_rate": 7.362137578169415e-06, - "loss": 2.3308, - "step": 489000 - }, - { - "epoch": 0.85, - "learning_rate": 7.361265638242589e-06, - "loss": 2.1916, - "step": 489010 - }, - { - "epoch": 0.85, - "learning_rate": 7.360393698315761e-06, - "loss": 2.2316, - "step": 489020 - }, - { - "epoch": 0.85, - "learning_rate": 7.359521758388935e-06, - "loss": 2.2676, - "step": 489030 - }, - { - "epoch": 0.85, - "learning_rate": 7.3586498184621075e-06, - "loss": 2.3559, - "step": 489040 - }, - { - "epoch": 0.85, - "learning_rate": 7.357777878535281e-06, - "loss": 2.3371, - "step": 489050 - }, - { - "epoch": 0.85, - "learning_rate": 7.356905938608453e-06, - "loss": 2.0913, - "step": 489060 - }, - { - "epoch": 0.85, - "learning_rate": 7.356033998681627e-06, - "loss": 2.2731, - "step": 489070 - }, - { - "epoch": 0.85, - "learning_rate": 7.3551620587548e-06, - "loss": 2.2893, - "step": 489080 - }, - { - "epoch": 0.85, - "learning_rate": 7.354290118827974e-06, - "loss": 2.307, - "step": 489090 - }, - { - "epoch": 0.85, - "learning_rate": 7.353418178901146e-06, - "loss": 2.243, - "step": 489100 - }, - { - "epoch": 0.85, - "learning_rate": 7.35254623897432e-06, - "loss": 2.278, - "step": 489110 - }, - { - "epoch": 0.85, - "learning_rate": 7.3516742990474935e-06, - "loss": 2.3433, - "step": 489120 - }, - { - "epoch": 0.85, - "learning_rate": 7.350802359120666e-06, - "loss": 2.2911, - "step": 489130 - }, - { - "epoch": 0.85, - "learning_rate": 7.34993041919384e-06, - "loss": 2.2428, - "step": 489140 - }, - { - "epoch": 0.85, - "learning_rate": 7.349058479267012e-06, - "loss": 2.3332, - "step": 489150 - }, - { - "epoch": 0.85, - "learning_rate": 7.348186539340186e-06, - "loss": 2.1387, - "step": 489160 - }, - { - "epoch": 0.85, - "learning_rate": 7.347314599413359e-06, - "loss": 2.1746, - "step": 489170 - }, - { - "epoch": 0.85, - "learning_rate": 7.346442659486533e-06, - "loss": 2.2614, - "step": 489180 - }, - { - "epoch": 0.85, - "learning_rate": 7.345570719559705e-06, - "loss": 2.1747, - "step": 489190 - }, - { - "epoch": 0.85, - "learning_rate": 7.3446987796328785e-06, - "loss": 2.36, - "step": 489200 - }, - { - "epoch": 0.85, - "learning_rate": 7.3438268397060515e-06, - "loss": 2.2332, - "step": 489210 - }, - { - "epoch": 0.85, - "learning_rate": 7.342954899779225e-06, - "loss": 2.1985, - "step": 489220 - }, - { - "epoch": 0.85, - "learning_rate": 7.342082959852397e-06, - "loss": 2.2762, - "step": 489230 - }, - { - "epoch": 0.85, - "learning_rate": 7.341211019925572e-06, - "loss": 2.237, - "step": 489240 - }, - { - "epoch": 0.85, - "learning_rate": 7.340339079998746e-06, - "loss": 2.3834, - "step": 489250 - }, - { - "epoch": 0.85, - "learning_rate": 7.339467140071918e-06, - "loss": 2.2096, - "step": 489260 - }, - { - "epoch": 0.85, - "learning_rate": 7.3385952001450915e-06, - "loss": 2.3063, - "step": 489270 - }, - { - "epoch": 0.85, - "learning_rate": 7.3377232602182645e-06, - "loss": 2.2976, - "step": 489280 - }, - { - "epoch": 0.85, - "learning_rate": 7.336851320291438e-06, - "loss": 2.2913, - "step": 489290 - }, - { - "epoch": 0.85, - "learning_rate": 7.33597938036461e-06, - "loss": 2.4103, - "step": 489300 - }, - { - "epoch": 0.85, - "learning_rate": 7.335107440437784e-06, - "loss": 2.3401, - "step": 489310 - }, - { - "epoch": 0.85, - "learning_rate": 7.334235500510957e-06, - "loss": 2.3319, - "step": 489320 - }, - { - "epoch": 0.85, - "learning_rate": 7.333363560584131e-06, - "loss": 2.2605, - "step": 489330 - }, - { - "epoch": 0.85, - "learning_rate": 7.332491620657303e-06, - "loss": 2.2567, - "step": 489340 - }, - { - "epoch": 0.85, - "learning_rate": 7.331619680730477e-06, - "loss": 2.2418, - "step": 489350 - }, - { - "epoch": 0.85, - "learning_rate": 7.3307477408036495e-06, - "loss": 2.342, - "step": 489360 - }, - { - "epoch": 0.85, - "learning_rate": 7.329875800876823e-06, - "loss": 2.3049, - "step": 489370 - }, - { - "epoch": 0.85, - "learning_rate": 7.329003860949997e-06, - "loss": 2.3274, - "step": 489380 - }, - { - "epoch": 0.85, - "learning_rate": 7.328131921023169e-06, - "loss": 2.3493, - "step": 489390 - }, - { - "epoch": 0.85, - "learning_rate": 7.327259981096343e-06, - "loss": 2.2817, - "step": 489400 - }, - { - "epoch": 0.85, - "learning_rate": 7.326388041169516e-06, - "loss": 2.1627, - "step": 489410 - }, - { - "epoch": 0.85, - "learning_rate": 7.32551610124269e-06, - "loss": 2.1969, - "step": 489420 - }, - { - "epoch": 0.85, - "learning_rate": 7.324644161315862e-06, - "loss": 2.264, - "step": 489430 - }, - { - "epoch": 0.85, - "learning_rate": 7.3237722213890355e-06, - "loss": 2.2868, - "step": 489440 - }, - { - "epoch": 0.85, - "learning_rate": 7.322900281462208e-06, - "loss": 2.2036, - "step": 489450 - }, - { - "epoch": 0.85, - "learning_rate": 7.322028341535382e-06, - "loss": 2.2916, - "step": 489460 - }, - { - "epoch": 0.85, - "learning_rate": 7.321156401608554e-06, - "loss": 2.2892, - "step": 489470 - }, - { - "epoch": 0.85, - "learning_rate": 7.320284461681729e-06, - "loss": 2.2584, - "step": 489480 - }, - { - "epoch": 0.85, - "learning_rate": 7.319412521754901e-06, - "loss": 2.1255, - "step": 489490 - }, - { - "epoch": 0.85, - "learning_rate": 7.318540581828075e-06, - "loss": 2.2453, - "step": 489500 - }, - { - "epoch": 0.85, - "learning_rate": 7.3176686419012485e-06, - "loss": 2.3066, - "step": 489510 - }, - { - "epoch": 0.85, - "learning_rate": 7.316796701974421e-06, - "loss": 2.2188, - "step": 489520 - }, - { - "epoch": 0.85, - "learning_rate": 7.315924762047595e-06, - "loss": 2.2441, - "step": 489530 - }, - { - "epoch": 0.85, - "learning_rate": 7.315052822120767e-06, - "loss": 2.2616, - "step": 489540 - }, - { - "epoch": 0.85, - "learning_rate": 7.314180882193941e-06, - "loss": 2.2131, - "step": 489550 - }, - { - "epoch": 0.85, - "learning_rate": 7.313308942267114e-06, - "loss": 2.1966, - "step": 489560 - }, - { - "epoch": 0.85, - "learning_rate": 7.312437002340288e-06, - "loss": 2.3693, - "step": 489570 - }, - { - "epoch": 0.85, - "learning_rate": 7.31156506241346e-06, - "loss": 2.3017, - "step": 489580 - }, - { - "epoch": 0.85, - "learning_rate": 7.3106931224866335e-06, - "loss": 2.3305, - "step": 489590 - }, - { - "epoch": 0.85, - "learning_rate": 7.3098211825598065e-06, - "loss": 2.3194, - "step": 489600 - }, - { - "epoch": 0.85, - "learning_rate": 7.30894924263298e-06, - "loss": 2.2864, - "step": 489610 - }, - { - "epoch": 0.85, - "learning_rate": 7.308077302706152e-06, - "loss": 2.3317, - "step": 489620 - }, - { - "epoch": 0.85, - "learning_rate": 7.307205362779326e-06, - "loss": 2.2741, - "step": 489630 - }, - { - "epoch": 0.85, - "learning_rate": 7.3063334228525e-06, - "loss": 2.2116, - "step": 489640 - }, - { - "epoch": 0.85, - "learning_rate": 7.305461482925673e-06, - "loss": 2.2967, - "step": 489650 - }, - { - "epoch": 0.85, - "learning_rate": 7.3045895429988465e-06, - "loss": 2.2608, - "step": 489660 - }, - { - "epoch": 0.85, - "learning_rate": 7.303717603072019e-06, - "loss": 2.2642, - "step": 489670 - }, - { - "epoch": 0.85, - "learning_rate": 7.302845663145192e-06, - "loss": 2.2697, - "step": 489680 - }, - { - "epoch": 0.85, - "learning_rate": 7.301973723218365e-06, - "loss": 2.3391, - "step": 489690 - }, - { - "epoch": 0.85, - "learning_rate": 7.301101783291539e-06, - "loss": 2.2696, - "step": 489700 - }, - { - "epoch": 0.85, - "learning_rate": 7.300229843364711e-06, - "loss": 2.2739, - "step": 489710 - }, - { - "epoch": 0.85, - "learning_rate": 7.299357903437885e-06, - "loss": 2.1696, - "step": 489720 - }, - { - "epoch": 0.85, - "learning_rate": 7.298485963511058e-06, - "loss": 2.2714, - "step": 489730 - }, - { - "epoch": 0.85, - "learning_rate": 7.297614023584232e-06, - "loss": 2.2939, - "step": 489740 - }, - { - "epoch": 0.85, - "learning_rate": 7.296742083657404e-06, - "loss": 2.4328, - "step": 489750 - }, - { - "epoch": 0.85, - "learning_rate": 7.295870143730578e-06, - "loss": 2.1666, - "step": 489760 - }, - { - "epoch": 0.85, - "learning_rate": 7.294998203803752e-06, - "loss": 2.1896, - "step": 489770 - }, - { - "epoch": 0.85, - "learning_rate": 7.294126263876924e-06, - "loss": 2.3261, - "step": 489780 - }, - { - "epoch": 0.85, - "learning_rate": 7.293254323950098e-06, - "loss": 2.2662, - "step": 489790 - }, - { - "epoch": 0.85, - "learning_rate": 7.292382384023271e-06, - "loss": 2.2585, - "step": 489800 - }, - { - "epoch": 0.85, - "learning_rate": 7.291510444096445e-06, - "loss": 2.2884, - "step": 489810 - }, - { - "epoch": 0.85, - "learning_rate": 7.290638504169617e-06, - "loss": 2.3343, - "step": 489820 - }, - { - "epoch": 0.85, - "learning_rate": 7.2897665642427905e-06, - "loss": 2.2775, - "step": 489830 - }, - { - "epoch": 0.85, - "learning_rate": 7.288894624315963e-06, - "loss": 2.229, - "step": 489840 - }, - { - "epoch": 0.85, - "learning_rate": 7.288022684389137e-06, - "loss": 2.326, - "step": 489850 - }, - { - "epoch": 0.85, - "learning_rate": 7.287150744462309e-06, - "loss": 2.18, - "step": 489860 - }, - { - "epoch": 0.85, - "learning_rate": 7.286278804535483e-06, - "loss": 2.2859, - "step": 489870 - }, - { - "epoch": 0.85, - "learning_rate": 7.285406864608656e-06, - "loss": 2.2543, - "step": 489880 - }, - { - "epoch": 0.85, - "learning_rate": 7.28453492468183e-06, - "loss": 2.3532, - "step": 489890 - }, - { - "epoch": 0.85, - "learning_rate": 7.2836629847550035e-06, - "loss": 2.2402, - "step": 489900 - }, - { - "epoch": 0.85, - "learning_rate": 7.2827910448281755e-06, - "loss": 2.2813, - "step": 489910 - }, - { - "epoch": 0.85, - "learning_rate": 7.281919104901349e-06, - "loss": 2.329, - "step": 489920 - }, - { - "epoch": 0.85, - "learning_rate": 7.281047164974522e-06, - "loss": 2.1686, - "step": 489930 - }, - { - "epoch": 0.85, - "learning_rate": 7.280175225047696e-06, - "loss": 2.1193, - "step": 489940 - }, - { - "epoch": 0.85, - "learning_rate": 7.279303285120868e-06, - "loss": 2.3518, - "step": 489950 - }, - { - "epoch": 0.85, - "learning_rate": 7.278431345194042e-06, - "loss": 2.3028, - "step": 489960 - }, - { - "epoch": 0.85, - "learning_rate": 7.277559405267215e-06, - "loss": 2.2609, - "step": 489970 - }, - { - "epoch": 0.85, - "learning_rate": 7.2766874653403885e-06, - "loss": 2.3671, - "step": 489980 - }, - { - "epoch": 0.85, - "learning_rate": 7.275815525413561e-06, - "loss": 2.2513, - "step": 489990 - }, - { - "epoch": 0.85, - "learning_rate": 7.274943585486735e-06, - "loss": 2.2094, - "step": 490000 - }, - { - "epoch": 0.85, - "learning_rate": 7.274071645559907e-06, - "loss": 2.2535, - "step": 490010 - }, - { - "epoch": 0.85, - "learning_rate": 7.273199705633081e-06, - "loss": 2.2882, - "step": 490020 - }, - { - "epoch": 0.85, - "learning_rate": 7.272327765706253e-06, - "loss": 2.3013, - "step": 490030 - }, - { - "epoch": 0.85, - "learning_rate": 7.271455825779428e-06, - "loss": 2.2704, - "step": 490040 - }, - { - "epoch": 0.85, - "learning_rate": 7.2705838858526015e-06, - "loss": 2.3253, - "step": 490050 - }, - { - "epoch": 0.85, - "learning_rate": 7.269711945925774e-06, - "loss": 2.2121, - "step": 490060 - }, - { - "epoch": 0.85, - "learning_rate": 7.268840005998947e-06, - "loss": 2.2209, - "step": 490070 - }, - { - "epoch": 0.85, - "learning_rate": 7.26796806607212e-06, - "loss": 2.2641, - "step": 490080 - }, - { - "epoch": 0.85, - "learning_rate": 7.267096126145294e-06, - "loss": 2.3552, - "step": 490090 - }, - { - "epoch": 0.85, - "learning_rate": 7.266224186218466e-06, - "loss": 2.3753, - "step": 490100 - }, - { - "epoch": 0.85, - "learning_rate": 7.26535224629164e-06, - "loss": 2.3394, - "step": 490110 - }, - { - "epoch": 0.85, - "learning_rate": 7.264480306364813e-06, - "loss": 2.2483, - "step": 490120 - }, - { - "epoch": 0.85, - "learning_rate": 7.263608366437987e-06, - "loss": 2.1825, - "step": 490130 - }, - { - "epoch": 0.85, - "learning_rate": 7.262736426511159e-06, - "loss": 2.3079, - "step": 490140 - }, - { - "epoch": 0.85, - "learning_rate": 7.2618644865843325e-06, - "loss": 2.2183, - "step": 490150 - }, - { - "epoch": 0.85, - "learning_rate": 7.260992546657505e-06, - "loss": 2.3022, - "step": 490160 - }, - { - "epoch": 0.85, - "learning_rate": 7.260120606730679e-06, - "loss": 2.168, - "step": 490170 - }, - { - "epoch": 0.85, - "learning_rate": 7.259248666803853e-06, - "loss": 2.3101, - "step": 490180 - }, - { - "epoch": 0.85, - "learning_rate": 7.258376726877025e-06, - "loss": 2.3843, - "step": 490190 - }, - { - "epoch": 0.85, - "learning_rate": 7.257504786950199e-06, - "loss": 2.2365, - "step": 490200 - }, - { - "epoch": 0.85, - "learning_rate": 7.256632847023372e-06, - "loss": 2.375, - "step": 490210 - }, - { - "epoch": 0.85, - "learning_rate": 7.2557609070965455e-06, - "loss": 2.3023, - "step": 490220 - }, - { - "epoch": 0.85, - "learning_rate": 7.2548889671697175e-06, - "loss": 2.167, - "step": 490230 - }, - { - "epoch": 0.85, - "learning_rate": 7.254017027242891e-06, - "loss": 2.2414, - "step": 490240 - }, - { - "epoch": 0.85, - "learning_rate": 7.253145087316064e-06, - "loss": 2.3377, - "step": 490250 - }, - { - "epoch": 0.85, - "learning_rate": 7.252273147389238e-06, - "loss": 2.2582, - "step": 490260 - }, - { - "epoch": 0.85, - "learning_rate": 7.25140120746241e-06, - "loss": 2.2323, - "step": 490270 - }, - { - "epoch": 0.85, - "learning_rate": 7.250529267535585e-06, - "loss": 2.2128, - "step": 490280 - }, - { - "epoch": 0.86, - "learning_rate": 7.249657327608757e-06, - "loss": 2.1968, - "step": 490290 - }, - { - "epoch": 0.86, - "learning_rate": 7.2487853876819305e-06, - "loss": 2.3124, - "step": 490300 - }, - { - "epoch": 0.86, - "learning_rate": 7.247913447755104e-06, - "loss": 2.2026, - "step": 490310 - }, - { - "epoch": 0.86, - "learning_rate": 7.247041507828277e-06, - "loss": 2.34, - "step": 490320 - }, - { - "epoch": 0.86, - "learning_rate": 7.246169567901451e-06, - "loss": 2.2295, - "step": 490330 - }, - { - "epoch": 0.86, - "learning_rate": 7.245297627974623e-06, - "loss": 2.2798, - "step": 490340 - }, - { - "epoch": 0.86, - "learning_rate": 7.244425688047797e-06, - "loss": 2.2929, - "step": 490350 - }, - { - "epoch": 0.86, - "learning_rate": 7.24355374812097e-06, - "loss": 2.1791, - "step": 490360 - }, - { - "epoch": 0.86, - "learning_rate": 7.2426818081941435e-06, - "loss": 2.2333, - "step": 490370 - }, - { - "epoch": 0.86, - "learning_rate": 7.241809868267316e-06, - "loss": 2.2952, - "step": 490380 - }, - { - "epoch": 0.86, - "learning_rate": 7.240937928340489e-06, - "loss": 2.2817, - "step": 490390 - }, - { - "epoch": 0.86, - "learning_rate": 7.240065988413662e-06, - "loss": 2.2804, - "step": 490400 - }, - { - "epoch": 0.86, - "learning_rate": 7.239194048486836e-06, - "loss": 2.1985, - "step": 490410 - }, - { - "epoch": 0.86, - "learning_rate": 7.238322108560008e-06, - "loss": 2.179, - "step": 490420 - }, - { - "epoch": 0.86, - "learning_rate": 7.237450168633182e-06, - "loss": 2.1695, - "step": 490430 - }, - { - "epoch": 0.86, - "learning_rate": 7.236578228706356e-06, - "loss": 2.2148, - "step": 490440 - }, - { - "epoch": 0.86, - "learning_rate": 7.235706288779529e-06, - "loss": 2.2293, - "step": 490450 - }, - { - "epoch": 0.86, - "learning_rate": 7.234834348852702e-06, - "loss": 2.3529, - "step": 490460 - }, - { - "epoch": 0.86, - "learning_rate": 7.2339624089258745e-06, - "loss": 2.3419, - "step": 490470 - }, - { - "epoch": 0.86, - "learning_rate": 7.233090468999048e-06, - "loss": 2.2039, - "step": 490480 - }, - { - "epoch": 0.86, - "learning_rate": 7.232218529072221e-06, - "loss": 2.268, - "step": 490490 - }, - { - "epoch": 0.86, - "learning_rate": 7.231346589145395e-06, - "loss": 2.2708, - "step": 490500 - }, - { - "epoch": 0.86, - "learning_rate": 7.230474649218567e-06, - "loss": 2.2648, - "step": 490510 - }, - { - "epoch": 0.86, - "learning_rate": 7.229602709291742e-06, - "loss": 2.2154, - "step": 490520 - }, - { - "epoch": 0.86, - "learning_rate": 7.228730769364914e-06, - "loss": 2.2347, - "step": 490530 - }, - { - "epoch": 0.86, - "learning_rate": 7.2278588294380875e-06, - "loss": 2.4097, - "step": 490540 - }, - { - "epoch": 0.86, - "learning_rate": 7.2269868895112595e-06, - "loss": 2.2517, - "step": 490550 - }, - { - "epoch": 0.86, - "learning_rate": 7.226114949584434e-06, - "loss": 2.3174, - "step": 490560 - }, - { - "epoch": 0.86, - "learning_rate": 7.225243009657608e-06, - "loss": 2.1855, - "step": 490570 - }, - { - "epoch": 0.86, - "learning_rate": 7.22437106973078e-06, - "loss": 2.4178, - "step": 490580 - }, - { - "epoch": 0.86, - "learning_rate": 7.223499129803954e-06, - "loss": 2.3377, - "step": 490590 - }, - { - "epoch": 0.86, - "learning_rate": 7.222627189877127e-06, - "loss": 2.1377, - "step": 490600 - }, - { - "epoch": 0.86, - "learning_rate": 7.2217552499503005e-06, - "loss": 2.19, - "step": 490610 - }, - { - "epoch": 0.86, - "learning_rate": 7.2208833100234725e-06, - "loss": 2.2891, - "step": 490620 - }, - { - "epoch": 0.86, - "learning_rate": 7.220011370096646e-06, - "loss": 2.2361, - "step": 490630 - }, - { - "epoch": 0.86, - "learning_rate": 7.219139430169819e-06, - "loss": 2.2849, - "step": 490640 - }, - { - "epoch": 0.86, - "learning_rate": 7.218267490242993e-06, - "loss": 2.3665, - "step": 490650 - }, - { - "epoch": 0.86, - "learning_rate": 7.217395550316165e-06, - "loss": 2.2062, - "step": 490660 - }, - { - "epoch": 0.86, - "learning_rate": 7.216523610389339e-06, - "loss": 2.3396, - "step": 490670 - }, - { - "epoch": 0.86, - "learning_rate": 7.215651670462512e-06, - "loss": 2.2351, - "step": 490680 - }, - { - "epoch": 0.86, - "learning_rate": 7.2147797305356855e-06, - "loss": 2.3219, - "step": 490690 - }, - { - "epoch": 0.86, - "learning_rate": 7.213907790608859e-06, - "loss": 2.3861, - "step": 490700 - }, - { - "epoch": 0.86, - "learning_rate": 7.213035850682031e-06, - "loss": 2.2006, - "step": 490710 - }, - { - "epoch": 0.86, - "learning_rate": 7.212163910755205e-06, - "loss": 2.2352, - "step": 490720 - }, - { - "epoch": 0.86, - "learning_rate": 7.211291970828378e-06, - "loss": 2.3639, - "step": 490730 - }, - { - "epoch": 0.86, - "learning_rate": 7.210420030901552e-06, - "loss": 2.3061, - "step": 490740 - }, - { - "epoch": 0.86, - "learning_rate": 7.209548090974724e-06, - "loss": 2.2821, - "step": 490750 - }, - { - "epoch": 0.86, - "learning_rate": 7.208676151047898e-06, - "loss": 2.2808, - "step": 490760 - }, - { - "epoch": 0.86, - "learning_rate": 7.207804211121071e-06, - "loss": 2.2034, - "step": 490770 - }, - { - "epoch": 0.86, - "learning_rate": 7.206932271194244e-06, - "loss": 2.2106, - "step": 490780 - }, - { - "epoch": 0.86, - "learning_rate": 7.2060603312674165e-06, - "loss": 2.2655, - "step": 490790 - }, - { - "epoch": 0.86, - "learning_rate": 7.205188391340591e-06, - "loss": 2.2404, - "step": 490800 - }, - { - "epoch": 0.86, - "learning_rate": 7.204316451413763e-06, - "loss": 2.1837, - "step": 490810 - }, - { - "epoch": 0.86, - "learning_rate": 7.203444511486937e-06, - "loss": 2.2904, - "step": 490820 - }, - { - "epoch": 0.86, - "learning_rate": 7.20257257156011e-06, - "loss": 2.2536, - "step": 490830 - }, - { - "epoch": 0.86, - "learning_rate": 7.201700631633284e-06, - "loss": 2.2474, - "step": 490840 - }, - { - "epoch": 0.86, - "learning_rate": 7.200828691706457e-06, - "loss": 2.2436, - "step": 490850 - }, - { - "epoch": 0.86, - "learning_rate": 7.1999567517796295e-06, - "loss": 2.3284, - "step": 490860 - }, - { - "epoch": 0.86, - "learning_rate": 7.199084811852803e-06, - "loss": 2.2175, - "step": 490870 - }, - { - "epoch": 0.86, - "learning_rate": 7.198212871925976e-06, - "loss": 2.1309, - "step": 490880 - }, - { - "epoch": 0.86, - "learning_rate": 7.19734093199915e-06, - "loss": 2.2811, - "step": 490890 - }, - { - "epoch": 0.86, - "learning_rate": 7.196468992072322e-06, - "loss": 2.2327, - "step": 490900 - }, - { - "epoch": 0.86, - "learning_rate": 7.195597052145496e-06, - "loss": 2.333, - "step": 490910 - }, - { - "epoch": 0.86, - "learning_rate": 7.194725112218669e-06, - "loss": 2.3091, - "step": 490920 - }, - { - "epoch": 0.86, - "learning_rate": 7.1938531722918425e-06, - "loss": 2.2529, - "step": 490930 - }, - { - "epoch": 0.86, - "learning_rate": 7.1929812323650145e-06, - "loss": 2.2789, - "step": 490940 - }, - { - "epoch": 0.86, - "learning_rate": 7.192109292438188e-06, - "loss": 2.3151, - "step": 490950 - }, - { - "epoch": 0.86, - "learning_rate": 7.191237352511361e-06, - "loss": 2.2324, - "step": 490960 - }, - { - "epoch": 0.86, - "learning_rate": 7.190365412584535e-06, - "loss": 2.4171, - "step": 490970 - }, - { - "epoch": 0.86, - "learning_rate": 7.189493472657709e-06, - "loss": 2.2538, - "step": 490980 - }, - { - "epoch": 0.86, - "learning_rate": 7.188621532730881e-06, - "loss": 2.262, - "step": 490990 - }, - { - "epoch": 0.86, - "learning_rate": 7.187749592804055e-06, - "loss": 2.202, - "step": 491000 - }, - { - "epoch": 0.86, - "learning_rate": 7.1868776528772276e-06, - "loss": 2.3304, - "step": 491010 - }, - { - "epoch": 0.86, - "learning_rate": 7.186005712950401e-06, - "loss": 2.2938, - "step": 491020 - }, - { - "epoch": 0.86, - "learning_rate": 7.185133773023573e-06, - "loss": 2.2364, - "step": 491030 - }, - { - "epoch": 0.86, - "learning_rate": 7.184261833096748e-06, - "loss": 2.2575, - "step": 491040 - }, - { - "epoch": 0.86, - "learning_rate": 7.18338989316992e-06, - "loss": 2.2477, - "step": 491050 - }, - { - "epoch": 0.86, - "learning_rate": 7.182517953243094e-06, - "loss": 2.2819, - "step": 491060 - }, - { - "epoch": 0.86, - "learning_rate": 7.181646013316266e-06, - "loss": 2.2582, - "step": 491070 - }, - { - "epoch": 0.86, - "learning_rate": 7.1807740733894406e-06, - "loss": 2.2606, - "step": 491080 - }, - { - "epoch": 0.86, - "learning_rate": 7.179902133462613e-06, - "loss": 2.2452, - "step": 491090 - }, - { - "epoch": 0.86, - "learning_rate": 7.179030193535786e-06, - "loss": 2.1988, - "step": 491100 - }, - { - "epoch": 0.86, - "learning_rate": 7.17815825360896e-06, - "loss": 2.2147, - "step": 491110 - }, - { - "epoch": 0.86, - "learning_rate": 7.177286313682133e-06, - "loss": 2.2347, - "step": 491120 - }, - { - "epoch": 0.86, - "learning_rate": 7.176414373755307e-06, - "loss": 2.2959, - "step": 491130 - }, - { - "epoch": 0.86, - "learning_rate": 7.175542433828479e-06, - "loss": 2.3285, - "step": 491140 - }, - { - "epoch": 0.86, - "learning_rate": 7.174670493901653e-06, - "loss": 2.3505, - "step": 491150 - }, - { - "epoch": 0.86, - "learning_rate": 7.173798553974826e-06, - "loss": 2.2911, - "step": 491160 - }, - { - "epoch": 0.86, - "learning_rate": 7.172926614047999e-06, - "loss": 2.2617, - "step": 491170 - }, - { - "epoch": 0.86, - "learning_rate": 7.1720546741211715e-06, - "loss": 2.2367, - "step": 491180 - }, - { - "epoch": 0.86, - "learning_rate": 7.171182734194345e-06, - "loss": 2.2482, - "step": 491190 - }, - { - "epoch": 0.86, - "learning_rate": 7.170310794267518e-06, - "loss": 2.2833, - "step": 491200 - }, - { - "epoch": 0.86, - "learning_rate": 7.169438854340692e-06, - "loss": 2.2375, - "step": 491210 - }, - { - "epoch": 0.86, - "learning_rate": 7.168566914413864e-06, - "loss": 2.2774, - "step": 491220 - }, - { - "epoch": 0.86, - "learning_rate": 7.167694974487038e-06, - "loss": 2.2396, - "step": 491230 - }, - { - "epoch": 0.86, - "learning_rate": 7.1668230345602116e-06, - "loss": 2.2629, - "step": 491240 - }, - { - "epoch": 0.86, - "learning_rate": 7.1659510946333845e-06, - "loss": 2.2728, - "step": 491250 - }, - { - "epoch": 0.86, - "learning_rate": 7.165079154706558e-06, - "loss": 2.3715, - "step": 491260 - }, - { - "epoch": 0.86, - "learning_rate": 7.16420721477973e-06, - "loss": 2.3131, - "step": 491270 - }, - { - "epoch": 0.86, - "learning_rate": 7.163335274852904e-06, - "loss": 2.3197, - "step": 491280 - }, - { - "epoch": 0.86, - "learning_rate": 7.162463334926077e-06, - "loss": 2.3056, - "step": 491290 - }, - { - "epoch": 0.86, - "learning_rate": 7.161591394999251e-06, - "loss": 2.3058, - "step": 491300 - }, - { - "epoch": 0.86, - "learning_rate": 7.160719455072423e-06, - "loss": 2.1736, - "step": 491310 - }, - { - "epoch": 0.86, - "learning_rate": 7.1598475151455975e-06, - "loss": 2.285, - "step": 491320 - }, - { - "epoch": 0.86, - "learning_rate": 7.1589755752187696e-06, - "loss": 2.3253, - "step": 491330 - }, - { - "epoch": 0.86, - "learning_rate": 7.158103635291943e-06, - "loss": 2.1655, - "step": 491340 - }, - { - "epoch": 0.86, - "learning_rate": 7.157231695365116e-06, - "loss": 2.3626, - "step": 491350 - }, - { - "epoch": 0.86, - "learning_rate": 7.15635975543829e-06, - "loss": 2.2398, - "step": 491360 - }, - { - "epoch": 0.86, - "learning_rate": 7.155487815511464e-06, - "loss": 2.2916, - "step": 491370 - }, - { - "epoch": 0.86, - "learning_rate": 7.154615875584636e-06, - "loss": 2.2638, - "step": 491380 - }, - { - "epoch": 0.86, - "learning_rate": 7.15374393565781e-06, - "loss": 2.308, - "step": 491390 - }, - { - "epoch": 0.86, - "learning_rate": 7.1528719957309826e-06, - "loss": 2.4081, - "step": 491400 - }, - { - "epoch": 0.86, - "learning_rate": 7.152000055804156e-06, - "loss": 2.3345, - "step": 491410 - }, - { - "epoch": 0.86, - "learning_rate": 7.151128115877328e-06, - "loss": 2.2071, - "step": 491420 - }, - { - "epoch": 0.86, - "learning_rate": 7.150256175950502e-06, - "loss": 2.2828, - "step": 491430 - }, - { - "epoch": 0.86, - "learning_rate": 7.149384236023675e-06, - "loss": 2.2848, - "step": 491440 - }, - { - "epoch": 0.86, - "learning_rate": 7.148512296096849e-06, - "loss": 2.1753, - "step": 491450 - }, - { - "epoch": 0.86, - "learning_rate": 7.147640356170021e-06, - "loss": 2.3245, - "step": 491460 - }, - { - "epoch": 0.86, - "learning_rate": 7.146768416243195e-06, - "loss": 2.3237, - "step": 491470 - }, - { - "epoch": 0.86, - "learning_rate": 7.145896476316368e-06, - "loss": 2.3745, - "step": 491480 - }, - { - "epoch": 0.86, - "learning_rate": 7.145024536389541e-06, - "loss": 2.2108, - "step": 491490 - }, - { - "epoch": 0.86, - "learning_rate": 7.144152596462715e-06, - "loss": 2.2238, - "step": 491500 - }, - { - "epoch": 0.86, - "learning_rate": 7.143280656535887e-06, - "loss": 2.3076, - "step": 491510 - }, - { - "epoch": 0.86, - "learning_rate": 7.142408716609061e-06, - "loss": 2.252, - "step": 491520 - }, - { - "epoch": 0.86, - "learning_rate": 7.141536776682234e-06, - "loss": 2.3689, - "step": 491530 - }, - { - "epoch": 0.86, - "learning_rate": 7.140664836755408e-06, - "loss": 2.2149, - "step": 491540 - }, - { - "epoch": 0.86, - "learning_rate": 7.13979289682858e-06, - "loss": 2.4114, - "step": 491550 - }, - { - "epoch": 0.86, - "learning_rate": 7.138920956901754e-06, - "loss": 2.2376, - "step": 491560 - }, - { - "epoch": 0.86, - "learning_rate": 7.1380490169749265e-06, - "loss": 2.2119, - "step": 491570 - }, - { - "epoch": 0.86, - "learning_rate": 7.1371770770481e-06, - "loss": 2.2693, - "step": 491580 - }, - { - "epoch": 0.86, - "learning_rate": 7.136305137121272e-06, - "loss": 2.3823, - "step": 491590 - }, - { - "epoch": 0.86, - "learning_rate": 7.135433197194447e-06, - "loss": 2.3516, - "step": 491600 - }, - { - "epoch": 0.86, - "learning_rate": 7.134561257267619e-06, - "loss": 2.3695, - "step": 491610 - }, - { - "epoch": 0.86, - "learning_rate": 7.133689317340793e-06, - "loss": 2.2496, - "step": 491620 - }, - { - "epoch": 0.86, - "learning_rate": 7.1328173774139666e-06, - "loss": 2.2539, - "step": 491630 - }, - { - "epoch": 0.86, - "learning_rate": 7.1319454374871395e-06, - "loss": 2.2693, - "step": 491640 - }, - { - "epoch": 0.86, - "learning_rate": 7.131073497560313e-06, - "loss": 2.1577, - "step": 491650 - }, - { - "epoch": 0.86, - "learning_rate": 7.130201557633485e-06, - "loss": 2.2777, - "step": 491660 - }, - { - "epoch": 0.86, - "learning_rate": 7.129329617706659e-06, - "loss": 2.2711, - "step": 491670 - }, - { - "epoch": 0.86, - "learning_rate": 7.128457677779832e-06, - "loss": 2.2505, - "step": 491680 - }, - { - "epoch": 0.86, - "learning_rate": 7.127585737853006e-06, - "loss": 2.3252, - "step": 491690 - }, - { - "epoch": 0.86, - "learning_rate": 7.126713797926178e-06, - "loss": 2.2518, - "step": 491700 - }, - { - "epoch": 0.86, - "learning_rate": 7.125841857999352e-06, - "loss": 2.273, - "step": 491710 - }, - { - "epoch": 0.86, - "learning_rate": 7.1249699180725246e-06, - "loss": 2.3634, - "step": 491720 - }, - { - "epoch": 0.86, - "learning_rate": 7.124097978145698e-06, - "loss": 2.3221, - "step": 491730 - }, - { - "epoch": 0.86, - "learning_rate": 7.12322603821887e-06, - "loss": 2.2884, - "step": 491740 - }, - { - "epoch": 0.86, - "learning_rate": 7.122354098292044e-06, - "loss": 2.2642, - "step": 491750 - }, - { - "epoch": 0.86, - "learning_rate": 7.121482158365217e-06, - "loss": 2.2908, - "step": 491760 - }, - { - "epoch": 0.86, - "learning_rate": 7.120610218438391e-06, - "loss": 2.3513, - "step": 491770 - }, - { - "epoch": 0.86, - "learning_rate": 7.119738278511565e-06, - "loss": 2.1703, - "step": 491780 - }, - { - "epoch": 0.86, - "learning_rate": 7.118866338584737e-06, - "loss": 2.3353, - "step": 491790 - }, - { - "epoch": 0.86, - "learning_rate": 7.1179943986579105e-06, - "loss": 2.2966, - "step": 491800 - }, - { - "epoch": 0.86, - "learning_rate": 7.117122458731083e-06, - "loss": 2.3196, - "step": 491810 - }, - { - "epoch": 0.86, - "learning_rate": 7.116250518804257e-06, - "loss": 2.2236, - "step": 491820 - }, - { - "epoch": 0.86, - "learning_rate": 7.115378578877429e-06, - "loss": 2.3005, - "step": 491830 - }, - { - "epoch": 0.86, - "learning_rate": 7.114506638950604e-06, - "loss": 2.2306, - "step": 491840 - }, - { - "epoch": 0.86, - "learning_rate": 7.113634699023776e-06, - "loss": 2.3426, - "step": 491850 - }, - { - "epoch": 0.86, - "learning_rate": 7.11276275909695e-06, - "loss": 2.176, - "step": 491860 - }, - { - "epoch": 0.86, - "learning_rate": 7.111890819170123e-06, - "loss": 2.192, - "step": 491870 - }, - { - "epoch": 0.86, - "learning_rate": 7.111018879243296e-06, - "loss": 2.273, - "step": 491880 - }, - { - "epoch": 0.86, - "learning_rate": 7.1101469393164685e-06, - "loss": 2.148, - "step": 491890 - }, - { - "epoch": 0.86, - "learning_rate": 7.109274999389642e-06, - "loss": 2.3241, - "step": 491900 - }, - { - "epoch": 0.86, - "learning_rate": 7.108403059462816e-06, - "loss": 2.2953, - "step": 491910 - }, - { - "epoch": 0.86, - "learning_rate": 7.107531119535989e-06, - "loss": 2.197, - "step": 491920 - }, - { - "epoch": 0.86, - "learning_rate": 7.106659179609163e-06, - "loss": 2.2428, - "step": 491930 - }, - { - "epoch": 0.86, - "learning_rate": 7.105787239682335e-06, - "loss": 2.2842, - "step": 491940 - }, - { - "epoch": 0.86, - "learning_rate": 7.1049152997555086e-06, - "loss": 2.3542, - "step": 491950 - }, - { - "epoch": 0.86, - "learning_rate": 7.1040433598286815e-06, - "loss": 2.3086, - "step": 491960 - }, - { - "epoch": 0.86, - "learning_rate": 7.103171419901855e-06, - "loss": 2.188, - "step": 491970 - }, - { - "epoch": 0.86, - "learning_rate": 7.102299479975027e-06, - "loss": 2.3268, - "step": 491980 - }, - { - "epoch": 0.86, - "learning_rate": 7.101427540048201e-06, - "loss": 2.2068, - "step": 491990 - }, - { - "epoch": 0.86, - "learning_rate": 7.100555600121374e-06, - "loss": 2.2462, - "step": 492000 - }, - { - "epoch": 0.86, - "learning_rate": 7.099683660194548e-06, - "loss": 2.2604, - "step": 492010 - }, - { - "epoch": 0.86, - "learning_rate": 7.09881172026772e-06, - "loss": 2.3068, - "step": 492020 - }, - { - "epoch": 0.86, - "learning_rate": 7.097939780340894e-06, - "loss": 2.2627, - "step": 492030 - }, - { - "epoch": 0.86, - "learning_rate": 7.097067840414067e-06, - "loss": 2.3703, - "step": 492040 - }, - { - "epoch": 0.86, - "learning_rate": 7.09619590048724e-06, - "loss": 2.2649, - "step": 492050 - }, - { - "epoch": 0.86, - "learning_rate": 7.095323960560414e-06, - "loss": 2.267, - "step": 492060 - }, - { - "epoch": 0.86, - "learning_rate": 7.094452020633586e-06, - "loss": 2.2518, - "step": 492070 - }, - { - "epoch": 0.86, - "learning_rate": 7.093580080706761e-06, - "loss": 2.1402, - "step": 492080 - }, - { - "epoch": 0.86, - "learning_rate": 7.092708140779933e-06, - "loss": 2.2791, - "step": 492090 - }, - { - "epoch": 0.86, - "learning_rate": 7.091836200853107e-06, - "loss": 2.3716, - "step": 492100 - }, - { - "epoch": 0.86, - "learning_rate": 7.090964260926279e-06, - "loss": 2.2451, - "step": 492110 - }, - { - "epoch": 0.86, - "learning_rate": 7.090092320999453e-06, - "loss": 2.3976, - "step": 492120 - }, - { - "epoch": 0.86, - "learning_rate": 7.089220381072625e-06, - "loss": 2.415, - "step": 492130 - }, - { - "epoch": 0.86, - "learning_rate": 7.088348441145799e-06, - "loss": 2.241, - "step": 492140 - }, - { - "epoch": 0.86, - "learning_rate": 7.087476501218972e-06, - "loss": 2.1811, - "step": 492150 - }, - { - "epoch": 0.86, - "learning_rate": 7.086604561292146e-06, - "loss": 2.3021, - "step": 492160 - }, - { - "epoch": 0.86, - "learning_rate": 7.08573262136532e-06, - "loss": 2.1775, - "step": 492170 - }, - { - "epoch": 0.86, - "learning_rate": 7.084860681438492e-06, - "loss": 2.2876, - "step": 492180 - }, - { - "epoch": 0.86, - "learning_rate": 7.0839887415116655e-06, - "loss": 2.2662, - "step": 492190 - }, - { - "epoch": 0.86, - "learning_rate": 7.083116801584838e-06, - "loss": 2.2319, - "step": 492200 - }, - { - "epoch": 0.86, - "learning_rate": 7.082244861658012e-06, - "loss": 2.3639, - "step": 492210 - }, - { - "epoch": 0.86, - "learning_rate": 7.081372921731184e-06, - "loss": 2.2274, - "step": 492220 - }, - { - "epoch": 0.86, - "learning_rate": 7.080500981804358e-06, - "loss": 2.2304, - "step": 492230 - }, - { - "epoch": 0.86, - "learning_rate": 7.079629041877531e-06, - "loss": 2.3087, - "step": 492240 - }, - { - "epoch": 0.86, - "learning_rate": 7.078757101950705e-06, - "loss": 2.2185, - "step": 492250 - }, - { - "epoch": 0.86, - "learning_rate": 7.077885162023877e-06, - "loss": 2.3446, - "step": 492260 - }, - { - "epoch": 0.86, - "learning_rate": 7.0770132220970506e-06, - "loss": 2.29, - "step": 492270 - }, - { - "epoch": 0.86, - "learning_rate": 7.0761412821702235e-06, - "loss": 2.1773, - "step": 492280 - }, - { - "epoch": 0.86, - "learning_rate": 7.075269342243397e-06, - "loss": 2.2835, - "step": 492290 - }, - { - "epoch": 0.86, - "learning_rate": 7.074397402316571e-06, - "loss": 2.2067, - "step": 492300 - }, - { - "epoch": 0.86, - "learning_rate": 7.073525462389743e-06, - "loss": 2.1986, - "step": 492310 - }, - { - "epoch": 0.86, - "learning_rate": 7.072653522462917e-06, - "loss": 2.166, - "step": 492320 - }, - { - "epoch": 0.86, - "learning_rate": 7.07178158253609e-06, - "loss": 2.3822, - "step": 492330 - }, - { - "epoch": 0.86, - "learning_rate": 7.0709096426092636e-06, - "loss": 2.3889, - "step": 492340 - }, - { - "epoch": 0.86, - "learning_rate": 7.070037702682436e-06, - "loss": 2.2556, - "step": 492350 - }, - { - "epoch": 0.86, - "learning_rate": 7.06916576275561e-06, - "loss": 2.2898, - "step": 492360 - }, - { - "epoch": 0.86, - "learning_rate": 7.068293822828782e-06, - "loss": 2.3172, - "step": 492370 - }, - { - "epoch": 0.86, - "learning_rate": 7.067421882901956e-06, - "loss": 2.3715, - "step": 492380 - }, - { - "epoch": 0.86, - "learning_rate": 7.066549942975129e-06, - "loss": 2.252, - "step": 492390 - }, - { - "epoch": 0.86, - "learning_rate": 7.065678003048303e-06, - "loss": 2.4679, - "step": 492400 - }, - { - "epoch": 0.86, - "learning_rate": 7.064806063121475e-06, - "loss": 2.268, - "step": 492410 - }, - { - "epoch": 0.86, - "learning_rate": 7.063934123194649e-06, - "loss": 2.2387, - "step": 492420 - }, - { - "epoch": 0.86, - "learning_rate": 7.063062183267822e-06, - "loss": 2.3308, - "step": 492430 - }, - { - "epoch": 0.86, - "learning_rate": 7.062190243340995e-06, - "loss": 2.1983, - "step": 492440 - }, - { - "epoch": 0.86, - "learning_rate": 7.061318303414169e-06, - "loss": 2.2995, - "step": 492450 - }, - { - "epoch": 0.86, - "learning_rate": 7.060446363487341e-06, - "loss": 2.2759, - "step": 492460 - }, - { - "epoch": 0.86, - "learning_rate": 7.059574423560515e-06, - "loss": 2.2394, - "step": 492470 - }, - { - "epoch": 0.86, - "learning_rate": 7.058702483633688e-06, - "loss": 2.3107, - "step": 492480 - }, - { - "epoch": 0.86, - "learning_rate": 7.057830543706862e-06, - "loss": 2.2147, - "step": 492490 - }, - { - "epoch": 0.86, - "learning_rate": 7.056958603780034e-06, - "loss": 2.1598, - "step": 492500 - }, - { - "epoch": 0.86, - "learning_rate": 7.0560866638532075e-06, - "loss": 2.2757, - "step": 492510 - }, - { - "epoch": 0.86, - "learning_rate": 7.05521472392638e-06, - "loss": 2.2957, - "step": 492520 - }, - { - "epoch": 0.86, - "learning_rate": 7.054342783999554e-06, - "loss": 2.2083, - "step": 492530 - }, - { - "epoch": 0.86, - "learning_rate": 7.053470844072726e-06, - "loss": 2.3185, - "step": 492540 - }, - { - "epoch": 0.86, - "learning_rate": 7.0525989041459e-06, - "loss": 2.4051, - "step": 492550 - }, - { - "epoch": 0.86, - "learning_rate": 7.051726964219074e-06, - "loss": 2.2514, - "step": 492560 - }, - { - "epoch": 0.86, - "learning_rate": 7.050855024292247e-06, - "loss": 2.2199, - "step": 492570 - }, - { - "epoch": 0.86, - "learning_rate": 7.0499830843654205e-06, - "loss": 2.2839, - "step": 492580 - }, - { - "epoch": 0.86, - "learning_rate": 7.0491111444385926e-06, - "loss": 2.2525, - "step": 492590 - }, - { - "epoch": 0.86, - "learning_rate": 7.048239204511767e-06, - "loss": 2.3305, - "step": 492600 - }, - { - "epoch": 0.86, - "learning_rate": 7.047367264584939e-06, - "loss": 2.3163, - "step": 492610 - }, - { - "epoch": 0.86, - "learning_rate": 7.046495324658113e-06, - "loss": 2.3509, - "step": 492620 - }, - { - "epoch": 0.86, - "learning_rate": 7.045623384731285e-06, - "loss": 2.1959, - "step": 492630 - }, - { - "epoch": 0.86, - "learning_rate": 7.04475144480446e-06, - "loss": 2.2636, - "step": 492640 - }, - { - "epoch": 0.86, - "learning_rate": 7.043879504877632e-06, - "loss": 2.3846, - "step": 492650 - }, - { - "epoch": 0.86, - "learning_rate": 7.0430075649508056e-06, - "loss": 2.2863, - "step": 492660 - }, - { - "epoch": 0.86, - "learning_rate": 7.0421356250239785e-06, - "loss": 2.2983, - "step": 492670 - }, - { - "epoch": 0.86, - "learning_rate": 7.041263685097152e-06, - "loss": 2.3423, - "step": 492680 - }, - { - "epoch": 0.86, - "learning_rate": 7.040391745170324e-06, - "loss": 2.1202, - "step": 492690 - }, - { - "epoch": 0.86, - "learning_rate": 7.039519805243498e-06, - "loss": 2.1706, - "step": 492700 - }, - { - "epoch": 0.86, - "learning_rate": 7.038647865316672e-06, - "loss": 2.2813, - "step": 492710 - }, - { - "epoch": 0.86, - "learning_rate": 7.037775925389845e-06, - "loss": 2.2591, - "step": 492720 - }, - { - "epoch": 0.86, - "learning_rate": 7.0369039854630186e-06, - "loss": 2.2748, - "step": 492730 - }, - { - "epoch": 0.86, - "learning_rate": 7.036032045536191e-06, - "loss": 2.3331, - "step": 492740 - }, - { - "epoch": 0.86, - "learning_rate": 7.035160105609364e-06, - "loss": 2.1277, - "step": 492750 - }, - { - "epoch": 0.86, - "learning_rate": 7.034288165682537e-06, - "loss": 2.2513, - "step": 492760 - }, - { - "epoch": 0.86, - "learning_rate": 7.033416225755711e-06, - "loss": 2.2047, - "step": 492770 - }, - { - "epoch": 0.86, - "learning_rate": 7.032544285828883e-06, - "loss": 2.248, - "step": 492780 - }, - { - "epoch": 0.86, - "learning_rate": 7.031672345902057e-06, - "loss": 2.3164, - "step": 492790 - }, - { - "epoch": 0.86, - "learning_rate": 7.03080040597523e-06, - "loss": 2.2632, - "step": 492800 - }, - { - "epoch": 0.86, - "learning_rate": 7.029928466048404e-06, - "loss": 2.2293, - "step": 492810 - }, - { - "epoch": 0.86, - "learning_rate": 7.029056526121576e-06, - "loss": 2.2279, - "step": 492820 - }, - { - "epoch": 0.86, - "learning_rate": 7.0281845861947495e-06, - "loss": 2.3302, - "step": 492830 - }, - { - "epoch": 0.86, - "learning_rate": 7.027312646267923e-06, - "loss": 2.3197, - "step": 492840 - }, - { - "epoch": 0.86, - "learning_rate": 7.026440706341096e-06, - "loss": 2.229, - "step": 492850 - }, - { - "epoch": 0.86, - "learning_rate": 7.02556876641427e-06, - "loss": 2.2661, - "step": 492860 - }, - { - "epoch": 0.86, - "learning_rate": 7.024696826487442e-06, - "loss": 2.2234, - "step": 492870 - }, - { - "epoch": 0.86, - "learning_rate": 7.023824886560617e-06, - "loss": 2.2048, - "step": 492880 - }, - { - "epoch": 0.86, - "learning_rate": 7.022952946633789e-06, - "loss": 2.3769, - "step": 492890 - }, - { - "epoch": 0.86, - "learning_rate": 7.0220810067069625e-06, - "loss": 2.2381, - "step": 492900 - }, - { - "epoch": 0.86, - "learning_rate": 7.021209066780135e-06, - "loss": 2.2385, - "step": 492910 - }, - { - "epoch": 0.86, - "learning_rate": 7.020337126853309e-06, - "loss": 2.275, - "step": 492920 - }, - { - "epoch": 0.86, - "learning_rate": 7.019465186926481e-06, - "loss": 2.2692, - "step": 492930 - }, - { - "epoch": 0.86, - "learning_rate": 7.018593246999655e-06, - "loss": 2.2923, - "step": 492940 - }, - { - "epoch": 0.86, - "learning_rate": 7.017721307072828e-06, - "loss": 2.3301, - "step": 492950 - }, - { - "epoch": 0.86, - "learning_rate": 7.016849367146002e-06, - "loss": 2.2932, - "step": 492960 - }, - { - "epoch": 0.86, - "learning_rate": 7.0159774272191755e-06, - "loss": 2.1555, - "step": 492970 - }, - { - "epoch": 0.86, - "learning_rate": 7.0151054872923476e-06, - "loss": 2.247, - "step": 492980 - }, - { - "epoch": 0.86, - "learning_rate": 7.014233547365521e-06, - "loss": 2.3397, - "step": 492990 - }, - { - "epoch": 0.86, - "learning_rate": 7.013361607438694e-06, - "loss": 2.3298, - "step": 493000 - }, - { - "epoch": 0.86, - "learning_rate": 7.012489667511868e-06, - "loss": 2.1598, - "step": 493010 - }, - { - "epoch": 0.86, - "learning_rate": 7.01161772758504e-06, - "loss": 2.1671, - "step": 493020 - }, - { - "epoch": 0.86, - "learning_rate": 7.010745787658214e-06, - "loss": 2.3906, - "step": 493030 - }, - { - "epoch": 0.86, - "learning_rate": 7.009873847731387e-06, - "loss": 2.2771, - "step": 493040 - }, - { - "epoch": 0.86, - "learning_rate": 7.0090019078045606e-06, - "loss": 2.4038, - "step": 493050 - }, - { - "epoch": 0.86, - "learning_rate": 7.008129967877733e-06, - "loss": 2.3138, - "step": 493060 - }, - { - "epoch": 0.86, - "learning_rate": 7.007258027950906e-06, - "loss": 2.2129, - "step": 493070 - }, - { - "epoch": 0.86, - "learning_rate": 7.006386088024079e-06, - "loss": 2.3145, - "step": 493080 - }, - { - "epoch": 0.86, - "learning_rate": 7.005514148097253e-06, - "loss": 2.3518, - "step": 493090 - }, - { - "epoch": 0.86, - "learning_rate": 7.004642208170427e-06, - "loss": 2.2899, - "step": 493100 - }, - { - "epoch": 0.86, - "learning_rate": 7.003770268243599e-06, - "loss": 2.2048, - "step": 493110 - }, - { - "epoch": 0.86, - "learning_rate": 7.0028983283167736e-06, - "loss": 2.2867, - "step": 493120 - }, - { - "epoch": 0.86, - "learning_rate": 7.002026388389946e-06, - "loss": 2.2658, - "step": 493130 - }, - { - "epoch": 0.86, - "learning_rate": 7.001154448463119e-06, - "loss": 2.2669, - "step": 493140 - }, - { - "epoch": 0.86, - "learning_rate": 7.000282508536292e-06, - "loss": 2.2707, - "step": 493150 - }, - { - "epoch": 0.86, - "learning_rate": 6.999410568609466e-06, - "loss": 2.3003, - "step": 493160 - }, - { - "epoch": 0.86, - "learning_rate": 6.998538628682638e-06, - "loss": 2.246, - "step": 493170 - }, - { - "epoch": 0.86, - "learning_rate": 6.997666688755812e-06, - "loss": 2.1995, - "step": 493180 - }, - { - "epoch": 0.86, - "learning_rate": 6.996794748828985e-06, - "loss": 2.3261, - "step": 493190 - }, - { - "epoch": 0.86, - "learning_rate": 6.995922808902159e-06, - "loss": 2.2565, - "step": 493200 - }, - { - "epoch": 0.86, - "learning_rate": 6.995050868975331e-06, - "loss": 2.2452, - "step": 493210 - }, - { - "epoch": 0.86, - "learning_rate": 6.9941789290485045e-06, - "loss": 2.2415, - "step": 493220 - }, - { - "epoch": 0.86, - "learning_rate": 6.993306989121678e-06, - "loss": 2.232, - "step": 493230 - }, - { - "epoch": 0.86, - "learning_rate": 6.992435049194851e-06, - "loss": 2.2527, - "step": 493240 - }, - { - "epoch": 0.86, - "learning_rate": 6.991563109268025e-06, - "loss": 2.2259, - "step": 493250 - }, - { - "epoch": 0.86, - "learning_rate": 6.990691169341197e-06, - "loss": 2.2903, - "step": 493260 - }, - { - "epoch": 0.86, - "learning_rate": 6.989819229414371e-06, - "loss": 2.2564, - "step": 493270 - }, - { - "epoch": 0.86, - "learning_rate": 6.988947289487544e-06, - "loss": 2.3334, - "step": 493280 - }, - { - "epoch": 0.86, - "learning_rate": 6.9880753495607175e-06, - "loss": 2.249, - "step": 493290 - }, - { - "epoch": 0.86, - "learning_rate": 6.9872034096338896e-06, - "loss": 2.2013, - "step": 493300 - }, - { - "epoch": 0.86, - "learning_rate": 6.986331469707063e-06, - "loss": 2.3594, - "step": 493310 - }, - { - "epoch": 0.86, - "learning_rate": 6.985459529780236e-06, - "loss": 2.1805, - "step": 493320 - }, - { - "epoch": 0.86, - "learning_rate": 6.98458758985341e-06, - "loss": 2.2813, - "step": 493330 - }, - { - "epoch": 0.86, - "learning_rate": 6.983715649926582e-06, - "loss": 2.3558, - "step": 493340 - }, - { - "epoch": 0.86, - "learning_rate": 6.982843709999756e-06, - "loss": 2.2561, - "step": 493350 - }, - { - "epoch": 0.86, - "learning_rate": 6.9819717700729305e-06, - "loss": 2.3435, - "step": 493360 - }, - { - "epoch": 0.86, - "learning_rate": 6.9810998301461026e-06, - "loss": 2.3056, - "step": 493370 - }, - { - "epoch": 0.86, - "learning_rate": 6.980227890219276e-06, - "loss": 2.3097, - "step": 493380 - }, - { - "epoch": 0.86, - "learning_rate": 6.979355950292448e-06, - "loss": 2.3446, - "step": 493390 - }, - { - "epoch": 0.86, - "learning_rate": 6.978484010365623e-06, - "loss": 2.2499, - "step": 493400 - }, - { - "epoch": 0.86, - "learning_rate": 6.977612070438795e-06, - "loss": 2.2601, - "step": 493410 - }, - { - "epoch": 0.86, - "learning_rate": 6.976740130511969e-06, - "loss": 2.3857, - "step": 493420 - }, - { - "epoch": 0.86, - "learning_rate": 6.975868190585142e-06, - "loss": 2.2299, - "step": 493430 - }, - { - "epoch": 0.86, - "learning_rate": 6.9749962506583156e-06, - "loss": 2.2769, - "step": 493440 - }, - { - "epoch": 0.86, - "learning_rate": 6.974124310731488e-06, - "loss": 2.26, - "step": 493450 - }, - { - "epoch": 0.86, - "learning_rate": 6.973252370804661e-06, - "loss": 2.2788, - "step": 493460 - }, - { - "epoch": 0.86, - "learning_rate": 6.972380430877834e-06, - "loss": 2.2937, - "step": 493470 - }, - { - "epoch": 0.86, - "learning_rate": 6.971508490951008e-06, - "loss": 2.3094, - "step": 493480 - }, - { - "epoch": 0.86, - "learning_rate": 6.97063655102418e-06, - "loss": 2.2693, - "step": 493490 - }, - { - "epoch": 0.86, - "learning_rate": 6.969764611097354e-06, - "loss": 2.2856, - "step": 493500 - }, - { - "epoch": 0.86, - "learning_rate": 6.968892671170528e-06, - "loss": 2.2143, - "step": 493510 - }, - { - "epoch": 0.86, - "learning_rate": 6.968020731243701e-06, - "loss": 2.3052, - "step": 493520 - }, - { - "epoch": 0.86, - "learning_rate": 6.967148791316874e-06, - "loss": 2.2432, - "step": 493530 - }, - { - "epoch": 0.86, - "learning_rate": 6.9662768513900465e-06, - "loss": 2.2899, - "step": 493540 - }, - { - "epoch": 0.86, - "learning_rate": 6.96540491146322e-06, - "loss": 2.303, - "step": 493550 - }, - { - "epoch": 0.86, - "learning_rate": 6.964532971536393e-06, - "loss": 2.2357, - "step": 493560 - }, - { - "epoch": 0.86, - "learning_rate": 6.963661031609567e-06, - "loss": 2.2526, - "step": 493570 - }, - { - "epoch": 0.86, - "learning_rate": 6.962789091682739e-06, - "loss": 2.1885, - "step": 493580 - }, - { - "epoch": 0.86, - "learning_rate": 6.961917151755913e-06, - "loss": 2.2284, - "step": 493590 - }, - { - "epoch": 0.86, - "learning_rate": 6.961045211829086e-06, - "loss": 2.2116, - "step": 493600 - }, - { - "epoch": 0.86, - "learning_rate": 6.9601732719022595e-06, - "loss": 2.316, - "step": 493610 - }, - { - "epoch": 0.86, - "learning_rate": 6.9593013319754316e-06, - "loss": 2.2843, - "step": 493620 - }, - { - "epoch": 0.86, - "learning_rate": 6.958429392048605e-06, - "loss": 2.2663, - "step": 493630 - }, - { - "epoch": 0.86, - "learning_rate": 6.95755745212178e-06, - "loss": 2.3515, - "step": 493640 - }, - { - "epoch": 0.86, - "learning_rate": 6.956685512194952e-06, - "loss": 2.2624, - "step": 493650 - }, - { - "epoch": 0.86, - "learning_rate": 6.955813572268126e-06, - "loss": 2.2965, - "step": 493660 - }, - { - "epoch": 0.86, - "learning_rate": 6.954941632341299e-06, - "loss": 2.2894, - "step": 493670 - }, - { - "epoch": 0.86, - "learning_rate": 6.9540696924144725e-06, - "loss": 2.2458, - "step": 493680 - }, - { - "epoch": 0.86, - "learning_rate": 6.9531977524876446e-06, - "loss": 2.2076, - "step": 493690 - }, - { - "epoch": 0.86, - "learning_rate": 6.952325812560818e-06, - "loss": 2.2601, - "step": 493700 - }, - { - "epoch": 0.86, - "learning_rate": 6.951453872633991e-06, - "loss": 2.2887, - "step": 493710 - }, - { - "epoch": 0.86, - "learning_rate": 6.950581932707165e-06, - "loss": 2.2356, - "step": 493720 - }, - { - "epoch": 0.86, - "learning_rate": 6.949709992780337e-06, - "loss": 2.2468, - "step": 493730 - }, - { - "epoch": 0.86, - "learning_rate": 6.948838052853511e-06, - "loss": 2.2699, - "step": 493740 - }, - { - "epoch": 0.86, - "learning_rate": 6.947966112926684e-06, - "loss": 2.1775, - "step": 493750 - }, - { - "epoch": 0.86, - "learning_rate": 6.9470941729998576e-06, - "loss": 2.3336, - "step": 493760 - }, - { - "epoch": 0.86, - "learning_rate": 6.946222233073031e-06, - "loss": 2.3073, - "step": 493770 - }, - { - "epoch": 0.86, - "learning_rate": 6.945350293146203e-06, - "loss": 2.4057, - "step": 493780 - }, - { - "epoch": 0.86, - "learning_rate": 6.944478353219377e-06, - "loss": 2.1868, - "step": 493790 - }, - { - "epoch": 0.86, - "learning_rate": 6.94360641329255e-06, - "loss": 2.3896, - "step": 493800 - }, - { - "epoch": 0.86, - "learning_rate": 6.942734473365724e-06, - "loss": 2.3032, - "step": 493810 - }, - { - "epoch": 0.86, - "learning_rate": 6.941862533438896e-06, - "loss": 2.2338, - "step": 493820 - }, - { - "epoch": 0.86, - "learning_rate": 6.94099059351207e-06, - "loss": 2.2604, - "step": 493830 - }, - { - "epoch": 0.86, - "learning_rate": 6.940118653585243e-06, - "loss": 2.2255, - "step": 493840 - }, - { - "epoch": 0.86, - "learning_rate": 6.939246713658416e-06, - "loss": 2.4237, - "step": 493850 - }, - { - "epoch": 0.86, - "learning_rate": 6.9383747737315885e-06, - "loss": 2.1819, - "step": 493860 - }, - { - "epoch": 0.86, - "learning_rate": 6.937502833804762e-06, - "loss": 2.175, - "step": 493870 - }, - { - "epoch": 0.86, - "learning_rate": 6.936630893877935e-06, - "loss": 2.2294, - "step": 493880 - }, - { - "epoch": 0.86, - "learning_rate": 6.935758953951109e-06, - "loss": 2.4538, - "step": 493890 - }, - { - "epoch": 0.86, - "learning_rate": 6.934887014024283e-06, - "loss": 2.1606, - "step": 493900 - }, - { - "epoch": 0.86, - "learning_rate": 6.934015074097455e-06, - "loss": 2.3045, - "step": 493910 - }, - { - "epoch": 0.86, - "learning_rate": 6.933143134170629e-06, - "loss": 2.2781, - "step": 493920 - }, - { - "epoch": 0.86, - "learning_rate": 6.9322711942438015e-06, - "loss": 2.2394, - "step": 493930 - }, - { - "epoch": 0.86, - "learning_rate": 6.931399254316975e-06, - "loss": 2.2605, - "step": 493940 - }, - { - "epoch": 0.86, - "learning_rate": 6.930527314390148e-06, - "loss": 2.2258, - "step": 493950 - }, - { - "epoch": 0.86, - "learning_rate": 6.929655374463322e-06, - "loss": 2.1637, - "step": 493960 - }, - { - "epoch": 0.86, - "learning_rate": 6.928783434536494e-06, - "loss": 2.2622, - "step": 493970 - }, - { - "epoch": 0.86, - "learning_rate": 6.927911494609668e-06, - "loss": 2.213, - "step": 493980 - }, - { - "epoch": 0.86, - "learning_rate": 6.927039554682841e-06, - "loss": 2.3772, - "step": 493990 - }, - { - "epoch": 0.86, - "learning_rate": 6.9261676147560145e-06, - "loss": 2.1914, - "step": 494000 - }, - { - "epoch": 0.86, - "learning_rate": 6.9252956748291866e-06, - "loss": 2.1667, - "step": 494010 - }, - { - "epoch": 0.86, - "learning_rate": 6.92442373490236e-06, - "loss": 2.257, - "step": 494020 - }, - { - "epoch": 0.86, - "learning_rate": 6.923551794975534e-06, - "loss": 2.2518, - "step": 494030 - }, - { - "epoch": 0.86, - "learning_rate": 6.922679855048707e-06, - "loss": 2.2805, - "step": 494040 - }, - { - "epoch": 0.86, - "learning_rate": 6.921807915121881e-06, - "loss": 2.1944, - "step": 494050 - }, - { - "epoch": 0.86, - "learning_rate": 6.920935975195053e-06, - "loss": 2.2594, - "step": 494060 - }, - { - "epoch": 0.86, - "learning_rate": 6.920064035268227e-06, - "loss": 2.1558, - "step": 494070 - }, - { - "epoch": 0.86, - "learning_rate": 6.9191920953414e-06, - "loss": 2.2425, - "step": 494080 - }, - { - "epoch": 0.86, - "learning_rate": 6.918320155414573e-06, - "loss": 2.3517, - "step": 494090 - }, - { - "epoch": 0.86, - "learning_rate": 6.917448215487745e-06, - "loss": 2.3403, - "step": 494100 - }, - { - "epoch": 0.86, - "learning_rate": 6.916576275560919e-06, - "loss": 2.2275, - "step": 494110 - }, - { - "epoch": 0.86, - "learning_rate": 6.915704335634092e-06, - "loss": 2.2435, - "step": 494120 - }, - { - "epoch": 0.86, - "learning_rate": 6.914832395707266e-06, - "loss": 2.2853, - "step": 494130 - }, - { - "epoch": 0.86, - "learning_rate": 6.913960455780438e-06, - "loss": 2.3753, - "step": 494140 - }, - { - "epoch": 0.86, - "learning_rate": 6.913088515853612e-06, - "loss": 2.335, - "step": 494150 - }, - { - "epoch": 0.86, - "learning_rate": 6.912216575926786e-06, - "loss": 2.3265, - "step": 494160 - }, - { - "epoch": 0.86, - "learning_rate": 6.9113446359999584e-06, - "loss": 2.2078, - "step": 494170 - }, - { - "epoch": 0.86, - "learning_rate": 6.910472696073132e-06, - "loss": 2.3712, - "step": 494180 - }, - { - "epoch": 0.86, - "learning_rate": 6.909600756146305e-06, - "loss": 2.246, - "step": 494190 - }, - { - "epoch": 0.86, - "learning_rate": 6.908728816219479e-06, - "loss": 2.2593, - "step": 494200 - }, - { - "epoch": 0.86, - "learning_rate": 6.907856876292651e-06, - "loss": 2.2813, - "step": 494210 - }, - { - "epoch": 0.86, - "learning_rate": 6.906984936365825e-06, - "loss": 2.2689, - "step": 494220 - }, - { - "epoch": 0.86, - "learning_rate": 6.906112996438998e-06, - "loss": 2.3262, - "step": 494230 - }, - { - "epoch": 0.86, - "learning_rate": 6.9052410565121714e-06, - "loss": 2.2975, - "step": 494240 - }, - { - "epoch": 0.86, - "learning_rate": 6.9043691165853435e-06, - "loss": 2.3202, - "step": 494250 - }, - { - "epoch": 0.86, - "learning_rate": 6.903497176658517e-06, - "loss": 2.2635, - "step": 494260 - }, - { - "epoch": 0.86, - "learning_rate": 6.90262523673169e-06, - "loss": 2.1557, - "step": 494270 - }, - { - "epoch": 0.86, - "learning_rate": 6.901753296804864e-06, - "loss": 2.1736, - "step": 494280 - }, - { - "epoch": 0.86, - "learning_rate": 6.900881356878038e-06, - "loss": 2.3028, - "step": 494290 - }, - { - "epoch": 0.86, - "learning_rate": 6.90000941695121e-06, - "loss": 2.2788, - "step": 494300 - }, - { - "epoch": 0.86, - "learning_rate": 6.899137477024384e-06, - "loss": 2.2355, - "step": 494310 - }, - { - "epoch": 0.86, - "learning_rate": 6.8982655370975565e-06, - "loss": 2.4365, - "step": 494320 - }, - { - "epoch": 0.86, - "learning_rate": 6.89739359717073e-06, - "loss": 2.2381, - "step": 494330 - }, - { - "epoch": 0.86, - "learning_rate": 6.896521657243902e-06, - "loss": 2.2849, - "step": 494340 - }, - { - "epoch": 0.86, - "learning_rate": 6.895649717317076e-06, - "loss": 2.1855, - "step": 494350 - }, - { - "epoch": 0.86, - "learning_rate": 6.894777777390249e-06, - "loss": 2.2542, - "step": 494360 - }, - { - "epoch": 0.86, - "learning_rate": 6.893905837463423e-06, - "loss": 2.3094, - "step": 494370 - }, - { - "epoch": 0.86, - "learning_rate": 6.893033897536595e-06, - "loss": 2.1885, - "step": 494380 - }, - { - "epoch": 0.86, - "learning_rate": 6.892161957609769e-06, - "loss": 2.2973, - "step": 494390 - }, - { - "epoch": 0.86, - "learning_rate": 6.891290017682942e-06, - "loss": 2.3519, - "step": 494400 - }, - { - "epoch": 0.86, - "learning_rate": 6.890418077756115e-06, - "loss": 2.2632, - "step": 494410 - }, - { - "epoch": 0.86, - "learning_rate": 6.8895461378292874e-06, - "loss": 2.132, - "step": 494420 - }, - { - "epoch": 0.86, - "learning_rate": 6.888674197902461e-06, - "loss": 2.2477, - "step": 494430 - }, - { - "epoch": 0.86, - "learning_rate": 6.887802257975636e-06, - "loss": 2.3418, - "step": 494440 - }, - { - "epoch": 0.86, - "learning_rate": 6.886930318048808e-06, - "loss": 2.3013, - "step": 494450 - }, - { - "epoch": 0.86, - "learning_rate": 6.886058378121982e-06, - "loss": 2.3442, - "step": 494460 - }, - { - "epoch": 0.86, - "learning_rate": 6.885186438195155e-06, - "loss": 2.2954, - "step": 494470 - }, - { - "epoch": 0.86, - "learning_rate": 6.884314498268328e-06, - "loss": 2.2547, - "step": 494480 - }, - { - "epoch": 0.86, - "learning_rate": 6.8834425583415004e-06, - "loss": 2.1425, - "step": 494490 - }, - { - "epoch": 0.86, - "learning_rate": 6.882570618414674e-06, - "loss": 2.369, - "step": 494500 - }, - { - "epoch": 0.86, - "learning_rate": 6.881698678487847e-06, - "loss": 2.2156, - "step": 494510 - }, - { - "epoch": 0.86, - "learning_rate": 6.880826738561021e-06, - "loss": 2.3663, - "step": 494520 - }, - { - "epoch": 0.86, - "learning_rate": 6.879954798634193e-06, - "loss": 2.2695, - "step": 494530 - }, - { - "epoch": 0.86, - "learning_rate": 6.879082858707367e-06, - "loss": 2.2013, - "step": 494540 - }, - { - "epoch": 0.86, - "learning_rate": 6.87821091878054e-06, - "loss": 2.2853, - "step": 494550 - }, - { - "epoch": 0.86, - "learning_rate": 6.8773389788537134e-06, - "loss": 2.174, - "step": 494560 - }, - { - "epoch": 0.86, - "learning_rate": 6.876467038926887e-06, - "loss": 2.2519, - "step": 494570 - }, - { - "epoch": 0.86, - "learning_rate": 6.875595099000059e-06, - "loss": 2.4297, - "step": 494580 - }, - { - "epoch": 0.86, - "learning_rate": 6.874723159073233e-06, - "loss": 2.2577, - "step": 494590 - }, - { - "epoch": 0.86, - "learning_rate": 6.873851219146406e-06, - "loss": 2.2446, - "step": 494600 - }, - { - "epoch": 0.86, - "learning_rate": 6.87297927921958e-06, - "loss": 2.2195, - "step": 494610 - }, - { - "epoch": 0.86, - "learning_rate": 6.872107339292752e-06, - "loss": 2.3473, - "step": 494620 - }, - { - "epoch": 0.86, - "learning_rate": 6.871235399365926e-06, - "loss": 2.1609, - "step": 494630 - }, - { - "epoch": 0.86, - "learning_rate": 6.8703634594390985e-06, - "loss": 2.1663, - "step": 494640 - }, - { - "epoch": 0.86, - "learning_rate": 6.869491519512272e-06, - "loss": 2.2799, - "step": 494650 - }, - { - "epoch": 0.86, - "learning_rate": 6.868619579585444e-06, - "loss": 2.1754, - "step": 494660 - }, - { - "epoch": 0.86, - "learning_rate": 6.867747639658618e-06, - "loss": 2.3741, - "step": 494670 - }, - { - "epoch": 0.86, - "learning_rate": 6.866875699731791e-06, - "loss": 2.2911, - "step": 494680 - }, - { - "epoch": 0.86, - "learning_rate": 6.866003759804965e-06, - "loss": 2.2381, - "step": 494690 - }, - { - "epoch": 0.86, - "learning_rate": 6.865131819878139e-06, - "loss": 2.249, - "step": 494700 - }, - { - "epoch": 0.86, - "learning_rate": 6.8642598799513115e-06, - "loss": 2.2972, - "step": 494710 - }, - { - "epoch": 0.86, - "learning_rate": 6.863387940024485e-06, - "loss": 2.3474, - "step": 494720 - }, - { - "epoch": 0.86, - "learning_rate": 6.862516000097657e-06, - "loss": 2.2827, - "step": 494730 - }, - { - "epoch": 0.86, - "learning_rate": 6.861644060170831e-06, - "loss": 2.2396, - "step": 494740 - }, - { - "epoch": 0.86, - "learning_rate": 6.860772120244004e-06, - "loss": 2.2831, - "step": 494750 - }, - { - "epoch": 0.86, - "learning_rate": 6.859900180317178e-06, - "loss": 2.2551, - "step": 494760 - }, - { - "epoch": 0.86, - "learning_rate": 6.85902824039035e-06, - "loss": 2.3341, - "step": 494770 - }, - { - "epoch": 0.86, - "learning_rate": 6.858156300463524e-06, - "loss": 2.18, - "step": 494780 - }, - { - "epoch": 0.86, - "learning_rate": 6.857284360536697e-06, - "loss": 2.3317, - "step": 494790 - }, - { - "epoch": 0.86, - "learning_rate": 6.85641242060987e-06, - "loss": 2.3285, - "step": 494800 - }, - { - "epoch": 0.86, - "learning_rate": 6.8555404806830424e-06, - "loss": 2.1835, - "step": 494810 - }, - { - "epoch": 0.86, - "learning_rate": 6.854668540756216e-06, - "loss": 2.241, - "step": 494820 - }, - { - "epoch": 0.86, - "learning_rate": 6.85379660082939e-06, - "loss": 2.2664, - "step": 494830 - }, - { - "epoch": 0.86, - "learning_rate": 6.852924660902563e-06, - "loss": 2.3555, - "step": 494840 - }, - { - "epoch": 0.86, - "learning_rate": 6.852052720975737e-06, - "loss": 2.2827, - "step": 494850 - }, - { - "epoch": 0.86, - "learning_rate": 6.851180781048909e-06, - "loss": 2.2121, - "step": 494860 - }, - { - "epoch": 0.86, - "learning_rate": 6.8503088411220825e-06, - "loss": 2.3567, - "step": 494870 - }, - { - "epoch": 0.86, - "learning_rate": 6.8494369011952554e-06, - "loss": 2.3041, - "step": 494880 - }, - { - "epoch": 0.86, - "learning_rate": 6.848564961268429e-06, - "loss": 2.1218, - "step": 494890 - }, - { - "epoch": 0.86, - "learning_rate": 6.847693021341601e-06, - "loss": 2.3986, - "step": 494900 - }, - { - "epoch": 0.86, - "learning_rate": 6.846821081414775e-06, - "loss": 2.3006, - "step": 494910 - }, - { - "epoch": 0.86, - "learning_rate": 6.845949141487948e-06, - "loss": 2.3612, - "step": 494920 - }, - { - "epoch": 0.86, - "learning_rate": 6.845077201561122e-06, - "loss": 2.3564, - "step": 494930 - }, - { - "epoch": 0.86, - "learning_rate": 6.844205261634294e-06, - "loss": 2.2648, - "step": 494940 - }, - { - "epoch": 0.86, - "learning_rate": 6.843333321707468e-06, - "loss": 2.2063, - "step": 494950 - }, - { - "epoch": 0.86, - "learning_rate": 6.842461381780642e-06, - "loss": 2.3429, - "step": 494960 - }, - { - "epoch": 0.86, - "learning_rate": 6.841589441853814e-06, - "loss": 2.1973, - "step": 494970 - }, - { - "epoch": 0.86, - "learning_rate": 6.840717501926988e-06, - "loss": 2.2993, - "step": 494980 - }, - { - "epoch": 0.86, - "learning_rate": 6.839845562000161e-06, - "loss": 2.2689, - "step": 494990 - }, - { - "epoch": 0.86, - "learning_rate": 6.838973622073335e-06, - "loss": 2.1457, - "step": 495000 - }, - { - "epoch": 0.86, - "learning_rate": 6.838101682146507e-06, - "loss": 2.2821, - "step": 495010 - }, - { - "epoch": 0.86, - "learning_rate": 6.837229742219681e-06, - "loss": 2.3167, - "step": 495020 - }, - { - "epoch": 0.86, - "learning_rate": 6.8363578022928535e-06, - "loss": 2.3984, - "step": 495030 - }, - { - "epoch": 0.86, - "learning_rate": 6.835485862366027e-06, - "loss": 2.243, - "step": 495040 - }, - { - "epoch": 0.86, - "learning_rate": 6.834613922439199e-06, - "loss": 2.3946, - "step": 495050 - }, - { - "epoch": 0.86, - "learning_rate": 6.833741982512373e-06, - "loss": 2.2791, - "step": 495060 - }, - { - "epoch": 0.86, - "learning_rate": 6.832870042585546e-06, - "loss": 2.3226, - "step": 495070 - }, - { - "epoch": 0.86, - "learning_rate": 6.83199810265872e-06, - "loss": 2.2489, - "step": 495080 - }, - { - "epoch": 0.86, - "learning_rate": 6.831126162731894e-06, - "loss": 2.3572, - "step": 495090 - }, - { - "epoch": 0.86, - "learning_rate": 6.830254222805066e-06, - "loss": 2.2141, - "step": 495100 - }, - { - "epoch": 0.86, - "learning_rate": 6.8293822828782394e-06, - "loss": 2.2381, - "step": 495110 - }, - { - "epoch": 0.86, - "learning_rate": 6.828510342951412e-06, - "loss": 2.2641, - "step": 495120 - }, - { - "epoch": 0.86, - "learning_rate": 6.827638403024586e-06, - "loss": 2.3152, - "step": 495130 - }, - { - "epoch": 0.86, - "learning_rate": 6.826766463097758e-06, - "loss": 2.2922, - "step": 495140 - }, - { - "epoch": 0.86, - "learning_rate": 6.825894523170932e-06, - "loss": 2.2134, - "step": 495150 - }, - { - "epoch": 0.86, - "learning_rate": 6.825022583244105e-06, - "loss": 2.2382, - "step": 495160 - }, - { - "epoch": 0.86, - "learning_rate": 6.824150643317279e-06, - "loss": 2.294, - "step": 495170 - }, - { - "epoch": 0.86, - "learning_rate": 6.823278703390451e-06, - "loss": 2.257, - "step": 495180 - }, - { - "epoch": 0.86, - "learning_rate": 6.8224067634636245e-06, - "loss": 2.2597, - "step": 495190 - }, - { - "epoch": 0.86, - "learning_rate": 6.8215348235367974e-06, - "loss": 2.3223, - "step": 495200 - }, - { - "epoch": 0.86, - "learning_rate": 6.820662883609971e-06, - "loss": 2.3986, - "step": 495210 - }, - { - "epoch": 0.86, - "learning_rate": 6.819790943683143e-06, - "loss": 2.1784, - "step": 495220 - }, - { - "epoch": 0.86, - "learning_rate": 6.818919003756318e-06, - "loss": 2.3564, - "step": 495230 - }, - { - "epoch": 0.86, - "learning_rate": 6.818047063829492e-06, - "loss": 2.3773, - "step": 495240 - }, - { - "epoch": 0.86, - "learning_rate": 6.817175123902664e-06, - "loss": 2.1704, - "step": 495250 - }, - { - "epoch": 0.86, - "learning_rate": 6.8163031839758375e-06, - "loss": 2.3365, - "step": 495260 - }, - { - "epoch": 0.86, - "learning_rate": 6.8154312440490104e-06, - "loss": 2.2069, - "step": 495270 - }, - { - "epoch": 0.86, - "learning_rate": 6.814559304122184e-06, - "loss": 2.161, - "step": 495280 - }, - { - "epoch": 0.86, - "learning_rate": 6.813687364195356e-06, - "loss": 2.324, - "step": 495290 - }, - { - "epoch": 0.86, - "learning_rate": 6.81281542426853e-06, - "loss": 2.1686, - "step": 495300 - }, - { - "epoch": 0.86, - "learning_rate": 6.811943484341703e-06, - "loss": 2.3227, - "step": 495310 - }, - { - "epoch": 0.86, - "learning_rate": 6.811071544414877e-06, - "loss": 2.2339, - "step": 495320 - }, - { - "epoch": 0.86, - "learning_rate": 6.810199604488049e-06, - "loss": 2.272, - "step": 495330 - }, - { - "epoch": 0.86, - "learning_rate": 6.809327664561223e-06, - "loss": 2.2856, - "step": 495340 - }, - { - "epoch": 0.86, - "learning_rate": 6.8084557246343955e-06, - "loss": 2.224, - "step": 495350 - }, - { - "epoch": 0.86, - "learning_rate": 6.807583784707569e-06, - "loss": 2.2811, - "step": 495360 - }, - { - "epoch": 0.86, - "learning_rate": 6.806711844780743e-06, - "loss": 2.2378, - "step": 495370 - }, - { - "epoch": 0.86, - "learning_rate": 6.805839904853915e-06, - "loss": 2.2971, - "step": 495380 - }, - { - "epoch": 0.86, - "learning_rate": 6.804967964927089e-06, - "loss": 2.1687, - "step": 495390 - }, - { - "epoch": 0.86, - "learning_rate": 6.804096025000262e-06, - "loss": 2.3633, - "step": 495400 - }, - { - "epoch": 0.86, - "learning_rate": 6.803224085073436e-06, - "loss": 2.3449, - "step": 495410 - }, - { - "epoch": 0.86, - "learning_rate": 6.802352145146608e-06, - "loss": 2.0926, - "step": 495420 - }, - { - "epoch": 0.86, - "learning_rate": 6.8014802052197814e-06, - "loss": 2.2262, - "step": 495430 - }, - { - "epoch": 0.86, - "learning_rate": 6.800608265292954e-06, - "loss": 2.2498, - "step": 495440 - }, - { - "epoch": 0.86, - "learning_rate": 6.799736325366128e-06, - "loss": 2.2151, - "step": 495450 - }, - { - "epoch": 0.86, - "learning_rate": 6.7988643854393e-06, - "loss": 2.2798, - "step": 495460 - }, - { - "epoch": 0.86, - "learning_rate": 6.797992445512474e-06, - "loss": 2.2448, - "step": 495470 - }, - { - "epoch": 0.86, - "learning_rate": 6.797120505585647e-06, - "loss": 2.2446, - "step": 495480 - }, - { - "epoch": 0.86, - "learning_rate": 6.796248565658821e-06, - "loss": 2.3456, - "step": 495490 - }, - { - "epoch": 0.86, - "learning_rate": 6.7953766257319944e-06, - "loss": 2.2843, - "step": 495500 - }, - { - "epoch": 0.86, - "learning_rate": 6.794504685805167e-06, - "loss": 2.2169, - "step": 495510 - }, - { - "epoch": 0.86, - "learning_rate": 6.793632745878341e-06, - "loss": 2.2161, - "step": 495520 - }, - { - "epoch": 0.86, - "learning_rate": 6.792760805951513e-06, - "loss": 2.2914, - "step": 495530 - }, - { - "epoch": 0.86, - "learning_rate": 6.791888866024687e-06, - "loss": 2.2404, - "step": 495540 - }, - { - "epoch": 0.86, - "learning_rate": 6.79101692609786e-06, - "loss": 2.272, - "step": 495550 - }, - { - "epoch": 0.86, - "learning_rate": 6.790144986171034e-06, - "loss": 2.2701, - "step": 495560 - }, - { - "epoch": 0.86, - "learning_rate": 6.789273046244206e-06, - "loss": 2.2607, - "step": 495570 - }, - { - "epoch": 0.86, - "learning_rate": 6.7884011063173795e-06, - "loss": 2.1095, - "step": 495580 - }, - { - "epoch": 0.86, - "learning_rate": 6.7875291663905524e-06, - "loss": 2.2624, - "step": 495590 - }, - { - "epoch": 0.86, - "learning_rate": 6.786657226463726e-06, - "loss": 2.2299, - "step": 495600 - }, - { - "epoch": 0.86, - "learning_rate": 6.785785286536898e-06, - "loss": 2.1394, - "step": 495610 - }, - { - "epoch": 0.86, - "learning_rate": 6.784913346610072e-06, - "loss": 2.2946, - "step": 495620 - }, - { - "epoch": 0.86, - "learning_rate": 6.784041406683246e-06, - "loss": 2.2819, - "step": 495630 - }, - { - "epoch": 0.86, - "learning_rate": 6.783169466756419e-06, - "loss": 2.2586, - "step": 495640 - }, - { - "epoch": 0.86, - "learning_rate": 6.7822975268295925e-06, - "loss": 2.1604, - "step": 495650 - }, - { - "epoch": 0.86, - "learning_rate": 6.781425586902765e-06, - "loss": 2.2257, - "step": 495660 - }, - { - "epoch": 0.86, - "learning_rate": 6.780553646975938e-06, - "loss": 2.2917, - "step": 495670 - }, - { - "epoch": 0.86, - "learning_rate": 6.779681707049111e-06, - "loss": 2.2206, - "step": 495680 - }, - { - "epoch": 0.86, - "learning_rate": 6.778809767122285e-06, - "loss": 2.2187, - "step": 495690 - }, - { - "epoch": 0.86, - "learning_rate": 6.777937827195457e-06, - "loss": 2.1951, - "step": 495700 - }, - { - "epoch": 0.86, - "learning_rate": 6.777065887268631e-06, - "loss": 2.3185, - "step": 495710 - }, - { - "epoch": 0.86, - "learning_rate": 6.776193947341804e-06, - "loss": 2.3422, - "step": 495720 - }, - { - "epoch": 0.86, - "learning_rate": 6.775322007414978e-06, - "loss": 2.1997, - "step": 495730 - }, - { - "epoch": 0.86, - "learning_rate": 6.77445006748815e-06, - "loss": 2.193, - "step": 495740 - }, - { - "epoch": 0.86, - "learning_rate": 6.773578127561324e-06, - "loss": 2.2442, - "step": 495750 - }, - { - "epoch": 0.86, - "learning_rate": 6.772706187634498e-06, - "loss": 2.266, - "step": 495760 - }, - { - "epoch": 0.86, - "learning_rate": 6.77183424770767e-06, - "loss": 2.304, - "step": 495770 - }, - { - "epoch": 0.86, - "learning_rate": 6.770962307780844e-06, - "loss": 2.3616, - "step": 495780 - }, - { - "epoch": 0.86, - "learning_rate": 6.770090367854017e-06, - "loss": 2.3511, - "step": 495790 - }, - { - "epoch": 0.86, - "learning_rate": 6.769218427927191e-06, - "loss": 2.285, - "step": 495800 - }, - { - "epoch": 0.86, - "learning_rate": 6.768346488000363e-06, - "loss": 2.2403, - "step": 495810 - }, - { - "epoch": 0.86, - "learning_rate": 6.7674745480735364e-06, - "loss": 2.2594, - "step": 495820 - }, - { - "epoch": 0.86, - "learning_rate": 6.766602608146709e-06, - "loss": 2.129, - "step": 495830 - }, - { - "epoch": 0.86, - "learning_rate": 6.765730668219883e-06, - "loss": 2.1893, - "step": 495840 - }, - { - "epoch": 0.86, - "learning_rate": 6.764858728293055e-06, - "loss": 2.2369, - "step": 495850 - }, - { - "epoch": 0.86, - "learning_rate": 6.763986788366229e-06, - "loss": 2.3015, - "step": 495860 - }, - { - "epoch": 0.86, - "learning_rate": 6.763114848439402e-06, - "loss": 2.287, - "step": 495870 - }, - { - "epoch": 0.86, - "learning_rate": 6.762242908512576e-06, - "loss": 2.3251, - "step": 495880 - }, - { - "epoch": 0.86, - "learning_rate": 6.7613709685857494e-06, - "loss": 2.3067, - "step": 495890 - }, - { - "epoch": 0.86, - "learning_rate": 6.7604990286589215e-06, - "loss": 2.1939, - "step": 495900 - }, - { - "epoch": 0.86, - "learning_rate": 6.759627088732095e-06, - "loss": 2.11, - "step": 495910 - }, - { - "epoch": 0.86, - "learning_rate": 6.758755148805268e-06, - "loss": 2.2598, - "step": 495920 - }, - { - "epoch": 0.86, - "learning_rate": 6.757883208878442e-06, - "loss": 2.2402, - "step": 495930 - }, - { - "epoch": 0.86, - "learning_rate": 6.757011268951614e-06, - "loss": 2.3305, - "step": 495940 - }, - { - "epoch": 0.86, - "learning_rate": 6.756139329024788e-06, - "loss": 2.2203, - "step": 495950 - }, - { - "epoch": 0.86, - "learning_rate": 6.755267389097961e-06, - "loss": 2.2187, - "step": 495960 - }, - { - "epoch": 0.86, - "learning_rate": 6.7543954491711345e-06, - "loss": 2.2939, - "step": 495970 - }, - { - "epoch": 0.86, - "learning_rate": 6.753523509244307e-06, - "loss": 2.3299, - "step": 495980 - }, - { - "epoch": 0.86, - "learning_rate": 6.75265156931748e-06, - "loss": 2.2492, - "step": 495990 - }, - { - "epoch": 0.86, - "learning_rate": 6.751779629390653e-06, - "loss": 2.2995, - "step": 496000 - }, - { - "epoch": 0.86, - "learning_rate": 6.750907689463827e-06, - "loss": 2.3562, - "step": 496010 - }, - { - "epoch": 0.86, - "learning_rate": 6.750035749537001e-06, - "loss": 2.2835, - "step": 496020 - }, - { - "epoch": 0.87, - "learning_rate": 6.749163809610174e-06, - "loss": 2.3326, - "step": 496030 - }, - { - "epoch": 0.87, - "learning_rate": 6.7482918696833475e-06, - "loss": 2.2162, - "step": 496040 - }, - { - "epoch": 0.87, - "learning_rate": 6.74741992975652e-06, - "loss": 2.2491, - "step": 496050 - }, - { - "epoch": 0.87, - "learning_rate": 6.746547989829693e-06, - "loss": 2.0698, - "step": 496060 - }, - { - "epoch": 0.87, - "learning_rate": 6.745676049902866e-06, - "loss": 2.3627, - "step": 496070 - }, - { - "epoch": 0.87, - "learning_rate": 6.74480410997604e-06, - "loss": 2.3129, - "step": 496080 - }, - { - "epoch": 0.87, - "learning_rate": 6.743932170049212e-06, - "loss": 2.1984, - "step": 496090 - }, - { - "epoch": 0.87, - "learning_rate": 6.743060230122386e-06, - "loss": 2.2968, - "step": 496100 - }, - { - "epoch": 0.87, - "learning_rate": 6.742188290195559e-06, - "loss": 2.2669, - "step": 496110 - }, - { - "epoch": 0.87, - "learning_rate": 6.741316350268733e-06, - "loss": 2.2146, - "step": 496120 - }, - { - "epoch": 0.87, - "learning_rate": 6.740444410341905e-06, - "loss": 2.3552, - "step": 496130 - }, - { - "epoch": 0.87, - "learning_rate": 6.7395724704150784e-06, - "loss": 2.1588, - "step": 496140 - }, - { - "epoch": 0.87, - "learning_rate": 6.738700530488251e-06, - "loss": 2.2919, - "step": 496150 - }, - { - "epoch": 0.87, - "learning_rate": 6.737828590561425e-06, - "loss": 2.3535, - "step": 496160 - }, - { - "epoch": 0.87, - "learning_rate": 6.736956650634599e-06, - "loss": 2.1639, - "step": 496170 - }, - { - "epoch": 0.87, - "learning_rate": 6.736084710707771e-06, - "loss": 2.2413, - "step": 496180 - }, - { - "epoch": 0.87, - "learning_rate": 6.735212770780945e-06, - "loss": 2.3071, - "step": 496190 - }, - { - "epoch": 0.87, - "learning_rate": 6.734340830854118e-06, - "loss": 2.1466, - "step": 496200 - }, - { - "epoch": 0.87, - "learning_rate": 6.7334688909272914e-06, - "loss": 2.1824, - "step": 496210 - }, - { - "epoch": 0.87, - "learning_rate": 6.7325969510004635e-06, - "loss": 2.3701, - "step": 496220 - }, - { - "epoch": 0.87, - "learning_rate": 6.731725011073637e-06, - "loss": 2.2886, - "step": 496230 - }, - { - "epoch": 0.87, - "learning_rate": 6.73085307114681e-06, - "loss": 2.1967, - "step": 496240 - }, - { - "epoch": 0.87, - "learning_rate": 6.729981131219984e-06, - "loss": 2.2978, - "step": 496250 - }, - { - "epoch": 0.87, - "learning_rate": 6.729109191293156e-06, - "loss": 2.1873, - "step": 496260 - }, - { - "epoch": 0.87, - "learning_rate": 6.728237251366331e-06, - "loss": 2.1498, - "step": 496270 - }, - { - "epoch": 0.87, - "learning_rate": 6.727365311439503e-06, - "loss": 2.2573, - "step": 496280 - }, - { - "epoch": 0.87, - "learning_rate": 6.7264933715126765e-06, - "loss": 2.3332, - "step": 496290 - }, - { - "epoch": 0.87, - "learning_rate": 6.72562143158585e-06, - "loss": 2.164, - "step": 496300 - }, - { - "epoch": 0.87, - "learning_rate": 6.724749491659023e-06, - "loss": 2.2278, - "step": 496310 - }, - { - "epoch": 0.87, - "learning_rate": 6.723877551732197e-06, - "loss": 2.2725, - "step": 496320 - }, - { - "epoch": 0.87, - "learning_rate": 6.723005611805369e-06, - "loss": 2.3475, - "step": 496330 - }, - { - "epoch": 0.87, - "learning_rate": 6.722133671878543e-06, - "loss": 2.3727, - "step": 496340 - }, - { - "epoch": 0.87, - "learning_rate": 6.721261731951716e-06, - "loss": 2.3069, - "step": 496350 - }, - { - "epoch": 0.87, - "learning_rate": 6.7203897920248895e-06, - "loss": 2.301, - "step": 496360 - }, - { - "epoch": 0.87, - "learning_rate": 6.719517852098062e-06, - "loss": 2.3096, - "step": 496370 - }, - { - "epoch": 0.87, - "learning_rate": 6.718645912171235e-06, - "loss": 2.2701, - "step": 496380 - }, - { - "epoch": 0.87, - "learning_rate": 6.717773972244408e-06, - "loss": 2.2068, - "step": 496390 - }, - { - "epoch": 0.87, - "learning_rate": 6.716902032317582e-06, - "loss": 2.304, - "step": 496400 - }, - { - "epoch": 0.87, - "learning_rate": 6.716030092390754e-06, - "loss": 2.2702, - "step": 496410 - }, - { - "epoch": 0.87, - "learning_rate": 6.715158152463928e-06, - "loss": 2.2761, - "step": 496420 - }, - { - "epoch": 0.87, - "learning_rate": 6.714286212537102e-06, - "loss": 2.1879, - "step": 496430 - }, - { - "epoch": 0.87, - "learning_rate": 6.713414272610275e-06, - "loss": 2.2588, - "step": 496440 - }, - { - "epoch": 0.87, - "learning_rate": 6.712542332683448e-06, - "loss": 2.3045, - "step": 496450 - }, - { - "epoch": 0.87, - "learning_rate": 6.7116703927566204e-06, - "loss": 2.3466, - "step": 496460 - }, - { - "epoch": 0.87, - "learning_rate": 6.710798452829794e-06, - "loss": 2.3163, - "step": 496470 - }, - { - "epoch": 0.87, - "learning_rate": 6.709926512902967e-06, - "loss": 2.3681, - "step": 496480 - }, - { - "epoch": 0.87, - "learning_rate": 6.709054572976141e-06, - "loss": 2.2415, - "step": 496490 - }, - { - "epoch": 0.87, - "learning_rate": 6.708182633049313e-06, - "loss": 2.2988, - "step": 496500 - }, - { - "epoch": 0.87, - "learning_rate": 6.707310693122487e-06, - "loss": 2.3127, - "step": 496510 - }, - { - "epoch": 0.87, - "learning_rate": 6.70643875319566e-06, - "loss": 2.4065, - "step": 496520 - }, - { - "epoch": 0.87, - "learning_rate": 6.7055668132688334e-06, - "loss": 2.2302, - "step": 496530 - }, - { - "epoch": 0.87, - "learning_rate": 6.7046948733420055e-06, - "loss": 2.2056, - "step": 496540 - }, - { - "epoch": 0.87, - "learning_rate": 6.70382293341518e-06, - "loss": 2.3248, - "step": 496550 - }, - { - "epoch": 0.87, - "learning_rate": 6.702950993488354e-06, - "loss": 2.2207, - "step": 496560 - }, - { - "epoch": 0.87, - "learning_rate": 6.702079053561526e-06, - "loss": 2.2611, - "step": 496570 - }, - { - "epoch": 0.87, - "learning_rate": 6.7012071136347e-06, - "loss": 2.1848, - "step": 496580 - }, - { - "epoch": 0.87, - "learning_rate": 6.700335173707873e-06, - "loss": 2.3351, - "step": 496590 - }, - { - "epoch": 0.87, - "learning_rate": 6.6994632337810464e-06, - "loss": 2.2275, - "step": 496600 - }, - { - "epoch": 0.87, - "learning_rate": 6.6985912938542185e-06, - "loss": 2.2949, - "step": 496610 - }, - { - "epoch": 0.87, - "learning_rate": 6.697719353927392e-06, - "loss": 2.2873, - "step": 496620 - }, - { - "epoch": 0.87, - "learning_rate": 6.696847414000565e-06, - "loss": 2.4162, - "step": 496630 - }, - { - "epoch": 0.87, - "learning_rate": 6.695975474073739e-06, - "loss": 2.2596, - "step": 496640 - }, - { - "epoch": 0.87, - "learning_rate": 6.695103534146911e-06, - "loss": 2.2456, - "step": 496650 - }, - { - "epoch": 0.87, - "learning_rate": 6.694231594220085e-06, - "loss": 2.2713, - "step": 496660 - }, - { - "epoch": 0.87, - "learning_rate": 6.693359654293258e-06, - "loss": 2.3049, - "step": 496670 - }, - { - "epoch": 0.87, - "learning_rate": 6.6924877143664315e-06, - "loss": 2.1896, - "step": 496680 - }, - { - "epoch": 0.87, - "learning_rate": 6.691615774439605e-06, - "loss": 2.1907, - "step": 496690 - }, - { - "epoch": 0.87, - "learning_rate": 6.690743834512777e-06, - "loss": 2.2799, - "step": 496700 - }, - { - "epoch": 0.87, - "learning_rate": 6.689871894585951e-06, - "loss": 2.3016, - "step": 496710 - }, - { - "epoch": 0.87, - "learning_rate": 6.688999954659124e-06, - "loss": 2.3169, - "step": 496720 - }, - { - "epoch": 0.87, - "learning_rate": 6.688128014732298e-06, - "loss": 2.2664, - "step": 496730 - }, - { - "epoch": 0.87, - "learning_rate": 6.68725607480547e-06, - "loss": 2.2256, - "step": 496740 - }, - { - "epoch": 0.87, - "learning_rate": 6.686384134878644e-06, - "loss": 2.2203, - "step": 496750 - }, - { - "epoch": 0.87, - "learning_rate": 6.685512194951817e-06, - "loss": 2.1937, - "step": 496760 - }, - { - "epoch": 0.87, - "learning_rate": 6.68464025502499e-06, - "loss": 2.3157, - "step": 496770 - }, - { - "epoch": 0.87, - "learning_rate": 6.6837683150981624e-06, - "loss": 2.3031, - "step": 496780 - }, - { - "epoch": 0.87, - "learning_rate": 6.682896375171337e-06, - "loss": 2.3472, - "step": 496790 - }, - { - "epoch": 0.87, - "learning_rate": 6.682024435244509e-06, - "loss": 2.3385, - "step": 496800 - }, - { - "epoch": 0.87, - "learning_rate": 6.681152495317683e-06, - "loss": 2.1245, - "step": 496810 - }, - { - "epoch": 0.87, - "learning_rate": 6.680280555390857e-06, - "loss": 2.2813, - "step": 496820 - }, - { - "epoch": 0.87, - "learning_rate": 6.67940861546403e-06, - "loss": 2.3698, - "step": 496830 - }, - { - "epoch": 0.87, - "learning_rate": 6.678536675537203e-06, - "loss": 2.2705, - "step": 496840 - }, - { - "epoch": 0.87, - "learning_rate": 6.6776647356103754e-06, - "loss": 2.2508, - "step": 496850 - }, - { - "epoch": 0.87, - "learning_rate": 6.676792795683549e-06, - "loss": 2.4017, - "step": 496860 - }, - { - "epoch": 0.87, - "learning_rate": 6.675920855756722e-06, - "loss": 2.2243, - "step": 496870 - }, - { - "epoch": 0.87, - "learning_rate": 6.675048915829896e-06, - "loss": 2.2557, - "step": 496880 - }, - { - "epoch": 0.87, - "learning_rate": 6.674176975903068e-06, - "loss": 2.1204, - "step": 496890 - }, - { - "epoch": 0.87, - "learning_rate": 6.673305035976242e-06, - "loss": 2.2205, - "step": 496900 - }, - { - "epoch": 0.87, - "learning_rate": 6.672433096049415e-06, - "loss": 2.2811, - "step": 496910 - }, - { - "epoch": 0.87, - "learning_rate": 6.6715611561225884e-06, - "loss": 2.2715, - "step": 496920 - }, - { - "epoch": 0.87, - "learning_rate": 6.6706892161957605e-06, - "loss": 2.2494, - "step": 496930 - }, - { - "epoch": 0.87, - "learning_rate": 6.669817276268934e-06, - "loss": 2.1941, - "step": 496940 - }, - { - "epoch": 0.87, - "learning_rate": 6.668945336342108e-06, - "loss": 2.3087, - "step": 496950 - }, - { - "epoch": 0.87, - "learning_rate": 6.668073396415281e-06, - "loss": 2.1692, - "step": 496960 - }, - { - "epoch": 0.87, - "learning_rate": 6.667201456488455e-06, - "loss": 2.2045, - "step": 496970 - }, - { - "epoch": 0.87, - "learning_rate": 6.666329516561627e-06, - "loss": 2.227, - "step": 496980 - }, - { - "epoch": 0.87, - "learning_rate": 6.665457576634801e-06, - "loss": 2.3445, - "step": 496990 - }, - { - "epoch": 0.87, - "learning_rate": 6.6645856367079735e-06, - "loss": 2.2607, - "step": 497000 - }, - { - "epoch": 0.87, - "learning_rate": 6.663713696781147e-06, - "loss": 2.2094, - "step": 497010 - }, - { - "epoch": 0.87, - "learning_rate": 6.662841756854319e-06, - "loss": 2.3149, - "step": 497020 - }, - { - "epoch": 0.87, - "learning_rate": 6.661969816927493e-06, - "loss": 2.3336, - "step": 497030 - }, - { - "epoch": 0.87, - "learning_rate": 6.661097877000666e-06, - "loss": 2.329, - "step": 497040 - }, - { - "epoch": 0.87, - "learning_rate": 6.66022593707384e-06, - "loss": 2.3451, - "step": 497050 - }, - { - "epoch": 0.87, - "learning_rate": 6.659353997147012e-06, - "loss": 2.3543, - "step": 497060 - }, - { - "epoch": 0.87, - "learning_rate": 6.6584820572201865e-06, - "loss": 2.0888, - "step": 497070 - }, - { - "epoch": 0.87, - "learning_rate": 6.657610117293359e-06, - "loss": 2.2282, - "step": 497080 - }, - { - "epoch": 0.87, - "learning_rate": 6.656738177366532e-06, - "loss": 2.3113, - "step": 497090 - }, - { - "epoch": 0.87, - "learning_rate": 6.655866237439706e-06, - "loss": 2.2781, - "step": 497100 - }, - { - "epoch": 0.87, - "learning_rate": 6.654994297512879e-06, - "loss": 2.2673, - "step": 497110 - }, - { - "epoch": 0.87, - "learning_rate": 6.654122357586053e-06, - "loss": 2.2208, - "step": 497120 - }, - { - "epoch": 0.87, - "learning_rate": 6.653250417659225e-06, - "loss": 2.2407, - "step": 497130 - }, - { - "epoch": 0.87, - "learning_rate": 6.652378477732399e-06, - "loss": 2.3016, - "step": 497140 - }, - { - "epoch": 0.87, - "learning_rate": 6.651506537805572e-06, - "loss": 2.2859, - "step": 497150 - }, - { - "epoch": 0.87, - "learning_rate": 6.650634597878745e-06, - "loss": 2.3199, - "step": 497160 - }, - { - "epoch": 0.87, - "learning_rate": 6.6497626579519174e-06, - "loss": 2.2596, - "step": 497170 - }, - { - "epoch": 0.87, - "learning_rate": 6.648890718025091e-06, - "loss": 2.3318, - "step": 497180 - }, - { - "epoch": 0.87, - "learning_rate": 6.648018778098264e-06, - "loss": 2.2614, - "step": 497190 - }, - { - "epoch": 0.87, - "learning_rate": 6.647146838171438e-06, - "loss": 2.2251, - "step": 497200 - }, - { - "epoch": 0.87, - "learning_rate": 6.64627489824461e-06, - "loss": 2.2919, - "step": 497210 - }, - { - "epoch": 0.87, - "learning_rate": 6.645402958317784e-06, - "loss": 2.2478, - "step": 497220 - }, - { - "epoch": 0.87, - "learning_rate": 6.6445310183909575e-06, - "loss": 2.3767, - "step": 497230 - }, - { - "epoch": 0.87, - "learning_rate": 6.6436590784641305e-06, - "loss": 2.3291, - "step": 497240 - }, - { - "epoch": 0.87, - "learning_rate": 6.642787138537304e-06, - "loss": 2.176, - "step": 497250 - }, - { - "epoch": 0.87, - "learning_rate": 6.641915198610476e-06, - "loss": 2.2394, - "step": 497260 - }, - { - "epoch": 0.87, - "learning_rate": 6.64104325868365e-06, - "loss": 2.2757, - "step": 497270 - }, - { - "epoch": 0.87, - "learning_rate": 6.640171318756823e-06, - "loss": 2.2702, - "step": 497280 - }, - { - "epoch": 0.87, - "learning_rate": 6.639299378829997e-06, - "loss": 2.2739, - "step": 497290 - }, - { - "epoch": 0.87, - "learning_rate": 6.638427438903169e-06, - "loss": 2.2799, - "step": 497300 - }, - { - "epoch": 0.87, - "learning_rate": 6.6375554989763435e-06, - "loss": 2.2849, - "step": 497310 - }, - { - "epoch": 0.87, - "learning_rate": 6.6366835590495155e-06, - "loss": 2.3241, - "step": 497320 - }, - { - "epoch": 0.87, - "learning_rate": 6.635811619122689e-06, - "loss": 2.301, - "step": 497330 - }, - { - "epoch": 0.87, - "learning_rate": 6.634939679195861e-06, - "loss": 2.1314, - "step": 497340 - }, - { - "epoch": 0.87, - "learning_rate": 6.634067739269036e-06, - "loss": 2.2159, - "step": 497350 - }, - { - "epoch": 0.87, - "learning_rate": 6.63319579934221e-06, - "loss": 2.3009, - "step": 497360 - }, - { - "epoch": 0.87, - "learning_rate": 6.632323859415382e-06, - "loss": 2.1207, - "step": 497370 - }, - { - "epoch": 0.87, - "learning_rate": 6.631451919488556e-06, - "loss": 2.3404, - "step": 497380 - }, - { - "epoch": 0.87, - "learning_rate": 6.6305799795617285e-06, - "loss": 2.2425, - "step": 497390 - }, - { - "epoch": 0.87, - "learning_rate": 6.629708039634902e-06, - "loss": 2.2985, - "step": 497400 - }, - { - "epoch": 0.87, - "learning_rate": 6.628836099708074e-06, - "loss": 2.2844, - "step": 497410 - }, - { - "epoch": 0.87, - "learning_rate": 6.627964159781248e-06, - "loss": 2.2452, - "step": 497420 - }, - { - "epoch": 0.87, - "learning_rate": 6.627092219854421e-06, - "loss": 2.3098, - "step": 497430 - }, - { - "epoch": 0.87, - "learning_rate": 6.626220279927595e-06, - "loss": 2.2141, - "step": 497440 - }, - { - "epoch": 0.87, - "learning_rate": 6.625348340000767e-06, - "loss": 2.2374, - "step": 497450 - }, - { - "epoch": 0.87, - "learning_rate": 6.624476400073941e-06, - "loss": 2.2466, - "step": 497460 - }, - { - "epoch": 0.87, - "learning_rate": 6.623604460147114e-06, - "loss": 2.3086, - "step": 497470 - }, - { - "epoch": 0.87, - "learning_rate": 6.622732520220287e-06, - "loss": 2.2436, - "step": 497480 - }, - { - "epoch": 0.87, - "learning_rate": 6.621860580293461e-06, - "loss": 2.3492, - "step": 497490 - }, - { - "epoch": 0.87, - "learning_rate": 6.620988640366633e-06, - "loss": 2.2227, - "step": 497500 - }, - { - "epoch": 0.87, - "learning_rate": 6.620116700439807e-06, - "loss": 2.313, - "step": 497510 - }, - { - "epoch": 0.87, - "learning_rate": 6.61924476051298e-06, - "loss": 2.2208, - "step": 497520 - }, - { - "epoch": 0.87, - "learning_rate": 6.618372820586154e-06, - "loss": 2.1578, - "step": 497530 - }, - { - "epoch": 0.87, - "learning_rate": 6.617500880659326e-06, - "loss": 2.2955, - "step": 497540 - }, - { - "epoch": 0.87, - "learning_rate": 6.6166289407324995e-06, - "loss": 2.2413, - "step": 497550 - }, - { - "epoch": 0.87, - "learning_rate": 6.6157570008056725e-06, - "loss": 2.3287, - "step": 497560 - }, - { - "epoch": 0.87, - "learning_rate": 6.614885060878846e-06, - "loss": 2.2918, - "step": 497570 - }, - { - "epoch": 0.87, - "learning_rate": 6.614013120952018e-06, - "loss": 2.1891, - "step": 497580 - }, - { - "epoch": 0.87, - "learning_rate": 6.613141181025193e-06, - "loss": 2.1764, - "step": 497590 - }, - { - "epoch": 0.87, - "learning_rate": 6.612269241098365e-06, - "loss": 2.3685, - "step": 497600 - }, - { - "epoch": 0.87, - "learning_rate": 6.611397301171539e-06, - "loss": 2.2807, - "step": 497610 - }, - { - "epoch": 0.87, - "learning_rate": 6.6105253612447125e-06, - "loss": 2.2839, - "step": 497620 - }, - { - "epoch": 0.87, - "learning_rate": 6.6096534213178855e-06, - "loss": 2.2478, - "step": 497630 - }, - { - "epoch": 0.87, - "learning_rate": 6.608781481391059e-06, - "loss": 2.2923, - "step": 497640 - }, - { - "epoch": 0.87, - "learning_rate": 6.607909541464231e-06, - "loss": 2.3016, - "step": 497650 - }, - { - "epoch": 0.87, - "learning_rate": 6.607037601537405e-06, - "loss": 2.2717, - "step": 497660 - }, - { - "epoch": 0.87, - "learning_rate": 6.606165661610578e-06, - "loss": 2.2596, - "step": 497670 - }, - { - "epoch": 0.87, - "learning_rate": 6.605293721683752e-06, - "loss": 2.2362, - "step": 497680 - }, - { - "epoch": 0.87, - "learning_rate": 6.604421781756924e-06, - "loss": 2.304, - "step": 497690 - }, - { - "epoch": 0.87, - "learning_rate": 6.603549841830098e-06, - "loss": 2.2564, - "step": 497700 - }, - { - "epoch": 0.87, - "learning_rate": 6.6026779019032705e-06, - "loss": 2.3532, - "step": 497710 - }, - { - "epoch": 0.87, - "learning_rate": 6.601805961976444e-06, - "loss": 2.2758, - "step": 497720 - }, - { - "epoch": 0.87, - "learning_rate": 6.600934022049616e-06, - "loss": 2.2896, - "step": 497730 - }, - { - "epoch": 0.87, - "learning_rate": 6.60006208212279e-06, - "loss": 2.1937, - "step": 497740 - }, - { - "epoch": 0.87, - "learning_rate": 6.599190142195964e-06, - "loss": 2.1898, - "step": 497750 - }, - { - "epoch": 0.87, - "learning_rate": 6.598318202269137e-06, - "loss": 2.2814, - "step": 497760 - }, - { - "epoch": 0.87, - "learning_rate": 6.597446262342311e-06, - "loss": 2.1735, - "step": 497770 - }, - { - "epoch": 0.87, - "learning_rate": 6.596574322415483e-06, - "loss": 2.2067, - "step": 497780 - }, - { - "epoch": 0.87, - "learning_rate": 6.5957023824886565e-06, - "loss": 2.2177, - "step": 497790 - }, - { - "epoch": 0.87, - "learning_rate": 6.594830442561829e-06, - "loss": 2.3217, - "step": 497800 - }, - { - "epoch": 0.87, - "learning_rate": 6.593958502635003e-06, - "loss": 2.2764, - "step": 497810 - }, - { - "epoch": 0.87, - "learning_rate": 6.593086562708175e-06, - "loss": 2.3262, - "step": 497820 - }, - { - "epoch": 0.87, - "learning_rate": 6.59221462278135e-06, - "loss": 2.3219, - "step": 497830 - }, - { - "epoch": 0.87, - "learning_rate": 6.591342682854522e-06, - "loss": 2.2284, - "step": 497840 - }, - { - "epoch": 0.87, - "learning_rate": 6.590470742927696e-06, - "loss": 2.228, - "step": 497850 - }, - { - "epoch": 0.87, - "learning_rate": 6.589598803000868e-06, - "loss": 2.2296, - "step": 497860 - }, - { - "epoch": 0.87, - "learning_rate": 6.588726863074042e-06, - "loss": 2.1489, - "step": 497870 - }, - { - "epoch": 0.87, - "learning_rate": 6.5878549231472145e-06, - "loss": 2.335, - "step": 497880 - }, - { - "epoch": 0.87, - "learning_rate": 6.586982983220388e-06, - "loss": 2.1794, - "step": 497890 - }, - { - "epoch": 0.87, - "learning_rate": 6.586111043293562e-06, - "loss": 2.2348, - "step": 497900 - }, - { - "epoch": 0.87, - "learning_rate": 6.585239103366735e-06, - "loss": 2.1412, - "step": 497910 - }, - { - "epoch": 0.87, - "learning_rate": 6.584367163439909e-06, - "loss": 2.1341, - "step": 497920 - }, - { - "epoch": 0.87, - "learning_rate": 6.583495223513081e-06, - "loss": 2.2275, - "step": 497930 - }, - { - "epoch": 0.87, - "learning_rate": 6.5826232835862545e-06, - "loss": 2.2512, - "step": 497940 - }, - { - "epoch": 0.87, - "learning_rate": 6.5817513436594275e-06, - "loss": 2.3393, - "step": 497950 - }, - { - "epoch": 0.87, - "learning_rate": 6.580879403732601e-06, - "loss": 2.253, - "step": 497960 - }, - { - "epoch": 0.87, - "learning_rate": 6.580007463805773e-06, - "loss": 2.241, - "step": 497970 - }, - { - "epoch": 0.87, - "learning_rate": 6.579135523878947e-06, - "loss": 2.2782, - "step": 497980 - }, - { - "epoch": 0.87, - "learning_rate": 6.57826358395212e-06, - "loss": 2.2229, - "step": 497990 - }, - { - "epoch": 0.87, - "learning_rate": 6.577391644025294e-06, - "loss": 2.2057, - "step": 498000 - }, - { - "epoch": 0.87, - "learning_rate": 6.576519704098466e-06, - "loss": 2.3082, - "step": 498010 - }, - { - "epoch": 0.87, - "learning_rate": 6.57564776417164e-06, - "loss": 2.1696, - "step": 498020 - }, - { - "epoch": 0.87, - "learning_rate": 6.574775824244813e-06, - "loss": 2.2872, - "step": 498030 - }, - { - "epoch": 0.87, - "learning_rate": 6.573903884317986e-06, - "loss": 2.1235, - "step": 498040 - }, - { - "epoch": 0.87, - "learning_rate": 6.57303194439116e-06, - "loss": 2.2331, - "step": 498050 - }, - { - "epoch": 0.87, - "learning_rate": 6.572160004464332e-06, - "loss": 2.2611, - "step": 498060 - }, - { - "epoch": 0.87, - "learning_rate": 6.571288064537506e-06, - "loss": 2.2968, - "step": 498070 - }, - { - "epoch": 0.87, - "learning_rate": 6.570416124610679e-06, - "loss": 2.3134, - "step": 498080 - }, - { - "epoch": 0.87, - "learning_rate": 6.569544184683853e-06, - "loss": 2.2642, - "step": 498090 - }, - { - "epoch": 0.87, - "learning_rate": 6.568672244757025e-06, - "loss": 2.3128, - "step": 498100 - }, - { - "epoch": 0.87, - "learning_rate": 6.567800304830199e-06, - "loss": 2.363, - "step": 498110 - }, - { - "epoch": 0.87, - "learning_rate": 6.566928364903371e-06, - "loss": 2.2552, - "step": 498120 - }, - { - "epoch": 0.87, - "learning_rate": 6.566056424976545e-06, - "loss": 2.2726, - "step": 498130 - }, - { - "epoch": 0.87, - "learning_rate": 6.565184485049718e-06, - "loss": 2.3154, - "step": 498140 - }, - { - "epoch": 0.87, - "learning_rate": 6.564312545122892e-06, - "loss": 2.2463, - "step": 498150 - }, - { - "epoch": 0.87, - "learning_rate": 6.563440605196066e-06, - "loss": 2.2307, - "step": 498160 - }, - { - "epoch": 0.87, - "learning_rate": 6.562568665269238e-06, - "loss": 2.2806, - "step": 498170 - }, - { - "epoch": 0.87, - "learning_rate": 6.5616967253424115e-06, - "loss": 2.2261, - "step": 498180 - }, - { - "epoch": 0.87, - "learning_rate": 6.560824785415584e-06, - "loss": 2.3742, - "step": 498190 - }, - { - "epoch": 0.87, - "learning_rate": 6.559952845488758e-06, - "loss": 2.3112, - "step": 498200 - }, - { - "epoch": 0.87, - "learning_rate": 6.55908090556193e-06, - "loss": 2.2655, - "step": 498210 - }, - { - "epoch": 0.87, - "learning_rate": 6.558208965635104e-06, - "loss": 2.2361, - "step": 498220 - }, - { - "epoch": 0.87, - "learning_rate": 6.557337025708277e-06, - "loss": 2.3268, - "step": 498230 - }, - { - "epoch": 0.87, - "learning_rate": 6.556465085781451e-06, - "loss": 2.2815, - "step": 498240 - }, - { - "epoch": 0.87, - "learning_rate": 6.555593145854623e-06, - "loss": 2.2705, - "step": 498250 - }, - { - "epoch": 0.87, - "learning_rate": 6.5547212059277965e-06, - "loss": 2.2095, - "step": 498260 - }, - { - "epoch": 0.87, - "learning_rate": 6.5538492660009695e-06, - "loss": 2.2287, - "step": 498270 - }, - { - "epoch": 0.87, - "learning_rate": 6.552977326074143e-06, - "loss": 2.2173, - "step": 498280 - }, - { - "epoch": 0.87, - "learning_rate": 6.552105386147317e-06, - "loss": 2.2164, - "step": 498290 - }, - { - "epoch": 0.87, - "learning_rate": 6.551233446220489e-06, - "loss": 2.2719, - "step": 498300 - }, - { - "epoch": 0.87, - "learning_rate": 6.550361506293663e-06, - "loss": 2.2613, - "step": 498310 - }, - { - "epoch": 0.87, - "learning_rate": 6.549489566366836e-06, - "loss": 2.3216, - "step": 498320 - }, - { - "epoch": 0.87, - "learning_rate": 6.5486176264400095e-06, - "loss": 2.1718, - "step": 498330 - }, - { - "epoch": 0.87, - "learning_rate": 6.547745686513182e-06, - "loss": 2.2225, - "step": 498340 - }, - { - "epoch": 0.87, - "learning_rate": 6.546873746586356e-06, - "loss": 2.2677, - "step": 498350 - }, - { - "epoch": 0.87, - "learning_rate": 6.546001806659528e-06, - "loss": 2.327, - "step": 498360 - }, - { - "epoch": 0.87, - "learning_rate": 6.545129866732702e-06, - "loss": 2.3273, - "step": 498370 - }, - { - "epoch": 0.87, - "learning_rate": 6.544257926805874e-06, - "loss": 2.2488, - "step": 498380 - }, - { - "epoch": 0.87, - "learning_rate": 6.543385986879049e-06, - "loss": 2.2587, - "step": 498390 - }, - { - "epoch": 0.87, - "learning_rate": 6.542514046952221e-06, - "loss": 2.197, - "step": 498400 - }, - { - "epoch": 0.87, - "learning_rate": 6.541642107025395e-06, - "loss": 2.1263, - "step": 498410 - }, - { - "epoch": 0.87, - "learning_rate": 6.540770167098568e-06, - "loss": 2.2254, - "step": 498420 - }, - { - "epoch": 0.87, - "learning_rate": 6.539898227171741e-06, - "loss": 2.1753, - "step": 498430 - }, - { - "epoch": 0.87, - "learning_rate": 6.539026287244915e-06, - "loss": 2.308, - "step": 498440 - }, - { - "epoch": 0.87, - "learning_rate": 6.538154347318087e-06, - "loss": 2.1931, - "step": 498450 - }, - { - "epoch": 0.87, - "learning_rate": 6.537282407391261e-06, - "loss": 2.2116, - "step": 498460 - }, - { - "epoch": 0.87, - "learning_rate": 6.536410467464434e-06, - "loss": 2.3286, - "step": 498470 - }, - { - "epoch": 0.87, - "learning_rate": 6.535538527537608e-06, - "loss": 2.224, - "step": 498480 - }, - { - "epoch": 0.87, - "learning_rate": 6.53466658761078e-06, - "loss": 2.3616, - "step": 498490 - }, - { - "epoch": 0.87, - "learning_rate": 6.5337946476839535e-06, - "loss": 2.3033, - "step": 498500 - }, - { - "epoch": 0.87, - "learning_rate": 6.532922707757126e-06, - "loss": 2.2119, - "step": 498510 - }, - { - "epoch": 0.87, - "learning_rate": 6.5320507678303e-06, - "loss": 2.3236, - "step": 498520 - }, - { - "epoch": 0.87, - "learning_rate": 6.531178827903472e-06, - "loss": 2.1773, - "step": 498530 - }, - { - "epoch": 0.87, - "learning_rate": 6.530306887976646e-06, - "loss": 2.2974, - "step": 498540 - }, - { - "epoch": 0.87, - "learning_rate": 6.52943494804982e-06, - "loss": 2.3389, - "step": 498550 - }, - { - "epoch": 0.87, - "learning_rate": 6.528563008122993e-06, - "loss": 2.2076, - "step": 498560 - }, - { - "epoch": 0.87, - "learning_rate": 6.5276910681961665e-06, - "loss": 2.3385, - "step": 498570 - }, - { - "epoch": 0.87, - "learning_rate": 6.5268191282693385e-06, - "loss": 2.2404, - "step": 498580 - }, - { - "epoch": 0.87, - "learning_rate": 6.525947188342512e-06, - "loss": 2.2759, - "step": 498590 - }, - { - "epoch": 0.87, - "learning_rate": 6.525075248415685e-06, - "loss": 2.2613, - "step": 498600 - }, - { - "epoch": 0.87, - "learning_rate": 6.524203308488859e-06, - "loss": 2.2303, - "step": 498610 - }, - { - "epoch": 0.87, - "learning_rate": 6.523331368562031e-06, - "loss": 2.2349, - "step": 498620 - }, - { - "epoch": 0.87, - "learning_rate": 6.522459428635206e-06, - "loss": 2.3338, - "step": 498630 - }, - { - "epoch": 0.87, - "learning_rate": 6.521587488708378e-06, - "loss": 2.4016, - "step": 498640 - }, - { - "epoch": 0.87, - "learning_rate": 6.5207155487815515e-06, - "loss": 2.1868, - "step": 498650 - }, - { - "epoch": 0.87, - "learning_rate": 6.5198436088547245e-06, - "loss": 2.3032, - "step": 498660 - }, - { - "epoch": 0.87, - "learning_rate": 6.518971668927898e-06, - "loss": 2.3448, - "step": 498670 - }, - { - "epoch": 0.87, - "learning_rate": 6.518099729001072e-06, - "loss": 2.1882, - "step": 498680 - }, - { - "epoch": 0.87, - "learning_rate": 6.517227789074244e-06, - "loss": 2.3155, - "step": 498690 - }, - { - "epoch": 0.87, - "learning_rate": 6.516355849147418e-06, - "loss": 2.2741, - "step": 498700 - }, - { - "epoch": 0.87, - "learning_rate": 6.515483909220591e-06, - "loss": 2.3214, - "step": 498710 - }, - { - "epoch": 0.87, - "learning_rate": 6.5146119692937645e-06, - "loss": 2.2066, - "step": 498720 - }, - { - "epoch": 0.87, - "learning_rate": 6.513740029366937e-06, - "loss": 2.3949, - "step": 498730 - }, - { - "epoch": 0.87, - "learning_rate": 6.51286808944011e-06, - "loss": 2.2584, - "step": 498740 - }, - { - "epoch": 0.87, - "learning_rate": 6.511996149513283e-06, - "loss": 2.1812, - "step": 498750 - }, - { - "epoch": 0.87, - "learning_rate": 6.511124209586457e-06, - "loss": 2.291, - "step": 498760 - }, - { - "epoch": 0.87, - "learning_rate": 6.510252269659629e-06, - "loss": 2.2665, - "step": 498770 - }, - { - "epoch": 0.87, - "learning_rate": 6.509380329732803e-06, - "loss": 2.2607, - "step": 498780 - }, - { - "epoch": 0.87, - "learning_rate": 6.508508389805976e-06, - "loss": 2.1855, - "step": 498790 - }, - { - "epoch": 0.87, - "learning_rate": 6.50763644987915e-06, - "loss": 2.2916, - "step": 498800 - }, - { - "epoch": 0.87, - "learning_rate": 6.506764509952322e-06, - "loss": 2.2464, - "step": 498810 - }, - { - "epoch": 0.87, - "learning_rate": 6.5058925700254955e-06, - "loss": 2.3325, - "step": 498820 - }, - { - "epoch": 0.87, - "learning_rate": 6.505020630098669e-06, - "loss": 2.2917, - "step": 498830 - }, - { - "epoch": 0.87, - "learning_rate": 6.504148690171842e-06, - "loss": 2.1707, - "step": 498840 - }, - { - "epoch": 0.87, - "learning_rate": 6.503276750245016e-06, - "loss": 2.2581, - "step": 498850 - }, - { - "epoch": 0.87, - "learning_rate": 6.502404810318188e-06, - "loss": 2.1627, - "step": 498860 - }, - { - "epoch": 0.87, - "learning_rate": 6.501532870391363e-06, - "loss": 2.245, - "step": 498870 - }, - { - "epoch": 0.87, - "learning_rate": 6.500660930464535e-06, - "loss": 2.2638, - "step": 498880 - }, - { - "epoch": 0.87, - "learning_rate": 6.4997889905377085e-06, - "loss": 2.3052, - "step": 498890 - }, - { - "epoch": 0.87, - "learning_rate": 6.4989170506108805e-06, - "loss": 2.2942, - "step": 498900 - }, - { - "epoch": 0.87, - "learning_rate": 6.498045110684055e-06, - "loss": 2.1937, - "step": 498910 - }, - { - "epoch": 0.87, - "learning_rate": 6.497173170757227e-06, - "loss": 2.3353, - "step": 498920 - }, - { - "epoch": 0.87, - "learning_rate": 6.496301230830401e-06, - "loss": 2.3074, - "step": 498930 - }, - { - "epoch": 0.87, - "learning_rate": 6.495429290903574e-06, - "loss": 2.2816, - "step": 498940 - }, - { - "epoch": 0.87, - "learning_rate": 6.494557350976748e-06, - "loss": 2.2889, - "step": 498950 - }, - { - "epoch": 0.87, - "learning_rate": 6.4936854110499215e-06, - "loss": 2.3058, - "step": 498960 - }, - { - "epoch": 0.87, - "learning_rate": 6.4928134711230935e-06, - "loss": 2.2421, - "step": 498970 - }, - { - "epoch": 0.87, - "learning_rate": 6.491941531196267e-06, - "loss": 2.1909, - "step": 498980 - }, - { - "epoch": 0.87, - "learning_rate": 6.49106959126944e-06, - "loss": 2.1934, - "step": 498990 - }, - { - "epoch": 0.87, - "learning_rate": 6.490197651342614e-06, - "loss": 2.3474, - "step": 499000 - }, - { - "epoch": 0.87, - "learning_rate": 6.489325711415786e-06, - "loss": 2.2747, - "step": 499010 - }, - { - "epoch": 0.87, - "learning_rate": 6.48845377148896e-06, - "loss": 2.268, - "step": 499020 - }, - { - "epoch": 0.87, - "learning_rate": 6.487581831562133e-06, - "loss": 2.3106, - "step": 499030 - }, - { - "epoch": 0.87, - "learning_rate": 6.4867098916353065e-06, - "loss": 2.2857, - "step": 499040 - }, - { - "epoch": 0.87, - "learning_rate": 6.485837951708479e-06, - "loss": 2.3634, - "step": 499050 - }, - { - "epoch": 0.87, - "learning_rate": 6.484966011781652e-06, - "loss": 2.2039, - "step": 499060 - }, - { - "epoch": 0.87, - "learning_rate": 6.484094071854825e-06, - "loss": 2.2524, - "step": 499070 - }, - { - "epoch": 0.87, - "learning_rate": 6.483222131927999e-06, - "loss": 2.23, - "step": 499080 - }, - { - "epoch": 0.87, - "learning_rate": 6.482350192001173e-06, - "loss": 2.3385, - "step": 499090 - }, - { - "epoch": 0.87, - "learning_rate": 6.481478252074345e-06, - "loss": 2.2786, - "step": 499100 - }, - { - "epoch": 0.87, - "learning_rate": 6.480606312147519e-06, - "loss": 2.1769, - "step": 499110 - }, - { - "epoch": 0.87, - "learning_rate": 6.479734372220692e-06, - "loss": 2.1731, - "step": 499120 - }, - { - "epoch": 0.87, - "learning_rate": 6.478862432293865e-06, - "loss": 2.3326, - "step": 499130 - }, - { - "epoch": 0.87, - "learning_rate": 6.4779904923670375e-06, - "loss": 2.3854, - "step": 499140 - }, - { - "epoch": 0.87, - "learning_rate": 6.477118552440212e-06, - "loss": 2.2737, - "step": 499150 - }, - { - "epoch": 0.87, - "learning_rate": 6.476246612513384e-06, - "loss": 2.2221, - "step": 499160 - }, - { - "epoch": 0.87, - "learning_rate": 6.475374672586558e-06, - "loss": 2.2787, - "step": 499170 - }, - { - "epoch": 0.87, - "learning_rate": 6.474502732659731e-06, - "loss": 2.2923, - "step": 499180 - }, - { - "epoch": 0.87, - "learning_rate": 6.473630792732905e-06, - "loss": 2.3435, - "step": 499190 - }, - { - "epoch": 0.87, - "learning_rate": 6.472758852806077e-06, - "loss": 2.2098, - "step": 499200 - }, - { - "epoch": 0.87, - "learning_rate": 6.4718869128792505e-06, - "loss": 2.1515, - "step": 499210 - }, - { - "epoch": 0.87, - "learning_rate": 6.471014972952424e-06, - "loss": 2.291, - "step": 499220 - }, - { - "epoch": 0.87, - "learning_rate": 6.470143033025597e-06, - "loss": 2.318, - "step": 499230 - }, - { - "epoch": 0.87, - "learning_rate": 6.469271093098771e-06, - "loss": 2.3249, - "step": 499240 - }, - { - "epoch": 0.87, - "learning_rate": 6.468399153171943e-06, - "loss": 2.2203, - "step": 499250 - }, - { - "epoch": 0.87, - "learning_rate": 6.467527213245117e-06, - "loss": 2.2438, - "step": 499260 - }, - { - "epoch": 0.87, - "learning_rate": 6.46665527331829e-06, - "loss": 2.3548, - "step": 499270 - }, - { - "epoch": 0.87, - "learning_rate": 6.4657833333914635e-06, - "loss": 2.2404, - "step": 499280 - }, - { - "epoch": 0.87, - "learning_rate": 6.4649113934646355e-06, - "loss": 2.2624, - "step": 499290 - }, - { - "epoch": 0.87, - "learning_rate": 6.464039453537809e-06, - "loss": 2.1846, - "step": 499300 - }, - { - "epoch": 0.87, - "learning_rate": 6.463167513610982e-06, - "loss": 2.2327, - "step": 499310 - }, - { - "epoch": 0.87, - "learning_rate": 6.462295573684156e-06, - "loss": 2.3926, - "step": 499320 - }, - { - "epoch": 0.87, - "learning_rate": 6.461423633757328e-06, - "loss": 2.2635, - "step": 499330 - }, - { - "epoch": 0.87, - "learning_rate": 6.460551693830502e-06, - "loss": 2.3113, - "step": 499340 - }, - { - "epoch": 0.87, - "learning_rate": 6.459679753903676e-06, - "loss": 2.3495, - "step": 499350 - }, - { - "epoch": 0.87, - "learning_rate": 6.4588078139768485e-06, - "loss": 2.2396, - "step": 499360 - }, - { - "epoch": 0.87, - "learning_rate": 6.457935874050022e-06, - "loss": 2.2489, - "step": 499370 - }, - { - "epoch": 0.87, - "learning_rate": 6.457063934123194e-06, - "loss": 2.2225, - "step": 499380 - }, - { - "epoch": 0.87, - "learning_rate": 6.456191994196369e-06, - "loss": 2.2759, - "step": 499390 - }, - { - "epoch": 0.87, - "learning_rate": 6.455320054269541e-06, - "loss": 2.3294, - "step": 499400 - }, - { - "epoch": 0.87, - "learning_rate": 6.454448114342715e-06, - "loss": 2.1931, - "step": 499410 - }, - { - "epoch": 0.87, - "learning_rate": 6.453576174415888e-06, - "loss": 2.3295, - "step": 499420 - }, - { - "epoch": 0.87, - "learning_rate": 6.4527042344890615e-06, - "loss": 2.2764, - "step": 499430 - }, - { - "epoch": 0.87, - "learning_rate": 6.451832294562234e-06, - "loss": 2.0526, - "step": 499440 - }, - { - "epoch": 0.87, - "learning_rate": 6.450960354635407e-06, - "loss": 2.2423, - "step": 499450 - }, - { - "epoch": 0.87, - "learning_rate": 6.45008841470858e-06, - "loss": 2.3582, - "step": 499460 - }, - { - "epoch": 0.87, - "learning_rate": 6.449216474781754e-06, - "loss": 2.3281, - "step": 499470 - }, - { - "epoch": 0.87, - "learning_rate": 6.448344534854928e-06, - "loss": 2.3032, - "step": 499480 - }, - { - "epoch": 0.87, - "learning_rate": 6.4474725949281e-06, - "loss": 2.2486, - "step": 499490 - }, - { - "epoch": 0.87, - "learning_rate": 6.446600655001274e-06, - "loss": 2.482, - "step": 499500 - }, - { - "epoch": 0.87, - "learning_rate": 6.445728715074447e-06, - "loss": 2.3227, - "step": 499510 - }, - { - "epoch": 0.87, - "learning_rate": 6.44485677514762e-06, - "loss": 2.2508, - "step": 499520 - }, - { - "epoch": 0.87, - "learning_rate": 6.4439848352207925e-06, - "loss": 2.2386, - "step": 499530 - }, - { - "epoch": 0.87, - "learning_rate": 6.443112895293966e-06, - "loss": 2.1731, - "step": 499540 - }, - { - "epoch": 0.87, - "learning_rate": 6.442240955367139e-06, - "loss": 2.157, - "step": 499550 - }, - { - "epoch": 0.87, - "learning_rate": 6.441369015440313e-06, - "loss": 2.3516, - "step": 499560 - }, - { - "epoch": 0.87, - "learning_rate": 6.440497075513485e-06, - "loss": 2.2478, - "step": 499570 - }, - { - "epoch": 0.87, - "learning_rate": 6.439625135586659e-06, - "loss": 2.257, - "step": 499580 - }, - { - "epoch": 0.87, - "learning_rate": 6.438753195659832e-06, - "loss": 2.2879, - "step": 499590 - }, - { - "epoch": 0.87, - "learning_rate": 6.4378812557330055e-06, - "loss": 2.249, - "step": 499600 - }, - { - "epoch": 0.87, - "learning_rate": 6.437009315806179e-06, - "loss": 2.2173, - "step": 499610 - }, - { - "epoch": 0.87, - "learning_rate": 6.436137375879351e-06, - "loss": 2.302, - "step": 499620 - }, - { - "epoch": 0.87, - "learning_rate": 6.435265435952526e-06, - "loss": 2.284, - "step": 499630 - }, - { - "epoch": 0.87, - "learning_rate": 6.434393496025698e-06, - "loss": 2.3584, - "step": 499640 - }, - { - "epoch": 0.87, - "learning_rate": 6.433521556098872e-06, - "loss": 2.2245, - "step": 499650 - }, - { - "epoch": 0.87, - "learning_rate": 6.432649616172044e-06, - "loss": 2.3412, - "step": 499660 - }, - { - "epoch": 0.87, - "learning_rate": 6.4317776762452185e-06, - "loss": 2.2575, - "step": 499670 - }, - { - "epoch": 0.87, - "learning_rate": 6.4309057363183905e-06, - "loss": 2.2678, - "step": 499680 - }, - { - "epoch": 0.87, - "learning_rate": 6.430033796391564e-06, - "loss": 2.3505, - "step": 499690 - }, - { - "epoch": 0.87, - "learning_rate": 6.429161856464737e-06, - "loss": 2.258, - "step": 499700 - }, - { - "epoch": 0.87, - "learning_rate": 6.428289916537911e-06, - "loss": 2.2945, - "step": 499710 - }, - { - "epoch": 0.87, - "learning_rate": 6.427417976611083e-06, - "loss": 2.2827, - "step": 499720 - }, - { - "epoch": 0.87, - "learning_rate": 6.426546036684257e-06, - "loss": 2.3341, - "step": 499730 - }, - { - "epoch": 0.87, - "learning_rate": 6.42567409675743e-06, - "loss": 2.2713, - "step": 499740 - }, - { - "epoch": 0.87, - "learning_rate": 6.4248021568306035e-06, - "loss": 2.1662, - "step": 499750 - }, - { - "epoch": 0.87, - "learning_rate": 6.423930216903777e-06, - "loss": 2.3324, - "step": 499760 - }, - { - "epoch": 0.87, - "learning_rate": 6.423058276976949e-06, - "loss": 2.3939, - "step": 499770 - }, - { - "epoch": 0.87, - "learning_rate": 6.422186337050123e-06, - "loss": 2.4703, - "step": 499780 - }, - { - "epoch": 0.87, - "learning_rate": 6.421314397123296e-06, - "loss": 2.3147, - "step": 499790 - }, - { - "epoch": 0.87, - "learning_rate": 6.42044245719647e-06, - "loss": 2.201, - "step": 499800 - }, - { - "epoch": 0.87, - "learning_rate": 6.419570517269642e-06, - "loss": 2.2675, - "step": 499810 - }, - { - "epoch": 0.87, - "learning_rate": 6.418698577342816e-06, - "loss": 2.2701, - "step": 499820 - }, - { - "epoch": 0.87, - "learning_rate": 6.417826637415989e-06, - "loss": 2.3119, - "step": 499830 - }, - { - "epoch": 0.87, - "learning_rate": 6.416954697489162e-06, - "loss": 2.295, - "step": 499840 - }, - { - "epoch": 0.87, - "learning_rate": 6.4160827575623345e-06, - "loss": 2.3536, - "step": 499850 - }, - { - "epoch": 0.87, - "learning_rate": 6.415210817635508e-06, - "loss": 2.3161, - "step": 499860 - }, - { - "epoch": 0.87, - "learning_rate": 6.414338877708681e-06, - "loss": 2.2183, - "step": 499870 - }, - { - "epoch": 0.87, - "learning_rate": 6.413466937781855e-06, - "loss": 2.2751, - "step": 499880 - }, - { - "epoch": 0.87, - "learning_rate": 6.412594997855029e-06, - "loss": 2.267, - "step": 499890 - }, - { - "epoch": 0.87, - "learning_rate": 6.411723057928201e-06, - "loss": 2.2859, - "step": 499900 - }, - { - "epoch": 0.87, - "learning_rate": 6.410851118001375e-06, - "loss": 2.3136, - "step": 499910 - }, - { - "epoch": 0.87, - "learning_rate": 6.4099791780745475e-06, - "loss": 2.1233, - "step": 499920 - }, - { - "epoch": 0.87, - "learning_rate": 6.409107238147721e-06, - "loss": 2.1935, - "step": 499930 - }, - { - "epoch": 0.87, - "learning_rate": 6.408235298220894e-06, - "loss": 2.2883, - "step": 499940 - }, - { - "epoch": 0.87, - "learning_rate": 6.407363358294068e-06, - "loss": 2.2693, - "step": 499950 - }, - { - "epoch": 0.87, - "learning_rate": 6.40649141836724e-06, - "loss": 2.2949, - "step": 499960 - }, - { - "epoch": 0.87, - "learning_rate": 6.405619478440414e-06, - "loss": 2.4242, - "step": 499970 - }, - { - "epoch": 0.87, - "learning_rate": 6.404747538513587e-06, - "loss": 2.1458, - "step": 499980 - }, - { - "epoch": 0.87, - "learning_rate": 6.4038755985867605e-06, - "loss": 2.2496, - "step": 499990 - }, - { - "epoch": 0.87, - "learning_rate": 6.4030036586599326e-06, - "loss": 2.2421, - "step": 500000 - }, - { - "epoch": 0.87, - "learning_rate": 6.402131718733106e-06, - "loss": 2.3332, - "step": 500010 - }, - { - "epoch": 0.87, - "learning_rate": 6.40125977880628e-06, - "loss": 2.2208, - "step": 500020 - }, - { - "epoch": 0.87, - "learning_rate": 6.400387838879453e-06, - "loss": 2.2898, - "step": 500030 - }, - { - "epoch": 0.87, - "learning_rate": 6.399515898952627e-06, - "loss": 2.2042, - "step": 500040 - }, - { - "epoch": 0.87, - "learning_rate": 6.398643959025799e-06, - "loss": 2.3528, - "step": 500050 - }, - { - "epoch": 0.87, - "learning_rate": 6.397772019098973e-06, - "loss": 2.3925, - "step": 500060 - }, - { - "epoch": 0.87, - "learning_rate": 6.3969000791721456e-06, - "loss": 2.2716, - "step": 500070 - }, - { - "epoch": 0.87, - "learning_rate": 6.396028139245319e-06, - "loss": 2.2415, - "step": 500080 - }, - { - "epoch": 0.87, - "learning_rate": 6.395156199318491e-06, - "loss": 2.2198, - "step": 500090 - }, - { - "epoch": 0.87, - "learning_rate": 6.394284259391665e-06, - "loss": 2.2259, - "step": 500100 - }, - { - "epoch": 0.87, - "learning_rate": 6.393412319464838e-06, - "loss": 2.2742, - "step": 500110 - }, - { - "epoch": 0.87, - "learning_rate": 6.392540379538012e-06, - "loss": 2.1857, - "step": 500120 - }, - { - "epoch": 0.87, - "learning_rate": 6.391668439611184e-06, - "loss": 2.3398, - "step": 500130 - }, - { - "epoch": 0.87, - "learning_rate": 6.390796499684358e-06, - "loss": 2.263, - "step": 500140 - }, - { - "epoch": 0.87, - "learning_rate": 6.389924559757532e-06, - "loss": 2.2602, - "step": 500150 - }, - { - "epoch": 0.87, - "learning_rate": 6.389052619830704e-06, - "loss": 2.2097, - "step": 500160 - }, - { - "epoch": 0.87, - "learning_rate": 6.388180679903878e-06, - "loss": 2.1323, - "step": 500170 - }, - { - "epoch": 0.87, - "learning_rate": 6.38730873997705e-06, - "loss": 2.2409, - "step": 500180 - }, - { - "epoch": 0.87, - "learning_rate": 6.386436800050225e-06, - "loss": 2.2686, - "step": 500190 - }, - { - "epoch": 0.87, - "learning_rate": 6.385564860123397e-06, - "loss": 2.2216, - "step": 500200 - }, - { - "epoch": 0.87, - "learning_rate": 6.384692920196571e-06, - "loss": 2.2068, - "step": 500210 - }, - { - "epoch": 0.87, - "learning_rate": 6.383820980269744e-06, - "loss": 2.3252, - "step": 500220 - }, - { - "epoch": 0.87, - "learning_rate": 6.382949040342917e-06, - "loss": 2.2985, - "step": 500230 - }, - { - "epoch": 0.87, - "learning_rate": 6.3820771004160895e-06, - "loss": 2.2631, - "step": 500240 - }, - { - "epoch": 0.87, - "learning_rate": 6.381205160489263e-06, - "loss": 2.2294, - "step": 500250 - }, - { - "epoch": 0.87, - "learning_rate": 6.380333220562436e-06, - "loss": 2.2044, - "step": 500260 - }, - { - "epoch": 0.87, - "learning_rate": 6.37946128063561e-06, - "loss": 2.3103, - "step": 500270 - }, - { - "epoch": 0.87, - "learning_rate": 6.378589340708784e-06, - "loss": 2.2311, - "step": 500280 - }, - { - "epoch": 0.87, - "learning_rate": 6.377717400781956e-06, - "loss": 2.2914, - "step": 500290 - }, - { - "epoch": 0.87, - "learning_rate": 6.3768454608551296e-06, - "loss": 2.1067, - "step": 500300 - }, - { - "epoch": 0.87, - "learning_rate": 6.3759735209283025e-06, - "loss": 2.2371, - "step": 500310 - }, - { - "epoch": 0.87, - "learning_rate": 6.375101581001476e-06, - "loss": 2.3209, - "step": 500320 - }, - { - "epoch": 0.87, - "learning_rate": 6.374229641074648e-06, - "loss": 2.2413, - "step": 500330 - }, - { - "epoch": 0.87, - "learning_rate": 6.373357701147822e-06, - "loss": 2.2787, - "step": 500340 - }, - { - "epoch": 0.87, - "learning_rate": 6.372485761220995e-06, - "loss": 2.2704, - "step": 500350 - }, - { - "epoch": 0.87, - "learning_rate": 6.371613821294169e-06, - "loss": 2.1319, - "step": 500360 - }, - { - "epoch": 0.87, - "learning_rate": 6.370741881367341e-06, - "loss": 2.2345, - "step": 500370 - }, - { - "epoch": 0.87, - "learning_rate": 6.369869941440515e-06, - "loss": 2.3687, - "step": 500380 - }, - { - "epoch": 0.87, - "learning_rate": 6.3689980015136876e-06, - "loss": 2.1393, - "step": 500390 - }, - { - "epoch": 0.87, - "learning_rate": 6.368126061586861e-06, - "loss": 2.1953, - "step": 500400 - }, - { - "epoch": 0.87, - "learning_rate": 6.367254121660035e-06, - "loss": 2.211, - "step": 500410 - }, - { - "epoch": 0.87, - "learning_rate": 6.366382181733207e-06, - "loss": 2.215, - "step": 500420 - }, - { - "epoch": 0.87, - "learning_rate": 6.365510241806382e-06, - "loss": 2.2302, - "step": 500430 - }, - { - "epoch": 0.87, - "learning_rate": 6.364638301879554e-06, - "loss": 2.3597, - "step": 500440 - }, - { - "epoch": 0.87, - "learning_rate": 6.363766361952728e-06, - "loss": 2.1408, - "step": 500450 - }, - { - "epoch": 0.87, - "learning_rate": 6.3628944220259006e-06, - "loss": 2.2521, - "step": 500460 - }, - { - "epoch": 0.87, - "learning_rate": 6.362022482099074e-06, - "loss": 2.2135, - "step": 500470 - }, - { - "epoch": 0.87, - "learning_rate": 6.361150542172246e-06, - "loss": 2.2428, - "step": 500480 - }, - { - "epoch": 0.87, - "learning_rate": 6.36027860224542e-06, - "loss": 2.3035, - "step": 500490 - }, - { - "epoch": 0.87, - "learning_rate": 6.359406662318593e-06, - "loss": 2.3079, - "step": 500500 - }, - { - "epoch": 0.87, - "learning_rate": 6.358534722391767e-06, - "loss": 2.3362, - "step": 500510 - }, - { - "epoch": 0.87, - "learning_rate": 6.357662782464939e-06, - "loss": 2.2898, - "step": 500520 - }, - { - "epoch": 0.87, - "learning_rate": 6.356790842538113e-06, - "loss": 2.2604, - "step": 500530 - }, - { - "epoch": 0.87, - "learning_rate": 6.355918902611286e-06, - "loss": 2.3497, - "step": 500540 - }, - { - "epoch": 0.87, - "learning_rate": 6.355046962684459e-06, - "loss": 2.1422, - "step": 500550 - }, - { - "epoch": 0.87, - "learning_rate": 6.354175022757633e-06, - "loss": 2.2949, - "step": 500560 - }, - { - "epoch": 0.87, - "learning_rate": 6.353303082830805e-06, - "loss": 2.3505, - "step": 500570 - }, - { - "epoch": 0.87, - "learning_rate": 6.352431142903979e-06, - "loss": 2.1684, - "step": 500580 - }, - { - "epoch": 0.87, - "learning_rate": 6.351559202977152e-06, - "loss": 2.3015, - "step": 500590 - }, - { - "epoch": 0.87, - "learning_rate": 6.350687263050326e-06, - "loss": 2.225, - "step": 500600 - }, - { - "epoch": 0.87, - "learning_rate": 6.349815323123498e-06, - "loss": 2.2301, - "step": 500610 - }, - { - "epoch": 0.87, - "learning_rate": 6.3489433831966716e-06, - "loss": 2.2418, - "step": 500620 - }, - { - "epoch": 0.87, - "learning_rate": 6.3480714432698445e-06, - "loss": 2.2809, - "step": 500630 - }, - { - "epoch": 0.87, - "learning_rate": 6.347199503343018e-06, - "loss": 2.246, - "step": 500640 - }, - { - "epoch": 0.87, - "learning_rate": 6.34632756341619e-06, - "loss": 2.3246, - "step": 500650 - }, - { - "epoch": 0.87, - "learning_rate": 6.345455623489364e-06, - "loss": 2.111, - "step": 500660 - }, - { - "epoch": 0.87, - "learning_rate": 6.344583683562537e-06, - "loss": 2.2568, - "step": 500670 - }, - { - "epoch": 0.87, - "learning_rate": 6.343711743635711e-06, - "loss": 2.1685, - "step": 500680 - }, - { - "epoch": 0.87, - "learning_rate": 6.3428398037088846e-06, - "loss": 2.3374, - "step": 500690 - }, - { - "epoch": 0.87, - "learning_rate": 6.341967863782057e-06, - "loss": 2.2815, - "step": 500700 - }, - { - "epoch": 0.87, - "learning_rate": 6.341095923855231e-06, - "loss": 2.2834, - "step": 500710 - }, - { - "epoch": 0.87, - "learning_rate": 6.340223983928403e-06, - "loss": 2.3296, - "step": 500720 - }, - { - "epoch": 0.87, - "learning_rate": 6.339352044001577e-06, - "loss": 2.2576, - "step": 500730 - }, - { - "epoch": 0.87, - "learning_rate": 6.33848010407475e-06, - "loss": 2.3097, - "step": 500740 - }, - { - "epoch": 0.87, - "learning_rate": 6.337608164147924e-06, - "loss": 2.3379, - "step": 500750 - }, - { - "epoch": 0.87, - "learning_rate": 6.336736224221096e-06, - "loss": 2.2889, - "step": 500760 - }, - { - "epoch": 0.87, - "learning_rate": 6.33586428429427e-06, - "loss": 2.2348, - "step": 500770 - }, - { - "epoch": 0.87, - "learning_rate": 6.3349923443674426e-06, - "loss": 2.1828, - "step": 500780 - }, - { - "epoch": 0.87, - "learning_rate": 6.334120404440616e-06, - "loss": 2.2882, - "step": 500790 - }, - { - "epoch": 0.87, - "learning_rate": 6.333248464513788e-06, - "loss": 2.2353, - "step": 500800 - }, - { - "epoch": 0.87, - "learning_rate": 6.332376524586962e-06, - "loss": 2.2576, - "step": 500810 - }, - { - "epoch": 0.87, - "learning_rate": 6.331504584660136e-06, - "loss": 2.2172, - "step": 500820 - }, - { - "epoch": 0.87, - "learning_rate": 6.330632644733309e-06, - "loss": 2.1372, - "step": 500830 - }, - { - "epoch": 0.87, - "learning_rate": 6.329760704806483e-06, - "loss": 2.2122, - "step": 500840 - }, - { - "epoch": 0.87, - "learning_rate": 6.328888764879655e-06, - "loss": 2.2753, - "step": 500850 - }, - { - "epoch": 0.87, - "learning_rate": 6.3280168249528285e-06, - "loss": 2.297, - "step": 500860 - }, - { - "epoch": 0.87, - "learning_rate": 6.327144885026001e-06, - "loss": 2.2797, - "step": 500870 - }, - { - "epoch": 0.87, - "learning_rate": 6.326272945099175e-06, - "loss": 2.289, - "step": 500880 - }, - { - "epoch": 0.87, - "learning_rate": 6.325401005172347e-06, - "loss": 2.2051, - "step": 500890 - }, - { - "epoch": 0.87, - "learning_rate": 6.324529065245521e-06, - "loss": 2.3045, - "step": 500900 - }, - { - "epoch": 0.87, - "learning_rate": 6.323657125318694e-06, - "loss": 2.2798, - "step": 500910 - }, - { - "epoch": 0.87, - "learning_rate": 6.322785185391868e-06, - "loss": 2.2991, - "step": 500920 - }, - { - "epoch": 0.87, - "learning_rate": 6.32191324546504e-06, - "loss": 2.3561, - "step": 500930 - }, - { - "epoch": 0.87, - "learning_rate": 6.3210413055382136e-06, - "loss": 2.3479, - "step": 500940 - }, - { - "epoch": 0.87, - "learning_rate": 6.320169365611388e-06, - "loss": 2.2869, - "step": 500950 - }, - { - "epoch": 0.87, - "learning_rate": 6.31929742568456e-06, - "loss": 2.2811, - "step": 500960 - }, - { - "epoch": 0.87, - "learning_rate": 6.318425485757734e-06, - "loss": 2.2683, - "step": 500970 - }, - { - "epoch": 0.87, - "learning_rate": 6.317553545830907e-06, - "loss": 2.2276, - "step": 500980 - }, - { - "epoch": 0.87, - "learning_rate": 6.316681605904081e-06, - "loss": 2.1738, - "step": 500990 - }, - { - "epoch": 0.87, - "learning_rate": 6.315809665977253e-06, - "loss": 2.2791, - "step": 501000 - }, - { - "epoch": 0.87, - "learning_rate": 6.3149377260504266e-06, - "loss": 2.38, - "step": 501010 - }, - { - "epoch": 0.87, - "learning_rate": 6.3140657861235995e-06, - "loss": 2.2896, - "step": 501020 - }, - { - "epoch": 0.87, - "learning_rate": 6.313193846196773e-06, - "loss": 2.2731, - "step": 501030 - }, - { - "epoch": 0.87, - "learning_rate": 6.312321906269945e-06, - "loss": 2.3262, - "step": 501040 - }, - { - "epoch": 0.87, - "learning_rate": 6.311449966343119e-06, - "loss": 2.3911, - "step": 501050 - }, - { - "epoch": 0.87, - "learning_rate": 6.310578026416292e-06, - "loss": 2.174, - "step": 501060 - }, - { - "epoch": 0.87, - "learning_rate": 6.309706086489466e-06, - "loss": 2.2631, - "step": 501070 - }, - { - "epoch": 0.87, - "learning_rate": 6.3088341465626396e-06, - "loss": 2.2664, - "step": 501080 - }, - { - "epoch": 0.87, - "learning_rate": 6.307962206635812e-06, - "loss": 2.2414, - "step": 501090 - }, - { - "epoch": 0.87, - "learning_rate": 6.307090266708985e-06, - "loss": 2.2554, - "step": 501100 - }, - { - "epoch": 0.87, - "learning_rate": 6.306218326782158e-06, - "loss": 2.3292, - "step": 501110 - }, - { - "epoch": 0.87, - "learning_rate": 6.305346386855332e-06, - "loss": 2.2805, - "step": 501120 - }, - { - "epoch": 0.87, - "learning_rate": 6.304474446928504e-06, - "loss": 2.3584, - "step": 501130 - }, - { - "epoch": 0.87, - "learning_rate": 6.303602507001678e-06, - "loss": 2.2757, - "step": 501140 - }, - { - "epoch": 0.87, - "learning_rate": 6.302730567074851e-06, - "loss": 2.2463, - "step": 501150 - }, - { - "epoch": 0.87, - "learning_rate": 6.301858627148025e-06, - "loss": 2.2143, - "step": 501160 - }, - { - "epoch": 0.87, - "learning_rate": 6.300986687221197e-06, - "loss": 2.2835, - "step": 501170 - }, - { - "epoch": 0.87, - "learning_rate": 6.3001147472943705e-06, - "loss": 2.1911, - "step": 501180 - }, - { - "epoch": 0.87, - "learning_rate": 6.299242807367543e-06, - "loss": 2.1995, - "step": 501190 - }, - { - "epoch": 0.87, - "learning_rate": 6.298370867440717e-06, - "loss": 2.3001, - "step": 501200 - }, - { - "epoch": 0.87, - "learning_rate": 6.297498927513891e-06, - "loss": 2.1906, - "step": 501210 - }, - { - "epoch": 0.87, - "learning_rate": 6.296626987587063e-06, - "loss": 2.258, - "step": 501220 - }, - { - "epoch": 0.87, - "learning_rate": 6.295755047660238e-06, - "loss": 2.2151, - "step": 501230 - }, - { - "epoch": 0.87, - "learning_rate": 6.29488310773341e-06, - "loss": 2.2972, - "step": 501240 - }, - { - "epoch": 0.87, - "learning_rate": 6.2940111678065835e-06, - "loss": 2.3644, - "step": 501250 - }, - { - "epoch": 0.87, - "learning_rate": 6.293139227879756e-06, - "loss": 2.3537, - "step": 501260 - }, - { - "epoch": 0.87, - "learning_rate": 6.29226728795293e-06, - "loss": 2.2808, - "step": 501270 - }, - { - "epoch": 0.87, - "learning_rate": 6.291395348026102e-06, - "loss": 2.3265, - "step": 501280 - }, - { - "epoch": 0.87, - "learning_rate": 6.290523408099276e-06, - "loss": 2.2175, - "step": 501290 - }, - { - "epoch": 0.87, - "learning_rate": 6.289651468172449e-06, - "loss": 2.2653, - "step": 501300 - }, - { - "epoch": 0.87, - "learning_rate": 6.288779528245623e-06, - "loss": 2.2342, - "step": 501310 - }, - { - "epoch": 0.87, - "learning_rate": 6.287907588318795e-06, - "loss": 2.2997, - "step": 501320 - }, - { - "epoch": 0.87, - "learning_rate": 6.2870356483919686e-06, - "loss": 2.3674, - "step": 501330 - }, - { - "epoch": 0.87, - "learning_rate": 6.286163708465142e-06, - "loss": 2.2447, - "step": 501340 - }, - { - "epoch": 0.87, - "learning_rate": 6.285291768538315e-06, - "loss": 2.2001, - "step": 501350 - }, - { - "epoch": 0.87, - "learning_rate": 6.284419828611489e-06, - "loss": 2.2534, - "step": 501360 - }, - { - "epoch": 0.87, - "learning_rate": 6.283547888684661e-06, - "loss": 2.2117, - "step": 501370 - }, - { - "epoch": 0.87, - "learning_rate": 6.282675948757835e-06, - "loss": 2.3578, - "step": 501380 - }, - { - "epoch": 0.87, - "learning_rate": 6.281804008831008e-06, - "loss": 2.3648, - "step": 501390 - }, - { - "epoch": 0.87, - "learning_rate": 6.2809320689041816e-06, - "loss": 2.3638, - "step": 501400 - }, - { - "epoch": 0.87, - "learning_rate": 6.280060128977354e-06, - "loss": 2.2622, - "step": 501410 - }, - { - "epoch": 0.87, - "learning_rate": 6.279188189050527e-06, - "loss": 2.2662, - "step": 501420 - }, - { - "epoch": 0.87, - "learning_rate": 6.2783162491237e-06, - "loss": 2.2398, - "step": 501430 - }, - { - "epoch": 0.87, - "learning_rate": 6.277444309196874e-06, - "loss": 2.1692, - "step": 501440 - }, - { - "epoch": 0.87, - "learning_rate": 6.276572369270046e-06, - "loss": 2.2505, - "step": 501450 - }, - { - "epoch": 0.87, - "learning_rate": 6.27570042934322e-06, - "loss": 2.3539, - "step": 501460 - }, - { - "epoch": 0.87, - "learning_rate": 6.274828489416393e-06, - "loss": 2.2715, - "step": 501470 - }, - { - "epoch": 0.87, - "learning_rate": 6.273956549489567e-06, - "loss": 2.2269, - "step": 501480 - }, - { - "epoch": 0.87, - "learning_rate": 6.27308460956274e-06, - "loss": 2.287, - "step": 501490 - }, - { - "epoch": 0.87, - "learning_rate": 6.272212669635913e-06, - "loss": 2.4111, - "step": 501500 - }, - { - "epoch": 0.87, - "learning_rate": 6.271340729709087e-06, - "loss": 2.1125, - "step": 501510 - }, - { - "epoch": 0.87, - "learning_rate": 6.270468789782259e-06, - "loss": 2.2084, - "step": 501520 - }, - { - "epoch": 0.87, - "learning_rate": 6.269596849855433e-06, - "loss": 2.2129, - "step": 501530 - }, - { - "epoch": 0.87, - "learning_rate": 6.268724909928606e-06, - "loss": 2.145, - "step": 501540 - }, - { - "epoch": 0.87, - "learning_rate": 6.26785297000178e-06, - "loss": 2.2609, - "step": 501550 - }, - { - "epoch": 0.87, - "learning_rate": 6.266981030074952e-06, - "loss": 2.3183, - "step": 501560 - }, - { - "epoch": 0.87, - "learning_rate": 6.2661090901481255e-06, - "loss": 2.3174, - "step": 501570 - }, - { - "epoch": 0.87, - "learning_rate": 6.265237150221298e-06, - "loss": 2.2598, - "step": 501580 - }, - { - "epoch": 0.87, - "learning_rate": 6.264365210294472e-06, - "loss": 2.3058, - "step": 501590 - }, - { - "epoch": 0.87, - "learning_rate": 6.263493270367644e-06, - "loss": 2.2617, - "step": 501600 - }, - { - "epoch": 0.87, - "learning_rate": 6.262621330440818e-06, - "loss": 2.302, - "step": 501610 - }, - { - "epoch": 0.87, - "learning_rate": 6.261749390513992e-06, - "loss": 2.3612, - "step": 501620 - }, - { - "epoch": 0.87, - "learning_rate": 6.260877450587165e-06, - "loss": 2.239, - "step": 501630 - }, - { - "epoch": 0.87, - "learning_rate": 6.2600055106603385e-06, - "loss": 2.3514, - "step": 501640 - }, - { - "epoch": 0.87, - "learning_rate": 6.2591335707335106e-06, - "loss": 2.374, - "step": 501650 - }, - { - "epoch": 0.87, - "learning_rate": 6.258261630806684e-06, - "loss": 2.1015, - "step": 501660 - }, - { - "epoch": 0.87, - "learning_rate": 6.257389690879857e-06, - "loss": 2.2665, - "step": 501670 - }, - { - "epoch": 0.87, - "learning_rate": 6.256517750953031e-06, - "loss": 2.2074, - "step": 501680 - }, - { - "epoch": 0.87, - "learning_rate": 6.255645811026203e-06, - "loss": 2.2674, - "step": 501690 - }, - { - "epoch": 0.87, - "learning_rate": 6.254773871099377e-06, - "loss": 2.3677, - "step": 501700 - }, - { - "epoch": 0.87, - "learning_rate": 6.25390193117255e-06, - "loss": 2.3134, - "step": 501710 - }, - { - "epoch": 0.87, - "learning_rate": 6.2530299912457236e-06, - "loss": 2.235, - "step": 501720 - }, - { - "epoch": 0.87, - "learning_rate": 6.252158051318896e-06, - "loss": 2.2009, - "step": 501730 - }, - { - "epoch": 0.87, - "learning_rate": 6.251286111392069e-06, - "loss": 2.2837, - "step": 501740 - }, - { - "epoch": 0.87, - "learning_rate": 6.250414171465244e-06, - "loss": 2.1998, - "step": 501750 - }, - { - "epoch": 0.88, - "learning_rate": 6.249542231538416e-06, - "loss": 2.2533, - "step": 501760 - }, - { - "epoch": 0.88, - "learning_rate": 6.248670291611589e-06, - "loss": 2.2138, - "step": 501770 - }, - { - "epoch": 0.88, - "learning_rate": 6.247798351684763e-06, - "loss": 2.2734, - "step": 501780 - }, - { - "epoch": 0.88, - "learning_rate": 6.246926411757936e-06, - "loss": 2.2649, - "step": 501790 - }, - { - "epoch": 0.88, - "learning_rate": 6.246054471831109e-06, - "loss": 2.3235, - "step": 501800 - }, - { - "epoch": 0.88, - "learning_rate": 6.245182531904282e-06, - "loss": 2.2048, - "step": 501810 - }, - { - "epoch": 0.88, - "learning_rate": 6.244310591977455e-06, - "loss": 2.1426, - "step": 501820 - }, - { - "epoch": 0.88, - "learning_rate": 6.243438652050629e-06, - "loss": 2.2931, - "step": 501830 - }, - { - "epoch": 0.88, - "learning_rate": 6.242566712123802e-06, - "loss": 2.2571, - "step": 501840 - }, - { - "epoch": 0.88, - "learning_rate": 6.241694772196975e-06, - "loss": 2.1535, - "step": 501850 - }, - { - "epoch": 0.88, - "learning_rate": 6.240822832270148e-06, - "loss": 2.2192, - "step": 501860 - }, - { - "epoch": 0.88, - "learning_rate": 6.239950892343322e-06, - "loss": 2.1789, - "step": 501870 - }, - { - "epoch": 0.88, - "learning_rate": 6.2390789524164946e-06, - "loss": 2.2066, - "step": 501880 - }, - { - "epoch": 0.88, - "learning_rate": 6.2382070124896675e-06, - "loss": 2.2442, - "step": 501890 - }, - { - "epoch": 0.88, - "learning_rate": 6.237335072562841e-06, - "loss": 2.2635, - "step": 501900 - }, - { - "epoch": 0.88, - "learning_rate": 6.236463132636014e-06, - "loss": 2.2874, - "step": 501910 - }, - { - "epoch": 0.88, - "learning_rate": 6.235591192709187e-06, - "loss": 2.2955, - "step": 501920 - }, - { - "epoch": 0.88, - "learning_rate": 6.23471925278236e-06, - "loss": 2.3536, - "step": 501930 - }, - { - "epoch": 0.88, - "learning_rate": 6.233847312855534e-06, - "loss": 2.365, - "step": 501940 - }, - { - "epoch": 0.88, - "learning_rate": 6.2329753729287076e-06, - "loss": 2.2343, - "step": 501950 - }, - { - "epoch": 0.88, - "learning_rate": 6.2321034330018805e-06, - "loss": 2.2412, - "step": 501960 - }, - { - "epoch": 0.88, - "learning_rate": 6.231231493075053e-06, - "loss": 2.297, - "step": 501970 - }, - { - "epoch": 0.88, - "learning_rate": 6.230359553148226e-06, - "loss": 2.2162, - "step": 501980 - }, - { - "epoch": 0.88, - "learning_rate": 6.2294876132214e-06, - "loss": 2.3832, - "step": 501990 - }, - { - "epoch": 0.88, - "learning_rate": 6.228615673294573e-06, - "loss": 2.2731, - "step": 502000 - }, - { - "epoch": 0.88, - "learning_rate": 6.227743733367746e-06, - "loss": 2.2535, - "step": 502010 - }, - { - "epoch": 0.88, - "learning_rate": 6.22687179344092e-06, - "loss": 2.1911, - "step": 502020 - }, - { - "epoch": 0.88, - "learning_rate": 6.225999853514093e-06, - "loss": 2.3217, - "step": 502030 - }, - { - "epoch": 0.88, - "learning_rate": 6.2251279135872656e-06, - "loss": 2.321, - "step": 502040 - }, - { - "epoch": 0.88, - "learning_rate": 6.2242559736604385e-06, - "loss": 2.318, - "step": 502050 - }, - { - "epoch": 0.88, - "learning_rate": 6.223384033733612e-06, - "loss": 2.2277, - "step": 502060 - }, - { - "epoch": 0.88, - "learning_rate": 6.222512093806785e-06, - "loss": 2.2887, - "step": 502070 - }, - { - "epoch": 0.88, - "learning_rate": 6.221640153879959e-06, - "loss": 2.2113, - "step": 502080 - }, - { - "epoch": 0.88, - "learning_rate": 6.220768213953132e-06, - "loss": 2.2665, - "step": 502090 - }, - { - "epoch": 0.88, - "learning_rate": 6.219896274026305e-06, - "loss": 2.1246, - "step": 502100 - }, - { - "epoch": 0.88, - "learning_rate": 6.2190243340994786e-06, - "loss": 2.2417, - "step": 502110 - }, - { - "epoch": 0.88, - "learning_rate": 6.2181523941726515e-06, - "loss": 2.2818, - "step": 502120 - }, - { - "epoch": 0.88, - "learning_rate": 6.217280454245824e-06, - "loss": 2.3272, - "step": 502130 - }, - { - "epoch": 0.88, - "learning_rate": 6.216408514318997e-06, - "loss": 2.3612, - "step": 502140 - }, - { - "epoch": 0.88, - "learning_rate": 6.215536574392171e-06, - "loss": 2.2885, - "step": 502150 - }, - { - "epoch": 0.88, - "learning_rate": 6.214664634465344e-06, - "loss": 2.2033, - "step": 502160 - }, - { - "epoch": 0.88, - "learning_rate": 6.213792694538517e-06, - "loss": 2.2633, - "step": 502170 - }, - { - "epoch": 0.88, - "learning_rate": 6.212920754611691e-06, - "loss": 2.3387, - "step": 502180 - }, - { - "epoch": 0.88, - "learning_rate": 6.212048814684864e-06, - "loss": 2.2911, - "step": 502190 - }, - { - "epoch": 0.88, - "learning_rate": 6.2111768747580366e-06, - "loss": 2.3144, - "step": 502200 - }, - { - "epoch": 0.88, - "learning_rate": 6.21030493483121e-06, - "loss": 2.2786, - "step": 502210 - }, - { - "epoch": 0.88, - "learning_rate": 6.209432994904383e-06, - "loss": 2.2242, - "step": 502220 - }, - { - "epoch": 0.88, - "learning_rate": 6.208561054977557e-06, - "loss": 2.31, - "step": 502230 - }, - { - "epoch": 0.88, - "learning_rate": 6.20768911505073e-06, - "loss": 2.2305, - "step": 502240 - }, - { - "epoch": 0.88, - "learning_rate": 6.206817175123903e-06, - "loss": 2.2292, - "step": 502250 - }, - { - "epoch": 0.88, - "learning_rate": 6.205945235197076e-06, - "loss": 2.2512, - "step": 502260 - }, - { - "epoch": 0.88, - "learning_rate": 6.2050732952702496e-06, - "loss": 2.3828, - "step": 502270 - }, - { - "epoch": 0.88, - "learning_rate": 6.2042013553434225e-06, - "loss": 2.275, - "step": 502280 - }, - { - "epoch": 0.88, - "learning_rate": 6.203329415416595e-06, - "loss": 2.2548, - "step": 502290 - }, - { - "epoch": 0.88, - "learning_rate": 6.202457475489769e-06, - "loss": 2.2983, - "step": 502300 - }, - { - "epoch": 0.88, - "learning_rate": 6.201585535562942e-06, - "loss": 2.2263, - "step": 502310 - }, - { - "epoch": 0.88, - "learning_rate": 6.200713595636115e-06, - "loss": 2.3338, - "step": 502320 - }, - { - "epoch": 0.88, - "learning_rate": 6.199841655709288e-06, - "loss": 2.2187, - "step": 502330 - }, - { - "epoch": 0.88, - "learning_rate": 6.198969715782462e-06, - "loss": 2.258, - "step": 502340 - }, - { - "epoch": 0.88, - "learning_rate": 6.1980977758556355e-06, - "loss": 2.2603, - "step": 502350 - }, - { - "epoch": 0.88, - "learning_rate": 6.197225835928808e-06, - "loss": 2.2957, - "step": 502360 - }, - { - "epoch": 0.88, - "learning_rate": 6.196353896001981e-06, - "loss": 2.2864, - "step": 502370 - }, - { - "epoch": 0.88, - "learning_rate": 6.195481956075154e-06, - "loss": 2.3206, - "step": 502380 - }, - { - "epoch": 0.88, - "learning_rate": 6.194610016148328e-06, - "loss": 2.2552, - "step": 502390 - }, - { - "epoch": 0.88, - "learning_rate": 6.193738076221501e-06, - "loss": 2.3713, - "step": 502400 - }, - { - "epoch": 0.88, - "learning_rate": 6.192866136294674e-06, - "loss": 2.3164, - "step": 502410 - }, - { - "epoch": 0.88, - "learning_rate": 6.191994196367848e-06, - "loss": 2.2193, - "step": 502420 - }, - { - "epoch": 0.88, - "learning_rate": 6.1911222564410206e-06, - "loss": 2.2031, - "step": 502430 - }, - { - "epoch": 0.88, - "learning_rate": 6.1902503165141935e-06, - "loss": 2.2437, - "step": 502440 - }, - { - "epoch": 0.88, - "learning_rate": 6.189378376587366e-06, - "loss": 2.3648, - "step": 502450 - }, - { - "epoch": 0.88, - "learning_rate": 6.18850643666054e-06, - "loss": 2.3077, - "step": 502460 - }, - { - "epoch": 0.88, - "learning_rate": 6.187634496733714e-06, - "loss": 2.2532, - "step": 502470 - }, - { - "epoch": 0.88, - "learning_rate": 6.186762556806887e-06, - "loss": 2.2183, - "step": 502480 - }, - { - "epoch": 0.88, - "learning_rate": 6.18589061688006e-06, - "loss": 2.1425, - "step": 502490 - }, - { - "epoch": 0.88, - "learning_rate": 6.185018676953233e-06, - "loss": 2.1368, - "step": 502500 - }, - { - "epoch": 0.88, - "learning_rate": 6.1841467370264065e-06, - "loss": 2.2663, - "step": 502510 - }, - { - "epoch": 0.88, - "learning_rate": 6.183274797099579e-06, - "loss": 2.221, - "step": 502520 - }, - { - "epoch": 0.88, - "learning_rate": 6.182402857172752e-06, - "loss": 2.291, - "step": 502530 - }, - { - "epoch": 0.88, - "learning_rate": 6.181530917245926e-06, - "loss": 2.2433, - "step": 502540 - }, - { - "epoch": 0.88, - "learning_rate": 6.180658977319099e-06, - "loss": 2.2758, - "step": 502550 - }, - { - "epoch": 0.88, - "learning_rate": 6.179787037392272e-06, - "loss": 2.2706, - "step": 502560 - }, - { - "epoch": 0.88, - "learning_rate": 6.178915097465445e-06, - "loss": 2.3154, - "step": 502570 - }, - { - "epoch": 0.88, - "learning_rate": 6.178043157538619e-06, - "loss": 2.2916, - "step": 502580 - }, - { - "epoch": 0.88, - "learning_rate": 6.1771712176117916e-06, - "loss": 2.4584, - "step": 502590 - }, - { - "epoch": 0.88, - "learning_rate": 6.1762992776849645e-06, - "loss": 2.2252, - "step": 502600 - }, - { - "epoch": 0.88, - "learning_rate": 6.175427337758138e-06, - "loss": 2.3022, - "step": 502610 - }, - { - "epoch": 0.88, - "learning_rate": 6.174555397831311e-06, - "loss": 2.1847, - "step": 502620 - }, - { - "epoch": 0.88, - "learning_rate": 6.173683457904485e-06, - "loss": 2.2601, - "step": 502630 - }, - { - "epoch": 0.88, - "learning_rate": 6.172811517977658e-06, - "loss": 2.1647, - "step": 502640 - }, - { - "epoch": 0.88, - "learning_rate": 6.171939578050831e-06, - "loss": 2.4013, - "step": 502650 - }, - { - "epoch": 0.88, - "learning_rate": 6.1710676381240046e-06, - "loss": 2.1595, - "step": 502660 - }, - { - "epoch": 0.88, - "learning_rate": 6.1701956981971775e-06, - "loss": 2.2213, - "step": 502670 - }, - { - "epoch": 0.88, - "learning_rate": 6.16932375827035e-06, - "loss": 2.2757, - "step": 502680 - }, - { - "epoch": 0.88, - "learning_rate": 6.168451818343523e-06, - "loss": 2.3575, - "step": 502690 - }, - { - "epoch": 0.88, - "learning_rate": 6.167579878416697e-06, - "loss": 2.3443, - "step": 502700 - }, - { - "epoch": 0.88, - "learning_rate": 6.16670793848987e-06, - "loss": 2.2546, - "step": 502710 - }, - { - "epoch": 0.88, - "learning_rate": 6.165835998563043e-06, - "loss": 2.2963, - "step": 502720 - }, - { - "epoch": 0.88, - "learning_rate": 6.164964058636216e-06, - "loss": 2.2903, - "step": 502730 - }, - { - "epoch": 0.88, - "learning_rate": 6.16409211870939e-06, - "loss": 2.2862, - "step": 502740 - }, - { - "epoch": 0.88, - "learning_rate": 6.163220178782563e-06, - "loss": 2.2904, - "step": 502750 - }, - { - "epoch": 0.88, - "learning_rate": 6.162348238855736e-06, - "loss": 2.2397, - "step": 502760 - }, - { - "epoch": 0.88, - "learning_rate": 6.161476298928909e-06, - "loss": 2.2298, - "step": 502770 - }, - { - "epoch": 0.88, - "learning_rate": 6.160604359002082e-06, - "loss": 2.1525, - "step": 502780 - }, - { - "epoch": 0.88, - "learning_rate": 6.159732419075256e-06, - "loss": 2.3089, - "step": 502790 - }, - { - "epoch": 0.88, - "learning_rate": 6.158860479148429e-06, - "loss": 2.3739, - "step": 502800 - }, - { - "epoch": 0.88, - "learning_rate": 6.157988539221602e-06, - "loss": 2.3877, - "step": 502810 - }, - { - "epoch": 0.88, - "learning_rate": 6.1571165992947756e-06, - "loss": 2.3023, - "step": 502820 - }, - { - "epoch": 0.88, - "learning_rate": 6.1562446593679485e-06, - "loss": 2.2943, - "step": 502830 - }, - { - "epoch": 0.88, - "learning_rate": 6.155372719441121e-06, - "loss": 2.2968, - "step": 502840 - }, - { - "epoch": 0.88, - "learning_rate": 6.154500779514294e-06, - "loss": 2.1743, - "step": 502850 - }, - { - "epoch": 0.88, - "learning_rate": 6.153628839587468e-06, - "loss": 2.2356, - "step": 502860 - }, - { - "epoch": 0.88, - "learning_rate": 6.152756899660642e-06, - "loss": 2.2782, - "step": 502870 - }, - { - "epoch": 0.88, - "learning_rate": 6.151884959733815e-06, - "loss": 2.1589, - "step": 502880 - }, - { - "epoch": 0.88, - "learning_rate": 6.151013019806988e-06, - "loss": 2.1578, - "step": 502890 - }, - { - "epoch": 0.88, - "learning_rate": 6.150141079880161e-06, - "loss": 2.3311, - "step": 502900 - }, - { - "epoch": 0.88, - "learning_rate": 6.149269139953334e-06, - "loss": 2.2869, - "step": 502910 - }, - { - "epoch": 0.88, - "learning_rate": 6.148397200026507e-06, - "loss": 2.2978, - "step": 502920 - }, - { - "epoch": 0.88, - "learning_rate": 6.14752526009968e-06, - "loss": 2.3188, - "step": 502930 - }, - { - "epoch": 0.88, - "learning_rate": 6.146653320172854e-06, - "loss": 2.3747, - "step": 502940 - }, - { - "epoch": 0.88, - "learning_rate": 6.145781380246027e-06, - "loss": 2.3121, - "step": 502950 - }, - { - "epoch": 0.88, - "learning_rate": 6.1449094403192e-06, - "loss": 2.2794, - "step": 502960 - }, - { - "epoch": 0.88, - "learning_rate": 6.144037500392373e-06, - "loss": 2.2548, - "step": 502970 - }, - { - "epoch": 0.88, - "learning_rate": 6.143165560465547e-06, - "loss": 2.2328, - "step": 502980 - }, - { - "epoch": 0.88, - "learning_rate": 6.1422936205387195e-06, - "loss": 2.2272, - "step": 502990 - }, - { - "epoch": 0.88, - "learning_rate": 6.141421680611892e-06, - "loss": 2.2221, - "step": 503000 - }, - { - "epoch": 0.88, - "learning_rate": 6.140549740685066e-06, - "loss": 2.2594, - "step": 503010 - }, - { - "epoch": 0.88, - "learning_rate": 6.139677800758239e-06, - "loss": 2.3371, - "step": 503020 - }, - { - "epoch": 0.88, - "learning_rate": 6.138805860831413e-06, - "loss": 2.3756, - "step": 503030 - }, - { - "epoch": 0.88, - "learning_rate": 6.137933920904586e-06, - "loss": 2.2558, - "step": 503040 - }, - { - "epoch": 0.88, - "learning_rate": 6.137061980977759e-06, - "loss": 2.2564, - "step": 503050 - }, - { - "epoch": 0.88, - "learning_rate": 6.1361900410509325e-06, - "loss": 2.2399, - "step": 503060 - }, - { - "epoch": 0.88, - "learning_rate": 6.1353181011241054e-06, - "loss": 2.2326, - "step": 503070 - }, - { - "epoch": 0.88, - "learning_rate": 6.134446161197278e-06, - "loss": 2.3023, - "step": 503080 - }, - { - "epoch": 0.88, - "learning_rate": 6.133574221270451e-06, - "loss": 2.2165, - "step": 503090 - }, - { - "epoch": 0.88, - "learning_rate": 6.132702281343625e-06, - "loss": 2.1936, - "step": 503100 - }, - { - "epoch": 0.88, - "learning_rate": 6.131830341416798e-06, - "loss": 2.3687, - "step": 503110 - }, - { - "epoch": 0.88, - "learning_rate": 6.130958401489971e-06, - "loss": 2.3988, - "step": 503120 - }, - { - "epoch": 0.88, - "learning_rate": 6.130086461563144e-06, - "loss": 2.1694, - "step": 503130 - }, - { - "epoch": 0.88, - "learning_rate": 6.129214521636318e-06, - "loss": 2.4002, - "step": 503140 - }, - { - "epoch": 0.88, - "learning_rate": 6.128342581709491e-06, - "loss": 2.3012, - "step": 503150 - }, - { - "epoch": 0.88, - "learning_rate": 6.127470641782664e-06, - "loss": 2.3023, - "step": 503160 - }, - { - "epoch": 0.88, - "learning_rate": 6.126598701855837e-06, - "loss": 2.2928, - "step": 503170 - }, - { - "epoch": 0.88, - "learning_rate": 6.125726761929011e-06, - "loss": 2.1748, - "step": 503180 - }, - { - "epoch": 0.88, - "learning_rate": 6.124854822002184e-06, - "loss": 2.2303, - "step": 503190 - }, - { - "epoch": 0.88, - "learning_rate": 6.123982882075357e-06, - "loss": 2.2236, - "step": 503200 - }, - { - "epoch": 0.88, - "learning_rate": 6.12311094214853e-06, - "loss": 2.3132, - "step": 503210 - }, - { - "epoch": 0.88, - "learning_rate": 6.1222390022217035e-06, - "loss": 2.3672, - "step": 503220 - }, - { - "epoch": 0.88, - "learning_rate": 6.1213670622948764e-06, - "loss": 2.3187, - "step": 503230 - }, - { - "epoch": 0.88, - "learning_rate": 6.120495122368049e-06, - "loss": 2.3598, - "step": 503240 - }, - { - "epoch": 0.88, - "learning_rate": 6.119623182441222e-06, - "loss": 2.2127, - "step": 503250 - }, - { - "epoch": 0.88, - "learning_rate": 6.118751242514396e-06, - "loss": 2.3009, - "step": 503260 - }, - { - "epoch": 0.88, - "learning_rate": 6.11787930258757e-06, - "loss": 2.4085, - "step": 503270 - }, - { - "epoch": 0.88, - "learning_rate": 6.117007362660743e-06, - "loss": 2.1982, - "step": 503280 - }, - { - "epoch": 0.88, - "learning_rate": 6.116135422733916e-06, - "loss": 2.2798, - "step": 503290 - }, - { - "epoch": 0.88, - "learning_rate": 6.115263482807089e-06, - "loss": 2.3549, - "step": 503300 - }, - { - "epoch": 0.88, - "learning_rate": 6.114391542880262e-06, - "loss": 2.3395, - "step": 503310 - }, - { - "epoch": 0.88, - "learning_rate": 6.113519602953435e-06, - "loss": 2.1083, - "step": 503320 - }, - { - "epoch": 0.88, - "learning_rate": 6.112647663026608e-06, - "loss": 2.2785, - "step": 503330 - }, - { - "epoch": 0.88, - "learning_rate": 6.111775723099782e-06, - "loss": 2.2088, - "step": 503340 - }, - { - "epoch": 0.88, - "learning_rate": 6.110903783172955e-06, - "loss": 2.3008, - "step": 503350 - }, - { - "epoch": 0.88, - "learning_rate": 6.110031843246128e-06, - "loss": 2.3467, - "step": 503360 - }, - { - "epoch": 0.88, - "learning_rate": 6.109159903319301e-06, - "loss": 2.2852, - "step": 503370 - }, - { - "epoch": 0.88, - "learning_rate": 6.1082879633924745e-06, - "loss": 2.3214, - "step": 503380 - }, - { - "epoch": 0.88, - "learning_rate": 6.1074160234656474e-06, - "loss": 2.3271, - "step": 503390 - }, - { - "epoch": 0.88, - "learning_rate": 6.10654408353882e-06, - "loss": 2.248, - "step": 503400 - }, - { - "epoch": 0.88, - "learning_rate": 6.105672143611994e-06, - "loss": 2.3307, - "step": 503410 - }, - { - "epoch": 0.88, - "learning_rate": 6.104800203685167e-06, - "loss": 2.3284, - "step": 503420 - }, - { - "epoch": 0.88, - "learning_rate": 6.103928263758341e-06, - "loss": 2.2207, - "step": 503430 - }, - { - "epoch": 0.88, - "learning_rate": 6.103056323831514e-06, - "loss": 2.2188, - "step": 503440 - }, - { - "epoch": 0.88, - "learning_rate": 6.102184383904687e-06, - "loss": 2.2535, - "step": 503450 - }, - { - "epoch": 0.88, - "learning_rate": 6.1013124439778604e-06, - "loss": 2.333, - "step": 503460 - }, - { - "epoch": 0.88, - "learning_rate": 6.100440504051033e-06, - "loss": 2.3099, - "step": 503470 - }, - { - "epoch": 0.88, - "learning_rate": 6.099568564124206e-06, - "loss": 2.3169, - "step": 503480 - }, - { - "epoch": 0.88, - "learning_rate": 6.098696624197379e-06, - "loss": 2.2328, - "step": 503490 - }, - { - "epoch": 0.88, - "learning_rate": 6.097824684270553e-06, - "loss": 2.299, - "step": 503500 - }, - { - "epoch": 0.88, - "learning_rate": 6.096952744343726e-06, - "loss": 2.2947, - "step": 503510 - }, - { - "epoch": 0.88, - "learning_rate": 6.096080804416899e-06, - "loss": 2.3063, - "step": 503520 - }, - { - "epoch": 0.88, - "learning_rate": 6.095208864490072e-06, - "loss": 2.1897, - "step": 503530 - }, - { - "epoch": 0.88, - "learning_rate": 6.0943369245632455e-06, - "loss": 2.2391, - "step": 503540 - }, - { - "epoch": 0.88, - "learning_rate": 6.093464984636419e-06, - "loss": 2.2264, - "step": 503550 - }, - { - "epoch": 0.88, - "learning_rate": 6.092593044709592e-06, - "loss": 2.2294, - "step": 503560 - }, - { - "epoch": 0.88, - "learning_rate": 6.091721104782765e-06, - "loss": 2.3361, - "step": 503570 - }, - { - "epoch": 0.88, - "learning_rate": 6.090849164855939e-06, - "loss": 2.2565, - "step": 503580 - }, - { - "epoch": 0.88, - "learning_rate": 6.089977224929112e-06, - "loss": 2.2684, - "step": 503590 - }, - { - "epoch": 0.88, - "learning_rate": 6.089105285002285e-06, - "loss": 2.2345, - "step": 503600 - }, - { - "epoch": 0.88, - "learning_rate": 6.088233345075458e-06, - "loss": 2.2616, - "step": 503610 - }, - { - "epoch": 0.88, - "learning_rate": 6.0873614051486314e-06, - "loss": 2.1968, - "step": 503620 - }, - { - "epoch": 0.88, - "learning_rate": 6.086489465221804e-06, - "loss": 2.2128, - "step": 503630 - }, - { - "epoch": 0.88, - "learning_rate": 6.085617525294977e-06, - "loss": 2.1837, - "step": 503640 - }, - { - "epoch": 0.88, - "learning_rate": 6.08474558536815e-06, - "loss": 2.1963, - "step": 503650 - }, - { - "epoch": 0.88, - "learning_rate": 6.083873645441324e-06, - "loss": 2.3946, - "step": 503660 - }, - { - "epoch": 0.88, - "learning_rate": 6.083001705514498e-06, - "loss": 2.2932, - "step": 503670 - }, - { - "epoch": 0.88, - "learning_rate": 6.082129765587671e-06, - "loss": 2.2042, - "step": 503680 - }, - { - "epoch": 0.88, - "learning_rate": 6.081257825660844e-06, - "loss": 2.2688, - "step": 503690 - }, - { - "epoch": 0.88, - "learning_rate": 6.080385885734017e-06, - "loss": 2.285, - "step": 503700 - }, - { - "epoch": 0.88, - "learning_rate": 6.07951394580719e-06, - "loss": 2.2752, - "step": 503710 - }, - { - "epoch": 0.88, - "learning_rate": 6.078642005880363e-06, - "loss": 2.3406, - "step": 503720 - }, - { - "epoch": 0.88, - "learning_rate": 6.077770065953536e-06, - "loss": 2.2143, - "step": 503730 - }, - { - "epoch": 0.88, - "learning_rate": 6.07689812602671e-06, - "loss": 2.328, - "step": 503740 - }, - { - "epoch": 0.88, - "learning_rate": 6.076026186099883e-06, - "loss": 2.2449, - "step": 503750 - }, - { - "epoch": 0.88, - "learning_rate": 6.075154246173056e-06, - "loss": 2.179, - "step": 503760 - }, - { - "epoch": 0.88, - "learning_rate": 6.074282306246229e-06, - "loss": 2.2531, - "step": 503770 - }, - { - "epoch": 0.88, - "learning_rate": 6.0734103663194024e-06, - "loss": 2.2722, - "step": 503780 - }, - { - "epoch": 0.88, - "learning_rate": 6.072538426392575e-06, - "loss": 2.255, - "step": 503790 - }, - { - "epoch": 0.88, - "learning_rate": 6.071666486465749e-06, - "loss": 2.2671, - "step": 503800 - }, - { - "epoch": 0.88, - "learning_rate": 6.070794546538922e-06, - "loss": 2.1863, - "step": 503810 - }, - { - "epoch": 0.88, - "learning_rate": 6.069922606612095e-06, - "loss": 2.196, - "step": 503820 - }, - { - "epoch": 0.88, - "learning_rate": 6.069050666685269e-06, - "loss": 2.2472, - "step": 503830 - }, - { - "epoch": 0.88, - "learning_rate": 6.068178726758442e-06, - "loss": 2.2824, - "step": 503840 - }, - { - "epoch": 0.88, - "learning_rate": 6.067306786831615e-06, - "loss": 2.274, - "step": 503850 - }, - { - "epoch": 0.88, - "learning_rate": 6.066434846904788e-06, - "loss": 2.2509, - "step": 503860 - }, - { - "epoch": 0.88, - "learning_rate": 6.065562906977961e-06, - "loss": 2.3182, - "step": 503870 - }, - { - "epoch": 0.88, - "learning_rate": 6.064690967051134e-06, - "loss": 2.257, - "step": 503880 - }, - { - "epoch": 0.88, - "learning_rate": 6.063819027124307e-06, - "loss": 2.1844, - "step": 503890 - }, - { - "epoch": 0.88, - "learning_rate": 6.062947087197481e-06, - "loss": 2.2823, - "step": 503900 - }, - { - "epoch": 0.88, - "learning_rate": 6.062075147270654e-06, - "loss": 2.1947, - "step": 503910 - }, - { - "epoch": 0.88, - "learning_rate": 6.061203207343827e-06, - "loss": 2.166, - "step": 503920 - }, - { - "epoch": 0.88, - "learning_rate": 6.060331267417e-06, - "loss": 2.2796, - "step": 503930 - }, - { - "epoch": 0.88, - "learning_rate": 6.0594593274901734e-06, - "loss": 2.2683, - "step": 503940 - }, - { - "epoch": 0.88, - "learning_rate": 6.058587387563347e-06, - "loss": 2.1012, - "step": 503950 - }, - { - "epoch": 0.88, - "learning_rate": 6.05771544763652e-06, - "loss": 2.2116, - "step": 503960 - }, - { - "epoch": 0.88, - "learning_rate": 6.056843507709693e-06, - "loss": 2.2852, - "step": 503970 - }, - { - "epoch": 0.88, - "learning_rate": 6.055971567782867e-06, - "loss": 2.3761, - "step": 503980 - }, - { - "epoch": 0.88, - "learning_rate": 6.05509962785604e-06, - "loss": 2.3524, - "step": 503990 - }, - { - "epoch": 0.88, - "learning_rate": 6.054227687929213e-06, - "loss": 2.3603, - "step": 504000 - }, - { - "epoch": 0.88, - "learning_rate": 6.053355748002386e-06, - "loss": 2.2855, - "step": 504010 - }, - { - "epoch": 0.88, - "learning_rate": 6.052483808075559e-06, - "loss": 2.2876, - "step": 504020 - }, - { - "epoch": 0.88, - "learning_rate": 6.051611868148732e-06, - "loss": 2.214, - "step": 504030 - }, - { - "epoch": 0.88, - "learning_rate": 6.050739928221905e-06, - "loss": 2.2364, - "step": 504040 - }, - { - "epoch": 0.88, - "learning_rate": 6.049867988295078e-06, - "loss": 2.2753, - "step": 504050 - }, - { - "epoch": 0.88, - "learning_rate": 6.048996048368252e-06, - "loss": 2.2328, - "step": 504060 - }, - { - "epoch": 0.88, - "learning_rate": 6.048124108441426e-06, - "loss": 2.1637, - "step": 504070 - }, - { - "epoch": 0.88, - "learning_rate": 6.047252168514599e-06, - "loss": 2.1728, - "step": 504080 - }, - { - "epoch": 0.88, - "learning_rate": 6.0463802285877715e-06, - "loss": 2.3199, - "step": 504090 - }, - { - "epoch": 0.88, - "learning_rate": 6.045508288660945e-06, - "loss": 2.324, - "step": 504100 - }, - { - "epoch": 0.88, - "learning_rate": 6.044636348734118e-06, - "loss": 2.1746, - "step": 504110 - }, - { - "epoch": 0.88, - "learning_rate": 6.043764408807291e-06, - "loss": 2.305, - "step": 504120 - }, - { - "epoch": 0.88, - "learning_rate": 6.042892468880464e-06, - "loss": 2.2355, - "step": 504130 - }, - { - "epoch": 0.88, - "learning_rate": 6.042020528953638e-06, - "loss": 2.2908, - "step": 504140 - }, - { - "epoch": 0.88, - "learning_rate": 6.041148589026811e-06, - "loss": 2.3518, - "step": 504150 - }, - { - "epoch": 0.88, - "learning_rate": 6.040276649099984e-06, - "loss": 2.3325, - "step": 504160 - }, - { - "epoch": 0.88, - "learning_rate": 6.039404709173157e-06, - "loss": 2.305, - "step": 504170 - }, - { - "epoch": 0.88, - "learning_rate": 6.03853276924633e-06, - "loss": 2.2567, - "step": 504180 - }, - { - "epoch": 0.88, - "learning_rate": 6.037660829319503e-06, - "loss": 2.1234, - "step": 504190 - }, - { - "epoch": 0.88, - "learning_rate": 6.036788889392677e-06, - "loss": 2.3435, - "step": 504200 - }, - { - "epoch": 0.88, - "learning_rate": 6.03591694946585e-06, - "loss": 2.2623, - "step": 504210 - }, - { - "epoch": 0.88, - "learning_rate": 6.035045009539024e-06, - "loss": 2.2281, - "step": 504220 - }, - { - "epoch": 0.88, - "learning_rate": 6.034173069612197e-06, - "loss": 2.2201, - "step": 504230 - }, - { - "epoch": 0.88, - "learning_rate": 6.03330112968537e-06, - "loss": 2.2533, - "step": 504240 - }, - { - "epoch": 0.88, - "learning_rate": 6.0324291897585425e-06, - "loss": 2.2881, - "step": 504250 - }, - { - "epoch": 0.88, - "learning_rate": 6.031557249831716e-06, - "loss": 2.3189, - "step": 504260 - }, - { - "epoch": 0.88, - "learning_rate": 6.030685309904889e-06, - "loss": 2.2176, - "step": 504270 - }, - { - "epoch": 0.88, - "learning_rate": 6.029813369978062e-06, - "loss": 2.2414, - "step": 504280 - }, - { - "epoch": 0.88, - "learning_rate": 6.028941430051235e-06, - "loss": 2.2304, - "step": 504290 - }, - { - "epoch": 0.88, - "learning_rate": 6.028069490124409e-06, - "loss": 2.2351, - "step": 504300 - }, - { - "epoch": 0.88, - "learning_rate": 6.027197550197582e-06, - "loss": 2.2721, - "step": 504310 - }, - { - "epoch": 0.88, - "learning_rate": 6.026325610270755e-06, - "loss": 2.1513, - "step": 504320 - }, - { - "epoch": 0.88, - "learning_rate": 6.025453670343928e-06, - "loss": 2.3397, - "step": 504330 - }, - { - "epoch": 0.88, - "learning_rate": 6.024581730417101e-06, - "loss": 2.3377, - "step": 504340 - }, - { - "epoch": 0.88, - "learning_rate": 6.023709790490275e-06, - "loss": 2.2378, - "step": 504350 - }, - { - "epoch": 0.88, - "learning_rate": 6.022837850563448e-06, - "loss": 2.2486, - "step": 504360 - }, - { - "epoch": 0.88, - "learning_rate": 6.021965910636621e-06, - "loss": 2.1847, - "step": 504370 - }, - { - "epoch": 0.88, - "learning_rate": 6.021093970709795e-06, - "loss": 2.2553, - "step": 504380 - }, - { - "epoch": 0.88, - "learning_rate": 6.020222030782968e-06, - "loss": 2.2091, - "step": 504390 - }, - { - "epoch": 0.88, - "learning_rate": 6.019350090856141e-06, - "loss": 2.2609, - "step": 504400 - }, - { - "epoch": 0.88, - "learning_rate": 6.0184781509293135e-06, - "loss": 2.2416, - "step": 504410 - }, - { - "epoch": 0.88, - "learning_rate": 6.017606211002487e-06, - "loss": 2.3394, - "step": 504420 - }, - { - "epoch": 0.88, - "learning_rate": 6.01673427107566e-06, - "loss": 2.2591, - "step": 504430 - }, - { - "epoch": 0.88, - "learning_rate": 6.015862331148833e-06, - "loss": 2.3234, - "step": 504440 - }, - { - "epoch": 0.88, - "learning_rate": 6.014990391222006e-06, - "loss": 2.2538, - "step": 504450 - }, - { - "epoch": 0.88, - "learning_rate": 6.01411845129518e-06, - "loss": 2.1451, - "step": 504460 - }, - { - "epoch": 0.88, - "learning_rate": 6.013246511368354e-06, - "loss": 2.2928, - "step": 504470 - }, - { - "epoch": 0.88, - "learning_rate": 6.0123745714415265e-06, - "loss": 2.3485, - "step": 504480 - }, - { - "epoch": 0.88, - "learning_rate": 6.0115026315146994e-06, - "loss": 2.2812, - "step": 504490 - }, - { - "epoch": 0.88, - "learning_rate": 6.010630691587873e-06, - "loss": 2.2599, - "step": 504500 - }, - { - "epoch": 0.88, - "learning_rate": 6.009758751661046e-06, - "loss": 2.1919, - "step": 504510 - }, - { - "epoch": 0.88, - "learning_rate": 6.008886811734219e-06, - "loss": 2.1873, - "step": 504520 - }, - { - "epoch": 0.88, - "learning_rate": 6.008014871807392e-06, - "loss": 2.1192, - "step": 504530 - }, - { - "epoch": 0.88, - "learning_rate": 6.007142931880566e-06, - "loss": 2.2493, - "step": 504540 - }, - { - "epoch": 0.88, - "learning_rate": 6.006270991953739e-06, - "loss": 2.1024, - "step": 504550 - }, - { - "epoch": 0.88, - "learning_rate": 6.005399052026912e-06, - "loss": 2.2715, - "step": 504560 - }, - { - "epoch": 0.88, - "learning_rate": 6.0045271121000845e-06, - "loss": 2.1626, - "step": 504570 - }, - { - "epoch": 0.88, - "learning_rate": 6.003655172173258e-06, - "loss": 2.3375, - "step": 504580 - }, - { - "epoch": 0.88, - "learning_rate": 6.002783232246431e-06, - "loss": 2.283, - "step": 504590 - }, - { - "epoch": 0.88, - "learning_rate": 6.001911292319605e-06, - "loss": 2.422, - "step": 504600 - }, - { - "epoch": 0.88, - "learning_rate": 6.001039352392778e-06, - "loss": 2.3267, - "step": 504610 - }, - { - "epoch": 0.88, - "learning_rate": 6.000167412465952e-06, - "loss": 2.272, - "step": 504620 - }, - { - "epoch": 0.88, - "learning_rate": 5.999295472539125e-06, - "loss": 2.2836, - "step": 504630 - }, - { - "epoch": 0.88, - "learning_rate": 5.9984235326122975e-06, - "loss": 2.2458, - "step": 504640 - }, - { - "epoch": 0.88, - "learning_rate": 5.9975515926854704e-06, - "loss": 2.2765, - "step": 504650 - }, - { - "epoch": 0.88, - "learning_rate": 5.996679652758644e-06, - "loss": 2.269, - "step": 504660 - }, - { - "epoch": 0.88, - "learning_rate": 5.995807712831817e-06, - "loss": 2.3309, - "step": 504670 - }, - { - "epoch": 0.88, - "learning_rate": 5.99493577290499e-06, - "loss": 2.4122, - "step": 504680 - }, - { - "epoch": 0.88, - "learning_rate": 5.994063832978163e-06, - "loss": 2.3374, - "step": 504690 - }, - { - "epoch": 0.88, - "learning_rate": 5.993191893051337e-06, - "loss": 2.2533, - "step": 504700 - }, - { - "epoch": 0.88, - "learning_rate": 5.99231995312451e-06, - "loss": 2.2944, - "step": 504710 - }, - { - "epoch": 0.88, - "learning_rate": 5.991448013197683e-06, - "loss": 2.1812, - "step": 504720 - }, - { - "epoch": 0.88, - "learning_rate": 5.9905760732708555e-06, - "loss": 2.2835, - "step": 504730 - }, - { - "epoch": 0.88, - "learning_rate": 5.98970413334403e-06, - "loss": 2.5013, - "step": 504740 - }, - { - "epoch": 0.88, - "learning_rate": 5.988832193417203e-06, - "loss": 2.2331, - "step": 504750 - }, - { - "epoch": 0.88, - "learning_rate": 5.987960253490376e-06, - "loss": 2.3191, - "step": 504760 - }, - { - "epoch": 0.88, - "learning_rate": 5.987088313563549e-06, - "loss": 2.2918, - "step": 504770 - }, - { - "epoch": 0.88, - "learning_rate": 5.986216373636723e-06, - "loss": 2.2193, - "step": 504780 - }, - { - "epoch": 0.88, - "learning_rate": 5.985344433709896e-06, - "loss": 2.2609, - "step": 504790 - }, - { - "epoch": 0.88, - "learning_rate": 5.9844724937830685e-06, - "loss": 2.2938, - "step": 504800 - }, - { - "epoch": 0.88, - "learning_rate": 5.9836005538562414e-06, - "loss": 2.223, - "step": 504810 - }, - { - "epoch": 0.88, - "learning_rate": 5.982728613929415e-06, - "loss": 2.3108, - "step": 504820 - }, - { - "epoch": 0.88, - "learning_rate": 5.981856674002588e-06, - "loss": 2.3887, - "step": 504830 - }, - { - "epoch": 0.88, - "learning_rate": 5.980984734075761e-06, - "loss": 2.118, - "step": 504840 - }, - { - "epoch": 0.88, - "learning_rate": 5.980112794148934e-06, - "loss": 2.2887, - "step": 504850 - }, - { - "epoch": 0.88, - "learning_rate": 5.979240854222108e-06, - "loss": 2.2597, - "step": 504860 - }, - { - "epoch": 0.88, - "learning_rate": 5.9783689142952815e-06, - "loss": 2.326, - "step": 504870 - }, - { - "epoch": 0.88, - "learning_rate": 5.9774969743684544e-06, - "loss": 2.2691, - "step": 504880 - }, - { - "epoch": 0.88, - "learning_rate": 5.976625034441627e-06, - "loss": 2.0894, - "step": 504890 - }, - { - "epoch": 0.88, - "learning_rate": 5.975753094514801e-06, - "loss": 2.3005, - "step": 504900 - }, - { - "epoch": 0.88, - "learning_rate": 5.974881154587974e-06, - "loss": 2.2846, - "step": 504910 - }, - { - "epoch": 0.88, - "learning_rate": 5.974009214661147e-06, - "loss": 2.2827, - "step": 504920 - }, - { - "epoch": 0.88, - "learning_rate": 5.97313727473432e-06, - "loss": 2.2847, - "step": 504930 - }, - { - "epoch": 0.88, - "learning_rate": 5.972265334807494e-06, - "loss": 2.2287, - "step": 504940 - }, - { - "epoch": 0.88, - "learning_rate": 5.971393394880667e-06, - "loss": 2.1411, - "step": 504950 - }, - { - "epoch": 0.88, - "learning_rate": 5.9705214549538395e-06, - "loss": 2.2558, - "step": 504960 - }, - { - "epoch": 0.88, - "learning_rate": 5.9696495150270124e-06, - "loss": 2.2027, - "step": 504970 - }, - { - "epoch": 0.88, - "learning_rate": 5.968777575100186e-06, - "loss": 2.2661, - "step": 504980 - }, - { - "epoch": 0.88, - "learning_rate": 5.967905635173359e-06, - "loss": 2.2892, - "step": 504990 - }, - { - "epoch": 0.88, - "learning_rate": 5.967033695246533e-06, - "loss": 2.0233, - "step": 505000 - }, - { - "epoch": 0.88, - "learning_rate": 5.966161755319706e-06, - "loss": 2.3244, - "step": 505010 - }, - { - "epoch": 0.88, - "learning_rate": 5.96528981539288e-06, - "loss": 2.235, - "step": 505020 - }, - { - "epoch": 0.88, - "learning_rate": 5.9644178754660525e-06, - "loss": 2.2332, - "step": 505030 - }, - { - "epoch": 0.88, - "learning_rate": 5.9635459355392254e-06, - "loss": 2.3269, - "step": 505040 - }, - { - "epoch": 0.88, - "learning_rate": 5.962673995612398e-06, - "loss": 2.2901, - "step": 505050 - }, - { - "epoch": 0.88, - "learning_rate": 5.961802055685572e-06, - "loss": 2.2578, - "step": 505060 - }, - { - "epoch": 0.88, - "learning_rate": 5.960930115758745e-06, - "loss": 2.3126, - "step": 505070 - }, - { - "epoch": 0.88, - "learning_rate": 5.960058175831918e-06, - "loss": 2.2606, - "step": 505080 - }, - { - "epoch": 0.88, - "learning_rate": 5.959186235905091e-06, - "loss": 2.2293, - "step": 505090 - }, - { - "epoch": 0.88, - "learning_rate": 5.958314295978265e-06, - "loss": 2.3416, - "step": 505100 - }, - { - "epoch": 0.88, - "learning_rate": 5.957442356051438e-06, - "loss": 2.2432, - "step": 505110 - }, - { - "epoch": 0.88, - "learning_rate": 5.9565704161246105e-06, - "loss": 2.2655, - "step": 505120 - }, - { - "epoch": 0.88, - "learning_rate": 5.9556984761977834e-06, - "loss": 2.343, - "step": 505130 - }, - { - "epoch": 0.88, - "learning_rate": 5.954826536270958e-06, - "loss": 2.2262, - "step": 505140 - }, - { - "epoch": 0.88, - "learning_rate": 5.953954596344131e-06, - "loss": 2.3598, - "step": 505150 - }, - { - "epoch": 0.88, - "learning_rate": 5.953082656417304e-06, - "loss": 2.2133, - "step": 505160 - }, - { - "epoch": 0.88, - "learning_rate": 5.952210716490477e-06, - "loss": 2.3604, - "step": 505170 - }, - { - "epoch": 0.88, - "learning_rate": 5.951338776563651e-06, - "loss": 2.1591, - "step": 505180 - }, - { - "epoch": 0.88, - "learning_rate": 5.9504668366368235e-06, - "loss": 2.3171, - "step": 505190 - }, - { - "epoch": 0.88, - "learning_rate": 5.9495948967099964e-06, - "loss": 2.1952, - "step": 505200 - }, - { - "epoch": 0.88, - "learning_rate": 5.948722956783169e-06, - "loss": 2.2835, - "step": 505210 - }, - { - "epoch": 0.88, - "learning_rate": 5.947851016856343e-06, - "loss": 2.1934, - "step": 505220 - }, - { - "epoch": 0.88, - "learning_rate": 5.946979076929516e-06, - "loss": 2.2408, - "step": 505230 - }, - { - "epoch": 0.88, - "learning_rate": 5.946107137002689e-06, - "loss": 2.1946, - "step": 505240 - }, - { - "epoch": 0.88, - "learning_rate": 5.945235197075862e-06, - "loss": 2.2925, - "step": 505250 - }, - { - "epoch": 0.88, - "learning_rate": 5.944363257149036e-06, - "loss": 2.2929, - "step": 505260 - }, - { - "epoch": 0.88, - "learning_rate": 5.9434913172222094e-06, - "loss": 2.392, - "step": 505270 - }, - { - "epoch": 0.88, - "learning_rate": 5.942619377295382e-06, - "loss": 2.2917, - "step": 505280 - }, - { - "epoch": 0.88, - "learning_rate": 5.941747437368555e-06, - "loss": 2.2019, - "step": 505290 - }, - { - "epoch": 0.88, - "learning_rate": 5.940875497441729e-06, - "loss": 2.3115, - "step": 505300 - }, - { - "epoch": 0.88, - "learning_rate": 5.940003557514902e-06, - "loss": 2.2177, - "step": 505310 - }, - { - "epoch": 0.88, - "learning_rate": 5.939131617588075e-06, - "loss": 2.1573, - "step": 505320 - }, - { - "epoch": 0.88, - "learning_rate": 5.938259677661248e-06, - "loss": 2.3938, - "step": 505330 - }, - { - "epoch": 0.88, - "learning_rate": 5.937387737734422e-06, - "loss": 2.2405, - "step": 505340 - }, - { - "epoch": 0.88, - "learning_rate": 5.9365157978075945e-06, - "loss": 2.2734, - "step": 505350 - }, - { - "epoch": 0.88, - "learning_rate": 5.9356438578807674e-06, - "loss": 2.2592, - "step": 505360 - }, - { - "epoch": 0.88, - "learning_rate": 5.93477191795394e-06, - "loss": 2.3116, - "step": 505370 - }, - { - "epoch": 0.88, - "learning_rate": 5.933899978027114e-06, - "loss": 2.2581, - "step": 505380 - }, - { - "epoch": 0.88, - "learning_rate": 5.933028038100287e-06, - "loss": 2.3374, - "step": 505390 - }, - { - "epoch": 0.88, - "learning_rate": 5.932156098173461e-06, - "loss": 2.2194, - "step": 505400 - }, - { - "epoch": 0.88, - "learning_rate": 5.931284158246634e-06, - "loss": 2.2296, - "step": 505410 - }, - { - "epoch": 0.88, - "learning_rate": 5.9304122183198075e-06, - "loss": 2.2656, - "step": 505420 - }, - { - "epoch": 0.88, - "learning_rate": 5.9295402783929804e-06, - "loss": 2.3702, - "step": 505430 - }, - { - "epoch": 0.88, - "learning_rate": 5.928668338466153e-06, - "loss": 2.2552, - "step": 505440 - }, - { - "epoch": 0.88, - "learning_rate": 5.927796398539326e-06, - "loss": 2.2734, - "step": 505450 - }, - { - "epoch": 0.88, - "learning_rate": 5.9269244586125e-06, - "loss": 2.259, - "step": 505460 - }, - { - "epoch": 0.88, - "learning_rate": 5.926052518685673e-06, - "loss": 2.3049, - "step": 505470 - }, - { - "epoch": 0.88, - "learning_rate": 5.925180578758846e-06, - "loss": 2.2054, - "step": 505480 - }, - { - "epoch": 0.88, - "learning_rate": 5.924308638832019e-06, - "loss": 2.3534, - "step": 505490 - }, - { - "epoch": 0.88, - "learning_rate": 5.923436698905193e-06, - "loss": 2.3905, - "step": 505500 - }, - { - "epoch": 0.88, - "learning_rate": 5.9225647589783655e-06, - "loss": 2.3821, - "step": 505510 - }, - { - "epoch": 0.88, - "learning_rate": 5.9216928190515384e-06, - "loss": 2.2059, - "step": 505520 - }, - { - "epoch": 0.88, - "learning_rate": 5.920820879124712e-06, - "loss": 2.2774, - "step": 505530 - }, - { - "epoch": 0.88, - "learning_rate": 5.919948939197886e-06, - "loss": 2.2483, - "step": 505540 - }, - { - "epoch": 0.88, - "learning_rate": 5.919076999271059e-06, - "loss": 2.3305, - "step": 505550 - }, - { - "epoch": 0.88, - "learning_rate": 5.918205059344232e-06, - "loss": 2.2977, - "step": 505560 - }, - { - "epoch": 0.88, - "learning_rate": 5.917333119417405e-06, - "loss": 2.2344, - "step": 505570 - }, - { - "epoch": 0.88, - "learning_rate": 5.9164611794905785e-06, - "loss": 2.3334, - "step": 505580 - }, - { - "epoch": 0.88, - "learning_rate": 5.9155892395637514e-06, - "loss": 2.2496, - "step": 505590 - }, - { - "epoch": 0.88, - "learning_rate": 5.914717299636924e-06, - "loss": 2.2213, - "step": 505600 - }, - { - "epoch": 0.88, - "learning_rate": 5.913845359710097e-06, - "loss": 2.3434, - "step": 505610 - }, - { - "epoch": 0.88, - "learning_rate": 5.912973419783271e-06, - "loss": 2.2079, - "step": 505620 - }, - { - "epoch": 0.88, - "learning_rate": 5.912101479856444e-06, - "loss": 2.3473, - "step": 505630 - }, - { - "epoch": 0.88, - "learning_rate": 5.911229539929617e-06, - "loss": 2.3574, - "step": 505640 - }, - { - "epoch": 0.88, - "learning_rate": 5.91035760000279e-06, - "loss": 2.2323, - "step": 505650 - }, - { - "epoch": 0.88, - "learning_rate": 5.909485660075964e-06, - "loss": 2.2781, - "step": 505660 - }, - { - "epoch": 0.88, - "learning_rate": 5.908613720149137e-06, - "loss": 2.2111, - "step": 505670 - }, - { - "epoch": 0.88, - "learning_rate": 5.90774178022231e-06, - "loss": 2.3631, - "step": 505680 - }, - { - "epoch": 0.88, - "learning_rate": 5.906869840295483e-06, - "loss": 2.3411, - "step": 505690 - }, - { - "epoch": 0.88, - "learning_rate": 5.905997900368657e-06, - "loss": 2.3623, - "step": 505700 - }, - { - "epoch": 0.88, - "learning_rate": 5.90512596044183e-06, - "loss": 2.2026, - "step": 505710 - }, - { - "epoch": 0.88, - "learning_rate": 5.904254020515003e-06, - "loss": 2.3234, - "step": 505720 - }, - { - "epoch": 0.88, - "learning_rate": 5.903382080588176e-06, - "loss": 2.3293, - "step": 505730 - }, - { - "epoch": 0.88, - "learning_rate": 5.9025101406613495e-06, - "loss": 2.3164, - "step": 505740 - }, - { - "epoch": 0.88, - "learning_rate": 5.9016382007345224e-06, - "loss": 2.4097, - "step": 505750 - }, - { - "epoch": 0.88, - "learning_rate": 5.900766260807695e-06, - "loss": 2.3372, - "step": 505760 - }, - { - "epoch": 0.88, - "learning_rate": 5.899894320880868e-06, - "loss": 2.2314, - "step": 505770 - }, - { - "epoch": 0.88, - "learning_rate": 5.899022380954042e-06, - "loss": 2.2228, - "step": 505780 - }, - { - "epoch": 0.88, - "learning_rate": 5.898150441027215e-06, - "loss": 2.3019, - "step": 505790 - }, - { - "epoch": 0.88, - "learning_rate": 5.897278501100389e-06, - "loss": 2.2635, - "step": 505800 - }, - { - "epoch": 0.88, - "learning_rate": 5.896406561173562e-06, - "loss": 2.2029, - "step": 505810 - }, - { - "epoch": 0.88, - "learning_rate": 5.8955346212467354e-06, - "loss": 2.2756, - "step": 505820 - }, - { - "epoch": 0.88, - "learning_rate": 5.894662681319908e-06, - "loss": 2.2515, - "step": 505830 - }, - { - "epoch": 0.88, - "learning_rate": 5.893790741393081e-06, - "loss": 2.2345, - "step": 505840 - }, - { - "epoch": 0.88, - "learning_rate": 5.892918801466254e-06, - "loss": 2.2893, - "step": 505850 - }, - { - "epoch": 0.88, - "learning_rate": 5.892046861539428e-06, - "loss": 2.2091, - "step": 505860 - }, - { - "epoch": 0.88, - "learning_rate": 5.891174921612601e-06, - "loss": 2.2346, - "step": 505870 - }, - { - "epoch": 0.88, - "learning_rate": 5.890302981685774e-06, - "loss": 2.2947, - "step": 505880 - }, - { - "epoch": 0.88, - "learning_rate": 5.889431041758947e-06, - "loss": 2.2515, - "step": 505890 - }, - { - "epoch": 0.88, - "learning_rate": 5.8885591018321205e-06, - "loss": 2.1527, - "step": 505900 - }, - { - "epoch": 0.88, - "learning_rate": 5.8876871619052934e-06, - "loss": 2.328, - "step": 505910 - }, - { - "epoch": 0.88, - "learning_rate": 5.886815221978466e-06, - "loss": 2.2585, - "step": 505920 - }, - { - "epoch": 0.88, - "learning_rate": 5.88594328205164e-06, - "loss": 2.2678, - "step": 505930 - }, - { - "epoch": 0.88, - "learning_rate": 5.885071342124814e-06, - "loss": 2.3366, - "step": 505940 - }, - { - "epoch": 0.88, - "learning_rate": 5.884199402197987e-06, - "loss": 2.3573, - "step": 505950 - }, - { - "epoch": 0.88, - "learning_rate": 5.88332746227116e-06, - "loss": 2.2316, - "step": 505960 - }, - { - "epoch": 0.88, - "learning_rate": 5.882455522344333e-06, - "loss": 2.4203, - "step": 505970 - }, - { - "epoch": 0.88, - "learning_rate": 5.8815835824175064e-06, - "loss": 2.279, - "step": 505980 - }, - { - "epoch": 0.88, - "learning_rate": 5.880711642490679e-06, - "loss": 2.3188, - "step": 505990 - }, - { - "epoch": 0.88, - "learning_rate": 5.879839702563852e-06, - "loss": 2.1873, - "step": 506000 - }, - { - "epoch": 0.88, - "learning_rate": 5.878967762637025e-06, - "loss": 2.296, - "step": 506010 - }, - { - "epoch": 0.88, - "learning_rate": 5.878095822710199e-06, - "loss": 2.2989, - "step": 506020 - }, - { - "epoch": 0.88, - "learning_rate": 5.877223882783372e-06, - "loss": 2.2962, - "step": 506030 - }, - { - "epoch": 0.88, - "learning_rate": 5.876351942856545e-06, - "loss": 2.2517, - "step": 506040 - }, - { - "epoch": 0.88, - "learning_rate": 5.875480002929718e-06, - "loss": 2.28, - "step": 506050 - }, - { - "epoch": 0.88, - "learning_rate": 5.8746080630028915e-06, - "loss": 2.0983, - "step": 506060 - }, - { - "epoch": 0.88, - "learning_rate": 5.873736123076065e-06, - "loss": 2.1725, - "step": 506070 - }, - { - "epoch": 0.88, - "learning_rate": 5.872864183149238e-06, - "loss": 2.2885, - "step": 506080 - }, - { - "epoch": 0.88, - "learning_rate": 5.871992243222411e-06, - "loss": 2.3218, - "step": 506090 - }, - { - "epoch": 0.88, - "learning_rate": 5.871120303295585e-06, - "loss": 2.3351, - "step": 506100 - }, - { - "epoch": 0.88, - "learning_rate": 5.870248363368758e-06, - "loss": 2.315, - "step": 506110 - }, - { - "epoch": 0.88, - "learning_rate": 5.869376423441931e-06, - "loss": 2.2568, - "step": 506120 - }, - { - "epoch": 0.88, - "learning_rate": 5.868504483515104e-06, - "loss": 2.3316, - "step": 506130 - }, - { - "epoch": 0.88, - "learning_rate": 5.8676325435882775e-06, - "loss": 2.3978, - "step": 506140 - }, - { - "epoch": 0.88, - "learning_rate": 5.86676060366145e-06, - "loss": 2.3257, - "step": 506150 - }, - { - "epoch": 0.88, - "learning_rate": 5.865888663734623e-06, - "loss": 2.2531, - "step": 506160 - }, - { - "epoch": 0.88, - "learning_rate": 5.865016723807796e-06, - "loss": 2.2085, - "step": 506170 - }, - { - "epoch": 0.88, - "learning_rate": 5.86414478388097e-06, - "loss": 2.2197, - "step": 506180 - }, - { - "epoch": 0.88, - "learning_rate": 5.863272843954143e-06, - "loss": 2.3153, - "step": 506190 - }, - { - "epoch": 0.88, - "learning_rate": 5.862400904027317e-06, - "loss": 2.3282, - "step": 506200 - }, - { - "epoch": 0.88, - "learning_rate": 5.86152896410049e-06, - "loss": 2.2734, - "step": 506210 - }, - { - "epoch": 0.88, - "learning_rate": 5.860657024173663e-06, - "loss": 2.3093, - "step": 506220 - }, - { - "epoch": 0.88, - "learning_rate": 5.859785084246836e-06, - "loss": 2.2821, - "step": 506230 - }, - { - "epoch": 0.88, - "learning_rate": 5.858913144320009e-06, - "loss": 2.3079, - "step": 506240 - }, - { - "epoch": 0.88, - "learning_rate": 5.858041204393182e-06, - "loss": 2.1759, - "step": 506250 - }, - { - "epoch": 0.88, - "learning_rate": 5.857169264466356e-06, - "loss": 2.2268, - "step": 506260 - }, - { - "epoch": 0.88, - "learning_rate": 5.856297324539529e-06, - "loss": 2.2884, - "step": 506270 - }, - { - "epoch": 0.88, - "learning_rate": 5.855425384612702e-06, - "loss": 2.2753, - "step": 506280 - }, - { - "epoch": 0.88, - "learning_rate": 5.854553444685875e-06, - "loss": 2.2648, - "step": 506290 - }, - { - "epoch": 0.88, - "learning_rate": 5.8536815047590485e-06, - "loss": 2.1654, - "step": 506300 - }, - { - "epoch": 0.88, - "learning_rate": 5.852809564832221e-06, - "loss": 2.3206, - "step": 506310 - }, - { - "epoch": 0.88, - "learning_rate": 5.851937624905394e-06, - "loss": 2.1915, - "step": 506320 - }, - { - "epoch": 0.88, - "learning_rate": 5.851065684978568e-06, - "loss": 2.2022, - "step": 506330 - }, - { - "epoch": 0.88, - "learning_rate": 5.850193745051742e-06, - "loss": 2.3051, - "step": 506340 - }, - { - "epoch": 0.88, - "learning_rate": 5.849321805124915e-06, - "loss": 2.2439, - "step": 506350 - }, - { - "epoch": 0.88, - "learning_rate": 5.848449865198088e-06, - "loss": 2.254, - "step": 506360 - }, - { - "epoch": 0.88, - "learning_rate": 5.847577925271261e-06, - "loss": 2.3314, - "step": 506370 - }, - { - "epoch": 0.88, - "learning_rate": 5.846705985344434e-06, - "loss": 2.2831, - "step": 506380 - }, - { - "epoch": 0.88, - "learning_rate": 5.845834045417607e-06, - "loss": 2.1705, - "step": 506390 - }, - { - "epoch": 0.88, - "learning_rate": 5.84496210549078e-06, - "loss": 2.2739, - "step": 506400 - }, - { - "epoch": 0.88, - "learning_rate": 5.844090165563953e-06, - "loss": 2.3445, - "step": 506410 - }, - { - "epoch": 0.88, - "learning_rate": 5.843218225637127e-06, - "loss": 2.2613, - "step": 506420 - }, - { - "epoch": 0.88, - "learning_rate": 5.8423462857103e-06, - "loss": 2.2154, - "step": 506430 - }, - { - "epoch": 0.88, - "learning_rate": 5.841474345783473e-06, - "loss": 2.1861, - "step": 506440 - }, - { - "epoch": 0.88, - "learning_rate": 5.840602405856646e-06, - "loss": 2.1977, - "step": 506450 - }, - { - "epoch": 0.88, - "learning_rate": 5.8397304659298195e-06, - "loss": 2.2759, - "step": 506460 - }, - { - "epoch": 0.88, - "learning_rate": 5.838858526002993e-06, - "loss": 2.1746, - "step": 506470 - }, - { - "epoch": 0.88, - "learning_rate": 5.837986586076166e-06, - "loss": 2.3245, - "step": 506480 - }, - { - "epoch": 0.88, - "learning_rate": 5.837114646149339e-06, - "loss": 2.307, - "step": 506490 - }, - { - "epoch": 0.88, - "learning_rate": 5.836242706222513e-06, - "loss": 2.3257, - "step": 506500 - }, - { - "epoch": 0.88, - "learning_rate": 5.835370766295686e-06, - "loss": 2.3491, - "step": 506510 - }, - { - "epoch": 0.88, - "learning_rate": 5.834498826368859e-06, - "loss": 2.2192, - "step": 506520 - }, - { - "epoch": 0.88, - "learning_rate": 5.833626886442032e-06, - "loss": 2.1974, - "step": 506530 - }, - { - "epoch": 0.88, - "learning_rate": 5.832754946515205e-06, - "loss": 2.3456, - "step": 506540 - }, - { - "epoch": 0.88, - "learning_rate": 5.831883006588378e-06, - "loss": 2.3026, - "step": 506550 - }, - { - "epoch": 0.88, - "learning_rate": 5.831011066661551e-06, - "loss": 2.2649, - "step": 506560 - }, - { - "epoch": 0.88, - "learning_rate": 5.830139126734724e-06, - "loss": 2.2988, - "step": 506570 - }, - { - "epoch": 0.88, - "learning_rate": 5.829267186807898e-06, - "loss": 2.3582, - "step": 506580 - }, - { - "epoch": 0.88, - "learning_rate": 5.828395246881071e-06, - "loss": 2.2697, - "step": 506590 - }, - { - "epoch": 0.88, - "learning_rate": 5.827523306954245e-06, - "loss": 2.2404, - "step": 506600 - }, - { - "epoch": 0.88, - "learning_rate": 5.8266513670274175e-06, - "loss": 2.2176, - "step": 506610 - }, - { - "epoch": 0.88, - "learning_rate": 5.825779427100591e-06, - "loss": 2.3063, - "step": 506620 - }, - { - "epoch": 0.88, - "learning_rate": 5.824907487173764e-06, - "loss": 2.2959, - "step": 506630 - }, - { - "epoch": 0.88, - "learning_rate": 5.824035547246937e-06, - "loss": 2.2251, - "step": 506640 - }, - { - "epoch": 0.88, - "learning_rate": 5.82316360732011e-06, - "loss": 2.2855, - "step": 506650 - }, - { - "epoch": 0.88, - "learning_rate": 5.822291667393284e-06, - "loss": 2.2483, - "step": 506660 - }, - { - "epoch": 0.88, - "learning_rate": 5.821419727466457e-06, - "loss": 2.2547, - "step": 506670 - }, - { - "epoch": 0.88, - "learning_rate": 5.82054778753963e-06, - "loss": 2.2811, - "step": 506680 - }, - { - "epoch": 0.88, - "learning_rate": 5.819675847612803e-06, - "loss": 2.3059, - "step": 506690 - }, - { - "epoch": 0.88, - "learning_rate": 5.818803907685976e-06, - "loss": 2.3138, - "step": 506700 - }, - { - "epoch": 0.88, - "learning_rate": 5.817931967759149e-06, - "loss": 2.3022, - "step": 506710 - }, - { - "epoch": 0.88, - "learning_rate": 5.817060027832322e-06, - "loss": 2.2181, - "step": 506720 - }, - { - "epoch": 0.88, - "learning_rate": 5.816188087905496e-06, - "loss": 2.2574, - "step": 506730 - }, - { - "epoch": 0.88, - "learning_rate": 5.81531614797867e-06, - "loss": 2.2064, - "step": 506740 - }, - { - "epoch": 0.88, - "learning_rate": 5.814444208051843e-06, - "loss": 2.334, - "step": 506750 - }, - { - "epoch": 0.88, - "learning_rate": 5.813572268125016e-06, - "loss": 2.2757, - "step": 506760 - }, - { - "epoch": 0.88, - "learning_rate": 5.8127003281981885e-06, - "loss": 2.2326, - "step": 506770 - }, - { - "epoch": 0.88, - "learning_rate": 5.811828388271362e-06, - "loss": 2.2112, - "step": 506780 - }, - { - "epoch": 0.88, - "learning_rate": 5.810956448344535e-06, - "loss": 2.3646, - "step": 506790 - }, - { - "epoch": 0.88, - "learning_rate": 5.810084508417708e-06, - "loss": 2.28, - "step": 506800 - }, - { - "epoch": 0.88, - "learning_rate": 5.809212568490881e-06, - "loss": 2.4025, - "step": 506810 - }, - { - "epoch": 0.88, - "learning_rate": 5.808340628564055e-06, - "loss": 2.285, - "step": 506820 - }, - { - "epoch": 0.88, - "learning_rate": 5.807468688637228e-06, - "loss": 2.2277, - "step": 506830 - }, - { - "epoch": 0.88, - "learning_rate": 5.806596748710401e-06, - "loss": 2.2025, - "step": 506840 - }, - { - "epoch": 0.88, - "learning_rate": 5.805724808783574e-06, - "loss": 2.2385, - "step": 506850 - }, - { - "epoch": 0.88, - "learning_rate": 5.804852868856748e-06, - "loss": 2.279, - "step": 506860 - }, - { - "epoch": 0.88, - "learning_rate": 5.803980928929921e-06, - "loss": 2.2824, - "step": 506870 - }, - { - "epoch": 0.88, - "learning_rate": 5.803108989003094e-06, - "loss": 2.33, - "step": 506880 - }, - { - "epoch": 0.88, - "learning_rate": 5.802237049076267e-06, - "loss": 2.2934, - "step": 506890 - }, - { - "epoch": 0.88, - "learning_rate": 5.801365109149441e-06, - "loss": 2.3387, - "step": 506900 - }, - { - "epoch": 0.88, - "learning_rate": 5.800493169222614e-06, - "loss": 2.2666, - "step": 506910 - }, - { - "epoch": 0.88, - "learning_rate": 5.799621229295787e-06, - "loss": 2.1586, - "step": 506920 - }, - { - "epoch": 0.88, - "learning_rate": 5.7987492893689595e-06, - "loss": 2.4137, - "step": 506930 - }, - { - "epoch": 0.88, - "learning_rate": 5.797877349442133e-06, - "loss": 2.2563, - "step": 506940 - }, - { - "epoch": 0.88, - "learning_rate": 5.797005409515306e-06, - "loss": 2.3133, - "step": 506950 - }, - { - "epoch": 0.88, - "learning_rate": 5.796133469588479e-06, - "loss": 2.3061, - "step": 506960 - }, - { - "epoch": 0.88, - "learning_rate": 5.795261529661652e-06, - "loss": 2.2821, - "step": 506970 - }, - { - "epoch": 0.88, - "learning_rate": 5.794389589734826e-06, - "loss": 2.1772, - "step": 506980 - }, - { - "epoch": 0.88, - "learning_rate": 5.793517649807999e-06, - "loss": 2.2926, - "step": 506990 - }, - { - "epoch": 0.88, - "learning_rate": 5.7926457098811725e-06, - "loss": 2.1406, - "step": 507000 - }, - { - "epoch": 0.88, - "learning_rate": 5.7917737699543455e-06, - "loss": 2.2409, - "step": 507010 - }, - { - "epoch": 0.88, - "learning_rate": 5.790901830027519e-06, - "loss": 2.18, - "step": 507020 - }, - { - "epoch": 0.88, - "learning_rate": 5.790029890100692e-06, - "loss": 2.3222, - "step": 507030 - }, - { - "epoch": 0.88, - "learning_rate": 5.789157950173865e-06, - "loss": 2.2658, - "step": 507040 - }, - { - "epoch": 0.88, - "learning_rate": 5.788286010247038e-06, - "loss": 2.3395, - "step": 507050 - }, - { - "epoch": 0.88, - "learning_rate": 5.787414070320212e-06, - "loss": 2.2941, - "step": 507060 - }, - { - "epoch": 0.88, - "learning_rate": 5.786542130393385e-06, - "loss": 2.1891, - "step": 507070 - }, - { - "epoch": 0.88, - "learning_rate": 5.785670190466558e-06, - "loss": 2.3804, - "step": 507080 - }, - { - "epoch": 0.88, - "learning_rate": 5.7847982505397305e-06, - "loss": 2.3123, - "step": 507090 - }, - { - "epoch": 0.88, - "learning_rate": 5.783926310612904e-06, - "loss": 2.3092, - "step": 507100 - }, - { - "epoch": 0.88, - "learning_rate": 5.783054370686077e-06, - "loss": 2.2597, - "step": 507110 - }, - { - "epoch": 0.88, - "learning_rate": 5.78218243075925e-06, - "loss": 2.2342, - "step": 507120 - }, - { - "epoch": 0.88, - "learning_rate": 5.781310490832424e-06, - "loss": 2.3818, - "step": 507130 - }, - { - "epoch": 0.88, - "learning_rate": 5.780438550905598e-06, - "loss": 2.3167, - "step": 507140 - }, - { - "epoch": 0.88, - "learning_rate": 5.779566610978771e-06, - "loss": 2.1835, - "step": 507150 - }, - { - "epoch": 0.88, - "learning_rate": 5.7786946710519435e-06, - "loss": 2.3104, - "step": 507160 - }, - { - "epoch": 0.88, - "learning_rate": 5.7778227311251165e-06, - "loss": 2.2155, - "step": 507170 - }, - { - "epoch": 0.88, - "learning_rate": 5.77695079119829e-06, - "loss": 2.3822, - "step": 507180 - }, - { - "epoch": 0.88, - "learning_rate": 5.776078851271463e-06, - "loss": 2.2339, - "step": 507190 - }, - { - "epoch": 0.88, - "learning_rate": 5.775206911344636e-06, - "loss": 2.1568, - "step": 507200 - }, - { - "epoch": 0.88, - "learning_rate": 5.774334971417809e-06, - "loss": 2.2835, - "step": 507210 - }, - { - "epoch": 0.88, - "learning_rate": 5.773463031490983e-06, - "loss": 2.1812, - "step": 507220 - }, - { - "epoch": 0.88, - "learning_rate": 5.772591091564156e-06, - "loss": 2.207, - "step": 507230 - }, - { - "epoch": 0.88, - "learning_rate": 5.771719151637329e-06, - "loss": 2.2133, - "step": 507240 - }, - { - "epoch": 0.88, - "learning_rate": 5.770847211710502e-06, - "loss": 2.1831, - "step": 507250 - }, - { - "epoch": 0.88, - "learning_rate": 5.769975271783676e-06, - "loss": 2.1571, - "step": 507260 - }, - { - "epoch": 0.88, - "learning_rate": 5.769103331856849e-06, - "loss": 2.2771, - "step": 507270 - }, - { - "epoch": 0.88, - "learning_rate": 5.768231391930022e-06, - "loss": 2.2669, - "step": 507280 - }, - { - "epoch": 0.88, - "learning_rate": 5.767359452003195e-06, - "loss": 2.2692, - "step": 507290 - }, - { - "epoch": 0.88, - "learning_rate": 5.766487512076369e-06, - "loss": 2.2293, - "step": 507300 - }, - { - "epoch": 0.88, - "learning_rate": 5.765615572149542e-06, - "loss": 2.2946, - "step": 507310 - }, - { - "epoch": 0.88, - "learning_rate": 5.7647436322227145e-06, - "loss": 2.3794, - "step": 507320 - }, - { - "epoch": 0.88, - "learning_rate": 5.7638716922958875e-06, - "loss": 2.2572, - "step": 507330 - }, - { - "epoch": 0.88, - "learning_rate": 5.762999752369061e-06, - "loss": 2.2854, - "step": 507340 - }, - { - "epoch": 0.88, - "learning_rate": 5.762127812442234e-06, - "loss": 2.2377, - "step": 507350 - }, - { - "epoch": 0.88, - "learning_rate": 5.761255872515407e-06, - "loss": 2.3623, - "step": 507360 - }, - { - "epoch": 0.88, - "learning_rate": 5.76038393258858e-06, - "loss": 2.3184, - "step": 507370 - }, - { - "epoch": 0.88, - "learning_rate": 5.759511992661754e-06, - "loss": 2.2181, - "step": 507380 - }, - { - "epoch": 0.88, - "learning_rate": 5.758640052734927e-06, - "loss": 2.0929, - "step": 507390 - }, - { - "epoch": 0.88, - "learning_rate": 5.7577681128081005e-06, - "loss": 2.2355, - "step": 507400 - }, - { - "epoch": 0.88, - "learning_rate": 5.756896172881273e-06, - "loss": 2.2028, - "step": 507410 - }, - { - "epoch": 0.88, - "learning_rate": 5.756024232954447e-06, - "loss": 2.324, - "step": 507420 - }, - { - "epoch": 0.88, - "learning_rate": 5.75515229302762e-06, - "loss": 2.3351, - "step": 507430 - }, - { - "epoch": 0.88, - "learning_rate": 5.754280353100793e-06, - "loss": 2.2654, - "step": 507440 - }, - { - "epoch": 0.88, - "learning_rate": 5.753408413173966e-06, - "loss": 2.2679, - "step": 507450 - }, - { - "epoch": 0.88, - "learning_rate": 5.75253647324714e-06, - "loss": 2.2423, - "step": 507460 - }, - { - "epoch": 0.88, - "learning_rate": 5.751664533320313e-06, - "loss": 2.2844, - "step": 507470 - }, - { - "epoch": 0.88, - "learning_rate": 5.7507925933934855e-06, - "loss": 2.327, - "step": 507480 - }, - { - "epoch": 0.89, - "learning_rate": 5.7499206534666585e-06, - "loss": 2.1965, - "step": 507490 - }, - { - "epoch": 0.89, - "learning_rate": 5.749048713539832e-06, - "loss": 2.2727, - "step": 507500 - }, - { - "epoch": 0.89, - "learning_rate": 5.748176773613005e-06, - "loss": 2.2318, - "step": 507510 - }, - { - "epoch": 0.89, - "learning_rate": 5.747304833686178e-06, - "loss": 2.2222, - "step": 507520 - }, - { - "epoch": 0.89, - "learning_rate": 5.746432893759352e-06, - "loss": 2.2806, - "step": 507530 - }, - { - "epoch": 0.89, - "learning_rate": 5.745560953832526e-06, - "loss": 2.2742, - "step": 507540 - }, - { - "epoch": 0.89, - "learning_rate": 5.7446890139056985e-06, - "loss": 2.2687, - "step": 507550 - }, - { - "epoch": 0.89, - "learning_rate": 5.7438170739788715e-06, - "loss": 2.2482, - "step": 507560 - }, - { - "epoch": 0.89, - "learning_rate": 5.742945134052044e-06, - "loss": 2.2421, - "step": 507570 - }, - { - "epoch": 0.89, - "learning_rate": 5.742073194125218e-06, - "loss": 2.3521, - "step": 507580 - }, - { - "epoch": 0.89, - "learning_rate": 5.741201254198391e-06, - "loss": 2.2226, - "step": 507590 - }, - { - "epoch": 0.89, - "learning_rate": 5.740329314271564e-06, - "loss": 2.2991, - "step": 507600 - }, - { - "epoch": 0.89, - "learning_rate": 5.739457374344737e-06, - "loss": 2.1765, - "step": 507610 - }, - { - "epoch": 0.89, - "learning_rate": 5.738585434417911e-06, - "loss": 2.2347, - "step": 507620 - }, - { - "epoch": 0.89, - "learning_rate": 5.737713494491084e-06, - "loss": 2.3583, - "step": 507630 - }, - { - "epoch": 0.89, - "learning_rate": 5.7368415545642565e-06, - "loss": 2.337, - "step": 507640 - }, - { - "epoch": 0.89, - "learning_rate": 5.73596961463743e-06, - "loss": 2.2809, - "step": 507650 - }, - { - "epoch": 0.89, - "learning_rate": 5.735097674710604e-06, - "loss": 2.3128, - "step": 507660 - }, - { - "epoch": 0.89, - "learning_rate": 5.734225734783777e-06, - "loss": 2.2637, - "step": 507670 - }, - { - "epoch": 0.89, - "learning_rate": 5.73335379485695e-06, - "loss": 2.3128, - "step": 507680 - }, - { - "epoch": 0.89, - "learning_rate": 5.732481854930123e-06, - "loss": 2.3341, - "step": 507690 - }, - { - "epoch": 0.89, - "learning_rate": 5.731609915003297e-06, - "loss": 2.1824, - "step": 507700 - }, - { - "epoch": 0.89, - "learning_rate": 5.7307379750764695e-06, - "loss": 2.1223, - "step": 507710 - }, - { - "epoch": 0.89, - "learning_rate": 5.7298660351496425e-06, - "loss": 2.3157, - "step": 507720 - }, - { - "epoch": 0.89, - "learning_rate": 5.728994095222815e-06, - "loss": 2.2845, - "step": 507730 - }, - { - "epoch": 0.89, - "learning_rate": 5.728122155295989e-06, - "loss": 2.1556, - "step": 507740 - }, - { - "epoch": 0.89, - "learning_rate": 5.727250215369162e-06, - "loss": 2.1919, - "step": 507750 - }, - { - "epoch": 0.89, - "learning_rate": 5.726378275442335e-06, - "loss": 2.3584, - "step": 507760 - }, - { - "epoch": 0.89, - "learning_rate": 5.725506335515509e-06, - "loss": 2.3213, - "step": 507770 - }, - { - "epoch": 0.89, - "learning_rate": 5.724634395588682e-06, - "loss": 2.2011, - "step": 507780 - }, - { - "epoch": 0.89, - "learning_rate": 5.723762455661855e-06, - "loss": 2.2641, - "step": 507790 - }, - { - "epoch": 0.89, - "learning_rate": 5.722890515735028e-06, - "loss": 2.1921, - "step": 507800 - }, - { - "epoch": 0.89, - "learning_rate": 5.722018575808201e-06, - "loss": 2.2275, - "step": 507810 - }, - { - "epoch": 0.89, - "learning_rate": 5.721146635881375e-06, - "loss": 2.2031, - "step": 507820 - }, - { - "epoch": 0.89, - "learning_rate": 5.720274695954548e-06, - "loss": 2.1487, - "step": 507830 - }, - { - "epoch": 0.89, - "learning_rate": 5.719402756027721e-06, - "loss": 2.2538, - "step": 507840 - }, - { - "epoch": 0.89, - "learning_rate": 5.718530816100894e-06, - "loss": 2.275, - "step": 507850 - }, - { - "epoch": 0.89, - "learning_rate": 5.717658876174068e-06, - "loss": 2.2334, - "step": 507860 - }, - { - "epoch": 0.89, - "learning_rate": 5.7167869362472405e-06, - "loss": 2.2557, - "step": 507870 - }, - { - "epoch": 0.89, - "learning_rate": 5.7159149963204135e-06, - "loss": 2.256, - "step": 507880 - }, - { - "epoch": 0.89, - "learning_rate": 5.715043056393586e-06, - "loss": 2.4313, - "step": 507890 - }, - { - "epoch": 0.89, - "learning_rate": 5.71417111646676e-06, - "loss": 2.3864, - "step": 507900 - }, - { - "epoch": 0.89, - "learning_rate": 5.713299176539933e-06, - "loss": 2.2452, - "step": 507910 - }, - { - "epoch": 0.89, - "learning_rate": 5.712427236613106e-06, - "loss": 2.2527, - "step": 507920 - }, - { - "epoch": 0.89, - "learning_rate": 5.71155529668628e-06, - "loss": 2.2199, - "step": 507930 - }, - { - "epoch": 0.89, - "learning_rate": 5.7106833567594535e-06, - "loss": 2.2827, - "step": 507940 - }, - { - "epoch": 0.89, - "learning_rate": 5.7098114168326265e-06, - "loss": 2.222, - "step": 507950 - }, - { - "epoch": 0.89, - "learning_rate": 5.708939476905799e-06, - "loss": 2.2148, - "step": 507960 - }, - { - "epoch": 0.89, - "learning_rate": 5.708067536978972e-06, - "loss": 2.2388, - "step": 507970 - }, - { - "epoch": 0.89, - "learning_rate": 5.707195597052146e-06, - "loss": 2.3229, - "step": 507980 - }, - { - "epoch": 0.89, - "learning_rate": 5.706323657125319e-06, - "loss": 2.3126, - "step": 507990 - }, - { - "epoch": 0.89, - "learning_rate": 5.705451717198492e-06, - "loss": 2.1982, - "step": 508000 - }, - { - "epoch": 0.89, - "learning_rate": 5.704579777271665e-06, - "loss": 2.2714, - "step": 508010 - }, - { - "epoch": 0.89, - "learning_rate": 5.703707837344839e-06, - "loss": 2.3084, - "step": 508020 - }, - { - "epoch": 0.89, - "learning_rate": 5.7028358974180115e-06, - "loss": 2.2577, - "step": 508030 - }, - { - "epoch": 0.89, - "learning_rate": 5.7019639574911845e-06, - "loss": 2.2718, - "step": 508040 - }, - { - "epoch": 0.89, - "learning_rate": 5.701092017564358e-06, - "loss": 2.1751, - "step": 508050 - }, - { - "epoch": 0.89, - "learning_rate": 5.700220077637532e-06, - "loss": 2.3317, - "step": 508060 - }, - { - "epoch": 0.89, - "learning_rate": 5.699348137710705e-06, - "loss": 2.3454, - "step": 508070 - }, - { - "epoch": 0.89, - "learning_rate": 5.698476197783878e-06, - "loss": 2.2169, - "step": 508080 - }, - { - "epoch": 0.89, - "learning_rate": 5.697604257857051e-06, - "loss": 2.2388, - "step": 508090 - }, - { - "epoch": 0.89, - "learning_rate": 5.6967323179302245e-06, - "loss": 2.2028, - "step": 508100 - }, - { - "epoch": 0.89, - "learning_rate": 5.6958603780033975e-06, - "loss": 2.1465, - "step": 508110 - }, - { - "epoch": 0.89, - "learning_rate": 5.69498843807657e-06, - "loss": 2.3082, - "step": 508120 - }, - { - "epoch": 0.89, - "learning_rate": 5.694116498149743e-06, - "loss": 2.2831, - "step": 508130 - }, - { - "epoch": 0.89, - "learning_rate": 5.693244558222917e-06, - "loss": 2.2562, - "step": 508140 - }, - { - "epoch": 0.89, - "learning_rate": 5.69237261829609e-06, - "loss": 2.2695, - "step": 508150 - }, - { - "epoch": 0.89, - "learning_rate": 5.691500678369263e-06, - "loss": 2.1748, - "step": 508160 - }, - { - "epoch": 0.89, - "learning_rate": 5.690628738442437e-06, - "loss": 2.2731, - "step": 508170 - }, - { - "epoch": 0.89, - "learning_rate": 5.68975679851561e-06, - "loss": 2.2868, - "step": 508180 - }, - { - "epoch": 0.89, - "learning_rate": 5.688884858588783e-06, - "loss": 2.3056, - "step": 508190 - }, - { - "epoch": 0.89, - "learning_rate": 5.688012918661956e-06, - "loss": 2.2643, - "step": 508200 - }, - { - "epoch": 0.89, - "learning_rate": 5.687140978735129e-06, - "loss": 2.359, - "step": 508210 - }, - { - "epoch": 0.89, - "learning_rate": 5.686269038808303e-06, - "loss": 2.3279, - "step": 508220 - }, - { - "epoch": 0.89, - "learning_rate": 5.685397098881476e-06, - "loss": 2.2654, - "step": 508230 - }, - { - "epoch": 0.89, - "learning_rate": 5.684525158954649e-06, - "loss": 2.2779, - "step": 508240 - }, - { - "epoch": 0.89, - "learning_rate": 5.683653219027822e-06, - "loss": 2.2687, - "step": 508250 - }, - { - "epoch": 0.89, - "learning_rate": 5.6827812791009955e-06, - "loss": 2.3052, - "step": 508260 - }, - { - "epoch": 0.89, - "learning_rate": 5.6819093391741685e-06, - "loss": 2.149, - "step": 508270 - }, - { - "epoch": 0.89, - "learning_rate": 5.681037399247341e-06, - "loss": 2.3526, - "step": 508280 - }, - { - "epoch": 0.89, - "learning_rate": 5.680165459320515e-06, - "loss": 2.3333, - "step": 508290 - }, - { - "epoch": 0.89, - "learning_rate": 5.679293519393688e-06, - "loss": 2.2149, - "step": 508300 - }, - { - "epoch": 0.89, - "learning_rate": 5.678421579466861e-06, - "loss": 2.2141, - "step": 508310 - }, - { - "epoch": 0.89, - "learning_rate": 5.677549639540034e-06, - "loss": 2.2877, - "step": 508320 - }, - { - "epoch": 0.89, - "learning_rate": 5.676677699613208e-06, - "loss": 2.4112, - "step": 508330 - }, - { - "epoch": 0.89, - "learning_rate": 5.6758057596863815e-06, - "loss": 2.2136, - "step": 508340 - }, - { - "epoch": 0.89, - "learning_rate": 5.674933819759554e-06, - "loss": 2.4205, - "step": 508350 - }, - { - "epoch": 0.89, - "learning_rate": 5.674061879832727e-06, - "loss": 2.2566, - "step": 508360 - }, - { - "epoch": 0.89, - "learning_rate": 5.6731899399059e-06, - "loss": 2.2396, - "step": 508370 - }, - { - "epoch": 0.89, - "learning_rate": 5.672317999979074e-06, - "loss": 2.2402, - "step": 508380 - }, - { - "epoch": 0.89, - "learning_rate": 5.671446060052247e-06, - "loss": 2.2509, - "step": 508390 - }, - { - "epoch": 0.89, - "learning_rate": 5.67057412012542e-06, - "loss": 2.3423, - "step": 508400 - }, - { - "epoch": 0.89, - "learning_rate": 5.669702180198593e-06, - "loss": 2.2695, - "step": 508410 - }, - { - "epoch": 0.89, - "learning_rate": 5.6688302402717665e-06, - "loss": 2.2431, - "step": 508420 - }, - { - "epoch": 0.89, - "learning_rate": 5.6679583003449395e-06, - "loss": 2.3034, - "step": 508430 - }, - { - "epoch": 0.89, - "learning_rate": 5.667086360418112e-06, - "loss": 2.2382, - "step": 508440 - }, - { - "epoch": 0.89, - "learning_rate": 5.666214420491286e-06, - "loss": 2.2747, - "step": 508450 - }, - { - "epoch": 0.89, - "learning_rate": 5.66534248056446e-06, - "loss": 2.1605, - "step": 508460 - }, - { - "epoch": 0.89, - "learning_rate": 5.664470540637633e-06, - "loss": 2.1508, - "step": 508470 - }, - { - "epoch": 0.89, - "learning_rate": 5.663598600710806e-06, - "loss": 2.2271, - "step": 508480 - }, - { - "epoch": 0.89, - "learning_rate": 5.662726660783979e-06, - "loss": 2.2681, - "step": 508490 - }, - { - "epoch": 0.89, - "learning_rate": 5.6618547208571525e-06, - "loss": 2.3624, - "step": 508500 - }, - { - "epoch": 0.89, - "learning_rate": 5.660982780930325e-06, - "loss": 2.2473, - "step": 508510 - }, - { - "epoch": 0.89, - "learning_rate": 5.660110841003498e-06, - "loss": 2.2852, - "step": 508520 - }, - { - "epoch": 0.89, - "learning_rate": 5.659238901076671e-06, - "loss": 2.1924, - "step": 508530 - }, - { - "epoch": 0.89, - "learning_rate": 5.658366961149845e-06, - "loss": 2.3621, - "step": 508540 - }, - { - "epoch": 0.89, - "learning_rate": 5.657495021223018e-06, - "loss": 2.2584, - "step": 508550 - }, - { - "epoch": 0.89, - "learning_rate": 5.656623081296191e-06, - "loss": 2.1234, - "step": 508560 - }, - { - "epoch": 0.89, - "learning_rate": 5.655751141369365e-06, - "loss": 2.2888, - "step": 508570 - }, - { - "epoch": 0.89, - "learning_rate": 5.6548792014425375e-06, - "loss": 2.2229, - "step": 508580 - }, - { - "epoch": 0.89, - "learning_rate": 5.654007261515711e-06, - "loss": 2.1316, - "step": 508590 - }, - { - "epoch": 0.89, - "learning_rate": 5.653135321588884e-06, - "loss": 2.2716, - "step": 508600 - }, - { - "epoch": 0.89, - "learning_rate": 5.652263381662057e-06, - "loss": 2.3036, - "step": 508610 - }, - { - "epoch": 0.89, - "learning_rate": 5.651391441735231e-06, - "loss": 2.2546, - "step": 508620 - }, - { - "epoch": 0.89, - "learning_rate": 5.650519501808404e-06, - "loss": 2.276, - "step": 508630 - }, - { - "epoch": 0.89, - "learning_rate": 5.649647561881577e-06, - "loss": 2.1455, - "step": 508640 - }, - { - "epoch": 0.89, - "learning_rate": 5.64877562195475e-06, - "loss": 2.1219, - "step": 508650 - }, - { - "epoch": 0.89, - "learning_rate": 5.6479036820279235e-06, - "loss": 2.2864, - "step": 508660 - }, - { - "epoch": 0.89, - "learning_rate": 5.647031742101096e-06, - "loss": 2.2614, - "step": 508670 - }, - { - "epoch": 0.89, - "learning_rate": 5.646159802174269e-06, - "loss": 2.3457, - "step": 508680 - }, - { - "epoch": 0.89, - "learning_rate": 5.645287862247443e-06, - "loss": 2.3227, - "step": 508690 - }, - { - "epoch": 0.89, - "learning_rate": 5.644415922320616e-06, - "loss": 2.3275, - "step": 508700 - }, - { - "epoch": 0.89, - "learning_rate": 5.643543982393789e-06, - "loss": 2.3277, - "step": 508710 - }, - { - "epoch": 0.89, - "learning_rate": 5.642672042466962e-06, - "loss": 2.37, - "step": 508720 - }, - { - "epoch": 0.89, - "learning_rate": 5.641800102540136e-06, - "loss": 2.2139, - "step": 508730 - }, - { - "epoch": 0.89, - "learning_rate": 5.640928162613309e-06, - "loss": 2.2418, - "step": 508740 - }, - { - "epoch": 0.89, - "learning_rate": 5.640056222686482e-06, - "loss": 2.3203, - "step": 508750 - }, - { - "epoch": 0.89, - "learning_rate": 5.639184282759655e-06, - "loss": 2.2974, - "step": 508760 - }, - { - "epoch": 0.89, - "learning_rate": 5.638312342832828e-06, - "loss": 2.283, - "step": 508770 - }, - { - "epoch": 0.89, - "learning_rate": 5.637440402906002e-06, - "loss": 2.1615, - "step": 508780 - }, - { - "epoch": 0.89, - "learning_rate": 5.636568462979175e-06, - "loss": 2.3011, - "step": 508790 - }, - { - "epoch": 0.89, - "learning_rate": 5.635696523052348e-06, - "loss": 2.2619, - "step": 508800 - }, - { - "epoch": 0.89, - "learning_rate": 5.6348245831255216e-06, - "loss": 2.1892, - "step": 508810 - }, - { - "epoch": 0.89, - "learning_rate": 5.6339526431986945e-06, - "loss": 2.2376, - "step": 508820 - }, - { - "epoch": 0.89, - "learning_rate": 5.633080703271867e-06, - "loss": 2.2442, - "step": 508830 - }, - { - "epoch": 0.89, - "learning_rate": 5.63220876334504e-06, - "loss": 2.2402, - "step": 508840 - }, - { - "epoch": 0.89, - "learning_rate": 5.631336823418214e-06, - "loss": 2.2933, - "step": 508850 - }, - { - "epoch": 0.89, - "learning_rate": 5.630464883491388e-06, - "loss": 2.2493, - "step": 508860 - }, - { - "epoch": 0.89, - "learning_rate": 5.629592943564561e-06, - "loss": 2.3678, - "step": 508870 - }, - { - "epoch": 0.89, - "learning_rate": 5.628721003637734e-06, - "loss": 2.258, - "step": 508880 - }, - { - "epoch": 0.89, - "learning_rate": 5.627849063710907e-06, - "loss": 2.1946, - "step": 508890 - }, - { - "epoch": 0.89, - "learning_rate": 5.62697712378408e-06, - "loss": 2.3496, - "step": 508900 - }, - { - "epoch": 0.89, - "learning_rate": 5.626105183857253e-06, - "loss": 2.1847, - "step": 508910 - }, - { - "epoch": 0.89, - "learning_rate": 5.625233243930426e-06, - "loss": 2.2342, - "step": 508920 - }, - { - "epoch": 0.89, - "learning_rate": 5.6243613040036e-06, - "loss": 2.2799, - "step": 508930 - }, - { - "epoch": 0.89, - "learning_rate": 5.623489364076773e-06, - "loss": 2.1736, - "step": 508940 - }, - { - "epoch": 0.89, - "learning_rate": 5.622617424149946e-06, - "loss": 2.2335, - "step": 508950 - }, - { - "epoch": 0.89, - "learning_rate": 5.621745484223119e-06, - "loss": 2.2124, - "step": 508960 - }, - { - "epoch": 0.89, - "learning_rate": 5.6208735442962926e-06, - "loss": 2.2341, - "step": 508970 - }, - { - "epoch": 0.89, - "learning_rate": 5.6200016043694655e-06, - "loss": 2.2023, - "step": 508980 - }, - { - "epoch": 0.89, - "learning_rate": 5.619129664442639e-06, - "loss": 2.1772, - "step": 508990 - }, - { - "epoch": 0.89, - "learning_rate": 5.618257724515812e-06, - "loss": 2.2641, - "step": 509000 - }, - { - "epoch": 0.89, - "learning_rate": 5.617385784588985e-06, - "loss": 2.3531, - "step": 509010 - }, - { - "epoch": 0.89, - "learning_rate": 5.616513844662159e-06, - "loss": 2.3268, - "step": 509020 - }, - { - "epoch": 0.89, - "learning_rate": 5.615641904735332e-06, - "loss": 2.3518, - "step": 509030 - }, - { - "epoch": 0.89, - "learning_rate": 5.614769964808505e-06, - "loss": 2.1771, - "step": 509040 - }, - { - "epoch": 0.89, - "learning_rate": 5.613898024881678e-06, - "loss": 2.1436, - "step": 509050 - }, - { - "epoch": 0.89, - "learning_rate": 5.613026084954851e-06, - "loss": 2.2757, - "step": 509060 - }, - { - "epoch": 0.89, - "learning_rate": 5.612154145028024e-06, - "loss": 2.2329, - "step": 509070 - }, - { - "epoch": 0.89, - "learning_rate": 5.611282205101197e-06, - "loss": 2.1862, - "step": 509080 - }, - { - "epoch": 0.89, - "learning_rate": 5.610410265174371e-06, - "loss": 2.2006, - "step": 509090 - }, - { - "epoch": 0.89, - "learning_rate": 5.609538325247544e-06, - "loss": 2.2121, - "step": 509100 - }, - { - "epoch": 0.89, - "learning_rate": 5.608666385320717e-06, - "loss": 2.2618, - "step": 509110 - }, - { - "epoch": 0.89, - "learning_rate": 5.60779444539389e-06, - "loss": 2.1605, - "step": 509120 - }, - { - "epoch": 0.89, - "learning_rate": 5.6069225054670636e-06, - "loss": 2.2777, - "step": 509130 - }, - { - "epoch": 0.89, - "learning_rate": 5.606050565540237e-06, - "loss": 2.1992, - "step": 509140 - }, - { - "epoch": 0.89, - "learning_rate": 5.60517862561341e-06, - "loss": 2.4289, - "step": 509150 - }, - { - "epoch": 0.89, - "learning_rate": 5.604306685686583e-06, - "loss": 2.2566, - "step": 509160 - }, - { - "epoch": 0.89, - "learning_rate": 5.603434745759756e-06, - "loss": 2.1922, - "step": 509170 - }, - { - "epoch": 0.89, - "learning_rate": 5.60256280583293e-06, - "loss": 2.3092, - "step": 509180 - }, - { - "epoch": 0.89, - "learning_rate": 5.601690865906103e-06, - "loss": 2.256, - "step": 509190 - }, - { - "epoch": 0.89, - "learning_rate": 5.600818925979276e-06, - "loss": 2.3, - "step": 509200 - }, - { - "epoch": 0.89, - "learning_rate": 5.5999469860524495e-06, - "loss": 2.2695, - "step": 509210 - }, - { - "epoch": 0.89, - "learning_rate": 5.599075046125622e-06, - "loss": 2.2693, - "step": 509220 - }, - { - "epoch": 0.89, - "learning_rate": 5.598203106198795e-06, - "loss": 2.2433, - "step": 509230 - }, - { - "epoch": 0.89, - "learning_rate": 5.597331166271968e-06, - "loss": 2.3508, - "step": 509240 - }, - { - "epoch": 0.89, - "learning_rate": 5.596459226345142e-06, - "loss": 2.2617, - "step": 509250 - }, - { - "epoch": 0.89, - "learning_rate": 5.595587286418316e-06, - "loss": 2.3461, - "step": 509260 - }, - { - "epoch": 0.89, - "learning_rate": 5.594715346491489e-06, - "loss": 2.3406, - "step": 509270 - }, - { - "epoch": 0.89, - "learning_rate": 5.593843406564662e-06, - "loss": 2.2003, - "step": 509280 - }, - { - "epoch": 0.89, - "learning_rate": 5.5929714666378346e-06, - "loss": 2.3152, - "step": 509290 - }, - { - "epoch": 0.89, - "learning_rate": 5.592099526711008e-06, - "loss": 2.3209, - "step": 509300 - }, - { - "epoch": 0.89, - "learning_rate": 5.591227586784181e-06, - "loss": 2.316, - "step": 509310 - }, - { - "epoch": 0.89, - "learning_rate": 5.590355646857354e-06, - "loss": 2.2704, - "step": 509320 - }, - { - "epoch": 0.89, - "learning_rate": 5.589483706930528e-06, - "loss": 2.2949, - "step": 509330 - }, - { - "epoch": 0.89, - "learning_rate": 5.588611767003701e-06, - "loss": 2.2128, - "step": 509340 - }, - { - "epoch": 0.89, - "learning_rate": 5.587739827076874e-06, - "loss": 2.2718, - "step": 509350 - }, - { - "epoch": 0.89, - "learning_rate": 5.586867887150047e-06, - "loss": 2.2374, - "step": 509360 - }, - { - "epoch": 0.89, - "learning_rate": 5.5859959472232205e-06, - "loss": 2.3771, - "step": 509370 - }, - { - "epoch": 0.89, - "learning_rate": 5.585124007296393e-06, - "loss": 2.2608, - "step": 509380 - }, - { - "epoch": 0.89, - "learning_rate": 5.584252067369567e-06, - "loss": 2.3412, - "step": 509390 - }, - { - "epoch": 0.89, - "learning_rate": 5.58338012744274e-06, - "loss": 2.3458, - "step": 509400 - }, - { - "epoch": 0.89, - "learning_rate": 5.582508187515913e-06, - "loss": 2.229, - "step": 509410 - }, - { - "epoch": 0.89, - "learning_rate": 5.581636247589087e-06, - "loss": 2.1803, - "step": 509420 - }, - { - "epoch": 0.89, - "learning_rate": 5.58076430766226e-06, - "loss": 2.3263, - "step": 509430 - }, - { - "epoch": 0.89, - "learning_rate": 5.579892367735433e-06, - "loss": 2.3836, - "step": 509440 - }, - { - "epoch": 0.89, - "learning_rate": 5.579020427808606e-06, - "loss": 2.3734, - "step": 509450 - }, - { - "epoch": 0.89, - "learning_rate": 5.578148487881779e-06, - "loss": 2.2686, - "step": 509460 - }, - { - "epoch": 0.89, - "learning_rate": 5.577276547954952e-06, - "loss": 2.2114, - "step": 509470 - }, - { - "epoch": 0.89, - "learning_rate": 5.576404608028125e-06, - "loss": 2.2455, - "step": 509480 - }, - { - "epoch": 0.89, - "learning_rate": 5.575532668101299e-06, - "loss": 2.2265, - "step": 509490 - }, - { - "epoch": 0.89, - "learning_rate": 5.574660728174472e-06, - "loss": 2.2569, - "step": 509500 - }, - { - "epoch": 0.89, - "learning_rate": 5.573788788247645e-06, - "loss": 2.3354, - "step": 509510 - }, - { - "epoch": 0.89, - "learning_rate": 5.5729168483208186e-06, - "loss": 2.2563, - "step": 509520 - }, - { - "epoch": 0.89, - "learning_rate": 5.5720449083939915e-06, - "loss": 2.2377, - "step": 509530 - }, - { - "epoch": 0.89, - "learning_rate": 5.571172968467165e-06, - "loss": 2.1521, - "step": 509540 - }, - { - "epoch": 0.89, - "learning_rate": 5.570301028540338e-06, - "loss": 2.2455, - "step": 509550 - }, - { - "epoch": 0.89, - "learning_rate": 5.569429088613511e-06, - "loss": 2.2584, - "step": 509560 - }, - { - "epoch": 0.89, - "learning_rate": 5.568557148686684e-06, - "loss": 2.1928, - "step": 509570 - }, - { - "epoch": 0.89, - "learning_rate": 5.567685208759858e-06, - "loss": 2.3143, - "step": 509580 - }, - { - "epoch": 0.89, - "learning_rate": 5.566813268833031e-06, - "loss": 2.2344, - "step": 509590 - }, - { - "epoch": 0.89, - "learning_rate": 5.565941328906204e-06, - "loss": 2.2295, - "step": 509600 - }, - { - "epoch": 0.89, - "learning_rate": 5.565069388979377e-06, - "loss": 2.2551, - "step": 509610 - }, - { - "epoch": 0.89, - "learning_rate": 5.56419744905255e-06, - "loss": 2.1605, - "step": 509620 - }, - { - "epoch": 0.89, - "learning_rate": 5.563325509125723e-06, - "loss": 2.3948, - "step": 509630 - }, - { - "epoch": 0.89, - "learning_rate": 5.562453569198896e-06, - "loss": 2.2506, - "step": 509640 - }, - { - "epoch": 0.89, - "learning_rate": 5.56158162927207e-06, - "loss": 2.1878, - "step": 509650 - }, - { - "epoch": 0.89, - "learning_rate": 5.560709689345244e-06, - "loss": 2.1889, - "step": 509660 - }, - { - "epoch": 0.89, - "learning_rate": 5.559837749418417e-06, - "loss": 2.3158, - "step": 509670 - }, - { - "epoch": 0.89, - "learning_rate": 5.5589658094915896e-06, - "loss": 2.3191, - "step": 509680 - }, - { - "epoch": 0.89, - "learning_rate": 5.5580938695647625e-06, - "loss": 2.3427, - "step": 509690 - }, - { - "epoch": 0.89, - "learning_rate": 5.557221929637936e-06, - "loss": 2.2423, - "step": 509700 - }, - { - "epoch": 0.89, - "learning_rate": 5.556349989711109e-06, - "loss": 2.2898, - "step": 509710 - }, - { - "epoch": 0.89, - "learning_rate": 5.555478049784282e-06, - "loss": 2.2235, - "step": 509720 - }, - { - "epoch": 0.89, - "learning_rate": 5.554606109857456e-06, - "loss": 2.2739, - "step": 509730 - }, - { - "epoch": 0.89, - "learning_rate": 5.553734169930629e-06, - "loss": 2.2351, - "step": 509740 - }, - { - "epoch": 0.89, - "learning_rate": 5.552862230003802e-06, - "loss": 2.3216, - "step": 509750 - }, - { - "epoch": 0.89, - "learning_rate": 5.551990290076975e-06, - "loss": 2.2189, - "step": 509760 - }, - { - "epoch": 0.89, - "learning_rate": 5.551118350150148e-06, - "loss": 2.2153, - "step": 509770 - }, - { - "epoch": 0.89, - "learning_rate": 5.550246410223321e-06, - "loss": 2.3335, - "step": 509780 - }, - { - "epoch": 0.89, - "learning_rate": 5.549374470296495e-06, - "loss": 2.1769, - "step": 509790 - }, - { - "epoch": 0.89, - "learning_rate": 5.548502530369668e-06, - "loss": 2.3327, - "step": 509800 - }, - { - "epoch": 0.89, - "learning_rate": 5.547630590442841e-06, - "loss": 2.3144, - "step": 509810 - }, - { - "epoch": 0.89, - "learning_rate": 5.546758650516015e-06, - "loss": 2.3472, - "step": 509820 - }, - { - "epoch": 0.89, - "learning_rate": 5.545886710589188e-06, - "loss": 2.3731, - "step": 509830 - }, - { - "epoch": 0.89, - "learning_rate": 5.5450147706623606e-06, - "loss": 2.1678, - "step": 509840 - }, - { - "epoch": 0.89, - "learning_rate": 5.544142830735534e-06, - "loss": 2.2282, - "step": 509850 - }, - { - "epoch": 0.89, - "learning_rate": 5.543270890808707e-06, - "loss": 2.274, - "step": 509860 - }, - { - "epoch": 0.89, - "learning_rate": 5.54239895088188e-06, - "loss": 2.2727, - "step": 509870 - }, - { - "epoch": 0.89, - "learning_rate": 5.541527010955053e-06, - "loss": 2.2405, - "step": 509880 - }, - { - "epoch": 0.89, - "learning_rate": 5.540655071028227e-06, - "loss": 2.3198, - "step": 509890 - }, - { - "epoch": 0.89, - "learning_rate": 5.5397831311014e-06, - "loss": 2.1958, - "step": 509900 - }, - { - "epoch": 0.89, - "learning_rate": 5.538911191174573e-06, - "loss": 2.3599, - "step": 509910 - }, - { - "epoch": 0.89, - "learning_rate": 5.5380392512477465e-06, - "loss": 2.1867, - "step": 509920 - }, - { - "epoch": 0.89, - "learning_rate": 5.537167311320919e-06, - "loss": 2.3251, - "step": 509930 - }, - { - "epoch": 0.89, - "learning_rate": 5.536295371394093e-06, - "loss": 2.2423, - "step": 509940 - }, - { - "epoch": 0.89, - "learning_rate": 5.535423431467266e-06, - "loss": 2.2667, - "step": 509950 - }, - { - "epoch": 0.89, - "learning_rate": 5.534551491540439e-06, - "loss": 2.2884, - "step": 509960 - }, - { - "epoch": 0.89, - "learning_rate": 5.533679551613613e-06, - "loss": 2.3662, - "step": 509970 - }, - { - "epoch": 0.89, - "learning_rate": 5.532807611686786e-06, - "loss": 2.2808, - "step": 509980 - }, - { - "epoch": 0.89, - "learning_rate": 5.531935671759959e-06, - "loss": 2.3832, - "step": 509990 - }, - { - "epoch": 0.89, - "learning_rate": 5.5310637318331316e-06, - "loss": 2.4144, - "step": 510000 - }, - { - "epoch": 0.89, - "learning_rate": 5.530191791906305e-06, - "loss": 2.2125, - "step": 510010 - }, - { - "epoch": 0.89, - "learning_rate": 5.529319851979478e-06, - "loss": 2.3048, - "step": 510020 - }, - { - "epoch": 0.89, - "learning_rate": 5.528447912052651e-06, - "loss": 2.2973, - "step": 510030 - }, - { - "epoch": 0.89, - "learning_rate": 5.527575972125824e-06, - "loss": 2.3235, - "step": 510040 - }, - { - "epoch": 0.89, - "learning_rate": 5.526704032198998e-06, - "loss": 2.2495, - "step": 510050 - }, - { - "epoch": 0.89, - "learning_rate": 5.525832092272172e-06, - "loss": 2.2436, - "step": 510060 - }, - { - "epoch": 0.89, - "learning_rate": 5.5249601523453446e-06, - "loss": 2.3565, - "step": 510070 - }, - { - "epoch": 0.89, - "learning_rate": 5.5240882124185175e-06, - "loss": 2.2507, - "step": 510080 - }, - { - "epoch": 0.89, - "learning_rate": 5.52321627249169e-06, - "loss": 2.3677, - "step": 510090 - }, - { - "epoch": 0.89, - "learning_rate": 5.522344332564864e-06, - "loss": 2.2861, - "step": 510100 - }, - { - "epoch": 0.89, - "learning_rate": 5.521472392638037e-06, - "loss": 2.1411, - "step": 510110 - }, - { - "epoch": 0.89, - "learning_rate": 5.52060045271121e-06, - "loss": 2.1852, - "step": 510120 - }, - { - "epoch": 0.89, - "learning_rate": 5.519728512784384e-06, - "loss": 2.216, - "step": 510130 - }, - { - "epoch": 0.89, - "learning_rate": 5.518856572857557e-06, - "loss": 2.2152, - "step": 510140 - }, - { - "epoch": 0.89, - "learning_rate": 5.51798463293073e-06, - "loss": 2.1945, - "step": 510150 - }, - { - "epoch": 0.89, - "learning_rate": 5.5171126930039026e-06, - "loss": 2.2576, - "step": 510160 - }, - { - "epoch": 0.89, - "learning_rate": 5.516240753077076e-06, - "loss": 2.1602, - "step": 510170 - }, - { - "epoch": 0.89, - "learning_rate": 5.515368813150249e-06, - "loss": 2.2727, - "step": 510180 - }, - { - "epoch": 0.89, - "learning_rate": 5.514496873223423e-06, - "loss": 2.4091, - "step": 510190 - }, - { - "epoch": 0.89, - "learning_rate": 5.513624933296596e-06, - "loss": 2.4259, - "step": 510200 - }, - { - "epoch": 0.89, - "learning_rate": 5.512752993369769e-06, - "loss": 2.2588, - "step": 510210 - }, - { - "epoch": 0.89, - "learning_rate": 5.511881053442943e-06, - "loss": 2.2757, - "step": 510220 - }, - { - "epoch": 0.89, - "learning_rate": 5.5110091135161156e-06, - "loss": 2.2651, - "step": 510230 - }, - { - "epoch": 0.89, - "learning_rate": 5.5101371735892885e-06, - "loss": 2.2957, - "step": 510240 - }, - { - "epoch": 0.89, - "learning_rate": 5.509265233662462e-06, - "loss": 2.2636, - "step": 510250 - }, - { - "epoch": 0.89, - "learning_rate": 5.508393293735635e-06, - "loss": 2.3808, - "step": 510260 - }, - { - "epoch": 0.89, - "learning_rate": 5.507521353808808e-06, - "loss": 2.1696, - "step": 510270 - }, - { - "epoch": 0.89, - "learning_rate": 5.506649413881981e-06, - "loss": 2.4681, - "step": 510280 - }, - { - "epoch": 0.89, - "learning_rate": 5.505777473955155e-06, - "loss": 2.2999, - "step": 510290 - }, - { - "epoch": 0.89, - "learning_rate": 5.504905534028328e-06, - "loss": 2.3176, - "step": 510300 - }, - { - "epoch": 0.89, - "learning_rate": 5.504033594101501e-06, - "loss": 2.2589, - "step": 510310 - }, - { - "epoch": 0.89, - "learning_rate": 5.503161654174674e-06, - "loss": 2.1961, - "step": 510320 - }, - { - "epoch": 0.89, - "learning_rate": 5.502289714247847e-06, - "loss": 2.2342, - "step": 510330 - }, - { - "epoch": 0.89, - "learning_rate": 5.501417774321021e-06, - "loss": 2.2668, - "step": 510340 - }, - { - "epoch": 0.89, - "learning_rate": 5.500545834394194e-06, - "loss": 2.2841, - "step": 510350 - }, - { - "epoch": 0.89, - "learning_rate": 5.499673894467367e-06, - "loss": 2.2494, - "step": 510360 - }, - { - "epoch": 0.89, - "learning_rate": 5.498801954540541e-06, - "loss": 2.2685, - "step": 510370 - }, - { - "epoch": 0.89, - "learning_rate": 5.497930014613714e-06, - "loss": 2.2777, - "step": 510380 - }, - { - "epoch": 0.89, - "learning_rate": 5.4970580746868866e-06, - "loss": 2.246, - "step": 510390 - }, - { - "epoch": 0.89, - "learning_rate": 5.4961861347600595e-06, - "loss": 2.2426, - "step": 510400 - }, - { - "epoch": 0.89, - "learning_rate": 5.495314194833233e-06, - "loss": 2.2796, - "step": 510410 - }, - { - "epoch": 0.89, - "learning_rate": 5.494442254906406e-06, - "loss": 2.2836, - "step": 510420 - }, - { - "epoch": 0.89, - "learning_rate": 5.493570314979579e-06, - "loss": 2.1937, - "step": 510430 - }, - { - "epoch": 0.89, - "learning_rate": 5.492698375052752e-06, - "loss": 2.3509, - "step": 510440 - }, - { - "epoch": 0.89, - "learning_rate": 5.491826435125926e-06, - "loss": 2.3269, - "step": 510450 - }, - { - "epoch": 0.89, - "learning_rate": 5.4909544951990996e-06, - "loss": 2.2404, - "step": 510460 - }, - { - "epoch": 0.89, - "learning_rate": 5.4900825552722725e-06, - "loss": 2.3262, - "step": 510470 - }, - { - "epoch": 0.89, - "learning_rate": 5.489210615345445e-06, - "loss": 2.3424, - "step": 510480 - }, - { - "epoch": 0.89, - "learning_rate": 5.488338675418619e-06, - "loss": 2.2848, - "step": 510490 - }, - { - "epoch": 0.89, - "learning_rate": 5.487466735491792e-06, - "loss": 2.3122, - "step": 510500 - }, - { - "epoch": 0.89, - "learning_rate": 5.486594795564965e-06, - "loss": 2.2951, - "step": 510510 - }, - { - "epoch": 0.89, - "learning_rate": 5.485722855638138e-06, - "loss": 2.436, - "step": 510520 - }, - { - "epoch": 0.89, - "learning_rate": 5.484850915711312e-06, - "loss": 2.2551, - "step": 510530 - }, - { - "epoch": 0.89, - "learning_rate": 5.483978975784485e-06, - "loss": 2.3071, - "step": 510540 - }, - { - "epoch": 0.89, - "learning_rate": 5.4831070358576576e-06, - "loss": 2.2426, - "step": 510550 - }, - { - "epoch": 0.89, - "learning_rate": 5.4822350959308305e-06, - "loss": 2.2609, - "step": 510560 - }, - { - "epoch": 0.89, - "learning_rate": 5.481363156004004e-06, - "loss": 2.2851, - "step": 510570 - }, - { - "epoch": 0.89, - "learning_rate": 5.480491216077177e-06, - "loss": 2.3156, - "step": 510580 - }, - { - "epoch": 0.89, - "learning_rate": 5.479619276150351e-06, - "loss": 2.3329, - "step": 510590 - }, - { - "epoch": 0.89, - "learning_rate": 5.478747336223524e-06, - "loss": 2.2982, - "step": 510600 - }, - { - "epoch": 0.89, - "learning_rate": 5.477875396296697e-06, - "loss": 2.3496, - "step": 510610 - }, - { - "epoch": 0.89, - "learning_rate": 5.4770034563698706e-06, - "loss": 2.2336, - "step": 510620 - }, - { - "epoch": 0.89, - "learning_rate": 5.4761315164430435e-06, - "loss": 2.2675, - "step": 510630 - }, - { - "epoch": 0.89, - "learning_rate": 5.475259576516216e-06, - "loss": 2.3663, - "step": 510640 - }, - { - "epoch": 0.89, - "learning_rate": 5.47438763658939e-06, - "loss": 2.3795, - "step": 510650 - }, - { - "epoch": 0.89, - "learning_rate": 5.473515696662563e-06, - "loss": 2.233, - "step": 510660 - }, - { - "epoch": 0.89, - "learning_rate": 5.472643756735736e-06, - "loss": 2.1794, - "step": 510670 - }, - { - "epoch": 0.89, - "learning_rate": 5.471771816808909e-06, - "loss": 2.1895, - "step": 510680 - }, - { - "epoch": 0.89, - "learning_rate": 5.470899876882083e-06, - "loss": 2.2726, - "step": 510690 - }, - { - "epoch": 0.89, - "learning_rate": 5.470027936955256e-06, - "loss": 2.2078, - "step": 510700 - }, - { - "epoch": 0.89, - "learning_rate": 5.4691559970284286e-06, - "loss": 2.3125, - "step": 510710 - }, - { - "epoch": 0.89, - "learning_rate": 5.468284057101602e-06, - "loss": 2.1808, - "step": 510720 - }, - { - "epoch": 0.89, - "learning_rate": 5.467412117174775e-06, - "loss": 2.264, - "step": 510730 - }, - { - "epoch": 0.89, - "learning_rate": 5.466540177247949e-06, - "loss": 2.3058, - "step": 510740 - }, - { - "epoch": 0.89, - "learning_rate": 5.465668237321122e-06, - "loss": 2.2239, - "step": 510750 - }, - { - "epoch": 0.89, - "learning_rate": 5.464796297394295e-06, - "loss": 2.2397, - "step": 510760 - }, - { - "epoch": 0.89, - "learning_rate": 5.463924357467469e-06, - "loss": 2.2723, - "step": 510770 - }, - { - "epoch": 0.89, - "learning_rate": 5.4630524175406416e-06, - "loss": 2.3224, - "step": 510780 - }, - { - "epoch": 0.89, - "learning_rate": 5.4621804776138145e-06, - "loss": 2.238, - "step": 510790 - }, - { - "epoch": 0.89, - "learning_rate": 5.461308537686987e-06, - "loss": 2.2611, - "step": 510800 - }, - { - "epoch": 0.89, - "learning_rate": 5.460436597760161e-06, - "loss": 2.1392, - "step": 510810 - }, - { - "epoch": 0.89, - "learning_rate": 5.459564657833334e-06, - "loss": 2.3178, - "step": 510820 - }, - { - "epoch": 0.89, - "learning_rate": 5.458692717906507e-06, - "loss": 2.2393, - "step": 510830 - }, - { - "epoch": 0.89, - "learning_rate": 5.45782077797968e-06, - "loss": 2.2603, - "step": 510840 - }, - { - "epoch": 0.89, - "learning_rate": 5.456948838052854e-06, - "loss": 2.3749, - "step": 510850 - }, - { - "epoch": 0.89, - "learning_rate": 5.4560768981260275e-06, - "loss": 2.2313, - "step": 510860 - }, - { - "epoch": 0.89, - "learning_rate": 5.4552049581992e-06, - "loss": 2.2373, - "step": 510870 - }, - { - "epoch": 0.89, - "learning_rate": 5.454333018272373e-06, - "loss": 2.2272, - "step": 510880 - }, - { - "epoch": 0.89, - "learning_rate": 5.453461078345547e-06, - "loss": 2.2774, - "step": 510890 - }, - { - "epoch": 0.89, - "learning_rate": 5.45258913841872e-06, - "loss": 2.283, - "step": 510900 - }, - { - "epoch": 0.89, - "learning_rate": 5.451717198491893e-06, - "loss": 2.2939, - "step": 510910 - }, - { - "epoch": 0.89, - "learning_rate": 5.450845258565066e-06, - "loss": 2.2598, - "step": 510920 - }, - { - "epoch": 0.89, - "learning_rate": 5.44997331863824e-06, - "loss": 2.221, - "step": 510930 - }, - { - "epoch": 0.89, - "learning_rate": 5.4491013787114126e-06, - "loss": 2.1936, - "step": 510940 - }, - { - "epoch": 0.89, - "learning_rate": 5.4482294387845855e-06, - "loss": 2.1843, - "step": 510950 - }, - { - "epoch": 0.89, - "learning_rate": 5.447357498857758e-06, - "loss": 2.1677, - "step": 510960 - }, - { - "epoch": 0.89, - "learning_rate": 5.446485558930932e-06, - "loss": 2.2848, - "step": 510970 - }, - { - "epoch": 0.89, - "learning_rate": 5.445613619004105e-06, - "loss": 2.3419, - "step": 510980 - }, - { - "epoch": 0.89, - "learning_rate": 5.444741679077279e-06, - "loss": 2.1729, - "step": 510990 - }, - { - "epoch": 0.89, - "learning_rate": 5.443869739150452e-06, - "loss": 2.2758, - "step": 511000 - }, - { - "epoch": 0.89, - "learning_rate": 5.4429977992236256e-06, - "loss": 2.1078, - "step": 511010 - }, - { - "epoch": 0.89, - "learning_rate": 5.4421258592967985e-06, - "loss": 2.1945, - "step": 511020 - }, - { - "epoch": 0.89, - "learning_rate": 5.441253919369971e-06, - "loss": 2.1896, - "step": 511030 - }, - { - "epoch": 0.89, - "learning_rate": 5.440381979443144e-06, - "loss": 2.2856, - "step": 511040 - }, - { - "epoch": 0.89, - "learning_rate": 5.439510039516318e-06, - "loss": 2.2946, - "step": 511050 - }, - { - "epoch": 0.89, - "learning_rate": 5.438638099589491e-06, - "loss": 2.258, - "step": 511060 - }, - { - "epoch": 0.89, - "learning_rate": 5.437766159662664e-06, - "loss": 2.2819, - "step": 511070 - }, - { - "epoch": 0.89, - "learning_rate": 5.436894219735837e-06, - "loss": 2.2698, - "step": 511080 - }, - { - "epoch": 0.89, - "learning_rate": 5.436022279809011e-06, - "loss": 2.1662, - "step": 511090 - }, - { - "epoch": 0.89, - "learning_rate": 5.4351503398821836e-06, - "loss": 2.3341, - "step": 511100 - }, - { - "epoch": 0.89, - "learning_rate": 5.4342783999553565e-06, - "loss": 2.2918, - "step": 511110 - }, - { - "epoch": 0.89, - "learning_rate": 5.43340646002853e-06, - "loss": 2.3677, - "step": 511120 - }, - { - "epoch": 0.89, - "learning_rate": 5.432534520101703e-06, - "loss": 2.1571, - "step": 511130 - }, - { - "epoch": 0.89, - "learning_rate": 5.431662580174877e-06, - "loss": 2.2662, - "step": 511140 - }, - { - "epoch": 0.89, - "learning_rate": 5.43079064024805e-06, - "loss": 2.3866, - "step": 511150 - }, - { - "epoch": 0.89, - "learning_rate": 5.429918700321223e-06, - "loss": 2.2723, - "step": 511160 - }, - { - "epoch": 0.89, - "learning_rate": 5.4290467603943966e-06, - "loss": 2.3294, - "step": 511170 - }, - { - "epoch": 0.89, - "learning_rate": 5.4281748204675695e-06, - "loss": 2.3692, - "step": 511180 - }, - { - "epoch": 0.89, - "learning_rate": 5.427302880540742e-06, - "loss": 2.3073, - "step": 511190 - }, - { - "epoch": 0.89, - "learning_rate": 5.426430940613915e-06, - "loss": 2.2144, - "step": 511200 - }, - { - "epoch": 0.89, - "learning_rate": 5.425559000687089e-06, - "loss": 2.3322, - "step": 511210 - }, - { - "epoch": 0.89, - "learning_rate": 5.424687060760262e-06, - "loss": 2.302, - "step": 511220 - }, - { - "epoch": 0.89, - "learning_rate": 5.423815120833435e-06, - "loss": 2.2616, - "step": 511230 - }, - { - "epoch": 0.89, - "learning_rate": 5.422943180906608e-06, - "loss": 2.2938, - "step": 511240 - }, - { - "epoch": 0.89, - "learning_rate": 5.422071240979782e-06, - "loss": 2.2663, - "step": 511250 - }, - { - "epoch": 0.89, - "learning_rate": 5.421199301052955e-06, - "loss": 2.224, - "step": 511260 - }, - { - "epoch": 0.89, - "learning_rate": 5.420327361126128e-06, - "loss": 2.2447, - "step": 511270 - }, - { - "epoch": 0.89, - "learning_rate": 5.419455421199301e-06, - "loss": 2.2854, - "step": 511280 - }, - { - "epoch": 0.89, - "learning_rate": 5.418583481272475e-06, - "loss": 2.1463, - "step": 511290 - }, - { - "epoch": 0.89, - "learning_rate": 5.417711541345648e-06, - "loss": 2.2236, - "step": 511300 - }, - { - "epoch": 0.89, - "learning_rate": 5.416839601418821e-06, - "loss": 2.2563, - "step": 511310 - }, - { - "epoch": 0.89, - "learning_rate": 5.415967661491994e-06, - "loss": 2.2948, - "step": 511320 - }, - { - "epoch": 0.89, - "learning_rate": 5.4150957215651676e-06, - "loss": 2.2942, - "step": 511330 - }, - { - "epoch": 0.89, - "learning_rate": 5.4142237816383405e-06, - "loss": 2.2339, - "step": 511340 - }, - { - "epoch": 0.89, - "learning_rate": 5.413351841711513e-06, - "loss": 2.2539, - "step": 511350 - }, - { - "epoch": 0.89, - "learning_rate": 5.412479901784686e-06, - "loss": 2.1802, - "step": 511360 - }, - { - "epoch": 0.89, - "learning_rate": 5.41160796185786e-06, - "loss": 2.4136, - "step": 511370 - }, - { - "epoch": 0.89, - "learning_rate": 5.410736021931033e-06, - "loss": 2.3511, - "step": 511380 - }, - { - "epoch": 0.89, - "learning_rate": 5.409864082004207e-06, - "loss": 2.3067, - "step": 511390 - }, - { - "epoch": 0.89, - "learning_rate": 5.40899214207738e-06, - "loss": 2.124, - "step": 511400 - }, - { - "epoch": 0.89, - "learning_rate": 5.4081202021505535e-06, - "loss": 2.2015, - "step": 511410 - }, - { - "epoch": 0.89, - "learning_rate": 5.407248262223726e-06, - "loss": 2.3994, - "step": 511420 - }, - { - "epoch": 0.89, - "learning_rate": 5.406376322296899e-06, - "loss": 2.3992, - "step": 511430 - }, - { - "epoch": 0.89, - "learning_rate": 5.405504382370072e-06, - "loss": 2.3409, - "step": 511440 - }, - { - "epoch": 0.89, - "learning_rate": 5.404632442443246e-06, - "loss": 2.1062, - "step": 511450 - }, - { - "epoch": 0.89, - "learning_rate": 5.403760502516419e-06, - "loss": 2.3719, - "step": 511460 - }, - { - "epoch": 0.89, - "learning_rate": 5.402888562589592e-06, - "loss": 2.1949, - "step": 511470 - }, - { - "epoch": 0.89, - "learning_rate": 5.402016622662765e-06, - "loss": 2.2991, - "step": 511480 - }, - { - "epoch": 0.89, - "learning_rate": 5.4011446827359386e-06, - "loss": 2.2542, - "step": 511490 - }, - { - "epoch": 0.89, - "learning_rate": 5.4002727428091115e-06, - "loss": 2.1685, - "step": 511500 - }, - { - "epoch": 0.89, - "learning_rate": 5.399400802882284e-06, - "loss": 2.2354, - "step": 511510 - }, - { - "epoch": 0.89, - "learning_rate": 5.398528862955458e-06, - "loss": 2.3169, - "step": 511520 - }, - { - "epoch": 0.89, - "learning_rate": 5.397656923028632e-06, - "loss": 2.2275, - "step": 511530 - }, - { - "epoch": 0.89, - "learning_rate": 5.396784983101805e-06, - "loss": 2.2645, - "step": 511540 - }, - { - "epoch": 0.89, - "learning_rate": 5.395913043174978e-06, - "loss": 2.2077, - "step": 511550 - }, - { - "epoch": 0.89, - "learning_rate": 5.395041103248151e-06, - "loss": 2.1074, - "step": 511560 - }, - { - "epoch": 0.89, - "learning_rate": 5.3941691633213245e-06, - "loss": 2.1995, - "step": 511570 - }, - { - "epoch": 0.89, - "learning_rate": 5.393297223394497e-06, - "loss": 2.2277, - "step": 511580 - }, - { - "epoch": 0.89, - "learning_rate": 5.39242528346767e-06, - "loss": 2.3782, - "step": 511590 - }, - { - "epoch": 0.89, - "learning_rate": 5.391553343540843e-06, - "loss": 2.2061, - "step": 511600 - }, - { - "epoch": 0.89, - "learning_rate": 5.390681403614017e-06, - "loss": 2.1489, - "step": 511610 - }, - { - "epoch": 0.89, - "learning_rate": 5.38980946368719e-06, - "loss": 2.2483, - "step": 511620 - }, - { - "epoch": 0.89, - "learning_rate": 5.388937523760363e-06, - "loss": 2.2349, - "step": 511630 - }, - { - "epoch": 0.89, - "learning_rate": 5.388065583833536e-06, - "loss": 2.24, - "step": 511640 - }, - { - "epoch": 0.89, - "learning_rate": 5.3871936439067096e-06, - "loss": 2.3654, - "step": 511650 - }, - { - "epoch": 0.89, - "learning_rate": 5.386321703979883e-06, - "loss": 2.2811, - "step": 511660 - }, - { - "epoch": 0.89, - "learning_rate": 5.385449764053056e-06, - "loss": 2.2968, - "step": 511670 - }, - { - "epoch": 0.89, - "learning_rate": 5.384577824126229e-06, - "loss": 2.2853, - "step": 511680 - }, - { - "epoch": 0.89, - "learning_rate": 5.383705884199403e-06, - "loss": 2.2684, - "step": 511690 - }, - { - "epoch": 0.89, - "learning_rate": 5.382833944272576e-06, - "loss": 2.2308, - "step": 511700 - }, - { - "epoch": 0.89, - "learning_rate": 5.381962004345749e-06, - "loss": 2.2383, - "step": 511710 - }, - { - "epoch": 0.89, - "learning_rate": 5.381090064418922e-06, - "loss": 2.2661, - "step": 511720 - }, - { - "epoch": 0.89, - "learning_rate": 5.3802181244920955e-06, - "loss": 2.3197, - "step": 511730 - }, - { - "epoch": 0.89, - "learning_rate": 5.379346184565268e-06, - "loss": 2.2325, - "step": 511740 - }, - { - "epoch": 0.89, - "learning_rate": 5.378474244638441e-06, - "loss": 2.302, - "step": 511750 - }, - { - "epoch": 0.89, - "learning_rate": 5.377602304711614e-06, - "loss": 2.27, - "step": 511760 - }, - { - "epoch": 0.89, - "learning_rate": 5.376730364784788e-06, - "loss": 2.2423, - "step": 511770 - }, - { - "epoch": 0.89, - "learning_rate": 5.375858424857961e-06, - "loss": 2.2773, - "step": 511780 - }, - { - "epoch": 0.89, - "learning_rate": 5.374986484931135e-06, - "loss": 2.2993, - "step": 511790 - }, - { - "epoch": 0.89, - "learning_rate": 5.374114545004308e-06, - "loss": 2.3681, - "step": 511800 - }, - { - "epoch": 0.89, - "learning_rate": 5.373242605077481e-06, - "loss": 2.3318, - "step": 511810 - }, - { - "epoch": 0.89, - "learning_rate": 5.372370665150654e-06, - "loss": 2.2256, - "step": 511820 - }, - { - "epoch": 0.89, - "learning_rate": 5.371498725223827e-06, - "loss": 2.156, - "step": 511830 - }, - { - "epoch": 0.89, - "learning_rate": 5.370626785297e-06, - "loss": 2.2427, - "step": 511840 - }, - { - "epoch": 0.89, - "learning_rate": 5.369754845370174e-06, - "loss": 2.2281, - "step": 511850 - }, - { - "epoch": 0.89, - "learning_rate": 5.368882905443347e-06, - "loss": 2.3782, - "step": 511860 - }, - { - "epoch": 0.89, - "learning_rate": 5.36801096551652e-06, - "loss": 2.3052, - "step": 511870 - }, - { - "epoch": 0.89, - "learning_rate": 5.367139025589693e-06, - "loss": 2.2224, - "step": 511880 - }, - { - "epoch": 0.89, - "learning_rate": 5.3662670856628665e-06, - "loss": 2.2821, - "step": 511890 - }, - { - "epoch": 0.89, - "learning_rate": 5.365395145736039e-06, - "loss": 2.1424, - "step": 511900 - }, - { - "epoch": 0.89, - "learning_rate": 5.364523205809212e-06, - "loss": 2.293, - "step": 511910 - }, - { - "epoch": 0.89, - "learning_rate": 5.363651265882386e-06, - "loss": 2.2403, - "step": 511920 - }, - { - "epoch": 0.89, - "learning_rate": 5.36277932595556e-06, - "loss": 2.3008, - "step": 511930 - }, - { - "epoch": 0.89, - "learning_rate": 5.361907386028733e-06, - "loss": 2.2682, - "step": 511940 - }, - { - "epoch": 0.89, - "learning_rate": 5.361035446101906e-06, - "loss": 2.2489, - "step": 511950 - }, - { - "epoch": 0.89, - "learning_rate": 5.360163506175079e-06, - "loss": 2.2857, - "step": 511960 - }, - { - "epoch": 0.89, - "learning_rate": 5.3592915662482524e-06, - "loss": 2.1506, - "step": 511970 - }, - { - "epoch": 0.89, - "learning_rate": 5.358419626321425e-06, - "loss": 2.2695, - "step": 511980 - }, - { - "epoch": 0.89, - "learning_rate": 5.357547686394598e-06, - "loss": 2.2661, - "step": 511990 - }, - { - "epoch": 0.89, - "learning_rate": 5.356675746467771e-06, - "loss": 2.2549, - "step": 512000 - }, - { - "epoch": 0.89, - "learning_rate": 5.355803806540945e-06, - "loss": 2.2187, - "step": 512010 - }, - { - "epoch": 0.89, - "learning_rate": 5.354931866614118e-06, - "loss": 2.27, - "step": 512020 - }, - { - "epoch": 0.89, - "learning_rate": 5.354059926687291e-06, - "loss": 2.306, - "step": 512030 - }, - { - "epoch": 0.89, - "learning_rate": 5.353187986760464e-06, - "loss": 2.2194, - "step": 512040 - }, - { - "epoch": 0.89, - "learning_rate": 5.352316046833638e-06, - "loss": 2.3538, - "step": 512050 - }, - { - "epoch": 0.89, - "learning_rate": 5.351444106906811e-06, - "loss": 2.3239, - "step": 512060 - }, - { - "epoch": 0.89, - "learning_rate": 5.350572166979984e-06, - "loss": 2.3953, - "step": 512070 - }, - { - "epoch": 0.89, - "learning_rate": 5.349700227053157e-06, - "loss": 2.2457, - "step": 512080 - }, - { - "epoch": 0.89, - "learning_rate": 5.348828287126331e-06, - "loss": 2.2872, - "step": 512090 - }, - { - "epoch": 0.89, - "learning_rate": 5.347956347199504e-06, - "loss": 2.299, - "step": 512100 - }, - { - "epoch": 0.89, - "learning_rate": 5.347084407272677e-06, - "loss": 2.1982, - "step": 512110 - }, - { - "epoch": 0.89, - "learning_rate": 5.34621246734585e-06, - "loss": 2.3518, - "step": 512120 - }, - { - "epoch": 0.89, - "learning_rate": 5.3453405274190234e-06, - "loss": 2.2571, - "step": 512130 - }, - { - "epoch": 0.89, - "learning_rate": 5.344468587492196e-06, - "loss": 2.1696, - "step": 512140 - }, - { - "epoch": 0.89, - "learning_rate": 5.343596647565369e-06, - "loss": 2.2993, - "step": 512150 - }, - { - "epoch": 0.89, - "learning_rate": 5.342724707638542e-06, - "loss": 2.2531, - "step": 512160 - }, - { - "epoch": 0.89, - "learning_rate": 5.341852767711716e-06, - "loss": 2.2456, - "step": 512170 - }, - { - "epoch": 0.89, - "learning_rate": 5.34098082778489e-06, - "loss": 2.2739, - "step": 512180 - }, - { - "epoch": 0.89, - "learning_rate": 5.340108887858063e-06, - "loss": 2.2563, - "step": 512190 - }, - { - "epoch": 0.89, - "learning_rate": 5.339236947931236e-06, - "loss": 2.2973, - "step": 512200 - }, - { - "epoch": 0.89, - "learning_rate": 5.338365008004409e-06, - "loss": 2.351, - "step": 512210 - }, - { - "epoch": 0.89, - "learning_rate": 5.337493068077582e-06, - "loss": 2.3167, - "step": 512220 - }, - { - "epoch": 0.89, - "learning_rate": 5.336621128150755e-06, - "loss": 2.3529, - "step": 512230 - }, - { - "epoch": 0.89, - "learning_rate": 5.335749188223928e-06, - "loss": 2.3235, - "step": 512240 - }, - { - "epoch": 0.89, - "learning_rate": 5.334877248297102e-06, - "loss": 2.3297, - "step": 512250 - }, - { - "epoch": 0.89, - "learning_rate": 5.334005308370275e-06, - "loss": 2.2412, - "step": 512260 - }, - { - "epoch": 0.89, - "learning_rate": 5.333133368443448e-06, - "loss": 2.3433, - "step": 512270 - }, - { - "epoch": 0.89, - "learning_rate": 5.332261428516621e-06, - "loss": 2.3544, - "step": 512280 - }, - { - "epoch": 0.89, - "learning_rate": 5.3313894885897944e-06, - "loss": 2.2506, - "step": 512290 - }, - { - "epoch": 0.89, - "learning_rate": 5.330517548662967e-06, - "loss": 2.2883, - "step": 512300 - }, - { - "epoch": 0.89, - "learning_rate": 5.32964560873614e-06, - "loss": 2.4513, - "step": 512310 - }, - { - "epoch": 0.89, - "learning_rate": 5.328773668809314e-06, - "loss": 2.1872, - "step": 512320 - }, - { - "epoch": 0.89, - "learning_rate": 5.327901728882488e-06, - "loss": 2.274, - "step": 512330 - }, - { - "epoch": 0.89, - "learning_rate": 5.327029788955661e-06, - "loss": 2.2684, - "step": 512340 - }, - { - "epoch": 0.89, - "learning_rate": 5.326157849028834e-06, - "loss": 2.2136, - "step": 512350 - }, - { - "epoch": 0.89, - "learning_rate": 5.325285909102007e-06, - "loss": 2.2834, - "step": 512360 - }, - { - "epoch": 0.89, - "learning_rate": 5.32441396917518e-06, - "loss": 2.2629, - "step": 512370 - }, - { - "epoch": 0.89, - "learning_rate": 5.323542029248353e-06, - "loss": 2.2922, - "step": 512380 - }, - { - "epoch": 0.89, - "learning_rate": 5.322670089321526e-06, - "loss": 2.2504, - "step": 512390 - }, - { - "epoch": 0.89, - "learning_rate": 5.321798149394699e-06, - "loss": 2.2566, - "step": 512400 - }, - { - "epoch": 0.89, - "learning_rate": 5.320926209467873e-06, - "loss": 2.2666, - "step": 512410 - }, - { - "epoch": 0.89, - "learning_rate": 5.320054269541046e-06, - "loss": 2.2112, - "step": 512420 - }, - { - "epoch": 0.89, - "learning_rate": 5.319182329614219e-06, - "loss": 2.2987, - "step": 512430 - }, - { - "epoch": 0.89, - "learning_rate": 5.318310389687392e-06, - "loss": 2.2448, - "step": 512440 - }, - { - "epoch": 0.89, - "learning_rate": 5.317438449760566e-06, - "loss": 2.4219, - "step": 512450 - }, - { - "epoch": 0.89, - "learning_rate": 5.316566509833739e-06, - "loss": 2.3049, - "step": 512460 - }, - { - "epoch": 0.89, - "learning_rate": 5.315694569906912e-06, - "loss": 2.0955, - "step": 512470 - }, - { - "epoch": 0.89, - "learning_rate": 5.314822629980085e-06, - "loss": 2.2934, - "step": 512480 - }, - { - "epoch": 0.89, - "learning_rate": 5.313950690053259e-06, - "loss": 2.2965, - "step": 512490 - }, - { - "epoch": 0.89, - "learning_rate": 5.313078750126432e-06, - "loss": 2.2089, - "step": 512500 - }, - { - "epoch": 0.89, - "learning_rate": 5.312206810199605e-06, - "loss": 2.2439, - "step": 512510 - }, - { - "epoch": 0.89, - "learning_rate": 5.311334870272778e-06, - "loss": 2.1566, - "step": 512520 - }, - { - "epoch": 0.89, - "learning_rate": 5.310462930345951e-06, - "loss": 2.2268, - "step": 512530 - }, - { - "epoch": 0.89, - "learning_rate": 5.309590990419124e-06, - "loss": 2.2544, - "step": 512540 - }, - { - "epoch": 0.89, - "learning_rate": 5.308719050492297e-06, - "loss": 2.3779, - "step": 512550 - }, - { - "epoch": 0.89, - "learning_rate": 5.30784711056547e-06, - "loss": 2.2076, - "step": 512560 - }, - { - "epoch": 0.89, - "learning_rate": 5.306975170638644e-06, - "loss": 2.1645, - "step": 512570 - }, - { - "epoch": 0.89, - "learning_rate": 5.306103230711818e-06, - "loss": 2.3083, - "step": 512580 - }, - { - "epoch": 0.89, - "learning_rate": 5.305231290784991e-06, - "loss": 2.3269, - "step": 512590 - }, - { - "epoch": 0.89, - "learning_rate": 5.3043593508581635e-06, - "loss": 2.2693, - "step": 512600 - }, - { - "epoch": 0.89, - "learning_rate": 5.303487410931337e-06, - "loss": 2.2745, - "step": 512610 - }, - { - "epoch": 0.89, - "learning_rate": 5.30261547100451e-06, - "loss": 2.4016, - "step": 512620 - }, - { - "epoch": 0.89, - "learning_rate": 5.301743531077683e-06, - "loss": 2.2593, - "step": 512630 - }, - { - "epoch": 0.89, - "learning_rate": 5.300871591150856e-06, - "loss": 2.2923, - "step": 512640 - }, - { - "epoch": 0.89, - "learning_rate": 5.29999965122403e-06, - "loss": 2.1238, - "step": 512650 - }, - { - "epoch": 0.89, - "learning_rate": 5.299127711297203e-06, - "loss": 2.2287, - "step": 512660 - }, - { - "epoch": 0.89, - "learning_rate": 5.298255771370376e-06, - "loss": 2.3338, - "step": 512670 - }, - { - "epoch": 0.89, - "learning_rate": 5.297383831443549e-06, - "loss": 2.3479, - "step": 512680 - }, - { - "epoch": 0.89, - "learning_rate": 5.296511891516722e-06, - "loss": 2.2157, - "step": 512690 - }, - { - "epoch": 0.89, - "learning_rate": 5.295639951589895e-06, - "loss": 2.3302, - "step": 512700 - }, - { - "epoch": 0.89, - "learning_rate": 5.294768011663068e-06, - "loss": 2.2426, - "step": 512710 - }, - { - "epoch": 0.89, - "learning_rate": 5.293896071736242e-06, - "loss": 2.2872, - "step": 512720 - }, - { - "epoch": 0.89, - "learning_rate": 5.293024131809416e-06, - "loss": 2.3373, - "step": 512730 - }, - { - "epoch": 0.89, - "learning_rate": 5.292152191882589e-06, - "loss": 2.2322, - "step": 512740 - }, - { - "epoch": 0.89, - "learning_rate": 5.291280251955762e-06, - "loss": 2.3059, - "step": 512750 - }, - { - "epoch": 0.89, - "learning_rate": 5.2904083120289345e-06, - "loss": 2.3434, - "step": 512760 - }, - { - "epoch": 0.89, - "learning_rate": 5.289536372102108e-06, - "loss": 2.322, - "step": 512770 - }, - { - "epoch": 0.89, - "learning_rate": 5.288664432175281e-06, - "loss": 2.2284, - "step": 512780 - }, - { - "epoch": 0.89, - "learning_rate": 5.287792492248454e-06, - "loss": 2.1309, - "step": 512790 - }, - { - "epoch": 0.89, - "learning_rate": 5.286920552321627e-06, - "loss": 2.2271, - "step": 512800 - }, - { - "epoch": 0.89, - "learning_rate": 5.286048612394801e-06, - "loss": 2.344, - "step": 512810 - }, - { - "epoch": 0.89, - "learning_rate": 5.285176672467974e-06, - "loss": 2.2979, - "step": 512820 - }, - { - "epoch": 0.89, - "learning_rate": 5.284304732541147e-06, - "loss": 2.1304, - "step": 512830 - }, - { - "epoch": 0.89, - "learning_rate": 5.28343279261432e-06, - "loss": 2.3161, - "step": 512840 - }, - { - "epoch": 0.89, - "learning_rate": 5.282560852687494e-06, - "loss": 2.1802, - "step": 512850 - }, - { - "epoch": 0.89, - "learning_rate": 5.281688912760667e-06, - "loss": 2.3718, - "step": 512860 - }, - { - "epoch": 0.89, - "learning_rate": 5.28081697283384e-06, - "loss": 2.2452, - "step": 512870 - }, - { - "epoch": 0.89, - "learning_rate": 5.279945032907013e-06, - "loss": 2.315, - "step": 512880 - }, - { - "epoch": 0.89, - "learning_rate": 5.279073092980187e-06, - "loss": 2.2408, - "step": 512890 - }, - { - "epoch": 0.89, - "learning_rate": 5.27820115305336e-06, - "loss": 2.246, - "step": 512900 - }, - { - "epoch": 0.89, - "learning_rate": 5.277329213126533e-06, - "loss": 2.1831, - "step": 512910 - }, - { - "epoch": 0.89, - "learning_rate": 5.2764572731997055e-06, - "loss": 2.2811, - "step": 512920 - }, - { - "epoch": 0.89, - "learning_rate": 5.275585333272879e-06, - "loss": 2.2394, - "step": 512930 - }, - { - "epoch": 0.89, - "learning_rate": 5.274713393346052e-06, - "loss": 2.3966, - "step": 512940 - }, - { - "epoch": 0.89, - "learning_rate": 5.273841453419225e-06, - "loss": 2.2805, - "step": 512950 - }, - { - "epoch": 0.89, - "learning_rate": 5.272969513492398e-06, - "loss": 2.446, - "step": 512960 - }, - { - "epoch": 0.89, - "learning_rate": 5.272097573565572e-06, - "loss": 2.2132, - "step": 512970 - }, - { - "epoch": 0.89, - "learning_rate": 5.271225633638746e-06, - "loss": 2.3732, - "step": 512980 - }, - { - "epoch": 0.89, - "learning_rate": 5.2703536937119185e-06, - "loss": 2.2326, - "step": 512990 - }, - { - "epoch": 0.89, - "learning_rate": 5.2694817537850914e-06, - "loss": 2.2309, - "step": 513000 - }, - { - "epoch": 0.89, - "learning_rate": 5.268609813858265e-06, - "loss": 2.1917, - "step": 513010 - }, - { - "epoch": 0.89, - "learning_rate": 5.267737873931438e-06, - "loss": 2.2397, - "step": 513020 - }, - { - "epoch": 0.89, - "learning_rate": 5.266865934004611e-06, - "loss": 2.3611, - "step": 513030 - }, - { - "epoch": 0.89, - "learning_rate": 5.265993994077784e-06, - "loss": 2.2185, - "step": 513040 - }, - { - "epoch": 0.89, - "learning_rate": 5.265122054150958e-06, - "loss": 2.2885, - "step": 513050 - }, - { - "epoch": 0.89, - "learning_rate": 5.264250114224131e-06, - "loss": 2.2926, - "step": 513060 - }, - { - "epoch": 0.89, - "learning_rate": 5.263378174297304e-06, - "loss": 2.2783, - "step": 513070 - }, - { - "epoch": 0.89, - "learning_rate": 5.2625062343704765e-06, - "loss": 2.3394, - "step": 513080 - }, - { - "epoch": 0.89, - "learning_rate": 5.26163429444365e-06, - "loss": 2.2252, - "step": 513090 - }, - { - "epoch": 0.89, - "learning_rate": 5.260762354516823e-06, - "loss": 2.2015, - "step": 513100 - }, - { - "epoch": 0.89, - "learning_rate": 5.259890414589996e-06, - "loss": 2.3232, - "step": 513110 - }, - { - "epoch": 0.89, - "learning_rate": 5.25901847466317e-06, - "loss": 2.2167, - "step": 513120 - }, - { - "epoch": 0.89, - "learning_rate": 5.258146534736344e-06, - "loss": 2.3465, - "step": 513130 - }, - { - "epoch": 0.89, - "learning_rate": 5.257274594809517e-06, - "loss": 2.2193, - "step": 513140 - }, - { - "epoch": 0.89, - "learning_rate": 5.2564026548826895e-06, - "loss": 2.2969, - "step": 513150 - }, - { - "epoch": 0.89, - "learning_rate": 5.2555307149558624e-06, - "loss": 2.3211, - "step": 513160 - }, - { - "epoch": 0.89, - "learning_rate": 5.254658775029036e-06, - "loss": 2.1609, - "step": 513170 - }, - { - "epoch": 0.89, - "learning_rate": 5.253786835102209e-06, - "loss": 2.3062, - "step": 513180 - }, - { - "epoch": 0.89, - "learning_rate": 5.252914895175382e-06, - "loss": 2.1905, - "step": 513190 - }, - { - "epoch": 0.89, - "learning_rate": 5.252042955248555e-06, - "loss": 2.2434, - "step": 513200 - }, - { - "epoch": 0.89, - "learning_rate": 5.251171015321729e-06, - "loss": 2.2633, - "step": 513210 - }, - { - "epoch": 0.89, - "learning_rate": 5.250299075394902e-06, - "loss": 2.2319, - "step": 513220 - }, - { - "epoch": 0.9, - "learning_rate": 5.249427135468075e-06, - "loss": 2.2493, - "step": 513230 - }, - { - "epoch": 0.9, - "learning_rate": 5.2485551955412475e-06, - "loss": 2.2346, - "step": 513240 - }, - { - "epoch": 0.9, - "learning_rate": 5.247683255614422e-06, - "loss": 2.2032, - "step": 513250 - }, - { - "epoch": 0.9, - "learning_rate": 5.246811315687595e-06, - "loss": 2.1809, - "step": 513260 - }, - { - "epoch": 0.9, - "learning_rate": 5.245939375760768e-06, - "loss": 2.2361, - "step": 513270 - }, - { - "epoch": 0.9, - "learning_rate": 5.245067435833941e-06, - "loss": 2.2075, - "step": 513280 - }, - { - "epoch": 0.9, - "learning_rate": 5.244195495907115e-06, - "loss": 2.313, - "step": 513290 - }, - { - "epoch": 0.9, - "learning_rate": 5.243323555980288e-06, - "loss": 2.2252, - "step": 513300 - }, - { - "epoch": 0.9, - "learning_rate": 5.2424516160534605e-06, - "loss": 2.2204, - "step": 513310 - }, - { - "epoch": 0.9, - "learning_rate": 5.2415796761266334e-06, - "loss": 2.3906, - "step": 513320 - }, - { - "epoch": 0.9, - "learning_rate": 5.240707736199807e-06, - "loss": 2.18, - "step": 513330 - }, - { - "epoch": 0.9, - "learning_rate": 5.23983579627298e-06, - "loss": 2.3192, - "step": 513340 - }, - { - "epoch": 0.9, - "learning_rate": 5.238963856346153e-06, - "loss": 2.3066, - "step": 513350 - }, - { - "epoch": 0.9, - "learning_rate": 5.238091916419326e-06, - "loss": 2.2329, - "step": 513360 - }, - { - "epoch": 0.9, - "learning_rate": 5.2372199764925e-06, - "loss": 2.2315, - "step": 513370 - }, - { - "epoch": 0.9, - "learning_rate": 5.2363480365656735e-06, - "loss": 2.2982, - "step": 513380 - }, - { - "epoch": 0.9, - "learning_rate": 5.2354760966388464e-06, - "loss": 2.2814, - "step": 513390 - }, - { - "epoch": 0.9, - "learning_rate": 5.234604156712019e-06, - "loss": 2.2339, - "step": 513400 - }, - { - "epoch": 0.9, - "learning_rate": 5.233732216785193e-06, - "loss": 2.2323, - "step": 513410 - }, - { - "epoch": 0.9, - "learning_rate": 5.232860276858366e-06, - "loss": 2.1848, - "step": 513420 - }, - { - "epoch": 0.9, - "learning_rate": 5.231988336931539e-06, - "loss": 2.2788, - "step": 513430 - }, - { - "epoch": 0.9, - "learning_rate": 5.231116397004712e-06, - "loss": 2.2934, - "step": 513440 - }, - { - "epoch": 0.9, - "learning_rate": 5.230244457077886e-06, - "loss": 2.2143, - "step": 513450 - }, - { - "epoch": 0.9, - "learning_rate": 5.229372517151059e-06, - "loss": 2.2688, - "step": 513460 - }, - { - "epoch": 0.9, - "learning_rate": 5.2285005772242315e-06, - "loss": 2.19, - "step": 513470 - }, - { - "epoch": 0.9, - "learning_rate": 5.2276286372974044e-06, - "loss": 2.3097, - "step": 513480 - }, - { - "epoch": 0.9, - "learning_rate": 5.226756697370578e-06, - "loss": 2.2913, - "step": 513490 - }, - { - "epoch": 0.9, - "learning_rate": 5.225884757443751e-06, - "loss": 2.3146, - "step": 513500 - }, - { - "epoch": 0.9, - "learning_rate": 5.225012817516924e-06, - "loss": 2.2467, - "step": 513510 - }, - { - "epoch": 0.9, - "learning_rate": 5.224140877590098e-06, - "loss": 2.3027, - "step": 513520 - }, - { - "epoch": 0.9, - "learning_rate": 5.223268937663272e-06, - "loss": 2.2686, - "step": 513530 - }, - { - "epoch": 0.9, - "learning_rate": 5.2223969977364445e-06, - "loss": 2.2298, - "step": 513540 - }, - { - "epoch": 0.9, - "learning_rate": 5.2215250578096174e-06, - "loss": 2.3097, - "step": 513550 - }, - { - "epoch": 0.9, - "learning_rate": 5.22065311788279e-06, - "loss": 2.2786, - "step": 513560 - }, - { - "epoch": 0.9, - "learning_rate": 5.219781177955964e-06, - "loss": 2.2232, - "step": 513570 - }, - { - "epoch": 0.9, - "learning_rate": 5.218909238029137e-06, - "loss": 2.2427, - "step": 513580 - }, - { - "epoch": 0.9, - "learning_rate": 5.21803729810231e-06, - "loss": 2.2906, - "step": 513590 - }, - { - "epoch": 0.9, - "learning_rate": 5.217165358175483e-06, - "loss": 2.2631, - "step": 513600 - }, - { - "epoch": 0.9, - "learning_rate": 5.216293418248657e-06, - "loss": 2.2727, - "step": 513610 - }, - { - "epoch": 0.9, - "learning_rate": 5.21542147832183e-06, - "loss": 2.2733, - "step": 513620 - }, - { - "epoch": 0.9, - "learning_rate": 5.2145495383950025e-06, - "loss": 2.205, - "step": 513630 - }, - { - "epoch": 0.9, - "learning_rate": 5.2136775984681754e-06, - "loss": 2.2376, - "step": 513640 - }, - { - "epoch": 0.9, - "learning_rate": 5.21280565854135e-06, - "loss": 2.2815, - "step": 513650 - }, - { - "epoch": 0.9, - "learning_rate": 5.211933718614523e-06, - "loss": 2.2405, - "step": 513660 - }, - { - "epoch": 0.9, - "learning_rate": 5.211061778687696e-06, - "loss": 2.2366, - "step": 513670 - }, - { - "epoch": 0.9, - "learning_rate": 5.210189838760869e-06, - "loss": 2.3076, - "step": 513680 - }, - { - "epoch": 0.9, - "learning_rate": 5.209317898834043e-06, - "loss": 2.3428, - "step": 513690 - }, - { - "epoch": 0.9, - "learning_rate": 5.2084459589072155e-06, - "loss": 2.2164, - "step": 513700 - }, - { - "epoch": 0.9, - "learning_rate": 5.2075740189803884e-06, - "loss": 2.2783, - "step": 513710 - }, - { - "epoch": 0.9, - "learning_rate": 5.206702079053561e-06, - "loss": 2.2364, - "step": 513720 - }, - { - "epoch": 0.9, - "learning_rate": 5.205830139126735e-06, - "loss": 2.2361, - "step": 513730 - }, - { - "epoch": 0.9, - "learning_rate": 5.204958199199908e-06, - "loss": 2.2871, - "step": 513740 - }, - { - "epoch": 0.9, - "learning_rate": 5.204086259273081e-06, - "loss": 2.2327, - "step": 513750 - }, - { - "epoch": 0.9, - "learning_rate": 5.203214319346254e-06, - "loss": 2.2165, - "step": 513760 - }, - { - "epoch": 0.9, - "learning_rate": 5.202342379419428e-06, - "loss": 2.2321, - "step": 513770 - }, - { - "epoch": 0.9, - "learning_rate": 5.2014704394926014e-06, - "loss": 2.3313, - "step": 513780 - }, - { - "epoch": 0.9, - "learning_rate": 5.200598499565774e-06, - "loss": 2.2406, - "step": 513790 - }, - { - "epoch": 0.9, - "learning_rate": 5.199726559638947e-06, - "loss": 2.3602, - "step": 513800 - }, - { - "epoch": 0.9, - "learning_rate": 5.198854619712121e-06, - "loss": 2.2617, - "step": 513810 - }, - { - "epoch": 0.9, - "learning_rate": 5.197982679785294e-06, - "loss": 2.279, - "step": 513820 - }, - { - "epoch": 0.9, - "learning_rate": 5.197110739858467e-06, - "loss": 2.2192, - "step": 513830 - }, - { - "epoch": 0.9, - "learning_rate": 5.19623879993164e-06, - "loss": 2.3324, - "step": 513840 - }, - { - "epoch": 0.9, - "learning_rate": 5.195366860004814e-06, - "loss": 2.1915, - "step": 513850 - }, - { - "epoch": 0.9, - "learning_rate": 5.1944949200779865e-06, - "loss": 2.1952, - "step": 513860 - }, - { - "epoch": 0.9, - "learning_rate": 5.1936229801511594e-06, - "loss": 2.3669, - "step": 513870 - }, - { - "epoch": 0.9, - "learning_rate": 5.192751040224332e-06, - "loss": 2.2627, - "step": 513880 - }, - { - "epoch": 0.9, - "learning_rate": 5.191879100297506e-06, - "loss": 2.2434, - "step": 513890 - }, - { - "epoch": 0.9, - "learning_rate": 5.191007160370679e-06, - "loss": 2.2205, - "step": 513900 - }, - { - "epoch": 0.9, - "learning_rate": 5.190135220443853e-06, - "loss": 2.2157, - "step": 513910 - }, - { - "epoch": 0.9, - "learning_rate": 5.189263280517026e-06, - "loss": 2.3101, - "step": 513920 - }, - { - "epoch": 0.9, - "learning_rate": 5.1883913405901995e-06, - "loss": 2.2545, - "step": 513930 - }, - { - "epoch": 0.9, - "learning_rate": 5.1875194006633724e-06, - "loss": 2.1713, - "step": 513940 - }, - { - "epoch": 0.9, - "learning_rate": 5.186647460736545e-06, - "loss": 2.3031, - "step": 513950 - }, - { - "epoch": 0.9, - "learning_rate": 5.185775520809718e-06, - "loss": 2.3885, - "step": 513960 - }, - { - "epoch": 0.9, - "learning_rate": 5.184903580882892e-06, - "loss": 2.1403, - "step": 513970 - }, - { - "epoch": 0.9, - "learning_rate": 5.184031640956065e-06, - "loss": 2.2268, - "step": 513980 - }, - { - "epoch": 0.9, - "learning_rate": 5.183159701029238e-06, - "loss": 2.395, - "step": 513990 - }, - { - "epoch": 0.9, - "learning_rate": 5.182287761102411e-06, - "loss": 2.2282, - "step": 514000 - }, - { - "epoch": 0.9, - "learning_rate": 5.181415821175585e-06, - "loss": 2.2612, - "step": 514010 - }, - { - "epoch": 0.9, - "learning_rate": 5.1805438812487575e-06, - "loss": 2.1963, - "step": 514020 - }, - { - "epoch": 0.9, - "learning_rate": 5.1796719413219304e-06, - "loss": 2.3589, - "step": 514030 - }, - { - "epoch": 0.9, - "learning_rate": 5.178800001395104e-06, - "loss": 2.3, - "step": 514040 - }, - { - "epoch": 0.9, - "learning_rate": 5.177928061468278e-06, - "loss": 2.3973, - "step": 514050 - }, - { - "epoch": 0.9, - "learning_rate": 5.177056121541451e-06, - "loss": 2.2845, - "step": 514060 - }, - { - "epoch": 0.9, - "learning_rate": 5.176184181614624e-06, - "loss": 2.2899, - "step": 514070 - }, - { - "epoch": 0.9, - "learning_rate": 5.175312241687797e-06, - "loss": 2.2468, - "step": 514080 - }, - { - "epoch": 0.9, - "learning_rate": 5.1744403017609705e-06, - "loss": 2.2456, - "step": 514090 - }, - { - "epoch": 0.9, - "learning_rate": 5.1735683618341434e-06, - "loss": 2.3201, - "step": 514100 - }, - { - "epoch": 0.9, - "learning_rate": 5.172696421907316e-06, - "loss": 2.3784, - "step": 514110 - }, - { - "epoch": 0.9, - "learning_rate": 5.171824481980489e-06, - "loss": 2.2391, - "step": 514120 - }, - { - "epoch": 0.9, - "learning_rate": 5.170952542053663e-06, - "loss": 2.3727, - "step": 514130 - }, - { - "epoch": 0.9, - "learning_rate": 5.170080602126836e-06, - "loss": 2.215, - "step": 514140 - }, - { - "epoch": 0.9, - "learning_rate": 5.169208662200009e-06, - "loss": 2.2997, - "step": 514150 - }, - { - "epoch": 0.9, - "learning_rate": 5.168336722273182e-06, - "loss": 2.2188, - "step": 514160 - }, - { - "epoch": 0.9, - "learning_rate": 5.167464782346356e-06, - "loss": 2.1892, - "step": 514170 - }, - { - "epoch": 0.9, - "learning_rate": 5.166592842419529e-06, - "loss": 2.2618, - "step": 514180 - }, - { - "epoch": 0.9, - "learning_rate": 5.165720902492702e-06, - "loss": 2.1794, - "step": 514190 - }, - { - "epoch": 0.9, - "learning_rate": 5.164848962565875e-06, - "loss": 2.2582, - "step": 514200 - }, - { - "epoch": 0.9, - "learning_rate": 5.163977022639049e-06, - "loss": 2.2837, - "step": 514210 - }, - { - "epoch": 0.9, - "learning_rate": 5.163105082712222e-06, - "loss": 2.2692, - "step": 514220 - }, - { - "epoch": 0.9, - "learning_rate": 5.162233142785395e-06, - "loss": 2.2486, - "step": 514230 - }, - { - "epoch": 0.9, - "learning_rate": 5.161361202858568e-06, - "loss": 2.291, - "step": 514240 - }, - { - "epoch": 0.9, - "learning_rate": 5.1604892629317415e-06, - "loss": 2.317, - "step": 514250 - }, - { - "epoch": 0.9, - "learning_rate": 5.1596173230049144e-06, - "loss": 2.2754, - "step": 514260 - }, - { - "epoch": 0.9, - "learning_rate": 5.158745383078087e-06, - "loss": 2.3341, - "step": 514270 - }, - { - "epoch": 0.9, - "learning_rate": 5.15787344315126e-06, - "loss": 2.2683, - "step": 514280 - }, - { - "epoch": 0.9, - "learning_rate": 5.157001503224434e-06, - "loss": 2.3755, - "step": 514290 - }, - { - "epoch": 0.9, - "learning_rate": 5.156129563297607e-06, - "loss": 2.2242, - "step": 514300 - }, - { - "epoch": 0.9, - "learning_rate": 5.155257623370781e-06, - "loss": 2.3078, - "step": 514310 - }, - { - "epoch": 0.9, - "learning_rate": 5.154385683443954e-06, - "loss": 2.3127, - "step": 514320 - }, - { - "epoch": 0.9, - "learning_rate": 5.1535137435171274e-06, - "loss": 2.2057, - "step": 514330 - }, - { - "epoch": 0.9, - "learning_rate": 5.1526418035903e-06, - "loss": 2.1615, - "step": 514340 - }, - { - "epoch": 0.9, - "learning_rate": 5.151769863663473e-06, - "loss": 2.3326, - "step": 514350 - }, - { - "epoch": 0.9, - "learning_rate": 5.150897923736646e-06, - "loss": 2.2082, - "step": 514360 - }, - { - "epoch": 0.9, - "learning_rate": 5.15002598380982e-06, - "loss": 2.3897, - "step": 514370 - }, - { - "epoch": 0.9, - "learning_rate": 5.149154043882993e-06, - "loss": 2.2876, - "step": 514380 - }, - { - "epoch": 0.9, - "learning_rate": 5.148282103956166e-06, - "loss": 2.2841, - "step": 514390 - }, - { - "epoch": 0.9, - "learning_rate": 5.147410164029339e-06, - "loss": 2.3195, - "step": 514400 - }, - { - "epoch": 0.9, - "learning_rate": 5.1465382241025125e-06, - "loss": 2.1948, - "step": 514410 - }, - { - "epoch": 0.9, - "learning_rate": 5.1456662841756854e-06, - "loss": 2.2485, - "step": 514420 - }, - { - "epoch": 0.9, - "learning_rate": 5.144794344248858e-06, - "loss": 2.3106, - "step": 514430 - }, - { - "epoch": 0.9, - "learning_rate": 5.143922404322032e-06, - "loss": 2.2281, - "step": 514440 - }, - { - "epoch": 0.9, - "learning_rate": 5.143050464395206e-06, - "loss": 2.3458, - "step": 514450 - }, - { - "epoch": 0.9, - "learning_rate": 5.142178524468379e-06, - "loss": 2.3234, - "step": 514460 - }, - { - "epoch": 0.9, - "learning_rate": 5.141306584541552e-06, - "loss": 2.2389, - "step": 514470 - }, - { - "epoch": 0.9, - "learning_rate": 5.140434644614725e-06, - "loss": 2.3251, - "step": 514480 - }, - { - "epoch": 0.9, - "learning_rate": 5.1395627046878984e-06, - "loss": 2.3358, - "step": 514490 - }, - { - "epoch": 0.9, - "learning_rate": 5.138690764761071e-06, - "loss": 2.2691, - "step": 514500 - }, - { - "epoch": 0.9, - "learning_rate": 5.137818824834244e-06, - "loss": 2.2367, - "step": 514510 - }, - { - "epoch": 0.9, - "learning_rate": 5.136946884907417e-06, - "loss": 2.1643, - "step": 514520 - }, - { - "epoch": 0.9, - "learning_rate": 5.136074944980591e-06, - "loss": 2.2477, - "step": 514530 - }, - { - "epoch": 0.9, - "learning_rate": 5.135203005053764e-06, - "loss": 2.2165, - "step": 514540 - }, - { - "epoch": 0.9, - "learning_rate": 5.134331065126937e-06, - "loss": 2.3012, - "step": 514550 - }, - { - "epoch": 0.9, - "learning_rate": 5.133459125200111e-06, - "loss": 2.258, - "step": 514560 - }, - { - "epoch": 0.9, - "learning_rate": 5.1325871852732835e-06, - "loss": 2.1746, - "step": 514570 - }, - { - "epoch": 0.9, - "learning_rate": 5.131715245346457e-06, - "loss": 2.2574, - "step": 514580 - }, - { - "epoch": 0.9, - "learning_rate": 5.13084330541963e-06, - "loss": 2.1625, - "step": 514590 - }, - { - "epoch": 0.9, - "learning_rate": 5.129971365492803e-06, - "loss": 2.1993, - "step": 514600 - }, - { - "epoch": 0.9, - "learning_rate": 5.129099425565977e-06, - "loss": 2.2614, - "step": 514610 - }, - { - "epoch": 0.9, - "learning_rate": 5.12822748563915e-06, - "loss": 2.3084, - "step": 514620 - }, - { - "epoch": 0.9, - "learning_rate": 5.127355545712323e-06, - "loss": 2.3887, - "step": 514630 - }, - { - "epoch": 0.9, - "learning_rate": 5.126483605785496e-06, - "loss": 2.2438, - "step": 514640 - }, - { - "epoch": 0.9, - "learning_rate": 5.1256116658586694e-06, - "loss": 2.2365, - "step": 514650 - }, - { - "epoch": 0.9, - "learning_rate": 5.124739725931842e-06, - "loss": 2.1789, - "step": 514660 - }, - { - "epoch": 0.9, - "learning_rate": 5.123867786005015e-06, - "loss": 2.0957, - "step": 514670 - }, - { - "epoch": 0.9, - "learning_rate": 5.122995846078188e-06, - "loss": 2.2446, - "step": 514680 - }, - { - "epoch": 0.9, - "learning_rate": 5.122123906151362e-06, - "loss": 2.106, - "step": 514690 - }, - { - "epoch": 0.9, - "learning_rate": 5.121251966224535e-06, - "loss": 2.1888, - "step": 514700 - }, - { - "epoch": 0.9, - "learning_rate": 5.120380026297709e-06, - "loss": 2.3343, - "step": 514710 - }, - { - "epoch": 0.9, - "learning_rate": 5.119508086370882e-06, - "loss": 2.2012, - "step": 514720 - }, - { - "epoch": 0.9, - "learning_rate": 5.118636146444055e-06, - "loss": 2.2114, - "step": 514730 - }, - { - "epoch": 0.9, - "learning_rate": 5.117764206517228e-06, - "loss": 2.2862, - "step": 514740 - }, - { - "epoch": 0.9, - "learning_rate": 5.116892266590401e-06, - "loss": 2.2171, - "step": 514750 - }, - { - "epoch": 0.9, - "learning_rate": 5.116020326663574e-06, - "loss": 2.2877, - "step": 514760 - }, - { - "epoch": 0.9, - "learning_rate": 5.115148386736748e-06, - "loss": 2.2584, - "step": 514770 - }, - { - "epoch": 0.9, - "learning_rate": 5.114276446809921e-06, - "loss": 2.3612, - "step": 514780 - }, - { - "epoch": 0.9, - "learning_rate": 5.113404506883094e-06, - "loss": 2.225, - "step": 514790 - }, - { - "epoch": 0.9, - "learning_rate": 5.112532566956267e-06, - "loss": 2.1403, - "step": 514800 - }, - { - "epoch": 0.9, - "learning_rate": 5.1116606270294404e-06, - "loss": 2.2973, - "step": 514810 - }, - { - "epoch": 0.9, - "learning_rate": 5.110788687102613e-06, - "loss": 2.2042, - "step": 514820 - }, - { - "epoch": 0.9, - "learning_rate": 5.109916747175786e-06, - "loss": 2.2414, - "step": 514830 - }, - { - "epoch": 0.9, - "learning_rate": 5.10904480724896e-06, - "loss": 2.2583, - "step": 514840 - }, - { - "epoch": 0.9, - "learning_rate": 5.108172867322134e-06, - "loss": 2.1739, - "step": 514850 - }, - { - "epoch": 0.9, - "learning_rate": 5.107300927395307e-06, - "loss": 2.3166, - "step": 514860 - }, - { - "epoch": 0.9, - "learning_rate": 5.10642898746848e-06, - "loss": 2.1834, - "step": 514870 - }, - { - "epoch": 0.9, - "learning_rate": 5.105557047541653e-06, - "loss": 2.2431, - "step": 514880 - }, - { - "epoch": 0.9, - "learning_rate": 5.104685107614826e-06, - "loss": 2.2381, - "step": 514890 - }, - { - "epoch": 0.9, - "learning_rate": 5.103813167687999e-06, - "loss": 2.368, - "step": 514900 - }, - { - "epoch": 0.9, - "learning_rate": 5.102941227761172e-06, - "loss": 2.1904, - "step": 514910 - }, - { - "epoch": 0.9, - "learning_rate": 5.102069287834345e-06, - "loss": 2.2537, - "step": 514920 - }, - { - "epoch": 0.9, - "learning_rate": 5.101197347907519e-06, - "loss": 2.3752, - "step": 514930 - }, - { - "epoch": 0.9, - "learning_rate": 5.100325407980692e-06, - "loss": 2.3194, - "step": 514940 - }, - { - "epoch": 0.9, - "learning_rate": 5.099453468053865e-06, - "loss": 2.1961, - "step": 514950 - }, - { - "epoch": 0.9, - "learning_rate": 5.0985815281270385e-06, - "loss": 2.3353, - "step": 514960 - }, - { - "epoch": 0.9, - "learning_rate": 5.0977095882002114e-06, - "loss": 2.2617, - "step": 514970 - }, - { - "epoch": 0.9, - "learning_rate": 5.096837648273385e-06, - "loss": 2.3163, - "step": 514980 - }, - { - "epoch": 0.9, - "learning_rate": 5.095965708346558e-06, - "loss": 2.371, - "step": 514990 - }, - { - "epoch": 0.9, - "learning_rate": 5.095093768419731e-06, - "loss": 2.2294, - "step": 515000 - }, - { - "epoch": 0.9, - "learning_rate": 5.094221828492905e-06, - "loss": 2.3285, - "step": 515010 - }, - { - "epoch": 0.9, - "learning_rate": 5.093349888566078e-06, - "loss": 2.3376, - "step": 515020 - }, - { - "epoch": 0.9, - "learning_rate": 5.092477948639251e-06, - "loss": 2.283, - "step": 515030 - }, - { - "epoch": 0.9, - "learning_rate": 5.091606008712424e-06, - "loss": 2.3314, - "step": 515040 - }, - { - "epoch": 0.9, - "learning_rate": 5.090734068785597e-06, - "loss": 2.2515, - "step": 515050 - }, - { - "epoch": 0.9, - "learning_rate": 5.08986212885877e-06, - "loss": 2.209, - "step": 515060 - }, - { - "epoch": 0.9, - "learning_rate": 5.088990188931943e-06, - "loss": 2.2928, - "step": 515070 - }, - { - "epoch": 0.9, - "learning_rate": 5.088118249005117e-06, - "loss": 2.3726, - "step": 515080 - }, - { - "epoch": 0.9, - "learning_rate": 5.08724630907829e-06, - "loss": 2.2422, - "step": 515090 - }, - { - "epoch": 0.9, - "learning_rate": 5.086374369151463e-06, - "loss": 2.1573, - "step": 515100 - }, - { - "epoch": 0.9, - "learning_rate": 5.085502429224637e-06, - "loss": 2.3291, - "step": 515110 - }, - { - "epoch": 0.9, - "learning_rate": 5.0846304892978095e-06, - "loss": 2.2443, - "step": 515120 - }, - { - "epoch": 0.9, - "learning_rate": 5.083758549370983e-06, - "loss": 2.2336, - "step": 515130 - }, - { - "epoch": 0.9, - "learning_rate": 5.082886609444156e-06, - "loss": 2.2559, - "step": 515140 - }, - { - "epoch": 0.9, - "learning_rate": 5.082014669517329e-06, - "loss": 2.299, - "step": 515150 - }, - { - "epoch": 0.9, - "learning_rate": 5.081142729590502e-06, - "loss": 2.2009, - "step": 515160 - }, - { - "epoch": 0.9, - "learning_rate": 5.080270789663676e-06, - "loss": 2.3425, - "step": 515170 - }, - { - "epoch": 0.9, - "learning_rate": 5.079398849736849e-06, - "loss": 2.293, - "step": 515180 - }, - { - "epoch": 0.9, - "learning_rate": 5.078526909810022e-06, - "loss": 2.362, - "step": 515190 - }, - { - "epoch": 0.9, - "learning_rate": 5.0776549698831955e-06, - "loss": 2.2181, - "step": 515200 - }, - { - "epoch": 0.9, - "learning_rate": 5.076783029956368e-06, - "loss": 2.2915, - "step": 515210 - }, - { - "epoch": 0.9, - "learning_rate": 5.075911090029541e-06, - "loss": 2.2451, - "step": 515220 - }, - { - "epoch": 0.9, - "learning_rate": 5.075039150102714e-06, - "loss": 2.3105, - "step": 515230 - }, - { - "epoch": 0.9, - "learning_rate": 5.074167210175888e-06, - "loss": 2.0912, - "step": 515240 - }, - { - "epoch": 0.9, - "learning_rate": 5.073295270249062e-06, - "loss": 2.1843, - "step": 515250 - }, - { - "epoch": 0.9, - "learning_rate": 5.072423330322235e-06, - "loss": 2.2207, - "step": 515260 - }, - { - "epoch": 0.9, - "learning_rate": 5.071551390395408e-06, - "loss": 2.219, - "step": 515270 - }, - { - "epoch": 0.9, - "learning_rate": 5.0706794504685805e-06, - "loss": 2.2459, - "step": 515280 - }, - { - "epoch": 0.9, - "learning_rate": 5.069807510541754e-06, - "loss": 2.2264, - "step": 515290 - }, - { - "epoch": 0.9, - "learning_rate": 5.068935570614927e-06, - "loss": 2.2928, - "step": 515300 - }, - { - "epoch": 0.9, - "learning_rate": 5.0680636306881e-06, - "loss": 2.2671, - "step": 515310 - }, - { - "epoch": 0.9, - "learning_rate": 5.067191690761273e-06, - "loss": 2.3022, - "step": 515320 - }, - { - "epoch": 0.9, - "learning_rate": 5.066319750834447e-06, - "loss": 2.2385, - "step": 515330 - }, - { - "epoch": 0.9, - "learning_rate": 5.06544781090762e-06, - "loss": 2.2358, - "step": 515340 - }, - { - "epoch": 0.9, - "learning_rate": 5.064575870980793e-06, - "loss": 2.2837, - "step": 515350 - }, - { - "epoch": 0.9, - "learning_rate": 5.0637039310539665e-06, - "loss": 2.2385, - "step": 515360 - }, - { - "epoch": 0.9, - "learning_rate": 5.062831991127139e-06, - "loss": 2.271, - "step": 515370 - }, - { - "epoch": 0.9, - "learning_rate": 5.061960051200313e-06, - "loss": 2.3844, - "step": 515380 - }, - { - "epoch": 0.9, - "learning_rate": 5.061088111273486e-06, - "loss": 2.3452, - "step": 515390 - }, - { - "epoch": 0.9, - "learning_rate": 5.060216171346659e-06, - "loss": 2.3057, - "step": 515400 - }, - { - "epoch": 0.9, - "learning_rate": 5.059344231419833e-06, - "loss": 2.2243, - "step": 515410 - }, - { - "epoch": 0.9, - "learning_rate": 5.058472291493006e-06, - "loss": 2.2366, - "step": 515420 - }, - { - "epoch": 0.9, - "learning_rate": 5.057600351566179e-06, - "loss": 2.1997, - "step": 515430 - }, - { - "epoch": 0.9, - "learning_rate": 5.0567284116393515e-06, - "loss": 2.3399, - "step": 515440 - }, - { - "epoch": 0.9, - "learning_rate": 5.055856471712525e-06, - "loss": 2.2418, - "step": 515450 - }, - { - "epoch": 0.9, - "learning_rate": 5.054984531785698e-06, - "loss": 2.222, - "step": 515460 - }, - { - "epoch": 0.9, - "learning_rate": 5.054112591858871e-06, - "loss": 2.3959, - "step": 515470 - }, - { - "epoch": 0.9, - "learning_rate": 5.053240651932045e-06, - "loss": 2.3114, - "step": 515480 - }, - { - "epoch": 0.9, - "learning_rate": 5.052368712005218e-06, - "loss": 2.3983, - "step": 515490 - }, - { - "epoch": 0.9, - "learning_rate": 5.051496772078391e-06, - "loss": 2.2309, - "step": 515500 - }, - { - "epoch": 0.9, - "learning_rate": 5.0506248321515645e-06, - "loss": 2.2379, - "step": 515510 - }, - { - "epoch": 0.9, - "learning_rate": 5.0497528922247375e-06, - "loss": 2.3814, - "step": 515520 - }, - { - "epoch": 0.9, - "learning_rate": 5.048880952297911e-06, - "loss": 2.3612, - "step": 515530 - }, - { - "epoch": 0.9, - "learning_rate": 5.048009012371084e-06, - "loss": 2.3129, - "step": 515540 - }, - { - "epoch": 0.9, - "learning_rate": 5.047137072444257e-06, - "loss": 2.1822, - "step": 515550 - }, - { - "epoch": 0.9, - "learning_rate": 5.04626513251743e-06, - "loss": 2.233, - "step": 515560 - }, - { - "epoch": 0.9, - "learning_rate": 5.045393192590604e-06, - "loss": 2.2463, - "step": 515570 - }, - { - "epoch": 0.9, - "learning_rate": 5.044521252663777e-06, - "loss": 2.1413, - "step": 515580 - }, - { - "epoch": 0.9, - "learning_rate": 5.04364931273695e-06, - "loss": 2.1995, - "step": 515590 - }, - { - "epoch": 0.9, - "learning_rate": 5.042777372810123e-06, - "loss": 2.2349, - "step": 515600 - }, - { - "epoch": 0.9, - "learning_rate": 5.041905432883296e-06, - "loss": 2.2724, - "step": 515610 - }, - { - "epoch": 0.9, - "learning_rate": 5.041033492956469e-06, - "loss": 2.3007, - "step": 515620 - }, - { - "epoch": 0.9, - "learning_rate": 5.040161553029642e-06, - "loss": 2.2676, - "step": 515630 - }, - { - "epoch": 0.9, - "learning_rate": 5.039289613102816e-06, - "loss": 2.1814, - "step": 515640 - }, - { - "epoch": 0.9, - "learning_rate": 5.03841767317599e-06, - "loss": 2.3337, - "step": 515650 - }, - { - "epoch": 0.9, - "learning_rate": 5.037545733249163e-06, - "loss": 2.2476, - "step": 515660 - }, - { - "epoch": 0.9, - "learning_rate": 5.0366737933223355e-06, - "loss": 2.1537, - "step": 515670 - }, - { - "epoch": 0.9, - "learning_rate": 5.0358018533955085e-06, - "loss": 2.2787, - "step": 515680 - }, - { - "epoch": 0.9, - "learning_rate": 5.034929913468682e-06, - "loss": 2.3596, - "step": 515690 - }, - { - "epoch": 0.9, - "learning_rate": 5.034057973541855e-06, - "loss": 2.3354, - "step": 515700 - }, - { - "epoch": 0.9, - "learning_rate": 5.033186033615028e-06, - "loss": 2.1667, - "step": 515710 - }, - { - "epoch": 0.9, - "learning_rate": 5.032314093688202e-06, - "loss": 2.2424, - "step": 515720 - }, - { - "epoch": 0.9, - "learning_rate": 5.031442153761375e-06, - "loss": 2.2309, - "step": 515730 - }, - { - "epoch": 0.9, - "learning_rate": 5.030570213834548e-06, - "loss": 2.2756, - "step": 515740 - }, - { - "epoch": 0.9, - "learning_rate": 5.029698273907721e-06, - "loss": 2.3845, - "step": 515750 - }, - { - "epoch": 0.9, - "learning_rate": 5.028826333980894e-06, - "loss": 2.3226, - "step": 515760 - }, - { - "epoch": 0.9, - "learning_rate": 5.027954394054067e-06, - "loss": 2.2358, - "step": 515770 - }, - { - "epoch": 0.9, - "learning_rate": 5.027082454127241e-06, - "loss": 2.2563, - "step": 515780 - }, - { - "epoch": 0.9, - "learning_rate": 5.026210514200414e-06, - "loss": 2.3253, - "step": 515790 - }, - { - "epoch": 0.9, - "learning_rate": 5.025338574273587e-06, - "loss": 2.2957, - "step": 515800 - }, - { - "epoch": 0.9, - "learning_rate": 5.024466634346761e-06, - "loss": 2.4156, - "step": 515810 - }, - { - "epoch": 0.9, - "learning_rate": 5.023594694419934e-06, - "loss": 2.2477, - "step": 515820 - }, - { - "epoch": 0.9, - "learning_rate": 5.0227227544931065e-06, - "loss": 2.4053, - "step": 515830 - }, - { - "epoch": 0.9, - "learning_rate": 5.0218508145662795e-06, - "loss": 2.2033, - "step": 515840 - }, - { - "epoch": 0.9, - "learning_rate": 5.020978874639453e-06, - "loss": 2.1988, - "step": 515850 - }, - { - "epoch": 0.9, - "learning_rate": 5.020106934712626e-06, - "loss": 2.2329, - "step": 515860 - }, - { - "epoch": 0.9, - "learning_rate": 5.019234994785799e-06, - "loss": 2.2905, - "step": 515870 - }, - { - "epoch": 0.9, - "learning_rate": 5.018363054858973e-06, - "loss": 2.2456, - "step": 515880 - }, - { - "epoch": 0.9, - "learning_rate": 5.017491114932146e-06, - "loss": 2.1733, - "step": 515890 - }, - { - "epoch": 0.9, - "learning_rate": 5.016619175005319e-06, - "loss": 2.1341, - "step": 515900 - }, - { - "epoch": 0.9, - "learning_rate": 5.0157472350784925e-06, - "loss": 2.2859, - "step": 515910 - }, - { - "epoch": 0.9, - "learning_rate": 5.014875295151665e-06, - "loss": 2.2788, - "step": 515920 - }, - { - "epoch": 0.9, - "learning_rate": 5.014003355224839e-06, - "loss": 2.1581, - "step": 515930 - }, - { - "epoch": 0.9, - "learning_rate": 5.013131415298012e-06, - "loss": 2.274, - "step": 515940 - }, - { - "epoch": 0.9, - "learning_rate": 5.012259475371185e-06, - "loss": 2.3442, - "step": 515950 - }, - { - "epoch": 0.9, - "learning_rate": 5.011387535444358e-06, - "loss": 2.2392, - "step": 515960 - }, - { - "epoch": 0.9, - "learning_rate": 5.010515595517532e-06, - "loss": 2.1771, - "step": 515970 - }, - { - "epoch": 0.9, - "learning_rate": 5.009643655590705e-06, - "loss": 2.2765, - "step": 515980 - }, - { - "epoch": 0.9, - "learning_rate": 5.0087717156638775e-06, - "loss": 2.3045, - "step": 515990 - }, - { - "epoch": 0.9, - "learning_rate": 5.007899775737051e-06, - "loss": 2.3904, - "step": 516000 - }, - { - "epoch": 0.9, - "learning_rate": 5.007027835810224e-06, - "loss": 2.3085, - "step": 516010 - }, - { - "epoch": 0.9, - "learning_rate": 5.006155895883397e-06, - "loss": 2.2574, - "step": 516020 - }, - { - "epoch": 0.9, - "learning_rate": 5.00528395595657e-06, - "loss": 2.2557, - "step": 516030 - }, - { - "epoch": 0.9, - "learning_rate": 5.004412016029744e-06, - "loss": 2.2655, - "step": 516040 - }, - { - "epoch": 0.9, - "learning_rate": 5.003540076102918e-06, - "loss": 2.2381, - "step": 516050 - }, - { - "epoch": 0.9, - "learning_rate": 5.0026681361760905e-06, - "loss": 2.2262, - "step": 516060 - }, - { - "epoch": 0.9, - "learning_rate": 5.0017961962492635e-06, - "loss": 2.1584, - "step": 516070 - }, - { - "epoch": 0.9, - "learning_rate": 5.000924256322436e-06, - "loss": 2.2374, - "step": 516080 - }, - { - "epoch": 0.9, - "learning_rate": 5.00005231639561e-06, - "loss": 2.2973, - "step": 516090 - }, - { - "epoch": 0.9, - "learning_rate": 4.999180376468783e-06, - "loss": 2.3639, - "step": 516100 - }, - { - "epoch": 0.9, - "learning_rate": 4.998308436541956e-06, - "loss": 2.1865, - "step": 516110 - }, - { - "epoch": 0.9, - "learning_rate": 4.99743649661513e-06, - "loss": 2.2764, - "step": 516120 - }, - { - "epoch": 0.9, - "learning_rate": 4.996564556688303e-06, - "loss": 2.2123, - "step": 516130 - }, - { - "epoch": 0.9, - "learning_rate": 4.995692616761476e-06, - "loss": 2.2367, - "step": 516140 - }, - { - "epoch": 0.9, - "learning_rate": 4.9948206768346485e-06, - "loss": 2.3461, - "step": 516150 - }, - { - "epoch": 0.9, - "learning_rate": 4.993948736907822e-06, - "loss": 2.3886, - "step": 516160 - }, - { - "epoch": 0.9, - "learning_rate": 4.993076796980995e-06, - "loss": 2.136, - "step": 516170 - }, - { - "epoch": 0.9, - "learning_rate": 4.992204857054169e-06, - "loss": 2.3385, - "step": 516180 - }, - { - "epoch": 0.9, - "learning_rate": 4.991332917127342e-06, - "loss": 2.249, - "step": 516190 - }, - { - "epoch": 0.9, - "learning_rate": 4.990460977200515e-06, - "loss": 2.3329, - "step": 516200 - }, - { - "epoch": 0.9, - "learning_rate": 4.989589037273689e-06, - "loss": 2.3299, - "step": 516210 - }, - { - "epoch": 0.9, - "learning_rate": 4.9887170973468615e-06, - "loss": 2.2525, - "step": 516220 - }, - { - "epoch": 0.9, - "learning_rate": 4.9878451574200345e-06, - "loss": 2.2441, - "step": 516230 - }, - { - "epoch": 0.9, - "learning_rate": 4.986973217493208e-06, - "loss": 2.1992, - "step": 516240 - }, - { - "epoch": 0.9, - "learning_rate": 4.986101277566381e-06, - "loss": 2.2443, - "step": 516250 - }, - { - "epoch": 0.9, - "learning_rate": 4.985229337639554e-06, - "loss": 2.245, - "step": 516260 - }, - { - "epoch": 0.9, - "learning_rate": 4.984357397712727e-06, - "loss": 2.2566, - "step": 516270 - }, - { - "epoch": 0.9, - "learning_rate": 4.983485457785901e-06, - "loss": 2.2225, - "step": 516280 - }, - { - "epoch": 0.9, - "learning_rate": 4.982613517859074e-06, - "loss": 2.298, - "step": 516290 - }, - { - "epoch": 0.9, - "learning_rate": 4.981741577932247e-06, - "loss": 2.1575, - "step": 516300 - }, - { - "epoch": 0.9, - "learning_rate": 4.98086963800542e-06, - "loss": 2.2745, - "step": 516310 - }, - { - "epoch": 0.9, - "learning_rate": 4.979997698078593e-06, - "loss": 2.2714, - "step": 516320 - }, - { - "epoch": 0.9, - "learning_rate": 4.979125758151767e-06, - "loss": 2.3187, - "step": 516330 - }, - { - "epoch": 0.9, - "learning_rate": 4.97825381822494e-06, - "loss": 2.1677, - "step": 516340 - }, - { - "epoch": 0.9, - "learning_rate": 4.977381878298113e-06, - "loss": 2.3026, - "step": 516350 - }, - { - "epoch": 0.9, - "learning_rate": 4.976509938371286e-06, - "loss": 2.1221, - "step": 516360 - }, - { - "epoch": 0.9, - "learning_rate": 4.97563799844446e-06, - "loss": 2.1953, - "step": 516370 - }, - { - "epoch": 0.9, - "learning_rate": 4.9747660585176325e-06, - "loss": 2.167, - "step": 516380 - }, - { - "epoch": 0.9, - "learning_rate": 4.9738941185908055e-06, - "loss": 2.3566, - "step": 516390 - }, - { - "epoch": 0.9, - "learning_rate": 4.973022178663979e-06, - "loss": 2.2889, - "step": 516400 - }, - { - "epoch": 0.9, - "learning_rate": 4.972150238737152e-06, - "loss": 2.3423, - "step": 516410 - }, - { - "epoch": 0.9, - "learning_rate": 4.971278298810325e-06, - "loss": 2.1115, - "step": 516420 - }, - { - "epoch": 0.9, - "learning_rate": 4.970406358883498e-06, - "loss": 2.2903, - "step": 516430 - }, - { - "epoch": 0.9, - "learning_rate": 4.969534418956672e-06, - "loss": 2.3075, - "step": 516440 - }, - { - "epoch": 0.9, - "learning_rate": 4.9686624790298455e-06, - "loss": 2.1575, - "step": 516450 - }, - { - "epoch": 0.9, - "learning_rate": 4.9677905391030185e-06, - "loss": 2.2927, - "step": 516460 - }, - { - "epoch": 0.9, - "learning_rate": 4.966918599176191e-06, - "loss": 2.2265, - "step": 516470 - }, - { - "epoch": 0.9, - "learning_rate": 4.966046659249364e-06, - "loss": 2.2283, - "step": 516480 - }, - { - "epoch": 0.9, - "learning_rate": 4.965174719322538e-06, - "loss": 2.2185, - "step": 516490 - }, - { - "epoch": 0.9, - "learning_rate": 4.964302779395711e-06, - "loss": 2.1322, - "step": 516500 - }, - { - "epoch": 0.9, - "learning_rate": 4.963430839468884e-06, - "loss": 2.2759, - "step": 516510 - }, - { - "epoch": 0.9, - "learning_rate": 4.962558899542058e-06, - "loss": 2.2681, - "step": 516520 - }, - { - "epoch": 0.9, - "learning_rate": 4.961686959615231e-06, - "loss": 2.346, - "step": 516530 - }, - { - "epoch": 0.9, - "learning_rate": 4.9608150196884035e-06, - "loss": 2.2638, - "step": 516540 - }, - { - "epoch": 0.9, - "learning_rate": 4.9599430797615765e-06, - "loss": 2.2963, - "step": 516550 - }, - { - "epoch": 0.9, - "learning_rate": 4.95907113983475e-06, - "loss": 2.2735, - "step": 516560 - }, - { - "epoch": 0.9, - "learning_rate": 4.958199199907924e-06, - "loss": 2.1827, - "step": 516570 - }, - { - "epoch": 0.9, - "learning_rate": 4.957327259981097e-06, - "loss": 2.3428, - "step": 516580 - }, - { - "epoch": 0.9, - "learning_rate": 4.95645532005427e-06, - "loss": 2.295, - "step": 516590 - }, - { - "epoch": 0.9, - "learning_rate": 4.955583380127443e-06, - "loss": 2.165, - "step": 516600 - }, - { - "epoch": 0.9, - "learning_rate": 4.9547114402006165e-06, - "loss": 2.2697, - "step": 516610 - }, - { - "epoch": 0.9, - "learning_rate": 4.9538395002737895e-06, - "loss": 2.2651, - "step": 516620 - }, - { - "epoch": 0.9, - "learning_rate": 4.952967560346962e-06, - "loss": 2.2574, - "step": 516630 - }, - { - "epoch": 0.9, - "learning_rate": 4.952095620420136e-06, - "loss": 2.2722, - "step": 516640 - }, - { - "epoch": 0.9, - "learning_rate": 4.951223680493309e-06, - "loss": 2.2483, - "step": 516650 - }, - { - "epoch": 0.9, - "learning_rate": 4.950351740566482e-06, - "loss": 2.2582, - "step": 516660 - }, - { - "epoch": 0.9, - "learning_rate": 4.949479800639655e-06, - "loss": 2.2807, - "step": 516670 - }, - { - "epoch": 0.9, - "learning_rate": 4.948607860712829e-06, - "loss": 2.347, - "step": 516680 - }, - { - "epoch": 0.9, - "learning_rate": 4.947735920786002e-06, - "loss": 2.2594, - "step": 516690 - }, - { - "epoch": 0.9, - "learning_rate": 4.9468639808591745e-06, - "loss": 2.3294, - "step": 516700 - }, - { - "epoch": 0.9, - "learning_rate": 4.945992040932348e-06, - "loss": 2.2368, - "step": 516710 - }, - { - "epoch": 0.9, - "learning_rate": 4.945120101005521e-06, - "loss": 2.3005, - "step": 516720 - }, - { - "epoch": 0.9, - "learning_rate": 4.944248161078695e-06, - "loss": 2.2077, - "step": 516730 - }, - { - "epoch": 0.9, - "learning_rate": 4.943376221151868e-06, - "loss": 2.228, - "step": 516740 - }, - { - "epoch": 0.9, - "learning_rate": 4.942504281225041e-06, - "loss": 2.2913, - "step": 516750 - }, - { - "epoch": 0.9, - "learning_rate": 4.941632341298215e-06, - "loss": 2.3237, - "step": 516760 - }, - { - "epoch": 0.9, - "learning_rate": 4.9407604013713875e-06, - "loss": 2.156, - "step": 516770 - }, - { - "epoch": 0.9, - "learning_rate": 4.9398884614445605e-06, - "loss": 2.2199, - "step": 516780 - }, - { - "epoch": 0.9, - "learning_rate": 4.939016521517733e-06, - "loss": 2.3261, - "step": 516790 - }, - { - "epoch": 0.9, - "learning_rate": 4.938144581590907e-06, - "loss": 2.2322, - "step": 516800 - }, - { - "epoch": 0.9, - "learning_rate": 4.93727264166408e-06, - "loss": 2.313, - "step": 516810 - }, - { - "epoch": 0.9, - "learning_rate": 4.936400701737253e-06, - "loss": 2.2629, - "step": 516820 - }, - { - "epoch": 0.9, - "learning_rate": 4.935528761810426e-06, - "loss": 2.2396, - "step": 516830 - }, - { - "epoch": 0.9, - "learning_rate": 4.9346568218836e-06, - "loss": 2.2931, - "step": 516840 - }, - { - "epoch": 0.9, - "learning_rate": 4.9337848819567735e-06, - "loss": 2.3325, - "step": 516850 - }, - { - "epoch": 0.9, - "learning_rate": 4.932912942029946e-06, - "loss": 2.2249, - "step": 516860 - }, - { - "epoch": 0.9, - "learning_rate": 4.932041002103119e-06, - "loss": 2.2363, - "step": 516870 - }, - { - "epoch": 0.9, - "learning_rate": 4.931169062176292e-06, - "loss": 2.2975, - "step": 516880 - }, - { - "epoch": 0.9, - "learning_rate": 4.930297122249466e-06, - "loss": 2.312, - "step": 516890 - }, - { - "epoch": 0.9, - "learning_rate": 4.929425182322639e-06, - "loss": 2.1997, - "step": 516900 - }, - { - "epoch": 0.9, - "learning_rate": 4.928553242395812e-06, - "loss": 2.2384, - "step": 516910 - }, - { - "epoch": 0.9, - "learning_rate": 4.927681302468986e-06, - "loss": 2.2324, - "step": 516920 - }, - { - "epoch": 0.9, - "learning_rate": 4.9268093625421585e-06, - "loss": 2.3465, - "step": 516930 - }, - { - "epoch": 0.9, - "learning_rate": 4.9259374226153315e-06, - "loss": 2.3503, - "step": 516940 - }, - { - "epoch": 0.9, - "learning_rate": 4.925065482688504e-06, - "loss": 2.2614, - "step": 516950 - }, - { - "epoch": 0.9, - "learning_rate": 4.924193542761678e-06, - "loss": 2.1566, - "step": 516960 - }, - { - "epoch": 0.9, - "learning_rate": 4.923321602834852e-06, - "loss": 2.2764, - "step": 516970 - }, - { - "epoch": 0.9, - "learning_rate": 4.922449662908025e-06, - "loss": 2.2292, - "step": 516980 - }, - { - "epoch": 0.9, - "learning_rate": 4.921577722981198e-06, - "loss": 2.2491, - "step": 516990 - }, - { - "epoch": 0.9, - "learning_rate": 4.920705783054371e-06, - "loss": 2.021, - "step": 517000 - }, - { - "epoch": 0.9, - "learning_rate": 4.9198338431275445e-06, - "loss": 2.4153, - "step": 517010 - }, - { - "epoch": 0.9, - "learning_rate": 4.918961903200717e-06, - "loss": 2.2409, - "step": 517020 - }, - { - "epoch": 0.9, - "learning_rate": 4.91808996327389e-06, - "loss": 2.2498, - "step": 517030 - }, - { - "epoch": 0.9, - "learning_rate": 4.917218023347064e-06, - "loss": 2.2052, - "step": 517040 - }, - { - "epoch": 0.9, - "learning_rate": 4.916346083420237e-06, - "loss": 2.17, - "step": 517050 - }, - { - "epoch": 0.9, - "learning_rate": 4.91547414349341e-06, - "loss": 2.2164, - "step": 517060 - }, - { - "epoch": 0.9, - "learning_rate": 4.914602203566583e-06, - "loss": 2.2584, - "step": 517070 - }, - { - "epoch": 0.9, - "learning_rate": 4.913730263639757e-06, - "loss": 2.2216, - "step": 517080 - }, - { - "epoch": 0.9, - "learning_rate": 4.9128583237129295e-06, - "loss": 2.3262, - "step": 517090 - }, - { - "epoch": 0.9, - "learning_rate": 4.9119863837861025e-06, - "loss": 2.408, - "step": 517100 - }, - { - "epoch": 0.9, - "learning_rate": 4.911114443859276e-06, - "loss": 2.3195, - "step": 517110 - }, - { - "epoch": 0.9, - "learning_rate": 4.910242503932449e-06, - "loss": 2.2597, - "step": 517120 - }, - { - "epoch": 0.9, - "learning_rate": 4.909370564005623e-06, - "loss": 2.2937, - "step": 517130 - }, - { - "epoch": 0.9, - "learning_rate": 4.908498624078796e-06, - "loss": 2.1008, - "step": 517140 - }, - { - "epoch": 0.9, - "learning_rate": 4.907626684151969e-06, - "loss": 2.2273, - "step": 517150 - }, - { - "epoch": 0.9, - "learning_rate": 4.9067547442251425e-06, - "loss": 2.1828, - "step": 517160 - }, - { - "epoch": 0.9, - "learning_rate": 4.9058828042983155e-06, - "loss": 2.1789, - "step": 517170 - }, - { - "epoch": 0.9, - "learning_rate": 4.905010864371488e-06, - "loss": 2.2693, - "step": 517180 - }, - { - "epoch": 0.9, - "learning_rate": 4.904138924444661e-06, - "loss": 2.2206, - "step": 517190 - }, - { - "epoch": 0.9, - "learning_rate": 4.903266984517835e-06, - "loss": 2.3709, - "step": 517200 - }, - { - "epoch": 0.9, - "learning_rate": 4.902395044591008e-06, - "loss": 2.1628, - "step": 517210 - }, - { - "epoch": 0.9, - "learning_rate": 4.901523104664181e-06, - "loss": 2.3745, - "step": 517220 - }, - { - "epoch": 0.9, - "learning_rate": 4.900651164737354e-06, - "loss": 2.3108, - "step": 517230 - }, - { - "epoch": 0.9, - "learning_rate": 4.899779224810528e-06, - "loss": 2.2408, - "step": 517240 - }, - { - "epoch": 0.9, - "learning_rate": 4.898907284883701e-06, - "loss": 2.3299, - "step": 517250 - }, - { - "epoch": 0.9, - "learning_rate": 4.898035344956874e-06, - "loss": 2.3378, - "step": 517260 - }, - { - "epoch": 0.9, - "learning_rate": 4.897163405030047e-06, - "loss": 2.256, - "step": 517270 - }, - { - "epoch": 0.9, - "learning_rate": 4.896291465103221e-06, - "loss": 2.3389, - "step": 517280 - }, - { - "epoch": 0.9, - "learning_rate": 4.895419525176394e-06, - "loss": 2.3593, - "step": 517290 - }, - { - "epoch": 0.9, - "learning_rate": 4.894547585249567e-06, - "loss": 2.4192, - "step": 517300 - }, - { - "epoch": 0.9, - "learning_rate": 4.89367564532274e-06, - "loss": 2.2739, - "step": 517310 - }, - { - "epoch": 0.9, - "learning_rate": 4.8928037053959135e-06, - "loss": 2.2442, - "step": 517320 - }, - { - "epoch": 0.9, - "learning_rate": 4.8919317654690865e-06, - "loss": 2.2653, - "step": 517330 - }, - { - "epoch": 0.9, - "learning_rate": 4.891059825542259e-06, - "loss": 2.3294, - "step": 517340 - }, - { - "epoch": 0.9, - "learning_rate": 4.890187885615432e-06, - "loss": 2.4141, - "step": 517350 - }, - { - "epoch": 0.9, - "learning_rate": 4.889315945688606e-06, - "loss": 2.2614, - "step": 517360 - }, - { - "epoch": 0.9, - "learning_rate": 4.88844400576178e-06, - "loss": 2.3904, - "step": 517370 - }, - { - "epoch": 0.9, - "learning_rate": 4.887572065834953e-06, - "loss": 2.285, - "step": 517380 - }, - { - "epoch": 0.9, - "learning_rate": 4.886700125908126e-06, - "loss": 2.3902, - "step": 517390 - }, - { - "epoch": 0.9, - "learning_rate": 4.885828185981299e-06, - "loss": 2.2744, - "step": 517400 - }, - { - "epoch": 0.9, - "learning_rate": 4.884956246054472e-06, - "loss": 2.3109, - "step": 517410 - }, - { - "epoch": 0.9, - "learning_rate": 4.884084306127645e-06, - "loss": 2.3087, - "step": 517420 - }, - { - "epoch": 0.9, - "learning_rate": 4.883212366200818e-06, - "loss": 2.2958, - "step": 517430 - }, - { - "epoch": 0.9, - "learning_rate": 4.882340426273992e-06, - "loss": 2.2499, - "step": 517440 - }, - { - "epoch": 0.9, - "learning_rate": 4.881468486347165e-06, - "loss": 2.4022, - "step": 517450 - }, - { - "epoch": 0.9, - "learning_rate": 4.880596546420338e-06, - "loss": 2.2908, - "step": 517460 - }, - { - "epoch": 0.9, - "learning_rate": 4.879724606493511e-06, - "loss": 2.2606, - "step": 517470 - }, - { - "epoch": 0.9, - "learning_rate": 4.8788526665666845e-06, - "loss": 2.2385, - "step": 517480 - }, - { - "epoch": 0.9, - "learning_rate": 4.8779807266398575e-06, - "loss": 2.309, - "step": 517490 - }, - { - "epoch": 0.9, - "learning_rate": 4.87710878671303e-06, - "loss": 2.1161, - "step": 517500 - }, - { - "epoch": 0.9, - "learning_rate": 4.876236846786204e-06, - "loss": 2.2822, - "step": 517510 - }, - { - "epoch": 0.9, - "learning_rate": 4.875364906859377e-06, - "loss": 2.174, - "step": 517520 - }, - { - "epoch": 0.9, - "learning_rate": 4.874492966932551e-06, - "loss": 2.3102, - "step": 517530 - }, - { - "epoch": 0.9, - "learning_rate": 4.873621027005724e-06, - "loss": 2.2916, - "step": 517540 - }, - { - "epoch": 0.9, - "learning_rate": 4.872749087078897e-06, - "loss": 2.3445, - "step": 517550 - }, - { - "epoch": 0.9, - "learning_rate": 4.8718771471520705e-06, - "loss": 2.2016, - "step": 517560 - }, - { - "epoch": 0.9, - "learning_rate": 4.871005207225243e-06, - "loss": 2.2454, - "step": 517570 - }, - { - "epoch": 0.9, - "learning_rate": 4.870133267298416e-06, - "loss": 2.2614, - "step": 517580 - }, - { - "epoch": 0.9, - "learning_rate": 4.869261327371589e-06, - "loss": 2.3917, - "step": 517590 - }, - { - "epoch": 0.9, - "learning_rate": 4.868389387444763e-06, - "loss": 2.3839, - "step": 517600 - }, - { - "epoch": 0.9, - "learning_rate": 4.867517447517936e-06, - "loss": 2.2226, - "step": 517610 - }, - { - "epoch": 0.9, - "learning_rate": 4.866645507591109e-06, - "loss": 2.2344, - "step": 517620 - }, - { - "epoch": 0.9, - "learning_rate": 4.865773567664282e-06, - "loss": 2.1646, - "step": 517630 - }, - { - "epoch": 0.9, - "learning_rate": 4.8649016277374555e-06, - "loss": 2.3275, - "step": 517640 - }, - { - "epoch": 0.9, - "learning_rate": 4.864029687810629e-06, - "loss": 2.3507, - "step": 517650 - }, - { - "epoch": 0.9, - "learning_rate": 4.863157747883802e-06, - "loss": 2.293, - "step": 517660 - }, - { - "epoch": 0.9, - "learning_rate": 4.862285807956975e-06, - "loss": 2.298, - "step": 517670 - }, - { - "epoch": 0.9, - "learning_rate": 4.861413868030149e-06, - "loss": 2.252, - "step": 517680 - }, - { - "epoch": 0.9, - "learning_rate": 4.860541928103322e-06, - "loss": 2.1324, - "step": 517690 - }, - { - "epoch": 0.9, - "learning_rate": 4.859669988176495e-06, - "loss": 2.0959, - "step": 517700 - }, - { - "epoch": 0.9, - "learning_rate": 4.858798048249668e-06, - "loss": 2.2444, - "step": 517710 - }, - { - "epoch": 0.9, - "learning_rate": 4.8579261083228415e-06, - "loss": 2.3031, - "step": 517720 - }, - { - "epoch": 0.9, - "learning_rate": 4.857054168396014e-06, - "loss": 2.3105, - "step": 517730 - }, - { - "epoch": 0.9, - "learning_rate": 4.856182228469187e-06, - "loss": 2.2465, - "step": 517740 - }, - { - "epoch": 0.9, - "learning_rate": 4.85531028854236e-06, - "loss": 2.3536, - "step": 517750 - }, - { - "epoch": 0.9, - "learning_rate": 4.854438348615534e-06, - "loss": 2.2137, - "step": 517760 - }, - { - "epoch": 0.9, - "learning_rate": 4.853566408688708e-06, - "loss": 2.2788, - "step": 517770 - }, - { - "epoch": 0.9, - "learning_rate": 4.852694468761881e-06, - "loss": 2.2455, - "step": 517780 - }, - { - "epoch": 0.9, - "learning_rate": 4.851822528835054e-06, - "loss": 2.3437, - "step": 517790 - }, - { - "epoch": 0.9, - "learning_rate": 4.850950588908227e-06, - "loss": 2.2497, - "step": 517800 - }, - { - "epoch": 0.9, - "learning_rate": 4.8500786489814e-06, - "loss": 2.2132, - "step": 517810 - }, - { - "epoch": 0.9, - "learning_rate": 4.849206709054573e-06, - "loss": 2.1862, - "step": 517820 - }, - { - "epoch": 0.9, - "learning_rate": 4.848334769127746e-06, - "loss": 2.2844, - "step": 517830 - }, - { - "epoch": 0.9, - "learning_rate": 4.84746282920092e-06, - "loss": 2.2077, - "step": 517840 - }, - { - "epoch": 0.9, - "learning_rate": 4.846590889274093e-06, - "loss": 2.1901, - "step": 517850 - }, - { - "epoch": 0.9, - "learning_rate": 4.845718949347266e-06, - "loss": 2.2205, - "step": 517860 - }, - { - "epoch": 0.9, - "learning_rate": 4.844847009420439e-06, - "loss": 2.2424, - "step": 517870 - }, - { - "epoch": 0.9, - "learning_rate": 4.8439750694936125e-06, - "loss": 2.2203, - "step": 517880 - }, - { - "epoch": 0.9, - "learning_rate": 4.843103129566785e-06, - "loss": 2.3677, - "step": 517890 - }, - { - "epoch": 0.9, - "learning_rate": 4.842231189639959e-06, - "loss": 2.2976, - "step": 517900 - }, - { - "epoch": 0.9, - "learning_rate": 4.841359249713132e-06, - "loss": 2.243, - "step": 517910 - }, - { - "epoch": 0.9, - "learning_rate": 4.840487309786305e-06, - "loss": 2.2548, - "step": 517920 - }, - { - "epoch": 0.9, - "learning_rate": 4.839615369859479e-06, - "loss": 2.1795, - "step": 517930 - }, - { - "epoch": 0.9, - "learning_rate": 4.838743429932652e-06, - "loss": 2.3143, - "step": 517940 - }, - { - "epoch": 0.9, - "learning_rate": 4.837871490005825e-06, - "loss": 2.2133, - "step": 517950 - }, - { - "epoch": 0.9, - "learning_rate": 4.836999550078998e-06, - "loss": 2.3473, - "step": 517960 - }, - { - "epoch": 0.9, - "learning_rate": 4.836127610152171e-06, - "loss": 2.3385, - "step": 517970 - }, - { - "epoch": 0.9, - "learning_rate": 4.835255670225344e-06, - "loss": 2.1654, - "step": 517980 - }, - { - "epoch": 0.9, - "learning_rate": 4.834383730298517e-06, - "loss": 2.2415, - "step": 517990 - }, - { - "epoch": 0.9, - "learning_rate": 4.833511790371691e-06, - "loss": 2.2849, - "step": 518000 - }, - { - "epoch": 0.9, - "learning_rate": 4.832639850444864e-06, - "loss": 2.2003, - "step": 518010 - }, - { - "epoch": 0.9, - "learning_rate": 4.831767910518037e-06, - "loss": 2.3576, - "step": 518020 - }, - { - "epoch": 0.9, - "learning_rate": 4.83089597059121e-06, - "loss": 2.2044, - "step": 518030 - }, - { - "epoch": 0.9, - "learning_rate": 4.8300240306643835e-06, - "loss": 2.1732, - "step": 518040 - }, - { - "epoch": 0.9, - "learning_rate": 4.829152090737557e-06, - "loss": 2.3106, - "step": 518050 - }, - { - "epoch": 0.9, - "learning_rate": 4.82828015081073e-06, - "loss": 2.2601, - "step": 518060 - }, - { - "epoch": 0.9, - "learning_rate": 4.827408210883903e-06, - "loss": 2.2045, - "step": 518070 - }, - { - "epoch": 0.9, - "learning_rate": 4.826536270957077e-06, - "loss": 2.2676, - "step": 518080 - }, - { - "epoch": 0.9, - "learning_rate": 4.82566433103025e-06, - "loss": 2.3086, - "step": 518090 - }, - { - "epoch": 0.9, - "learning_rate": 4.824792391103423e-06, - "loss": 2.3402, - "step": 518100 - }, - { - "epoch": 0.9, - "learning_rate": 4.823920451176596e-06, - "loss": 2.1356, - "step": 518110 - }, - { - "epoch": 0.9, - "learning_rate": 4.823048511249769e-06, - "loss": 2.1805, - "step": 518120 - }, - { - "epoch": 0.9, - "learning_rate": 4.822176571322942e-06, - "loss": 2.2203, - "step": 518130 - }, - { - "epoch": 0.9, - "learning_rate": 4.821304631396115e-06, - "loss": 2.2753, - "step": 518140 - }, - { - "epoch": 0.9, - "learning_rate": 4.820432691469288e-06, - "loss": 2.2778, - "step": 518150 - }, - { - "epoch": 0.9, - "learning_rate": 4.819560751542462e-06, - "loss": 2.2145, - "step": 518160 - }, - { - "epoch": 0.9, - "learning_rate": 4.818688811615636e-06, - "loss": 2.2337, - "step": 518170 - }, - { - "epoch": 0.9, - "learning_rate": 4.817816871688809e-06, - "loss": 2.225, - "step": 518180 - }, - { - "epoch": 0.9, - "learning_rate": 4.8169449317619816e-06, - "loss": 2.3067, - "step": 518190 - }, - { - "epoch": 0.9, - "learning_rate": 4.816072991835155e-06, - "loss": 2.319, - "step": 518200 - }, - { - "epoch": 0.9, - "learning_rate": 4.815201051908328e-06, - "loss": 2.294, - "step": 518210 - }, - { - "epoch": 0.9, - "learning_rate": 4.814329111981501e-06, - "loss": 2.3031, - "step": 518220 - }, - { - "epoch": 0.9, - "learning_rate": 4.813457172054674e-06, - "loss": 2.332, - "step": 518230 - }, - { - "epoch": 0.9, - "learning_rate": 4.812585232127848e-06, - "loss": 2.2063, - "step": 518240 - }, - { - "epoch": 0.9, - "learning_rate": 4.811713292201021e-06, - "loss": 2.3409, - "step": 518250 - }, - { - "epoch": 0.9, - "learning_rate": 4.810841352274194e-06, - "loss": 2.319, - "step": 518260 - }, - { - "epoch": 0.9, - "learning_rate": 4.809969412347367e-06, - "loss": 2.3883, - "step": 518270 - }, - { - "epoch": 0.9, - "learning_rate": 4.80909747242054e-06, - "loss": 2.2975, - "step": 518280 - }, - { - "epoch": 0.9, - "learning_rate": 4.808225532493713e-06, - "loss": 2.3095, - "step": 518290 - }, - { - "epoch": 0.9, - "learning_rate": 4.807353592566887e-06, - "loss": 2.3051, - "step": 518300 - }, - { - "epoch": 0.9, - "learning_rate": 4.80648165264006e-06, - "loss": 2.249, - "step": 518310 - }, - { - "epoch": 0.9, - "learning_rate": 4.805609712713234e-06, - "loss": 2.2534, - "step": 518320 - }, - { - "epoch": 0.9, - "learning_rate": 4.804737772786407e-06, - "loss": 2.2529, - "step": 518330 - }, - { - "epoch": 0.9, - "learning_rate": 4.80386583285958e-06, - "loss": 2.2693, - "step": 518340 - }, - { - "epoch": 0.9, - "learning_rate": 4.8029938929327526e-06, - "loss": 2.3338, - "step": 518350 - }, - { - "epoch": 0.9, - "learning_rate": 4.802121953005926e-06, - "loss": 2.258, - "step": 518360 - }, - { - "epoch": 0.9, - "learning_rate": 4.801250013079099e-06, - "loss": 2.1887, - "step": 518370 - }, - { - "epoch": 0.9, - "learning_rate": 4.800378073152272e-06, - "loss": 2.1109, - "step": 518380 - }, - { - "epoch": 0.9, - "learning_rate": 4.799506133225445e-06, - "loss": 2.2301, - "step": 518390 - }, - { - "epoch": 0.9, - "learning_rate": 4.798634193298619e-06, - "loss": 2.2808, - "step": 518400 - }, - { - "epoch": 0.9, - "learning_rate": 4.797762253371792e-06, - "loss": 2.2619, - "step": 518410 - }, - { - "epoch": 0.9, - "learning_rate": 4.796890313444965e-06, - "loss": 2.3314, - "step": 518420 - }, - { - "epoch": 0.9, - "learning_rate": 4.796018373518138e-06, - "loss": 2.2917, - "step": 518430 - }, - { - "epoch": 0.9, - "learning_rate": 4.795146433591312e-06, - "loss": 2.1935, - "step": 518440 - }, - { - "epoch": 0.9, - "learning_rate": 4.794274493664485e-06, - "loss": 2.2761, - "step": 518450 - }, - { - "epoch": 0.9, - "learning_rate": 4.793402553737658e-06, - "loss": 2.1917, - "step": 518460 - }, - { - "epoch": 0.9, - "learning_rate": 4.792530613810831e-06, - "loss": 2.2842, - "step": 518470 - }, - { - "epoch": 0.9, - "learning_rate": 4.791658673884005e-06, - "loss": 2.324, - "step": 518480 - }, - { - "epoch": 0.9, - "learning_rate": 4.790786733957178e-06, - "loss": 2.2002, - "step": 518490 - }, - { - "epoch": 0.9, - "learning_rate": 4.789914794030351e-06, - "loss": 2.1899, - "step": 518500 - }, - { - "epoch": 0.9, - "learning_rate": 4.7890428541035236e-06, - "loss": 2.2465, - "step": 518510 - }, - { - "epoch": 0.9, - "learning_rate": 4.788170914176697e-06, - "loss": 2.3321, - "step": 518520 - }, - { - "epoch": 0.9, - "learning_rate": 4.78729897424987e-06, - "loss": 2.205, - "step": 518530 - }, - { - "epoch": 0.9, - "learning_rate": 4.786427034323043e-06, - "loss": 2.1979, - "step": 518540 - }, - { - "epoch": 0.9, - "learning_rate": 4.785555094396216e-06, - "loss": 2.2515, - "step": 518550 - }, - { - "epoch": 0.9, - "learning_rate": 4.78468315446939e-06, - "loss": 2.2574, - "step": 518560 - }, - { - "epoch": 0.9, - "learning_rate": 4.783811214542564e-06, - "loss": 2.1699, - "step": 518570 - }, - { - "epoch": 0.9, - "learning_rate": 4.7829392746157366e-06, - "loss": 2.2546, - "step": 518580 - }, - { - "epoch": 0.9, - "learning_rate": 4.7820673346889095e-06, - "loss": 2.2855, - "step": 518590 - }, - { - "epoch": 0.9, - "learning_rate": 4.781195394762083e-06, - "loss": 2.2718, - "step": 518600 - }, - { - "epoch": 0.9, - "learning_rate": 4.780323454835256e-06, - "loss": 2.1966, - "step": 518610 - }, - { - "epoch": 0.9, - "learning_rate": 4.779451514908429e-06, - "loss": 2.3435, - "step": 518620 - }, - { - "epoch": 0.9, - "learning_rate": 4.778579574981602e-06, - "loss": 2.3211, - "step": 518630 - }, - { - "epoch": 0.9, - "learning_rate": 4.777707635054776e-06, - "loss": 2.1434, - "step": 518640 - }, - { - "epoch": 0.9, - "learning_rate": 4.776835695127949e-06, - "loss": 2.1636, - "step": 518650 - }, - { - "epoch": 0.9, - "learning_rate": 4.775963755201122e-06, - "loss": 2.2717, - "step": 518660 - }, - { - "epoch": 0.9, - "learning_rate": 4.7750918152742946e-06, - "loss": 2.2347, - "step": 518670 - }, - { - "epoch": 0.9, - "learning_rate": 4.774219875347468e-06, - "loss": 2.203, - "step": 518680 - }, - { - "epoch": 0.9, - "learning_rate": 4.773347935420641e-06, - "loss": 2.2639, - "step": 518690 - }, - { - "epoch": 0.9, - "learning_rate": 4.772475995493815e-06, - "loss": 2.3326, - "step": 518700 - }, - { - "epoch": 0.9, - "learning_rate": 4.771604055566988e-06, - "loss": 2.2055, - "step": 518710 - }, - { - "epoch": 0.9, - "learning_rate": 4.770732115640162e-06, - "loss": 2.2069, - "step": 518720 - }, - { - "epoch": 0.9, - "learning_rate": 4.769860175713335e-06, - "loss": 2.2563, - "step": 518730 - }, - { - "epoch": 0.9, - "learning_rate": 4.7689882357865076e-06, - "loss": 2.293, - "step": 518740 - }, - { - "epoch": 0.9, - "learning_rate": 4.7681162958596805e-06, - "loss": 2.1521, - "step": 518750 - }, - { - "epoch": 0.9, - "learning_rate": 4.767244355932854e-06, - "loss": 2.3362, - "step": 518760 - }, - { - "epoch": 0.9, - "learning_rate": 4.766372416006027e-06, - "loss": 2.2801, - "step": 518770 - }, - { - "epoch": 0.9, - "learning_rate": 4.7655004760792e-06, - "loss": 2.306, - "step": 518780 - }, - { - "epoch": 0.9, - "learning_rate": 4.764628536152373e-06, - "loss": 2.3007, - "step": 518790 - }, - { - "epoch": 0.9, - "learning_rate": 4.763756596225547e-06, - "loss": 2.2216, - "step": 518800 - }, - { - "epoch": 0.9, - "learning_rate": 4.76288465629872e-06, - "loss": 2.3038, - "step": 518810 - }, - { - "epoch": 0.9, - "learning_rate": 4.762012716371893e-06, - "loss": 2.1701, - "step": 518820 - }, - { - "epoch": 0.9, - "learning_rate": 4.7611407764450656e-06, - "loss": 2.3011, - "step": 518830 - }, - { - "epoch": 0.9, - "learning_rate": 4.76026883651824e-06, - "loss": 2.325, - "step": 518840 - }, - { - "epoch": 0.9, - "learning_rate": 4.759396896591413e-06, - "loss": 2.367, - "step": 518850 - }, - { - "epoch": 0.9, - "learning_rate": 4.758524956664586e-06, - "loss": 2.2332, - "step": 518860 - }, - { - "epoch": 0.9, - "learning_rate": 4.757653016737759e-06, - "loss": 2.1726, - "step": 518870 - }, - { - "epoch": 0.9, - "learning_rate": 4.756781076810933e-06, - "loss": 2.2593, - "step": 518880 - }, - { - "epoch": 0.9, - "learning_rate": 4.755909136884106e-06, - "loss": 2.206, - "step": 518890 - }, - { - "epoch": 0.9, - "learning_rate": 4.7550371969572786e-06, - "loss": 2.1553, - "step": 518900 - }, - { - "epoch": 0.9, - "learning_rate": 4.7541652570304515e-06, - "loss": 2.3242, - "step": 518910 - }, - { - "epoch": 0.9, - "learning_rate": 4.753293317103625e-06, - "loss": 2.1702, - "step": 518920 - }, - { - "epoch": 0.9, - "learning_rate": 4.752421377176798e-06, - "loss": 2.2147, - "step": 518930 - }, - { - "epoch": 0.9, - "learning_rate": 4.751549437249971e-06, - "loss": 2.1708, - "step": 518940 - }, - { - "epoch": 0.9, - "learning_rate": 4.750677497323144e-06, - "loss": 2.2867, - "step": 518950 - }, - { - "epoch": 0.91, - "learning_rate": 4.749805557396318e-06, - "loss": 2.2438, - "step": 518960 - }, - { - "epoch": 0.91, - "learning_rate": 4.7489336174694916e-06, - "loss": 2.1737, - "step": 518970 - }, - { - "epoch": 0.91, - "learning_rate": 4.7480616775426645e-06, - "loss": 2.2318, - "step": 518980 - }, - { - "epoch": 0.91, - "learning_rate": 4.747189737615837e-06, - "loss": 2.3003, - "step": 518990 - }, - { - "epoch": 0.91, - "learning_rate": 4.746317797689011e-06, - "loss": 2.178, - "step": 519000 - }, - { - "epoch": 0.91, - "learning_rate": 4.745445857762184e-06, - "loss": 2.2521, - "step": 519010 - }, - { - "epoch": 0.91, - "learning_rate": 4.744573917835357e-06, - "loss": 2.2311, - "step": 519020 - }, - { - "epoch": 0.91, - "learning_rate": 4.74370197790853e-06, - "loss": 2.3246, - "step": 519030 - }, - { - "epoch": 0.91, - "learning_rate": 4.742830037981704e-06, - "loss": 2.2157, - "step": 519040 - }, - { - "epoch": 0.91, - "learning_rate": 4.741958098054877e-06, - "loss": 2.295, - "step": 519050 - }, - { - "epoch": 0.91, - "learning_rate": 4.7410861581280496e-06, - "loss": 2.2274, - "step": 519060 - }, - { - "epoch": 0.91, - "learning_rate": 4.7402142182012225e-06, - "loss": 2.2393, - "step": 519070 - }, - { - "epoch": 0.91, - "learning_rate": 4.739342278274396e-06, - "loss": 2.1999, - "step": 519080 - }, - { - "epoch": 0.91, - "learning_rate": 4.738470338347569e-06, - "loss": 2.2952, - "step": 519090 - }, - { - "epoch": 0.91, - "learning_rate": 4.737598398420743e-06, - "loss": 2.2439, - "step": 519100 - }, - { - "epoch": 0.91, - "learning_rate": 4.736726458493916e-06, - "loss": 2.3159, - "step": 519110 - }, - { - "epoch": 0.91, - "learning_rate": 4.73585451856709e-06, - "loss": 2.2118, - "step": 519120 - }, - { - "epoch": 0.91, - "learning_rate": 4.7349825786402626e-06, - "loss": 2.2365, - "step": 519130 - }, - { - "epoch": 0.91, - "learning_rate": 4.7341106387134355e-06, - "loss": 2.306, - "step": 519140 - }, - { - "epoch": 0.91, - "learning_rate": 4.733238698786608e-06, - "loss": 2.3649, - "step": 519150 - }, - { - "epoch": 0.91, - "learning_rate": 4.732366758859782e-06, - "loss": 2.2981, - "step": 519160 - }, - { - "epoch": 0.91, - "learning_rate": 4.731494818932955e-06, - "loss": 2.1671, - "step": 519170 - }, - { - "epoch": 0.91, - "learning_rate": 4.730622879006128e-06, - "loss": 2.2176, - "step": 519180 - }, - { - "epoch": 0.91, - "learning_rate": 4.729750939079301e-06, - "loss": 2.1458, - "step": 519190 - }, - { - "epoch": 0.91, - "learning_rate": 4.728878999152475e-06, - "loss": 2.2731, - "step": 519200 - }, - { - "epoch": 0.91, - "learning_rate": 4.728007059225648e-06, - "loss": 2.1592, - "step": 519210 - }, - { - "epoch": 0.91, - "learning_rate": 4.7271351192988206e-06, - "loss": 2.2031, - "step": 519220 - }, - { - "epoch": 0.91, - "learning_rate": 4.726263179371994e-06, - "loss": 2.391, - "step": 519230 - }, - { - "epoch": 0.91, - "learning_rate": 4.725391239445168e-06, - "loss": 2.2574, - "step": 519240 - }, - { - "epoch": 0.91, - "learning_rate": 4.724519299518341e-06, - "loss": 2.2277, - "step": 519250 - }, - { - "epoch": 0.91, - "learning_rate": 4.723647359591514e-06, - "loss": 2.2207, - "step": 519260 - }, - { - "epoch": 0.91, - "learning_rate": 4.722775419664687e-06, - "loss": 2.2143, - "step": 519270 - }, - { - "epoch": 0.91, - "learning_rate": 4.721903479737861e-06, - "loss": 2.2796, - "step": 519280 - }, - { - "epoch": 0.91, - "learning_rate": 4.7210315398110336e-06, - "loss": 2.2805, - "step": 519290 - }, - { - "epoch": 0.91, - "learning_rate": 4.7201595998842065e-06, - "loss": 2.347, - "step": 519300 - }, - { - "epoch": 0.91, - "learning_rate": 4.719287659957379e-06, - "loss": 2.2684, - "step": 519310 - }, - { - "epoch": 0.91, - "learning_rate": 4.718415720030553e-06, - "loss": 2.2481, - "step": 519320 - }, - { - "epoch": 0.91, - "learning_rate": 4.717543780103726e-06, - "loss": 2.2519, - "step": 519330 - }, - { - "epoch": 0.91, - "learning_rate": 4.716671840176899e-06, - "loss": 2.2758, - "step": 519340 - }, - { - "epoch": 0.91, - "learning_rate": 4.715799900250072e-06, - "loss": 2.3208, - "step": 519350 - }, - { - "epoch": 0.91, - "learning_rate": 4.714927960323246e-06, - "loss": 2.1506, - "step": 519360 - }, - { - "epoch": 0.91, - "learning_rate": 4.7140560203964195e-06, - "loss": 2.198, - "step": 519370 - }, - { - "epoch": 0.91, - "learning_rate": 4.713184080469592e-06, - "loss": 2.222, - "step": 519380 - }, - { - "epoch": 0.91, - "learning_rate": 4.712312140542765e-06, - "loss": 2.2739, - "step": 519390 - }, - { - "epoch": 0.91, - "learning_rate": 4.711440200615939e-06, - "loss": 2.3377, - "step": 519400 - }, - { - "epoch": 0.91, - "learning_rate": 4.710568260689112e-06, - "loss": 2.3312, - "step": 519410 - }, - { - "epoch": 0.91, - "learning_rate": 4.709696320762285e-06, - "loss": 2.1592, - "step": 519420 - }, - { - "epoch": 0.91, - "learning_rate": 4.708824380835458e-06, - "loss": 2.2814, - "step": 519430 - }, - { - "epoch": 0.91, - "learning_rate": 4.707952440908632e-06, - "loss": 2.268, - "step": 519440 - }, - { - "epoch": 0.91, - "learning_rate": 4.7070805009818046e-06, - "loss": 2.2954, - "step": 519450 - }, - { - "epoch": 0.91, - "learning_rate": 4.7062085610549775e-06, - "loss": 2.2689, - "step": 519460 - }, - { - "epoch": 0.91, - "learning_rate": 4.70533662112815e-06, - "loss": 2.2415, - "step": 519470 - }, - { - "epoch": 0.91, - "learning_rate": 4.704464681201324e-06, - "loss": 2.234, - "step": 519480 - }, - { - "epoch": 0.91, - "learning_rate": 4.703592741274497e-06, - "loss": 2.2008, - "step": 519490 - }, - { - "epoch": 0.91, - "learning_rate": 4.702720801347671e-06, - "loss": 2.1912, - "step": 519500 - }, - { - "epoch": 0.91, - "learning_rate": 4.701848861420844e-06, - "loss": 2.2668, - "step": 519510 - }, - { - "epoch": 0.91, - "learning_rate": 4.7009769214940176e-06, - "loss": 2.2157, - "step": 519520 - }, - { - "epoch": 0.91, - "learning_rate": 4.7001049815671905e-06, - "loss": 2.291, - "step": 519530 - }, - { - "epoch": 0.91, - "learning_rate": 4.699233041640363e-06, - "loss": 2.2927, - "step": 519540 - }, - { - "epoch": 0.91, - "learning_rate": 4.698361101713536e-06, - "loss": 2.3232, - "step": 519550 - }, - { - "epoch": 0.91, - "learning_rate": 4.69748916178671e-06, - "loss": 2.2606, - "step": 519560 - }, - { - "epoch": 0.91, - "learning_rate": 4.696617221859883e-06, - "loss": 2.3043, - "step": 519570 - }, - { - "epoch": 0.91, - "learning_rate": 4.695745281933056e-06, - "loss": 2.23, - "step": 519580 - }, - { - "epoch": 0.91, - "learning_rate": 4.694873342006229e-06, - "loss": 2.3128, - "step": 519590 - }, - { - "epoch": 0.91, - "learning_rate": 4.694001402079403e-06, - "loss": 2.1875, - "step": 519600 - }, - { - "epoch": 0.91, - "learning_rate": 4.6931294621525756e-06, - "loss": 2.2819, - "step": 519610 - }, - { - "epoch": 0.91, - "learning_rate": 4.6922575222257485e-06, - "loss": 2.1714, - "step": 519620 - }, - { - "epoch": 0.91, - "learning_rate": 4.691385582298922e-06, - "loss": 2.2599, - "step": 519630 - }, - { - "epoch": 0.91, - "learning_rate": 4.690513642372096e-06, - "loss": 2.2069, - "step": 519640 - }, - { - "epoch": 0.91, - "learning_rate": 4.689641702445269e-06, - "loss": 2.2624, - "step": 519650 - }, - { - "epoch": 0.91, - "learning_rate": 4.688769762518442e-06, - "loss": 2.2246, - "step": 519660 - }, - { - "epoch": 0.91, - "learning_rate": 4.687897822591615e-06, - "loss": 2.2216, - "step": 519670 - }, - { - "epoch": 0.91, - "learning_rate": 4.6870258826647886e-06, - "loss": 2.2127, - "step": 519680 - }, - { - "epoch": 0.91, - "learning_rate": 4.6861539427379615e-06, - "loss": 2.2759, - "step": 519690 - }, - { - "epoch": 0.91, - "learning_rate": 4.685282002811134e-06, - "loss": 2.2155, - "step": 519700 - }, - { - "epoch": 0.91, - "learning_rate": 4.684410062884307e-06, - "loss": 2.2671, - "step": 519710 - }, - { - "epoch": 0.91, - "learning_rate": 4.683538122957481e-06, - "loss": 2.2637, - "step": 519720 - }, - { - "epoch": 0.91, - "learning_rate": 4.682666183030654e-06, - "loss": 2.2963, - "step": 519730 - }, - { - "epoch": 0.91, - "learning_rate": 4.681794243103827e-06, - "loss": 2.1704, - "step": 519740 - }, - { - "epoch": 0.91, - "learning_rate": 4.680922303177e-06, - "loss": 2.2044, - "step": 519750 - }, - { - "epoch": 0.91, - "learning_rate": 4.680050363250174e-06, - "loss": 2.1472, - "step": 519760 - }, - { - "epoch": 0.91, - "learning_rate": 4.679178423323347e-06, - "loss": 2.2598, - "step": 519770 - }, - { - "epoch": 0.91, - "learning_rate": 4.67830648339652e-06, - "loss": 2.1935, - "step": 519780 - }, - { - "epoch": 0.91, - "learning_rate": 4.677434543469693e-06, - "loss": 2.2581, - "step": 519790 - }, - { - "epoch": 0.91, - "learning_rate": 4.676562603542867e-06, - "loss": 2.1783, - "step": 519800 - }, - { - "epoch": 0.91, - "learning_rate": 4.67569066361604e-06, - "loss": 2.273, - "step": 519810 - }, - { - "epoch": 0.91, - "learning_rate": 4.674818723689213e-06, - "loss": 2.3338, - "step": 519820 - }, - { - "epoch": 0.91, - "learning_rate": 4.673946783762386e-06, - "loss": 2.3115, - "step": 519830 - }, - { - "epoch": 0.91, - "learning_rate": 4.6730748438355596e-06, - "loss": 2.1326, - "step": 519840 - }, - { - "epoch": 0.91, - "learning_rate": 4.6722029039087325e-06, - "loss": 2.2006, - "step": 519850 - }, - { - "epoch": 0.91, - "learning_rate": 4.671330963981905e-06, - "loss": 2.2574, - "step": 519860 - }, - { - "epoch": 0.91, - "learning_rate": 4.670459024055078e-06, - "loss": 2.3322, - "step": 519870 - }, - { - "epoch": 0.91, - "learning_rate": 4.669587084128252e-06, - "loss": 2.245, - "step": 519880 - }, - { - "epoch": 0.91, - "learning_rate": 4.668715144201425e-06, - "loss": 2.2983, - "step": 519890 - }, - { - "epoch": 0.91, - "learning_rate": 4.667843204274599e-06, - "loss": 2.159, - "step": 519900 - }, - { - "epoch": 0.91, - "learning_rate": 4.666971264347772e-06, - "loss": 2.3708, - "step": 519910 - }, - { - "epoch": 0.91, - "learning_rate": 4.6660993244209455e-06, - "loss": 2.3166, - "step": 519920 - }, - { - "epoch": 0.91, - "learning_rate": 4.665227384494118e-06, - "loss": 2.2799, - "step": 519930 - }, - { - "epoch": 0.91, - "learning_rate": 4.664355444567291e-06, - "loss": 2.2539, - "step": 519940 - }, - { - "epoch": 0.91, - "learning_rate": 4.663483504640464e-06, - "loss": 2.3011, - "step": 519950 - }, - { - "epoch": 0.91, - "learning_rate": 4.662611564713638e-06, - "loss": 2.2846, - "step": 519960 - }, - { - "epoch": 0.91, - "learning_rate": 4.661739624786811e-06, - "loss": 2.3012, - "step": 519970 - }, - { - "epoch": 0.91, - "learning_rate": 4.660867684859984e-06, - "loss": 2.2712, - "step": 519980 - }, - { - "epoch": 0.91, - "learning_rate": 4.659995744933157e-06, - "loss": 2.3342, - "step": 519990 - }, - { - "epoch": 0.91, - "learning_rate": 4.6591238050063306e-06, - "loss": 2.1685, - "step": 520000 - }, - { - "epoch": 0.91, - "learning_rate": 4.6582518650795035e-06, - "loss": 2.3016, - "step": 520010 - }, - { - "epoch": 0.91, - "learning_rate": 4.657379925152676e-06, - "loss": 2.2537, - "step": 520020 - }, - { - "epoch": 0.91, - "learning_rate": 4.65650798522585e-06, - "loss": 2.3285, - "step": 520030 - }, - { - "epoch": 0.91, - "learning_rate": 4.655636045299024e-06, - "loss": 2.1658, - "step": 520040 - }, - { - "epoch": 0.91, - "learning_rate": 4.654764105372197e-06, - "loss": 2.35, - "step": 520050 - }, - { - "epoch": 0.91, - "learning_rate": 4.65389216544537e-06, - "loss": 2.3797, - "step": 520060 - }, - { - "epoch": 0.91, - "learning_rate": 4.653020225518543e-06, - "loss": 2.2385, - "step": 520070 - }, - { - "epoch": 0.91, - "learning_rate": 4.6521482855917165e-06, - "loss": 2.1436, - "step": 520080 - }, - { - "epoch": 0.91, - "learning_rate": 4.651276345664889e-06, - "loss": 2.3222, - "step": 520090 - }, - { - "epoch": 0.91, - "learning_rate": 4.650404405738062e-06, - "loss": 2.2467, - "step": 520100 - }, - { - "epoch": 0.91, - "learning_rate": 4.649532465811235e-06, - "loss": 2.2107, - "step": 520110 - }, - { - "epoch": 0.91, - "learning_rate": 4.648660525884409e-06, - "loss": 2.1603, - "step": 520120 - }, - { - "epoch": 0.91, - "learning_rate": 4.647788585957582e-06, - "loss": 2.1369, - "step": 520130 - }, - { - "epoch": 0.91, - "learning_rate": 4.646916646030755e-06, - "loss": 2.2594, - "step": 520140 - }, - { - "epoch": 0.91, - "learning_rate": 4.646044706103928e-06, - "loss": 2.4254, - "step": 520150 - }, - { - "epoch": 0.91, - "learning_rate": 4.6451727661771016e-06, - "loss": 2.2682, - "step": 520160 - }, - { - "epoch": 0.91, - "learning_rate": 4.644300826250275e-06, - "loss": 2.2347, - "step": 520170 - }, - { - "epoch": 0.91, - "learning_rate": 4.643428886323448e-06, - "loss": 2.2949, - "step": 520180 - }, - { - "epoch": 0.91, - "learning_rate": 4.642556946396621e-06, - "loss": 2.1521, - "step": 520190 - }, - { - "epoch": 0.91, - "learning_rate": 4.641685006469795e-06, - "loss": 2.315, - "step": 520200 - }, - { - "epoch": 0.91, - "learning_rate": 4.640813066542968e-06, - "loss": 2.2884, - "step": 520210 - }, - { - "epoch": 0.91, - "learning_rate": 4.639941126616141e-06, - "loss": 2.2692, - "step": 520220 - }, - { - "epoch": 0.91, - "learning_rate": 4.639069186689314e-06, - "loss": 2.2676, - "step": 520230 - }, - { - "epoch": 0.91, - "learning_rate": 4.6381972467624875e-06, - "loss": 2.203, - "step": 520240 - }, - { - "epoch": 0.91, - "learning_rate": 4.63732530683566e-06, - "loss": 2.2797, - "step": 520250 - }, - { - "epoch": 0.91, - "learning_rate": 4.636453366908833e-06, - "loss": 2.2721, - "step": 520260 - }, - { - "epoch": 0.91, - "learning_rate": 4.635581426982006e-06, - "loss": 2.2585, - "step": 520270 - }, - { - "epoch": 0.91, - "learning_rate": 4.63470948705518e-06, - "loss": 2.2067, - "step": 520280 - }, - { - "epoch": 0.91, - "learning_rate": 4.633837547128353e-06, - "loss": 2.3015, - "step": 520290 - }, - { - "epoch": 0.91, - "learning_rate": 4.632965607201527e-06, - "loss": 2.29, - "step": 520300 - }, - { - "epoch": 0.91, - "learning_rate": 4.6320936672747e-06, - "loss": 2.2389, - "step": 520310 - }, - { - "epoch": 0.91, - "learning_rate": 4.631221727347873e-06, - "loss": 2.1654, - "step": 520320 - }, - { - "epoch": 0.91, - "learning_rate": 4.630349787421046e-06, - "loss": 2.3011, - "step": 520330 - }, - { - "epoch": 0.91, - "learning_rate": 4.629477847494219e-06, - "loss": 2.2714, - "step": 520340 - }, - { - "epoch": 0.91, - "learning_rate": 4.628605907567392e-06, - "loss": 2.2411, - "step": 520350 - }, - { - "epoch": 0.91, - "learning_rate": 4.627733967640566e-06, - "loss": 2.3538, - "step": 520360 - }, - { - "epoch": 0.91, - "learning_rate": 4.626862027713739e-06, - "loss": 2.2988, - "step": 520370 - }, - { - "epoch": 0.91, - "learning_rate": 4.625990087786912e-06, - "loss": 2.2913, - "step": 520380 - }, - { - "epoch": 0.91, - "learning_rate": 4.625118147860085e-06, - "loss": 2.3293, - "step": 520390 - }, - { - "epoch": 0.91, - "learning_rate": 4.6242462079332585e-06, - "loss": 2.1829, - "step": 520400 - }, - { - "epoch": 0.91, - "learning_rate": 4.623374268006431e-06, - "loss": 2.3432, - "step": 520410 - }, - { - "epoch": 0.91, - "learning_rate": 4.622502328079604e-06, - "loss": 2.3285, - "step": 520420 - }, - { - "epoch": 0.91, - "learning_rate": 4.621630388152778e-06, - "loss": 2.3599, - "step": 520430 - }, - { - "epoch": 0.91, - "learning_rate": 4.620758448225952e-06, - "loss": 2.2147, - "step": 520440 - }, - { - "epoch": 0.91, - "learning_rate": 4.619886508299125e-06, - "loss": 2.1874, - "step": 520450 - }, - { - "epoch": 0.91, - "learning_rate": 4.619014568372298e-06, - "loss": 2.2609, - "step": 520460 - }, - { - "epoch": 0.91, - "learning_rate": 4.618142628445471e-06, - "loss": 2.2766, - "step": 520470 - }, - { - "epoch": 0.91, - "learning_rate": 4.617270688518644e-06, - "loss": 2.244, - "step": 520480 - }, - { - "epoch": 0.91, - "learning_rate": 4.616398748591817e-06, - "loss": 2.1716, - "step": 520490 - }, - { - "epoch": 0.91, - "learning_rate": 4.61552680866499e-06, - "loss": 2.2857, - "step": 520500 - }, - { - "epoch": 0.91, - "learning_rate": 4.614654868738163e-06, - "loss": 2.1742, - "step": 520510 - }, - { - "epoch": 0.91, - "learning_rate": 4.613782928811337e-06, - "loss": 2.2265, - "step": 520520 - }, - { - "epoch": 0.91, - "learning_rate": 4.61291098888451e-06, - "loss": 2.2155, - "step": 520530 - }, - { - "epoch": 0.91, - "learning_rate": 4.612039048957683e-06, - "loss": 2.2668, - "step": 520540 - }, - { - "epoch": 0.91, - "learning_rate": 4.611167109030856e-06, - "loss": 2.1951, - "step": 520550 - }, - { - "epoch": 0.91, - "learning_rate": 4.61029516910403e-06, - "loss": 2.1697, - "step": 520560 - }, - { - "epoch": 0.91, - "learning_rate": 4.609423229177203e-06, - "loss": 2.1701, - "step": 520570 - }, - { - "epoch": 0.91, - "learning_rate": 4.608551289250376e-06, - "loss": 2.2188, - "step": 520580 - }, - { - "epoch": 0.91, - "learning_rate": 4.607679349323549e-06, - "loss": 2.3005, - "step": 520590 - }, - { - "epoch": 0.91, - "learning_rate": 4.606807409396723e-06, - "loss": 2.3291, - "step": 520600 - }, - { - "epoch": 0.91, - "learning_rate": 4.605935469469896e-06, - "loss": 2.2166, - "step": 520610 - }, - { - "epoch": 0.91, - "learning_rate": 4.605063529543069e-06, - "loss": 2.2286, - "step": 520620 - }, - { - "epoch": 0.91, - "learning_rate": 4.604191589616242e-06, - "loss": 2.1674, - "step": 520630 - }, - { - "epoch": 0.91, - "learning_rate": 4.603319649689415e-06, - "loss": 2.2672, - "step": 520640 - }, - { - "epoch": 0.91, - "learning_rate": 4.602447709762588e-06, - "loss": 2.2692, - "step": 520650 - }, - { - "epoch": 0.91, - "learning_rate": 4.601575769835761e-06, - "loss": 2.3595, - "step": 520660 - }, - { - "epoch": 0.91, - "learning_rate": 4.600703829908934e-06, - "loss": 2.2824, - "step": 520670 - }, - { - "epoch": 0.91, - "learning_rate": 4.599831889982108e-06, - "loss": 2.3147, - "step": 520680 - }, - { - "epoch": 0.91, - "learning_rate": 4.598959950055281e-06, - "loss": 2.212, - "step": 520690 - }, - { - "epoch": 0.91, - "learning_rate": 4.598088010128455e-06, - "loss": 2.2772, - "step": 520700 - }, - { - "epoch": 0.91, - "learning_rate": 4.5972160702016276e-06, - "loss": 2.2945, - "step": 520710 - }, - { - "epoch": 0.91, - "learning_rate": 4.596344130274801e-06, - "loss": 2.2449, - "step": 520720 - }, - { - "epoch": 0.91, - "learning_rate": 4.595472190347974e-06, - "loss": 2.2391, - "step": 520730 - }, - { - "epoch": 0.91, - "learning_rate": 4.594600250421147e-06, - "loss": 2.3061, - "step": 520740 - }, - { - "epoch": 0.91, - "learning_rate": 4.59372831049432e-06, - "loss": 2.3927, - "step": 520750 - }, - { - "epoch": 0.91, - "learning_rate": 4.592856370567494e-06, - "loss": 2.1692, - "step": 520760 - }, - { - "epoch": 0.91, - "learning_rate": 4.591984430640667e-06, - "loss": 2.1208, - "step": 520770 - }, - { - "epoch": 0.91, - "learning_rate": 4.59111249071384e-06, - "loss": 2.3644, - "step": 520780 - }, - { - "epoch": 0.91, - "learning_rate": 4.590240550787013e-06, - "loss": 2.1738, - "step": 520790 - }, - { - "epoch": 0.91, - "learning_rate": 4.589368610860186e-06, - "loss": 2.2213, - "step": 520800 - }, - { - "epoch": 0.91, - "learning_rate": 4.588496670933359e-06, - "loss": 2.2286, - "step": 520810 - }, - { - "epoch": 0.91, - "learning_rate": 4.587624731006532e-06, - "loss": 2.2682, - "step": 520820 - }, - { - "epoch": 0.91, - "learning_rate": 4.586752791079706e-06, - "loss": 2.2426, - "step": 520830 - }, - { - "epoch": 0.91, - "learning_rate": 4.58588085115288e-06, - "loss": 2.3903, - "step": 520840 - }, - { - "epoch": 0.91, - "learning_rate": 4.585008911226053e-06, - "loss": 2.326, - "step": 520850 - }, - { - "epoch": 0.91, - "learning_rate": 4.584136971299226e-06, - "loss": 2.2706, - "step": 520860 - }, - { - "epoch": 0.91, - "learning_rate": 4.583265031372399e-06, - "loss": 2.2593, - "step": 520870 - }, - { - "epoch": 0.91, - "learning_rate": 4.582393091445572e-06, - "loss": 2.2249, - "step": 520880 - }, - { - "epoch": 0.91, - "learning_rate": 4.581521151518745e-06, - "loss": 2.3073, - "step": 520890 - }, - { - "epoch": 0.91, - "learning_rate": 4.580649211591918e-06, - "loss": 2.2803, - "step": 520900 - }, - { - "epoch": 0.91, - "learning_rate": 4.579777271665091e-06, - "loss": 2.1851, - "step": 520910 - }, - { - "epoch": 0.91, - "learning_rate": 4.578905331738265e-06, - "loss": 2.3609, - "step": 520920 - }, - { - "epoch": 0.91, - "learning_rate": 4.578033391811438e-06, - "loss": 2.2761, - "step": 520930 - }, - { - "epoch": 0.91, - "learning_rate": 4.577161451884611e-06, - "loss": 2.2159, - "step": 520940 - }, - { - "epoch": 0.91, - "learning_rate": 4.576289511957784e-06, - "loss": 2.2548, - "step": 520950 - }, - { - "epoch": 0.91, - "learning_rate": 4.575417572030958e-06, - "loss": 2.2635, - "step": 520960 - }, - { - "epoch": 0.91, - "learning_rate": 4.574545632104131e-06, - "loss": 2.2066, - "step": 520970 - }, - { - "epoch": 0.91, - "learning_rate": 4.573673692177304e-06, - "loss": 2.2074, - "step": 520980 - }, - { - "epoch": 0.91, - "learning_rate": 4.572801752250477e-06, - "loss": 2.3085, - "step": 520990 - }, - { - "epoch": 0.91, - "learning_rate": 4.571929812323651e-06, - "loss": 2.3399, - "step": 521000 - }, - { - "epoch": 0.91, - "learning_rate": 4.571057872396824e-06, - "loss": 2.2008, - "step": 521010 - }, - { - "epoch": 0.91, - "learning_rate": 4.570185932469997e-06, - "loss": 2.2416, - "step": 521020 - }, - { - "epoch": 0.91, - "learning_rate": 4.56931399254317e-06, - "loss": 2.2755, - "step": 521030 - }, - { - "epoch": 0.91, - "learning_rate": 4.568442052616343e-06, - "loss": 2.1817, - "step": 521040 - }, - { - "epoch": 0.91, - "learning_rate": 4.567570112689516e-06, - "loss": 2.2879, - "step": 521050 - }, - { - "epoch": 0.91, - "learning_rate": 4.566698172762689e-06, - "loss": 2.2524, - "step": 521060 - }, - { - "epoch": 0.91, - "learning_rate": 4.565826232835862e-06, - "loss": 2.1722, - "step": 521070 - }, - { - "epoch": 0.91, - "learning_rate": 4.564954292909036e-06, - "loss": 2.1678, - "step": 521080 - }, - { - "epoch": 0.91, - "learning_rate": 4.564082352982209e-06, - "loss": 2.3102, - "step": 521090 - }, - { - "epoch": 0.91, - "learning_rate": 4.563210413055383e-06, - "loss": 2.2194, - "step": 521100 - }, - { - "epoch": 0.91, - "learning_rate": 4.5623384731285555e-06, - "loss": 2.2301, - "step": 521110 - }, - { - "epoch": 0.91, - "learning_rate": 4.561466533201729e-06, - "loss": 2.3635, - "step": 521120 - }, - { - "epoch": 0.91, - "learning_rate": 4.560594593274902e-06, - "loss": 2.3131, - "step": 521130 - }, - { - "epoch": 0.91, - "learning_rate": 4.559722653348075e-06, - "loss": 2.3232, - "step": 521140 - }, - { - "epoch": 0.91, - "learning_rate": 4.558850713421248e-06, - "loss": 2.2839, - "step": 521150 - }, - { - "epoch": 0.91, - "learning_rate": 4.557978773494422e-06, - "loss": 2.1884, - "step": 521160 - }, - { - "epoch": 0.91, - "learning_rate": 4.557106833567595e-06, - "loss": 2.3465, - "step": 521170 - }, - { - "epoch": 0.91, - "learning_rate": 4.556234893640768e-06, - "loss": 2.1999, - "step": 521180 - }, - { - "epoch": 0.91, - "learning_rate": 4.555362953713941e-06, - "loss": 2.348, - "step": 521190 - }, - { - "epoch": 0.91, - "learning_rate": 4.554491013787114e-06, - "loss": 2.2628, - "step": 521200 - }, - { - "epoch": 0.91, - "learning_rate": 4.553619073860287e-06, - "loss": 2.1762, - "step": 521210 - }, - { - "epoch": 0.91, - "learning_rate": 4.55274713393346e-06, - "loss": 2.3473, - "step": 521220 - }, - { - "epoch": 0.91, - "learning_rate": 4.551875194006634e-06, - "loss": 2.3311, - "step": 521230 - }, - { - "epoch": 0.91, - "learning_rate": 4.551003254079808e-06, - "loss": 2.2614, - "step": 521240 - }, - { - "epoch": 0.91, - "learning_rate": 4.550131314152981e-06, - "loss": 2.3464, - "step": 521250 - }, - { - "epoch": 0.91, - "learning_rate": 4.549259374226154e-06, - "loss": 2.2444, - "step": 521260 - }, - { - "epoch": 0.91, - "learning_rate": 4.5483874342993265e-06, - "loss": 2.3506, - "step": 521270 - }, - { - "epoch": 0.91, - "learning_rate": 4.5475154943725e-06, - "loss": 2.2469, - "step": 521280 - }, - { - "epoch": 0.91, - "learning_rate": 4.546643554445673e-06, - "loss": 2.2461, - "step": 521290 - }, - { - "epoch": 0.91, - "learning_rate": 4.545771614518846e-06, - "loss": 2.2721, - "step": 521300 - }, - { - "epoch": 0.91, - "learning_rate": 4.544899674592019e-06, - "loss": 2.1982, - "step": 521310 - }, - { - "epoch": 0.91, - "learning_rate": 4.544027734665193e-06, - "loss": 2.3201, - "step": 521320 - }, - { - "epoch": 0.91, - "learning_rate": 4.543155794738366e-06, - "loss": 2.2216, - "step": 521330 - }, - { - "epoch": 0.91, - "learning_rate": 4.542283854811539e-06, - "loss": 2.229, - "step": 521340 - }, - { - "epoch": 0.91, - "learning_rate": 4.5414119148847124e-06, - "loss": 2.2788, - "step": 521350 - }, - { - "epoch": 0.91, - "learning_rate": 4.540539974957886e-06, - "loss": 2.2437, - "step": 521360 - }, - { - "epoch": 0.91, - "learning_rate": 4.539668035031059e-06, - "loss": 2.2655, - "step": 521370 - }, - { - "epoch": 0.91, - "learning_rate": 4.538796095104232e-06, - "loss": 2.2818, - "step": 521380 - }, - { - "epoch": 0.91, - "learning_rate": 4.537924155177405e-06, - "loss": 2.1202, - "step": 521390 - }, - { - "epoch": 0.91, - "learning_rate": 4.537052215250579e-06, - "loss": 2.3304, - "step": 521400 - }, - { - "epoch": 0.91, - "learning_rate": 4.536180275323752e-06, - "loss": 2.2397, - "step": 521410 - }, - { - "epoch": 0.91, - "learning_rate": 4.535308335396925e-06, - "loss": 2.2682, - "step": 521420 - }, - { - "epoch": 0.91, - "learning_rate": 4.5344363954700975e-06, - "loss": 2.1234, - "step": 521430 - }, - { - "epoch": 0.91, - "learning_rate": 4.533564455543271e-06, - "loss": 2.197, - "step": 521440 - }, - { - "epoch": 0.91, - "learning_rate": 4.532692515616444e-06, - "loss": 2.2653, - "step": 521450 - }, - { - "epoch": 0.91, - "learning_rate": 4.531820575689617e-06, - "loss": 2.2121, - "step": 521460 - }, - { - "epoch": 0.91, - "learning_rate": 4.53094863576279e-06, - "loss": 2.2759, - "step": 521470 - }, - { - "epoch": 0.91, - "learning_rate": 4.530076695835964e-06, - "loss": 2.2123, - "step": 521480 - }, - { - "epoch": 0.91, - "learning_rate": 4.529204755909137e-06, - "loss": 2.2254, - "step": 521490 - }, - { - "epoch": 0.91, - "learning_rate": 4.5283328159823105e-06, - "loss": 2.2612, - "step": 521500 - }, - { - "epoch": 0.91, - "learning_rate": 4.5274608760554834e-06, - "loss": 2.2731, - "step": 521510 - }, - { - "epoch": 0.91, - "learning_rate": 4.526588936128657e-06, - "loss": 2.21, - "step": 521520 - }, - { - "epoch": 0.91, - "learning_rate": 4.52571699620183e-06, - "loss": 2.3597, - "step": 521530 - }, - { - "epoch": 0.91, - "learning_rate": 4.524845056275003e-06, - "loss": 2.2603, - "step": 521540 - }, - { - "epoch": 0.91, - "learning_rate": 4.523973116348176e-06, - "loss": 2.2669, - "step": 521550 - }, - { - "epoch": 0.91, - "learning_rate": 4.52310117642135e-06, - "loss": 2.2558, - "step": 521560 - }, - { - "epoch": 0.91, - "learning_rate": 4.522229236494523e-06, - "loss": 2.2924, - "step": 521570 - }, - { - "epoch": 0.91, - "learning_rate": 4.521357296567696e-06, - "loss": 2.2186, - "step": 521580 - }, - { - "epoch": 0.91, - "learning_rate": 4.5204853566408685e-06, - "loss": 2.376, - "step": 521590 - }, - { - "epoch": 0.91, - "learning_rate": 4.519613416714042e-06, - "loss": 2.2943, - "step": 521600 - }, - { - "epoch": 0.91, - "learning_rate": 4.518741476787215e-06, - "loss": 2.2836, - "step": 521610 - }, - { - "epoch": 0.91, - "learning_rate": 4.517869536860388e-06, - "loss": 2.2854, - "step": 521620 - }, - { - "epoch": 0.91, - "learning_rate": 4.516997596933562e-06, - "loss": 2.2732, - "step": 521630 - }, - { - "epoch": 0.91, - "learning_rate": 4.516125657006736e-06, - "loss": 2.2073, - "step": 521640 - }, - { - "epoch": 0.91, - "learning_rate": 4.515253717079909e-06, - "loss": 2.2786, - "step": 521650 - }, - { - "epoch": 0.91, - "learning_rate": 4.5143817771530815e-06, - "loss": 2.1159, - "step": 521660 - }, - { - "epoch": 0.91, - "learning_rate": 4.5135098372262544e-06, - "loss": 2.2905, - "step": 521670 - }, - { - "epoch": 0.91, - "learning_rate": 4.512637897299428e-06, - "loss": 2.2582, - "step": 521680 - }, - { - "epoch": 0.91, - "learning_rate": 4.511765957372601e-06, - "loss": 2.3724, - "step": 521690 - }, - { - "epoch": 0.91, - "learning_rate": 4.510894017445774e-06, - "loss": 2.2298, - "step": 521700 - }, - { - "epoch": 0.91, - "learning_rate": 4.510022077518947e-06, - "loss": 2.4006, - "step": 521710 - }, - { - "epoch": 0.91, - "learning_rate": 4.509150137592121e-06, - "loss": 2.1767, - "step": 521720 - }, - { - "epoch": 0.91, - "learning_rate": 4.508278197665294e-06, - "loss": 2.2982, - "step": 521730 - }, - { - "epoch": 0.91, - "learning_rate": 4.507406257738467e-06, - "loss": 2.2558, - "step": 521740 - }, - { - "epoch": 0.91, - "learning_rate": 4.50653431781164e-06, - "loss": 2.1785, - "step": 521750 - }, - { - "epoch": 0.91, - "learning_rate": 4.505662377884814e-06, - "loss": 2.2843, - "step": 521760 - }, - { - "epoch": 0.91, - "learning_rate": 4.504790437957987e-06, - "loss": 2.2004, - "step": 521770 - }, - { - "epoch": 0.91, - "learning_rate": 4.50391849803116e-06, - "loss": 2.2653, - "step": 521780 - }, - { - "epoch": 0.91, - "learning_rate": 4.503046558104333e-06, - "loss": 2.24, - "step": 521790 - }, - { - "epoch": 0.91, - "learning_rate": 4.502174618177507e-06, - "loss": 2.2728, - "step": 521800 - }, - { - "epoch": 0.91, - "learning_rate": 4.50130267825068e-06, - "loss": 2.2372, - "step": 521810 - }, - { - "epoch": 0.91, - "learning_rate": 4.5004307383238525e-06, - "loss": 2.2197, - "step": 521820 - }, - { - "epoch": 0.91, - "learning_rate": 4.4995587983970254e-06, - "loss": 2.2801, - "step": 521830 - }, - { - "epoch": 0.91, - "learning_rate": 4.498686858470199e-06, - "loss": 2.3318, - "step": 521840 - }, - { - "epoch": 0.91, - "learning_rate": 4.497814918543372e-06, - "loss": 2.1956, - "step": 521850 - }, - { - "epoch": 0.91, - "learning_rate": 4.496942978616545e-06, - "loss": 2.246, - "step": 521860 - }, - { - "epoch": 0.91, - "learning_rate": 4.496071038689719e-06, - "loss": 2.2857, - "step": 521870 - }, - { - "epoch": 0.91, - "learning_rate": 4.495199098762892e-06, - "loss": 2.2168, - "step": 521880 - }, - { - "epoch": 0.91, - "learning_rate": 4.494327158836065e-06, - "loss": 2.2831, - "step": 521890 - }, - { - "epoch": 0.91, - "learning_rate": 4.4934552189092384e-06, - "loss": 2.2514, - "step": 521900 - }, - { - "epoch": 0.91, - "learning_rate": 4.492583278982411e-06, - "loss": 2.388, - "step": 521910 - }, - { - "epoch": 0.91, - "learning_rate": 4.491711339055585e-06, - "loss": 2.2675, - "step": 521920 - }, - { - "epoch": 0.91, - "learning_rate": 4.490839399128758e-06, - "loss": 2.2358, - "step": 521930 - }, - { - "epoch": 0.91, - "learning_rate": 4.489967459201931e-06, - "loss": 2.4247, - "step": 521940 - }, - { - "epoch": 0.91, - "learning_rate": 4.489095519275104e-06, - "loss": 2.3451, - "step": 521950 - }, - { - "epoch": 0.91, - "learning_rate": 4.488223579348278e-06, - "loss": 2.1031, - "step": 521960 - }, - { - "epoch": 0.91, - "learning_rate": 4.487351639421451e-06, - "loss": 2.2714, - "step": 521970 - }, - { - "epoch": 0.91, - "learning_rate": 4.4864796994946235e-06, - "loss": 2.2105, - "step": 521980 - }, - { - "epoch": 0.91, - "learning_rate": 4.485607759567797e-06, - "loss": 2.2386, - "step": 521990 - }, - { - "epoch": 0.91, - "learning_rate": 4.48473581964097e-06, - "loss": 2.2191, - "step": 522000 - }, - { - "epoch": 0.91, - "learning_rate": 4.483863879714143e-06, - "loss": 2.3744, - "step": 522010 - }, - { - "epoch": 0.91, - "learning_rate": 4.482991939787316e-06, - "loss": 2.2134, - "step": 522020 - }, - { - "epoch": 0.91, - "learning_rate": 4.48211999986049e-06, - "loss": 2.2435, - "step": 522030 - }, - { - "epoch": 0.91, - "learning_rate": 4.481248059933664e-06, - "loss": 2.3294, - "step": 522040 - }, - { - "epoch": 0.91, - "learning_rate": 4.4803761200068365e-06, - "loss": 2.378, - "step": 522050 - }, - { - "epoch": 0.91, - "learning_rate": 4.4795041800800094e-06, - "loss": 2.2273, - "step": 522060 - }, - { - "epoch": 0.91, - "learning_rate": 4.478632240153182e-06, - "loss": 2.2501, - "step": 522070 - }, - { - "epoch": 0.91, - "learning_rate": 4.477760300226356e-06, - "loss": 2.2528, - "step": 522080 - }, - { - "epoch": 0.91, - "learning_rate": 4.476888360299529e-06, - "loss": 2.2815, - "step": 522090 - }, - { - "epoch": 0.91, - "learning_rate": 4.476016420372702e-06, - "loss": 2.2052, - "step": 522100 - }, - { - "epoch": 0.91, - "learning_rate": 4.475144480445875e-06, - "loss": 2.3264, - "step": 522110 - }, - { - "epoch": 0.91, - "learning_rate": 4.474272540519049e-06, - "loss": 2.1876, - "step": 522120 - }, - { - "epoch": 0.91, - "learning_rate": 4.473400600592222e-06, - "loss": 2.2572, - "step": 522130 - }, - { - "epoch": 0.91, - "learning_rate": 4.4725286606653945e-06, - "loss": 2.246, - "step": 522140 - }, - { - "epoch": 0.91, - "learning_rate": 4.471656720738568e-06, - "loss": 2.2393, - "step": 522150 - }, - { - "epoch": 0.91, - "learning_rate": 4.470784780811742e-06, - "loss": 2.23, - "step": 522160 - }, - { - "epoch": 0.91, - "learning_rate": 4.469912840884915e-06, - "loss": 2.3891, - "step": 522170 - }, - { - "epoch": 0.91, - "learning_rate": 4.469040900958088e-06, - "loss": 2.2913, - "step": 522180 - }, - { - "epoch": 0.91, - "learning_rate": 4.468168961031261e-06, - "loss": 2.3577, - "step": 522190 - }, - { - "epoch": 0.91, - "learning_rate": 4.467297021104435e-06, - "loss": 2.3611, - "step": 522200 - }, - { - "epoch": 0.91, - "learning_rate": 4.4664250811776075e-06, - "loss": 2.2036, - "step": 522210 - }, - { - "epoch": 0.91, - "learning_rate": 4.4655531412507804e-06, - "loss": 2.2824, - "step": 522220 - }, - { - "epoch": 0.91, - "learning_rate": 4.464681201323953e-06, - "loss": 2.2213, - "step": 522230 - }, - { - "epoch": 0.91, - "learning_rate": 4.463809261397127e-06, - "loss": 2.2571, - "step": 522240 - }, - { - "epoch": 0.91, - "learning_rate": 4.4629373214703e-06, - "loss": 2.3081, - "step": 522250 - }, - { - "epoch": 0.91, - "learning_rate": 4.462065381543473e-06, - "loss": 2.2632, - "step": 522260 - }, - { - "epoch": 0.91, - "learning_rate": 4.461193441616647e-06, - "loss": 2.2238, - "step": 522270 - }, - { - "epoch": 0.91, - "learning_rate": 4.46032150168982e-06, - "loss": 2.2512, - "step": 522280 - }, - { - "epoch": 0.91, - "learning_rate": 4.4594495617629934e-06, - "loss": 2.1427, - "step": 522290 - }, - { - "epoch": 0.91, - "learning_rate": 4.458577621836166e-06, - "loss": 2.2568, - "step": 522300 - }, - { - "epoch": 0.91, - "learning_rate": 4.457705681909339e-06, - "loss": 2.2624, - "step": 522310 - }, - { - "epoch": 0.91, - "learning_rate": 4.456833741982513e-06, - "loss": 2.2634, - "step": 522320 - }, - { - "epoch": 0.91, - "learning_rate": 4.455961802055686e-06, - "loss": 2.3088, - "step": 522330 - }, - { - "epoch": 0.91, - "learning_rate": 4.455089862128859e-06, - "loss": 2.2338, - "step": 522340 - }, - { - "epoch": 0.91, - "learning_rate": 4.454217922202032e-06, - "loss": 2.24, - "step": 522350 - }, - { - "epoch": 0.91, - "learning_rate": 4.453345982275206e-06, - "loss": 2.2797, - "step": 522360 - }, - { - "epoch": 0.91, - "learning_rate": 4.4524740423483785e-06, - "loss": 2.2457, - "step": 522370 - }, - { - "epoch": 0.91, - "learning_rate": 4.4516021024215514e-06, - "loss": 2.2637, - "step": 522380 - }, - { - "epoch": 0.91, - "learning_rate": 4.450730162494725e-06, - "loss": 2.3, - "step": 522390 - }, - { - "epoch": 0.91, - "learning_rate": 4.449858222567898e-06, - "loss": 2.1743, - "step": 522400 - }, - { - "epoch": 0.91, - "learning_rate": 4.448986282641071e-06, - "loss": 2.246, - "step": 522410 - }, - { - "epoch": 0.91, - "learning_rate": 4.448114342714244e-06, - "loss": 2.2834, - "step": 522420 - }, - { - "epoch": 0.91, - "learning_rate": 4.447242402787418e-06, - "loss": 2.2142, - "step": 522430 - }, - { - "epoch": 0.91, - "learning_rate": 4.4463704628605915e-06, - "loss": 2.2216, - "step": 522440 - }, - { - "epoch": 0.91, - "learning_rate": 4.4454985229337644e-06, - "loss": 2.2062, - "step": 522450 - }, - { - "epoch": 0.91, - "learning_rate": 4.444626583006937e-06, - "loss": 2.2578, - "step": 522460 - }, - { - "epoch": 0.91, - "learning_rate": 4.44375464308011e-06, - "loss": 2.1922, - "step": 522470 - }, - { - "epoch": 0.91, - "learning_rate": 4.442882703153284e-06, - "loss": 2.2169, - "step": 522480 - }, - { - "epoch": 0.91, - "learning_rate": 4.442010763226457e-06, - "loss": 2.3594, - "step": 522490 - }, - { - "epoch": 0.91, - "learning_rate": 4.44113882329963e-06, - "loss": 2.3865, - "step": 522500 - }, - { - "epoch": 0.91, - "learning_rate": 4.440266883372804e-06, - "loss": 2.1929, - "step": 522510 - }, - { - "epoch": 0.91, - "learning_rate": 4.439394943445977e-06, - "loss": 2.3305, - "step": 522520 - }, - { - "epoch": 0.91, - "learning_rate": 4.4385230035191495e-06, - "loss": 2.4118, - "step": 522530 - }, - { - "epoch": 0.91, - "learning_rate": 4.4376510635923224e-06, - "loss": 2.2385, - "step": 522540 - }, - { - "epoch": 0.91, - "learning_rate": 4.436779123665496e-06, - "loss": 2.1673, - "step": 522550 - }, - { - "epoch": 0.91, - "learning_rate": 4.43590718373867e-06, - "loss": 2.1009, - "step": 522560 - }, - { - "epoch": 0.91, - "learning_rate": 4.435035243811843e-06, - "loss": 2.307, - "step": 522570 - }, - { - "epoch": 0.91, - "learning_rate": 4.434163303885016e-06, - "loss": 2.25, - "step": 522580 - }, - { - "epoch": 0.91, - "learning_rate": 4.433291363958189e-06, - "loss": 2.2726, - "step": 522590 - }, - { - "epoch": 0.91, - "learning_rate": 4.4324194240313625e-06, - "loss": 2.325, - "step": 522600 - }, - { - "epoch": 0.91, - "learning_rate": 4.4315474841045354e-06, - "loss": 2.3794, - "step": 522610 - }, - { - "epoch": 0.91, - "learning_rate": 4.430675544177708e-06, - "loss": 2.1977, - "step": 522620 - }, - { - "epoch": 0.91, - "learning_rate": 4.429803604250881e-06, - "loss": 2.1705, - "step": 522630 - }, - { - "epoch": 0.91, - "learning_rate": 4.428931664324055e-06, - "loss": 2.2186, - "step": 522640 - }, - { - "epoch": 0.91, - "learning_rate": 4.428059724397228e-06, - "loss": 2.3045, - "step": 522650 - }, - { - "epoch": 0.91, - "learning_rate": 4.427187784470401e-06, - "loss": 2.3445, - "step": 522660 - }, - { - "epoch": 0.91, - "learning_rate": 4.426315844543575e-06, - "loss": 2.2632, - "step": 522670 - }, - { - "epoch": 0.91, - "learning_rate": 4.425443904616748e-06, - "loss": 2.2751, - "step": 522680 - }, - { - "epoch": 0.91, - "learning_rate": 4.424571964689921e-06, - "loss": 2.2609, - "step": 522690 - }, - { - "epoch": 0.91, - "learning_rate": 4.423700024763094e-06, - "loss": 2.373, - "step": 522700 - }, - { - "epoch": 0.91, - "learning_rate": 4.422828084836267e-06, - "loss": 2.1794, - "step": 522710 - }, - { - "epoch": 0.91, - "learning_rate": 4.421956144909441e-06, - "loss": 2.2538, - "step": 522720 - }, - { - "epoch": 0.91, - "learning_rate": 4.421084204982614e-06, - "loss": 2.3618, - "step": 522730 - }, - { - "epoch": 0.91, - "learning_rate": 4.420212265055787e-06, - "loss": 2.2792, - "step": 522740 - }, - { - "epoch": 0.91, - "learning_rate": 4.41934032512896e-06, - "loss": 2.3149, - "step": 522750 - }, - { - "epoch": 0.91, - "learning_rate": 4.4184683852021335e-06, - "loss": 2.1791, - "step": 522760 - }, - { - "epoch": 0.91, - "learning_rate": 4.4175964452753064e-06, - "loss": 2.2557, - "step": 522770 - }, - { - "epoch": 0.91, - "learning_rate": 4.416724505348479e-06, - "loss": 2.3118, - "step": 522780 - }, - { - "epoch": 0.91, - "learning_rate": 4.415852565421653e-06, - "loss": 2.2866, - "step": 522790 - }, - { - "epoch": 0.91, - "learning_rate": 4.414980625494826e-06, - "loss": 2.1489, - "step": 522800 - }, - { - "epoch": 0.91, - "learning_rate": 4.414108685567999e-06, - "loss": 2.2303, - "step": 522810 - }, - { - "epoch": 0.91, - "learning_rate": 4.413236745641172e-06, - "loss": 2.1695, - "step": 522820 - }, - { - "epoch": 0.91, - "learning_rate": 4.412364805714346e-06, - "loss": 2.3656, - "step": 522830 - }, - { - "epoch": 0.91, - "learning_rate": 4.4114928657875194e-06, - "loss": 2.1515, - "step": 522840 - }, - { - "epoch": 0.91, - "learning_rate": 4.410620925860692e-06, - "loss": 2.2728, - "step": 522850 - }, - { - "epoch": 0.91, - "learning_rate": 4.409748985933865e-06, - "loss": 2.2534, - "step": 522860 - }, - { - "epoch": 0.91, - "learning_rate": 4.408877046007038e-06, - "loss": 2.2639, - "step": 522870 - }, - { - "epoch": 0.91, - "learning_rate": 4.408005106080212e-06, - "loss": 2.2781, - "step": 522880 - }, - { - "epoch": 0.91, - "learning_rate": 4.407133166153385e-06, - "loss": 2.2793, - "step": 522890 - }, - { - "epoch": 0.91, - "learning_rate": 4.406261226226558e-06, - "loss": 2.285, - "step": 522900 - }, - { - "epoch": 0.91, - "learning_rate": 4.405389286299732e-06, - "loss": 2.2699, - "step": 522910 - }, - { - "epoch": 0.91, - "learning_rate": 4.4045173463729045e-06, - "loss": 2.258, - "step": 522920 - }, - { - "epoch": 0.91, - "learning_rate": 4.4036454064460774e-06, - "loss": 2.2401, - "step": 522930 - }, - { - "epoch": 0.91, - "learning_rate": 4.40277346651925e-06, - "loss": 2.2836, - "step": 522940 - }, - { - "epoch": 0.91, - "learning_rate": 4.401901526592424e-06, - "loss": 2.1401, - "step": 522950 - }, - { - "epoch": 0.91, - "learning_rate": 4.401029586665598e-06, - "loss": 2.2195, - "step": 522960 - }, - { - "epoch": 0.91, - "learning_rate": 4.400157646738771e-06, - "loss": 2.2619, - "step": 522970 - }, - { - "epoch": 0.91, - "learning_rate": 4.399285706811944e-06, - "loss": 2.2969, - "step": 522980 - }, - { - "epoch": 0.91, - "learning_rate": 4.398413766885117e-06, - "loss": 2.2825, - "step": 522990 - }, - { - "epoch": 0.91, - "learning_rate": 4.3975418269582904e-06, - "loss": 2.2971, - "step": 523000 - }, - { - "epoch": 0.91, - "learning_rate": 4.396669887031463e-06, - "loss": 2.2427, - "step": 523010 - }, - { - "epoch": 0.91, - "learning_rate": 4.395797947104636e-06, - "loss": 2.4066, - "step": 523020 - }, - { - "epoch": 0.91, - "learning_rate": 4.39492600717781e-06, - "loss": 2.2377, - "step": 523030 - }, - { - "epoch": 0.91, - "learning_rate": 4.394054067250983e-06, - "loss": 2.2361, - "step": 523040 - }, - { - "epoch": 0.91, - "learning_rate": 4.393182127324156e-06, - "loss": 2.3028, - "step": 523050 - }, - { - "epoch": 0.91, - "learning_rate": 4.392310187397329e-06, - "loss": 2.208, - "step": 523060 - }, - { - "epoch": 0.91, - "learning_rate": 4.391438247470503e-06, - "loss": 2.2517, - "step": 523070 - }, - { - "epoch": 0.91, - "learning_rate": 4.3905663075436755e-06, - "loss": 2.2806, - "step": 523080 - }, - { - "epoch": 0.91, - "learning_rate": 4.389694367616849e-06, - "loss": 2.1425, - "step": 523090 - }, - { - "epoch": 0.91, - "learning_rate": 4.388822427690022e-06, - "loss": 2.2914, - "step": 523100 - }, - { - "epoch": 0.91, - "learning_rate": 4.387950487763195e-06, - "loss": 2.255, - "step": 523110 - }, - { - "epoch": 0.91, - "learning_rate": 4.387078547836369e-06, - "loss": 2.3288, - "step": 523120 - }, - { - "epoch": 0.91, - "learning_rate": 4.386206607909542e-06, - "loss": 2.241, - "step": 523130 - }, - { - "epoch": 0.91, - "learning_rate": 4.385334667982715e-06, - "loss": 2.2676, - "step": 523140 - }, - { - "epoch": 0.91, - "learning_rate": 4.384462728055888e-06, - "loss": 2.2661, - "step": 523150 - }, - { - "epoch": 0.91, - "learning_rate": 4.3835907881290614e-06, - "loss": 2.3039, - "step": 523160 - }, - { - "epoch": 0.91, - "learning_rate": 4.382718848202234e-06, - "loss": 2.2893, - "step": 523170 - }, - { - "epoch": 0.91, - "learning_rate": 4.381846908275407e-06, - "loss": 2.229, - "step": 523180 - }, - { - "epoch": 0.91, - "learning_rate": 4.380974968348581e-06, - "loss": 2.124, - "step": 523190 - }, - { - "epoch": 0.91, - "learning_rate": 4.380103028421754e-06, - "loss": 2.2696, - "step": 523200 - }, - { - "epoch": 0.91, - "learning_rate": 4.379231088494927e-06, - "loss": 2.2509, - "step": 523210 - }, - { - "epoch": 0.91, - "learning_rate": 4.3783591485681e-06, - "loss": 2.2396, - "step": 523220 - }, - { - "epoch": 0.91, - "learning_rate": 4.377487208641274e-06, - "loss": 2.1772, - "step": 523230 - }, - { - "epoch": 0.91, - "learning_rate": 4.376615268714447e-06, - "loss": 2.275, - "step": 523240 - }, - { - "epoch": 0.91, - "learning_rate": 4.37574332878762e-06, - "loss": 2.1885, - "step": 523250 - }, - { - "epoch": 0.91, - "learning_rate": 4.374871388860793e-06, - "loss": 2.1831, - "step": 523260 - }, - { - "epoch": 0.91, - "learning_rate": 4.373999448933966e-06, - "loss": 2.2609, - "step": 523270 - }, - { - "epoch": 0.91, - "learning_rate": 4.37312750900714e-06, - "loss": 2.2716, - "step": 523280 - }, - { - "epoch": 0.91, - "learning_rate": 4.372255569080313e-06, - "loss": 2.2767, - "step": 523290 - }, - { - "epoch": 0.91, - "learning_rate": 4.371383629153486e-06, - "loss": 2.2484, - "step": 523300 - }, - { - "epoch": 0.91, - "learning_rate": 4.3705116892266595e-06, - "loss": 2.1358, - "step": 523310 - }, - { - "epoch": 0.91, - "learning_rate": 4.3696397492998324e-06, - "loss": 2.3058, - "step": 523320 - }, - { - "epoch": 0.91, - "learning_rate": 4.368767809373005e-06, - "loss": 2.2636, - "step": 523330 - }, - { - "epoch": 0.91, - "learning_rate": 4.367895869446178e-06, - "loss": 2.1938, - "step": 523340 - }, - { - "epoch": 0.91, - "learning_rate": 4.367023929519352e-06, - "loss": 2.1991, - "step": 523350 - }, - { - "epoch": 0.91, - "learning_rate": 4.366151989592526e-06, - "loss": 2.3136, - "step": 523360 - }, - { - "epoch": 0.91, - "learning_rate": 4.365280049665699e-06, - "loss": 2.2655, - "step": 523370 - }, - { - "epoch": 0.91, - "learning_rate": 4.364408109738872e-06, - "loss": 2.1674, - "step": 523380 - }, - { - "epoch": 0.91, - "learning_rate": 4.363536169812045e-06, - "loss": 2.2408, - "step": 523390 - }, - { - "epoch": 0.91, - "learning_rate": 4.362664229885218e-06, - "loss": 2.2841, - "step": 523400 - }, - { - "epoch": 0.91, - "learning_rate": 4.361792289958391e-06, - "loss": 2.2889, - "step": 523410 - }, - { - "epoch": 0.91, - "learning_rate": 4.360920350031564e-06, - "loss": 2.0985, - "step": 523420 - }, - { - "epoch": 0.91, - "learning_rate": 4.360048410104738e-06, - "loss": 2.1592, - "step": 523430 - }, - { - "epoch": 0.91, - "learning_rate": 4.359176470177911e-06, - "loss": 2.3365, - "step": 523440 - }, - { - "epoch": 0.91, - "learning_rate": 4.358304530251084e-06, - "loss": 2.1893, - "step": 523450 - }, - { - "epoch": 0.91, - "learning_rate": 4.357432590324257e-06, - "loss": 2.3454, - "step": 523460 - }, - { - "epoch": 0.91, - "learning_rate": 4.3565606503974305e-06, - "loss": 2.2722, - "step": 523470 - }, - { - "epoch": 0.91, - "learning_rate": 4.3556887104706034e-06, - "loss": 2.3411, - "step": 523480 - }, - { - "epoch": 0.91, - "learning_rate": 4.354816770543777e-06, - "loss": 2.2835, - "step": 523490 - }, - { - "epoch": 0.91, - "learning_rate": 4.35394483061695e-06, - "loss": 2.3194, - "step": 523500 - }, - { - "epoch": 0.91, - "learning_rate": 4.353072890690123e-06, - "loss": 2.2758, - "step": 523510 - }, - { - "epoch": 0.91, - "learning_rate": 4.352200950763297e-06, - "loss": 2.3241, - "step": 523520 - }, - { - "epoch": 0.91, - "learning_rate": 4.35132901083647e-06, - "loss": 2.1809, - "step": 523530 - }, - { - "epoch": 0.91, - "learning_rate": 4.350457070909643e-06, - "loss": 2.1931, - "step": 523540 - }, - { - "epoch": 0.91, - "learning_rate": 4.3495851309828164e-06, - "loss": 2.3809, - "step": 523550 - }, - { - "epoch": 0.91, - "learning_rate": 4.348713191055989e-06, - "loss": 2.2213, - "step": 523560 - }, - { - "epoch": 0.91, - "learning_rate": 4.347841251129162e-06, - "loss": 2.2748, - "step": 523570 - }, - { - "epoch": 0.91, - "learning_rate": 4.346969311202335e-06, - "loss": 2.3982, - "step": 523580 - }, - { - "epoch": 0.91, - "learning_rate": 4.346097371275509e-06, - "loss": 2.2082, - "step": 523590 - }, - { - "epoch": 0.91, - "learning_rate": 4.345225431348682e-06, - "loss": 2.2654, - "step": 523600 - }, - { - "epoch": 0.91, - "learning_rate": 4.344353491421855e-06, - "loss": 2.1955, - "step": 523610 - }, - { - "epoch": 0.91, - "learning_rate": 4.343481551495029e-06, - "loss": 2.3126, - "step": 523620 - }, - { - "epoch": 0.91, - "learning_rate": 4.3426096115682015e-06, - "loss": 2.189, - "step": 523630 - }, - { - "epoch": 0.91, - "learning_rate": 4.341737671641375e-06, - "loss": 2.1327, - "step": 523640 - }, - { - "epoch": 0.91, - "learning_rate": 4.340865731714548e-06, - "loss": 2.2753, - "step": 523650 - }, - { - "epoch": 0.91, - "learning_rate": 4.339993791787721e-06, - "loss": 2.2809, - "step": 523660 - }, - { - "epoch": 0.91, - "learning_rate": 4.339121851860894e-06, - "loss": 2.2495, - "step": 523670 - }, - { - "epoch": 0.91, - "learning_rate": 4.338249911934068e-06, - "loss": 2.1929, - "step": 523680 - }, - { - "epoch": 0.91, - "learning_rate": 4.337377972007241e-06, - "loss": 2.0763, - "step": 523690 - }, - { - "epoch": 0.91, - "learning_rate": 4.336506032080414e-06, - "loss": 2.32, - "step": 523700 - }, - { - "epoch": 0.91, - "learning_rate": 4.3356340921535874e-06, - "loss": 2.1719, - "step": 523710 - }, - { - "epoch": 0.91, - "learning_rate": 4.33476215222676e-06, - "loss": 2.1905, - "step": 523720 - }, - { - "epoch": 0.91, - "learning_rate": 4.333890212299933e-06, - "loss": 2.2513, - "step": 523730 - }, - { - "epoch": 0.91, - "learning_rate": 4.333018272373106e-06, - "loss": 2.2131, - "step": 523740 - }, - { - "epoch": 0.91, - "learning_rate": 4.33214633244628e-06, - "loss": 2.3029, - "step": 523750 - }, - { - "epoch": 0.91, - "learning_rate": 4.331274392519454e-06, - "loss": 2.2545, - "step": 523760 - }, - { - "epoch": 0.91, - "learning_rate": 4.330402452592627e-06, - "loss": 2.2149, - "step": 523770 - }, - { - "epoch": 0.91, - "learning_rate": 4.3295305126658e-06, - "loss": 2.1568, - "step": 523780 - }, - { - "epoch": 0.91, - "learning_rate": 4.3286585727389725e-06, - "loss": 2.3272, - "step": 523790 - }, - { - "epoch": 0.91, - "learning_rate": 4.327786632812146e-06, - "loss": 2.3888, - "step": 523800 - }, - { - "epoch": 0.91, - "learning_rate": 4.326914692885319e-06, - "loss": 2.1563, - "step": 523810 - }, - { - "epoch": 0.91, - "learning_rate": 4.326042752958492e-06, - "loss": 2.2635, - "step": 523820 - }, - { - "epoch": 0.91, - "learning_rate": 4.325170813031666e-06, - "loss": 2.2907, - "step": 523830 - }, - { - "epoch": 0.91, - "learning_rate": 4.324298873104839e-06, - "loss": 2.3339, - "step": 523840 - }, - { - "epoch": 0.91, - "learning_rate": 4.323426933178012e-06, - "loss": 2.2755, - "step": 523850 - }, - { - "epoch": 0.91, - "learning_rate": 4.322554993251185e-06, - "loss": 2.2847, - "step": 523860 - }, - { - "epoch": 0.91, - "learning_rate": 4.3216830533243584e-06, - "loss": 2.1935, - "step": 523870 - }, - { - "epoch": 0.91, - "learning_rate": 4.320811113397531e-06, - "loss": 2.2794, - "step": 523880 - }, - { - "epoch": 0.91, - "learning_rate": 4.319939173470705e-06, - "loss": 2.3311, - "step": 523890 - }, - { - "epoch": 0.91, - "learning_rate": 4.319067233543878e-06, - "loss": 2.1107, - "step": 523900 - }, - { - "epoch": 0.91, - "learning_rate": 4.318195293617051e-06, - "loss": 2.2222, - "step": 523910 - }, - { - "epoch": 0.91, - "learning_rate": 4.317323353690225e-06, - "loss": 2.2201, - "step": 523920 - }, - { - "epoch": 0.91, - "learning_rate": 4.316451413763398e-06, - "loss": 2.1969, - "step": 523930 - }, - { - "epoch": 0.91, - "learning_rate": 4.315579473836571e-06, - "loss": 2.2537, - "step": 523940 - }, - { - "epoch": 0.91, - "learning_rate": 4.314707533909744e-06, - "loss": 2.2125, - "step": 523950 - }, - { - "epoch": 0.91, - "learning_rate": 4.313835593982917e-06, - "loss": 2.3324, - "step": 523960 - }, - { - "epoch": 0.91, - "learning_rate": 4.31296365405609e-06, - "loss": 2.3295, - "step": 523970 - }, - { - "epoch": 0.91, - "learning_rate": 4.312091714129263e-06, - "loss": 2.3567, - "step": 523980 - }, - { - "epoch": 0.91, - "learning_rate": 4.311219774202437e-06, - "loss": 2.2278, - "step": 523990 - }, - { - "epoch": 0.91, - "learning_rate": 4.31034783427561e-06, - "loss": 2.2195, - "step": 524000 - }, - { - "epoch": 0.91, - "learning_rate": 4.309475894348783e-06, - "loss": 2.194, - "step": 524010 - }, - { - "epoch": 0.91, - "learning_rate": 4.3086039544219565e-06, - "loss": 2.2129, - "step": 524020 - }, - { - "epoch": 0.91, - "learning_rate": 4.3077320144951295e-06, - "loss": 2.3386, - "step": 524030 - }, - { - "epoch": 0.91, - "learning_rate": 4.306860074568303e-06, - "loss": 2.2601, - "step": 524040 - }, - { - "epoch": 0.91, - "learning_rate": 4.305988134641476e-06, - "loss": 2.2428, - "step": 524050 - }, - { - "epoch": 0.91, - "learning_rate": 4.305116194714649e-06, - "loss": 2.2451, - "step": 524060 - }, - { - "epoch": 0.91, - "learning_rate": 4.304244254787823e-06, - "loss": 2.2863, - "step": 524070 - }, - { - "epoch": 0.91, - "learning_rate": 4.303372314860996e-06, - "loss": 2.2713, - "step": 524080 - }, - { - "epoch": 0.91, - "learning_rate": 4.302500374934169e-06, - "loss": 2.3861, - "step": 524090 - }, - { - "epoch": 0.91, - "learning_rate": 4.301628435007342e-06, - "loss": 2.2212, - "step": 524100 - }, - { - "epoch": 0.91, - "learning_rate": 4.300756495080515e-06, - "loss": 2.1726, - "step": 524110 - }, - { - "epoch": 0.91, - "learning_rate": 4.299884555153688e-06, - "loss": 2.2006, - "step": 524120 - }, - { - "epoch": 0.91, - "learning_rate": 4.299012615226861e-06, - "loss": 2.2635, - "step": 524130 - }, - { - "epoch": 0.91, - "learning_rate": 4.298140675300034e-06, - "loss": 2.1635, - "step": 524140 - }, - { - "epoch": 0.91, - "learning_rate": 4.297268735373208e-06, - "loss": 2.2922, - "step": 524150 - }, - { - "epoch": 0.91, - "learning_rate": 4.296396795446382e-06, - "loss": 2.2775, - "step": 524160 - }, - { - "epoch": 0.91, - "learning_rate": 4.295524855519555e-06, - "loss": 2.2788, - "step": 524170 - }, - { - "epoch": 0.91, - "learning_rate": 4.2946529155927275e-06, - "loss": 2.3075, - "step": 524180 - }, - { - "epoch": 0.91, - "learning_rate": 4.2937809756659005e-06, - "loss": 2.2584, - "step": 524190 - }, - { - "epoch": 0.91, - "learning_rate": 4.292909035739074e-06, - "loss": 2.3435, - "step": 524200 - }, - { - "epoch": 0.91, - "learning_rate": 4.292037095812247e-06, - "loss": 2.2588, - "step": 524210 - }, - { - "epoch": 0.91, - "learning_rate": 4.29116515588542e-06, - "loss": 2.2838, - "step": 524220 - }, - { - "epoch": 0.91, - "learning_rate": 4.290293215958594e-06, - "loss": 2.1948, - "step": 524230 - }, - { - "epoch": 0.91, - "learning_rate": 4.289421276031767e-06, - "loss": 2.2861, - "step": 524240 - }, - { - "epoch": 0.91, - "learning_rate": 4.28854933610494e-06, - "loss": 2.224, - "step": 524250 - }, - { - "epoch": 0.91, - "learning_rate": 4.287677396178113e-06, - "loss": 2.27, - "step": 524260 - }, - { - "epoch": 0.91, - "learning_rate": 4.286805456251286e-06, - "loss": 2.3412, - "step": 524270 - }, - { - "epoch": 0.91, - "learning_rate": 4.285933516324459e-06, - "loss": 2.2338, - "step": 524280 - }, - { - "epoch": 0.91, - "learning_rate": 4.285061576397633e-06, - "loss": 2.3385, - "step": 524290 - }, - { - "epoch": 0.91, - "learning_rate": 4.284189636470806e-06, - "loss": 2.311, - "step": 524300 - }, - { - "epoch": 0.91, - "learning_rate": 4.283317696543979e-06, - "loss": 2.1625, - "step": 524310 - }, - { - "epoch": 0.91, - "learning_rate": 4.282445756617153e-06, - "loss": 2.0859, - "step": 524320 - }, - { - "epoch": 0.91, - "learning_rate": 4.281573816690326e-06, - "loss": 2.2345, - "step": 524330 - }, - { - "epoch": 0.91, - "learning_rate": 4.2807018767634985e-06, - "loss": 2.3011, - "step": 524340 - }, - { - "epoch": 0.91, - "learning_rate": 4.279829936836672e-06, - "loss": 2.2709, - "step": 524350 - }, - { - "epoch": 0.91, - "learning_rate": 4.278957996909845e-06, - "loss": 2.3174, - "step": 524360 - }, - { - "epoch": 0.91, - "learning_rate": 4.278086056983018e-06, - "loss": 2.2861, - "step": 524370 - }, - { - "epoch": 0.91, - "learning_rate": 4.277214117056191e-06, - "loss": 2.2127, - "step": 524380 - }, - { - "epoch": 0.91, - "learning_rate": 4.276342177129365e-06, - "loss": 2.3079, - "step": 524390 - }, - { - "epoch": 0.91, - "learning_rate": 4.275470237202538e-06, - "loss": 2.1626, - "step": 524400 - }, - { - "epoch": 0.91, - "learning_rate": 4.274598297275711e-06, - "loss": 2.237, - "step": 524410 - }, - { - "epoch": 0.91, - "learning_rate": 4.2737263573488845e-06, - "loss": 2.1662, - "step": 524420 - }, - { - "epoch": 0.91, - "learning_rate": 4.272854417422057e-06, - "loss": 2.2173, - "step": 524430 - }, - { - "epoch": 0.91, - "learning_rate": 4.271982477495231e-06, - "loss": 2.217, - "step": 524440 - }, - { - "epoch": 0.91, - "learning_rate": 4.271110537568404e-06, - "loss": 2.2995, - "step": 524450 - }, - { - "epoch": 0.91, - "learning_rate": 4.270238597641577e-06, - "loss": 2.2609, - "step": 524460 - }, - { - "epoch": 0.91, - "learning_rate": 4.269366657714751e-06, - "loss": 2.3309, - "step": 524470 - }, - { - "epoch": 0.91, - "learning_rate": 4.268494717787924e-06, - "loss": 2.2072, - "step": 524480 - }, - { - "epoch": 0.91, - "learning_rate": 4.267622777861097e-06, - "loss": 2.269, - "step": 524490 - }, - { - "epoch": 0.91, - "learning_rate": 4.2667508379342695e-06, - "loss": 2.292, - "step": 524500 - }, - { - "epoch": 0.91, - "learning_rate": 4.265878898007443e-06, - "loss": 2.3779, - "step": 524510 - }, - { - "epoch": 0.91, - "learning_rate": 4.265006958080616e-06, - "loss": 2.2087, - "step": 524520 - }, - { - "epoch": 0.91, - "learning_rate": 4.264135018153789e-06, - "loss": 2.2291, - "step": 524530 - }, - { - "epoch": 0.91, - "learning_rate": 4.263263078226962e-06, - "loss": 2.3039, - "step": 524540 - }, - { - "epoch": 0.91, - "learning_rate": 4.262391138300136e-06, - "loss": 2.3413, - "step": 524550 - }, - { - "epoch": 0.91, - "learning_rate": 4.26151919837331e-06, - "loss": 2.2534, - "step": 524560 - }, - { - "epoch": 0.91, - "learning_rate": 4.2606472584464825e-06, - "loss": 2.3304, - "step": 524570 - }, - { - "epoch": 0.91, - "learning_rate": 4.2597753185196555e-06, - "loss": 2.3653, - "step": 524580 - }, - { - "epoch": 0.91, - "learning_rate": 4.258903378592829e-06, - "loss": 2.2174, - "step": 524590 - }, - { - "epoch": 0.91, - "learning_rate": 4.258031438666002e-06, - "loss": 2.34, - "step": 524600 - }, - { - "epoch": 0.91, - "learning_rate": 4.257159498739175e-06, - "loss": 2.3092, - "step": 524610 - }, - { - "epoch": 0.91, - "learning_rate": 4.256287558812348e-06, - "loss": 2.1299, - "step": 524620 - }, - { - "epoch": 0.91, - "learning_rate": 4.255415618885522e-06, - "loss": 2.2581, - "step": 524630 - }, - { - "epoch": 0.91, - "learning_rate": 4.254543678958695e-06, - "loss": 2.2446, - "step": 524640 - }, - { - "epoch": 0.91, - "learning_rate": 4.253671739031868e-06, - "loss": 2.2705, - "step": 524650 - }, - { - "epoch": 0.91, - "learning_rate": 4.2527997991050405e-06, - "loss": 2.2663, - "step": 524660 - }, - { - "epoch": 0.91, - "learning_rate": 4.251927859178214e-06, - "loss": 2.2988, - "step": 524670 - }, - { - "epoch": 0.91, - "learning_rate": 4.251055919251387e-06, - "loss": 2.3314, - "step": 524680 - }, - { - "epoch": 0.91, - "learning_rate": 4.250183979324561e-06, - "loss": 2.2478, - "step": 524690 - }, - { - "epoch": 0.92, - "learning_rate": 4.249312039397734e-06, - "loss": 2.1767, - "step": 524700 - }, - { - "epoch": 0.92, - "learning_rate": 4.248440099470907e-06, - "loss": 2.2016, - "step": 524710 - }, - { - "epoch": 0.92, - "learning_rate": 4.247568159544081e-06, - "loss": 2.231, - "step": 524720 - }, - { - "epoch": 0.92, - "learning_rate": 4.2466962196172535e-06, - "loss": 2.1828, - "step": 524730 - }, - { - "epoch": 0.92, - "learning_rate": 4.2458242796904265e-06, - "loss": 2.2944, - "step": 524740 - }, - { - "epoch": 0.92, - "learning_rate": 4.2449523397636e-06, - "loss": 2.2231, - "step": 524750 - }, - { - "epoch": 0.92, - "learning_rate": 4.244080399836773e-06, - "loss": 2.2405, - "step": 524760 - }, - { - "epoch": 0.92, - "learning_rate": 4.243208459909946e-06, - "loss": 2.2625, - "step": 524770 - }, - { - "epoch": 0.92, - "learning_rate": 4.242336519983119e-06, - "loss": 2.2583, - "step": 524780 - }, - { - "epoch": 0.92, - "learning_rate": 4.241464580056293e-06, - "loss": 2.2856, - "step": 524790 - }, - { - "epoch": 0.92, - "learning_rate": 4.240592640129466e-06, - "loss": 2.3381, - "step": 524800 - }, - { - "epoch": 0.92, - "learning_rate": 4.239720700202639e-06, - "loss": 2.2116, - "step": 524810 - }, - { - "epoch": 0.92, - "learning_rate": 4.238848760275812e-06, - "loss": 2.2969, - "step": 524820 - }, - { - "epoch": 0.92, - "learning_rate": 4.237976820348985e-06, - "loss": 2.2277, - "step": 524830 - }, - { - "epoch": 0.92, - "learning_rate": 4.237104880422159e-06, - "loss": 2.2164, - "step": 524840 - }, - { - "epoch": 0.92, - "learning_rate": 4.236232940495332e-06, - "loss": 2.3616, - "step": 524850 - }, - { - "epoch": 0.92, - "learning_rate": 4.235361000568505e-06, - "loss": 2.2364, - "step": 524860 - }, - { - "epoch": 0.92, - "learning_rate": 4.234489060641679e-06, - "loss": 2.1789, - "step": 524870 - }, - { - "epoch": 0.92, - "learning_rate": 4.233617120714852e-06, - "loss": 2.303, - "step": 524880 - }, - { - "epoch": 0.92, - "learning_rate": 4.2327451807880245e-06, - "loss": 2.2831, - "step": 524890 - }, - { - "epoch": 0.92, - "learning_rate": 4.2318732408611975e-06, - "loss": 2.2216, - "step": 524900 - }, - { - "epoch": 0.92, - "learning_rate": 4.231001300934371e-06, - "loss": 2.3201, - "step": 524910 - }, - { - "epoch": 0.92, - "learning_rate": 4.230129361007544e-06, - "loss": 2.092, - "step": 524920 - }, - { - "epoch": 0.92, - "learning_rate": 4.229257421080717e-06, - "loss": 2.4244, - "step": 524930 - }, - { - "epoch": 0.92, - "learning_rate": 4.22838548115389e-06, - "loss": 2.1549, - "step": 524940 - }, - { - "epoch": 0.92, - "learning_rate": 4.227513541227064e-06, - "loss": 2.3095, - "step": 524950 - }, - { - "epoch": 0.92, - "learning_rate": 4.2266416013002375e-06, - "loss": 2.3141, - "step": 524960 - }, - { - "epoch": 0.92, - "learning_rate": 4.2257696613734105e-06, - "loss": 2.0473, - "step": 524970 - }, - { - "epoch": 0.92, - "learning_rate": 4.224897721446583e-06, - "loss": 2.2837, - "step": 524980 - }, - { - "epoch": 0.92, - "learning_rate": 4.224025781519757e-06, - "loss": 2.3068, - "step": 524990 - }, - { - "epoch": 0.92, - "learning_rate": 4.22315384159293e-06, - "loss": 2.1835, - "step": 525000 - }, - { - "epoch": 0.92, - "learning_rate": 4.222281901666103e-06, - "loss": 2.2447, - "step": 525010 - }, - { - "epoch": 0.92, - "learning_rate": 4.221409961739276e-06, - "loss": 2.3238, - "step": 525020 - }, - { - "epoch": 0.92, - "learning_rate": 4.22053802181245e-06, - "loss": 2.2, - "step": 525030 - }, - { - "epoch": 0.92, - "learning_rate": 4.219666081885623e-06, - "loss": 2.2723, - "step": 525040 - }, - { - "epoch": 0.92, - "learning_rate": 4.2187941419587955e-06, - "loss": 2.3285, - "step": 525050 - }, - { - "epoch": 0.92, - "learning_rate": 4.2179222020319685e-06, - "loss": 2.1688, - "step": 525060 - }, - { - "epoch": 0.92, - "learning_rate": 4.217050262105142e-06, - "loss": 2.2522, - "step": 525070 - }, - { - "epoch": 0.92, - "learning_rate": 4.216178322178315e-06, - "loss": 2.3372, - "step": 525080 - }, - { - "epoch": 0.92, - "learning_rate": 4.215306382251489e-06, - "loss": 2.1993, - "step": 525090 - }, - { - "epoch": 0.92, - "learning_rate": 4.214434442324662e-06, - "loss": 2.2811, - "step": 525100 - }, - { - "epoch": 0.92, - "learning_rate": 4.213562502397836e-06, - "loss": 2.2924, - "step": 525110 - }, - { - "epoch": 0.92, - "learning_rate": 4.2126905624710085e-06, - "loss": 2.1553, - "step": 525120 - }, - { - "epoch": 0.92, - "learning_rate": 4.2118186225441815e-06, - "loss": 2.3028, - "step": 525130 - }, - { - "epoch": 0.92, - "learning_rate": 4.210946682617354e-06, - "loss": 2.1805, - "step": 525140 - }, - { - "epoch": 0.92, - "learning_rate": 4.210074742690528e-06, - "loss": 2.2228, - "step": 525150 - }, - { - "epoch": 0.92, - "learning_rate": 4.209202802763701e-06, - "loss": 2.2988, - "step": 525160 - }, - { - "epoch": 0.92, - "learning_rate": 4.208330862836874e-06, - "loss": 2.2497, - "step": 525170 - }, - { - "epoch": 0.92, - "learning_rate": 4.207458922910047e-06, - "loss": 2.2429, - "step": 525180 - }, - { - "epoch": 0.92, - "learning_rate": 4.206586982983221e-06, - "loss": 2.3436, - "step": 525190 - }, - { - "epoch": 0.92, - "learning_rate": 4.205715043056394e-06, - "loss": 2.3538, - "step": 525200 - }, - { - "epoch": 0.92, - "learning_rate": 4.2048431031295665e-06, - "loss": 2.2119, - "step": 525210 - }, - { - "epoch": 0.92, - "learning_rate": 4.20397116320274e-06, - "loss": 2.3014, - "step": 525220 - }, - { - "epoch": 0.92, - "learning_rate": 4.203099223275914e-06, - "loss": 2.0969, - "step": 525230 - }, - { - "epoch": 0.92, - "learning_rate": 4.202227283349087e-06, - "loss": 2.2711, - "step": 525240 - }, - { - "epoch": 0.92, - "learning_rate": 4.20135534342226e-06, - "loss": 2.3631, - "step": 525250 - }, - { - "epoch": 0.92, - "learning_rate": 4.200483403495433e-06, - "loss": 2.1742, - "step": 525260 - }, - { - "epoch": 0.92, - "learning_rate": 4.199611463568607e-06, - "loss": 2.2525, - "step": 525270 - }, - { - "epoch": 0.92, - "learning_rate": 4.1987395236417795e-06, - "loss": 2.3417, - "step": 525280 - }, - { - "epoch": 0.92, - "learning_rate": 4.1978675837149525e-06, - "loss": 2.1182, - "step": 525290 - }, - { - "epoch": 0.92, - "learning_rate": 4.196995643788125e-06, - "loss": 2.2201, - "step": 525300 - }, - { - "epoch": 0.92, - "learning_rate": 4.196123703861299e-06, - "loss": 2.3397, - "step": 525310 - }, - { - "epoch": 0.92, - "learning_rate": 4.195251763934472e-06, - "loss": 2.2416, - "step": 525320 - }, - { - "epoch": 0.92, - "learning_rate": 4.194379824007645e-06, - "loss": 2.2389, - "step": 525330 - }, - { - "epoch": 0.92, - "learning_rate": 4.193507884080818e-06, - "loss": 2.2053, - "step": 525340 - }, - { - "epoch": 0.92, - "learning_rate": 4.192635944153992e-06, - "loss": 2.3344, - "step": 525350 - }, - { - "epoch": 0.92, - "learning_rate": 4.1917640042271655e-06, - "loss": 2.1932, - "step": 525360 - }, - { - "epoch": 0.92, - "learning_rate": 4.190892064300338e-06, - "loss": 2.2534, - "step": 525370 - }, - { - "epoch": 0.92, - "learning_rate": 4.190020124373511e-06, - "loss": 2.2061, - "step": 525380 - }, - { - "epoch": 0.92, - "learning_rate": 4.189148184446685e-06, - "loss": 2.388, - "step": 525390 - }, - { - "epoch": 0.92, - "learning_rate": 4.188276244519858e-06, - "loss": 2.2649, - "step": 525400 - }, - { - "epoch": 0.92, - "learning_rate": 4.187404304593031e-06, - "loss": 2.3011, - "step": 525410 - }, - { - "epoch": 0.92, - "learning_rate": 4.186532364666204e-06, - "loss": 2.2205, - "step": 525420 - }, - { - "epoch": 0.92, - "learning_rate": 4.185660424739378e-06, - "loss": 2.3215, - "step": 525430 - }, - { - "epoch": 0.92, - "learning_rate": 4.1847884848125505e-06, - "loss": 2.1708, - "step": 525440 - }, - { - "epoch": 0.92, - "learning_rate": 4.1839165448857235e-06, - "loss": 2.2485, - "step": 525450 - }, - { - "epoch": 0.92, - "learning_rate": 4.183044604958896e-06, - "loss": 2.1665, - "step": 525460 - }, - { - "epoch": 0.92, - "learning_rate": 4.18217266503207e-06, - "loss": 2.2526, - "step": 525470 - }, - { - "epoch": 0.92, - "learning_rate": 4.181300725105243e-06, - "loss": 2.2074, - "step": 525480 - }, - { - "epoch": 0.92, - "learning_rate": 4.180428785178417e-06, - "loss": 2.2847, - "step": 525490 - }, - { - "epoch": 0.92, - "learning_rate": 4.17955684525159e-06, - "loss": 2.2469, - "step": 525500 - }, - { - "epoch": 0.92, - "learning_rate": 4.1786849053247635e-06, - "loss": 2.2725, - "step": 525510 - }, - { - "epoch": 0.92, - "learning_rate": 4.1778129653979365e-06, - "loss": 2.3005, - "step": 525520 - }, - { - "epoch": 0.92, - "learning_rate": 4.176941025471109e-06, - "loss": 2.204, - "step": 525530 - }, - { - "epoch": 0.92, - "learning_rate": 4.176069085544282e-06, - "loss": 2.3262, - "step": 525540 - }, - { - "epoch": 0.92, - "learning_rate": 4.175197145617456e-06, - "loss": 2.2414, - "step": 525550 - }, - { - "epoch": 0.92, - "learning_rate": 4.174325205690629e-06, - "loss": 2.304, - "step": 525560 - }, - { - "epoch": 0.92, - "learning_rate": 4.173453265763802e-06, - "loss": 2.359, - "step": 525570 - }, - { - "epoch": 0.92, - "learning_rate": 4.172581325836975e-06, - "loss": 2.3795, - "step": 525580 - }, - { - "epoch": 0.92, - "learning_rate": 4.171709385910149e-06, - "loss": 2.2151, - "step": 525590 - }, - { - "epoch": 0.92, - "learning_rate": 4.1708374459833215e-06, - "loss": 2.1345, - "step": 525600 - }, - { - "epoch": 0.92, - "learning_rate": 4.1699655060564945e-06, - "loss": 2.1767, - "step": 525610 - }, - { - "epoch": 0.92, - "learning_rate": 4.169093566129668e-06, - "loss": 2.2723, - "step": 525620 - }, - { - "epoch": 0.92, - "learning_rate": 4.168221626202842e-06, - "loss": 2.3386, - "step": 525630 - }, - { - "epoch": 0.92, - "learning_rate": 4.167349686276015e-06, - "loss": 2.3171, - "step": 525640 - }, - { - "epoch": 0.92, - "learning_rate": 4.166477746349188e-06, - "loss": 2.1866, - "step": 525650 - }, - { - "epoch": 0.92, - "learning_rate": 4.165605806422361e-06, - "loss": 2.3122, - "step": 525660 - }, - { - "epoch": 0.92, - "learning_rate": 4.1647338664955345e-06, - "loss": 2.2578, - "step": 525670 - }, - { - "epoch": 0.92, - "learning_rate": 4.1638619265687075e-06, - "loss": 2.3011, - "step": 525680 - }, - { - "epoch": 0.92, - "learning_rate": 4.16298998664188e-06, - "loss": 2.2281, - "step": 525690 - }, - { - "epoch": 0.92, - "learning_rate": 4.162118046715053e-06, - "loss": 2.2919, - "step": 525700 - }, - { - "epoch": 0.92, - "learning_rate": 4.161246106788227e-06, - "loss": 2.2264, - "step": 525710 - }, - { - "epoch": 0.92, - "learning_rate": 4.1603741668614e-06, - "loss": 2.2879, - "step": 525720 - }, - { - "epoch": 0.92, - "learning_rate": 4.159502226934573e-06, - "loss": 2.234, - "step": 525730 - }, - { - "epoch": 0.92, - "learning_rate": 4.158630287007746e-06, - "loss": 2.1407, - "step": 525740 - }, - { - "epoch": 0.92, - "learning_rate": 4.1577583470809205e-06, - "loss": 2.2943, - "step": 525750 - }, - { - "epoch": 0.92, - "learning_rate": 4.156886407154093e-06, - "loss": 2.275, - "step": 525760 - }, - { - "epoch": 0.92, - "learning_rate": 4.156014467227266e-06, - "loss": 2.2766, - "step": 525770 - }, - { - "epoch": 0.92, - "learning_rate": 4.155142527300439e-06, - "loss": 2.3296, - "step": 525780 - }, - { - "epoch": 0.92, - "learning_rate": 4.154270587373613e-06, - "loss": 2.2534, - "step": 525790 - }, - { - "epoch": 0.92, - "learning_rate": 4.153398647446786e-06, - "loss": 2.2264, - "step": 525800 - }, - { - "epoch": 0.92, - "learning_rate": 4.152526707519959e-06, - "loss": 2.2127, - "step": 525810 - }, - { - "epoch": 0.92, - "learning_rate": 4.151654767593132e-06, - "loss": 2.2569, - "step": 525820 - }, - { - "epoch": 0.92, - "learning_rate": 4.1507828276663055e-06, - "loss": 2.3557, - "step": 525830 - }, - { - "epoch": 0.92, - "learning_rate": 4.1499108877394785e-06, - "loss": 2.2681, - "step": 525840 - }, - { - "epoch": 0.92, - "learning_rate": 4.149038947812651e-06, - "loss": 2.2359, - "step": 525850 - }, - { - "epoch": 0.92, - "learning_rate": 4.148167007885824e-06, - "loss": 2.2085, - "step": 525860 - }, - { - "epoch": 0.92, - "learning_rate": 4.147295067958998e-06, - "loss": 2.1686, - "step": 525870 - }, - { - "epoch": 0.92, - "learning_rate": 4.146423128032171e-06, - "loss": 2.3166, - "step": 525880 - }, - { - "epoch": 0.92, - "learning_rate": 4.145551188105345e-06, - "loss": 2.2383, - "step": 525890 - }, - { - "epoch": 0.92, - "learning_rate": 4.144679248178518e-06, - "loss": 2.1974, - "step": 525900 - }, - { - "epoch": 0.92, - "learning_rate": 4.1438073082516915e-06, - "loss": 2.2717, - "step": 525910 - }, - { - "epoch": 0.92, - "learning_rate": 4.142935368324864e-06, - "loss": 2.2326, - "step": 525920 - }, - { - "epoch": 0.92, - "learning_rate": 4.142063428398037e-06, - "loss": 2.2403, - "step": 525930 - }, - { - "epoch": 0.92, - "learning_rate": 4.14119148847121e-06, - "loss": 2.2045, - "step": 525940 - }, - { - "epoch": 0.92, - "learning_rate": 4.140319548544384e-06, - "loss": 2.2893, - "step": 525950 - }, - { - "epoch": 0.92, - "learning_rate": 4.139447608617557e-06, - "loss": 2.2702, - "step": 525960 - }, - { - "epoch": 0.92, - "learning_rate": 4.13857566869073e-06, - "loss": 2.3295, - "step": 525970 - }, - { - "epoch": 0.92, - "learning_rate": 4.137703728763903e-06, - "loss": 2.219, - "step": 525980 - }, - { - "epoch": 0.92, - "learning_rate": 4.1368317888370765e-06, - "loss": 2.2874, - "step": 525990 - }, - { - "epoch": 0.92, - "learning_rate": 4.1359598489102495e-06, - "loss": 2.2038, - "step": 526000 - }, - { - "epoch": 0.92, - "learning_rate": 4.135087908983422e-06, - "loss": 2.3248, - "step": 526010 - }, - { - "epoch": 0.92, - "learning_rate": 4.134215969056596e-06, - "loss": 2.164, - "step": 526020 - }, - { - "epoch": 0.92, - "learning_rate": 4.13334402912977e-06, - "loss": 2.3733, - "step": 526030 - }, - { - "epoch": 0.92, - "learning_rate": 4.132472089202943e-06, - "loss": 2.1867, - "step": 526040 - }, - { - "epoch": 0.92, - "learning_rate": 4.131600149276116e-06, - "loss": 2.2794, - "step": 526050 - }, - { - "epoch": 0.92, - "learning_rate": 4.130728209349289e-06, - "loss": 2.2505, - "step": 526060 - }, - { - "epoch": 0.92, - "learning_rate": 4.1298562694224625e-06, - "loss": 2.2821, - "step": 526070 - }, - { - "epoch": 0.92, - "learning_rate": 4.128984329495635e-06, - "loss": 2.2083, - "step": 526080 - }, - { - "epoch": 0.92, - "learning_rate": 4.128112389568808e-06, - "loss": 2.1228, - "step": 526090 - }, - { - "epoch": 0.92, - "learning_rate": 4.127240449641981e-06, - "loss": 2.2392, - "step": 526100 - }, - { - "epoch": 0.92, - "learning_rate": 4.126368509715155e-06, - "loss": 2.2093, - "step": 526110 - }, - { - "epoch": 0.92, - "learning_rate": 4.125496569788328e-06, - "loss": 2.2158, - "step": 526120 - }, - { - "epoch": 0.92, - "learning_rate": 4.124624629861501e-06, - "loss": 2.2944, - "step": 526130 - }, - { - "epoch": 0.92, - "learning_rate": 4.123752689934674e-06, - "loss": 2.1447, - "step": 526140 - }, - { - "epoch": 0.92, - "learning_rate": 4.122880750007848e-06, - "loss": 2.377, - "step": 526150 - }, - { - "epoch": 0.92, - "learning_rate": 4.122008810081021e-06, - "loss": 2.2488, - "step": 526160 - }, - { - "epoch": 0.92, - "learning_rate": 4.121136870154194e-06, - "loss": 2.2675, - "step": 526170 - }, - { - "epoch": 0.92, - "learning_rate": 4.120264930227367e-06, - "loss": 2.309, - "step": 526180 - }, - { - "epoch": 0.92, - "learning_rate": 4.119392990300541e-06, - "loss": 2.2725, - "step": 526190 - }, - { - "epoch": 0.92, - "learning_rate": 4.118521050373714e-06, - "loss": 2.2767, - "step": 526200 - }, - { - "epoch": 0.92, - "learning_rate": 4.117649110446887e-06, - "loss": 2.3226, - "step": 526210 - }, - { - "epoch": 0.92, - "learning_rate": 4.11677717052006e-06, - "loss": 2.307, - "step": 526220 - }, - { - "epoch": 0.92, - "learning_rate": 4.1159052305932335e-06, - "loss": 2.3517, - "step": 526230 - }, - { - "epoch": 0.92, - "learning_rate": 4.115033290666406e-06, - "loss": 2.1607, - "step": 526240 - }, - { - "epoch": 0.92, - "learning_rate": 4.114161350739579e-06, - "loss": 2.2584, - "step": 526250 - }, - { - "epoch": 0.92, - "learning_rate": 4.113289410812752e-06, - "loss": 2.2097, - "step": 526260 - }, - { - "epoch": 0.92, - "learning_rate": 4.112417470885926e-06, - "loss": 2.335, - "step": 526270 - }, - { - "epoch": 0.92, - "learning_rate": 4.1115455309591e-06, - "loss": 2.2114, - "step": 526280 - }, - { - "epoch": 0.92, - "learning_rate": 4.110673591032273e-06, - "loss": 2.1757, - "step": 526290 - }, - { - "epoch": 0.92, - "learning_rate": 4.109801651105446e-06, - "loss": 2.2542, - "step": 526300 - }, - { - "epoch": 0.92, - "learning_rate": 4.108929711178619e-06, - "loss": 2.3363, - "step": 526310 - }, - { - "epoch": 0.92, - "learning_rate": 4.108057771251792e-06, - "loss": 2.2447, - "step": 526320 - }, - { - "epoch": 0.92, - "learning_rate": 4.107185831324965e-06, - "loss": 2.2973, - "step": 526330 - }, - { - "epoch": 0.92, - "learning_rate": 4.106313891398138e-06, - "loss": 2.2709, - "step": 526340 - }, - { - "epoch": 0.92, - "learning_rate": 4.105441951471312e-06, - "loss": 2.3695, - "step": 526350 - }, - { - "epoch": 0.92, - "learning_rate": 4.104570011544485e-06, - "loss": 2.3727, - "step": 526360 - }, - { - "epoch": 0.92, - "learning_rate": 4.103698071617658e-06, - "loss": 2.1751, - "step": 526370 - }, - { - "epoch": 0.92, - "learning_rate": 4.102826131690831e-06, - "loss": 2.3086, - "step": 526380 - }, - { - "epoch": 0.92, - "learning_rate": 4.1019541917640045e-06, - "loss": 2.3918, - "step": 526390 - }, - { - "epoch": 0.92, - "learning_rate": 4.101082251837177e-06, - "loss": 2.2846, - "step": 526400 - }, - { - "epoch": 0.92, - "learning_rate": 4.10021031191035e-06, - "loss": 2.183, - "step": 526410 - }, - { - "epoch": 0.92, - "learning_rate": 4.099338371983524e-06, - "loss": 2.2612, - "step": 526420 - }, - { - "epoch": 0.92, - "learning_rate": 4.098466432056698e-06, - "loss": 2.281, - "step": 526430 - }, - { - "epoch": 0.92, - "learning_rate": 4.097594492129871e-06, - "loss": 2.2789, - "step": 526440 - }, - { - "epoch": 0.92, - "learning_rate": 4.096722552203044e-06, - "loss": 2.3434, - "step": 526450 - }, - { - "epoch": 0.92, - "learning_rate": 4.095850612276217e-06, - "loss": 2.3214, - "step": 526460 - }, - { - "epoch": 0.92, - "learning_rate": 4.09497867234939e-06, - "loss": 2.2796, - "step": 526470 - }, - { - "epoch": 0.92, - "learning_rate": 4.094106732422563e-06, - "loss": 2.2638, - "step": 526480 - }, - { - "epoch": 0.92, - "learning_rate": 4.093234792495736e-06, - "loss": 2.1996, - "step": 526490 - }, - { - "epoch": 0.92, - "learning_rate": 4.092362852568909e-06, - "loss": 2.2768, - "step": 526500 - }, - { - "epoch": 0.92, - "learning_rate": 4.091490912642083e-06, - "loss": 2.1659, - "step": 526510 - }, - { - "epoch": 0.92, - "learning_rate": 4.090618972715256e-06, - "loss": 2.2286, - "step": 526520 - }, - { - "epoch": 0.92, - "learning_rate": 4.089747032788429e-06, - "loss": 2.1999, - "step": 526530 - }, - { - "epoch": 0.92, - "learning_rate": 4.088875092861602e-06, - "loss": 2.2197, - "step": 526540 - }, - { - "epoch": 0.92, - "learning_rate": 4.088003152934776e-06, - "loss": 2.3097, - "step": 526550 - }, - { - "epoch": 0.92, - "learning_rate": 4.087131213007949e-06, - "loss": 2.3029, - "step": 526560 - }, - { - "epoch": 0.92, - "learning_rate": 4.086259273081122e-06, - "loss": 2.2483, - "step": 526570 - }, - { - "epoch": 0.92, - "learning_rate": 4.085387333154295e-06, - "loss": 2.2688, - "step": 526580 - }, - { - "epoch": 0.92, - "learning_rate": 4.084515393227469e-06, - "loss": 2.3244, - "step": 526590 - }, - { - "epoch": 0.92, - "learning_rate": 4.083643453300642e-06, - "loss": 2.2282, - "step": 526600 - }, - { - "epoch": 0.92, - "learning_rate": 4.082771513373815e-06, - "loss": 2.2642, - "step": 526610 - }, - { - "epoch": 0.92, - "learning_rate": 4.081899573446988e-06, - "loss": 2.3301, - "step": 526620 - }, - { - "epoch": 0.92, - "learning_rate": 4.081027633520161e-06, - "loss": 2.1841, - "step": 526630 - }, - { - "epoch": 0.92, - "learning_rate": 4.080155693593334e-06, - "loss": 2.1505, - "step": 526640 - }, - { - "epoch": 0.92, - "learning_rate": 4.079283753666507e-06, - "loss": 2.1908, - "step": 526650 - }, - { - "epoch": 0.92, - "learning_rate": 4.07841181373968e-06, - "loss": 2.2076, - "step": 526660 - }, - { - "epoch": 0.92, - "learning_rate": 4.077539873812854e-06, - "loss": 2.3354, - "step": 526670 - }, - { - "epoch": 0.92, - "learning_rate": 4.076667933886028e-06, - "loss": 2.2379, - "step": 526680 - }, - { - "epoch": 0.92, - "learning_rate": 4.075795993959201e-06, - "loss": 2.275, - "step": 526690 - }, - { - "epoch": 0.92, - "learning_rate": 4.0749240540323736e-06, - "loss": 2.1511, - "step": 526700 - }, - { - "epoch": 0.92, - "learning_rate": 4.074052114105547e-06, - "loss": 2.3195, - "step": 526710 - }, - { - "epoch": 0.92, - "learning_rate": 4.07318017417872e-06, - "loss": 2.1612, - "step": 526720 - }, - { - "epoch": 0.92, - "learning_rate": 4.072308234251893e-06, - "loss": 2.3068, - "step": 526730 - }, - { - "epoch": 0.92, - "learning_rate": 4.071436294325066e-06, - "loss": 2.3423, - "step": 526740 - }, - { - "epoch": 0.92, - "learning_rate": 4.07056435439824e-06, - "loss": 2.1899, - "step": 526750 - }, - { - "epoch": 0.92, - "learning_rate": 4.069692414471413e-06, - "loss": 2.241, - "step": 526760 - }, - { - "epoch": 0.92, - "learning_rate": 4.068820474544586e-06, - "loss": 2.2165, - "step": 526770 - }, - { - "epoch": 0.92, - "learning_rate": 4.067948534617759e-06, - "loss": 2.2441, - "step": 526780 - }, - { - "epoch": 0.92, - "learning_rate": 4.067076594690932e-06, - "loss": 2.3173, - "step": 526790 - }, - { - "epoch": 0.92, - "learning_rate": 4.066204654764105e-06, - "loss": 2.3008, - "step": 526800 - }, - { - "epoch": 0.92, - "learning_rate": 4.065332714837278e-06, - "loss": 2.1971, - "step": 526810 - }, - { - "epoch": 0.92, - "learning_rate": 4.064460774910452e-06, - "loss": 2.2885, - "step": 526820 - }, - { - "epoch": 0.92, - "learning_rate": 4.063588834983626e-06, - "loss": 2.2869, - "step": 526830 - }, - { - "epoch": 0.92, - "learning_rate": 4.062716895056799e-06, - "loss": 2.2346, - "step": 526840 - }, - { - "epoch": 0.92, - "learning_rate": 4.061844955129972e-06, - "loss": 2.2611, - "step": 526850 - }, - { - "epoch": 0.92, - "learning_rate": 4.0609730152031446e-06, - "loss": 2.2892, - "step": 526860 - }, - { - "epoch": 0.92, - "learning_rate": 4.060101075276318e-06, - "loss": 2.2345, - "step": 526870 - }, - { - "epoch": 0.92, - "learning_rate": 4.059229135349491e-06, - "loss": 2.1319, - "step": 526880 - }, - { - "epoch": 0.92, - "learning_rate": 4.058357195422664e-06, - "loss": 2.2496, - "step": 526890 - }, - { - "epoch": 0.92, - "learning_rate": 4.057485255495837e-06, - "loss": 2.2792, - "step": 526900 - }, - { - "epoch": 0.92, - "learning_rate": 4.056613315569011e-06, - "loss": 2.3585, - "step": 526910 - }, - { - "epoch": 0.92, - "learning_rate": 4.055741375642184e-06, - "loss": 2.2754, - "step": 526920 - }, - { - "epoch": 0.92, - "learning_rate": 4.054869435715357e-06, - "loss": 2.239, - "step": 526930 - }, - { - "epoch": 0.92, - "learning_rate": 4.05399749578853e-06, - "loss": 2.339, - "step": 526940 - }, - { - "epoch": 0.92, - "learning_rate": 4.053125555861704e-06, - "loss": 2.3632, - "step": 526950 - }, - { - "epoch": 0.92, - "learning_rate": 4.052253615934877e-06, - "loss": 2.2536, - "step": 526960 - }, - { - "epoch": 0.92, - "learning_rate": 4.05138167600805e-06, - "loss": 2.2613, - "step": 526970 - }, - { - "epoch": 0.92, - "learning_rate": 4.050509736081223e-06, - "loss": 2.3474, - "step": 526980 - }, - { - "epoch": 0.92, - "learning_rate": 4.049637796154397e-06, - "loss": 2.2979, - "step": 526990 - }, - { - "epoch": 0.92, - "learning_rate": 4.04876585622757e-06, - "loss": 2.2537, - "step": 527000 - }, - { - "epoch": 0.92, - "learning_rate": 4.047893916300743e-06, - "loss": 2.3303, - "step": 527010 - }, - { - "epoch": 0.92, - "learning_rate": 4.0470219763739156e-06, - "loss": 2.3239, - "step": 527020 - }, - { - "epoch": 0.92, - "learning_rate": 4.046150036447089e-06, - "loss": 2.2694, - "step": 527030 - }, - { - "epoch": 0.92, - "learning_rate": 4.045278096520262e-06, - "loss": 2.2977, - "step": 527040 - }, - { - "epoch": 0.92, - "learning_rate": 4.044406156593435e-06, - "loss": 2.2209, - "step": 527050 - }, - { - "epoch": 0.92, - "learning_rate": 4.043534216666608e-06, - "loss": 2.2043, - "step": 527060 - }, - { - "epoch": 0.92, - "learning_rate": 4.042662276739782e-06, - "loss": 2.2195, - "step": 527070 - }, - { - "epoch": 0.92, - "learning_rate": 4.041790336812956e-06, - "loss": 2.2269, - "step": 527080 - }, - { - "epoch": 0.92, - "learning_rate": 4.0409183968861286e-06, - "loss": 2.4366, - "step": 527090 - }, - { - "epoch": 0.92, - "learning_rate": 4.0400464569593015e-06, - "loss": 2.2583, - "step": 527100 - }, - { - "epoch": 0.92, - "learning_rate": 4.039174517032475e-06, - "loss": 2.2263, - "step": 527110 - }, - { - "epoch": 0.92, - "learning_rate": 4.038302577105648e-06, - "loss": 2.2255, - "step": 527120 - }, - { - "epoch": 0.92, - "learning_rate": 4.037430637178821e-06, - "loss": 2.3571, - "step": 527130 - }, - { - "epoch": 0.92, - "learning_rate": 4.036558697251994e-06, - "loss": 2.2686, - "step": 527140 - }, - { - "epoch": 0.92, - "learning_rate": 4.035686757325168e-06, - "loss": 2.1992, - "step": 527150 - }, - { - "epoch": 0.92, - "learning_rate": 4.034814817398341e-06, - "loss": 2.2058, - "step": 527160 - }, - { - "epoch": 0.92, - "learning_rate": 4.033942877471514e-06, - "loss": 2.3167, - "step": 527170 - }, - { - "epoch": 0.92, - "learning_rate": 4.0330709375446866e-06, - "loss": 2.2181, - "step": 527180 - }, - { - "epoch": 0.92, - "learning_rate": 4.03219899761786e-06, - "loss": 2.2527, - "step": 527190 - }, - { - "epoch": 0.92, - "learning_rate": 4.031327057691033e-06, - "loss": 2.191, - "step": 527200 - }, - { - "epoch": 0.92, - "learning_rate": 4.030455117764206e-06, - "loss": 2.2868, - "step": 527210 - }, - { - "epoch": 0.92, - "learning_rate": 4.02958317783738e-06, - "loss": 2.3074, - "step": 527220 - }, - { - "epoch": 0.92, - "learning_rate": 4.028711237910554e-06, - "loss": 2.2522, - "step": 527230 - }, - { - "epoch": 0.92, - "learning_rate": 4.027839297983727e-06, - "loss": 2.2763, - "step": 527240 - }, - { - "epoch": 0.92, - "learning_rate": 4.0269673580568996e-06, - "loss": 2.2701, - "step": 527250 - }, - { - "epoch": 0.92, - "learning_rate": 4.0260954181300725e-06, - "loss": 2.34, - "step": 527260 - }, - { - "epoch": 0.92, - "learning_rate": 4.025223478203246e-06, - "loss": 2.1928, - "step": 527270 - }, - { - "epoch": 0.92, - "learning_rate": 4.024351538276419e-06, - "loss": 2.2227, - "step": 527280 - }, - { - "epoch": 0.92, - "learning_rate": 4.023479598349592e-06, - "loss": 2.2964, - "step": 527290 - }, - { - "epoch": 0.92, - "learning_rate": 4.022607658422765e-06, - "loss": 2.3117, - "step": 527300 - }, - { - "epoch": 0.92, - "learning_rate": 4.021735718495939e-06, - "loss": 2.1696, - "step": 527310 - }, - { - "epoch": 0.92, - "learning_rate": 4.020863778569112e-06, - "loss": 2.2097, - "step": 527320 - }, - { - "epoch": 0.92, - "learning_rate": 4.019991838642285e-06, - "loss": 2.2953, - "step": 527330 - }, - { - "epoch": 0.92, - "learning_rate": 4.0191198987154576e-06, - "loss": 2.228, - "step": 527340 - }, - { - "epoch": 0.92, - "learning_rate": 4.018247958788632e-06, - "loss": 2.3049, - "step": 527350 - }, - { - "epoch": 0.92, - "learning_rate": 4.017376018861805e-06, - "loss": 2.3029, - "step": 527360 - }, - { - "epoch": 0.92, - "learning_rate": 4.016504078934978e-06, - "loss": 2.2321, - "step": 527370 - }, - { - "epoch": 0.92, - "learning_rate": 4.015632139008151e-06, - "loss": 2.3452, - "step": 527380 - }, - { - "epoch": 0.92, - "learning_rate": 4.014760199081325e-06, - "loss": 2.2498, - "step": 527390 - }, - { - "epoch": 0.92, - "learning_rate": 4.013888259154498e-06, - "loss": 2.339, - "step": 527400 - }, - { - "epoch": 0.92, - "learning_rate": 4.0130163192276706e-06, - "loss": 2.2688, - "step": 527410 - }, - { - "epoch": 0.92, - "learning_rate": 4.0121443793008435e-06, - "loss": 2.2345, - "step": 527420 - }, - { - "epoch": 0.92, - "learning_rate": 4.011272439374017e-06, - "loss": 2.2583, - "step": 527430 - }, - { - "epoch": 0.92, - "learning_rate": 4.01040049944719e-06, - "loss": 2.3136, - "step": 527440 - }, - { - "epoch": 0.92, - "learning_rate": 4.009528559520363e-06, - "loss": 2.3222, - "step": 527450 - }, - { - "epoch": 0.92, - "learning_rate": 4.008656619593536e-06, - "loss": 2.1823, - "step": 527460 - }, - { - "epoch": 0.92, - "learning_rate": 4.00778467966671e-06, - "loss": 2.2457, - "step": 527470 - }, - { - "epoch": 0.92, - "learning_rate": 4.0069127397398836e-06, - "loss": 2.3609, - "step": 527480 - }, - { - "epoch": 0.92, - "learning_rate": 4.0060407998130565e-06, - "loss": 2.2309, - "step": 527490 - }, - { - "epoch": 0.92, - "learning_rate": 4.005168859886229e-06, - "loss": 2.3113, - "step": 527500 - }, - { - "epoch": 0.92, - "learning_rate": 4.004296919959403e-06, - "loss": 2.3069, - "step": 527510 - }, - { - "epoch": 0.92, - "learning_rate": 4.003424980032576e-06, - "loss": 2.2096, - "step": 527520 - }, - { - "epoch": 0.92, - "learning_rate": 4.002553040105749e-06, - "loss": 2.1956, - "step": 527530 - }, - { - "epoch": 0.92, - "learning_rate": 4.001681100178922e-06, - "loss": 2.2356, - "step": 527540 - }, - { - "epoch": 0.92, - "learning_rate": 4.000809160252096e-06, - "loss": 2.2159, - "step": 527550 - }, - { - "epoch": 0.92, - "learning_rate": 3.999937220325269e-06, - "loss": 2.2556, - "step": 527560 - }, - { - "epoch": 0.92, - "learning_rate": 3.9990652803984416e-06, - "loss": 2.3314, - "step": 527570 - }, - { - "epoch": 0.92, - "learning_rate": 3.9981933404716145e-06, - "loss": 2.3466, - "step": 527580 - }, - { - "epoch": 0.92, - "learning_rate": 3.997321400544788e-06, - "loss": 2.2307, - "step": 527590 - }, - { - "epoch": 0.92, - "learning_rate": 3.996449460617961e-06, - "loss": 2.2271, - "step": 527600 - }, - { - "epoch": 0.92, - "learning_rate": 3.995577520691135e-06, - "loss": 2.3454, - "step": 527610 - }, - { - "epoch": 0.92, - "learning_rate": 3.994705580764308e-06, - "loss": 2.2227, - "step": 527620 - }, - { - "epoch": 0.92, - "learning_rate": 3.993833640837482e-06, - "loss": 2.2691, - "step": 527630 - }, - { - "epoch": 0.92, - "learning_rate": 3.9929617009106546e-06, - "loss": 2.2316, - "step": 527640 - }, - { - "epoch": 0.92, - "learning_rate": 3.9920897609838275e-06, - "loss": 2.2441, - "step": 527650 - }, - { - "epoch": 0.92, - "learning_rate": 3.991217821057e-06, - "loss": 2.2461, - "step": 527660 - }, - { - "epoch": 0.92, - "learning_rate": 3.990345881130174e-06, - "loss": 2.2502, - "step": 527670 - }, - { - "epoch": 0.92, - "learning_rate": 3.989473941203347e-06, - "loss": 2.2748, - "step": 527680 - }, - { - "epoch": 0.92, - "learning_rate": 3.98860200127652e-06, - "loss": 2.2449, - "step": 527690 - }, - { - "epoch": 0.92, - "learning_rate": 3.987730061349693e-06, - "loss": 2.2761, - "step": 527700 - }, - { - "epoch": 0.92, - "learning_rate": 3.986858121422867e-06, - "loss": 2.2865, - "step": 527710 - }, - { - "epoch": 0.92, - "learning_rate": 3.98598618149604e-06, - "loss": 2.2278, - "step": 527720 - }, - { - "epoch": 0.92, - "learning_rate": 3.9851142415692126e-06, - "loss": 2.2691, - "step": 527730 - }, - { - "epoch": 0.92, - "learning_rate": 3.9842423016423855e-06, - "loss": 2.254, - "step": 527740 - }, - { - "epoch": 0.92, - "learning_rate": 3.98337036171556e-06, - "loss": 2.2851, - "step": 527750 - }, - { - "epoch": 0.92, - "learning_rate": 3.982498421788733e-06, - "loss": 2.2058, - "step": 527760 - }, - { - "epoch": 0.92, - "learning_rate": 3.981626481861906e-06, - "loss": 2.385, - "step": 527770 - }, - { - "epoch": 0.92, - "learning_rate": 3.980754541935079e-06, - "loss": 2.3016, - "step": 527780 - }, - { - "epoch": 0.92, - "learning_rate": 3.979882602008253e-06, - "loss": 2.2447, - "step": 527790 - }, - { - "epoch": 0.92, - "learning_rate": 3.9790106620814256e-06, - "loss": 2.3309, - "step": 527800 - }, - { - "epoch": 0.92, - "learning_rate": 3.9781387221545985e-06, - "loss": 2.3085, - "step": 527810 - }, - { - "epoch": 0.92, - "learning_rate": 3.977266782227771e-06, - "loss": 2.2069, - "step": 527820 - }, - { - "epoch": 0.92, - "learning_rate": 3.976394842300945e-06, - "loss": 2.2713, - "step": 527830 - }, - { - "epoch": 0.92, - "learning_rate": 3.975522902374118e-06, - "loss": 2.3137, - "step": 527840 - }, - { - "epoch": 0.92, - "learning_rate": 3.974650962447291e-06, - "loss": 2.1463, - "step": 527850 - }, - { - "epoch": 0.92, - "learning_rate": 3.973779022520464e-06, - "loss": 2.2211, - "step": 527860 - }, - { - "epoch": 0.92, - "learning_rate": 3.972907082593638e-06, - "loss": 2.3777, - "step": 527870 - }, - { - "epoch": 0.92, - "learning_rate": 3.9720351426668115e-06, - "loss": 2.2397, - "step": 527880 - }, - { - "epoch": 0.92, - "learning_rate": 3.971163202739984e-06, - "loss": 2.4369, - "step": 527890 - }, - { - "epoch": 0.92, - "learning_rate": 3.970291262813157e-06, - "loss": 2.1798, - "step": 527900 - }, - { - "epoch": 0.92, - "learning_rate": 3.969419322886331e-06, - "loss": 2.249, - "step": 527910 - }, - { - "epoch": 0.92, - "learning_rate": 3.968547382959504e-06, - "loss": 2.1415, - "step": 527920 - }, - { - "epoch": 0.92, - "learning_rate": 3.967675443032677e-06, - "loss": 2.2752, - "step": 527930 - }, - { - "epoch": 0.92, - "learning_rate": 3.96680350310585e-06, - "loss": 2.3479, - "step": 527940 - }, - { - "epoch": 0.92, - "learning_rate": 3.965931563179024e-06, - "loss": 2.2582, - "step": 527950 - }, - { - "epoch": 0.92, - "learning_rate": 3.9650596232521966e-06, - "loss": 2.1987, - "step": 527960 - }, - { - "epoch": 0.92, - "learning_rate": 3.9641876833253695e-06, - "loss": 2.3131, - "step": 527970 - }, - { - "epoch": 0.92, - "learning_rate": 3.963315743398542e-06, - "loss": 2.3295, - "step": 527980 - }, - { - "epoch": 0.92, - "learning_rate": 3.962443803471716e-06, - "loss": 2.2973, - "step": 527990 - }, - { - "epoch": 0.92, - "learning_rate": 3.961571863544889e-06, - "loss": 2.3396, - "step": 528000 - }, - { - "epoch": 0.92, - "learning_rate": 3.960699923618063e-06, - "loss": 2.2433, - "step": 528010 - }, - { - "epoch": 0.92, - "learning_rate": 3.959827983691236e-06, - "loss": 2.2913, - "step": 528020 - }, - { - "epoch": 0.92, - "learning_rate": 3.9589560437644096e-06, - "loss": 2.2854, - "step": 528030 - }, - { - "epoch": 0.92, - "learning_rate": 3.9580841038375825e-06, - "loss": 2.1932, - "step": 528040 - }, - { - "epoch": 0.92, - "learning_rate": 3.957212163910755e-06, - "loss": 2.2231, - "step": 528050 - }, - { - "epoch": 0.92, - "learning_rate": 3.956340223983928e-06, - "loss": 2.2105, - "step": 528060 - }, - { - "epoch": 0.92, - "learning_rate": 3.955468284057102e-06, - "loss": 2.1757, - "step": 528070 - }, - { - "epoch": 0.92, - "learning_rate": 3.954596344130275e-06, - "loss": 2.2595, - "step": 528080 - }, - { - "epoch": 0.92, - "learning_rate": 3.953724404203448e-06, - "loss": 2.2567, - "step": 528090 - }, - { - "epoch": 0.92, - "learning_rate": 3.952852464276621e-06, - "loss": 2.3215, - "step": 528100 - }, - { - "epoch": 0.92, - "learning_rate": 3.951980524349795e-06, - "loss": 2.3092, - "step": 528110 - }, - { - "epoch": 0.92, - "learning_rate": 3.9511085844229676e-06, - "loss": 2.187, - "step": 528120 - }, - { - "epoch": 0.92, - "learning_rate": 3.9502366444961405e-06, - "loss": 2.2467, - "step": 528130 - }, - { - "epoch": 0.92, - "learning_rate": 3.949364704569314e-06, - "loss": 2.2985, - "step": 528140 - }, - { - "epoch": 0.92, - "learning_rate": 3.948492764642488e-06, - "loss": 2.2686, - "step": 528150 - }, - { - "epoch": 0.92, - "learning_rate": 3.947620824715661e-06, - "loss": 2.2456, - "step": 528160 - }, - { - "epoch": 0.92, - "learning_rate": 3.946748884788834e-06, - "loss": 2.3095, - "step": 528170 - }, - { - "epoch": 0.92, - "learning_rate": 3.945876944862007e-06, - "loss": 2.286, - "step": 528180 - }, - { - "epoch": 0.92, - "learning_rate": 3.9450050049351806e-06, - "loss": 2.2551, - "step": 528190 - }, - { - "epoch": 0.92, - "learning_rate": 3.9441330650083535e-06, - "loss": 2.2478, - "step": 528200 - }, - { - "epoch": 0.92, - "learning_rate": 3.943261125081526e-06, - "loss": 2.257, - "step": 528210 - }, - { - "epoch": 0.92, - "learning_rate": 3.942389185154699e-06, - "loss": 2.1974, - "step": 528220 - }, - { - "epoch": 0.92, - "learning_rate": 3.941517245227873e-06, - "loss": 2.2346, - "step": 528230 - }, - { - "epoch": 0.92, - "learning_rate": 3.940645305301046e-06, - "loss": 2.2197, - "step": 528240 - }, - { - "epoch": 0.92, - "learning_rate": 3.939773365374219e-06, - "loss": 2.3732, - "step": 528250 - }, - { - "epoch": 0.92, - "learning_rate": 3.938901425447393e-06, - "loss": 2.2154, - "step": 528260 - }, - { - "epoch": 0.92, - "learning_rate": 3.938029485520566e-06, - "loss": 2.2959, - "step": 528270 - }, - { - "epoch": 0.92, - "learning_rate": 3.937157545593739e-06, - "loss": 2.2118, - "step": 528280 - }, - { - "epoch": 0.92, - "learning_rate": 3.936285605666912e-06, - "loss": 2.2474, - "step": 528290 - }, - { - "epoch": 0.92, - "learning_rate": 3.935413665740085e-06, - "loss": 2.3191, - "step": 528300 - }, - { - "epoch": 0.92, - "learning_rate": 3.934541725813259e-06, - "loss": 2.2538, - "step": 528310 - }, - { - "epoch": 0.92, - "learning_rate": 3.933669785886432e-06, - "loss": 2.2869, - "step": 528320 - }, - { - "epoch": 0.92, - "learning_rate": 3.932797845959605e-06, - "loss": 2.2409, - "step": 528330 - }, - { - "epoch": 0.92, - "learning_rate": 3.931925906032778e-06, - "loss": 2.2917, - "step": 528340 - }, - { - "epoch": 0.92, - "learning_rate": 3.9310539661059516e-06, - "loss": 2.3185, - "step": 528350 - }, - { - "epoch": 0.92, - "learning_rate": 3.9301820261791245e-06, - "loss": 2.2106, - "step": 528360 - }, - { - "epoch": 0.92, - "learning_rate": 3.929310086252297e-06, - "loss": 2.3676, - "step": 528370 - }, - { - "epoch": 0.92, - "learning_rate": 3.92843814632547e-06, - "loss": 2.2674, - "step": 528380 - }, - { - "epoch": 0.92, - "learning_rate": 3.927566206398644e-06, - "loss": 2.1977, - "step": 528390 - }, - { - "epoch": 0.92, - "learning_rate": 3.926694266471817e-06, - "loss": 2.07, - "step": 528400 - }, - { - "epoch": 0.92, - "learning_rate": 3.925822326544991e-06, - "loss": 2.2054, - "step": 528410 - }, - { - "epoch": 0.92, - "learning_rate": 3.924950386618164e-06, - "loss": 2.2063, - "step": 528420 - }, - { - "epoch": 0.92, - "learning_rate": 3.9240784466913375e-06, - "loss": 2.3726, - "step": 528430 - }, - { - "epoch": 0.92, - "learning_rate": 3.92320650676451e-06, - "loss": 2.2558, - "step": 528440 - }, - { - "epoch": 0.92, - "learning_rate": 3.922334566837683e-06, - "loss": 2.2481, - "step": 528450 - }, - { - "epoch": 0.92, - "learning_rate": 3.921462626910856e-06, - "loss": 2.2905, - "step": 528460 - }, - { - "epoch": 0.92, - "learning_rate": 3.92059068698403e-06, - "loss": 2.3244, - "step": 528470 - }, - { - "epoch": 0.92, - "learning_rate": 3.919718747057203e-06, - "loss": 2.1739, - "step": 528480 - }, - { - "epoch": 0.92, - "learning_rate": 3.918846807130376e-06, - "loss": 2.1749, - "step": 528490 - }, - { - "epoch": 0.92, - "learning_rate": 3.917974867203549e-06, - "loss": 2.2803, - "step": 528500 - }, - { - "epoch": 0.92, - "learning_rate": 3.9171029272767226e-06, - "loss": 2.2765, - "step": 528510 - }, - { - "epoch": 0.92, - "learning_rate": 3.9162309873498955e-06, - "loss": 2.2405, - "step": 528520 - }, - { - "epoch": 0.92, - "learning_rate": 3.915359047423068e-06, - "loss": 2.2172, - "step": 528530 - }, - { - "epoch": 0.92, - "learning_rate": 3.914487107496242e-06, - "loss": 2.3489, - "step": 528540 - }, - { - "epoch": 0.92, - "learning_rate": 3.913615167569416e-06, - "loss": 2.3097, - "step": 528550 - }, - { - "epoch": 0.92, - "learning_rate": 3.912743227642589e-06, - "loss": 2.2798, - "step": 528560 - }, - { - "epoch": 0.92, - "learning_rate": 3.911871287715762e-06, - "loss": 2.279, - "step": 528570 - }, - { - "epoch": 0.92, - "learning_rate": 3.910999347788935e-06, - "loss": 2.2782, - "step": 528580 - }, - { - "epoch": 0.92, - "learning_rate": 3.9101274078621085e-06, - "loss": 2.2503, - "step": 528590 - }, - { - "epoch": 0.92, - "learning_rate": 3.909255467935281e-06, - "loss": 2.3154, - "step": 528600 - }, - { - "epoch": 0.92, - "learning_rate": 3.908383528008454e-06, - "loss": 2.2351, - "step": 528610 - }, - { - "epoch": 0.92, - "learning_rate": 3.907511588081627e-06, - "loss": 2.1463, - "step": 528620 - }, - { - "epoch": 0.92, - "learning_rate": 3.906639648154801e-06, - "loss": 2.4308, - "step": 528630 - }, - { - "epoch": 0.92, - "learning_rate": 3.905767708227974e-06, - "loss": 2.2107, - "step": 528640 - }, - { - "epoch": 0.92, - "learning_rate": 3.904895768301147e-06, - "loss": 2.3068, - "step": 528650 - }, - { - "epoch": 0.92, - "learning_rate": 3.904023828374321e-06, - "loss": 2.2423, - "step": 528660 - }, - { - "epoch": 0.92, - "learning_rate": 3.9031518884474936e-06, - "loss": 2.2561, - "step": 528670 - }, - { - "epoch": 0.92, - "learning_rate": 3.902279948520667e-06, - "loss": 2.1994, - "step": 528680 - }, - { - "epoch": 0.92, - "learning_rate": 3.90140800859384e-06, - "loss": 2.3444, - "step": 528690 - }, - { - "epoch": 0.92, - "learning_rate": 3.900536068667013e-06, - "loss": 2.1698, - "step": 528700 - }, - { - "epoch": 0.92, - "learning_rate": 3.899664128740187e-06, - "loss": 2.2861, - "step": 528710 - }, - { - "epoch": 0.92, - "learning_rate": 3.89879218881336e-06, - "loss": 2.3246, - "step": 528720 - }, - { - "epoch": 0.92, - "learning_rate": 3.897920248886533e-06, - "loss": 2.3169, - "step": 528730 - }, - { - "epoch": 0.92, - "learning_rate": 3.897048308959706e-06, - "loss": 2.311, - "step": 528740 - }, - { - "epoch": 0.92, - "learning_rate": 3.8961763690328795e-06, - "loss": 2.2523, - "step": 528750 - }, - { - "epoch": 0.92, - "learning_rate": 3.895304429106052e-06, - "loss": 2.3164, - "step": 528760 - }, - { - "epoch": 0.92, - "learning_rate": 3.894432489179225e-06, - "loss": 2.1571, - "step": 528770 - }, - { - "epoch": 0.92, - "learning_rate": 3.893560549252399e-06, - "loss": 2.2802, - "step": 528780 - }, - { - "epoch": 0.92, - "learning_rate": 3.892688609325572e-06, - "loss": 2.249, - "step": 528790 - }, - { - "epoch": 0.92, - "learning_rate": 3.891816669398745e-06, - "loss": 2.2856, - "step": 528800 - }, - { - "epoch": 0.92, - "learning_rate": 3.890944729471919e-06, - "loss": 2.3186, - "step": 528810 - }, - { - "epoch": 0.92, - "learning_rate": 3.890072789545092e-06, - "loss": 2.3591, - "step": 528820 - }, - { - "epoch": 0.92, - "learning_rate": 3.889200849618265e-06, - "loss": 2.3525, - "step": 528830 - }, - { - "epoch": 0.92, - "learning_rate": 3.888328909691438e-06, - "loss": 2.3595, - "step": 528840 - }, - { - "epoch": 0.92, - "learning_rate": 3.887456969764611e-06, - "loss": 2.2556, - "step": 528850 - }, - { - "epoch": 0.92, - "learning_rate": 3.886585029837784e-06, - "loss": 2.2157, - "step": 528860 - }, - { - "epoch": 0.92, - "learning_rate": 3.885713089910958e-06, - "loss": 2.1867, - "step": 528870 - }, - { - "epoch": 0.92, - "learning_rate": 3.884841149984131e-06, - "loss": 2.3758, - "step": 528880 - }, - { - "epoch": 0.92, - "learning_rate": 3.883969210057304e-06, - "loss": 2.3033, - "step": 528890 - }, - { - "epoch": 0.92, - "learning_rate": 3.883097270130477e-06, - "loss": 2.2239, - "step": 528900 - }, - { - "epoch": 0.92, - "learning_rate": 3.8822253302036505e-06, - "loss": 2.17, - "step": 528910 - }, - { - "epoch": 0.92, - "learning_rate": 3.881353390276823e-06, - "loss": 2.3107, - "step": 528920 - }, - { - "epoch": 0.92, - "learning_rate": 3.880481450349996e-06, - "loss": 2.3168, - "step": 528930 - }, - { - "epoch": 0.92, - "learning_rate": 3.87960951042317e-06, - "loss": 2.3086, - "step": 528940 - }, - { - "epoch": 0.92, - "learning_rate": 3.878737570496344e-06, - "loss": 2.3326, - "step": 528950 - }, - { - "epoch": 0.92, - "learning_rate": 3.877865630569517e-06, - "loss": 2.2973, - "step": 528960 - }, - { - "epoch": 0.92, - "learning_rate": 3.87699369064269e-06, - "loss": 2.2107, - "step": 528970 - }, - { - "epoch": 0.92, - "learning_rate": 3.876121750715863e-06, - "loss": 2.3097, - "step": 528980 - }, - { - "epoch": 0.92, - "learning_rate": 3.875249810789036e-06, - "loss": 2.2641, - "step": 528990 - }, - { - "epoch": 0.92, - "learning_rate": 3.874377870862209e-06, - "loss": 2.1811, - "step": 529000 - }, - { - "epoch": 0.92, - "learning_rate": 3.873505930935382e-06, - "loss": 2.2345, - "step": 529010 - }, - { - "epoch": 0.92, - "learning_rate": 3.872633991008555e-06, - "loss": 2.2934, - "step": 529020 - }, - { - "epoch": 0.92, - "learning_rate": 3.871762051081729e-06, - "loss": 2.3385, - "step": 529030 - }, - { - "epoch": 0.92, - "learning_rate": 3.870890111154902e-06, - "loss": 2.2787, - "step": 529040 - }, - { - "epoch": 0.92, - "learning_rate": 3.870018171228075e-06, - "loss": 2.3171, - "step": 529050 - }, - { - "epoch": 0.92, - "learning_rate": 3.8691462313012486e-06, - "loss": 2.3983, - "step": 529060 - }, - { - "epoch": 0.92, - "learning_rate": 3.8682742913744215e-06, - "loss": 2.4258, - "step": 529070 - }, - { - "epoch": 0.92, - "learning_rate": 3.867402351447595e-06, - "loss": 2.2776, - "step": 529080 - }, - { - "epoch": 0.92, - "learning_rate": 3.866530411520768e-06, - "loss": 2.2025, - "step": 529090 - }, - { - "epoch": 0.92, - "learning_rate": 3.865658471593941e-06, - "loss": 2.2437, - "step": 529100 - }, - { - "epoch": 0.92, - "learning_rate": 3.864786531667115e-06, - "loss": 2.3038, - "step": 529110 - }, - { - "epoch": 0.92, - "learning_rate": 3.863914591740288e-06, - "loss": 2.2225, - "step": 529120 - }, - { - "epoch": 0.92, - "learning_rate": 3.863042651813461e-06, - "loss": 2.2331, - "step": 529130 - }, - { - "epoch": 0.92, - "learning_rate": 3.862170711886634e-06, - "loss": 2.1838, - "step": 529140 - }, - { - "epoch": 0.92, - "learning_rate": 3.861298771959807e-06, - "loss": 2.1961, - "step": 529150 - }, - { - "epoch": 0.92, - "learning_rate": 3.86042683203298e-06, - "loss": 2.2117, - "step": 529160 - }, - { - "epoch": 0.92, - "learning_rate": 3.859554892106153e-06, - "loss": 2.3353, - "step": 529170 - }, - { - "epoch": 0.92, - "learning_rate": 3.858682952179327e-06, - "loss": 2.2302, - "step": 529180 - }, - { - "epoch": 0.92, - "learning_rate": 3.8578110122525e-06, - "loss": 2.2929, - "step": 529190 - }, - { - "epoch": 0.92, - "learning_rate": 3.856939072325673e-06, - "loss": 2.3193, - "step": 529200 - }, - { - "epoch": 0.92, - "learning_rate": 3.856067132398847e-06, - "loss": 2.285, - "step": 529210 - }, - { - "epoch": 0.92, - "learning_rate": 3.8551951924720196e-06, - "loss": 2.218, - "step": 529220 - }, - { - "epoch": 0.92, - "learning_rate": 3.854323252545193e-06, - "loss": 2.1947, - "step": 529230 - }, - { - "epoch": 0.92, - "learning_rate": 3.853451312618366e-06, - "loss": 2.2639, - "step": 529240 - }, - { - "epoch": 0.92, - "learning_rate": 3.852579372691539e-06, - "loss": 2.2939, - "step": 529250 - }, - { - "epoch": 0.92, - "learning_rate": 3.851707432764712e-06, - "loss": 2.1668, - "step": 529260 - }, - { - "epoch": 0.92, - "learning_rate": 3.850835492837886e-06, - "loss": 2.2045, - "step": 529270 - }, - { - "epoch": 0.92, - "learning_rate": 3.849963552911059e-06, - "loss": 2.1408, - "step": 529280 - }, - { - "epoch": 0.92, - "learning_rate": 3.849091612984232e-06, - "loss": 2.2926, - "step": 529290 - }, - { - "epoch": 0.92, - "learning_rate": 3.8482196730574055e-06, - "loss": 2.2405, - "step": 529300 - }, - { - "epoch": 0.92, - "learning_rate": 3.847347733130578e-06, - "loss": 2.2676, - "step": 529310 - }, - { - "epoch": 0.92, - "learning_rate": 3.846475793203751e-06, - "loss": 2.2342, - "step": 529320 - }, - { - "epoch": 0.92, - "learning_rate": 3.845603853276924e-06, - "loss": 2.1874, - "step": 529330 - }, - { - "epoch": 0.92, - "learning_rate": 3.844731913350098e-06, - "loss": 2.3103, - "step": 529340 - }, - { - "epoch": 0.92, - "learning_rate": 3.843859973423272e-06, - "loss": 2.1242, - "step": 529350 - }, - { - "epoch": 0.92, - "learning_rate": 3.842988033496445e-06, - "loss": 2.2337, - "step": 529360 - }, - { - "epoch": 0.92, - "learning_rate": 3.842116093569618e-06, - "loss": 2.2281, - "step": 529370 - }, - { - "epoch": 0.92, - "learning_rate": 3.8412441536427906e-06, - "loss": 2.2996, - "step": 529380 - }, - { - "epoch": 0.92, - "learning_rate": 3.840372213715964e-06, - "loss": 2.2428, - "step": 529390 - }, - { - "epoch": 0.92, - "learning_rate": 3.839500273789137e-06, - "loss": 2.3157, - "step": 529400 - }, - { - "epoch": 0.92, - "learning_rate": 3.83862833386231e-06, - "loss": 2.3267, - "step": 529410 - }, - { - "epoch": 0.92, - "learning_rate": 3.837756393935483e-06, - "loss": 2.3833, - "step": 529420 - }, - { - "epoch": 0.92, - "learning_rate": 3.836884454008657e-06, - "loss": 2.2929, - "step": 529430 - }, - { - "epoch": 0.92, - "learning_rate": 3.83601251408183e-06, - "loss": 2.1754, - "step": 529440 - }, - { - "epoch": 0.92, - "learning_rate": 3.835140574155003e-06, - "loss": 2.2474, - "step": 529450 - }, - { - "epoch": 0.92, - "learning_rate": 3.8342686342281765e-06, - "loss": 2.2271, - "step": 529460 - }, - { - "epoch": 0.92, - "learning_rate": 3.833396694301349e-06, - "loss": 2.1705, - "step": 529470 - }, - { - "epoch": 0.92, - "learning_rate": 3.832524754374523e-06, - "loss": 2.2791, - "step": 529480 - }, - { - "epoch": 0.92, - "learning_rate": 3.831652814447696e-06, - "loss": 2.3624, - "step": 529490 - }, - { - "epoch": 0.92, - "learning_rate": 3.830780874520869e-06, - "loss": 2.2585, - "step": 529500 - }, - { - "epoch": 0.92, - "learning_rate": 3.829908934594043e-06, - "loss": 2.2992, - "step": 529510 - }, - { - "epoch": 0.92, - "learning_rate": 3.829036994667216e-06, - "loss": 2.2235, - "step": 529520 - }, - { - "epoch": 0.92, - "learning_rate": 3.828165054740389e-06, - "loss": 2.263, - "step": 529530 - }, - { - "epoch": 0.92, - "learning_rate": 3.8272931148135616e-06, - "loss": 2.3141, - "step": 529540 - }, - { - "epoch": 0.92, - "learning_rate": 3.826421174886735e-06, - "loss": 2.2888, - "step": 529550 - }, - { - "epoch": 0.92, - "learning_rate": 3.825549234959908e-06, - "loss": 2.253, - "step": 529560 - }, - { - "epoch": 0.92, - "learning_rate": 3.824677295033081e-06, - "loss": 2.1746, - "step": 529570 - }, - { - "epoch": 0.92, - "learning_rate": 3.823805355106255e-06, - "loss": 2.293, - "step": 529580 - }, - { - "epoch": 0.92, - "learning_rate": 3.822933415179428e-06, - "loss": 2.2782, - "step": 529590 - }, - { - "epoch": 0.92, - "learning_rate": 3.822061475252601e-06, - "loss": 2.254, - "step": 529600 - }, - { - "epoch": 0.92, - "learning_rate": 3.8211895353257746e-06, - "loss": 2.329, - "step": 529610 - }, - { - "epoch": 0.92, - "learning_rate": 3.8203175953989475e-06, - "loss": 2.2292, - "step": 529620 - }, - { - "epoch": 0.92, - "learning_rate": 3.819445655472121e-06, - "loss": 2.2585, - "step": 529630 - }, - { - "epoch": 0.92, - "learning_rate": 3.818573715545294e-06, - "loss": 2.343, - "step": 529640 - }, - { - "epoch": 0.92, - "learning_rate": 3.817701775618467e-06, - "loss": 2.0914, - "step": 529650 - }, - { - "epoch": 0.92, - "learning_rate": 3.81682983569164e-06, - "loss": 2.3212, - "step": 529660 - }, - { - "epoch": 0.92, - "learning_rate": 3.815957895764814e-06, - "loss": 2.361, - "step": 529670 - }, - { - "epoch": 0.92, - "learning_rate": 3.815085955837987e-06, - "loss": 2.3497, - "step": 529680 - }, - { - "epoch": 0.92, - "learning_rate": 3.81421401591116e-06, - "loss": 2.2011, - "step": 529690 - }, - { - "epoch": 0.92, - "learning_rate": 3.813342075984333e-06, - "loss": 2.174, - "step": 529700 - }, - { - "epoch": 0.92, - "learning_rate": 3.8124701360575063e-06, - "loss": 2.1365, - "step": 529710 - }, - { - "epoch": 0.92, - "learning_rate": 3.8115981961306793e-06, - "loss": 2.1215, - "step": 529720 - }, - { - "epoch": 0.92, - "learning_rate": 3.8107262562038526e-06, - "loss": 2.3216, - "step": 529730 - }, - { - "epoch": 0.92, - "learning_rate": 3.8098543162770264e-06, - "loss": 2.3235, - "step": 529740 - }, - { - "epoch": 0.92, - "learning_rate": 3.8089823763501993e-06, - "loss": 2.2905, - "step": 529750 - }, - { - "epoch": 0.92, - "learning_rate": 3.8081104364233727e-06, - "loss": 2.1971, - "step": 529760 - }, - { - "epoch": 0.92, - "learning_rate": 3.8072384964965456e-06, - "loss": 2.2566, - "step": 529770 - }, - { - "epoch": 0.92, - "learning_rate": 3.806366556569719e-06, - "loss": 2.2751, - "step": 529780 - }, - { - "epoch": 0.92, - "learning_rate": 3.805494616642892e-06, - "loss": 2.3119, - "step": 529790 - }, - { - "epoch": 0.92, - "learning_rate": 3.804622676716065e-06, - "loss": 2.224, - "step": 529800 - }, - { - "epoch": 0.92, - "learning_rate": 3.803750736789238e-06, - "loss": 2.3261, - "step": 529810 - }, - { - "epoch": 0.92, - "learning_rate": 3.8028787968624115e-06, - "loss": 2.3354, - "step": 529820 - }, - { - "epoch": 0.92, - "learning_rate": 3.802006856935585e-06, - "loss": 2.2237, - "step": 529830 - }, - { - "epoch": 0.92, - "learning_rate": 3.8011349170087577e-06, - "loss": 2.3126, - "step": 529840 - }, - { - "epoch": 0.92, - "learning_rate": 3.800262977081931e-06, - "loss": 2.2227, - "step": 529850 - }, - { - "epoch": 0.92, - "learning_rate": 3.799391037155104e-06, - "loss": 2.2999, - "step": 529860 - }, - { - "epoch": 0.92, - "learning_rate": 3.7985190972282773e-06, - "loss": 2.3102, - "step": 529870 - }, - { - "epoch": 0.92, - "learning_rate": 3.797647157301451e-06, - "loss": 2.1868, - "step": 529880 - }, - { - "epoch": 0.92, - "learning_rate": 3.796775217374624e-06, - "loss": 2.3093, - "step": 529890 - }, - { - "epoch": 0.92, - "learning_rate": 3.7959032774477974e-06, - "loss": 2.3609, - "step": 529900 - }, - { - "epoch": 0.92, - "learning_rate": 3.7950313375209703e-06, - "loss": 2.2522, - "step": 529910 - }, - { - "epoch": 0.92, - "learning_rate": 3.7941593975941437e-06, - "loss": 2.1952, - "step": 529920 - }, - { - "epoch": 0.92, - "learning_rate": 3.7932874576673166e-06, - "loss": 2.4004, - "step": 529930 - }, - { - "epoch": 0.92, - "learning_rate": 3.79241551774049e-06, - "loss": 2.3281, - "step": 529940 - }, - { - "epoch": 0.92, - "learning_rate": 3.7915435778136633e-06, - "loss": 2.2447, - "step": 529950 - }, - { - "epoch": 0.92, - "learning_rate": 3.790671637886836e-06, - "loss": 2.218, - "step": 529960 - }, - { - "epoch": 0.92, - "learning_rate": 3.7897996979600095e-06, - "loss": 2.1908, - "step": 529970 - }, - { - "epoch": 0.92, - "learning_rate": 3.7889277580331825e-06, - "loss": 2.2895, - "step": 529980 - }, - { - "epoch": 0.92, - "learning_rate": 3.788055818106356e-06, - "loss": 2.281, - "step": 529990 - }, - { - "epoch": 0.92, - "learning_rate": 3.7871838781795287e-06, - "loss": 2.2828, - "step": 530000 - }, - { - "epoch": 0.92, - "learning_rate": 3.7863119382527025e-06, - "loss": 2.1907, - "step": 530010 - }, - { - "epoch": 0.92, - "learning_rate": 3.785439998325876e-06, - "loss": 2.2742, - "step": 530020 - }, - { - "epoch": 0.92, - "learning_rate": 3.7845680583990488e-06, - "loss": 2.1436, - "step": 530030 - }, - { - "epoch": 0.92, - "learning_rate": 3.783696118472222e-06, - "loss": 2.309, - "step": 530040 - }, - { - "epoch": 0.92, - "learning_rate": 3.782824178545395e-06, - "loss": 2.2215, - "step": 530050 - }, - { - "epoch": 0.92, - "learning_rate": 3.7819522386185684e-06, - "loss": 2.2464, - "step": 530060 - }, - { - "epoch": 0.92, - "learning_rate": 3.7810802986917413e-06, - "loss": 2.2355, - "step": 530070 - }, - { - "epoch": 0.92, - "learning_rate": 3.7802083587649147e-06, - "loss": 2.2877, - "step": 530080 - }, - { - "epoch": 0.92, - "learning_rate": 3.779336418838088e-06, - "loss": 2.2456, - "step": 530090 - }, - { - "epoch": 0.92, - "learning_rate": 3.778464478911261e-06, - "loss": 2.1406, - "step": 530100 - }, - { - "epoch": 0.92, - "learning_rate": 3.7775925389844343e-06, - "loss": 2.2534, - "step": 530110 - }, - { - "epoch": 0.92, - "learning_rate": 3.776720599057607e-06, - "loss": 2.2977, - "step": 530120 - }, - { - "epoch": 0.92, - "learning_rate": 3.7758486591307805e-06, - "loss": 2.2675, - "step": 530130 - }, - { - "epoch": 0.92, - "learning_rate": 3.7749767192039543e-06, - "loss": 2.3178, - "step": 530140 - }, - { - "epoch": 0.92, - "learning_rate": 3.7741047792771272e-06, - "loss": 2.2713, - "step": 530150 - }, - { - "epoch": 0.92, - "learning_rate": 3.7732328393503006e-06, - "loss": 2.1764, - "step": 530160 - }, - { - "epoch": 0.92, - "learning_rate": 3.7723608994234735e-06, - "loss": 2.2213, - "step": 530170 - }, - { - "epoch": 0.92, - "learning_rate": 3.771488959496647e-06, - "loss": 2.3288, - "step": 530180 - }, - { - "epoch": 0.92, - "learning_rate": 3.7706170195698198e-06, - "loss": 2.3528, - "step": 530190 - }, - { - "epoch": 0.92, - "learning_rate": 3.769745079642993e-06, - "loss": 2.2147, - "step": 530200 - }, - { - "epoch": 0.92, - "learning_rate": 3.7688731397161665e-06, - "loss": 2.1127, - "step": 530210 - }, - { - "epoch": 0.92, - "learning_rate": 3.7680011997893394e-06, - "loss": 2.2387, - "step": 530220 - }, - { - "epoch": 0.92, - "learning_rate": 3.7671292598625127e-06, - "loss": 2.1301, - "step": 530230 - }, - { - "epoch": 0.92, - "learning_rate": 3.7662573199356857e-06, - "loss": 2.2443, - "step": 530240 - }, - { - "epoch": 0.92, - "learning_rate": 3.765385380008859e-06, - "loss": 2.3442, - "step": 530250 - }, - { - "epoch": 0.92, - "learning_rate": 3.764513440082032e-06, - "loss": 2.3322, - "step": 530260 - }, - { - "epoch": 0.92, - "learning_rate": 3.7636415001552053e-06, - "loss": 2.319, - "step": 530270 - }, - { - "epoch": 0.92, - "learning_rate": 3.762769560228379e-06, - "loss": 2.2485, - "step": 530280 - }, - { - "epoch": 0.92, - "learning_rate": 3.761897620301552e-06, - "loss": 2.3177, - "step": 530290 - }, - { - "epoch": 0.92, - "learning_rate": 3.7610256803747253e-06, - "loss": 2.3409, - "step": 530300 - }, - { - "epoch": 0.92, - "learning_rate": 3.7601537404478982e-06, - "loss": 2.261, - "step": 530310 - }, - { - "epoch": 0.92, - "learning_rate": 3.7592818005210716e-06, - "loss": 2.1737, - "step": 530320 - }, - { - "epoch": 0.92, - "learning_rate": 3.7584098605942445e-06, - "loss": 2.257, - "step": 530330 - }, - { - "epoch": 0.92, - "learning_rate": 3.757537920667418e-06, - "loss": 2.1924, - "step": 530340 - }, - { - "epoch": 0.92, - "learning_rate": 3.756665980740591e-06, - "loss": 2.2326, - "step": 530350 - }, - { - "epoch": 0.92, - "learning_rate": 3.755794040813764e-06, - "loss": 2.3009, - "step": 530360 - }, - { - "epoch": 0.92, - "learning_rate": 3.7549221008869375e-06, - "loss": 2.3173, - "step": 530370 - }, - { - "epoch": 0.92, - "learning_rate": 3.7540501609601104e-06, - "loss": 2.3047, - "step": 530380 - }, - { - "epoch": 0.92, - "learning_rate": 3.7531782210332837e-06, - "loss": 2.2725, - "step": 530390 - }, - { - "epoch": 0.92, - "learning_rate": 3.7523062811064567e-06, - "loss": 2.2791, - "step": 530400 - }, - { - "epoch": 0.92, - "learning_rate": 3.7514343411796304e-06, - "loss": 2.224, - "step": 530410 - }, - { - "epoch": 0.92, - "learning_rate": 3.7505624012528038e-06, - "loss": 2.2095, - "step": 530420 - }, - { - "epoch": 0.93, - "learning_rate": 3.7496904613259767e-06, - "loss": 2.2576, - "step": 530430 - }, - { - "epoch": 0.93, - "learning_rate": 3.74881852139915e-06, - "loss": 2.1874, - "step": 530440 - }, - { - "epoch": 0.93, - "learning_rate": 3.747946581472323e-06, - "loss": 2.2145, - "step": 530450 - }, - { - "epoch": 0.93, - "learning_rate": 3.7470746415454963e-06, - "loss": 2.2775, - "step": 530460 - }, - { - "epoch": 0.93, - "learning_rate": 3.7462027016186697e-06, - "loss": 2.1692, - "step": 530470 - }, - { - "epoch": 0.93, - "learning_rate": 3.7453307616918426e-06, - "loss": 2.3202, - "step": 530480 - }, - { - "epoch": 0.93, - "learning_rate": 3.744458821765016e-06, - "loss": 2.311, - "step": 530490 - }, - { - "epoch": 0.93, - "learning_rate": 3.743586881838189e-06, - "loss": 2.1241, - "step": 530500 - }, - { - "epoch": 0.93, - "learning_rate": 3.742714941911362e-06, - "loss": 2.2372, - "step": 530510 - }, - { - "epoch": 0.93, - "learning_rate": 3.741843001984535e-06, - "loss": 2.3876, - "step": 530520 - }, - { - "epoch": 0.93, - "learning_rate": 3.7409710620577085e-06, - "loss": 2.0389, - "step": 530530 - }, - { - "epoch": 0.93, - "learning_rate": 3.7400991221308822e-06, - "loss": 2.2576, - "step": 530540 - }, - { - "epoch": 0.93, - "learning_rate": 3.739227182204055e-06, - "loss": 2.2618, - "step": 530550 - }, - { - "epoch": 0.93, - "learning_rate": 3.7383552422772285e-06, - "loss": 2.3099, - "step": 530560 - }, - { - "epoch": 0.93, - "learning_rate": 3.7374833023504014e-06, - "loss": 2.2231, - "step": 530570 - }, - { - "epoch": 0.93, - "learning_rate": 3.7366113624235748e-06, - "loss": 2.1881, - "step": 530580 - }, - { - "epoch": 0.93, - "learning_rate": 3.7357394224967477e-06, - "loss": 2.1861, - "step": 530590 - }, - { - "epoch": 0.93, - "learning_rate": 3.734867482569921e-06, - "loss": 2.2241, - "step": 530600 - }, - { - "epoch": 0.93, - "learning_rate": 3.7339955426430944e-06, - "loss": 2.2315, - "step": 530610 - }, - { - "epoch": 0.93, - "learning_rate": 3.7331236027162673e-06, - "loss": 2.1618, - "step": 530620 - }, - { - "epoch": 0.93, - "learning_rate": 3.7322516627894407e-06, - "loss": 2.3327, - "step": 530630 - }, - { - "epoch": 0.93, - "learning_rate": 3.7313797228626136e-06, - "loss": 2.2402, - "step": 530640 - }, - { - "epoch": 0.93, - "learning_rate": 3.730507782935787e-06, - "loss": 2.1857, - "step": 530650 - }, - { - "epoch": 0.93, - "learning_rate": 3.72963584300896e-06, - "loss": 2.3156, - "step": 530660 - }, - { - "epoch": 0.93, - "learning_rate": 3.7287639030821336e-06, - "loss": 2.3496, - "step": 530670 - }, - { - "epoch": 0.93, - "learning_rate": 3.727891963155307e-06, - "loss": 2.275, - "step": 530680 - }, - { - "epoch": 0.93, - "learning_rate": 3.72702002322848e-06, - "loss": 2.1659, - "step": 530690 - }, - { - "epoch": 0.93, - "learning_rate": 3.7261480833016532e-06, - "loss": 2.2946, - "step": 530700 - }, - { - "epoch": 0.93, - "learning_rate": 3.725276143374826e-06, - "loss": 2.2618, - "step": 530710 - }, - { - "epoch": 0.93, - "learning_rate": 3.7244042034479995e-06, - "loss": 2.2274, - "step": 530720 - }, - { - "epoch": 0.93, - "learning_rate": 3.723532263521173e-06, - "loss": 2.2916, - "step": 530730 - }, - { - "epoch": 0.93, - "learning_rate": 3.7226603235943458e-06, - "loss": 2.1984, - "step": 530740 - }, - { - "epoch": 0.93, - "learning_rate": 3.721788383667519e-06, - "loss": 2.2969, - "step": 530750 - }, - { - "epoch": 0.93, - "learning_rate": 3.720916443740692e-06, - "loss": 2.288, - "step": 530760 - }, - { - "epoch": 0.93, - "learning_rate": 3.7200445038138654e-06, - "loss": 2.3209, - "step": 530770 - }, - { - "epoch": 0.93, - "learning_rate": 3.7191725638870383e-06, - "loss": 2.272, - "step": 530780 - }, - { - "epoch": 0.93, - "learning_rate": 3.7183006239602117e-06, - "loss": 2.1877, - "step": 530790 - }, - { - "epoch": 0.93, - "learning_rate": 3.7174286840333846e-06, - "loss": 2.2782, - "step": 530800 - }, - { - "epoch": 0.93, - "learning_rate": 3.7165567441065584e-06, - "loss": 2.2273, - "step": 530810 - }, - { - "epoch": 0.93, - "learning_rate": 3.7156848041797317e-06, - "loss": 2.2624, - "step": 530820 - }, - { - "epoch": 0.93, - "learning_rate": 3.7148128642529046e-06, - "loss": 2.1843, - "step": 530830 - }, - { - "epoch": 0.93, - "learning_rate": 3.713940924326078e-06, - "loss": 2.2825, - "step": 530840 - }, - { - "epoch": 0.93, - "learning_rate": 3.713068984399251e-06, - "loss": 2.2386, - "step": 530850 - }, - { - "epoch": 0.93, - "learning_rate": 3.7121970444724242e-06, - "loss": 2.1365, - "step": 530860 - }, - { - "epoch": 0.93, - "learning_rate": 3.7113251045455976e-06, - "loss": 2.1917, - "step": 530870 - }, - { - "epoch": 0.93, - "learning_rate": 3.7104531646187705e-06, - "loss": 2.303, - "step": 530880 - }, - { - "epoch": 0.93, - "learning_rate": 3.709581224691944e-06, - "loss": 2.2696, - "step": 530890 - }, - { - "epoch": 0.93, - "learning_rate": 3.7087092847651168e-06, - "loss": 2.2281, - "step": 530900 - }, - { - "epoch": 0.93, - "learning_rate": 3.70783734483829e-06, - "loss": 2.1166, - "step": 530910 - }, - { - "epoch": 0.93, - "learning_rate": 3.706965404911463e-06, - "loss": 2.2791, - "step": 530920 - }, - { - "epoch": 0.93, - "learning_rate": 3.7060934649846364e-06, - "loss": 2.3143, - "step": 530930 - }, - { - "epoch": 0.93, - "learning_rate": 3.70522152505781e-06, - "loss": 2.1888, - "step": 530940 - }, - { - "epoch": 0.93, - "learning_rate": 3.704349585130983e-06, - "loss": 2.2018, - "step": 530950 - }, - { - "epoch": 0.93, - "learning_rate": 3.7034776452041564e-06, - "loss": 2.2419, - "step": 530960 - }, - { - "epoch": 0.93, - "learning_rate": 3.7026057052773294e-06, - "loss": 2.3235, - "step": 530970 - }, - { - "epoch": 0.93, - "learning_rate": 3.7017337653505027e-06, - "loss": 2.4075, - "step": 530980 - }, - { - "epoch": 0.93, - "learning_rate": 3.700861825423676e-06, - "loss": 2.2271, - "step": 530990 - }, - { - "epoch": 0.93, - "learning_rate": 3.699989885496849e-06, - "loss": 2.2836, - "step": 531000 - }, - { - "epoch": 0.93, - "learning_rate": 3.6991179455700223e-06, - "loss": 2.2379, - "step": 531010 - }, - { - "epoch": 0.93, - "learning_rate": 3.6982460056431952e-06, - "loss": 2.226, - "step": 531020 - }, - { - "epoch": 0.93, - "learning_rate": 3.6973740657163686e-06, - "loss": 2.3035, - "step": 531030 - }, - { - "epoch": 0.93, - "learning_rate": 3.6965021257895415e-06, - "loss": 2.3299, - "step": 531040 - }, - { - "epoch": 0.93, - "learning_rate": 3.695630185862715e-06, - "loss": 2.2689, - "step": 531050 - }, - { - "epoch": 0.93, - "learning_rate": 3.6947582459358878e-06, - "loss": 2.083, - "step": 531060 - }, - { - "epoch": 0.93, - "learning_rate": 3.6938863060090616e-06, - "loss": 2.3011, - "step": 531070 - }, - { - "epoch": 0.93, - "learning_rate": 3.693014366082235e-06, - "loss": 2.3382, - "step": 531080 - }, - { - "epoch": 0.93, - "learning_rate": 3.692142426155408e-06, - "loss": 2.2576, - "step": 531090 - }, - { - "epoch": 0.93, - "learning_rate": 3.691270486228581e-06, - "loss": 2.2803, - "step": 531100 - }, - { - "epoch": 0.93, - "learning_rate": 3.690398546301754e-06, - "loss": 2.2515, - "step": 531110 - }, - { - "epoch": 0.93, - "learning_rate": 3.6895266063749274e-06, - "loss": 2.2292, - "step": 531120 - }, - { - "epoch": 0.93, - "learning_rate": 3.6886546664481008e-06, - "loss": 2.3099, - "step": 531130 - }, - { - "epoch": 0.93, - "learning_rate": 3.6877827265212737e-06, - "loss": 2.2523, - "step": 531140 - }, - { - "epoch": 0.93, - "learning_rate": 3.686910786594447e-06, - "loss": 2.342, - "step": 531150 - }, - { - "epoch": 0.93, - "learning_rate": 3.68603884666762e-06, - "loss": 2.3068, - "step": 531160 - }, - { - "epoch": 0.93, - "learning_rate": 3.6851669067407933e-06, - "loss": 2.2895, - "step": 531170 - }, - { - "epoch": 0.93, - "learning_rate": 3.6842949668139662e-06, - "loss": 2.1714, - "step": 531180 - }, - { - "epoch": 0.93, - "learning_rate": 3.6834230268871396e-06, - "loss": 2.2728, - "step": 531190 - }, - { - "epoch": 0.93, - "learning_rate": 3.6825510869603125e-06, - "loss": 2.2842, - "step": 531200 - }, - { - "epoch": 0.93, - "learning_rate": 3.6816791470334863e-06, - "loss": 2.153, - "step": 531210 - }, - { - "epoch": 0.93, - "learning_rate": 3.6808072071066596e-06, - "loss": 2.3774, - "step": 531220 - }, - { - "epoch": 0.93, - "learning_rate": 3.6799352671798326e-06, - "loss": 2.3966, - "step": 531230 - }, - { - "epoch": 0.93, - "learning_rate": 3.679063327253006e-06, - "loss": 2.2222, - "step": 531240 - }, - { - "epoch": 0.93, - "learning_rate": 3.6781913873261792e-06, - "loss": 2.2868, - "step": 531250 - }, - { - "epoch": 0.93, - "learning_rate": 3.677319447399352e-06, - "loss": 2.2377, - "step": 531260 - }, - { - "epoch": 0.93, - "learning_rate": 3.6764475074725255e-06, - "loss": 2.3106, - "step": 531270 - }, - { - "epoch": 0.93, - "learning_rate": 3.6755755675456984e-06, - "loss": 2.3176, - "step": 531280 - }, - { - "epoch": 0.93, - "learning_rate": 3.6747036276188718e-06, - "loss": 2.2431, - "step": 531290 - }, - { - "epoch": 0.93, - "learning_rate": 3.6738316876920447e-06, - "loss": 2.2523, - "step": 531300 - }, - { - "epoch": 0.93, - "learning_rate": 3.672959747765218e-06, - "loss": 2.1491, - "step": 531310 - }, - { - "epoch": 0.93, - "learning_rate": 3.672087807838391e-06, - "loss": 2.228, - "step": 531320 - }, - { - "epoch": 0.93, - "learning_rate": 3.6712158679115643e-06, - "loss": 2.276, - "step": 531330 - }, - { - "epoch": 0.93, - "learning_rate": 3.670343927984738e-06, - "loss": 2.1837, - "step": 531340 - }, - { - "epoch": 0.93, - "learning_rate": 3.669471988057911e-06, - "loss": 2.3741, - "step": 531350 - }, - { - "epoch": 0.93, - "learning_rate": 3.6686000481310844e-06, - "loss": 2.2402, - "step": 531360 - }, - { - "epoch": 0.93, - "learning_rate": 3.6677281082042577e-06, - "loss": 2.209, - "step": 531370 - }, - { - "epoch": 0.93, - "learning_rate": 3.6668561682774306e-06, - "loss": 2.3007, - "step": 531380 - }, - { - "epoch": 0.93, - "learning_rate": 3.665984228350604e-06, - "loss": 2.2506, - "step": 531390 - }, - { - "epoch": 0.93, - "learning_rate": 3.665112288423777e-06, - "loss": 2.1751, - "step": 531400 - }, - { - "epoch": 0.93, - "learning_rate": 3.6642403484969502e-06, - "loss": 2.2998, - "step": 531410 - }, - { - "epoch": 0.93, - "learning_rate": 3.663368408570123e-06, - "loss": 2.3238, - "step": 531420 - }, - { - "epoch": 0.93, - "learning_rate": 3.6624964686432965e-06, - "loss": 2.2079, - "step": 531430 - }, - { - "epoch": 0.93, - "learning_rate": 3.6616245287164694e-06, - "loss": 2.1828, - "step": 531440 - }, - { - "epoch": 0.93, - "learning_rate": 3.6607525887896428e-06, - "loss": 2.284, - "step": 531450 - }, - { - "epoch": 0.93, - "learning_rate": 3.6598806488628157e-06, - "loss": 2.1897, - "step": 531460 - }, - { - "epoch": 0.93, - "learning_rate": 3.6590087089359895e-06, - "loss": 2.3235, - "step": 531470 - }, - { - "epoch": 0.93, - "learning_rate": 3.658136769009163e-06, - "loss": 2.2138, - "step": 531480 - }, - { - "epoch": 0.93, - "learning_rate": 3.6572648290823357e-06, - "loss": 2.2282, - "step": 531490 - }, - { - "epoch": 0.93, - "learning_rate": 3.656392889155509e-06, - "loss": 2.2667, - "step": 531500 - }, - { - "epoch": 0.93, - "learning_rate": 3.6555209492286824e-06, - "loss": 2.3041, - "step": 531510 - }, - { - "epoch": 0.93, - "learning_rate": 3.6546490093018554e-06, - "loss": 2.3017, - "step": 531520 - }, - { - "epoch": 0.93, - "learning_rate": 3.6537770693750287e-06, - "loss": 2.3076, - "step": 531530 - }, - { - "epoch": 0.93, - "learning_rate": 3.6529051294482016e-06, - "loss": 2.1581, - "step": 531540 - }, - { - "epoch": 0.93, - "learning_rate": 3.652033189521375e-06, - "loss": 2.1707, - "step": 531550 - }, - { - "epoch": 0.93, - "learning_rate": 3.651161249594548e-06, - "loss": 2.2171, - "step": 531560 - }, - { - "epoch": 0.93, - "learning_rate": 3.6502893096677212e-06, - "loss": 2.2004, - "step": 531570 - }, - { - "epoch": 0.93, - "learning_rate": 3.649417369740894e-06, - "loss": 2.2313, - "step": 531580 - }, - { - "epoch": 0.93, - "learning_rate": 3.6485454298140675e-06, - "loss": 2.2715, - "step": 531590 - }, - { - "epoch": 0.93, - "learning_rate": 3.6476734898872404e-06, - "loss": 2.3293, - "step": 531600 - }, - { - "epoch": 0.93, - "learning_rate": 3.646801549960414e-06, - "loss": 2.2932, - "step": 531610 - }, - { - "epoch": 0.93, - "learning_rate": 3.6459296100335876e-06, - "loss": 2.2361, - "step": 531620 - }, - { - "epoch": 0.93, - "learning_rate": 3.645057670106761e-06, - "loss": 2.3005, - "step": 531630 - }, - { - "epoch": 0.93, - "learning_rate": 3.644185730179934e-06, - "loss": 2.2168, - "step": 531640 - }, - { - "epoch": 0.93, - "learning_rate": 3.643313790253107e-06, - "loss": 2.3165, - "step": 531650 - }, - { - "epoch": 0.93, - "learning_rate": 3.64244185032628e-06, - "loss": 2.2469, - "step": 531660 - }, - { - "epoch": 0.93, - "learning_rate": 3.6415699103994534e-06, - "loss": 2.3345, - "step": 531670 - }, - { - "epoch": 0.93, - "learning_rate": 3.6406979704726264e-06, - "loss": 2.3305, - "step": 531680 - }, - { - "epoch": 0.93, - "learning_rate": 3.6398260305457997e-06, - "loss": 2.2385, - "step": 531690 - }, - { - "epoch": 0.93, - "learning_rate": 3.6389540906189726e-06, - "loss": 2.3255, - "step": 531700 - }, - { - "epoch": 0.93, - "learning_rate": 3.638082150692146e-06, - "loss": 2.2056, - "step": 531710 - }, - { - "epoch": 0.93, - "learning_rate": 3.637210210765319e-06, - "loss": 2.1902, - "step": 531720 - }, - { - "epoch": 0.93, - "learning_rate": 3.6363382708384922e-06, - "loss": 2.218, - "step": 531730 - }, - { - "epoch": 0.93, - "learning_rate": 3.635466330911666e-06, - "loss": 2.2024, - "step": 531740 - }, - { - "epoch": 0.93, - "learning_rate": 3.634594390984839e-06, - "loss": 2.1747, - "step": 531750 - }, - { - "epoch": 0.93, - "learning_rate": 3.6337224510580123e-06, - "loss": 2.319, - "step": 531760 - }, - { - "epoch": 0.93, - "learning_rate": 3.6328505111311856e-06, - "loss": 2.243, - "step": 531770 - }, - { - "epoch": 0.93, - "learning_rate": 3.6319785712043586e-06, - "loss": 2.1829, - "step": 531780 - }, - { - "epoch": 0.93, - "learning_rate": 3.631106631277532e-06, - "loss": 2.2186, - "step": 531790 - }, - { - "epoch": 0.93, - "learning_rate": 3.630234691350705e-06, - "loss": 2.1927, - "step": 531800 - }, - { - "epoch": 0.93, - "learning_rate": 3.629362751423878e-06, - "loss": 2.2249, - "step": 531810 - }, - { - "epoch": 0.93, - "learning_rate": 3.628490811497051e-06, - "loss": 2.2447, - "step": 531820 - }, - { - "epoch": 0.93, - "learning_rate": 3.6276188715702244e-06, - "loss": 2.1663, - "step": 531830 - }, - { - "epoch": 0.93, - "learning_rate": 3.6267469316433974e-06, - "loss": 2.3668, - "step": 531840 - }, - { - "epoch": 0.93, - "learning_rate": 3.6258749917165707e-06, - "loss": 2.2507, - "step": 531850 - }, - { - "epoch": 0.93, - "learning_rate": 3.6250030517897436e-06, - "loss": 2.3141, - "step": 531860 - }, - { - "epoch": 0.93, - "learning_rate": 3.6241311118629174e-06, - "loss": 2.188, - "step": 531870 - }, - { - "epoch": 0.93, - "learning_rate": 3.6232591719360907e-06, - "loss": 2.1261, - "step": 531880 - }, - { - "epoch": 0.93, - "learning_rate": 3.622387232009264e-06, - "loss": 2.2262, - "step": 531890 - }, - { - "epoch": 0.93, - "learning_rate": 3.621515292082437e-06, - "loss": 2.213, - "step": 531900 - }, - { - "epoch": 0.93, - "learning_rate": 3.6206433521556104e-06, - "loss": 2.2301, - "step": 531910 - }, - { - "epoch": 0.93, - "learning_rate": 3.6197714122287833e-06, - "loss": 2.2684, - "step": 531920 - }, - { - "epoch": 0.93, - "learning_rate": 3.6188994723019566e-06, - "loss": 2.1987, - "step": 531930 - }, - { - "epoch": 0.93, - "learning_rate": 3.6180275323751296e-06, - "loss": 2.3346, - "step": 531940 - }, - { - "epoch": 0.93, - "learning_rate": 3.617155592448303e-06, - "loss": 2.2453, - "step": 531950 - }, - { - "epoch": 0.93, - "learning_rate": 3.616283652521476e-06, - "loss": 2.2199, - "step": 531960 - }, - { - "epoch": 0.93, - "learning_rate": 3.615411712594649e-06, - "loss": 2.3475, - "step": 531970 - }, - { - "epoch": 0.93, - "learning_rate": 3.614539772667822e-06, - "loss": 2.3182, - "step": 531980 - }, - { - "epoch": 0.93, - "learning_rate": 3.6136678327409954e-06, - "loss": 2.0041, - "step": 531990 - }, - { - "epoch": 0.93, - "learning_rate": 3.6127958928141692e-06, - "loss": 2.2182, - "step": 532000 - }, - { - "epoch": 0.93, - "learning_rate": 3.611923952887342e-06, - "loss": 2.1656, - "step": 532010 - }, - { - "epoch": 0.93, - "learning_rate": 3.6110520129605155e-06, - "loss": 2.3005, - "step": 532020 - }, - { - "epoch": 0.93, - "learning_rate": 3.610180073033689e-06, - "loss": 2.2463, - "step": 532030 - }, - { - "epoch": 0.93, - "learning_rate": 3.6093081331068618e-06, - "loss": 2.1894, - "step": 532040 - }, - { - "epoch": 0.93, - "learning_rate": 3.608436193180035e-06, - "loss": 2.3269, - "step": 532050 - }, - { - "epoch": 0.93, - "learning_rate": 3.607564253253208e-06, - "loss": 2.3251, - "step": 532060 - }, - { - "epoch": 0.93, - "learning_rate": 3.6066923133263814e-06, - "loss": 2.3544, - "step": 532070 - }, - { - "epoch": 0.93, - "learning_rate": 3.6058203733995543e-06, - "loss": 2.3052, - "step": 532080 - }, - { - "epoch": 0.93, - "learning_rate": 3.6049484334727276e-06, - "loss": 2.1812, - "step": 532090 - }, - { - "epoch": 0.93, - "learning_rate": 3.6040764935459006e-06, - "loss": 2.2686, - "step": 532100 - }, - { - "epoch": 0.93, - "learning_rate": 3.603204553619074e-06, - "loss": 2.2499, - "step": 532110 - }, - { - "epoch": 0.93, - "learning_rate": 3.602332613692247e-06, - "loss": 2.1908, - "step": 532120 - }, - { - "epoch": 0.93, - "learning_rate": 3.60146067376542e-06, - "loss": 2.3209, - "step": 532130 - }, - { - "epoch": 0.93, - "learning_rate": 3.600588733838594e-06, - "loss": 2.2806, - "step": 532140 - }, - { - "epoch": 0.93, - "learning_rate": 3.5997167939117673e-06, - "loss": 2.3178, - "step": 532150 - }, - { - "epoch": 0.93, - "learning_rate": 3.5988448539849402e-06, - "loss": 2.2125, - "step": 532160 - }, - { - "epoch": 0.93, - "learning_rate": 3.5979729140581136e-06, - "loss": 2.2375, - "step": 532170 - }, - { - "epoch": 0.93, - "learning_rate": 3.5971009741312865e-06, - "loss": 2.2681, - "step": 532180 - }, - { - "epoch": 0.93, - "learning_rate": 3.59622903420446e-06, - "loss": 2.2903, - "step": 532190 - }, - { - "epoch": 0.93, - "learning_rate": 3.5953570942776328e-06, - "loss": 2.2666, - "step": 532200 - }, - { - "epoch": 0.93, - "learning_rate": 3.594485154350806e-06, - "loss": 2.3087, - "step": 532210 - }, - { - "epoch": 0.93, - "learning_rate": 3.593613214423979e-06, - "loss": 2.2813, - "step": 532220 - }, - { - "epoch": 0.93, - "learning_rate": 3.5927412744971524e-06, - "loss": 2.283, - "step": 532230 - }, - { - "epoch": 0.93, - "learning_rate": 3.5918693345703253e-06, - "loss": 2.3044, - "step": 532240 - }, - { - "epoch": 0.93, - "learning_rate": 3.5909973946434986e-06, - "loss": 2.257, - "step": 532250 - }, - { - "epoch": 0.93, - "learning_rate": 3.5901254547166716e-06, - "loss": 2.2303, - "step": 532260 - }, - { - "epoch": 0.93, - "learning_rate": 3.5892535147898453e-06, - "loss": 2.0543, - "step": 532270 - }, - { - "epoch": 0.93, - "learning_rate": 3.5883815748630187e-06, - "loss": 2.3175, - "step": 532280 - }, - { - "epoch": 0.93, - "learning_rate": 3.587509634936192e-06, - "loss": 2.1778, - "step": 532290 - }, - { - "epoch": 0.93, - "learning_rate": 3.586637695009365e-06, - "loss": 2.279, - "step": 532300 - }, - { - "epoch": 0.93, - "learning_rate": 3.5857657550825383e-06, - "loss": 2.2472, - "step": 532310 - }, - { - "epoch": 0.93, - "learning_rate": 3.5848938151557112e-06, - "loss": 2.1796, - "step": 532320 - }, - { - "epoch": 0.93, - "learning_rate": 3.5840218752288846e-06, - "loss": 2.2346, - "step": 532330 - }, - { - "epoch": 0.93, - "learning_rate": 3.5831499353020575e-06, - "loss": 2.207, - "step": 532340 - }, - { - "epoch": 0.93, - "learning_rate": 3.582277995375231e-06, - "loss": 2.3044, - "step": 532350 - }, - { - "epoch": 0.93, - "learning_rate": 3.5814060554484038e-06, - "loss": 2.2831, - "step": 532360 - }, - { - "epoch": 0.93, - "learning_rate": 3.580534115521577e-06, - "loss": 2.3154, - "step": 532370 - }, - { - "epoch": 0.93, - "learning_rate": 3.57966217559475e-06, - "loss": 2.3359, - "step": 532380 - }, - { - "epoch": 0.93, - "learning_rate": 3.5787902356679234e-06, - "loss": 2.2497, - "step": 532390 - }, - { - "epoch": 0.93, - "learning_rate": 3.577918295741097e-06, - "loss": 2.1722, - "step": 532400 - }, - { - "epoch": 0.93, - "learning_rate": 3.5770463558142705e-06, - "loss": 2.3471, - "step": 532410 - }, - { - "epoch": 0.93, - "learning_rate": 3.5761744158874434e-06, - "loss": 2.2032, - "step": 532420 - }, - { - "epoch": 0.93, - "learning_rate": 3.5753024759606168e-06, - "loss": 2.2162, - "step": 532430 - }, - { - "epoch": 0.93, - "learning_rate": 3.5744305360337897e-06, - "loss": 2.2597, - "step": 532440 - }, - { - "epoch": 0.93, - "learning_rate": 3.573558596106963e-06, - "loss": 2.3014, - "step": 532450 - }, - { - "epoch": 0.93, - "learning_rate": 3.572686656180136e-06, - "loss": 2.3223, - "step": 532460 - }, - { - "epoch": 0.93, - "learning_rate": 3.5718147162533093e-06, - "loss": 2.2229, - "step": 532470 - }, - { - "epoch": 0.93, - "learning_rate": 3.5709427763264822e-06, - "loss": 2.2874, - "step": 532480 - }, - { - "epoch": 0.93, - "learning_rate": 3.5700708363996556e-06, - "loss": 2.1721, - "step": 532490 - }, - { - "epoch": 0.93, - "learning_rate": 3.5691988964728285e-06, - "loss": 2.3954, - "step": 532500 - }, - { - "epoch": 0.93, - "learning_rate": 3.568326956546002e-06, - "loss": 2.2023, - "step": 532510 - }, - { - "epoch": 0.93, - "learning_rate": 3.5674550166191748e-06, - "loss": 2.2505, - "step": 532520 - }, - { - "epoch": 0.93, - "learning_rate": 3.566583076692348e-06, - "loss": 2.3498, - "step": 532530 - }, - { - "epoch": 0.93, - "learning_rate": 3.565711136765522e-06, - "loss": 2.3234, - "step": 532540 - }, - { - "epoch": 0.93, - "learning_rate": 3.5648391968386952e-06, - "loss": 2.32, - "step": 532550 - }, - { - "epoch": 0.93, - "learning_rate": 3.563967256911868e-06, - "loss": 2.2989, - "step": 532560 - }, - { - "epoch": 0.93, - "learning_rate": 3.5630953169850415e-06, - "loss": 2.1259, - "step": 532570 - }, - { - "epoch": 0.93, - "learning_rate": 3.5622233770582144e-06, - "loss": 2.3008, - "step": 532580 - }, - { - "epoch": 0.93, - "learning_rate": 3.5613514371313878e-06, - "loss": 2.2789, - "step": 532590 - }, - { - "epoch": 0.93, - "learning_rate": 3.5604794972045607e-06, - "loss": 2.1415, - "step": 532600 - }, - { - "epoch": 0.93, - "learning_rate": 3.559607557277734e-06, - "loss": 2.2772, - "step": 532610 - }, - { - "epoch": 0.93, - "learning_rate": 3.558735617350907e-06, - "loss": 2.1764, - "step": 532620 - }, - { - "epoch": 0.93, - "learning_rate": 3.5578636774240803e-06, - "loss": 2.2841, - "step": 532630 - }, - { - "epoch": 0.93, - "learning_rate": 3.5569917374972532e-06, - "loss": 2.3178, - "step": 532640 - }, - { - "epoch": 0.93, - "learning_rate": 3.5561197975704266e-06, - "loss": 2.3074, - "step": 532650 - }, - { - "epoch": 0.93, - "learning_rate": 3.5552478576435995e-06, - "loss": 2.2043, - "step": 532660 - }, - { - "epoch": 0.93, - "learning_rate": 3.5543759177167737e-06, - "loss": 2.3038, - "step": 532670 - }, - { - "epoch": 0.93, - "learning_rate": 3.5535039777899466e-06, - "loss": 2.2804, - "step": 532680 - }, - { - "epoch": 0.93, - "learning_rate": 3.55263203786312e-06, - "loss": 2.1827, - "step": 532690 - }, - { - "epoch": 0.93, - "learning_rate": 3.551760097936293e-06, - "loss": 2.163, - "step": 532700 - }, - { - "epoch": 0.93, - "learning_rate": 3.5508881580094662e-06, - "loss": 2.2345, - "step": 532710 - }, - { - "epoch": 0.93, - "learning_rate": 3.550016218082639e-06, - "loss": 2.3177, - "step": 532720 - }, - { - "epoch": 0.93, - "learning_rate": 3.5491442781558125e-06, - "loss": 2.1984, - "step": 532730 - }, - { - "epoch": 0.93, - "learning_rate": 3.5482723382289854e-06, - "loss": 2.2816, - "step": 532740 - }, - { - "epoch": 0.93, - "learning_rate": 3.5474003983021588e-06, - "loss": 2.2675, - "step": 532750 - }, - { - "epoch": 0.93, - "learning_rate": 3.5465284583753317e-06, - "loss": 2.3153, - "step": 532760 - }, - { - "epoch": 0.93, - "learning_rate": 3.545656518448505e-06, - "loss": 2.1843, - "step": 532770 - }, - { - "epoch": 0.93, - "learning_rate": 3.544784578521678e-06, - "loss": 2.235, - "step": 532780 - }, - { - "epoch": 0.93, - "learning_rate": 3.5439126385948513e-06, - "loss": 2.1979, - "step": 532790 - }, - { - "epoch": 0.93, - "learning_rate": 3.543040698668025e-06, - "loss": 2.2039, - "step": 532800 - }, - { - "epoch": 0.93, - "learning_rate": 3.5421687587411984e-06, - "loss": 2.2391, - "step": 532810 - }, - { - "epoch": 0.93, - "learning_rate": 3.5412968188143713e-06, - "loss": 2.2328, - "step": 532820 - }, - { - "epoch": 0.93, - "learning_rate": 3.5404248788875447e-06, - "loss": 2.3527, - "step": 532830 - }, - { - "epoch": 0.93, - "learning_rate": 3.5395529389607176e-06, - "loss": 2.3501, - "step": 532840 - }, - { - "epoch": 0.93, - "learning_rate": 3.538680999033891e-06, - "loss": 2.3038, - "step": 532850 - }, - { - "epoch": 0.93, - "learning_rate": 3.537809059107064e-06, - "loss": 2.3055, - "step": 532860 - }, - { - "epoch": 0.93, - "learning_rate": 3.5369371191802372e-06, - "loss": 2.3335, - "step": 532870 - }, - { - "epoch": 0.93, - "learning_rate": 3.53606517925341e-06, - "loss": 2.1543, - "step": 532880 - }, - { - "epoch": 0.93, - "learning_rate": 3.5351932393265835e-06, - "loss": 2.3897, - "step": 532890 - }, - { - "epoch": 0.93, - "learning_rate": 3.5343212993997564e-06, - "loss": 2.345, - "step": 532900 - }, - { - "epoch": 0.93, - "learning_rate": 3.5334493594729298e-06, - "loss": 2.2098, - "step": 532910 - }, - { - "epoch": 0.93, - "learning_rate": 3.5325774195461027e-06, - "loss": 2.2146, - "step": 532920 - }, - { - "epoch": 0.93, - "learning_rate": 3.531705479619276e-06, - "loss": 2.3104, - "step": 532930 - }, - { - "epoch": 0.93, - "learning_rate": 3.53083353969245e-06, - "loss": 2.2872, - "step": 532940 - }, - { - "epoch": 0.93, - "learning_rate": 3.529961599765623e-06, - "loss": 2.1525, - "step": 532950 - }, - { - "epoch": 0.93, - "learning_rate": 3.529089659838796e-06, - "loss": 2.2936, - "step": 532960 - }, - { - "epoch": 0.93, - "learning_rate": 3.5282177199119694e-06, - "loss": 2.2488, - "step": 532970 - }, - { - "epoch": 0.93, - "learning_rate": 3.5273457799851423e-06, - "loss": 2.2132, - "step": 532980 - }, - { - "epoch": 0.93, - "learning_rate": 3.5264738400583157e-06, - "loss": 2.1815, - "step": 532990 - }, - { - "epoch": 0.93, - "learning_rate": 3.5256019001314886e-06, - "loss": 2.1018, - "step": 533000 - }, - { - "epoch": 0.93, - "learning_rate": 3.524729960204662e-06, - "loss": 2.2702, - "step": 533010 - }, - { - "epoch": 0.93, - "learning_rate": 3.523858020277835e-06, - "loss": 2.2127, - "step": 533020 - }, - { - "epoch": 0.93, - "learning_rate": 3.5229860803510082e-06, - "loss": 2.3189, - "step": 533030 - }, - { - "epoch": 0.93, - "learning_rate": 3.522114140424181e-06, - "loss": 2.1812, - "step": 533040 - }, - { - "epoch": 0.93, - "learning_rate": 3.5212422004973545e-06, - "loss": 2.3011, - "step": 533050 - }, - { - "epoch": 0.93, - "learning_rate": 3.5203702605705274e-06, - "loss": 2.1871, - "step": 533060 - }, - { - "epoch": 0.93, - "learning_rate": 3.5194983206437016e-06, - "loss": 2.2964, - "step": 533070 - }, - { - "epoch": 0.93, - "learning_rate": 3.5186263807168745e-06, - "loss": 2.2158, - "step": 533080 - }, - { - "epoch": 0.93, - "learning_rate": 3.517754440790048e-06, - "loss": 2.2663, - "step": 533090 - }, - { - "epoch": 0.93, - "learning_rate": 3.516882500863221e-06, - "loss": 2.3093, - "step": 533100 - }, - { - "epoch": 0.93, - "learning_rate": 3.516010560936394e-06, - "loss": 2.2594, - "step": 533110 - }, - { - "epoch": 0.93, - "learning_rate": 3.515138621009567e-06, - "loss": 2.3665, - "step": 533120 - }, - { - "epoch": 0.93, - "learning_rate": 3.5142666810827404e-06, - "loss": 2.1679, - "step": 533130 - }, - { - "epoch": 0.93, - "learning_rate": 3.5133947411559133e-06, - "loss": 2.3013, - "step": 533140 - }, - { - "epoch": 0.93, - "learning_rate": 3.5125228012290867e-06, - "loss": 2.3236, - "step": 533150 - }, - { - "epoch": 0.93, - "learning_rate": 3.5116508613022596e-06, - "loss": 2.2488, - "step": 533160 - }, - { - "epoch": 0.93, - "learning_rate": 3.510778921375433e-06, - "loss": 2.3885, - "step": 533170 - }, - { - "epoch": 0.93, - "learning_rate": 3.509906981448606e-06, - "loss": 2.1666, - "step": 533180 - }, - { - "epoch": 0.93, - "learning_rate": 3.5090350415217792e-06, - "loss": 2.3521, - "step": 533190 - }, - { - "epoch": 0.93, - "learning_rate": 3.508163101594953e-06, - "loss": 2.2115, - "step": 533200 - }, - { - "epoch": 0.93, - "learning_rate": 3.5072911616681263e-06, - "loss": 2.2578, - "step": 533210 - }, - { - "epoch": 0.93, - "learning_rate": 3.5064192217412993e-06, - "loss": 2.1985, - "step": 533220 - }, - { - "epoch": 0.93, - "learning_rate": 3.5055472818144726e-06, - "loss": 2.2874, - "step": 533230 - }, - { - "epoch": 0.93, - "learning_rate": 3.5046753418876455e-06, - "loss": 2.239, - "step": 533240 - }, - { - "epoch": 0.93, - "learning_rate": 3.503803401960819e-06, - "loss": 2.2371, - "step": 533250 - }, - { - "epoch": 0.93, - "learning_rate": 3.502931462033992e-06, - "loss": 2.2925, - "step": 533260 - }, - { - "epoch": 0.93, - "learning_rate": 3.502059522107165e-06, - "loss": 2.2873, - "step": 533270 - }, - { - "epoch": 0.93, - "learning_rate": 3.501187582180338e-06, - "loss": 2.3071, - "step": 533280 - }, - { - "epoch": 0.93, - "learning_rate": 3.5003156422535114e-06, - "loss": 2.1931, - "step": 533290 - }, - { - "epoch": 0.93, - "learning_rate": 3.4994437023266843e-06, - "loss": 2.284, - "step": 533300 - }, - { - "epoch": 0.93, - "learning_rate": 3.4985717623998577e-06, - "loss": 2.3184, - "step": 533310 - }, - { - "epoch": 0.93, - "learning_rate": 3.4976998224730306e-06, - "loss": 2.265, - "step": 533320 - }, - { - "epoch": 0.93, - "learning_rate": 3.496827882546205e-06, - "loss": 2.2631, - "step": 533330 - }, - { - "epoch": 0.93, - "learning_rate": 3.4959559426193777e-06, - "loss": 2.2034, - "step": 533340 - }, - { - "epoch": 0.93, - "learning_rate": 3.495084002692551e-06, - "loss": 2.265, - "step": 533350 - }, - { - "epoch": 0.93, - "learning_rate": 3.494212062765724e-06, - "loss": 2.402, - "step": 533360 - }, - { - "epoch": 0.93, - "learning_rate": 3.4933401228388973e-06, - "loss": 2.4324, - "step": 533370 - }, - { - "epoch": 0.93, - "learning_rate": 3.4924681829120703e-06, - "loss": 2.2677, - "step": 533380 - }, - { - "epoch": 0.93, - "learning_rate": 3.4915962429852436e-06, - "loss": 2.255, - "step": 533390 - }, - { - "epoch": 0.93, - "learning_rate": 3.4907243030584165e-06, - "loss": 2.1521, - "step": 533400 - }, - { - "epoch": 0.93, - "learning_rate": 3.48985236313159e-06, - "loss": 2.3285, - "step": 533410 - }, - { - "epoch": 0.93, - "learning_rate": 3.488980423204763e-06, - "loss": 2.1899, - "step": 533420 - }, - { - "epoch": 0.93, - "learning_rate": 3.488108483277936e-06, - "loss": 2.1583, - "step": 533430 - }, - { - "epoch": 0.93, - "learning_rate": 3.487236543351109e-06, - "loss": 2.2142, - "step": 533440 - }, - { - "epoch": 0.93, - "learning_rate": 3.4863646034242824e-06, - "loss": 2.2307, - "step": 533450 - }, - { - "epoch": 0.93, - "learning_rate": 3.4854926634974553e-06, - "loss": 2.129, - "step": 533460 - }, - { - "epoch": 0.93, - "learning_rate": 3.4846207235706295e-06, - "loss": 2.299, - "step": 533470 - }, - { - "epoch": 0.93, - "learning_rate": 3.4837487836438025e-06, - "loss": 2.226, - "step": 533480 - }, - { - "epoch": 0.93, - "learning_rate": 3.482876843716976e-06, - "loss": 2.18, - "step": 533490 - }, - { - "epoch": 0.93, - "learning_rate": 3.4820049037901487e-06, - "loss": 2.3491, - "step": 533500 - }, - { - "epoch": 0.93, - "learning_rate": 3.481132963863322e-06, - "loss": 2.2945, - "step": 533510 - }, - { - "epoch": 0.93, - "learning_rate": 3.480261023936495e-06, - "loss": 2.2743, - "step": 533520 - }, - { - "epoch": 0.93, - "learning_rate": 3.4793890840096683e-06, - "loss": 2.281, - "step": 533530 - }, - { - "epoch": 0.93, - "learning_rate": 3.4785171440828413e-06, - "loss": 2.3046, - "step": 533540 - }, - { - "epoch": 0.93, - "learning_rate": 3.4776452041560146e-06, - "loss": 2.1625, - "step": 533550 - }, - { - "epoch": 0.93, - "learning_rate": 3.4767732642291875e-06, - "loss": 2.2506, - "step": 533560 - }, - { - "epoch": 0.93, - "learning_rate": 3.475901324302361e-06, - "loss": 2.2378, - "step": 533570 - }, - { - "epoch": 0.93, - "learning_rate": 3.475029384375534e-06, - "loss": 2.2099, - "step": 533580 - }, - { - "epoch": 0.93, - "learning_rate": 3.474157444448707e-06, - "loss": 2.2845, - "step": 533590 - }, - { - "epoch": 0.93, - "learning_rate": 3.473285504521881e-06, - "loss": 2.307, - "step": 533600 - }, - { - "epoch": 0.93, - "learning_rate": 3.4724135645950543e-06, - "loss": 2.2424, - "step": 533610 - }, - { - "epoch": 0.93, - "learning_rate": 3.471541624668227e-06, - "loss": 2.2955, - "step": 533620 - }, - { - "epoch": 0.93, - "learning_rate": 3.4706696847414005e-06, - "loss": 2.2231, - "step": 533630 - }, - { - "epoch": 0.93, - "learning_rate": 3.4697977448145735e-06, - "loss": 2.2253, - "step": 533640 - }, - { - "epoch": 0.93, - "learning_rate": 3.468925804887747e-06, - "loss": 2.2533, - "step": 533650 - }, - { - "epoch": 0.93, - "learning_rate": 3.4680538649609197e-06, - "loss": 2.3474, - "step": 533660 - }, - { - "epoch": 0.93, - "learning_rate": 3.467181925034093e-06, - "loss": 2.3044, - "step": 533670 - }, - { - "epoch": 0.93, - "learning_rate": 3.466309985107266e-06, - "loss": 2.2864, - "step": 533680 - }, - { - "epoch": 0.93, - "learning_rate": 3.4654380451804393e-06, - "loss": 2.2088, - "step": 533690 - }, - { - "epoch": 0.93, - "learning_rate": 3.4645661052536123e-06, - "loss": 2.288, - "step": 533700 - }, - { - "epoch": 0.93, - "learning_rate": 3.4636941653267856e-06, - "loss": 2.2948, - "step": 533710 - }, - { - "epoch": 0.93, - "learning_rate": 3.4628222253999585e-06, - "loss": 2.2674, - "step": 533720 - }, - { - "epoch": 0.93, - "learning_rate": 3.4619502854731327e-06, - "loss": 2.1449, - "step": 533730 - }, - { - "epoch": 0.93, - "learning_rate": 3.4610783455463057e-06, - "loss": 2.1584, - "step": 533740 - }, - { - "epoch": 0.93, - "learning_rate": 3.460206405619479e-06, - "loss": 2.2557, - "step": 533750 - }, - { - "epoch": 0.93, - "learning_rate": 3.459334465692652e-06, - "loss": 2.2228, - "step": 533760 - }, - { - "epoch": 0.93, - "learning_rate": 3.4584625257658253e-06, - "loss": 2.2678, - "step": 533770 - }, - { - "epoch": 0.93, - "learning_rate": 3.457590585838998e-06, - "loss": 2.1563, - "step": 533780 - }, - { - "epoch": 0.93, - "learning_rate": 3.4567186459121715e-06, - "loss": 2.3384, - "step": 533790 - }, - { - "epoch": 0.93, - "learning_rate": 3.4558467059853445e-06, - "loss": 2.2342, - "step": 533800 - }, - { - "epoch": 0.93, - "learning_rate": 3.454974766058518e-06, - "loss": 2.2086, - "step": 533810 - }, - { - "epoch": 0.93, - "learning_rate": 3.4541028261316907e-06, - "loss": 2.2482, - "step": 533820 - }, - { - "epoch": 0.93, - "learning_rate": 3.453230886204864e-06, - "loss": 2.3153, - "step": 533830 - }, - { - "epoch": 0.93, - "learning_rate": 3.452358946278037e-06, - "loss": 2.2546, - "step": 533840 - }, - { - "epoch": 0.93, - "learning_rate": 3.4514870063512103e-06, - "loss": 2.2646, - "step": 533850 - }, - { - "epoch": 0.93, - "learning_rate": 3.4506150664243833e-06, - "loss": 2.0877, - "step": 533860 - }, - { - "epoch": 0.93, - "learning_rate": 3.4497431264975575e-06, - "loss": 2.2811, - "step": 533870 - }, - { - "epoch": 0.93, - "learning_rate": 3.4488711865707304e-06, - "loss": 2.2165, - "step": 533880 - }, - { - "epoch": 0.93, - "learning_rate": 3.4479992466439037e-06, - "loss": 2.2715, - "step": 533890 - }, - { - "epoch": 0.93, - "learning_rate": 3.4471273067170767e-06, - "loss": 2.2576, - "step": 533900 - }, - { - "epoch": 0.93, - "learning_rate": 3.44625536679025e-06, - "loss": 2.2876, - "step": 533910 - }, - { - "epoch": 0.93, - "learning_rate": 3.445383426863423e-06, - "loss": 2.2891, - "step": 533920 - }, - { - "epoch": 0.93, - "learning_rate": 3.4445114869365963e-06, - "loss": 2.1243, - "step": 533930 - }, - { - "epoch": 0.93, - "learning_rate": 3.443639547009769e-06, - "loss": 2.2856, - "step": 533940 - }, - { - "epoch": 0.93, - "learning_rate": 3.4427676070829425e-06, - "loss": 2.2452, - "step": 533950 - }, - { - "epoch": 0.93, - "learning_rate": 3.4418956671561155e-06, - "loss": 2.3078, - "step": 533960 - }, - { - "epoch": 0.93, - "learning_rate": 3.441023727229289e-06, - "loss": 2.2704, - "step": 533970 - }, - { - "epoch": 0.93, - "learning_rate": 3.4401517873024617e-06, - "loss": 2.396, - "step": 533980 - }, - { - "epoch": 0.93, - "learning_rate": 3.439279847375635e-06, - "loss": 2.2718, - "step": 533990 - }, - { - "epoch": 0.93, - "learning_rate": 3.438407907448809e-06, - "loss": 2.1842, - "step": 534000 - }, - { - "epoch": 0.93, - "learning_rate": 3.437535967521982e-06, - "loss": 2.2311, - "step": 534010 - }, - { - "epoch": 0.93, - "learning_rate": 3.436664027595155e-06, - "loss": 2.1971, - "step": 534020 - }, - { - "epoch": 0.93, - "learning_rate": 3.4357920876683285e-06, - "loss": 2.2959, - "step": 534030 - }, - { - "epoch": 0.93, - "learning_rate": 3.4349201477415014e-06, - "loss": 2.2511, - "step": 534040 - }, - { - "epoch": 0.93, - "learning_rate": 3.4340482078146747e-06, - "loss": 2.225, - "step": 534050 - }, - { - "epoch": 0.93, - "learning_rate": 3.4331762678878477e-06, - "loss": 2.3078, - "step": 534060 - }, - { - "epoch": 0.93, - "learning_rate": 3.432304327961021e-06, - "loss": 2.2912, - "step": 534070 - }, - { - "epoch": 0.93, - "learning_rate": 3.431432388034194e-06, - "loss": 2.3061, - "step": 534080 - }, - { - "epoch": 0.93, - "learning_rate": 3.4305604481073673e-06, - "loss": 2.2225, - "step": 534090 - }, - { - "epoch": 0.93, - "learning_rate": 3.42968850818054e-06, - "loss": 2.2274, - "step": 534100 - }, - { - "epoch": 0.93, - "learning_rate": 3.4288165682537135e-06, - "loss": 2.353, - "step": 534110 - }, - { - "epoch": 0.93, - "learning_rate": 3.4279446283268865e-06, - "loss": 2.2081, - "step": 534120 - }, - { - "epoch": 0.93, - "learning_rate": 3.4270726884000607e-06, - "loss": 2.2648, - "step": 534130 - }, - { - "epoch": 0.93, - "learning_rate": 3.4262007484732336e-06, - "loss": 2.282, - "step": 534140 - }, - { - "epoch": 0.93, - "learning_rate": 3.425328808546407e-06, - "loss": 2.3338, - "step": 534150 - }, - { - "epoch": 0.93, - "learning_rate": 3.42445686861958e-06, - "loss": 2.3397, - "step": 534160 - }, - { - "epoch": 0.93, - "learning_rate": 3.423584928692753e-06, - "loss": 2.2898, - "step": 534170 - }, - { - "epoch": 0.93, - "learning_rate": 3.422712988765926e-06, - "loss": 2.2992, - "step": 534180 - }, - { - "epoch": 0.93, - "learning_rate": 3.4218410488390995e-06, - "loss": 2.2678, - "step": 534190 - }, - { - "epoch": 0.93, - "learning_rate": 3.4209691089122724e-06, - "loss": 2.1875, - "step": 534200 - }, - { - "epoch": 0.93, - "learning_rate": 3.4200971689854457e-06, - "loss": 2.2489, - "step": 534210 - }, - { - "epoch": 0.93, - "learning_rate": 3.4192252290586187e-06, - "loss": 2.3225, - "step": 534220 - }, - { - "epoch": 0.93, - "learning_rate": 3.418353289131792e-06, - "loss": 2.2155, - "step": 534230 - }, - { - "epoch": 0.93, - "learning_rate": 3.417481349204965e-06, - "loss": 2.2621, - "step": 534240 - }, - { - "epoch": 0.93, - "learning_rate": 3.4166094092781383e-06, - "loss": 2.2432, - "step": 534250 - }, - { - "epoch": 0.93, - "learning_rate": 3.415737469351311e-06, - "loss": 2.2718, - "step": 534260 - }, - { - "epoch": 0.93, - "learning_rate": 3.4148655294244854e-06, - "loss": 2.2298, - "step": 534270 - }, - { - "epoch": 0.93, - "learning_rate": 3.4139935894976583e-06, - "loss": 2.2712, - "step": 534280 - }, - { - "epoch": 0.93, - "learning_rate": 3.4131216495708317e-06, - "loss": 2.2153, - "step": 534290 - }, - { - "epoch": 0.93, - "learning_rate": 3.4122497096440046e-06, - "loss": 2.2556, - "step": 534300 - }, - { - "epoch": 0.93, - "learning_rate": 3.411377769717178e-06, - "loss": 2.1313, - "step": 534310 - }, - { - "epoch": 0.93, - "learning_rate": 3.410505829790351e-06, - "loss": 2.2606, - "step": 534320 - }, - { - "epoch": 0.93, - "learning_rate": 3.409633889863524e-06, - "loss": 2.2666, - "step": 534330 - }, - { - "epoch": 0.93, - "learning_rate": 3.408761949936697e-06, - "loss": 2.2232, - "step": 534340 - }, - { - "epoch": 0.93, - "learning_rate": 3.4078900100098705e-06, - "loss": 2.2947, - "step": 534350 - }, - { - "epoch": 0.93, - "learning_rate": 3.4070180700830434e-06, - "loss": 2.199, - "step": 534360 - }, - { - "epoch": 0.93, - "learning_rate": 3.4061461301562167e-06, - "loss": 2.3334, - "step": 534370 - }, - { - "epoch": 0.93, - "learning_rate": 3.4052741902293897e-06, - "loss": 2.2286, - "step": 534380 - }, - { - "epoch": 0.93, - "learning_rate": 3.404402250302563e-06, - "loss": 2.1579, - "step": 534390 - }, - { - "epoch": 0.93, - "learning_rate": 3.4035303103757368e-06, - "loss": 2.2231, - "step": 534400 - }, - { - "epoch": 0.93, - "learning_rate": 3.40265837044891e-06, - "loss": 2.143, - "step": 534410 - }, - { - "epoch": 0.93, - "learning_rate": 3.401786430522083e-06, - "loss": 2.1563, - "step": 534420 - }, - { - "epoch": 0.93, - "learning_rate": 3.4009144905952564e-06, - "loss": 2.1365, - "step": 534430 - }, - { - "epoch": 0.93, - "learning_rate": 3.4000425506684293e-06, - "loss": 2.1862, - "step": 534440 - }, - { - "epoch": 0.93, - "learning_rate": 3.3991706107416027e-06, - "loss": 2.3183, - "step": 534450 - }, - { - "epoch": 0.93, - "learning_rate": 3.3982986708147756e-06, - "loss": 2.2022, - "step": 534460 - }, - { - "epoch": 0.93, - "learning_rate": 3.397426730887949e-06, - "loss": 2.2973, - "step": 534470 - }, - { - "epoch": 0.93, - "learning_rate": 3.396554790961122e-06, - "loss": 2.1479, - "step": 534480 - }, - { - "epoch": 0.93, - "learning_rate": 3.395682851034295e-06, - "loss": 2.3197, - "step": 534490 - }, - { - "epoch": 0.93, - "learning_rate": 3.394810911107468e-06, - "loss": 2.3254, - "step": 534500 - }, - { - "epoch": 0.93, - "learning_rate": 3.3939389711806415e-06, - "loss": 2.2445, - "step": 534510 - }, - { - "epoch": 0.93, - "learning_rate": 3.3930670312538144e-06, - "loss": 2.2181, - "step": 534520 - }, - { - "epoch": 0.93, - "learning_rate": 3.3921950913269886e-06, - "loss": 2.1547, - "step": 534530 - }, - { - "epoch": 0.93, - "learning_rate": 3.3913231514001615e-06, - "loss": 2.4095, - "step": 534540 - }, - { - "epoch": 0.93, - "learning_rate": 3.390451211473335e-06, - "loss": 2.1781, - "step": 534550 - }, - { - "epoch": 0.93, - "learning_rate": 3.3895792715465078e-06, - "loss": 2.2839, - "step": 534560 - }, - { - "epoch": 0.93, - "learning_rate": 3.388707331619681e-06, - "loss": 2.2618, - "step": 534570 - }, - { - "epoch": 0.93, - "learning_rate": 3.387835391692854e-06, - "loss": 2.3502, - "step": 534580 - }, - { - "epoch": 0.93, - "learning_rate": 3.3869634517660274e-06, - "loss": 2.2531, - "step": 534590 - }, - { - "epoch": 0.93, - "learning_rate": 3.3860915118392003e-06, - "loss": 2.1683, - "step": 534600 - }, - { - "epoch": 0.93, - "learning_rate": 3.3852195719123737e-06, - "loss": 2.2914, - "step": 534610 - }, - { - "epoch": 0.93, - "learning_rate": 3.3843476319855466e-06, - "loss": 2.2209, - "step": 534620 - }, - { - "epoch": 0.93, - "learning_rate": 3.38347569205872e-06, - "loss": 2.1329, - "step": 534630 - }, - { - "epoch": 0.93, - "learning_rate": 3.382603752131893e-06, - "loss": 2.2614, - "step": 534640 - }, - { - "epoch": 0.93, - "learning_rate": 3.381731812205066e-06, - "loss": 2.2779, - "step": 534650 - }, - { - "epoch": 0.93, - "learning_rate": 3.38085987227824e-06, - "loss": 2.1359, - "step": 534660 - }, - { - "epoch": 0.93, - "learning_rate": 3.3799879323514133e-06, - "loss": 2.1651, - "step": 534670 - }, - { - "epoch": 0.93, - "learning_rate": 3.3791159924245862e-06, - "loss": 2.2805, - "step": 534680 - }, - { - "epoch": 0.93, - "learning_rate": 3.3782440524977596e-06, - "loss": 2.3253, - "step": 534690 - }, - { - "epoch": 0.93, - "learning_rate": 3.3773721125709325e-06, - "loss": 2.2763, - "step": 534700 - }, - { - "epoch": 0.93, - "learning_rate": 3.376500172644106e-06, - "loss": 2.1133, - "step": 534710 - }, - { - "epoch": 0.93, - "learning_rate": 3.3756282327172788e-06, - "loss": 2.28, - "step": 534720 - }, - { - "epoch": 0.93, - "learning_rate": 3.374756292790452e-06, - "loss": 2.2504, - "step": 534730 - }, - { - "epoch": 0.93, - "learning_rate": 3.373884352863625e-06, - "loss": 2.3417, - "step": 534740 - }, - { - "epoch": 0.93, - "learning_rate": 3.3730124129367984e-06, - "loss": 2.1796, - "step": 534750 - }, - { - "epoch": 0.93, - "learning_rate": 3.3721404730099713e-06, - "loss": 2.2775, - "step": 534760 - }, - { - "epoch": 0.93, - "learning_rate": 3.3712685330831447e-06, - "loss": 2.2932, - "step": 534770 - }, - { - "epoch": 0.93, - "learning_rate": 3.3703965931563176e-06, - "loss": 2.2224, - "step": 534780 - }, - { - "epoch": 0.93, - "learning_rate": 3.369524653229491e-06, - "loss": 2.3642, - "step": 534790 - }, - { - "epoch": 0.93, - "learning_rate": 3.3686527133026647e-06, - "loss": 2.2552, - "step": 534800 - }, - { - "epoch": 0.93, - "learning_rate": 3.367780773375838e-06, - "loss": 2.253, - "step": 534810 - }, - { - "epoch": 0.93, - "learning_rate": 3.366908833449011e-06, - "loss": 2.2611, - "step": 534820 - }, - { - "epoch": 0.93, - "learning_rate": 3.3660368935221843e-06, - "loss": 2.3071, - "step": 534830 - }, - { - "epoch": 0.93, - "learning_rate": 3.3651649535953572e-06, - "loss": 2.2476, - "step": 534840 - }, - { - "epoch": 0.93, - "learning_rate": 3.3642930136685306e-06, - "loss": 2.2678, - "step": 534850 - }, - { - "epoch": 0.93, - "learning_rate": 3.3634210737417035e-06, - "loss": 2.2939, - "step": 534860 - }, - { - "epoch": 0.93, - "learning_rate": 3.362549133814877e-06, - "loss": 2.2695, - "step": 534870 - }, - { - "epoch": 0.93, - "learning_rate": 3.3616771938880498e-06, - "loss": 2.1956, - "step": 534880 - }, - { - "epoch": 0.93, - "learning_rate": 3.360805253961223e-06, - "loss": 2.2643, - "step": 534890 - }, - { - "epoch": 0.93, - "learning_rate": 3.359933314034396e-06, - "loss": 2.1824, - "step": 534900 - }, - { - "epoch": 0.93, - "learning_rate": 3.3590613741075694e-06, - "loss": 2.2407, - "step": 534910 - }, - { - "epoch": 0.93, - "learning_rate": 3.3581894341807427e-06, - "loss": 2.2691, - "step": 534920 - }, - { - "epoch": 0.93, - "learning_rate": 3.3573174942539165e-06, - "loss": 2.241, - "step": 534930 - }, - { - "epoch": 0.93, - "learning_rate": 3.3564455543270894e-06, - "loss": 2.2839, - "step": 534940 - }, - { - "epoch": 0.93, - "learning_rate": 3.3555736144002628e-06, - "loss": 2.2307, - "step": 534950 - }, - { - "epoch": 0.93, - "learning_rate": 3.3547016744734357e-06, - "loss": 2.2294, - "step": 534960 - }, - { - "epoch": 0.93, - "learning_rate": 3.353829734546609e-06, - "loss": 2.279, - "step": 534970 - }, - { - "epoch": 0.93, - "learning_rate": 3.352957794619782e-06, - "loss": 2.2433, - "step": 534980 - }, - { - "epoch": 0.93, - "learning_rate": 3.3520858546929553e-06, - "loss": 2.2397, - "step": 534990 - }, - { - "epoch": 0.93, - "learning_rate": 3.3512139147661282e-06, - "loss": 2.3348, - "step": 535000 - }, - { - "epoch": 0.93, - "learning_rate": 3.3503419748393016e-06, - "loss": 2.3274, - "step": 535010 - }, - { - "epoch": 0.93, - "learning_rate": 3.3494700349124745e-06, - "loss": 2.2107, - "step": 535020 - }, - { - "epoch": 0.93, - "learning_rate": 3.348598094985648e-06, - "loss": 2.301, - "step": 535030 - }, - { - "epoch": 0.93, - "learning_rate": 3.3477261550588208e-06, - "loss": 2.3355, - "step": 535040 - }, - { - "epoch": 0.93, - "learning_rate": 3.346854215131994e-06, - "loss": 2.3201, - "step": 535050 - }, - { - "epoch": 0.93, - "learning_rate": 3.345982275205168e-06, - "loss": 2.3214, - "step": 535060 - }, - { - "epoch": 0.93, - "learning_rate": 3.3451103352783412e-06, - "loss": 2.1851, - "step": 535070 - }, - { - "epoch": 0.93, - "learning_rate": 3.344238395351514e-06, - "loss": 2.2501, - "step": 535080 - }, - { - "epoch": 0.93, - "learning_rate": 3.3433664554246875e-06, - "loss": 2.2748, - "step": 535090 - }, - { - "epoch": 0.93, - "learning_rate": 3.3424945154978604e-06, - "loss": 2.1218, - "step": 535100 - }, - { - "epoch": 0.93, - "learning_rate": 3.3416225755710338e-06, - "loss": 2.2084, - "step": 535110 - }, - { - "epoch": 0.93, - "learning_rate": 3.3407506356442067e-06, - "loss": 2.2043, - "step": 535120 - }, - { - "epoch": 0.93, - "learning_rate": 3.33987869571738e-06, - "loss": 2.1721, - "step": 535130 - }, - { - "epoch": 0.93, - "learning_rate": 3.339006755790553e-06, - "loss": 2.2642, - "step": 535140 - }, - { - "epoch": 0.93, - "learning_rate": 3.3381348158637263e-06, - "loss": 2.2685, - "step": 535150 - }, - { - "epoch": 0.93, - "learning_rate": 3.3372628759368992e-06, - "loss": 2.2938, - "step": 535160 - }, - { - "epoch": 0.93, - "learning_rate": 3.3363909360100726e-06, - "loss": 2.3086, - "step": 535170 - }, - { - "epoch": 0.93, - "learning_rate": 3.335518996083246e-06, - "loss": 2.2737, - "step": 535180 - }, - { - "epoch": 0.93, - "learning_rate": 3.334647056156419e-06, - "loss": 2.3166, - "step": 535190 - }, - { - "epoch": 0.93, - "learning_rate": 3.3337751162295926e-06, - "loss": 2.2667, - "step": 535200 - }, - { - "epoch": 0.93, - "learning_rate": 3.332903176302766e-06, - "loss": 2.2067, - "step": 535210 - }, - { - "epoch": 0.93, - "learning_rate": 3.332031236375939e-06, - "loss": 2.3123, - "step": 535220 - }, - { - "epoch": 0.93, - "learning_rate": 3.3311592964491122e-06, - "loss": 2.2458, - "step": 535230 - }, - { - "epoch": 0.93, - "learning_rate": 3.330287356522285e-06, - "loss": 2.198, - "step": 535240 - }, - { - "epoch": 0.93, - "learning_rate": 3.3294154165954585e-06, - "loss": 2.1825, - "step": 535250 - }, - { - "epoch": 0.93, - "learning_rate": 3.3285434766686314e-06, - "loss": 2.3119, - "step": 535260 - }, - { - "epoch": 0.93, - "learning_rate": 3.3276715367418048e-06, - "loss": 2.2547, - "step": 535270 - }, - { - "epoch": 0.93, - "learning_rate": 3.3267995968149777e-06, - "loss": 2.1329, - "step": 535280 - }, - { - "epoch": 0.93, - "learning_rate": 3.325927656888151e-06, - "loss": 2.2197, - "step": 535290 - }, - { - "epoch": 0.93, - "learning_rate": 3.325055716961324e-06, - "loss": 2.3162, - "step": 535300 - }, - { - "epoch": 0.93, - "learning_rate": 3.3241837770344973e-06, - "loss": 2.2555, - "step": 535310 - }, - { - "epoch": 0.93, - "learning_rate": 3.3233118371076707e-06, - "loss": 2.3087, - "step": 535320 - }, - { - "epoch": 0.93, - "learning_rate": 3.3224398971808444e-06, - "loss": 2.2921, - "step": 535330 - }, - { - "epoch": 0.93, - "learning_rate": 3.3215679572540174e-06, - "loss": 2.2476, - "step": 535340 - }, - { - "epoch": 0.93, - "learning_rate": 3.3206960173271907e-06, - "loss": 2.2516, - "step": 535350 - }, - { - "epoch": 0.93, - "learning_rate": 3.3198240774003636e-06, - "loss": 2.1826, - "step": 535360 - }, - { - "epoch": 0.93, - "learning_rate": 3.318952137473537e-06, - "loss": 2.2514, - "step": 535370 - }, - { - "epoch": 0.93, - "learning_rate": 3.31808019754671e-06, - "loss": 2.3359, - "step": 535380 - }, - { - "epoch": 0.93, - "learning_rate": 3.3172082576198832e-06, - "loss": 2.2104, - "step": 535390 - }, - { - "epoch": 0.93, - "learning_rate": 3.316336317693056e-06, - "loss": 2.1037, - "step": 535400 - }, - { - "epoch": 0.93, - "learning_rate": 3.3154643777662295e-06, - "loss": 2.3122, - "step": 535410 - }, - { - "epoch": 0.93, - "learning_rate": 3.3145924378394024e-06, - "loss": 2.286, - "step": 535420 - }, - { - "epoch": 0.93, - "learning_rate": 3.3137204979125758e-06, - "loss": 2.317, - "step": 535430 - }, - { - "epoch": 0.93, - "learning_rate": 3.312848557985749e-06, - "loss": 2.2106, - "step": 535440 - }, - { - "epoch": 0.93, - "learning_rate": 3.311976618058922e-06, - "loss": 2.2187, - "step": 535450 - }, - { - "epoch": 0.93, - "learning_rate": 3.311104678132096e-06, - "loss": 2.291, - "step": 535460 - }, - { - "epoch": 0.93, - "learning_rate": 3.310232738205269e-06, - "loss": 2.2479, - "step": 535470 - }, - { - "epoch": 0.93, - "learning_rate": 3.309360798278442e-06, - "loss": 2.2038, - "step": 535480 - }, - { - "epoch": 0.93, - "learning_rate": 3.3084888583516154e-06, - "loss": 2.1474, - "step": 535490 - }, - { - "epoch": 0.93, - "learning_rate": 3.3076169184247884e-06, - "loss": 2.2648, - "step": 535500 - }, - { - "epoch": 0.93, - "learning_rate": 3.3067449784979617e-06, - "loss": 2.1899, - "step": 535510 - }, - { - "epoch": 0.93, - "learning_rate": 3.3058730385711346e-06, - "loss": 2.2674, - "step": 535520 - }, - { - "epoch": 0.93, - "learning_rate": 3.305001098644308e-06, - "loss": 2.2722, - "step": 535530 - }, - { - "epoch": 0.93, - "learning_rate": 3.304129158717481e-06, - "loss": 2.2693, - "step": 535540 - }, - { - "epoch": 0.93, - "learning_rate": 3.3032572187906542e-06, - "loss": 2.2177, - "step": 535550 - }, - { - "epoch": 0.93, - "learning_rate": 3.302385278863827e-06, - "loss": 2.2165, - "step": 535560 - }, - { - "epoch": 0.93, - "learning_rate": 3.3015133389370005e-06, - "loss": 2.2643, - "step": 535570 - }, - { - "epoch": 0.93, - "learning_rate": 3.300641399010174e-06, - "loss": 2.2669, - "step": 535580 - }, - { - "epoch": 0.93, - "learning_rate": 3.2997694590833468e-06, - "loss": 2.2574, - "step": 535590 - }, - { - "epoch": 0.93, - "learning_rate": 3.2988975191565206e-06, - "loss": 2.3148, - "step": 535600 - }, - { - "epoch": 0.93, - "learning_rate": 3.298025579229694e-06, - "loss": 2.3414, - "step": 535610 - }, - { - "epoch": 0.93, - "learning_rate": 3.297153639302867e-06, - "loss": 2.2758, - "step": 535620 - }, - { - "epoch": 0.93, - "learning_rate": 3.29628169937604e-06, - "loss": 2.2296, - "step": 535630 - }, - { - "epoch": 0.93, - "learning_rate": 3.295409759449213e-06, - "loss": 2.2938, - "step": 535640 - }, - { - "epoch": 0.93, - "learning_rate": 3.2945378195223864e-06, - "loss": 2.2688, - "step": 535650 - }, - { - "epoch": 0.93, - "learning_rate": 3.2936658795955594e-06, - "loss": 2.3066, - "step": 535660 - }, - { - "epoch": 0.93, - "learning_rate": 3.2927939396687327e-06, - "loss": 2.3637, - "step": 535670 - }, - { - "epoch": 0.93, - "learning_rate": 3.2919219997419056e-06, - "loss": 2.1657, - "step": 535680 - }, - { - "epoch": 0.93, - "learning_rate": 3.291050059815079e-06, - "loss": 2.212, - "step": 535690 - }, - { - "epoch": 0.93, - "learning_rate": 3.2901781198882523e-06, - "loss": 2.323, - "step": 535700 - }, - { - "epoch": 0.93, - "learning_rate": 3.2893061799614252e-06, - "loss": 2.2901, - "step": 535710 - }, - { - "epoch": 0.93, - "learning_rate": 3.2884342400345986e-06, - "loss": 2.1724, - "step": 535720 - }, - { - "epoch": 0.93, - "learning_rate": 3.2875623001077724e-06, - "loss": 2.344, - "step": 535730 - }, - { - "epoch": 0.93, - "learning_rate": 3.2866903601809453e-06, - "loss": 2.3463, - "step": 535740 - }, - { - "epoch": 0.93, - "learning_rate": 3.2858184202541186e-06, - "loss": 2.1896, - "step": 535750 - }, - { - "epoch": 0.93, - "learning_rate": 3.2849464803272916e-06, - "loss": 2.2397, - "step": 535760 - }, - { - "epoch": 0.93, - "learning_rate": 3.284074540400465e-06, - "loss": 2.2323, - "step": 535770 - }, - { - "epoch": 0.93, - "learning_rate": 3.283202600473638e-06, - "loss": 2.2906, - "step": 535780 - }, - { - "epoch": 0.93, - "learning_rate": 3.282330660546811e-06, - "loss": 2.1888, - "step": 535790 - }, - { - "epoch": 0.93, - "learning_rate": 3.281458720619984e-06, - "loss": 2.2675, - "step": 535800 - }, - { - "epoch": 0.93, - "learning_rate": 3.2805867806931574e-06, - "loss": 2.2495, - "step": 535810 - }, - { - "epoch": 0.93, - "learning_rate": 3.2797148407663304e-06, - "loss": 2.2783, - "step": 535820 - }, - { - "epoch": 0.93, - "learning_rate": 3.2788429008395037e-06, - "loss": 2.2552, - "step": 535830 - }, - { - "epoch": 0.93, - "learning_rate": 3.277970960912677e-06, - "loss": 2.2055, - "step": 535840 - }, - { - "epoch": 0.93, - "learning_rate": 3.27709902098585e-06, - "loss": 2.1947, - "step": 535850 - }, - { - "epoch": 0.93, - "learning_rate": 3.2762270810590237e-06, - "loss": 2.1378, - "step": 535860 - }, - { - "epoch": 0.93, - "learning_rate": 3.275355141132197e-06, - "loss": 2.2285, - "step": 535870 - }, - { - "epoch": 0.93, - "learning_rate": 3.27448320120537e-06, - "loss": 2.178, - "step": 535880 - }, - { - "epoch": 0.93, - "learning_rate": 3.2736112612785434e-06, - "loss": 2.2436, - "step": 535890 - }, - { - "epoch": 0.93, - "learning_rate": 3.2727393213517163e-06, - "loss": 2.2486, - "step": 535900 - }, - { - "epoch": 0.93, - "learning_rate": 3.2718673814248896e-06, - "loss": 2.3218, - "step": 535910 - }, - { - "epoch": 0.93, - "learning_rate": 3.2709954414980626e-06, - "loss": 2.2781, - "step": 535920 - }, - { - "epoch": 0.93, - "learning_rate": 3.270123501571236e-06, - "loss": 2.202, - "step": 535930 - }, - { - "epoch": 0.93, - "learning_rate": 3.269251561644409e-06, - "loss": 2.2034, - "step": 535940 - }, - { - "epoch": 0.93, - "learning_rate": 3.268379621717582e-06, - "loss": 2.286, - "step": 535950 - }, - { - "epoch": 0.93, - "learning_rate": 3.2675076817907555e-06, - "loss": 2.2337, - "step": 535960 - }, - { - "epoch": 0.93, - "learning_rate": 3.2666357418639284e-06, - "loss": 2.1801, - "step": 535970 - }, - { - "epoch": 0.93, - "learning_rate": 3.2657638019371018e-06, - "loss": 2.3168, - "step": 535980 - }, - { - "epoch": 0.93, - "learning_rate": 3.2648918620102756e-06, - "loss": 2.2644, - "step": 535990 - }, - { - "epoch": 0.93, - "learning_rate": 3.2640199220834485e-06, - "loss": 2.2873, - "step": 536000 - }, - { - "epoch": 0.93, - "learning_rate": 3.263147982156622e-06, - "loss": 2.229, - "step": 536010 - }, - { - "epoch": 0.93, - "learning_rate": 3.2622760422297947e-06, - "loss": 2.2341, - "step": 536020 - }, - { - "epoch": 0.93, - "learning_rate": 3.261404102302968e-06, - "loss": 2.1947, - "step": 536030 - }, - { - "epoch": 0.93, - "learning_rate": 3.260532162376141e-06, - "loss": 2.4571, - "step": 536040 - }, - { - "epoch": 0.93, - "learning_rate": 3.2596602224493144e-06, - "loss": 2.3251, - "step": 536050 - }, - { - "epoch": 0.93, - "learning_rate": 3.2587882825224873e-06, - "loss": 2.2201, - "step": 536060 - }, - { - "epoch": 0.93, - "learning_rate": 3.2579163425956606e-06, - "loss": 2.2249, - "step": 536070 - }, - { - "epoch": 0.93, - "learning_rate": 3.2570444026688336e-06, - "loss": 2.2656, - "step": 536080 - }, - { - "epoch": 0.93, - "learning_rate": 3.256172462742007e-06, - "loss": 2.2806, - "step": 536090 - }, - { - "epoch": 0.93, - "learning_rate": 3.2553005228151802e-06, - "loss": 2.2444, - "step": 536100 - }, - { - "epoch": 0.93, - "learning_rate": 3.254428582888353e-06, - "loss": 2.399, - "step": 536110 - }, - { - "epoch": 0.93, - "learning_rate": 3.2535566429615265e-06, - "loss": 2.1222, - "step": 536120 - }, - { - "epoch": 0.93, - "learning_rate": 3.2526847030347003e-06, - "loss": 2.2786, - "step": 536130 - }, - { - "epoch": 0.93, - "learning_rate": 3.251812763107873e-06, - "loss": 2.2067, - "step": 536140 - }, - { - "epoch": 0.93, - "learning_rate": 3.2509408231810466e-06, - "loss": 2.2573, - "step": 536150 - }, - { - "epoch": 0.93, - "learning_rate": 3.2500688832542195e-06, - "loss": 2.1837, - "step": 536160 - }, - { - "epoch": 0.94, - "learning_rate": 3.249196943327393e-06, - "loss": 2.1983, - "step": 536170 - }, - { - "epoch": 0.94, - "learning_rate": 3.2483250034005657e-06, - "loss": 2.2212, - "step": 536180 - }, - { - "epoch": 0.94, - "learning_rate": 3.247453063473739e-06, - "loss": 2.3439, - "step": 536190 - }, - { - "epoch": 0.94, - "learning_rate": 3.246581123546912e-06, - "loss": 2.3146, - "step": 536200 - }, - { - "epoch": 0.94, - "learning_rate": 3.2457091836200854e-06, - "loss": 2.2567, - "step": 536210 - }, - { - "epoch": 0.94, - "learning_rate": 3.2448372436932587e-06, - "loss": 2.2441, - "step": 536220 - }, - { - "epoch": 0.94, - "learning_rate": 3.2439653037664316e-06, - "loss": 2.2706, - "step": 536230 - }, - { - "epoch": 0.94, - "learning_rate": 3.243093363839605e-06, - "loss": 2.3006, - "step": 536240 - }, - { - "epoch": 0.94, - "learning_rate": 3.242221423912778e-06, - "loss": 2.2381, - "step": 536250 - }, - { - "epoch": 0.94, - "learning_rate": 3.2413494839859517e-06, - "loss": 2.392, - "step": 536260 - }, - { - "epoch": 0.94, - "learning_rate": 3.240477544059125e-06, - "loss": 2.2326, - "step": 536270 - }, - { - "epoch": 0.94, - "learning_rate": 3.239605604132298e-06, - "loss": 2.24, - "step": 536280 - }, - { - "epoch": 0.94, - "learning_rate": 3.2387336642054713e-06, - "loss": 2.0923, - "step": 536290 - }, - { - "epoch": 0.94, - "learning_rate": 3.237861724278644e-06, - "loss": 2.1709, - "step": 536300 - }, - { - "epoch": 0.94, - "learning_rate": 3.2369897843518176e-06, - "loss": 2.1517, - "step": 536310 - }, - { - "epoch": 0.94, - "learning_rate": 3.2361178444249905e-06, - "loss": 2.2985, - "step": 536320 - }, - { - "epoch": 0.94, - "learning_rate": 3.235245904498164e-06, - "loss": 2.3014, - "step": 536330 - }, - { - "epoch": 0.94, - "learning_rate": 3.2343739645713367e-06, - "loss": 2.3085, - "step": 536340 - }, - { - "epoch": 0.94, - "learning_rate": 3.23350202464451e-06, - "loss": 2.3036, - "step": 536350 - }, - { - "epoch": 0.94, - "learning_rate": 3.2326300847176834e-06, - "loss": 2.2863, - "step": 536360 - }, - { - "epoch": 0.94, - "learning_rate": 3.2317581447908564e-06, - "loss": 2.3914, - "step": 536370 - }, - { - "epoch": 0.94, - "learning_rate": 3.2308862048640297e-06, - "loss": 2.2307, - "step": 536380 - }, - { - "epoch": 0.94, - "learning_rate": 3.2300142649372035e-06, - "loss": 2.1266, - "step": 536390 - }, - { - "epoch": 0.94, - "learning_rate": 3.2291423250103764e-06, - "loss": 2.2812, - "step": 536400 - }, - { - "epoch": 0.94, - "learning_rate": 3.2282703850835498e-06, - "loss": 2.3657, - "step": 536410 - }, - { - "epoch": 0.94, - "learning_rate": 3.2273984451567227e-06, - "loss": 2.122, - "step": 536420 - }, - { - "epoch": 0.94, - "learning_rate": 3.226526505229896e-06, - "loss": 2.2138, - "step": 536430 - }, - { - "epoch": 0.94, - "learning_rate": 3.225654565303069e-06, - "loss": 2.2666, - "step": 536440 - }, - { - "epoch": 0.94, - "learning_rate": 3.2247826253762423e-06, - "loss": 2.2036, - "step": 536450 - }, - { - "epoch": 0.94, - "learning_rate": 3.2239106854494152e-06, - "loss": 2.2021, - "step": 536460 - }, - { - "epoch": 0.94, - "learning_rate": 3.2230387455225886e-06, - "loss": 2.293, - "step": 536470 - }, - { - "epoch": 0.94, - "learning_rate": 3.222166805595762e-06, - "loss": 2.1794, - "step": 536480 - }, - { - "epoch": 0.94, - "learning_rate": 3.221294865668935e-06, - "loss": 2.2521, - "step": 536490 - }, - { - "epoch": 0.94, - "learning_rate": 3.220422925742108e-06, - "loss": 2.1766, - "step": 536500 - }, - { - "epoch": 0.94, - "learning_rate": 3.219550985815281e-06, - "loss": 2.2993, - "step": 536510 - }, - { - "epoch": 0.94, - "learning_rate": 3.2186790458884544e-06, - "loss": 2.2886, - "step": 536520 - }, - { - "epoch": 0.94, - "learning_rate": 3.2178071059616282e-06, - "loss": 2.3214, - "step": 536530 - }, - { - "epoch": 0.94, - "learning_rate": 3.216935166034801e-06, - "loss": 2.1927, - "step": 536540 - }, - { - "epoch": 0.94, - "learning_rate": 3.2160632261079745e-06, - "loss": 2.2478, - "step": 536550 - }, - { - "epoch": 0.94, - "learning_rate": 3.2151912861811474e-06, - "loss": 2.2278, - "step": 536560 - }, - { - "epoch": 0.94, - "learning_rate": 3.2143193462543208e-06, - "loss": 2.2832, - "step": 536570 - }, - { - "epoch": 0.94, - "learning_rate": 3.2134474063274937e-06, - "loss": 2.3393, - "step": 536580 - }, - { - "epoch": 0.94, - "learning_rate": 3.212575466400667e-06, - "loss": 2.2266, - "step": 536590 - }, - { - "epoch": 0.94, - "learning_rate": 3.21170352647384e-06, - "loss": 2.2304, - "step": 536600 - }, - { - "epoch": 0.94, - "learning_rate": 3.2108315865470133e-06, - "loss": 2.2773, - "step": 536610 - }, - { - "epoch": 0.94, - "learning_rate": 3.2099596466201866e-06, - "loss": 2.2542, - "step": 536620 - }, - { - "epoch": 0.94, - "learning_rate": 3.2090877066933596e-06, - "loss": 2.1482, - "step": 536630 - }, - { - "epoch": 0.94, - "learning_rate": 3.208215766766533e-06, - "loss": 2.2627, - "step": 536640 - }, - { - "epoch": 0.94, - "learning_rate": 3.207343826839706e-06, - "loss": 2.3117, - "step": 536650 - }, - { - "epoch": 0.94, - "learning_rate": 3.2064718869128796e-06, - "loss": 2.3057, - "step": 536660 - }, - { - "epoch": 0.94, - "learning_rate": 3.205599946986053e-06, - "loss": 2.1842, - "step": 536670 - }, - { - "epoch": 0.94, - "learning_rate": 3.204728007059226e-06, - "loss": 2.1814, - "step": 536680 - }, - { - "epoch": 0.94, - "learning_rate": 3.2038560671323992e-06, - "loss": 2.1736, - "step": 536690 - }, - { - "epoch": 0.94, - "learning_rate": 3.202984127205572e-06, - "loss": 2.3084, - "step": 536700 - }, - { - "epoch": 0.94, - "learning_rate": 3.2021121872787455e-06, - "loss": 2.3203, - "step": 536710 - }, - { - "epoch": 0.94, - "learning_rate": 3.2012402473519184e-06, - "loss": 2.2249, - "step": 536720 - }, - { - "epoch": 0.94, - "learning_rate": 3.2003683074250918e-06, - "loss": 2.3413, - "step": 536730 - }, - { - "epoch": 0.94, - "learning_rate": 3.199496367498265e-06, - "loss": 2.2555, - "step": 536740 - }, - { - "epoch": 0.94, - "learning_rate": 3.198624427571438e-06, - "loss": 2.316, - "step": 536750 - }, - { - "epoch": 0.94, - "learning_rate": 3.1977524876446114e-06, - "loss": 2.1765, - "step": 536760 - }, - { - "epoch": 0.94, - "learning_rate": 3.1968805477177843e-06, - "loss": 2.2823, - "step": 536770 - }, - { - "epoch": 0.94, - "learning_rate": 3.1960086077909576e-06, - "loss": 2.2221, - "step": 536780 - }, - { - "epoch": 0.94, - "learning_rate": 3.1951366678641314e-06, - "loss": 2.3498, - "step": 536790 - }, - { - "epoch": 0.94, - "learning_rate": 3.1942647279373043e-06, - "loss": 2.1695, - "step": 536800 - }, - { - "epoch": 0.94, - "learning_rate": 3.1933927880104777e-06, - "loss": 2.2141, - "step": 536810 - }, - { - "epoch": 0.94, - "learning_rate": 3.1925208480836506e-06, - "loss": 2.3309, - "step": 536820 - }, - { - "epoch": 0.94, - "learning_rate": 3.191648908156824e-06, - "loss": 2.2212, - "step": 536830 - }, - { - "epoch": 0.94, - "learning_rate": 3.190776968229997e-06, - "loss": 2.2307, - "step": 536840 - }, - { - "epoch": 0.94, - "learning_rate": 3.1899050283031702e-06, - "loss": 2.3116, - "step": 536850 - }, - { - "epoch": 0.94, - "learning_rate": 3.189033088376343e-06, - "loss": 2.3307, - "step": 536860 - }, - { - "epoch": 0.94, - "learning_rate": 3.1881611484495165e-06, - "loss": 2.3183, - "step": 536870 - }, - { - "epoch": 0.94, - "learning_rate": 3.18728920852269e-06, - "loss": 2.2587, - "step": 536880 - }, - { - "epoch": 0.94, - "learning_rate": 3.1864172685958628e-06, - "loss": 2.3687, - "step": 536890 - }, - { - "epoch": 0.94, - "learning_rate": 3.185545328669036e-06, - "loss": 2.1713, - "step": 536900 - }, - { - "epoch": 0.94, - "learning_rate": 3.184673388742209e-06, - "loss": 2.3361, - "step": 536910 - }, - { - "epoch": 0.94, - "learning_rate": 3.1838014488153824e-06, - "loss": 2.3099, - "step": 536920 - }, - { - "epoch": 0.94, - "learning_rate": 3.182929508888556e-06, - "loss": 2.3755, - "step": 536930 - }, - { - "epoch": 0.94, - "learning_rate": 3.182057568961729e-06, - "loss": 2.2319, - "step": 536940 - }, - { - "epoch": 0.94, - "learning_rate": 3.1811856290349024e-06, - "loss": 2.2196, - "step": 536950 - }, - { - "epoch": 0.94, - "learning_rate": 3.1803136891080753e-06, - "loss": 2.2917, - "step": 536960 - }, - { - "epoch": 0.94, - "learning_rate": 3.1794417491812487e-06, - "loss": 2.3442, - "step": 536970 - }, - { - "epoch": 0.94, - "learning_rate": 3.1785698092544216e-06, - "loss": 2.2319, - "step": 536980 - }, - { - "epoch": 0.94, - "learning_rate": 3.177697869327595e-06, - "loss": 2.2195, - "step": 536990 - }, - { - "epoch": 0.94, - "learning_rate": 3.1768259294007683e-06, - "loss": 2.1825, - "step": 537000 - }, - { - "epoch": 0.94, - "learning_rate": 3.1759539894739412e-06, - "loss": 2.2083, - "step": 537010 - }, - { - "epoch": 0.94, - "learning_rate": 3.1750820495471146e-06, - "loss": 2.1925, - "step": 537020 - }, - { - "epoch": 0.94, - "learning_rate": 3.1742101096202875e-06, - "loss": 2.2748, - "step": 537030 - }, - { - "epoch": 0.94, - "learning_rate": 3.173338169693461e-06, - "loss": 2.2268, - "step": 537040 - }, - { - "epoch": 0.94, - "learning_rate": 3.1724662297666338e-06, - "loss": 2.3471, - "step": 537050 - }, - { - "epoch": 0.94, - "learning_rate": 3.1715942898398075e-06, - "loss": 2.2587, - "step": 537060 - }, - { - "epoch": 0.94, - "learning_rate": 3.170722349912981e-06, - "loss": 2.1665, - "step": 537070 - }, - { - "epoch": 0.94, - "learning_rate": 3.169850409986154e-06, - "loss": 2.2729, - "step": 537080 - }, - { - "epoch": 0.94, - "learning_rate": 3.168978470059327e-06, - "loss": 2.2281, - "step": 537090 - }, - { - "epoch": 0.94, - "learning_rate": 3.1681065301325e-06, - "loss": 2.3033, - "step": 537100 - }, - { - "epoch": 0.94, - "learning_rate": 3.1672345902056734e-06, - "loss": 2.2519, - "step": 537110 - }, - { - "epoch": 0.94, - "learning_rate": 3.1663626502788463e-06, - "loss": 2.239, - "step": 537120 - }, - { - "epoch": 0.94, - "learning_rate": 3.1654907103520197e-06, - "loss": 2.2318, - "step": 537130 - }, - { - "epoch": 0.94, - "learning_rate": 3.164618770425193e-06, - "loss": 2.2499, - "step": 537140 - }, - { - "epoch": 0.94, - "learning_rate": 3.163746830498366e-06, - "loss": 2.2372, - "step": 537150 - }, - { - "epoch": 0.94, - "learning_rate": 3.1628748905715393e-06, - "loss": 2.0954, - "step": 537160 - }, - { - "epoch": 0.94, - "learning_rate": 3.1620029506447122e-06, - "loss": 2.1726, - "step": 537170 - }, - { - "epoch": 0.94, - "learning_rate": 3.1611310107178856e-06, - "loss": 2.144, - "step": 537180 - }, - { - "epoch": 0.94, - "learning_rate": 3.1602590707910593e-06, - "loss": 2.2116, - "step": 537190 - }, - { - "epoch": 0.94, - "learning_rate": 3.1593871308642323e-06, - "loss": 2.2739, - "step": 537200 - }, - { - "epoch": 0.94, - "learning_rate": 3.1585151909374056e-06, - "loss": 2.3296, - "step": 537210 - }, - { - "epoch": 0.94, - "learning_rate": 3.1576432510105785e-06, - "loss": 2.191, - "step": 537220 - }, - { - "epoch": 0.94, - "learning_rate": 3.156771311083752e-06, - "loss": 2.3443, - "step": 537230 - }, - { - "epoch": 0.94, - "learning_rate": 3.155899371156925e-06, - "loss": 2.3893, - "step": 537240 - }, - { - "epoch": 0.94, - "learning_rate": 3.155027431230098e-06, - "loss": 2.2076, - "step": 537250 - }, - { - "epoch": 0.94, - "learning_rate": 3.1541554913032715e-06, - "loss": 2.276, - "step": 537260 - }, - { - "epoch": 0.94, - "learning_rate": 3.1532835513764444e-06, - "loss": 2.2453, - "step": 537270 - }, - { - "epoch": 0.94, - "learning_rate": 3.1524116114496178e-06, - "loss": 2.1982, - "step": 537280 - }, - { - "epoch": 0.94, - "learning_rate": 3.1515396715227907e-06, - "loss": 2.3439, - "step": 537290 - }, - { - "epoch": 0.94, - "learning_rate": 3.150667731595964e-06, - "loss": 2.347, - "step": 537300 - }, - { - "epoch": 0.94, - "learning_rate": 3.149795791669137e-06, - "loss": 2.259, - "step": 537310 - }, - { - "epoch": 0.94, - "learning_rate": 3.1489238517423103e-06, - "loss": 2.2691, - "step": 537320 - }, - { - "epoch": 0.94, - "learning_rate": 3.148051911815484e-06, - "loss": 2.2693, - "step": 537330 - }, - { - "epoch": 0.94, - "learning_rate": 3.147179971888657e-06, - "loss": 2.2585, - "step": 537340 - }, - { - "epoch": 0.94, - "learning_rate": 3.1463080319618303e-06, - "loss": 2.2635, - "step": 537350 - }, - { - "epoch": 0.94, - "learning_rate": 3.1454360920350033e-06, - "loss": 2.2717, - "step": 537360 - }, - { - "epoch": 0.94, - "learning_rate": 3.1445641521081766e-06, - "loss": 2.3047, - "step": 537370 - }, - { - "epoch": 0.94, - "learning_rate": 3.1436922121813495e-06, - "loss": 2.3806, - "step": 537380 - }, - { - "epoch": 0.94, - "learning_rate": 3.142820272254523e-06, - "loss": 2.2675, - "step": 537390 - }, - { - "epoch": 0.94, - "learning_rate": 3.1419483323276962e-06, - "loss": 2.1566, - "step": 537400 - }, - { - "epoch": 0.94, - "learning_rate": 3.141076392400869e-06, - "loss": 2.2624, - "step": 537410 - }, - { - "epoch": 0.94, - "learning_rate": 3.1402044524740425e-06, - "loss": 2.2903, - "step": 537420 - }, - { - "epoch": 0.94, - "learning_rate": 3.1393325125472154e-06, - "loss": 2.1672, - "step": 537430 - }, - { - "epoch": 0.94, - "learning_rate": 3.1384605726203888e-06, - "loss": 2.2072, - "step": 537440 - }, - { - "epoch": 0.94, - "learning_rate": 3.1375886326935617e-06, - "loss": 2.197, - "step": 537450 - }, - { - "epoch": 0.94, - "learning_rate": 3.1367166927667355e-06, - "loss": 2.2747, - "step": 537460 - }, - { - "epoch": 0.94, - "learning_rate": 3.135844752839909e-06, - "loss": 2.2124, - "step": 537470 - }, - { - "epoch": 0.94, - "learning_rate": 3.1349728129130817e-06, - "loss": 2.2018, - "step": 537480 - }, - { - "epoch": 0.94, - "learning_rate": 3.134100872986255e-06, - "loss": 2.2206, - "step": 537490 - }, - { - "epoch": 0.94, - "learning_rate": 3.133228933059428e-06, - "loss": 2.2808, - "step": 537500 - }, - { - "epoch": 0.94, - "learning_rate": 3.1323569931326013e-06, - "loss": 2.2972, - "step": 537510 - }, - { - "epoch": 0.94, - "learning_rate": 3.1314850532057747e-06, - "loss": 2.2253, - "step": 537520 - }, - { - "epoch": 0.94, - "learning_rate": 3.1306131132789476e-06, - "loss": 2.253, - "step": 537530 - }, - { - "epoch": 0.94, - "learning_rate": 3.129741173352121e-06, - "loss": 2.2628, - "step": 537540 - }, - { - "epoch": 0.94, - "learning_rate": 3.128869233425294e-06, - "loss": 2.2365, - "step": 537550 - }, - { - "epoch": 0.94, - "learning_rate": 3.1279972934984672e-06, - "loss": 2.2695, - "step": 537560 - }, - { - "epoch": 0.94, - "learning_rate": 3.12712535357164e-06, - "loss": 2.2909, - "step": 537570 - }, - { - "epoch": 0.94, - "learning_rate": 3.1262534136448135e-06, - "loss": 2.2352, - "step": 537580 - }, - { - "epoch": 0.94, - "learning_rate": 3.1253814737179873e-06, - "loss": 2.3245, - "step": 537590 - }, - { - "epoch": 0.94, - "learning_rate": 3.12450953379116e-06, - "loss": 2.202, - "step": 537600 - }, - { - "epoch": 0.94, - "learning_rate": 3.123637593864333e-06, - "loss": 2.1498, - "step": 537610 - }, - { - "epoch": 0.94, - "learning_rate": 3.1227656539375065e-06, - "loss": 2.3136, - "step": 537620 - }, - { - "epoch": 0.94, - "learning_rate": 3.12189371401068e-06, - "loss": 2.2406, - "step": 537630 - }, - { - "epoch": 0.94, - "learning_rate": 3.121021774083853e-06, - "loss": 2.2072, - "step": 537640 - }, - { - "epoch": 0.94, - "learning_rate": 3.120149834157026e-06, - "loss": 2.1767, - "step": 537650 - }, - { - "epoch": 0.94, - "learning_rate": 3.1192778942301994e-06, - "loss": 2.3305, - "step": 537660 - }, - { - "epoch": 0.94, - "learning_rate": 3.1184059543033723e-06, - "loss": 2.331, - "step": 537670 - }, - { - "epoch": 0.94, - "learning_rate": 3.1175340143765457e-06, - "loss": 2.2184, - "step": 537680 - }, - { - "epoch": 0.94, - "learning_rate": 3.116662074449719e-06, - "loss": 2.3048, - "step": 537690 - }, - { - "epoch": 0.94, - "learning_rate": 3.115790134522892e-06, - "loss": 2.3394, - "step": 537700 - }, - { - "epoch": 0.94, - "learning_rate": 3.1149181945960653e-06, - "loss": 2.3074, - "step": 537710 - }, - { - "epoch": 0.94, - "learning_rate": 3.1140462546692386e-06, - "loss": 2.1718, - "step": 537720 - }, - { - "epoch": 0.94, - "learning_rate": 3.1131743147424116e-06, - "loss": 2.2154, - "step": 537730 - }, - { - "epoch": 0.94, - "learning_rate": 3.112302374815585e-06, - "loss": 2.2192, - "step": 537740 - }, - { - "epoch": 0.94, - "learning_rate": 3.111430434888758e-06, - "loss": 2.2203, - "step": 537750 - }, - { - "epoch": 0.94, - "learning_rate": 3.110558494961931e-06, - "loss": 2.2006, - "step": 537760 - }, - { - "epoch": 0.94, - "learning_rate": 3.1096865550351045e-06, - "loss": 2.358, - "step": 537770 - }, - { - "epoch": 0.94, - "learning_rate": 3.108814615108278e-06, - "loss": 2.3073, - "step": 537780 - }, - { - "epoch": 0.94, - "learning_rate": 3.107942675181451e-06, - "loss": 2.342, - "step": 537790 - }, - { - "epoch": 0.94, - "learning_rate": 3.107070735254624e-06, - "loss": 2.3046, - "step": 537800 - }, - { - "epoch": 0.94, - "learning_rate": 3.106198795327797e-06, - "loss": 2.3038, - "step": 537810 - }, - { - "epoch": 0.94, - "learning_rate": 3.1053268554009704e-06, - "loss": 2.1727, - "step": 537820 - }, - { - "epoch": 0.94, - "learning_rate": 3.1044549154741438e-06, - "loss": 2.2889, - "step": 537830 - }, - { - "epoch": 0.94, - "learning_rate": 3.103582975547317e-06, - "loss": 2.1305, - "step": 537840 - }, - { - "epoch": 0.94, - "learning_rate": 3.10271103562049e-06, - "loss": 2.1498, - "step": 537850 - }, - { - "epoch": 0.94, - "learning_rate": 3.1018390956936634e-06, - "loss": 2.2472, - "step": 537860 - }, - { - "epoch": 0.94, - "learning_rate": 3.1009671557668363e-06, - "loss": 2.1019, - "step": 537870 - }, - { - "epoch": 0.94, - "learning_rate": 3.1000952158400096e-06, - "loss": 2.2235, - "step": 537880 - }, - { - "epoch": 0.94, - "learning_rate": 3.099223275913183e-06, - "loss": 2.2897, - "step": 537890 - }, - { - "epoch": 0.94, - "learning_rate": 3.0983513359863563e-06, - "loss": 2.279, - "step": 537900 - }, - { - "epoch": 0.94, - "learning_rate": 3.0974793960595293e-06, - "loss": 2.29, - "step": 537910 - }, - { - "epoch": 0.94, - "learning_rate": 3.0966074561327026e-06, - "loss": 2.1617, - "step": 537920 - }, - { - "epoch": 0.94, - "learning_rate": 3.0957355162058755e-06, - "loss": 2.198, - "step": 537930 - }, - { - "epoch": 0.94, - "learning_rate": 3.094863576279049e-06, - "loss": 2.2504, - "step": 537940 - }, - { - "epoch": 0.94, - "learning_rate": 3.093991636352222e-06, - "loss": 2.2537, - "step": 537950 - }, - { - "epoch": 0.94, - "learning_rate": 3.093119696425395e-06, - "loss": 2.1914, - "step": 537960 - }, - { - "epoch": 0.94, - "learning_rate": 3.0922477564985685e-06, - "loss": 2.3215, - "step": 537970 - }, - { - "epoch": 0.94, - "learning_rate": 3.091375816571742e-06, - "loss": 2.3401, - "step": 537980 - }, - { - "epoch": 0.94, - "learning_rate": 3.0905038766449148e-06, - "loss": 2.271, - "step": 537990 - }, - { - "epoch": 0.94, - "learning_rate": 3.089631936718088e-06, - "loss": 2.2241, - "step": 538000 - }, - { - "epoch": 0.94, - "learning_rate": 3.088759996791261e-06, - "loss": 2.2137, - "step": 538010 - }, - { - "epoch": 0.94, - "learning_rate": 3.0878880568644344e-06, - "loss": 2.3792, - "step": 538020 - }, - { - "epoch": 0.94, - "learning_rate": 3.0870161169376077e-06, - "loss": 2.3484, - "step": 538030 - }, - { - "epoch": 0.94, - "learning_rate": 3.086144177010781e-06, - "loss": 2.2959, - "step": 538040 - }, - { - "epoch": 0.94, - "learning_rate": 3.085272237083954e-06, - "loss": 2.3472, - "step": 538050 - }, - { - "epoch": 0.94, - "learning_rate": 3.0844002971571273e-06, - "loss": 2.2093, - "step": 538060 - }, - { - "epoch": 0.94, - "learning_rate": 3.0835283572303003e-06, - "loss": 2.2218, - "step": 538070 - }, - { - "epoch": 0.94, - "learning_rate": 3.0826564173034736e-06, - "loss": 2.2519, - "step": 538080 - }, - { - "epoch": 0.94, - "learning_rate": 3.081784477376647e-06, - "loss": 2.2299, - "step": 538090 - }, - { - "epoch": 0.94, - "learning_rate": 3.0809125374498203e-06, - "loss": 2.333, - "step": 538100 - }, - { - "epoch": 0.94, - "learning_rate": 3.0800405975229932e-06, - "loss": 2.2391, - "step": 538110 - }, - { - "epoch": 0.94, - "learning_rate": 3.0791686575961666e-06, - "loss": 2.2007, - "step": 538120 - }, - { - "epoch": 0.94, - "learning_rate": 3.0782967176693395e-06, - "loss": 2.335, - "step": 538130 - }, - { - "epoch": 0.94, - "learning_rate": 3.077424777742513e-06, - "loss": 2.2149, - "step": 538140 - }, - { - "epoch": 0.94, - "learning_rate": 3.0765528378156858e-06, - "loss": 2.2026, - "step": 538150 - }, - { - "epoch": 0.94, - "learning_rate": 3.0756808978888595e-06, - "loss": 2.2326, - "step": 538160 - }, - { - "epoch": 0.94, - "learning_rate": 3.0748089579620325e-06, - "loss": 2.2673, - "step": 538170 - }, - { - "epoch": 0.94, - "learning_rate": 3.073937018035206e-06, - "loss": 2.156, - "step": 538180 - }, - { - "epoch": 0.94, - "learning_rate": 3.0730650781083787e-06, - "loss": 2.3259, - "step": 538190 - }, - { - "epoch": 0.94, - "learning_rate": 3.072193138181552e-06, - "loss": 2.3315, - "step": 538200 - }, - { - "epoch": 0.94, - "learning_rate": 3.071321198254725e-06, - "loss": 2.336, - "step": 538210 - }, - { - "epoch": 0.94, - "learning_rate": 3.0704492583278983e-06, - "loss": 2.2484, - "step": 538220 - }, - { - "epoch": 0.94, - "learning_rate": 3.0695773184010717e-06, - "loss": 2.2614, - "step": 538230 - }, - { - "epoch": 0.94, - "learning_rate": 3.068705378474245e-06, - "loss": 2.1838, - "step": 538240 - }, - { - "epoch": 0.94, - "learning_rate": 3.067833438547418e-06, - "loss": 2.3151, - "step": 538250 - }, - { - "epoch": 0.94, - "learning_rate": 3.0669614986205913e-06, - "loss": 2.4027, - "step": 538260 - }, - { - "epoch": 0.94, - "learning_rate": 3.0660895586937642e-06, - "loss": 2.2875, - "step": 538270 - }, - { - "epoch": 0.94, - "learning_rate": 3.0652176187669376e-06, - "loss": 2.2285, - "step": 538280 - }, - { - "epoch": 0.94, - "learning_rate": 3.064345678840111e-06, - "loss": 2.2681, - "step": 538290 - }, - { - "epoch": 0.94, - "learning_rate": 3.0634737389132843e-06, - "loss": 2.2327, - "step": 538300 - }, - { - "epoch": 0.94, - "learning_rate": 3.062601798986457e-06, - "loss": 2.3268, - "step": 538310 - }, - { - "epoch": 0.94, - "learning_rate": 3.0617298590596305e-06, - "loss": 2.2679, - "step": 538320 - }, - { - "epoch": 0.94, - "learning_rate": 3.0608579191328035e-06, - "loss": 2.1337, - "step": 538330 - }, - { - "epoch": 0.94, - "learning_rate": 3.059985979205977e-06, - "loss": 2.2828, - "step": 538340 - }, - { - "epoch": 0.94, - "learning_rate": 3.0591140392791497e-06, - "loss": 2.2102, - "step": 538350 - }, - { - "epoch": 0.94, - "learning_rate": 3.0582420993523235e-06, - "loss": 2.2311, - "step": 538360 - }, - { - "epoch": 0.94, - "learning_rate": 3.0573701594254964e-06, - "loss": 2.2303, - "step": 538370 - }, - { - "epoch": 0.94, - "learning_rate": 3.0564982194986698e-06, - "loss": 2.3625, - "step": 538380 - }, - { - "epoch": 0.94, - "learning_rate": 3.0556262795718427e-06, - "loss": 2.2991, - "step": 538390 - }, - { - "epoch": 0.94, - "learning_rate": 3.054754339645016e-06, - "loss": 2.2171, - "step": 538400 - }, - { - "epoch": 0.94, - "learning_rate": 3.053882399718189e-06, - "loss": 2.2216, - "step": 538410 - }, - { - "epoch": 0.94, - "learning_rate": 3.0530104597913627e-06, - "loss": 2.2384, - "step": 538420 - }, - { - "epoch": 0.94, - "learning_rate": 3.0521385198645357e-06, - "loss": 2.203, - "step": 538430 - }, - { - "epoch": 0.94, - "learning_rate": 3.051266579937709e-06, - "loss": 2.3495, - "step": 538440 - }, - { - "epoch": 0.94, - "learning_rate": 3.050394640010882e-06, - "loss": 2.3383, - "step": 538450 - }, - { - "epoch": 0.94, - "learning_rate": 3.0495227000840553e-06, - "loss": 2.2315, - "step": 538460 - }, - { - "epoch": 0.94, - "learning_rate": 3.048650760157228e-06, - "loss": 2.2375, - "step": 538470 - }, - { - "epoch": 0.94, - "learning_rate": 3.0477788202304015e-06, - "loss": 2.325, - "step": 538480 - }, - { - "epoch": 0.94, - "learning_rate": 3.046906880303575e-06, - "loss": 2.1858, - "step": 538490 - }, - { - "epoch": 0.94, - "learning_rate": 3.0460349403767482e-06, - "loss": 2.2176, - "step": 538500 - }, - { - "epoch": 0.94, - "learning_rate": 3.045163000449921e-06, - "loss": 2.362, - "step": 538510 - }, - { - "epoch": 0.94, - "learning_rate": 3.0442910605230945e-06, - "loss": 2.231, - "step": 538520 - }, - { - "epoch": 0.94, - "learning_rate": 3.0434191205962674e-06, - "loss": 2.2626, - "step": 538530 - }, - { - "epoch": 0.94, - "learning_rate": 3.0425471806694408e-06, - "loss": 2.0989, - "step": 538540 - }, - { - "epoch": 0.94, - "learning_rate": 3.0416752407426137e-06, - "loss": 2.2577, - "step": 538550 - }, - { - "epoch": 0.94, - "learning_rate": 3.0408033008157875e-06, - "loss": 2.231, - "step": 538560 - }, - { - "epoch": 0.94, - "learning_rate": 3.0399313608889604e-06, - "loss": 2.2074, - "step": 538570 - }, - { - "epoch": 0.94, - "learning_rate": 3.0390594209621337e-06, - "loss": 2.268, - "step": 538580 - }, - { - "epoch": 0.94, - "learning_rate": 3.0381874810353067e-06, - "loss": 2.2338, - "step": 538590 - }, - { - "epoch": 0.94, - "learning_rate": 3.03731554110848e-06, - "loss": 2.2253, - "step": 538600 - }, - { - "epoch": 0.94, - "learning_rate": 3.036443601181653e-06, - "loss": 2.36, - "step": 538610 - }, - { - "epoch": 0.94, - "learning_rate": 3.0355716612548267e-06, - "loss": 2.1486, - "step": 538620 - }, - { - "epoch": 0.94, - "learning_rate": 3.0346997213279996e-06, - "loss": 2.2602, - "step": 538630 - }, - { - "epoch": 0.94, - "learning_rate": 3.033827781401173e-06, - "loss": 2.2557, - "step": 538640 - }, - { - "epoch": 0.94, - "learning_rate": 3.032955841474346e-06, - "loss": 2.2848, - "step": 538650 - }, - { - "epoch": 0.94, - "learning_rate": 3.0320839015475192e-06, - "loss": 2.3446, - "step": 538660 - }, - { - "epoch": 0.94, - "learning_rate": 3.031211961620692e-06, - "loss": 2.2588, - "step": 538670 - }, - { - "epoch": 0.94, - "learning_rate": 3.0303400216938655e-06, - "loss": 2.2247, - "step": 538680 - }, - { - "epoch": 0.94, - "learning_rate": 3.029468081767039e-06, - "loss": 2.317, - "step": 538690 - }, - { - "epoch": 0.94, - "learning_rate": 3.028596141840212e-06, - "loss": 2.1933, - "step": 538700 - }, - { - "epoch": 0.94, - "learning_rate": 3.027724201913385e-06, - "loss": 2.341, - "step": 538710 - }, - { - "epoch": 0.94, - "learning_rate": 3.0268522619865585e-06, - "loss": 2.1921, - "step": 538720 - }, - { - "epoch": 0.94, - "learning_rate": 3.0259803220597314e-06, - "loss": 2.2067, - "step": 538730 - }, - { - "epoch": 0.94, - "learning_rate": 3.0251083821329047e-06, - "loss": 2.2744, - "step": 538740 - }, - { - "epoch": 0.94, - "learning_rate": 3.024236442206078e-06, - "loss": 2.2983, - "step": 538750 - }, - { - "epoch": 0.94, - "learning_rate": 3.0233645022792514e-06, - "loss": 2.2492, - "step": 538760 - }, - { - "epoch": 0.94, - "learning_rate": 3.0224925623524243e-06, - "loss": 2.2708, - "step": 538770 - }, - { - "epoch": 0.94, - "learning_rate": 3.0216206224255977e-06, - "loss": 2.3082, - "step": 538780 - }, - { - "epoch": 0.94, - "learning_rate": 3.0207486824987706e-06, - "loss": 2.2357, - "step": 538790 - }, - { - "epoch": 0.94, - "learning_rate": 3.019876742571944e-06, - "loss": 2.2389, - "step": 538800 - }, - { - "epoch": 0.94, - "learning_rate": 3.019004802645117e-06, - "loss": 2.2049, - "step": 538810 - }, - { - "epoch": 0.94, - "learning_rate": 3.0181328627182907e-06, - "loss": 2.2336, - "step": 538820 - }, - { - "epoch": 0.94, - "learning_rate": 3.0172609227914636e-06, - "loss": 2.2695, - "step": 538830 - }, - { - "epoch": 0.94, - "learning_rate": 3.016388982864637e-06, - "loss": 2.1233, - "step": 538840 - }, - { - "epoch": 0.94, - "learning_rate": 3.01551704293781e-06, - "loss": 2.1803, - "step": 538850 - }, - { - "epoch": 0.94, - "learning_rate": 3.014645103010983e-06, - "loss": 2.2154, - "step": 538860 - }, - { - "epoch": 0.94, - "learning_rate": 3.013773163084156e-06, - "loss": 2.1458, - "step": 538870 - }, - { - "epoch": 0.94, - "learning_rate": 3.0129012231573295e-06, - "loss": 2.2503, - "step": 538880 - }, - { - "epoch": 0.94, - "learning_rate": 3.012029283230503e-06, - "loss": 2.1722, - "step": 538890 - }, - { - "epoch": 0.94, - "learning_rate": 3.011157343303676e-06, - "loss": 2.2256, - "step": 538900 - }, - { - "epoch": 0.94, - "learning_rate": 3.010285403376849e-06, - "loss": 2.326, - "step": 538910 - }, - { - "epoch": 0.94, - "learning_rate": 3.0094134634500224e-06, - "loss": 2.2235, - "step": 538920 - }, - { - "epoch": 0.94, - "learning_rate": 3.0085415235231953e-06, - "loss": 2.3167, - "step": 538930 - }, - { - "epoch": 0.94, - "learning_rate": 3.0076695835963687e-06, - "loss": 2.2821, - "step": 538940 - }, - { - "epoch": 0.94, - "learning_rate": 3.006797643669542e-06, - "loss": 2.3024, - "step": 538950 - }, - { - "epoch": 0.94, - "learning_rate": 3.0059257037427154e-06, - "loss": 2.168, - "step": 538960 - }, - { - "epoch": 0.94, - "learning_rate": 3.0050537638158883e-06, - "loss": 2.2276, - "step": 538970 - }, - { - "epoch": 0.94, - "learning_rate": 3.0041818238890617e-06, - "loss": 2.2684, - "step": 538980 - }, - { - "epoch": 0.94, - "learning_rate": 3.0033098839622346e-06, - "loss": 2.2646, - "step": 538990 - }, - { - "epoch": 0.94, - "learning_rate": 3.002437944035408e-06, - "loss": 2.302, - "step": 539000 - }, - { - "epoch": 0.94, - "learning_rate": 3.001566004108581e-06, - "loss": 2.2066, - "step": 539010 - }, - { - "epoch": 0.94, - "learning_rate": 3.0006940641817546e-06, - "loss": 2.2302, - "step": 539020 - }, - { - "epoch": 0.94, - "learning_rate": 2.9998221242549275e-06, - "loss": 2.2653, - "step": 539030 - }, - { - "epoch": 0.94, - "learning_rate": 2.998950184328101e-06, - "loss": 2.0885, - "step": 539040 - }, - { - "epoch": 0.94, - "learning_rate": 2.998078244401274e-06, - "loss": 2.3462, - "step": 539050 - }, - { - "epoch": 0.94, - "learning_rate": 2.997206304474447e-06, - "loss": 2.3821, - "step": 539060 - }, - { - "epoch": 0.94, - "learning_rate": 2.99633436454762e-06, - "loss": 2.2756, - "step": 539070 - }, - { - "epoch": 0.94, - "learning_rate": 2.9954624246207934e-06, - "loss": 2.1996, - "step": 539080 - }, - { - "epoch": 0.94, - "learning_rate": 2.9945904846939668e-06, - "loss": 2.3177, - "step": 539090 - }, - { - "epoch": 0.94, - "learning_rate": 2.99371854476714e-06, - "loss": 2.1772, - "step": 539100 - }, - { - "epoch": 0.94, - "learning_rate": 2.992846604840313e-06, - "loss": 2.1176, - "step": 539110 - }, - { - "epoch": 0.94, - "learning_rate": 2.9919746649134864e-06, - "loss": 2.2484, - "step": 539120 - }, - { - "epoch": 0.94, - "learning_rate": 2.9911027249866593e-06, - "loss": 2.1558, - "step": 539130 - }, - { - "epoch": 0.94, - "learning_rate": 2.9902307850598327e-06, - "loss": 2.2883, - "step": 539140 - }, - { - "epoch": 0.94, - "learning_rate": 2.989358845133006e-06, - "loss": 2.2449, - "step": 539150 - }, - { - "epoch": 0.94, - "learning_rate": 2.9884869052061794e-06, - "loss": 2.235, - "step": 539160 - }, - { - "epoch": 0.94, - "learning_rate": 2.9876149652793523e-06, - "loss": 2.2053, - "step": 539170 - }, - { - "epoch": 0.94, - "learning_rate": 2.9867430253525256e-06, - "loss": 2.2278, - "step": 539180 - }, - { - "epoch": 0.94, - "learning_rate": 2.9858710854256985e-06, - "loss": 2.3148, - "step": 539190 - }, - { - "epoch": 0.94, - "learning_rate": 2.984999145498872e-06, - "loss": 2.1276, - "step": 539200 - }, - { - "epoch": 0.94, - "learning_rate": 2.984127205572045e-06, - "loss": 2.2232, - "step": 539210 - }, - { - "epoch": 0.94, - "learning_rate": 2.9832552656452186e-06, - "loss": 2.1979, - "step": 539220 - }, - { - "epoch": 0.94, - "learning_rate": 2.9823833257183915e-06, - "loss": 2.2856, - "step": 539230 - }, - { - "epoch": 0.94, - "learning_rate": 2.981511385791565e-06, - "loss": 2.3332, - "step": 539240 - }, - { - "epoch": 0.94, - "learning_rate": 2.9806394458647378e-06, - "loss": 2.239, - "step": 539250 - }, - { - "epoch": 0.94, - "learning_rate": 2.979767505937911e-06, - "loss": 2.2871, - "step": 539260 - }, - { - "epoch": 0.94, - "learning_rate": 2.978895566011084e-06, - "loss": 2.3672, - "step": 539270 - }, - { - "epoch": 0.94, - "learning_rate": 2.9780236260842574e-06, - "loss": 2.3777, - "step": 539280 - }, - { - "epoch": 0.94, - "learning_rate": 2.9771516861574307e-06, - "loss": 2.2182, - "step": 539290 - }, - { - "epoch": 0.94, - "learning_rate": 2.976279746230604e-06, - "loss": 2.1132, - "step": 539300 - }, - { - "epoch": 0.94, - "learning_rate": 2.975407806303777e-06, - "loss": 2.2654, - "step": 539310 - }, - { - "epoch": 0.94, - "learning_rate": 2.9745358663769504e-06, - "loss": 2.1756, - "step": 539320 - }, - { - "epoch": 0.94, - "learning_rate": 2.9736639264501233e-06, - "loss": 2.3638, - "step": 539330 - }, - { - "epoch": 0.94, - "learning_rate": 2.9727919865232966e-06, - "loss": 2.3133, - "step": 539340 - }, - { - "epoch": 0.94, - "learning_rate": 2.97192004659647e-06, - "loss": 2.128, - "step": 539350 - }, - { - "epoch": 0.94, - "learning_rate": 2.9710481066696433e-06, - "loss": 2.2716, - "step": 539360 - }, - { - "epoch": 0.94, - "learning_rate": 2.9701761667428162e-06, - "loss": 2.2794, - "step": 539370 - }, - { - "epoch": 0.94, - "learning_rate": 2.9693042268159896e-06, - "loss": 2.2574, - "step": 539380 - }, - { - "epoch": 0.94, - "learning_rate": 2.9684322868891625e-06, - "loss": 2.3982, - "step": 539390 - }, - { - "epoch": 0.94, - "learning_rate": 2.967560346962336e-06, - "loss": 2.2724, - "step": 539400 - }, - { - "epoch": 0.94, - "learning_rate": 2.9666884070355088e-06, - "loss": 2.097, - "step": 539410 - }, - { - "epoch": 0.94, - "learning_rate": 2.9658164671086825e-06, - "loss": 2.2299, - "step": 539420 - }, - { - "epoch": 0.94, - "learning_rate": 2.9649445271818555e-06, - "loss": 2.2144, - "step": 539430 - }, - { - "epoch": 0.94, - "learning_rate": 2.964072587255029e-06, - "loss": 2.1987, - "step": 539440 - }, - { - "epoch": 0.94, - "learning_rate": 2.9632006473282017e-06, - "loss": 2.2401, - "step": 539450 - }, - { - "epoch": 0.94, - "learning_rate": 2.962328707401375e-06, - "loss": 2.2864, - "step": 539460 - }, - { - "epoch": 0.94, - "learning_rate": 2.961456767474548e-06, - "loss": 2.3012, - "step": 539470 - }, - { - "epoch": 0.94, - "learning_rate": 2.9605848275477214e-06, - "loss": 2.25, - "step": 539480 - }, - { - "epoch": 0.94, - "learning_rate": 2.9597128876208947e-06, - "loss": 2.2975, - "step": 539490 - }, - { - "epoch": 0.94, - "learning_rate": 2.958840947694068e-06, - "loss": 2.222, - "step": 539500 - }, - { - "epoch": 0.94, - "learning_rate": 2.957969007767241e-06, - "loss": 2.3901, - "step": 539510 - }, - { - "epoch": 0.94, - "learning_rate": 2.9570970678404143e-06, - "loss": 2.2003, - "step": 539520 - }, - { - "epoch": 0.94, - "learning_rate": 2.9562251279135872e-06, - "loss": 2.2822, - "step": 539530 - }, - { - "epoch": 0.94, - "learning_rate": 2.9553531879867606e-06, - "loss": 2.2553, - "step": 539540 - }, - { - "epoch": 0.94, - "learning_rate": 2.954481248059934e-06, - "loss": 2.2627, - "step": 539550 - }, - { - "epoch": 0.94, - "learning_rate": 2.9536093081331073e-06, - "loss": 2.3358, - "step": 539560 - }, - { - "epoch": 0.94, - "learning_rate": 2.95273736820628e-06, - "loss": 2.0655, - "step": 539570 - }, - { - "epoch": 0.94, - "learning_rate": 2.9518654282794535e-06, - "loss": 2.228, - "step": 539580 - }, - { - "epoch": 0.94, - "learning_rate": 2.9509934883526265e-06, - "loss": 2.1838, - "step": 539590 - }, - { - "epoch": 0.94, - "learning_rate": 2.9501215484258e-06, - "loss": 2.256, - "step": 539600 - }, - { - "epoch": 0.94, - "learning_rate": 2.9492496084989727e-06, - "loss": 2.2456, - "step": 539610 - }, - { - "epoch": 0.94, - "learning_rate": 2.9483776685721465e-06, - "loss": 2.3102, - "step": 539620 - }, - { - "epoch": 0.94, - "learning_rate": 2.9475057286453194e-06, - "loss": 2.2184, - "step": 539630 - }, - { - "epoch": 0.94, - "learning_rate": 2.9466337887184928e-06, - "loss": 2.2501, - "step": 539640 - }, - { - "epoch": 0.94, - "learning_rate": 2.9457618487916657e-06, - "loss": 2.2602, - "step": 539650 - }, - { - "epoch": 0.94, - "learning_rate": 2.944889908864839e-06, - "loss": 2.324, - "step": 539660 - }, - { - "epoch": 0.94, - "learning_rate": 2.944017968938012e-06, - "loss": 2.2136, - "step": 539670 - }, - { - "epoch": 0.94, - "learning_rate": 2.9431460290111853e-06, - "loss": 2.217, - "step": 539680 - }, - { - "epoch": 0.94, - "learning_rate": 2.9422740890843587e-06, - "loss": 2.3251, - "step": 539690 - }, - { - "epoch": 0.94, - "learning_rate": 2.941402149157532e-06, - "loss": 2.2054, - "step": 539700 - }, - { - "epoch": 0.94, - "learning_rate": 2.940530209230705e-06, - "loss": 2.1712, - "step": 539710 - }, - { - "epoch": 0.94, - "learning_rate": 2.9396582693038783e-06, - "loss": 2.1703, - "step": 539720 - }, - { - "epoch": 0.94, - "learning_rate": 2.938786329377051e-06, - "loss": 2.2816, - "step": 539730 - }, - { - "epoch": 0.94, - "learning_rate": 2.9379143894502245e-06, - "loss": 2.2571, - "step": 539740 - }, - { - "epoch": 0.94, - "learning_rate": 2.937042449523398e-06, - "loss": 2.2897, - "step": 539750 - }, - { - "epoch": 0.94, - "learning_rate": 2.9361705095965712e-06, - "loss": 2.2736, - "step": 539760 - }, - { - "epoch": 0.94, - "learning_rate": 2.935298569669744e-06, - "loss": 2.3179, - "step": 539770 - }, - { - "epoch": 0.94, - "learning_rate": 2.9344266297429175e-06, - "loss": 2.1965, - "step": 539780 - }, - { - "epoch": 0.94, - "learning_rate": 2.9335546898160904e-06, - "loss": 2.3385, - "step": 539790 - }, - { - "epoch": 0.94, - "learning_rate": 2.9326827498892638e-06, - "loss": 2.2129, - "step": 539800 - }, - { - "epoch": 0.94, - "learning_rate": 2.9318108099624367e-06, - "loss": 2.2405, - "step": 539810 - }, - { - "epoch": 0.94, - "learning_rate": 2.9309388700356105e-06, - "loss": 2.2127, - "step": 539820 - }, - { - "epoch": 0.94, - "learning_rate": 2.9300669301087834e-06, - "loss": 2.3267, - "step": 539830 - }, - { - "epoch": 0.94, - "learning_rate": 2.9291949901819567e-06, - "loss": 2.1402, - "step": 539840 - }, - { - "epoch": 0.94, - "learning_rate": 2.9283230502551297e-06, - "loss": 2.2536, - "step": 539850 - }, - { - "epoch": 0.94, - "learning_rate": 2.927451110328303e-06, - "loss": 2.2806, - "step": 539860 - }, - { - "epoch": 0.94, - "learning_rate": 2.926579170401476e-06, - "loss": 2.2737, - "step": 539870 - }, - { - "epoch": 0.94, - "learning_rate": 2.9257072304746493e-06, - "loss": 2.2023, - "step": 539880 - }, - { - "epoch": 0.94, - "learning_rate": 2.9248352905478226e-06, - "loss": 2.138, - "step": 539890 - }, - { - "epoch": 0.94, - "learning_rate": 2.923963350620996e-06, - "loss": 2.207, - "step": 539900 - }, - { - "epoch": 0.94, - "learning_rate": 2.923091410694169e-06, - "loss": 2.1866, - "step": 539910 - }, - { - "epoch": 0.94, - "learning_rate": 2.9222194707673422e-06, - "loss": 2.1378, - "step": 539920 - }, - { - "epoch": 0.94, - "learning_rate": 2.921347530840515e-06, - "loss": 2.2999, - "step": 539930 - }, - { - "epoch": 0.94, - "learning_rate": 2.9204755909136885e-06, - "loss": 2.3994, - "step": 539940 - }, - { - "epoch": 0.94, - "learning_rate": 2.919603650986862e-06, - "loss": 2.2017, - "step": 539950 - }, - { - "epoch": 0.94, - "learning_rate": 2.918731711060035e-06, - "loss": 2.2468, - "step": 539960 - }, - { - "epoch": 0.94, - "learning_rate": 2.917859771133208e-06, - "loss": 2.2979, - "step": 539970 - }, - { - "epoch": 0.94, - "learning_rate": 2.9169878312063815e-06, - "loss": 2.3121, - "step": 539980 - }, - { - "epoch": 0.94, - "learning_rate": 2.9161158912795544e-06, - "loss": 2.2874, - "step": 539990 - }, - { - "epoch": 0.94, - "learning_rate": 2.9152439513527277e-06, - "loss": 2.2134, - "step": 540000 - }, - { - "epoch": 0.94, - "learning_rate": 2.9143720114259007e-06, - "loss": 2.2113, - "step": 540010 - }, - { - "epoch": 0.94, - "learning_rate": 2.9135000714990744e-06, - "loss": 2.2596, - "step": 540020 - }, - { - "epoch": 0.94, - "learning_rate": 2.9126281315722474e-06, - "loss": 2.3426, - "step": 540030 - }, - { - "epoch": 0.94, - "learning_rate": 2.9117561916454207e-06, - "loss": 2.1943, - "step": 540040 - }, - { - "epoch": 0.94, - "learning_rate": 2.9108842517185936e-06, - "loss": 2.2508, - "step": 540050 - }, - { - "epoch": 0.94, - "learning_rate": 2.910012311791767e-06, - "loss": 2.2456, - "step": 540060 - }, - { - "epoch": 0.94, - "learning_rate": 2.90914037186494e-06, - "loss": 2.3432, - "step": 540070 - }, - { - "epoch": 0.94, - "learning_rate": 2.9082684319381132e-06, - "loss": 2.282, - "step": 540080 - }, - { - "epoch": 0.94, - "learning_rate": 2.9073964920112866e-06, - "loss": 2.151, - "step": 540090 - }, - { - "epoch": 0.94, - "learning_rate": 2.90652455208446e-06, - "loss": 2.2381, - "step": 540100 - }, - { - "epoch": 0.94, - "learning_rate": 2.905652612157633e-06, - "loss": 2.3599, - "step": 540110 - }, - { - "epoch": 0.94, - "learning_rate": 2.904780672230806e-06, - "loss": 2.343, - "step": 540120 - }, - { - "epoch": 0.94, - "learning_rate": 2.903908732303979e-06, - "loss": 2.2384, - "step": 540130 - }, - { - "epoch": 0.94, - "learning_rate": 2.9030367923771525e-06, - "loss": 2.1882, - "step": 540140 - }, - { - "epoch": 0.94, - "learning_rate": 2.902164852450326e-06, - "loss": 2.2624, - "step": 540150 - }, - { - "epoch": 0.94, - "learning_rate": 2.901292912523499e-06, - "loss": 2.1403, - "step": 540160 - }, - { - "epoch": 0.94, - "learning_rate": 2.900420972596672e-06, - "loss": 2.2205, - "step": 540170 - }, - { - "epoch": 0.94, - "learning_rate": 2.8995490326698454e-06, - "loss": 2.3256, - "step": 540180 - }, - { - "epoch": 0.94, - "learning_rate": 2.8986770927430184e-06, - "loss": 2.2557, - "step": 540190 - }, - { - "epoch": 0.94, - "learning_rate": 2.8978051528161917e-06, - "loss": 2.1819, - "step": 540200 - }, - { - "epoch": 0.94, - "learning_rate": 2.8969332128893646e-06, - "loss": 2.2904, - "step": 540210 - }, - { - "epoch": 0.94, - "learning_rate": 2.8960612729625384e-06, - "loss": 2.2203, - "step": 540220 - }, - { - "epoch": 0.94, - "learning_rate": 2.8951893330357113e-06, - "loss": 2.2878, - "step": 540230 - }, - { - "epoch": 0.94, - "learning_rate": 2.8943173931088847e-06, - "loss": 2.2856, - "step": 540240 - }, - { - "epoch": 0.94, - "learning_rate": 2.8934454531820576e-06, - "loss": 2.2974, - "step": 540250 - }, - { - "epoch": 0.94, - "learning_rate": 2.892573513255231e-06, - "loss": 2.3288, - "step": 540260 - }, - { - "epoch": 0.94, - "learning_rate": 2.891701573328404e-06, - "loss": 2.3138, - "step": 540270 - }, - { - "epoch": 0.94, - "learning_rate": 2.8908296334015776e-06, - "loss": 2.2988, - "step": 540280 - }, - { - "epoch": 0.94, - "learning_rate": 2.8899576934747506e-06, - "loss": 2.2295, - "step": 540290 - }, - { - "epoch": 0.94, - "learning_rate": 2.889085753547924e-06, - "loss": 2.2917, - "step": 540300 - }, - { - "epoch": 0.94, - "learning_rate": 2.888213813621097e-06, - "loss": 2.1653, - "step": 540310 - }, - { - "epoch": 0.94, - "learning_rate": 2.88734187369427e-06, - "loss": 2.309, - "step": 540320 - }, - { - "epoch": 0.94, - "learning_rate": 2.886469933767443e-06, - "loss": 2.299, - "step": 540330 - }, - { - "epoch": 0.94, - "learning_rate": 2.8855979938406164e-06, - "loss": 2.2283, - "step": 540340 - }, - { - "epoch": 0.94, - "learning_rate": 2.8847260539137898e-06, - "loss": 2.334, - "step": 540350 - }, - { - "epoch": 0.94, - "learning_rate": 2.883854113986963e-06, - "loss": 2.2694, - "step": 540360 - }, - { - "epoch": 0.94, - "learning_rate": 2.882982174060136e-06, - "loss": 2.2008, - "step": 540370 - }, - { - "epoch": 0.94, - "learning_rate": 2.8821102341333094e-06, - "loss": 2.3084, - "step": 540380 - }, - { - "epoch": 0.94, - "learning_rate": 2.8812382942064823e-06, - "loss": 2.2588, - "step": 540390 - }, - { - "epoch": 0.94, - "learning_rate": 2.8803663542796557e-06, - "loss": 2.3873, - "step": 540400 - }, - { - "epoch": 0.94, - "learning_rate": 2.8794944143528286e-06, - "loss": 2.2096, - "step": 540410 - }, - { - "epoch": 0.94, - "learning_rate": 2.8786224744260024e-06, - "loss": 2.3244, - "step": 540420 - }, - { - "epoch": 0.94, - "learning_rate": 2.8777505344991753e-06, - "loss": 2.1248, - "step": 540430 - }, - { - "epoch": 0.94, - "learning_rate": 2.8768785945723486e-06, - "loss": 2.2167, - "step": 540440 - }, - { - "epoch": 0.94, - "learning_rate": 2.8760066546455216e-06, - "loss": 2.2877, - "step": 540450 - }, - { - "epoch": 0.94, - "learning_rate": 2.875134714718695e-06, - "loss": 2.3946, - "step": 540460 - }, - { - "epoch": 0.94, - "learning_rate": 2.874262774791868e-06, - "loss": 2.2434, - "step": 540470 - }, - { - "epoch": 0.94, - "learning_rate": 2.8733908348650416e-06, - "loss": 2.2508, - "step": 540480 - }, - { - "epoch": 0.94, - "learning_rate": 2.8725188949382145e-06, - "loss": 2.421, - "step": 540490 - }, - { - "epoch": 0.94, - "learning_rate": 2.871646955011388e-06, - "loss": 2.2716, - "step": 540500 - }, - { - "epoch": 0.94, - "learning_rate": 2.8707750150845608e-06, - "loss": 2.3113, - "step": 540510 - }, - { - "epoch": 0.94, - "learning_rate": 2.869903075157734e-06, - "loss": 2.2386, - "step": 540520 - }, - { - "epoch": 0.94, - "learning_rate": 2.869031135230907e-06, - "loss": 2.2159, - "step": 540530 - }, - { - "epoch": 0.94, - "learning_rate": 2.8681591953040804e-06, - "loss": 2.3384, - "step": 540540 - }, - { - "epoch": 0.94, - "learning_rate": 2.8672872553772537e-06, - "loss": 2.2309, - "step": 540550 - }, - { - "epoch": 0.94, - "learning_rate": 2.866415315450427e-06, - "loss": 2.2789, - "step": 540560 - }, - { - "epoch": 0.94, - "learning_rate": 2.8655433755236e-06, - "loss": 2.3167, - "step": 540570 - }, - { - "epoch": 0.94, - "learning_rate": 2.8646714355967734e-06, - "loss": 2.2653, - "step": 540580 - }, - { - "epoch": 0.94, - "learning_rate": 2.8637994956699463e-06, - "loss": 2.3175, - "step": 540590 - }, - { - "epoch": 0.94, - "learning_rate": 2.8629275557431196e-06, - "loss": 2.2194, - "step": 540600 - }, - { - "epoch": 0.94, - "learning_rate": 2.8620556158162926e-06, - "loss": 2.2829, - "step": 540610 - }, - { - "epoch": 0.94, - "learning_rate": 2.8611836758894663e-06, - "loss": 2.3105, - "step": 540620 - }, - { - "epoch": 0.94, - "learning_rate": 2.8603117359626392e-06, - "loss": 2.2302, - "step": 540630 - }, - { - "epoch": 0.94, - "learning_rate": 2.8594397960358126e-06, - "loss": 2.2409, - "step": 540640 - }, - { - "epoch": 0.94, - "learning_rate": 2.8585678561089855e-06, - "loss": 2.1455, - "step": 540650 - }, - { - "epoch": 0.94, - "learning_rate": 2.857695916182159e-06, - "loss": 2.186, - "step": 540660 - }, - { - "epoch": 0.94, - "learning_rate": 2.8568239762553318e-06, - "loss": 2.4162, - "step": 540670 - }, - { - "epoch": 0.94, - "learning_rate": 2.8559520363285056e-06, - "loss": 2.2992, - "step": 540680 - }, - { - "epoch": 0.94, - "learning_rate": 2.8550800964016785e-06, - "loss": 2.3027, - "step": 540690 - }, - { - "epoch": 0.94, - "learning_rate": 2.854208156474852e-06, - "loss": 2.29, - "step": 540700 - }, - { - "epoch": 0.94, - "learning_rate": 2.8533362165480247e-06, - "loss": 2.3895, - "step": 540710 - }, - { - "epoch": 0.94, - "learning_rate": 2.852464276621198e-06, - "loss": 2.3049, - "step": 540720 - }, - { - "epoch": 0.94, - "learning_rate": 2.851592336694371e-06, - "loss": 2.265, - "step": 540730 - }, - { - "epoch": 0.94, - "learning_rate": 2.8507203967675444e-06, - "loss": 2.3475, - "step": 540740 - }, - { - "epoch": 0.94, - "learning_rate": 2.8498484568407177e-06, - "loss": 2.261, - "step": 540750 - }, - { - "epoch": 0.94, - "learning_rate": 2.848976516913891e-06, - "loss": 2.241, - "step": 540760 - }, - { - "epoch": 0.94, - "learning_rate": 2.848104576987064e-06, - "loss": 2.2555, - "step": 540770 - }, - { - "epoch": 0.94, - "learning_rate": 2.8472326370602373e-06, - "loss": 2.2443, - "step": 540780 - }, - { - "epoch": 0.94, - "learning_rate": 2.8463606971334102e-06, - "loss": 2.272, - "step": 540790 - }, - { - "epoch": 0.94, - "learning_rate": 2.8454887572065836e-06, - "loss": 2.2289, - "step": 540800 - }, - { - "epoch": 0.94, - "learning_rate": 2.8446168172797565e-06, - "loss": 2.1593, - "step": 540810 - }, - { - "epoch": 0.94, - "learning_rate": 2.8437448773529303e-06, - "loss": 2.3521, - "step": 540820 - }, - { - "epoch": 0.94, - "learning_rate": 2.842872937426103e-06, - "loss": 2.2919, - "step": 540830 - }, - { - "epoch": 0.94, - "learning_rate": 2.8420009974992766e-06, - "loss": 2.2447, - "step": 540840 - }, - { - "epoch": 0.94, - "learning_rate": 2.8411290575724495e-06, - "loss": 2.3496, - "step": 540850 - }, - { - "epoch": 0.94, - "learning_rate": 2.840257117645623e-06, - "loss": 2.3239, - "step": 540860 - }, - { - "epoch": 0.94, - "learning_rate": 2.8393851777187957e-06, - "loss": 2.2108, - "step": 540870 - }, - { - "epoch": 0.94, - "learning_rate": 2.8385132377919695e-06, - "loss": 2.2232, - "step": 540880 - }, - { - "epoch": 0.94, - "learning_rate": 2.8376412978651424e-06, - "loss": 2.2325, - "step": 540890 - }, - { - "epoch": 0.94, - "learning_rate": 2.836769357938316e-06, - "loss": 2.2405, - "step": 540900 - }, - { - "epoch": 0.94, - "learning_rate": 2.8358974180114887e-06, - "loss": 2.2198, - "step": 540910 - }, - { - "epoch": 0.94, - "learning_rate": 2.835025478084662e-06, - "loss": 2.2733, - "step": 540920 - }, - { - "epoch": 0.94, - "learning_rate": 2.834153538157835e-06, - "loss": 2.1588, - "step": 540930 - }, - { - "epoch": 0.94, - "learning_rate": 2.8332815982310083e-06, - "loss": 2.1059, - "step": 540940 - }, - { - "epoch": 0.94, - "learning_rate": 2.8324096583041817e-06, - "loss": 2.2738, - "step": 540950 - }, - { - "epoch": 0.94, - "learning_rate": 2.831537718377355e-06, - "loss": 2.2489, - "step": 540960 - }, - { - "epoch": 0.94, - "learning_rate": 2.830665778450528e-06, - "loss": 2.2083, - "step": 540970 - }, - { - "epoch": 0.94, - "learning_rate": 2.8297938385237013e-06, - "loss": 2.2335, - "step": 540980 - }, - { - "epoch": 0.94, - "learning_rate": 2.8289218985968742e-06, - "loss": 2.1287, - "step": 540990 - }, - { - "epoch": 0.94, - "learning_rate": 2.8280499586700476e-06, - "loss": 2.2468, - "step": 541000 - }, - { - "epoch": 0.94, - "learning_rate": 2.8271780187432205e-06, - "loss": 2.3236, - "step": 541010 - }, - { - "epoch": 0.94, - "learning_rate": 2.8263060788163943e-06, - "loss": 2.3914, - "step": 541020 - }, - { - "epoch": 0.94, - "learning_rate": 2.825434138889567e-06, - "loss": 2.2496, - "step": 541030 - }, - { - "epoch": 0.94, - "learning_rate": 2.8245621989627405e-06, - "loss": 2.1572, - "step": 541040 - }, - { - "epoch": 0.94, - "learning_rate": 2.8236902590359134e-06, - "loss": 2.2968, - "step": 541050 - }, - { - "epoch": 0.94, - "learning_rate": 2.822818319109087e-06, - "loss": 2.2623, - "step": 541060 - }, - { - "epoch": 0.94, - "learning_rate": 2.8219463791822597e-06, - "loss": 2.2851, - "step": 541070 - }, - { - "epoch": 0.94, - "learning_rate": 2.8210744392554335e-06, - "loss": 2.1921, - "step": 541080 - }, - { - "epoch": 0.94, - "learning_rate": 2.8202024993286064e-06, - "loss": 2.2444, - "step": 541090 - }, - { - "epoch": 0.94, - "learning_rate": 2.8193305594017798e-06, - "loss": 2.2458, - "step": 541100 - }, - { - "epoch": 0.94, - "learning_rate": 2.8184586194749527e-06, - "loss": 2.1417, - "step": 541110 - }, - { - "epoch": 0.94, - "learning_rate": 2.817586679548126e-06, - "loss": 2.2236, - "step": 541120 - }, - { - "epoch": 0.94, - "learning_rate": 2.816714739621299e-06, - "loss": 2.2748, - "step": 541130 - }, - { - "epoch": 0.94, - "learning_rate": 2.8158427996944723e-06, - "loss": 2.3522, - "step": 541140 - }, - { - "epoch": 0.94, - "learning_rate": 2.8149708597676456e-06, - "loss": 2.2961, - "step": 541150 - }, - { - "epoch": 0.94, - "learning_rate": 2.814098919840819e-06, - "loss": 2.2983, - "step": 541160 - }, - { - "epoch": 0.94, - "learning_rate": 2.813226979913992e-06, - "loss": 2.3057, - "step": 541170 - }, - { - "epoch": 0.94, - "learning_rate": 2.8123550399871653e-06, - "loss": 2.1915, - "step": 541180 - }, - { - "epoch": 0.94, - "learning_rate": 2.811483100060338e-06, - "loss": 2.1937, - "step": 541190 - }, - { - "epoch": 0.94, - "learning_rate": 2.8106111601335115e-06, - "loss": 2.2664, - "step": 541200 - }, - { - "epoch": 0.94, - "learning_rate": 2.8097392202066844e-06, - "loss": 2.1822, - "step": 541210 - }, - { - "epoch": 0.94, - "learning_rate": 2.8088672802798582e-06, - "loss": 2.3907, - "step": 541220 - }, - { - "epoch": 0.94, - "learning_rate": 2.807995340353031e-06, - "loss": 2.3318, - "step": 541230 - }, - { - "epoch": 0.94, - "learning_rate": 2.8071234004262045e-06, - "loss": 2.1943, - "step": 541240 - }, - { - "epoch": 0.94, - "learning_rate": 2.8062514604993774e-06, - "loss": 2.3491, - "step": 541250 - }, - { - "epoch": 0.94, - "learning_rate": 2.8053795205725508e-06, - "loss": 2.1221, - "step": 541260 - }, - { - "epoch": 0.94, - "learning_rate": 2.8045075806457237e-06, - "loss": 2.2213, - "step": 541270 - }, - { - "epoch": 0.94, - "learning_rate": 2.8036356407188974e-06, - "loss": 2.1274, - "step": 541280 - }, - { - "epoch": 0.94, - "learning_rate": 2.8027637007920704e-06, - "loss": 2.2496, - "step": 541290 - }, - { - "epoch": 0.94, - "learning_rate": 2.8018917608652437e-06, - "loss": 2.2521, - "step": 541300 - }, - { - "epoch": 0.94, - "learning_rate": 2.8010198209384166e-06, - "loss": 2.3243, - "step": 541310 - }, - { - "epoch": 0.94, - "learning_rate": 2.80014788101159e-06, - "loss": 2.2248, - "step": 541320 - }, - { - "epoch": 0.94, - "learning_rate": 2.799275941084763e-06, - "loss": 2.2542, - "step": 541330 - }, - { - "epoch": 0.94, - "learning_rate": 2.7984040011579363e-06, - "loss": 2.3226, - "step": 541340 - }, - { - "epoch": 0.94, - "learning_rate": 2.7975320612311096e-06, - "loss": 2.2503, - "step": 541350 - }, - { - "epoch": 0.94, - "learning_rate": 2.796660121304283e-06, - "loss": 2.2996, - "step": 541360 - }, - { - "epoch": 0.94, - "learning_rate": 2.795788181377456e-06, - "loss": 2.295, - "step": 541370 - }, - { - "epoch": 0.94, - "learning_rate": 2.7949162414506292e-06, - "loss": 2.2106, - "step": 541380 - }, - { - "epoch": 0.94, - "learning_rate": 2.794044301523802e-06, - "loss": 2.3409, - "step": 541390 - }, - { - "epoch": 0.94, - "learning_rate": 2.7931723615969755e-06, - "loss": 2.2292, - "step": 541400 - }, - { - "epoch": 0.94, - "learning_rate": 2.7923004216701484e-06, - "loss": 2.2278, - "step": 541410 - }, - { - "epoch": 0.94, - "learning_rate": 2.791428481743322e-06, - "loss": 2.2276, - "step": 541420 - }, - { - "epoch": 0.94, - "learning_rate": 2.790556541816495e-06, - "loss": 2.263, - "step": 541430 - }, - { - "epoch": 0.94, - "learning_rate": 2.7896846018896684e-06, - "loss": 2.2881, - "step": 541440 - }, - { - "epoch": 0.94, - "learning_rate": 2.7888126619628414e-06, - "loss": 2.1251, - "step": 541450 - }, - { - "epoch": 0.94, - "learning_rate": 2.7879407220360147e-06, - "loss": 2.3008, - "step": 541460 - }, - { - "epoch": 0.94, - "learning_rate": 2.7870687821091876e-06, - "loss": 2.342, - "step": 541470 - }, - { - "epoch": 0.94, - "learning_rate": 2.7861968421823614e-06, - "loss": 2.2441, - "step": 541480 - }, - { - "epoch": 0.94, - "learning_rate": 2.7853249022555343e-06, - "loss": 2.3613, - "step": 541490 - }, - { - "epoch": 0.94, - "learning_rate": 2.7844529623287077e-06, - "loss": 2.1987, - "step": 541500 - }, - { - "epoch": 0.94, - "learning_rate": 2.7835810224018806e-06, - "loss": 2.2505, - "step": 541510 - }, - { - "epoch": 0.94, - "learning_rate": 2.782709082475054e-06, - "loss": 2.2227, - "step": 541520 - }, - { - "epoch": 0.94, - "learning_rate": 2.781837142548227e-06, - "loss": 2.3024, - "step": 541530 - }, - { - "epoch": 0.94, - "learning_rate": 2.7809652026214002e-06, - "loss": 2.2036, - "step": 541540 - }, - { - "epoch": 0.94, - "learning_rate": 2.7800932626945736e-06, - "loss": 2.304, - "step": 541550 - }, - { - "epoch": 0.94, - "learning_rate": 2.779221322767747e-06, - "loss": 2.321, - "step": 541560 - }, - { - "epoch": 0.94, - "learning_rate": 2.77834938284092e-06, - "loss": 2.3093, - "step": 541570 - }, - { - "epoch": 0.94, - "learning_rate": 2.777477442914093e-06, - "loss": 2.2561, - "step": 541580 - }, - { - "epoch": 0.94, - "learning_rate": 2.776605502987266e-06, - "loss": 2.3034, - "step": 541590 - }, - { - "epoch": 0.94, - "learning_rate": 2.7757335630604394e-06, - "loss": 2.1889, - "step": 541600 - }, - { - "epoch": 0.94, - "learning_rate": 2.774861623133613e-06, - "loss": 2.1813, - "step": 541610 - }, - { - "epoch": 0.94, - "learning_rate": 2.773989683206786e-06, - "loss": 2.2896, - "step": 541620 - }, - { - "epoch": 0.94, - "learning_rate": 2.773117743279959e-06, - "loss": 2.3173, - "step": 541630 - }, - { - "epoch": 0.94, - "learning_rate": 2.7722458033531324e-06, - "loss": 2.1663, - "step": 541640 - }, - { - "epoch": 0.94, - "learning_rate": 2.7713738634263053e-06, - "loss": 2.263, - "step": 541650 - }, - { - "epoch": 0.94, - "learning_rate": 2.7705019234994787e-06, - "loss": 2.2263, - "step": 541660 - }, - { - "epoch": 0.94, - "learning_rate": 2.7696299835726516e-06, - "loss": 2.1989, - "step": 541670 - }, - { - "epoch": 0.94, - "learning_rate": 2.7687580436458254e-06, - "loss": 2.2914, - "step": 541680 - }, - { - "epoch": 0.94, - "learning_rate": 2.7678861037189983e-06, - "loss": 2.3203, - "step": 541690 - }, - { - "epoch": 0.94, - "learning_rate": 2.7670141637921716e-06, - "loss": 2.3471, - "step": 541700 - }, - { - "epoch": 0.94, - "learning_rate": 2.7661422238653446e-06, - "loss": 2.3099, - "step": 541710 - }, - { - "epoch": 0.94, - "learning_rate": 2.765270283938518e-06, - "loss": 2.1245, - "step": 541720 - }, - { - "epoch": 0.94, - "learning_rate": 2.764398344011691e-06, - "loss": 2.2202, - "step": 541730 - }, - { - "epoch": 0.94, - "learning_rate": 2.763526404084864e-06, - "loss": 2.2339, - "step": 541740 - }, - { - "epoch": 0.94, - "learning_rate": 2.7626544641580375e-06, - "loss": 2.2455, - "step": 541750 - }, - { - "epoch": 0.94, - "learning_rate": 2.761782524231211e-06, - "loss": 2.1982, - "step": 541760 - }, - { - "epoch": 0.94, - "learning_rate": 2.760910584304384e-06, - "loss": 2.3577, - "step": 541770 - }, - { - "epoch": 0.94, - "learning_rate": 2.760038644377557e-06, - "loss": 2.2907, - "step": 541780 - }, - { - "epoch": 0.94, - "learning_rate": 2.75916670445073e-06, - "loss": 2.2584, - "step": 541790 - }, - { - "epoch": 0.94, - "learning_rate": 2.7582947645239034e-06, - "loss": 2.2408, - "step": 541800 - }, - { - "epoch": 0.94, - "learning_rate": 2.7574228245970768e-06, - "loss": 2.2726, - "step": 541810 - }, - { - "epoch": 0.94, - "learning_rate": 2.75655088467025e-06, - "loss": 2.3176, - "step": 541820 - }, - { - "epoch": 0.94, - "learning_rate": 2.755678944743423e-06, - "loss": 2.4122, - "step": 541830 - }, - { - "epoch": 0.94, - "learning_rate": 2.7548070048165964e-06, - "loss": 2.2176, - "step": 541840 - }, - { - "epoch": 0.94, - "learning_rate": 2.7539350648897693e-06, - "loss": 2.3301, - "step": 541850 - }, - { - "epoch": 0.94, - "learning_rate": 2.7530631249629426e-06, - "loss": 2.1891, - "step": 541860 - }, - { - "epoch": 0.94, - "learning_rate": 2.7521911850361156e-06, - "loss": 2.2989, - "step": 541870 - }, - { - "epoch": 0.94, - "learning_rate": 2.7513192451092893e-06, - "loss": 2.2439, - "step": 541880 - }, - { - "epoch": 0.94, - "learning_rate": 2.7504473051824623e-06, - "loss": 2.2117, - "step": 541890 - }, - { - "epoch": 0.95, - "learning_rate": 2.7495753652556356e-06, - "loss": 2.1015, - "step": 541900 - }, - { - "epoch": 0.95, - "learning_rate": 2.7487034253288085e-06, - "loss": 2.2446, - "step": 541910 - }, - { - "epoch": 0.95, - "learning_rate": 2.747831485401982e-06, - "loss": 2.3763, - "step": 541920 - }, - { - "epoch": 0.95, - "learning_rate": 2.746959545475155e-06, - "loss": 2.2387, - "step": 541930 - }, - { - "epoch": 0.95, - "learning_rate": 2.746087605548328e-06, - "loss": 2.2434, - "step": 541940 - }, - { - "epoch": 0.95, - "learning_rate": 2.7452156656215015e-06, - "loss": 2.2584, - "step": 541950 - }, - { - "epoch": 0.95, - "learning_rate": 2.744343725694675e-06, - "loss": 2.2054, - "step": 541960 - }, - { - "epoch": 0.95, - "learning_rate": 2.7434717857678478e-06, - "loss": 2.2764, - "step": 541970 - }, - { - "epoch": 0.95, - "learning_rate": 2.742599845841021e-06, - "loss": 2.1751, - "step": 541980 - }, - { - "epoch": 0.95, - "learning_rate": 2.741727905914194e-06, - "loss": 2.2874, - "step": 541990 - }, - { - "epoch": 0.95, - "learning_rate": 2.7408559659873674e-06, - "loss": 2.2982, - "step": 542000 - }, - { - "epoch": 0.95, - "learning_rate": 2.7399840260605407e-06, - "loss": 2.1865, - "step": 542010 - }, - { - "epoch": 0.95, - "learning_rate": 2.739112086133714e-06, - "loss": 2.231, - "step": 542020 - }, - { - "epoch": 0.95, - "learning_rate": 2.738240146206887e-06, - "loss": 2.2745, - "step": 542030 - }, - { - "epoch": 0.95, - "learning_rate": 2.7373682062800603e-06, - "loss": 2.2183, - "step": 542040 - }, - { - "epoch": 0.95, - "learning_rate": 2.7364962663532333e-06, - "loss": 2.293, - "step": 542050 - }, - { - "epoch": 0.95, - "learning_rate": 2.7356243264264066e-06, - "loss": 2.2182, - "step": 542060 - }, - { - "epoch": 0.95, - "learning_rate": 2.7347523864995795e-06, - "loss": 2.2624, - "step": 542070 - }, - { - "epoch": 0.95, - "learning_rate": 2.7338804465727533e-06, - "loss": 2.2767, - "step": 542080 - }, - { - "epoch": 0.95, - "learning_rate": 2.7330085066459262e-06, - "loss": 2.1843, - "step": 542090 - }, - { - "epoch": 0.95, - "learning_rate": 2.7321365667190996e-06, - "loss": 2.2788, - "step": 542100 - }, - { - "epoch": 0.95, - "learning_rate": 2.7312646267922725e-06, - "loss": 2.4059, - "step": 542110 - }, - { - "epoch": 0.95, - "learning_rate": 2.730392686865446e-06, - "loss": 2.3118, - "step": 542120 - }, - { - "epoch": 0.95, - "learning_rate": 2.7295207469386188e-06, - "loss": 2.287, - "step": 542130 - }, - { - "epoch": 0.95, - "learning_rate": 2.728648807011792e-06, - "loss": 2.2732, - "step": 542140 - }, - { - "epoch": 0.95, - "learning_rate": 2.7277768670849655e-06, - "loss": 2.1569, - "step": 542150 - }, - { - "epoch": 0.95, - "learning_rate": 2.726904927158139e-06, - "loss": 2.3242, - "step": 542160 - }, - { - "epoch": 0.95, - "learning_rate": 2.7260329872313117e-06, - "loss": 2.2388, - "step": 542170 - }, - { - "epoch": 0.95, - "learning_rate": 2.725161047304485e-06, - "loss": 2.2865, - "step": 542180 - }, - { - "epoch": 0.95, - "learning_rate": 2.724289107377658e-06, - "loss": 2.3761, - "step": 542190 - }, - { - "epoch": 0.95, - "learning_rate": 2.7234171674508313e-06, - "loss": 2.3591, - "step": 542200 - }, - { - "epoch": 0.95, - "learning_rate": 2.7225452275240047e-06, - "loss": 2.2767, - "step": 542210 - }, - { - "epoch": 0.95, - "learning_rate": 2.721673287597178e-06, - "loss": 2.2714, - "step": 542220 - }, - { - "epoch": 0.95, - "learning_rate": 2.720801347670351e-06, - "loss": 2.1954, - "step": 542230 - }, - { - "epoch": 0.95, - "learning_rate": 2.7199294077435243e-06, - "loss": 2.2514, - "step": 542240 - }, - { - "epoch": 0.95, - "learning_rate": 2.7190574678166972e-06, - "loss": 2.2663, - "step": 542250 - }, - { - "epoch": 0.95, - "learning_rate": 2.7181855278898706e-06, - "loss": 2.2491, - "step": 542260 - }, - { - "epoch": 0.95, - "learning_rate": 2.7173135879630435e-06, - "loss": 2.3274, - "step": 542270 - }, - { - "epoch": 0.95, - "learning_rate": 2.7164416480362173e-06, - "loss": 2.1346, - "step": 542280 - }, - { - "epoch": 0.95, - "learning_rate": 2.71556970810939e-06, - "loss": 2.2683, - "step": 542290 - }, - { - "epoch": 0.95, - "learning_rate": 2.7146977681825635e-06, - "loss": 2.3552, - "step": 542300 - }, - { - "epoch": 0.95, - "learning_rate": 2.7138258282557365e-06, - "loss": 2.2762, - "step": 542310 - }, - { - "epoch": 0.95, - "learning_rate": 2.71295388832891e-06, - "loss": 2.3246, - "step": 542320 - }, - { - "epoch": 0.95, - "learning_rate": 2.7120819484020827e-06, - "loss": 2.328, - "step": 542330 - }, - { - "epoch": 0.95, - "learning_rate": 2.711210008475256e-06, - "loss": 2.3488, - "step": 542340 - }, - { - "epoch": 0.95, - "learning_rate": 2.7103380685484294e-06, - "loss": 2.1645, - "step": 542350 - }, - { - "epoch": 0.95, - "learning_rate": 2.7094661286216028e-06, - "loss": 2.2161, - "step": 542360 - }, - { - "epoch": 0.95, - "learning_rate": 2.7085941886947757e-06, - "loss": 2.3565, - "step": 542370 - }, - { - "epoch": 0.95, - "learning_rate": 2.707722248767949e-06, - "loss": 2.314, - "step": 542380 - }, - { - "epoch": 0.95, - "learning_rate": 2.706850308841122e-06, - "loss": 2.203, - "step": 542390 - }, - { - "epoch": 0.95, - "learning_rate": 2.7059783689142953e-06, - "loss": 2.27, - "step": 542400 - }, - { - "epoch": 0.95, - "learning_rate": 2.7051064289874686e-06, - "loss": 2.0449, - "step": 542410 - }, - { - "epoch": 0.95, - "learning_rate": 2.704234489060642e-06, - "loss": 2.2567, - "step": 542420 - }, - { - "epoch": 0.95, - "learning_rate": 2.703362549133815e-06, - "loss": 2.192, - "step": 542430 - }, - { - "epoch": 0.95, - "learning_rate": 2.7024906092069883e-06, - "loss": 2.2177, - "step": 542440 - }, - { - "epoch": 0.95, - "learning_rate": 2.701618669280161e-06, - "loss": 2.2, - "step": 542450 - }, - { - "epoch": 0.95, - "learning_rate": 2.7007467293533345e-06, - "loss": 2.2507, - "step": 542460 - }, - { - "epoch": 0.95, - "learning_rate": 2.6998747894265075e-06, - "loss": 2.3072, - "step": 542470 - }, - { - "epoch": 0.95, - "learning_rate": 2.6990028494996812e-06, - "loss": 2.2949, - "step": 542480 - }, - { - "epoch": 0.95, - "learning_rate": 2.698130909572854e-06, - "loss": 2.3034, - "step": 542490 - }, - { - "epoch": 0.95, - "learning_rate": 2.6972589696460275e-06, - "loss": 2.3105, - "step": 542500 - }, - { - "epoch": 0.95, - "learning_rate": 2.6963870297192004e-06, - "loss": 2.1524, - "step": 542510 - }, - { - "epoch": 0.95, - "learning_rate": 2.6955150897923738e-06, - "loss": 2.2648, - "step": 542520 - }, - { - "epoch": 0.95, - "learning_rate": 2.6946431498655467e-06, - "loss": 2.1524, - "step": 542530 - }, - { - "epoch": 0.95, - "learning_rate": 2.69377120993872e-06, - "loss": 2.3211, - "step": 542540 - }, - { - "epoch": 0.95, - "learning_rate": 2.6928992700118934e-06, - "loss": 2.2292, - "step": 542550 - }, - { - "epoch": 0.95, - "learning_rate": 2.6920273300850667e-06, - "loss": 2.1146, - "step": 542560 - }, - { - "epoch": 0.95, - "learning_rate": 2.6911553901582396e-06, - "loss": 2.2195, - "step": 542570 - }, - { - "epoch": 0.95, - "learning_rate": 2.690283450231413e-06, - "loss": 2.3257, - "step": 542580 - }, - { - "epoch": 0.95, - "learning_rate": 2.689411510304586e-06, - "loss": 2.19, - "step": 542590 - }, - { - "epoch": 0.95, - "learning_rate": 2.6885395703777593e-06, - "loss": 2.3293, - "step": 542600 - }, - { - "epoch": 0.95, - "learning_rate": 2.6876676304509326e-06, - "loss": 2.2646, - "step": 542610 - }, - { - "epoch": 0.95, - "learning_rate": 2.686795690524106e-06, - "loss": 2.3193, - "step": 542620 - }, - { - "epoch": 0.95, - "learning_rate": 2.685923750597279e-06, - "loss": 2.2391, - "step": 542630 - }, - { - "epoch": 0.95, - "learning_rate": 2.6850518106704522e-06, - "loss": 2.2322, - "step": 542640 - }, - { - "epoch": 0.95, - "learning_rate": 2.684179870743625e-06, - "loss": 2.2417, - "step": 542650 - }, - { - "epoch": 0.95, - "learning_rate": 2.6833079308167985e-06, - "loss": 2.1089, - "step": 542660 - }, - { - "epoch": 0.95, - "learning_rate": 2.6824359908899714e-06, - "loss": 2.1256, - "step": 542670 - }, - { - "epoch": 0.95, - "learning_rate": 2.681564050963145e-06, - "loss": 2.2517, - "step": 542680 - }, - { - "epoch": 0.95, - "learning_rate": 2.680692111036318e-06, - "loss": 2.1697, - "step": 542690 - }, - { - "epoch": 0.95, - "learning_rate": 2.6798201711094915e-06, - "loss": 2.338, - "step": 542700 - }, - { - "epoch": 0.95, - "learning_rate": 2.6789482311826644e-06, - "loss": 2.3024, - "step": 542710 - }, - { - "epoch": 0.95, - "learning_rate": 2.6780762912558377e-06, - "loss": 2.2246, - "step": 542720 - }, - { - "epoch": 0.95, - "learning_rate": 2.6772043513290107e-06, - "loss": 2.313, - "step": 542730 - }, - { - "epoch": 0.95, - "learning_rate": 2.676332411402184e-06, - "loss": 2.1964, - "step": 542740 - }, - { - "epoch": 0.95, - "learning_rate": 2.6754604714753573e-06, - "loss": 2.2752, - "step": 542750 - }, - { - "epoch": 0.95, - "learning_rate": 2.6745885315485307e-06, - "loss": 2.2693, - "step": 542760 - }, - { - "epoch": 0.95, - "learning_rate": 2.6737165916217036e-06, - "loss": 2.1416, - "step": 542770 - }, - { - "epoch": 0.95, - "learning_rate": 2.672844651694877e-06, - "loss": 2.2308, - "step": 542780 - }, - { - "epoch": 0.95, - "learning_rate": 2.67197271176805e-06, - "loss": 2.1081, - "step": 542790 - }, - { - "epoch": 0.95, - "learning_rate": 2.6711007718412232e-06, - "loss": 2.1882, - "step": 542800 - }, - { - "epoch": 0.95, - "learning_rate": 2.6702288319143966e-06, - "loss": 2.2281, - "step": 542810 - }, - { - "epoch": 0.95, - "learning_rate": 2.66935689198757e-06, - "loss": 2.1907, - "step": 542820 - }, - { - "epoch": 0.95, - "learning_rate": 2.668484952060743e-06, - "loss": 2.2475, - "step": 542830 - }, - { - "epoch": 0.95, - "learning_rate": 2.667613012133916e-06, - "loss": 2.2082, - "step": 542840 - }, - { - "epoch": 0.95, - "learning_rate": 2.666741072207089e-06, - "loss": 2.31, - "step": 542850 - }, - { - "epoch": 0.95, - "learning_rate": 2.6658691322802625e-06, - "loss": 2.2796, - "step": 542860 - }, - { - "epoch": 0.95, - "learning_rate": 2.6649971923534354e-06, - "loss": 2.3255, - "step": 542870 - }, - { - "epoch": 0.95, - "learning_rate": 2.664125252426609e-06, - "loss": 2.2165, - "step": 542880 - }, - { - "epoch": 0.95, - "learning_rate": 2.663253312499782e-06, - "loss": 2.2226, - "step": 542890 - }, - { - "epoch": 0.95, - "learning_rate": 2.6623813725729554e-06, - "loss": 2.353, - "step": 542900 - }, - { - "epoch": 0.95, - "learning_rate": 2.6615094326461283e-06, - "loss": 2.2204, - "step": 542910 - }, - { - "epoch": 0.95, - "learning_rate": 2.6606374927193017e-06, - "loss": 2.2835, - "step": 542920 - }, - { - "epoch": 0.95, - "learning_rate": 2.6597655527924746e-06, - "loss": 2.282, - "step": 542930 - }, - { - "epoch": 0.95, - "learning_rate": 2.6588936128656484e-06, - "loss": 2.1742, - "step": 542940 - }, - { - "epoch": 0.95, - "learning_rate": 2.6580216729388213e-06, - "loss": 2.2272, - "step": 542950 - }, - { - "epoch": 0.95, - "learning_rate": 2.6571497330119947e-06, - "loss": 2.2137, - "step": 542960 - }, - { - "epoch": 0.95, - "learning_rate": 2.6562777930851676e-06, - "loss": 2.3083, - "step": 542970 - }, - { - "epoch": 0.95, - "learning_rate": 2.655405853158341e-06, - "loss": 2.163, - "step": 542980 - }, - { - "epoch": 0.95, - "learning_rate": 2.654533913231514e-06, - "loss": 2.2642, - "step": 542990 - }, - { - "epoch": 0.95, - "learning_rate": 2.653661973304687e-06, - "loss": 2.2568, - "step": 543000 - }, - { - "epoch": 0.95, - "learning_rate": 2.6527900333778605e-06, - "loss": 2.2644, - "step": 543010 - }, - { - "epoch": 0.95, - "learning_rate": 2.651918093451034e-06, - "loss": 2.1923, - "step": 543020 - }, - { - "epoch": 0.95, - "learning_rate": 2.651046153524207e-06, - "loss": 2.2127, - "step": 543030 - }, - { - "epoch": 0.95, - "learning_rate": 2.65017421359738e-06, - "loss": 2.2218, - "step": 543040 - }, - { - "epoch": 0.95, - "learning_rate": 2.649302273670553e-06, - "loss": 2.0549, - "step": 543050 - }, - { - "epoch": 0.95, - "learning_rate": 2.6484303337437264e-06, - "loss": 2.3251, - "step": 543060 - }, - { - "epoch": 0.95, - "learning_rate": 2.6475583938168998e-06, - "loss": 2.2968, - "step": 543070 - }, - { - "epoch": 0.95, - "learning_rate": 2.646686453890073e-06, - "loss": 2.2509, - "step": 543080 - }, - { - "epoch": 0.95, - "learning_rate": 2.645814513963246e-06, - "loss": 2.3343, - "step": 543090 - }, - { - "epoch": 0.95, - "learning_rate": 2.6449425740364194e-06, - "loss": 2.2422, - "step": 543100 - }, - { - "epoch": 0.95, - "learning_rate": 2.6440706341095923e-06, - "loss": 2.2182, - "step": 543110 - }, - { - "epoch": 0.95, - "learning_rate": 2.6431986941827657e-06, - "loss": 2.3742, - "step": 543120 - }, - { - "epoch": 0.95, - "learning_rate": 2.6423267542559386e-06, - "loss": 2.3237, - "step": 543130 - }, - { - "epoch": 0.95, - "learning_rate": 2.6414548143291123e-06, - "loss": 2.2463, - "step": 543140 - }, - { - "epoch": 0.95, - "learning_rate": 2.6405828744022853e-06, - "loss": 2.2592, - "step": 543150 - }, - { - "epoch": 0.95, - "learning_rate": 2.6397109344754586e-06, - "loss": 2.3101, - "step": 543160 - }, - { - "epoch": 0.95, - "learning_rate": 2.6388389945486315e-06, - "loss": 2.2334, - "step": 543170 - }, - { - "epoch": 0.95, - "learning_rate": 2.637967054621805e-06, - "loss": 2.2268, - "step": 543180 - }, - { - "epoch": 0.95, - "learning_rate": 2.637095114694978e-06, - "loss": 2.1403, - "step": 543190 - }, - { - "epoch": 0.95, - "learning_rate": 2.636223174768151e-06, - "loss": 2.2605, - "step": 543200 - }, - { - "epoch": 0.95, - "learning_rate": 2.6353512348413245e-06, - "loss": 2.2981, - "step": 543210 - }, - { - "epoch": 0.95, - "learning_rate": 2.634479294914498e-06, - "loss": 2.3147, - "step": 543220 - }, - { - "epoch": 0.95, - "learning_rate": 2.6336073549876708e-06, - "loss": 2.3118, - "step": 543230 - }, - { - "epoch": 0.95, - "learning_rate": 2.632735415060844e-06, - "loss": 2.1757, - "step": 543240 - }, - { - "epoch": 0.95, - "learning_rate": 2.631863475134017e-06, - "loss": 2.3479, - "step": 543250 - }, - { - "epoch": 0.95, - "learning_rate": 2.6309915352071904e-06, - "loss": 2.2171, - "step": 543260 - }, - { - "epoch": 0.95, - "learning_rate": 2.6301195952803637e-06, - "loss": 2.3316, - "step": 543270 - }, - { - "epoch": 0.95, - "learning_rate": 2.629247655353537e-06, - "loss": 2.2638, - "step": 543280 - }, - { - "epoch": 0.95, - "learning_rate": 2.62837571542671e-06, - "loss": 2.1645, - "step": 543290 - }, - { - "epoch": 0.95, - "learning_rate": 2.6275037754998833e-06, - "loss": 2.2728, - "step": 543300 - }, - { - "epoch": 0.95, - "learning_rate": 2.6266318355730563e-06, - "loss": 2.2189, - "step": 543310 - }, - { - "epoch": 0.95, - "learning_rate": 2.6257598956462296e-06, - "loss": 2.1662, - "step": 543320 - }, - { - "epoch": 0.95, - "learning_rate": 2.624887955719403e-06, - "loss": 2.3045, - "step": 543330 - }, - { - "epoch": 0.95, - "learning_rate": 2.6240160157925763e-06, - "loss": 2.0843, - "step": 543340 - }, - { - "epoch": 0.95, - "learning_rate": 2.6231440758657492e-06, - "loss": 2.2851, - "step": 543350 - }, - { - "epoch": 0.95, - "learning_rate": 2.6222721359389226e-06, - "loss": 2.1663, - "step": 543360 - }, - { - "epoch": 0.95, - "learning_rate": 2.6214001960120955e-06, - "loss": 2.2716, - "step": 543370 - }, - { - "epoch": 0.95, - "learning_rate": 2.620528256085269e-06, - "loss": 2.1842, - "step": 543380 - }, - { - "epoch": 0.95, - "learning_rate": 2.6196563161584418e-06, - "loss": 2.2985, - "step": 543390 - }, - { - "epoch": 0.95, - "learning_rate": 2.618784376231615e-06, - "loss": 2.2749, - "step": 543400 - }, - { - "epoch": 0.95, - "learning_rate": 2.6179124363047885e-06, - "loss": 2.3029, - "step": 543410 - }, - { - "epoch": 0.95, - "learning_rate": 2.617040496377962e-06, - "loss": 2.2788, - "step": 543420 - }, - { - "epoch": 0.95, - "learning_rate": 2.6161685564511347e-06, - "loss": 2.3096, - "step": 543430 - }, - { - "epoch": 0.95, - "learning_rate": 2.615296616524308e-06, - "loss": 2.1936, - "step": 543440 - }, - { - "epoch": 0.95, - "learning_rate": 2.614424676597481e-06, - "loss": 2.2127, - "step": 543450 - }, - { - "epoch": 0.95, - "learning_rate": 2.6135527366706543e-06, - "loss": 2.2605, - "step": 543460 - }, - { - "epoch": 0.95, - "learning_rate": 2.6126807967438277e-06, - "loss": 2.2964, - "step": 543470 - }, - { - "epoch": 0.95, - "learning_rate": 2.611808856817001e-06, - "loss": 2.3369, - "step": 543480 - }, - { - "epoch": 0.95, - "learning_rate": 2.610936916890174e-06, - "loss": 2.155, - "step": 543490 - }, - { - "epoch": 0.95, - "learning_rate": 2.6100649769633473e-06, - "loss": 2.3023, - "step": 543500 - }, - { - "epoch": 0.95, - "learning_rate": 2.6091930370365202e-06, - "loss": 2.2857, - "step": 543510 - }, - { - "epoch": 0.95, - "learning_rate": 2.6083210971096936e-06, - "loss": 2.19, - "step": 543520 - }, - { - "epoch": 0.95, - "learning_rate": 2.607449157182867e-06, - "loss": 2.3202, - "step": 543530 - }, - { - "epoch": 0.95, - "learning_rate": 2.6065772172560403e-06, - "loss": 2.1464, - "step": 543540 - }, - { - "epoch": 0.95, - "learning_rate": 2.605705277329213e-06, - "loss": 2.0498, - "step": 543550 - }, - { - "epoch": 0.95, - "learning_rate": 2.6048333374023865e-06, - "loss": 2.3068, - "step": 543560 - }, - { - "epoch": 0.95, - "learning_rate": 2.6039613974755595e-06, - "loss": 2.3308, - "step": 543570 - }, - { - "epoch": 0.95, - "learning_rate": 2.603089457548733e-06, - "loss": 2.2498, - "step": 543580 - }, - { - "epoch": 0.95, - "learning_rate": 2.602217517621906e-06, - "loss": 2.2576, - "step": 543590 - }, - { - "epoch": 0.95, - "learning_rate": 2.601345577695079e-06, - "loss": 2.1605, - "step": 543600 - }, - { - "epoch": 0.95, - "learning_rate": 2.6004736377682524e-06, - "loss": 2.2711, - "step": 543610 - }, - { - "epoch": 0.95, - "learning_rate": 2.5996016978414258e-06, - "loss": 2.2722, - "step": 543620 - }, - { - "epoch": 0.95, - "learning_rate": 2.5987297579145987e-06, - "loss": 2.2055, - "step": 543630 - }, - { - "epoch": 0.95, - "learning_rate": 2.597857817987772e-06, - "loss": 2.1815, - "step": 543640 - }, - { - "epoch": 0.95, - "learning_rate": 2.596985878060945e-06, - "loss": 2.3642, - "step": 543650 - }, - { - "epoch": 0.95, - "learning_rate": 2.5961139381341183e-06, - "loss": 2.2899, - "step": 543660 - }, - { - "epoch": 0.95, - "learning_rate": 2.5952419982072917e-06, - "loss": 2.1949, - "step": 543670 - }, - { - "epoch": 0.95, - "learning_rate": 2.594370058280465e-06, - "loss": 2.269, - "step": 543680 - }, - { - "epoch": 0.95, - "learning_rate": 2.593498118353638e-06, - "loss": 2.2939, - "step": 543690 - }, - { - "epoch": 0.95, - "learning_rate": 2.5926261784268113e-06, - "loss": 2.3265, - "step": 543700 - }, - { - "epoch": 0.95, - "learning_rate": 2.591754238499984e-06, - "loss": 2.28, - "step": 543710 - }, - { - "epoch": 0.95, - "learning_rate": 2.5908822985731575e-06, - "loss": 2.119, - "step": 543720 - }, - { - "epoch": 0.95, - "learning_rate": 2.590010358646331e-06, - "loss": 2.4113, - "step": 543730 - }, - { - "epoch": 0.95, - "learning_rate": 2.5891384187195042e-06, - "loss": 2.2507, - "step": 543740 - }, - { - "epoch": 0.95, - "learning_rate": 2.588266478792677e-06, - "loss": 2.1589, - "step": 543750 - }, - { - "epoch": 0.95, - "learning_rate": 2.5873945388658505e-06, - "loss": 2.2475, - "step": 543760 - }, - { - "epoch": 0.95, - "learning_rate": 2.5865225989390234e-06, - "loss": 2.2911, - "step": 543770 - }, - { - "epoch": 0.95, - "learning_rate": 2.5856506590121968e-06, - "loss": 2.2108, - "step": 543780 - }, - { - "epoch": 0.95, - "learning_rate": 2.58477871908537e-06, - "loss": 2.346, - "step": 543790 - }, - { - "epoch": 0.95, - "learning_rate": 2.583906779158543e-06, - "loss": 2.1875, - "step": 543800 - }, - { - "epoch": 0.95, - "learning_rate": 2.5830348392317164e-06, - "loss": 2.2479, - "step": 543810 - }, - { - "epoch": 0.95, - "learning_rate": 2.5821628993048897e-06, - "loss": 2.3395, - "step": 543820 - }, - { - "epoch": 0.95, - "learning_rate": 2.5812909593780627e-06, - "loss": 2.2599, - "step": 543830 - }, - { - "epoch": 0.95, - "learning_rate": 2.580419019451236e-06, - "loss": 2.2114, - "step": 543840 - }, - { - "epoch": 0.95, - "learning_rate": 2.5795470795244094e-06, - "loss": 2.1499, - "step": 543850 - }, - { - "epoch": 0.95, - "learning_rate": 2.5786751395975823e-06, - "loss": 2.2229, - "step": 543860 - }, - { - "epoch": 0.95, - "learning_rate": 2.5778031996707556e-06, - "loss": 2.269, - "step": 543870 - }, - { - "epoch": 0.95, - "learning_rate": 2.576931259743929e-06, - "loss": 2.1191, - "step": 543880 - }, - { - "epoch": 0.95, - "learning_rate": 2.576059319817102e-06, - "loss": 2.3093, - "step": 543890 - }, - { - "epoch": 0.95, - "learning_rate": 2.5751873798902752e-06, - "loss": 2.3097, - "step": 543900 - }, - { - "epoch": 0.95, - "learning_rate": 2.574315439963448e-06, - "loss": 2.2516, - "step": 543910 - }, - { - "epoch": 0.95, - "learning_rate": 2.5734435000366215e-06, - "loss": 2.2993, - "step": 543920 - }, - { - "epoch": 0.95, - "learning_rate": 2.572571560109795e-06, - "loss": 2.235, - "step": 543930 - }, - { - "epoch": 0.95, - "learning_rate": 2.571699620182968e-06, - "loss": 2.1701, - "step": 543940 - }, - { - "epoch": 0.95, - "learning_rate": 2.570827680256141e-06, - "loss": 2.297, - "step": 543950 - }, - { - "epoch": 0.95, - "learning_rate": 2.5699557403293145e-06, - "loss": 2.2669, - "step": 543960 - }, - { - "epoch": 0.95, - "learning_rate": 2.5690838004024874e-06, - "loss": 2.1571, - "step": 543970 - }, - { - "epoch": 0.95, - "learning_rate": 2.5682118604756607e-06, - "loss": 2.2778, - "step": 543980 - }, - { - "epoch": 0.95, - "learning_rate": 2.567339920548834e-06, - "loss": 2.3698, - "step": 543990 - }, - { - "epoch": 0.95, - "learning_rate": 2.566467980622007e-06, - "loss": 2.1493, - "step": 544000 - }, - { - "epoch": 0.95, - "learning_rate": 2.5655960406951804e-06, - "loss": 2.2864, - "step": 544010 - }, - { - "epoch": 0.95, - "learning_rate": 2.5647241007683537e-06, - "loss": 2.2517, - "step": 544020 - }, - { - "epoch": 0.95, - "learning_rate": 2.5638521608415266e-06, - "loss": 2.3508, - "step": 544030 - }, - { - "epoch": 0.95, - "learning_rate": 2.5629802209147e-06, - "loss": 2.1819, - "step": 544040 - }, - { - "epoch": 0.95, - "learning_rate": 2.5621082809878733e-06, - "loss": 2.1974, - "step": 544050 - }, - { - "epoch": 0.95, - "learning_rate": 2.5612363410610462e-06, - "loss": 2.2557, - "step": 544060 - }, - { - "epoch": 0.95, - "learning_rate": 2.5603644011342196e-06, - "loss": 2.1219, - "step": 544070 - }, - { - "epoch": 0.95, - "learning_rate": 2.559492461207393e-06, - "loss": 2.216, - "step": 544080 - }, - { - "epoch": 0.95, - "learning_rate": 2.558620521280566e-06, - "loss": 2.2217, - "step": 544090 - }, - { - "epoch": 0.95, - "learning_rate": 2.557748581353739e-06, - "loss": 2.2263, - "step": 544100 - }, - { - "epoch": 0.95, - "learning_rate": 2.5568766414269125e-06, - "loss": 2.2696, - "step": 544110 - }, - { - "epoch": 0.95, - "learning_rate": 2.5560047015000855e-06, - "loss": 2.2584, - "step": 544120 - }, - { - "epoch": 0.95, - "learning_rate": 2.555132761573259e-06, - "loss": 2.281, - "step": 544130 - }, - { - "epoch": 0.95, - "learning_rate": 2.554260821646432e-06, - "loss": 2.3413, - "step": 544140 - }, - { - "epoch": 0.95, - "learning_rate": 2.553388881719605e-06, - "loss": 2.2642, - "step": 544150 - }, - { - "epoch": 0.95, - "learning_rate": 2.5525169417927784e-06, - "loss": 2.3207, - "step": 544160 - }, - { - "epoch": 0.95, - "learning_rate": 2.5516450018659518e-06, - "loss": 2.2741, - "step": 544170 - }, - { - "epoch": 0.95, - "learning_rate": 2.5507730619391247e-06, - "loss": 2.272, - "step": 544180 - }, - { - "epoch": 0.95, - "learning_rate": 2.549901122012298e-06, - "loss": 2.2075, - "step": 544190 - }, - { - "epoch": 0.95, - "learning_rate": 2.549029182085471e-06, - "loss": 2.3438, - "step": 544200 - }, - { - "epoch": 0.95, - "learning_rate": 2.5481572421586443e-06, - "loss": 2.2739, - "step": 544210 - }, - { - "epoch": 0.95, - "learning_rate": 2.5472853022318177e-06, - "loss": 2.326, - "step": 544220 - }, - { - "epoch": 0.95, - "learning_rate": 2.5464133623049906e-06, - "loss": 2.2058, - "step": 544230 - }, - { - "epoch": 0.95, - "learning_rate": 2.545541422378164e-06, - "loss": 2.2055, - "step": 544240 - }, - { - "epoch": 0.95, - "learning_rate": 2.5446694824513373e-06, - "loss": 2.2434, - "step": 544250 - }, - { - "epoch": 0.95, - "learning_rate": 2.54379754252451e-06, - "loss": 2.1337, - "step": 544260 - }, - { - "epoch": 0.95, - "learning_rate": 2.5429256025976835e-06, - "loss": 2.2736, - "step": 544270 - }, - { - "epoch": 0.95, - "learning_rate": 2.542053662670857e-06, - "loss": 2.2926, - "step": 544280 - }, - { - "epoch": 0.95, - "learning_rate": 2.54118172274403e-06, - "loss": 2.2843, - "step": 544290 - }, - { - "epoch": 0.95, - "learning_rate": 2.540309782817203e-06, - "loss": 2.3947, - "step": 544300 - }, - { - "epoch": 0.95, - "learning_rate": 2.5394378428903765e-06, - "loss": 2.2809, - "step": 544310 - }, - { - "epoch": 0.95, - "learning_rate": 2.5385659029635494e-06, - "loss": 2.2993, - "step": 544320 - }, - { - "epoch": 0.95, - "learning_rate": 2.5376939630367228e-06, - "loss": 2.2124, - "step": 544330 - }, - { - "epoch": 0.95, - "learning_rate": 2.536822023109896e-06, - "loss": 2.4059, - "step": 544340 - }, - { - "epoch": 0.95, - "learning_rate": 2.535950083183069e-06, - "loss": 2.3454, - "step": 544350 - }, - { - "epoch": 0.95, - "learning_rate": 2.5350781432562424e-06, - "loss": 2.2322, - "step": 544360 - }, - { - "epoch": 0.95, - "learning_rate": 2.5342062033294157e-06, - "loss": 2.2385, - "step": 544370 - }, - { - "epoch": 0.95, - "learning_rate": 2.5333342634025887e-06, - "loss": 2.2068, - "step": 544380 - }, - { - "epoch": 0.95, - "learning_rate": 2.532462323475762e-06, - "loss": 2.2872, - "step": 544390 - }, - { - "epoch": 0.95, - "learning_rate": 2.531590383548935e-06, - "loss": 2.2398, - "step": 544400 - }, - { - "epoch": 0.95, - "learning_rate": 2.5307184436221083e-06, - "loss": 2.1245, - "step": 544410 - }, - { - "epoch": 0.95, - "learning_rate": 2.5298465036952816e-06, - "loss": 2.3552, - "step": 544420 - }, - { - "epoch": 0.95, - "learning_rate": 2.528974563768455e-06, - "loss": 2.2119, - "step": 544430 - }, - { - "epoch": 0.95, - "learning_rate": 2.528102623841628e-06, - "loss": 2.3118, - "step": 544440 - }, - { - "epoch": 0.95, - "learning_rate": 2.5272306839148012e-06, - "loss": 2.2709, - "step": 544450 - }, - { - "epoch": 0.95, - "learning_rate": 2.526358743987974e-06, - "loss": 2.2983, - "step": 544460 - }, - { - "epoch": 0.95, - "learning_rate": 2.5254868040611475e-06, - "loss": 2.2849, - "step": 544470 - }, - { - "epoch": 0.95, - "learning_rate": 2.524614864134321e-06, - "loss": 2.1921, - "step": 544480 - }, - { - "epoch": 0.95, - "learning_rate": 2.5237429242074938e-06, - "loss": 2.2888, - "step": 544490 - }, - { - "epoch": 0.95, - "learning_rate": 2.522870984280667e-06, - "loss": 2.2396, - "step": 544500 - }, - { - "epoch": 0.95, - "learning_rate": 2.5219990443538405e-06, - "loss": 2.1193, - "step": 544510 - }, - { - "epoch": 0.95, - "learning_rate": 2.5211271044270134e-06, - "loss": 2.3253, - "step": 544520 - }, - { - "epoch": 0.95, - "learning_rate": 2.5202551645001867e-06, - "loss": 2.1952, - "step": 544530 - }, - { - "epoch": 0.95, - "learning_rate": 2.51938322457336e-06, - "loss": 2.2469, - "step": 544540 - }, - { - "epoch": 0.95, - "learning_rate": 2.518511284646533e-06, - "loss": 2.2822, - "step": 544550 - }, - { - "epoch": 0.95, - "learning_rate": 2.5176393447197064e-06, - "loss": 2.2287, - "step": 544560 - }, - { - "epoch": 0.95, - "learning_rate": 2.5167674047928797e-06, - "loss": 2.285, - "step": 544570 - }, - { - "epoch": 0.95, - "learning_rate": 2.5158954648660526e-06, - "loss": 2.4004, - "step": 544580 - }, - { - "epoch": 0.95, - "learning_rate": 2.515023524939226e-06, - "loss": 2.27, - "step": 544590 - }, - { - "epoch": 0.95, - "learning_rate": 2.514151585012399e-06, - "loss": 2.2398, - "step": 544600 - }, - { - "epoch": 0.95, - "learning_rate": 2.5132796450855722e-06, - "loss": 2.2618, - "step": 544610 - }, - { - "epoch": 0.95, - "learning_rate": 2.5124077051587456e-06, - "loss": 2.2678, - "step": 544620 - }, - { - "epoch": 0.95, - "learning_rate": 2.511535765231919e-06, - "loss": 2.2477, - "step": 544630 - }, - { - "epoch": 0.95, - "learning_rate": 2.510663825305092e-06, - "loss": 2.2156, - "step": 544640 - }, - { - "epoch": 0.95, - "learning_rate": 2.509791885378265e-06, - "loss": 2.2105, - "step": 544650 - }, - { - "epoch": 0.95, - "learning_rate": 2.508919945451438e-06, - "loss": 2.2446, - "step": 544660 - }, - { - "epoch": 0.95, - "learning_rate": 2.5080480055246115e-06, - "loss": 2.2738, - "step": 544670 - }, - { - "epoch": 0.95, - "learning_rate": 2.507176065597785e-06, - "loss": 2.2045, - "step": 544680 - }, - { - "epoch": 0.95, - "learning_rate": 2.506304125670958e-06, - "loss": 2.2266, - "step": 544690 - }, - { - "epoch": 0.95, - "learning_rate": 2.505432185744131e-06, - "loss": 2.1725, - "step": 544700 - }, - { - "epoch": 0.95, - "learning_rate": 2.5045602458173044e-06, - "loss": 2.2779, - "step": 544710 - }, - { - "epoch": 0.95, - "learning_rate": 2.5036883058904774e-06, - "loss": 2.3916, - "step": 544720 - }, - { - "epoch": 0.95, - "learning_rate": 2.5028163659636507e-06, - "loss": 2.1494, - "step": 544730 - }, - { - "epoch": 0.95, - "learning_rate": 2.501944426036824e-06, - "loss": 2.1204, - "step": 544740 - }, - { - "epoch": 0.95, - "learning_rate": 2.501072486109997e-06, - "loss": 2.2106, - "step": 544750 - }, - { - "epoch": 0.95, - "learning_rate": 2.5002005461831703e-06, - "loss": 2.2678, - "step": 544760 - }, - { - "epoch": 0.95, - "learning_rate": 2.4993286062563437e-06, - "loss": 2.3199, - "step": 544770 - }, - { - "epoch": 0.95, - "learning_rate": 2.4984566663295166e-06, - "loss": 2.1956, - "step": 544780 - }, - { - "epoch": 0.95, - "learning_rate": 2.49758472640269e-06, - "loss": 2.153, - "step": 544790 - }, - { - "epoch": 0.95, - "learning_rate": 2.496712786475863e-06, - "loss": 2.2359, - "step": 544800 - }, - { - "epoch": 0.95, - "learning_rate": 2.495840846549036e-06, - "loss": 2.2833, - "step": 544810 - }, - { - "epoch": 0.95, - "learning_rate": 2.4949689066222096e-06, - "loss": 2.2076, - "step": 544820 - }, - { - "epoch": 0.95, - "learning_rate": 2.494096966695383e-06, - "loss": 2.0867, - "step": 544830 - }, - { - "epoch": 0.95, - "learning_rate": 2.493225026768556e-06, - "loss": 2.2388, - "step": 544840 - }, - { - "epoch": 0.95, - "learning_rate": 2.492353086841729e-06, - "loss": 2.3474, - "step": 544850 - }, - { - "epoch": 0.95, - "learning_rate": 2.491481146914902e-06, - "loss": 2.2093, - "step": 544860 - }, - { - "epoch": 0.95, - "learning_rate": 2.4906092069880754e-06, - "loss": 2.2256, - "step": 544870 - }, - { - "epoch": 0.95, - "learning_rate": 2.4897372670612488e-06, - "loss": 2.2515, - "step": 544880 - }, - { - "epoch": 0.95, - "learning_rate": 2.488865327134422e-06, - "loss": 2.2327, - "step": 544890 - }, - { - "epoch": 0.95, - "learning_rate": 2.487993387207595e-06, - "loss": 2.1421, - "step": 544900 - }, - { - "epoch": 0.95, - "learning_rate": 2.4871214472807684e-06, - "loss": 2.1358, - "step": 544910 - }, - { - "epoch": 0.95, - "learning_rate": 2.4862495073539413e-06, - "loss": 2.2707, - "step": 544920 - }, - { - "epoch": 0.95, - "learning_rate": 2.4853775674271147e-06, - "loss": 2.3101, - "step": 544930 - }, - { - "epoch": 0.95, - "learning_rate": 2.484505627500288e-06, - "loss": 2.3213, - "step": 544940 - }, - { - "epoch": 0.95, - "learning_rate": 2.4836336875734614e-06, - "loss": 2.2114, - "step": 544950 - }, - { - "epoch": 0.95, - "learning_rate": 2.4827617476466343e-06, - "loss": 2.2298, - "step": 544960 - }, - { - "epoch": 0.95, - "learning_rate": 2.4818898077198076e-06, - "loss": 2.1848, - "step": 544970 - }, - { - "epoch": 0.95, - "learning_rate": 2.4810178677929806e-06, - "loss": 2.2756, - "step": 544980 - }, - { - "epoch": 0.95, - "learning_rate": 2.480145927866154e-06, - "loss": 2.2417, - "step": 544990 - }, - { - "epoch": 0.95, - "learning_rate": 2.479273987939327e-06, - "loss": 2.2328, - "step": 545000 + "learning_rate": 4.9982152482054324e-05, + "loss": 3.2655, + "step": 100 }, { - "epoch": 0.95, - "learning_rate": 2.4784020480125e-06, - "loss": 2.312, - "step": 545010 - }, - { - "epoch": 0.95, - "learning_rate": 2.4775301080856735e-06, - "loss": 2.3354, - "step": 545020 + "epoch": 0.0, + "learning_rate": 4.9964304964108645e-05, + "loss": 3.2142, + "step": 200 }, { - "epoch": 0.95, - "learning_rate": 2.476658168158847e-06, - "loss": 2.1976, - "step": 545030 + "epoch": 0.0, + "learning_rate": 4.9946457446162966e-05, + "loss": 3.1805, + "step": 300 }, { - "epoch": 0.95, - "learning_rate": 2.4757862282320198e-06, - "loss": 2.2623, - "step": 545040 + "epoch": 0.0, + "learning_rate": 4.992860992821729e-05, + "loss": 3.1781, + "step": 400 }, { - "epoch": 0.95, - "learning_rate": 2.474914288305193e-06, - "loss": 2.1757, - "step": 545050 + "epoch": 0.0, + "learning_rate": 4.991076241027161e-05, + "loss": 3.1664, + "step": 500 }, { - "epoch": 0.95, - "learning_rate": 2.474042348378366e-06, - "loss": 2.263, - "step": 545060 + "epoch": 0.0, + "learning_rate": 4.989291489232592e-05, + "loss": 3.158, + "step": 600 }, { - "epoch": 0.95, - "learning_rate": 2.4731704084515394e-06, - "loss": 2.1892, - "step": 545070 + "epoch": 0.0, + "learning_rate": 4.9875067374380244e-05, + "loss": 3.1607, + "step": 700 }, { - "epoch": 0.95, - "learning_rate": 2.4722984685247127e-06, - "loss": 2.3593, - "step": 545080 + "epoch": 0.0, + "learning_rate": 4.9857219856434565e-05, + "loss": 3.1491, + "step": 800 }, { - "epoch": 0.95, - "learning_rate": 2.471426528597886e-06, - "loss": 2.3011, - "step": 545090 + "epoch": 0.0, + "learning_rate": 4.9839372338488887e-05, + "loss": 3.141, + "step": 900 }, { - "epoch": 0.95, - "learning_rate": 2.470554588671059e-06, - "loss": 2.2, - "step": 545100 + "epoch": 0.0, + "learning_rate": 4.982152482054321e-05, + "loss": 3.1409, + "step": 1000 }, { - "epoch": 0.95, - "learning_rate": 2.4696826487442324e-06, - "loss": 2.2158, - "step": 545110 + "epoch": 0.0, + "learning_rate": 4.980367730259753e-05, + "loss": 3.1489, + "step": 1100 }, { - "epoch": 0.95, - "learning_rate": 2.4688107088174053e-06, - "loss": 2.2828, - "step": 545120 + "epoch": 0.0, + "learning_rate": 4.978582978465185e-05, + "loss": 3.1458, + "step": 1200 }, { - "epoch": 0.95, - "learning_rate": 2.4679387688905786e-06, - "loss": 2.2866, - "step": 545130 + "epoch": 0.0, + "learning_rate": 4.976798226670617e-05, + "loss": 3.1312, + "step": 1300 }, { - "epoch": 0.95, - "learning_rate": 2.467066828963752e-06, - "loss": 2.1983, - "step": 545140 + "epoch": 0.0, + "learning_rate": 4.975013474876049e-05, + "loss": 3.1286, + "step": 1400 }, { - "epoch": 0.95, - "learning_rate": 2.4661948890369253e-06, - "loss": 2.2994, - "step": 545150 + "epoch": 0.01, + "learning_rate": 4.9732287230814814e-05, + "loss": 3.1277, + "step": 1500 }, { - "epoch": 0.95, - "learning_rate": 2.4653229491100982e-06, - "loss": 2.3157, - "step": 545160 + "epoch": 0.01, + "learning_rate": 4.9714439712869135e-05, + "loss": 3.1141, + "step": 1600 }, { - "epoch": 0.95, - "learning_rate": 2.4644510091832716e-06, - "loss": 2.1165, - "step": 545170 + "epoch": 0.01, + "learning_rate": 4.969659219492345e-05, + "loss": 3.1065, + "step": 1700 }, { - "epoch": 0.95, - "learning_rate": 2.4635790692564445e-06, - "loss": 2.2817, - "step": 545180 + "epoch": 0.01, + "learning_rate": 4.967874467697777e-05, + "loss": 3.1102, + "step": 1800 }, { - "epoch": 0.95, - "learning_rate": 2.462707129329618e-06, - "loss": 2.1859, - "step": 545190 + "epoch": 0.01, + "learning_rate": 4.966089715903209e-05, + "loss": 3.1169, + "step": 1900 }, { - "epoch": 0.95, - "learning_rate": 2.4618351894027908e-06, - "loss": 2.3134, - "step": 545200 + "epoch": 0.01, + "learning_rate": 4.964304964108641e-05, + "loss": 3.115, + "step": 2000 }, { - "epoch": 0.95, - "learning_rate": 2.4609632494759646e-06, - "loss": 2.2209, - "step": 545210 + "epoch": 0.01, + "learning_rate": 4.9625202123140734e-05, + "loss": 3.1067, + "step": 2100 }, { - "epoch": 0.95, - "learning_rate": 2.4600913095491375e-06, - "loss": 2.3163, - "step": 545220 + "epoch": 0.01, + "learning_rate": 4.9607354605195056e-05, + "loss": 3.0965, + "step": 2200 }, { - "epoch": 0.95, - "learning_rate": 2.459219369622311e-06, - "loss": 2.2983, - "step": 545230 + "epoch": 0.01, + "learning_rate": 4.958950708724938e-05, + "loss": 3.0902, + "step": 2300 }, { - "epoch": 0.95, - "learning_rate": 2.4583474296954837e-06, - "loss": 2.2761, - "step": 545240 + "epoch": 0.01, + "learning_rate": 4.95716595693037e-05, + "loss": 3.0859, + "step": 2400 }, { - "epoch": 0.95, - "learning_rate": 2.457475489768657e-06, - "loss": 2.2094, - "step": 545250 + "epoch": 0.01, + "learning_rate": 4.955381205135802e-05, + "loss": 3.0999, + "step": 2500 }, { - "epoch": 0.95, - "learning_rate": 2.45660354984183e-06, - "loss": 2.108, - "step": 545260 + "epoch": 0.01, + "learning_rate": 4.953596453341234e-05, + "loss": 3.0828, + "step": 2600 }, { - "epoch": 0.95, - "learning_rate": 2.4557316099150034e-06, - "loss": 2.2564, - "step": 545270 + "epoch": 0.01, + "learning_rate": 4.951811701546666e-05, + "loss": 3.0801, + "step": 2700 }, { - "epoch": 0.95, - "learning_rate": 2.4548596699881767e-06, - "loss": 2.2008, - "step": 545280 + "epoch": 0.01, + "learning_rate": 4.950026949752098e-05, + "loss": 3.0769, + "step": 2800 }, { - "epoch": 0.95, - "learning_rate": 2.45398773006135e-06, - "loss": 2.2437, - "step": 545290 + "epoch": 0.01, + "learning_rate": 4.9482421979575304e-05, + "loss": 3.0826, + "step": 2900 }, { - "epoch": 0.95, - "learning_rate": 2.453115790134523e-06, - "loss": 2.2615, - "step": 545300 + "epoch": 0.01, + "learning_rate": 4.9464574461629625e-05, + "loss": 3.0805, + "step": 3000 }, { - "epoch": 0.95, - "learning_rate": 2.4522438502076963e-06, - "loss": 2.3225, - "step": 545310 + "epoch": 0.01, + "learning_rate": 4.9446726943683947e-05, + "loss": 3.0767, + "step": 3100 }, { - "epoch": 0.95, - "learning_rate": 2.4513719102808692e-06, - "loss": 2.2736, - "step": 545320 + "epoch": 0.01, + "learning_rate": 4.942887942573827e-05, + "loss": 3.0758, + "step": 3200 }, { - "epoch": 0.95, - "learning_rate": 2.4504999703540426e-06, - "loss": 2.1832, - "step": 545330 + "epoch": 0.01, + "learning_rate": 4.941103190779259e-05, + "loss": 3.0669, + "step": 3300 }, { - "epoch": 0.95, - "learning_rate": 2.449628030427216e-06, - "loss": 2.2579, - "step": 545340 + "epoch": 0.01, + "learning_rate": 4.939318438984691e-05, + "loss": 3.0613, + "step": 3400 }, { - "epoch": 0.95, - "learning_rate": 2.4487560905003893e-06, - "loss": 2.1994, - "step": 545350 + "epoch": 0.01, + "learning_rate": 4.937533687190123e-05, + "loss": 3.0743, + "step": 3500 }, { - "epoch": 0.95, - "learning_rate": 2.4478841505735622e-06, - "loss": 2.3694, - "step": 545360 + "epoch": 0.01, + "learning_rate": 4.935748935395555e-05, + "loss": 3.0717, + "step": 3600 }, { - "epoch": 0.95, - "learning_rate": 2.4470122106467356e-06, - "loss": 2.2571, - "step": 545370 + "epoch": 0.01, + "learning_rate": 4.933964183600987e-05, + "loss": 3.0649, + "step": 3700 }, { - "epoch": 0.95, - "learning_rate": 2.4461402707199085e-06, - "loss": 2.1509, - "step": 545380 + "epoch": 0.01, + "learning_rate": 4.932179431806419e-05, + "loss": 3.0618, + "step": 3800 }, { - "epoch": 0.95, - "learning_rate": 2.445268330793082e-06, - "loss": 2.2328, - "step": 545390 + "epoch": 0.01, + "learning_rate": 4.930394680011851e-05, + "loss": 3.0586, + "step": 3900 }, { - "epoch": 0.95, - "learning_rate": 2.4443963908662548e-06, - "loss": 2.3319, - "step": 545400 + "epoch": 0.01, + "learning_rate": 4.928609928217283e-05, + "loss": 3.0575, + "step": 4000 }, { - "epoch": 0.95, - "learning_rate": 2.4435244509394285e-06, - "loss": 2.2635, - "step": 545410 + "epoch": 0.01, + "learning_rate": 4.926825176422715e-05, + "loss": 3.0582, + "step": 4100 }, { - "epoch": 0.95, - "learning_rate": 2.4426525110126014e-06, - "loss": 2.2592, - "step": 545420 + "epoch": 0.01, + "learning_rate": 4.925040424628147e-05, + "loss": 3.0567, + "step": 4200 }, { - "epoch": 0.95, - "learning_rate": 2.441780571085775e-06, - "loss": 2.1532, - "step": 545430 + "epoch": 0.02, + "learning_rate": 4.9232556728335794e-05, + "loss": 3.0404, + "step": 4300 }, { - "epoch": 0.95, - "learning_rate": 2.4409086311589477e-06, - "loss": 2.2211, - "step": 545440 + "epoch": 0.02, + "learning_rate": 4.9214709210390116e-05, + "loss": 3.0449, + "step": 4400 }, { - "epoch": 0.95, - "learning_rate": 2.440036691232121e-06, - "loss": 2.2978, - "step": 545450 + "epoch": 0.02, + "learning_rate": 4.919686169244444e-05, + "loss": 3.0541, + "step": 4500 }, { - "epoch": 0.95, - "learning_rate": 2.439164751305294e-06, - "loss": 2.2862, - "step": 545460 + "epoch": 0.02, + "learning_rate": 4.917901417449876e-05, + "loss": 3.0451, + "step": 4600 }, { - "epoch": 0.95, - "learning_rate": 2.4382928113784678e-06, - "loss": 2.2549, - "step": 545470 + "epoch": 0.02, + "learning_rate": 4.916116665655308e-05, + "loss": 3.0483, + "step": 4700 }, { - "epoch": 0.95, - "learning_rate": 2.4374208714516407e-06, - "loss": 2.2473, - "step": 545480 + "epoch": 0.02, + "learning_rate": 4.9143319138607394e-05, + "loss": 3.0485, + "step": 4800 }, { - "epoch": 0.95, - "learning_rate": 2.436548931524814e-06, - "loss": 2.3084, - "step": 545490 + "epoch": 0.02, + "learning_rate": 4.9125471620661715e-05, + "loss": 3.0481, + "step": 4900 }, { - "epoch": 0.95, - "learning_rate": 2.435676991597987e-06, - "loss": 2.1976, - "step": 545500 + "epoch": 0.02, + "learning_rate": 4.9107624102716036e-05, + "loss": 3.0357, + "step": 5000 }, { - "epoch": 0.95, - "learning_rate": 2.4348050516711603e-06, - "loss": 2.1313, - "step": 545510 + "epoch": 0.02, + "learning_rate": 4.908977658477036e-05, + "loss": 3.0463, + "step": 5100 }, { - "epoch": 0.95, - "learning_rate": 2.4339331117443332e-06, - "loss": 2.2891, - "step": 545520 + "epoch": 0.02, + "learning_rate": 4.907192906682468e-05, + "loss": 3.0369, + "step": 5200 }, { - "epoch": 0.95, - "learning_rate": 2.4330611718175066e-06, - "loss": 2.2785, - "step": 545530 + "epoch": 0.02, + "learning_rate": 4.9054081548879e-05, + "loss": 3.0465, + "step": 5300 }, { - "epoch": 0.95, - "learning_rate": 2.43218923189068e-06, - "loss": 2.2639, - "step": 545540 + "epoch": 0.02, + "learning_rate": 4.903623403093332e-05, + "loss": 3.0229, + "step": 5400 }, { - "epoch": 0.95, - "learning_rate": 2.4313172919638533e-06, - "loss": 2.2013, - "step": 545550 + "epoch": 0.02, + "learning_rate": 4.901838651298764e-05, + "loss": 3.0339, + "step": 5500 }, { - "epoch": 0.95, - "learning_rate": 2.430445352037026e-06, - "loss": 2.3245, - "step": 545560 + "epoch": 0.02, + "learning_rate": 4.900053899504196e-05, + "loss": 3.0449, + "step": 5600 }, { - "epoch": 0.95, - "learning_rate": 2.4295734121101995e-06, - "loss": 2.2147, - "step": 545570 + "epoch": 0.02, + "learning_rate": 4.8982691477096285e-05, + "loss": 3.0402, + "step": 5700 }, { - "epoch": 0.95, - "learning_rate": 2.4287014721833724e-06, - "loss": 2.2235, - "step": 545580 + "epoch": 0.02, + "learning_rate": 4.8964843959150606e-05, + "loss": 3.0287, + "step": 5800 }, { - "epoch": 0.95, - "learning_rate": 2.427829532256546e-06, - "loss": 2.2633, - "step": 545590 + "epoch": 0.02, + "learning_rate": 4.894699644120492e-05, + "loss": 3.0269, + "step": 5900 }, { - "epoch": 0.95, - "learning_rate": 2.4269575923297187e-06, - "loss": 2.2725, - "step": 545600 + "epoch": 0.02, + "learning_rate": 4.892914892325924e-05, + "loss": 3.0284, + "step": 6000 }, { - "epoch": 0.95, - "learning_rate": 2.4260856524028925e-06, - "loss": 2.2017, - "step": 545610 + "epoch": 0.02, + "learning_rate": 4.891130140531356e-05, + "loss": 3.0195, + "step": 6100 }, { - "epoch": 0.95, - "learning_rate": 2.4252137124760654e-06, - "loss": 2.2619, - "step": 545620 + "epoch": 0.02, + "learning_rate": 4.8893453887367884e-05, + "loss": 3.0309, + "step": 6200 }, { - "epoch": 0.95, - "learning_rate": 2.4243417725492388e-06, - "loss": 2.2781, - "step": 545630 + "epoch": 0.02, + "learning_rate": 4.8875606369422205e-05, + "loss": 3.0327, + "step": 6300 }, { - "epoch": 0.95, - "learning_rate": 2.4234698326224117e-06, - "loss": 2.3427, - "step": 545640 + "epoch": 0.02, + "learning_rate": 4.8857758851476526e-05, + "loss": 3.0303, + "step": 6400 }, { - "epoch": 0.95, - "learning_rate": 2.422597892695585e-06, - "loss": 2.2573, - "step": 545650 + "epoch": 0.02, + "learning_rate": 4.883991133353085e-05, + "loss": 3.0224, + "step": 6500 }, { - "epoch": 0.95, - "learning_rate": 2.421725952768758e-06, - "loss": 2.1072, - "step": 545660 + "epoch": 0.02, + "learning_rate": 4.882206381558517e-05, + "loss": 3.0304, + "step": 6600 }, { - "epoch": 0.95, - "learning_rate": 2.4208540128419317e-06, - "loss": 2.3521, - "step": 545670 + "epoch": 0.02, + "learning_rate": 4.880421629763949e-05, + "loss": 3.0275, + "step": 6700 }, { - "epoch": 0.95, - "learning_rate": 2.4199820729151046e-06, - "loss": 2.1925, - "step": 545680 + "epoch": 0.02, + "learning_rate": 4.878636877969381e-05, + "loss": 3.0202, + "step": 6800 }, { - "epoch": 0.95, - "learning_rate": 2.419110132988278e-06, - "loss": 2.4101, - "step": 545690 + "epoch": 0.02, + "learning_rate": 4.876852126174813e-05, + "loss": 3.0301, + "step": 6900 }, { - "epoch": 0.95, - "learning_rate": 2.418238193061451e-06, - "loss": 2.2786, - "step": 545700 + "epoch": 0.02, + "learning_rate": 4.875067374380245e-05, + "loss": 3.0177, + "step": 7000 }, { - "epoch": 0.95, - "learning_rate": 2.4173662531346243e-06, - "loss": 2.3245, - "step": 545710 + "epoch": 0.03, + "learning_rate": 4.873282622585677e-05, + "loss": 3.0258, + "step": 7100 }, { - "epoch": 0.95, - "learning_rate": 2.416494313207797e-06, - "loss": 2.3808, - "step": 545720 + "epoch": 0.03, + "learning_rate": 4.871497870791109e-05, + "loss": 3.0146, + "step": 7200 }, { - "epoch": 0.95, - "learning_rate": 2.4156223732809705e-06, - "loss": 2.3069, - "step": 545730 + "epoch": 0.03, + "learning_rate": 4.869713118996541e-05, + "loss": 3.0197, + "step": 7300 }, { - "epoch": 0.95, - "learning_rate": 2.414750433354144e-06, - "loss": 2.2514, - "step": 545740 + "epoch": 0.03, + "learning_rate": 4.867928367201973e-05, + "loss": 3.0226, + "step": 7400 }, { - "epoch": 0.95, - "learning_rate": 2.4138784934273172e-06, - "loss": 2.3171, - "step": 545750 + "epoch": 0.03, + "learning_rate": 4.866143615407405e-05, + "loss": 3.0154, + "step": 7500 }, { - "epoch": 0.95, - "learning_rate": 2.41300655350049e-06, - "loss": 2.3116, - "step": 545760 + "epoch": 0.03, + "learning_rate": 4.8643588636128374e-05, + "loss": 3.0075, + "step": 7600 }, { - "epoch": 0.95, - "learning_rate": 2.4121346135736635e-06, - "loss": 2.2331, - "step": 545770 + "epoch": 0.03, + "learning_rate": 4.86257411181827e-05, + "loss": 3.0174, + "step": 7700 }, { - "epoch": 0.95, - "learning_rate": 2.4112626736468364e-06, - "loss": 2.2581, - "step": 545780 + "epoch": 0.03, + "learning_rate": 4.860789360023702e-05, + "loss": 3.0117, + "step": 7800 }, { - "epoch": 0.95, - "learning_rate": 2.4103907337200098e-06, - "loss": 2.2611, - "step": 545790 + "epoch": 0.03, + "learning_rate": 4.859004608229134e-05, + "loss": 3.0067, + "step": 7900 }, { - "epoch": 0.95, - "learning_rate": 2.409518793793183e-06, - "loss": 2.3104, - "step": 545800 + "epoch": 0.03, + "learning_rate": 4.857219856434566e-05, + "loss": 3.0154, + "step": 8000 }, { - "epoch": 0.95, - "learning_rate": 2.4086468538663564e-06, - "loss": 2.2208, - "step": 545810 + "epoch": 0.03, + "learning_rate": 4.855435104639998e-05, + "loss": 3.016, + "step": 8100 }, { - "epoch": 0.95, - "learning_rate": 2.4077749139395294e-06, - "loss": 2.154, - "step": 545820 + "epoch": 0.03, + "learning_rate": 4.85365035284543e-05, + "loss": 3.0083, + "step": 8200 }, { - "epoch": 0.95, - "learning_rate": 2.4069029740127027e-06, - "loss": 2.3364, - "step": 545830 + "epoch": 0.03, + "learning_rate": 4.851865601050862e-05, + "loss": 3.0094, + "step": 8300 }, { - "epoch": 0.95, - "learning_rate": 2.4060310340858756e-06, - "loss": 2.2608, - "step": 545840 + "epoch": 0.03, + "learning_rate": 4.8500808492562944e-05, + "loss": 3.0071, + "step": 8400 }, { - "epoch": 0.95, - "learning_rate": 2.405159094159049e-06, - "loss": 2.1997, - "step": 545850 + "epoch": 0.03, + "learning_rate": 4.8482960974617265e-05, + "loss": 3.0037, + "step": 8500 }, { - "epoch": 0.95, - "learning_rate": 2.404287154232222e-06, - "loss": 2.2819, - "step": 545860 + "epoch": 0.03, + "learning_rate": 4.8465113456671586e-05, + "loss": 3.0166, + "step": 8600 }, { - "epoch": 0.95, - "learning_rate": 2.4034152143053957e-06, - "loss": 2.2785, - "step": 545870 + "epoch": 0.03, + "learning_rate": 4.844726593872591e-05, + "loss": 3.0083, + "step": 8700 }, { - "epoch": 0.95, - "learning_rate": 2.4025432743785686e-06, - "loss": 2.3315, - "step": 545880 + "epoch": 0.03, + "learning_rate": 4.842941842078023e-05, + "loss": 3.0019, + "step": 8800 }, { - "epoch": 0.95, - "learning_rate": 2.401671334451742e-06, - "loss": 2.375, - "step": 545890 + "epoch": 0.03, + "learning_rate": 4.841157090283455e-05, + "loss": 3.0104, + "step": 8900 }, { - "epoch": 0.95, - "learning_rate": 2.400799394524915e-06, - "loss": 2.3274, - "step": 545900 + "epoch": 0.03, + "learning_rate": 4.8393723384888864e-05, + "loss": 2.9979, + "step": 9000 }, { - "epoch": 0.95, - "learning_rate": 2.3999274545980882e-06, - "loss": 2.2501, - "step": 545910 + "epoch": 0.03, + "learning_rate": 4.8375875866943186e-05, + "loss": 3.0066, + "step": 9100 }, { - "epoch": 0.95, - "learning_rate": 2.399055514671261e-06, - "loss": 2.2307, - "step": 545920 + "epoch": 0.03, + "learning_rate": 4.835802834899751e-05, + "loss": 3.0047, + "step": 9200 }, { - "epoch": 0.95, - "learning_rate": 2.3981835747444345e-06, - "loss": 2.164, - "step": 545930 + "epoch": 0.03, + "learning_rate": 4.834018083105183e-05, + "loss": 3.0059, + "step": 9300 }, { - "epoch": 0.95, - "learning_rate": 2.397311634817608e-06, - "loss": 2.1375, - "step": 545940 + "epoch": 0.03, + "learning_rate": 4.832233331310615e-05, + "loss": 2.9923, + "step": 9400 }, { - "epoch": 0.95, - "learning_rate": 2.396439694890781e-06, - "loss": 2.2169, - "step": 545950 + "epoch": 0.03, + "learning_rate": 4.830448579516047e-05, + "loss": 2.9994, + "step": 9500 }, { - "epoch": 0.95, - "learning_rate": 2.395567754963954e-06, - "loss": 2.3007, - "step": 545960 + "epoch": 0.03, + "learning_rate": 4.828663827721479e-05, + "loss": 2.9912, + "step": 9600 }, { - "epoch": 0.95, - "learning_rate": 2.3946958150371274e-06, - "loss": 2.1939, - "step": 545970 + "epoch": 0.03, + "learning_rate": 4.826879075926911e-05, + "loss": 2.993, + "step": 9700 }, { - "epoch": 0.95, - "learning_rate": 2.3938238751103004e-06, - "loss": 2.2579, - "step": 545980 + "epoch": 0.03, + "learning_rate": 4.8250943241323434e-05, + "loss": 2.985, + "step": 9800 }, { - "epoch": 0.95, - "learning_rate": 2.3929519351834737e-06, - "loss": 2.2623, - "step": 545990 + "epoch": 0.04, + "learning_rate": 4.8233095723377755e-05, + "loss": 2.9926, + "step": 9900 }, { - "epoch": 0.95, - "learning_rate": 2.392079995256647e-06, - "loss": 2.1107, - "step": 546000 + "epoch": 0.04, + "learning_rate": 4.8215248205432076e-05, + "loss": 2.9905, + "step": 10000 }, { - "epoch": 0.95, - "learning_rate": 2.3912080553298204e-06, - "loss": 2.2154, - "step": 546010 + "epoch": 0.04, + "learning_rate": 4.819740068748639e-05, + "loss": 2.9819, + "step": 10100 }, { - "epoch": 0.95, - "learning_rate": 2.3903361154029933e-06, - "loss": 2.3147, - "step": 546020 + "epoch": 0.04, + "learning_rate": 4.817955316954071e-05, + "loss": 2.9921, + "step": 10200 }, { - "epoch": 0.95, - "learning_rate": 2.3894641754761667e-06, - "loss": 2.2499, - "step": 546030 + "epoch": 0.04, + "learning_rate": 4.816170565159503e-05, + "loss": 2.9812, + "step": 10300 }, { - "epoch": 0.95, - "learning_rate": 2.3885922355493396e-06, - "loss": 2.2636, - "step": 546040 + "epoch": 0.04, + "learning_rate": 4.8143858133649355e-05, + "loss": 2.9954, + "step": 10400 }, { - "epoch": 0.95, - "learning_rate": 2.387720295622513e-06, - "loss": 2.1825, - "step": 546050 + "epoch": 0.04, + "learning_rate": 4.8126010615703676e-05, + "loss": 2.9938, + "step": 10500 }, { - "epoch": 0.95, - "learning_rate": 2.386848355695686e-06, - "loss": 2.3019, - "step": 546060 + "epoch": 0.04, + "learning_rate": 4.8108163097758e-05, + "loss": 2.983, + "step": 10600 }, { - "epoch": 0.95, - "learning_rate": 2.3859764157688596e-06, - "loss": 2.2237, - "step": 546070 + "epoch": 0.04, + "learning_rate": 4.809031557981232e-05, + "loss": 2.9933, + "step": 10700 }, { - "epoch": 0.95, - "learning_rate": 2.3851044758420326e-06, - "loss": 2.2071, - "step": 546080 + "epoch": 0.04, + "learning_rate": 4.807246806186664e-05, + "loss": 2.9954, + "step": 10800 }, { - "epoch": 0.95, - "learning_rate": 2.384232535915206e-06, - "loss": 2.2997, - "step": 546090 + "epoch": 0.04, + "learning_rate": 4.805462054392096e-05, + "loss": 2.9773, + "step": 10900 }, { - "epoch": 0.95, - "learning_rate": 2.383360595988379e-06, - "loss": 2.1521, - "step": 546100 + "epoch": 0.04, + "learning_rate": 4.803677302597528e-05, + "loss": 2.9905, + "step": 11000 }, { - "epoch": 0.95, - "learning_rate": 2.382488656061552e-06, - "loss": 2.351, - "step": 546110 + "epoch": 0.04, + "learning_rate": 4.80189255080296e-05, + "loss": 2.9884, + "step": 11100 }, { - "epoch": 0.95, - "learning_rate": 2.381616716134725e-06, - "loss": 2.2448, - "step": 546120 + "epoch": 0.04, + "learning_rate": 4.800107799008392e-05, + "loss": 2.9752, + "step": 11200 }, { - "epoch": 0.95, - "learning_rate": 2.3807447762078984e-06, - "loss": 2.267, - "step": 546130 + "epoch": 0.04, + "learning_rate": 4.798323047213824e-05, + "loss": 2.9862, + "step": 11300 }, { - "epoch": 0.95, - "learning_rate": 2.379872836281072e-06, - "loss": 2.3421, - "step": 546140 + "epoch": 0.04, + "learning_rate": 4.796538295419256e-05, + "loss": 2.983, + "step": 11400 }, { - "epoch": 0.95, - "learning_rate": 2.379000896354245e-06, - "loss": 2.2389, - "step": 546150 + "epoch": 0.04, + "learning_rate": 4.794753543624688e-05, + "loss": 2.9796, + "step": 11500 }, { - "epoch": 0.95, - "learning_rate": 2.378128956427418e-06, - "loss": 2.2053, - "step": 546160 + "epoch": 0.04, + "learning_rate": 4.79296879183012e-05, + "loss": 2.9725, + "step": 11600 }, { - "epoch": 0.95, - "learning_rate": 2.3772570165005914e-06, - "loss": 2.2504, - "step": 546170 + "epoch": 0.04, + "learning_rate": 4.7911840400355524e-05, + "loss": 2.9862, + "step": 11700 }, { - "epoch": 0.95, - "learning_rate": 2.3763850765737643e-06, - "loss": 2.2459, - "step": 546180 + "epoch": 0.04, + "learning_rate": 4.7893992882409845e-05, + "loss": 2.9857, + "step": 11800 }, { - "epoch": 0.95, - "learning_rate": 2.3755131366469377e-06, - "loss": 2.225, - "step": 546190 + "epoch": 0.04, + "learning_rate": 4.7876145364464166e-05, + "loss": 2.9709, + "step": 11900 }, { - "epoch": 0.95, - "learning_rate": 2.374641196720111e-06, - "loss": 2.2955, - "step": 546200 + "epoch": 0.04, + "learning_rate": 4.785829784651849e-05, + "loss": 2.9848, + "step": 12000 }, { - "epoch": 0.95, - "learning_rate": 2.3737692567932844e-06, - "loss": 2.2561, - "step": 546210 + "epoch": 0.04, + "learning_rate": 4.784045032857281e-05, + "loss": 2.9783, + "step": 12100 }, { - "epoch": 0.95, - "learning_rate": 2.3728973168664573e-06, - "loss": 2.1852, - "step": 546220 + "epoch": 0.04, + "learning_rate": 4.782260281062712e-05, + "loss": 2.9718, + "step": 12200 }, { - "epoch": 0.95, - "learning_rate": 2.3720253769396306e-06, - "loss": 2.243, - "step": 546230 + "epoch": 0.04, + "learning_rate": 4.7804755292681444e-05, + "loss": 2.9787, + "step": 12300 }, { - "epoch": 0.95, - "learning_rate": 2.3711534370128036e-06, - "loss": 2.216, - "step": 546240 + "epoch": 0.04, + "learning_rate": 4.7786907774735765e-05, + "loss": 2.9676, + "step": 12400 }, { - "epoch": 0.95, - "learning_rate": 2.370281497085977e-06, - "loss": 2.2331, - "step": 546250 + "epoch": 0.04, + "learning_rate": 4.7769060256790086e-05, + "loss": 2.9666, + "step": 12500 }, { - "epoch": 0.95, - "learning_rate": 2.36940955715915e-06, - "loss": 2.3522, - "step": 546260 + "epoch": 0.04, + "learning_rate": 4.775121273884441e-05, + "loss": 2.9778, + "step": 12600 }, { - "epoch": 0.95, - "learning_rate": 2.3685376172323236e-06, - "loss": 2.3059, - "step": 546270 + "epoch": 0.05, + "learning_rate": 4.773336522089873e-05, + "loss": 2.9741, + "step": 12700 }, { - "epoch": 0.95, - "learning_rate": 2.3676656773054965e-06, - "loss": 2.308, - "step": 546280 + "epoch": 0.05, + "learning_rate": 4.771551770295306e-05, + "loss": 2.9708, + "step": 12800 }, { - "epoch": 0.95, - "learning_rate": 2.36679373737867e-06, - "loss": 2.2304, - "step": 546290 + "epoch": 0.05, + "learning_rate": 4.769767018500738e-05, + "loss": 2.9686, + "step": 12900 }, { - "epoch": 0.95, - "learning_rate": 2.365921797451843e-06, - "loss": 2.1864, - "step": 546300 + "epoch": 0.05, + "learning_rate": 4.76798226670617e-05, + "loss": 2.9707, + "step": 13000 }, { - "epoch": 0.95, - "learning_rate": 2.365049857525016e-06, - "loss": 2.0917, - "step": 546310 + "epoch": 0.05, + "learning_rate": 4.7661975149116014e-05, + "loss": 2.9682, + "step": 13100 }, { - "epoch": 0.95, - "learning_rate": 2.364177917598189e-06, - "loss": 2.2946, - "step": 546320 + "epoch": 0.05, + "learning_rate": 4.7644127631170335e-05, + "loss": 2.966, + "step": 13200 }, { - "epoch": 0.95, - "learning_rate": 2.3633059776713624e-06, - "loss": 2.3124, - "step": 546330 + "epoch": 0.05, + "learning_rate": 4.7626280113224656e-05, + "loss": 2.9716, + "step": 13300 }, { - "epoch": 0.95, - "learning_rate": 2.3624340377445358e-06, - "loss": 2.3082, - "step": 546340 + "epoch": 0.05, + "learning_rate": 4.760843259527898e-05, + "loss": 2.9772, + "step": 13400 }, { - "epoch": 0.95, - "learning_rate": 2.361562097817709e-06, - "loss": 2.4248, - "step": 546350 + "epoch": 0.05, + "learning_rate": 4.75905850773333e-05, + "loss": 2.9659, + "step": 13500 }, { - "epoch": 0.95, - "learning_rate": 2.360690157890882e-06, - "loss": 2.1653, - "step": 546360 + "epoch": 0.05, + "learning_rate": 4.757273755938762e-05, + "loss": 2.9753, + "step": 13600 }, { - "epoch": 0.95, - "learning_rate": 2.3598182179640554e-06, - "loss": 2.3416, - "step": 546370 + "epoch": 0.05, + "learning_rate": 4.755489004144194e-05, + "loss": 2.9617, + "step": 13700 }, { - "epoch": 0.95, - "learning_rate": 2.3589462780372283e-06, - "loss": 2.2055, - "step": 546380 + "epoch": 0.05, + "learning_rate": 4.753704252349626e-05, + "loss": 2.9614, + "step": 13800 }, { - "epoch": 0.95, - "learning_rate": 2.3580743381104016e-06, - "loss": 2.2958, - "step": 546390 + "epoch": 0.05, + "learning_rate": 4.7519195005550584e-05, + "loss": 2.9713, + "step": 13900 }, { - "epoch": 0.95, - "learning_rate": 2.357202398183575e-06, - "loss": 2.2981, - "step": 546400 + "epoch": 0.05, + "learning_rate": 4.7501347487604905e-05, + "loss": 2.9694, + "step": 14000 }, { - "epoch": 0.95, - "learning_rate": 2.3563304582567483e-06, - "loss": 2.2739, - "step": 546410 + "epoch": 0.05, + "learning_rate": 4.7483499969659226e-05, + "loss": 2.9663, + "step": 14100 }, { - "epoch": 0.95, - "learning_rate": 2.3554585183299213e-06, - "loss": 2.2434, - "step": 546420 + "epoch": 0.05, + "learning_rate": 4.746565245171354e-05, + "loss": 2.9633, + "step": 14200 }, { - "epoch": 0.95, - "learning_rate": 2.3545865784030946e-06, - "loss": 2.1919, - "step": 546430 + "epoch": 0.05, + "learning_rate": 4.744780493376786e-05, + "loss": 2.9668, + "step": 14300 }, { - "epoch": 0.95, - "learning_rate": 2.3537146384762675e-06, - "loss": 2.3015, - "step": 546440 + "epoch": 0.05, + "learning_rate": 4.742995741582218e-05, + "loss": 2.956, + "step": 14400 }, { - "epoch": 0.95, - "learning_rate": 2.352842698549441e-06, - "loss": 2.2654, - "step": 546450 + "epoch": 0.05, + "learning_rate": 4.7412109897876504e-05, + "loss": 2.9591, + "step": 14500 }, { - "epoch": 0.95, - "learning_rate": 2.351970758622614e-06, - "loss": 2.1999, - "step": 546460 + "epoch": 0.05, + "learning_rate": 4.7394262379930825e-05, + "loss": 2.9598, + "step": 14600 }, { - "epoch": 0.95, - "learning_rate": 2.3510988186957876e-06, - "loss": 2.234, - "step": 546470 + "epoch": 0.05, + "learning_rate": 4.7376414861985146e-05, + "loss": 2.95, + "step": 14700 }, { - "epoch": 0.95, - "learning_rate": 2.3502268787689605e-06, - "loss": 2.3861, - "step": 546480 + "epoch": 0.05, + "learning_rate": 4.735856734403947e-05, + "loss": 2.9574, + "step": 14800 }, { - "epoch": 0.95, - "learning_rate": 2.349354938842134e-06, - "loss": 2.2771, - "step": 546490 + "epoch": 0.05, + "learning_rate": 4.734071982609379e-05, + "loss": 2.9655, + "step": 14900 }, { - "epoch": 0.95, - "learning_rate": 2.3484829989153068e-06, - "loss": 2.2003, - "step": 546500 + "epoch": 0.05, + "learning_rate": 4.732287230814811e-05, + "loss": 2.9585, + "step": 15000 }, { - "epoch": 0.95, - "learning_rate": 2.34761105898848e-06, - "loss": 2.1573, - "step": 546510 + "epoch": 0.05, + "learning_rate": 4.730502479020243e-05, + "loss": 2.9571, + "step": 15100 }, { - "epoch": 0.95, - "learning_rate": 2.346739119061653e-06, - "loss": 2.206, - "step": 546520 + "epoch": 0.05, + "learning_rate": 4.728717727225675e-05, + "loss": 2.9675, + "step": 15200 }, { - "epoch": 0.95, - "learning_rate": 2.3458671791348264e-06, - "loss": 2.1976, - "step": 546530 + "epoch": 0.05, + "learning_rate": 4.726932975431107e-05, + "loss": 2.9577, + "step": 15300 }, { - "epoch": 0.95, - "learning_rate": 2.3449952392079997e-06, - "loss": 2.2254, - "step": 546540 + "epoch": 0.05, + "learning_rate": 4.725148223636539e-05, + "loss": 2.9613, + "step": 15400 }, { - "epoch": 0.95, - "learning_rate": 2.344123299281173e-06, - "loss": 2.2502, - "step": 546550 + "epoch": 0.06, + "learning_rate": 4.723363471841971e-05, + "loss": 2.9628, + "step": 15500 }, { - "epoch": 0.95, - "learning_rate": 2.343251359354346e-06, - "loss": 2.3419, - "step": 546560 + "epoch": 0.06, + "learning_rate": 4.721578720047403e-05, + "loss": 2.9584, + "step": 15600 }, { - "epoch": 0.95, - "learning_rate": 2.3423794194275193e-06, - "loss": 2.3007, - "step": 546570 + "epoch": 0.06, + "learning_rate": 4.719793968252835e-05, + "loss": 2.9501, + "step": 15700 }, { - "epoch": 0.95, - "learning_rate": 2.3415074795006923e-06, - "loss": 2.2496, - "step": 546580 + "epoch": 0.06, + "learning_rate": 4.718009216458267e-05, + "loss": 2.9566, + "step": 15800 }, { - "epoch": 0.95, - "learning_rate": 2.3406355395738656e-06, - "loss": 2.2267, - "step": 546590 + "epoch": 0.06, + "learning_rate": 4.7162244646636994e-05, + "loss": 2.9547, + "step": 15900 }, { - "epoch": 0.95, - "learning_rate": 2.339763599647039e-06, - "loss": 2.235, - "step": 546600 + "epoch": 0.06, + "learning_rate": 4.7144397128691315e-05, + "loss": 2.9563, + "step": 16000 }, { - "epoch": 0.95, - "learning_rate": 2.3388916597202123e-06, - "loss": 2.2486, - "step": 546610 + "epoch": 0.06, + "learning_rate": 4.712654961074564e-05, + "loss": 2.9514, + "step": 16100 }, { - "epoch": 0.95, - "learning_rate": 2.3380197197933852e-06, - "loss": 2.274, - "step": 546620 + "epoch": 0.06, + "learning_rate": 4.710870209279996e-05, + "loss": 2.953, + "step": 16200 }, { - "epoch": 0.95, - "learning_rate": 2.3371477798665586e-06, - "loss": 2.2604, - "step": 546630 + "epoch": 0.06, + "learning_rate": 4.709085457485428e-05, + "loss": 2.9614, + "step": 16300 }, { - "epoch": 0.95, - "learning_rate": 2.3362758399397315e-06, - "loss": 2.3021, - "step": 546640 + "epoch": 0.06, + "learning_rate": 4.7073007056908594e-05, + "loss": 2.9524, + "step": 16400 }, { - "epoch": 0.95, - "learning_rate": 2.335403900012905e-06, - "loss": 2.2332, - "step": 546650 + "epoch": 0.06, + "learning_rate": 4.7055159538962915e-05, + "loss": 2.9636, + "step": 16500 }, { - "epoch": 0.95, - "learning_rate": 2.3345319600860778e-06, - "loss": 2.2688, - "step": 546660 + "epoch": 0.06, + "learning_rate": 4.7037312021017236e-05, + "loss": 2.9469, + "step": 16600 }, { - "epoch": 0.95, - "learning_rate": 2.3336600201592515e-06, - "loss": 2.2771, - "step": 546670 + "epoch": 0.06, + "learning_rate": 4.701946450307156e-05, + "loss": 2.9505, + "step": 16700 }, { - "epoch": 0.95, - "learning_rate": 2.3327880802324245e-06, - "loss": 2.344, - "step": 546680 + "epoch": 0.06, + "learning_rate": 4.700161698512588e-05, + "loss": 2.9413, + "step": 16800 }, { - "epoch": 0.95, - "learning_rate": 2.331916140305598e-06, - "loss": 2.2443, - "step": 546690 + "epoch": 0.06, + "learning_rate": 4.69837694671802e-05, + "loss": 2.9437, + "step": 16900 }, { - "epoch": 0.95, - "learning_rate": 2.3310442003787707e-06, - "loss": 2.2089, - "step": 546700 + "epoch": 0.06, + "learning_rate": 4.696592194923452e-05, + "loss": 2.9568, + "step": 17000 }, { - "epoch": 0.95, - "learning_rate": 2.330172260451944e-06, - "loss": 2.281, - "step": 546710 + "epoch": 0.06, + "learning_rate": 4.694807443128884e-05, + "loss": 2.9489, + "step": 17100 }, { - "epoch": 0.95, - "learning_rate": 2.329300320525117e-06, - "loss": 2.1677, - "step": 546720 + "epoch": 0.06, + "learning_rate": 4.693022691334316e-05, + "loss": 2.9461, + "step": 17200 }, { - "epoch": 0.95, - "learning_rate": 2.3284283805982903e-06, - "loss": 2.1939, - "step": 546730 + "epoch": 0.06, + "learning_rate": 4.6912379395397484e-05, + "loss": 2.9527, + "step": 17300 }, { - "epoch": 0.95, - "learning_rate": 2.3275564406714637e-06, - "loss": 2.3583, - "step": 546740 + "epoch": 0.06, + "learning_rate": 4.6894531877451806e-05, + "loss": 2.9453, + "step": 17400 }, { - "epoch": 0.95, - "learning_rate": 2.326684500744637e-06, - "loss": 2.2376, - "step": 546750 + "epoch": 0.06, + "learning_rate": 4.687668435950612e-05, + "loss": 2.9504, + "step": 17500 }, { - "epoch": 0.95, - "learning_rate": 2.32581256081781e-06, - "loss": 2.3141, - "step": 546760 + "epoch": 0.06, + "learning_rate": 4.685883684156044e-05, + "loss": 2.9493, + "step": 17600 }, { - "epoch": 0.95, - "learning_rate": 2.3249406208909833e-06, - "loss": 2.2933, - "step": 546770 + "epoch": 0.06, + "learning_rate": 4.684098932361476e-05, + "loss": 2.9494, + "step": 17700 }, { - "epoch": 0.95, - "learning_rate": 2.3240686809641562e-06, - "loss": 2.2202, - "step": 546780 + "epoch": 0.06, + "learning_rate": 4.6823141805669084e-05, + "loss": 2.9507, + "step": 17800 }, { - "epoch": 0.95, - "learning_rate": 2.3231967410373296e-06, - "loss": 2.2829, - "step": 546790 + "epoch": 0.06, + "learning_rate": 4.680529428772341e-05, + "loss": 2.9527, + "step": 17900 }, { - "epoch": 0.95, - "learning_rate": 2.322324801110503e-06, - "loss": 2.2842, - "step": 546800 + "epoch": 0.06, + "learning_rate": 4.678744676977773e-05, + "loss": 2.9302, + "step": 18000 }, { - "epoch": 0.95, - "learning_rate": 2.3214528611836763e-06, - "loss": 2.2399, - "step": 546810 + "epoch": 0.06, + "learning_rate": 4.6769599251832054e-05, + "loss": 2.9517, + "step": 18100 }, { - "epoch": 0.95, - "learning_rate": 2.320580921256849e-06, - "loss": 2.2808, - "step": 546820 + "epoch": 0.06, + "learning_rate": 4.6751751733886375e-05, + "loss": 2.927, + "step": 18200 }, { - "epoch": 0.95, - "learning_rate": 2.3197089813300225e-06, - "loss": 2.305, - "step": 546830 + "epoch": 0.07, + "learning_rate": 4.67339042159407e-05, + "loss": 2.9401, + "step": 18300 }, { - "epoch": 0.95, - "learning_rate": 2.3188370414031955e-06, - "loss": 2.3999, - "step": 546840 + "epoch": 0.07, + "learning_rate": 4.671605669799501e-05, + "loss": 2.9564, + "step": 18400 }, { - "epoch": 0.95, - "learning_rate": 2.317965101476369e-06, - "loss": 2.3725, - "step": 546850 + "epoch": 0.07, + "learning_rate": 4.669820918004933e-05, + "loss": 2.943, + "step": 18500 }, { - "epoch": 0.95, - "learning_rate": 2.3170931615495417e-06, - "loss": 2.1977, - "step": 546860 + "epoch": 0.07, + "learning_rate": 4.6680361662103654e-05, + "loss": 2.9414, + "step": 18600 }, { - "epoch": 0.95, - "learning_rate": 2.3162212216227155e-06, - "loss": 2.2745, - "step": 546870 + "epoch": 0.07, + "learning_rate": 4.6662514144157975e-05, + "loss": 2.9446, + "step": 18700 }, { - "epoch": 0.95, - "learning_rate": 2.3153492816958884e-06, - "loss": 2.301, - "step": 546880 + "epoch": 0.07, + "learning_rate": 4.6644666626212296e-05, + "loss": 2.9462, + "step": 18800 }, { - "epoch": 0.95, - "learning_rate": 2.3144773417690618e-06, - "loss": 2.2798, - "step": 546890 + "epoch": 0.07, + "learning_rate": 4.662681910826662e-05, + "loss": 2.9353, + "step": 18900 }, { - "epoch": 0.95, - "learning_rate": 2.3136054018422347e-06, - "loss": 2.2484, - "step": 546900 + "epoch": 0.07, + "learning_rate": 4.660897159032094e-05, + "loss": 2.9467, + "step": 19000 }, { - "epoch": 0.95, - "learning_rate": 2.312733461915408e-06, - "loss": 2.3052, - "step": 546910 + "epoch": 0.07, + "learning_rate": 4.659112407237526e-05, + "loss": 2.9301, + "step": 19100 }, { - "epoch": 0.95, - "learning_rate": 2.311861521988581e-06, - "loss": 2.223, - "step": 546920 + "epoch": 0.07, + "learning_rate": 4.657327655442958e-05, + "loss": 2.9428, + "step": 19200 }, { - "epoch": 0.95, - "learning_rate": 2.3109895820617543e-06, - "loss": 2.2238, - "step": 546930 + "epoch": 0.07, + "learning_rate": 4.65554290364839e-05, + "loss": 2.9403, + "step": 19300 }, { - "epoch": 0.95, - "learning_rate": 2.3101176421349276e-06, - "loss": 2.3042, - "step": 546940 + "epoch": 0.07, + "learning_rate": 4.653758151853822e-05, + "loss": 2.9301, + "step": 19400 }, { - "epoch": 0.95, - "learning_rate": 2.309245702208101e-06, - "loss": 2.3014, - "step": 546950 + "epoch": 0.07, + "learning_rate": 4.651973400059254e-05, + "loss": 2.9338, + "step": 19500 }, { - "epoch": 0.95, - "learning_rate": 2.308373762281274e-06, - "loss": 2.2912, - "step": 546960 + "epoch": 0.07, + "learning_rate": 4.650188648264686e-05, + "loss": 2.9398, + "step": 19600 }, { - "epoch": 0.95, - "learning_rate": 2.3075018223544473e-06, - "loss": 2.2321, - "step": 546970 + "epoch": 0.07, + "learning_rate": 4.648403896470118e-05, + "loss": 2.9341, + "step": 19700 }, { - "epoch": 0.95, - "learning_rate": 2.30662988242762e-06, - "loss": 2.2372, - "step": 546980 + "epoch": 0.07, + "learning_rate": 4.64661914467555e-05, + "loss": 2.9378, + "step": 19800 }, { - "epoch": 0.95, - "learning_rate": 2.3057579425007935e-06, - "loss": 2.2261, - "step": 546990 + "epoch": 0.07, + "learning_rate": 4.644834392880982e-05, + "loss": 2.9242, + "step": 19900 }, { - "epoch": 0.95, - "learning_rate": 2.304886002573967e-06, - "loss": 2.2528, - "step": 547000 + "epoch": 0.07, + "learning_rate": 4.6430496410864144e-05, + "loss": 2.9369, + "step": 20000 }, { - "epoch": 0.95, - "learning_rate": 2.3040140626471402e-06, - "loss": 2.3404, - "step": 547010 + "epoch": 0.07, + "learning_rate": 4.6412648892918465e-05, + "loss": 2.9442, + "step": 20100 }, { - "epoch": 0.95, - "learning_rate": 2.303142122720313e-06, - "loss": 2.3461, - "step": 547020 + "epoch": 0.07, + "learning_rate": 4.6394801374972786e-05, + "loss": 2.934, + "step": 20200 }, { - "epoch": 0.95, - "learning_rate": 2.3022701827934865e-06, - "loss": 2.3317, - "step": 547030 + "epoch": 0.07, + "learning_rate": 4.637695385702711e-05, + "loss": 2.9385, + "step": 20300 }, { - "epoch": 0.95, - "learning_rate": 2.3013982428666594e-06, - "loss": 2.246, - "step": 547040 + "epoch": 0.07, + "learning_rate": 4.635910633908143e-05, + "loss": 2.9304, + "step": 20400 }, { - "epoch": 0.95, - "learning_rate": 2.3005263029398328e-06, - "loss": 2.1873, - "step": 547050 + "epoch": 0.07, + "learning_rate": 4.634125882113575e-05, + "loss": 2.9351, + "step": 20500 }, { - "epoch": 0.95, - "learning_rate": 2.2996543630130057e-06, - "loss": 2.3561, - "step": 547060 + "epoch": 0.07, + "learning_rate": 4.6323411303190064e-05, + "loss": 2.9297, + "step": 20600 }, { - "epoch": 0.95, - "learning_rate": 2.2987824230861795e-06, - "loss": 2.2678, - "step": 547070 + "epoch": 0.07, + "learning_rate": 4.6305563785244385e-05, + "loss": 2.9271, + "step": 20700 }, { - "epoch": 0.95, - "learning_rate": 2.2979104831593524e-06, - "loss": 2.2016, - "step": 547080 + "epoch": 0.07, + "learning_rate": 4.628771626729871e-05, + "loss": 2.9317, + "step": 20800 }, { - "epoch": 0.95, - "learning_rate": 2.2970385432325257e-06, - "loss": 2.2192, - "step": 547090 + "epoch": 0.07, + "learning_rate": 4.626986874935303e-05, + "loss": 2.9295, + "step": 20900 }, { - "epoch": 0.95, - "learning_rate": 2.2961666033056986e-06, - "loss": 2.2594, - "step": 547100 + "epoch": 0.07, + "learning_rate": 4.625202123140735e-05, + "loss": 2.9402, + "step": 21000 }, { - "epoch": 0.95, - "learning_rate": 2.295294663378872e-06, - "loss": 2.3505, - "step": 547110 + "epoch": 0.08, + "learning_rate": 4.623417371346167e-05, + "loss": 2.9259, + "step": 21100 }, { - "epoch": 0.95, - "learning_rate": 2.294422723452045e-06, - "loss": 2.2501, - "step": 547120 + "epoch": 0.08, + "learning_rate": 4.621632619551599e-05, + "loss": 2.933, + "step": 21200 }, { - "epoch": 0.95, - "learning_rate": 2.2935507835252187e-06, - "loss": 2.2323, - "step": 547130 + "epoch": 0.08, + "learning_rate": 4.619847867757031e-05, + "loss": 2.9216, + "step": 21300 }, { - "epoch": 0.95, - "learning_rate": 2.2926788435983916e-06, - "loss": 2.1234, - "step": 547140 + "epoch": 0.08, + "learning_rate": 4.6180631159624634e-05, + "loss": 2.933, + "step": 21400 }, { - "epoch": 0.95, - "learning_rate": 2.291806903671565e-06, - "loss": 2.0985, - "step": 547150 + "epoch": 0.08, + "learning_rate": 4.6162783641678955e-05, + "loss": 2.9376, + "step": 21500 }, { - "epoch": 0.95, - "learning_rate": 2.290934963744738e-06, - "loss": 2.3311, - "step": 547160 + "epoch": 0.08, + "learning_rate": 4.6144936123733276e-05, + "loss": 2.9255, + "step": 21600 }, { - "epoch": 0.95, - "learning_rate": 2.2900630238179112e-06, - "loss": 2.233, - "step": 547170 + "epoch": 0.08, + "learning_rate": 4.612708860578759e-05, + "loss": 2.9342, + "step": 21700 }, { - "epoch": 0.95, - "learning_rate": 2.289191083891084e-06, - "loss": 2.2663, - "step": 547180 + "epoch": 0.08, + "learning_rate": 4.610924108784191e-05, + "loss": 2.9278, + "step": 21800 }, { - "epoch": 0.95, - "learning_rate": 2.2883191439642575e-06, - "loss": 2.2596, - "step": 547190 + "epoch": 0.08, + "learning_rate": 4.609139356989623e-05, + "loss": 2.9181, + "step": 21900 }, { - "epoch": 0.95, - "learning_rate": 2.287447204037431e-06, - "loss": 2.2153, - "step": 547200 + "epoch": 0.08, + "learning_rate": 4.6073546051950554e-05, + "loss": 2.927, + "step": 22000 }, { - "epoch": 0.95, - "learning_rate": 2.286575264110604e-06, - "loss": 2.1509, - "step": 547210 + "epoch": 0.08, + "learning_rate": 4.6055698534004876e-05, + "loss": 2.9297, + "step": 22100 }, { - "epoch": 0.95, - "learning_rate": 2.285703324183777e-06, - "loss": 2.2355, - "step": 547220 + "epoch": 0.08, + "learning_rate": 4.60378510160592e-05, + "loss": 2.9301, + "step": 22200 }, { - "epoch": 0.95, - "learning_rate": 2.2848313842569505e-06, - "loss": 2.3394, - "step": 547230 + "epoch": 0.08, + "learning_rate": 4.602000349811352e-05, + "loss": 2.9257, + "step": 22300 }, { - "epoch": 0.95, - "learning_rate": 2.2839594443301234e-06, - "loss": 2.0861, - "step": 547240 + "epoch": 0.08, + "learning_rate": 4.600215598016784e-05, + "loss": 2.9263, + "step": 22400 }, { - "epoch": 0.95, - "learning_rate": 2.2830875044032967e-06, - "loss": 2.3179, - "step": 547250 + "epoch": 0.08, + "learning_rate": 4.598430846222216e-05, + "loss": 2.9152, + "step": 22500 }, { - "epoch": 0.95, - "learning_rate": 2.2822155644764697e-06, - "loss": 2.4755, - "step": 547260 + "epoch": 0.08, + "learning_rate": 4.596646094427648e-05, + "loss": 2.9272, + "step": 22600 }, { - "epoch": 0.95, - "learning_rate": 2.2813436245496434e-06, - "loss": 2.2912, - "step": 547270 + "epoch": 0.08, + "learning_rate": 4.59486134263308e-05, + "loss": 2.9196, + "step": 22700 }, { - "epoch": 0.95, - "learning_rate": 2.2804716846228163e-06, - "loss": 2.2019, - "step": 547280 + "epoch": 0.08, + "learning_rate": 4.593076590838512e-05, + "loss": 2.9285, + "step": 22800 }, { - "epoch": 0.95, - "learning_rate": 2.2795997446959897e-06, - "loss": 2.2186, - "step": 547290 + "epoch": 0.08, + "learning_rate": 4.591291839043944e-05, + "loss": 2.9176, + "step": 22900 }, { - "epoch": 0.95, - "learning_rate": 2.2787278047691626e-06, - "loss": 2.2714, - "step": 547300 + "epoch": 0.08, + "learning_rate": 4.589507087249377e-05, + "loss": 2.9267, + "step": 23000 }, { - "epoch": 0.95, - "learning_rate": 2.277855864842336e-06, - "loss": 2.3745, - "step": 547310 + "epoch": 0.08, + "learning_rate": 4.587722335454809e-05, + "loss": 2.9226, + "step": 23100 }, { - "epoch": 0.95, - "learning_rate": 2.276983924915509e-06, - "loss": 2.2315, - "step": 547320 + "epoch": 0.08, + "learning_rate": 4.585937583660241e-05, + "loss": 2.9278, + "step": 23200 }, { - "epoch": 0.95, - "learning_rate": 2.2761119849886827e-06, - "loss": 2.2822, - "step": 547330 + "epoch": 0.08, + "learning_rate": 4.584152831865673e-05, + "loss": 2.9186, + "step": 23300 }, { - "epoch": 0.95, - "learning_rate": 2.2752400450618556e-06, - "loss": 2.2022, - "step": 547340 + "epoch": 0.08, + "learning_rate": 4.582368080071105e-05, + "loss": 2.9262, + "step": 23400 }, { - "epoch": 0.95, - "learning_rate": 2.274368105135029e-06, - "loss": 2.2784, - "step": 547350 + "epoch": 0.08, + "learning_rate": 4.580583328276537e-05, + "loss": 2.9204, + "step": 23500 }, { - "epoch": 0.95, - "learning_rate": 2.273496165208202e-06, - "loss": 2.2043, - "step": 547360 + "epoch": 0.08, + "learning_rate": 4.5787985764819694e-05, + "loss": 2.9287, + "step": 23600 }, { - "epoch": 0.95, - "learning_rate": 2.272624225281375e-06, - "loss": 2.3141, - "step": 547370 + "epoch": 0.08, + "learning_rate": 4.577013824687401e-05, + "loss": 2.9274, + "step": 23700 }, { - "epoch": 0.95, - "learning_rate": 2.271752285354548e-06, - "loss": 2.2086, - "step": 547380 + "epoch": 0.08, + "learning_rate": 4.575229072892833e-05, + "loss": 2.904, + "step": 23800 }, { - "epoch": 0.95, - "learning_rate": 2.2708803454277215e-06, - "loss": 2.2828, - "step": 547390 + "epoch": 0.09, + "learning_rate": 4.573444321098265e-05, + "loss": 2.9017, + "step": 23900 }, { - "epoch": 0.95, - "learning_rate": 2.270008405500895e-06, - "loss": 2.1905, - "step": 547400 + "epoch": 0.09, + "learning_rate": 4.571659569303697e-05, + "loss": 2.9142, + "step": 24000 }, { - "epoch": 0.95, - "learning_rate": 2.269136465574068e-06, - "loss": 2.3122, - "step": 547410 + "epoch": 0.09, + "learning_rate": 4.569874817509129e-05, + "loss": 2.9195, + "step": 24100 }, { - "epoch": 0.95, - "learning_rate": 2.268264525647241e-06, - "loss": 2.2688, - "step": 547420 + "epoch": 0.09, + "learning_rate": 4.5680900657145614e-05, + "loss": 2.9171, + "step": 24200 }, { - "epoch": 0.95, - "learning_rate": 2.2673925857204144e-06, - "loss": 2.1581, - "step": 547430 + "epoch": 0.09, + "learning_rate": 4.5663053139199936e-05, + "loss": 2.921, + "step": 24300 }, { - "epoch": 0.95, - "learning_rate": 2.2665206457935873e-06, - "loss": 2.3199, - "step": 547440 + "epoch": 0.09, + "learning_rate": 4.564520562125426e-05, + "loss": 2.9243, + "step": 24400 }, { - "epoch": 0.95, - "learning_rate": 2.2656487058667607e-06, - "loss": 2.1878, - "step": 547450 + "epoch": 0.09, + "learning_rate": 4.562735810330858e-05, + "loss": 2.9245, + "step": 24500 }, { - "epoch": 0.95, - "learning_rate": 2.2647767659399336e-06, - "loss": 2.0662, - "step": 547460 + "epoch": 0.09, + "learning_rate": 4.56095105853629e-05, + "loss": 2.9135, + "step": 24600 }, { - "epoch": 0.95, - "learning_rate": 2.2639048260131074e-06, - "loss": 2.2949, - "step": 547470 + "epoch": 0.09, + "learning_rate": 4.559166306741722e-05, + "loss": 2.9224, + "step": 24700 }, { - "epoch": 0.95, - "learning_rate": 2.2630328860862803e-06, - "loss": 2.1925, - "step": 547480 + "epoch": 0.09, + "learning_rate": 4.5573815549471535e-05, + "loss": 2.9328, + "step": 24800 }, { - "epoch": 0.95, - "learning_rate": 2.2621609461594537e-06, - "loss": 2.1069, - "step": 547490 + "epoch": 0.09, + "learning_rate": 4.5555968031525856e-05, + "loss": 2.9171, + "step": 24900 }, { - "epoch": 0.95, - "learning_rate": 2.2612890062326266e-06, - "loss": 2.2431, - "step": 547500 + "epoch": 0.09, + "learning_rate": 4.553812051358018e-05, + "loss": 2.9026, + "step": 25000 }, { - "epoch": 0.95, - "learning_rate": 2.2604170663058e-06, - "loss": 2.2422, - "step": 547510 + "epoch": 0.09, + "learning_rate": 4.55202729956345e-05, + "loss": 2.9174, + "step": 25100 }, { - "epoch": 0.95, - "learning_rate": 2.259545126378973e-06, - "loss": 2.2959, - "step": 547520 + "epoch": 0.09, + "learning_rate": 4.550242547768882e-05, + "loss": 2.915, + "step": 25200 }, { - "epoch": 0.95, - "learning_rate": 2.2586731864521466e-06, - "loss": 2.2155, - "step": 547530 + "epoch": 0.09, + "learning_rate": 4.548457795974314e-05, + "loss": 2.9166, + "step": 25300 }, { - "epoch": 0.95, - "learning_rate": 2.2578012465253195e-06, - "loss": 2.3109, - "step": 547540 + "epoch": 0.09, + "learning_rate": 4.546673044179746e-05, + "loss": 2.92, + "step": 25400 }, { - "epoch": 0.95, - "learning_rate": 2.256929306598493e-06, - "loss": 2.2589, - "step": 547550 + "epoch": 0.09, + "learning_rate": 4.5448882923851783e-05, + "loss": 2.9208, + "step": 25500 }, { - "epoch": 0.95, - "learning_rate": 2.256057366671666e-06, - "loss": 2.2799, - "step": 547560 + "epoch": 0.09, + "learning_rate": 4.5431035405906105e-05, + "loss": 2.9125, + "step": 25600 }, { - "epoch": 0.95, - "learning_rate": 2.255185426744839e-06, - "loss": 2.2483, - "step": 547570 + "epoch": 0.09, + "learning_rate": 4.5413187887960426e-05, + "loss": 2.9141, + "step": 25700 }, { - "epoch": 0.95, - "learning_rate": 2.254313486818012e-06, - "loss": 2.2025, - "step": 547580 + "epoch": 0.09, + "learning_rate": 4.539534037001475e-05, + "loss": 2.9063, + "step": 25800 }, { - "epoch": 0.95, - "learning_rate": 2.2534415468911854e-06, - "loss": 2.2733, - "step": 547590 + "epoch": 0.09, + "learning_rate": 4.537749285206906e-05, + "loss": 2.9108, + "step": 25900 }, { - "epoch": 0.95, - "learning_rate": 2.2525696069643588e-06, - "loss": 2.3538, - "step": 547600 + "epoch": 0.09, + "learning_rate": 4.535964533412338e-05, + "loss": 2.8963, + "step": 26000 }, { - "epoch": 0.95, - "learning_rate": 2.251697667037532e-06, - "loss": 2.3007, - "step": 547610 + "epoch": 0.09, + "learning_rate": 4.5341797816177704e-05, + "loss": 2.9079, + "step": 26100 }, { - "epoch": 0.95, - "learning_rate": 2.250825727110705e-06, - "loss": 2.3888, - "step": 547620 + "epoch": 0.09, + "learning_rate": 4.5323950298232025e-05, + "loss": 2.9122, + "step": 26200 }, { - "epoch": 0.96, - "learning_rate": 2.2499537871838784e-06, - "loss": 2.2001, - "step": 547630 + "epoch": 0.09, + "learning_rate": 4.5306102780286346e-05, + "loss": 2.9094, + "step": 26300 }, { - "epoch": 0.96, - "learning_rate": 2.2490818472570513e-06, - "loss": 2.3206, - "step": 547640 + "epoch": 0.09, + "learning_rate": 4.528825526234067e-05, + "loss": 2.9195, + "step": 26400 }, { - "epoch": 0.96, - "learning_rate": 2.2482099073302247e-06, - "loss": 2.2795, - "step": 547650 + "epoch": 0.09, + "learning_rate": 4.527040774439499e-05, + "loss": 2.9079, + "step": 26500 }, { - "epoch": 0.96, - "learning_rate": 2.2473379674033976e-06, - "loss": 2.1441, - "step": 547660 + "epoch": 0.09, + "learning_rate": 4.525256022644931e-05, + "loss": 2.9167, + "step": 26600 }, { - "epoch": 0.96, - "learning_rate": 2.2464660274765713e-06, - "loss": 2.3291, - "step": 547670 + "epoch": 0.1, + "learning_rate": 4.523471270850363e-05, + "loss": 2.9091, + "step": 26700 }, { - "epoch": 0.96, - "learning_rate": 2.2455940875497443e-06, - "loss": 2.3019, - "step": 547680 + "epoch": 0.1, + "learning_rate": 4.521686519055795e-05, + "loss": 2.9022, + "step": 26800 }, { - "epoch": 0.96, - "learning_rate": 2.2447221476229176e-06, - "loss": 2.1395, - "step": 547690 + "epoch": 0.1, + "learning_rate": 4.5199017672612274e-05, + "loss": 2.9099, + "step": 26900 }, { - "epoch": 0.96, - "learning_rate": 2.2438502076960905e-06, - "loss": 2.4181, - "step": 547700 + "epoch": 0.1, + "learning_rate": 4.518117015466659e-05, + "loss": 2.9264, + "step": 27000 }, { - "epoch": 0.96, - "learning_rate": 2.242978267769264e-06, - "loss": 2.3326, - "step": 547710 + "epoch": 0.1, + "learning_rate": 4.516332263672091e-05, + "loss": 2.911, + "step": 27100 }, { - "epoch": 0.96, - "learning_rate": 2.242106327842437e-06, - "loss": 2.2458, - "step": 547720 + "epoch": 0.1, + "learning_rate": 4.514547511877523e-05, + "loss": 2.9119, + "step": 27200 }, { - "epoch": 0.96, - "learning_rate": 2.2412343879156106e-06, - "loss": 2.252, - "step": 547730 + "epoch": 0.1, + "learning_rate": 4.512762760082955e-05, + "loss": 2.9108, + "step": 27300 }, { - "epoch": 0.96, - "learning_rate": 2.2403624479887835e-06, - "loss": 2.2049, - "step": 547740 + "epoch": 0.1, + "learning_rate": 4.510978008288387e-05, + "loss": 2.9135, + "step": 27400 }, { - "epoch": 0.96, - "learning_rate": 2.239490508061957e-06, - "loss": 2.196, - "step": 547750 + "epoch": 0.1, + "learning_rate": 4.5091932564938194e-05, + "loss": 2.9107, + "step": 27500 }, { - "epoch": 0.96, - "learning_rate": 2.2386185681351298e-06, - "loss": 2.3516, - "step": 547760 + "epoch": 0.1, + "learning_rate": 4.5074085046992515e-05, + "loss": 2.8936, + "step": 27600 }, { - "epoch": 0.96, - "learning_rate": 2.237746628208303e-06, - "loss": 2.2954, - "step": 547770 + "epoch": 0.1, + "learning_rate": 4.505623752904684e-05, + "loss": 2.9127, + "step": 27700 }, { - "epoch": 0.96, - "learning_rate": 2.236874688281476e-06, - "loss": 2.1983, - "step": 547780 + "epoch": 0.1, + "learning_rate": 4.503839001110116e-05, + "loss": 2.9002, + "step": 27800 }, { - "epoch": 0.96, - "learning_rate": 2.2360027483546494e-06, - "loss": 2.146, - "step": 547790 + "epoch": 0.1, + "learning_rate": 4.502054249315548e-05, + "loss": 2.9018, + "step": 27900 }, { - "epoch": 0.96, - "learning_rate": 2.2351308084278227e-06, - "loss": 2.2141, - "step": 547800 + "epoch": 0.1, + "learning_rate": 4.50026949752098e-05, + "loss": 2.8991, + "step": 28000 }, { - "epoch": 0.96, - "learning_rate": 2.234258868500996e-06, - "loss": 2.2574, - "step": 547810 + "epoch": 0.1, + "learning_rate": 4.498484745726412e-05, + "loss": 2.9029, + "step": 28100 }, { - "epoch": 0.96, - "learning_rate": 2.233386928574169e-06, - "loss": 2.1786, - "step": 547820 + "epoch": 0.1, + "learning_rate": 4.496699993931844e-05, + "loss": 2.9135, + "step": 28200 }, { - "epoch": 0.96, - "learning_rate": 2.2325149886473423e-06, - "loss": 2.2283, - "step": 547830 + "epoch": 0.1, + "learning_rate": 4.4949152421372764e-05, + "loss": 2.9018, + "step": 28300 }, { - "epoch": 0.96, - "learning_rate": 2.2316430487205153e-06, - "loss": 2.232, - "step": 547840 + "epoch": 0.1, + "learning_rate": 4.4931304903427085e-05, + "loss": 2.9132, + "step": 28400 }, { - "epoch": 0.96, - "learning_rate": 2.2307711087936886e-06, - "loss": 2.2842, - "step": 547850 + "epoch": 0.1, + "learning_rate": 4.4913457385481406e-05, + "loss": 2.915, + "step": 28500 }, { - "epoch": 0.96, - "learning_rate": 2.2298991688668615e-06, - "loss": 2.2714, - "step": 547860 + "epoch": 0.1, + "learning_rate": 4.489560986753573e-05, + "loss": 2.8909, + "step": 28600 }, { - "epoch": 0.96, - "learning_rate": 2.2290272289400353e-06, - "loss": 2.1873, - "step": 547870 + "epoch": 0.1, + "learning_rate": 4.487776234959005e-05, + "loss": 2.9024, + "step": 28700 }, { - "epoch": 0.96, - "learning_rate": 2.2281552890132082e-06, - "loss": 2.2551, - "step": 547880 + "epoch": 0.1, + "learning_rate": 4.485991483164437e-05, + "loss": 2.8926, + "step": 28800 }, { - "epoch": 0.96, - "learning_rate": 2.2272833490863816e-06, - "loss": 2.2201, - "step": 547890 + "epoch": 0.1, + "learning_rate": 4.484206731369869e-05, + "loss": 2.8982, + "step": 28900 }, { - "epoch": 0.96, - "learning_rate": 2.2264114091595545e-06, - "loss": 2.1522, - "step": 547900 + "epoch": 0.1, + "learning_rate": 4.4824219795753006e-05, + "loss": 2.9044, + "step": 29000 }, { - "epoch": 0.96, - "learning_rate": 2.225539469232728e-06, - "loss": 2.3391, - "step": 547910 + "epoch": 0.1, + "learning_rate": 4.480637227780733e-05, + "loss": 2.9007, + "step": 29100 }, { - "epoch": 0.96, - "learning_rate": 2.2246675293059008e-06, - "loss": 2.2814, - "step": 547920 + "epoch": 0.1, + "learning_rate": 4.478852475986165e-05, + "loss": 2.8998, + "step": 29200 }, { - "epoch": 0.96, - "learning_rate": 2.2237955893790745e-06, - "loss": 2.287, - "step": 547930 + "epoch": 0.1, + "learning_rate": 4.477067724191597e-05, + "loss": 2.9021, + "step": 29300 }, { - "epoch": 0.96, - "learning_rate": 2.2229236494522475e-06, - "loss": 2.3146, - "step": 547940 + "epoch": 0.1, + "learning_rate": 4.475282972397029e-05, + "loss": 2.9067, + "step": 29400 }, { - "epoch": 0.96, - "learning_rate": 2.222051709525421e-06, - "loss": 2.1639, - "step": 547950 + "epoch": 0.11, + "learning_rate": 4.473498220602461e-05, + "loss": 2.9029, + "step": 29500 }, { - "epoch": 0.96, - "learning_rate": 2.2211797695985937e-06, - "loss": 2.3047, - "step": 547960 + "epoch": 0.11, + "learning_rate": 4.471713468807893e-05, + "loss": 2.8996, + "step": 29600 }, { - "epoch": 0.96, - "learning_rate": 2.220307829671767e-06, - "loss": 2.2788, - "step": 547970 + "epoch": 0.11, + "learning_rate": 4.4699287170133254e-05, + "loss": 2.8947, + "step": 29700 }, { - "epoch": 0.96, - "learning_rate": 2.21943588974494e-06, - "loss": 2.2073, - "step": 547980 + "epoch": 0.11, + "learning_rate": 4.4681439652187575e-05, + "loss": 2.8999, + "step": 29800 }, { - "epoch": 0.96, - "learning_rate": 2.2185639498181133e-06, - "loss": 2.2876, - "step": 547990 + "epoch": 0.11, + "learning_rate": 4.4663592134241897e-05, + "loss": 2.8911, + "step": 29900 }, { - "epoch": 0.96, - "learning_rate": 2.2176920098912867e-06, - "loss": 2.2736, - "step": 548000 + "epoch": 0.11, + "learning_rate": 4.464574461629622e-05, + "loss": 2.8956, + "step": 30000 }, { - "epoch": 0.96, - "learning_rate": 2.21682006996446e-06, - "loss": 2.265, - "step": 548010 + "epoch": 0.11, + "learning_rate": 4.462789709835053e-05, + "loss": 2.9037, + "step": 30100 }, { - "epoch": 0.96, - "learning_rate": 2.215948130037633e-06, - "loss": 2.2266, - "step": 548020 + "epoch": 0.11, + "learning_rate": 4.4610049580404853e-05, + "loss": 2.888, + "step": 30200 }, { - "epoch": 0.96, - "learning_rate": 2.2150761901108063e-06, - "loss": 2.2271, - "step": 548030 + "epoch": 0.11, + "learning_rate": 4.4592202062459175e-05, + "loss": 2.8946, + "step": 30300 }, { - "epoch": 0.96, - "learning_rate": 2.2142042501839792e-06, - "loss": 2.2247, - "step": 548040 + "epoch": 0.11, + "learning_rate": 4.4574354544513496e-05, + "loss": 2.9023, + "step": 30400 }, { - "epoch": 0.96, - "learning_rate": 2.2133323102571526e-06, - "loss": 2.2552, - "step": 548050 + "epoch": 0.11, + "learning_rate": 4.455650702656782e-05, + "loss": 2.9015, + "step": 30500 }, { - "epoch": 0.96, - "learning_rate": 2.2124603703303255e-06, - "loss": 2.2627, - "step": 548060 + "epoch": 0.11, + "learning_rate": 4.453865950862214e-05, + "loss": 2.8981, + "step": 30600 }, { - "epoch": 0.96, - "learning_rate": 2.2115884304034993e-06, - "loss": 2.2483, - "step": 548070 + "epoch": 0.11, + "learning_rate": 4.452081199067646e-05, + "loss": 2.9012, + "step": 30700 }, { - "epoch": 0.96, - "learning_rate": 2.210716490476672e-06, - "loss": 2.3368, - "step": 548080 + "epoch": 0.11, + "learning_rate": 4.450296447273078e-05, + "loss": 2.9027, + "step": 30800 }, { - "epoch": 0.96, - "learning_rate": 2.2098445505498455e-06, - "loss": 2.2257, - "step": 548090 + "epoch": 0.11, + "learning_rate": 4.44851169547851e-05, + "loss": 2.8998, + "step": 30900 }, { - "epoch": 0.96, - "learning_rate": 2.2089726106230185e-06, - "loss": 2.2755, - "step": 548100 + "epoch": 0.11, + "learning_rate": 4.446726943683942e-05, + "loss": 2.896, + "step": 31000 }, { - "epoch": 0.96, - "learning_rate": 2.208100670696192e-06, - "loss": 2.2692, - "step": 548110 + "epoch": 0.11, + "learning_rate": 4.4449421918893744e-05, + "loss": 2.8943, + "step": 31100 }, { - "epoch": 0.96, - "learning_rate": 2.2072287307693647e-06, - "loss": 2.2085, - "step": 548120 + "epoch": 0.11, + "learning_rate": 4.443157440094806e-05, + "loss": 2.8959, + "step": 31200 }, { - "epoch": 0.96, - "learning_rate": 2.2063567908425385e-06, - "loss": 2.1802, - "step": 548130 + "epoch": 0.11, + "learning_rate": 4.441372688300238e-05, + "loss": 2.8864, + "step": 31300 }, { - "epoch": 0.96, - "learning_rate": 2.2054848509157114e-06, - "loss": 2.1915, - "step": 548140 + "epoch": 0.11, + "learning_rate": 4.43958793650567e-05, + "loss": 2.8969, + "step": 31400 }, { - "epoch": 0.96, - "learning_rate": 2.2046129109888848e-06, - "loss": 2.2696, - "step": 548150 + "epoch": 0.11, + "learning_rate": 4.437803184711102e-05, + "loss": 2.8877, + "step": 31500 }, { - "epoch": 0.96, - "learning_rate": 2.2037409710620577e-06, - "loss": 2.2594, - "step": 548160 + "epoch": 0.11, + "learning_rate": 4.4360184329165344e-05, + "loss": 2.888, + "step": 31600 }, { - "epoch": 0.96, - "learning_rate": 2.202869031135231e-06, - "loss": 2.3258, - "step": 548170 + "epoch": 0.11, + "learning_rate": 4.4342336811219665e-05, + "loss": 2.8799, + "step": 31700 }, { - "epoch": 0.96, - "learning_rate": 2.201997091208404e-06, - "loss": 2.2721, - "step": 548180 + "epoch": 0.11, + "learning_rate": 4.4324489293273986e-05, + "loss": 2.8901, + "step": 31800 }, { - "epoch": 0.96, - "learning_rate": 2.2011251512815773e-06, - "loss": 2.2186, - "step": 548190 + "epoch": 0.11, + "learning_rate": 4.430664177532831e-05, + "loss": 2.8944, + "step": 31900 }, { - "epoch": 0.96, - "learning_rate": 2.2002532113547507e-06, - "loss": 2.3382, - "step": 548200 + "epoch": 0.11, + "learning_rate": 4.428879425738263e-05, + "loss": 2.8914, + "step": 32000 }, { - "epoch": 0.96, - "learning_rate": 2.199381271427924e-06, - "loss": 2.3268, - "step": 548210 + "epoch": 0.11, + "learning_rate": 4.427094673943695e-05, + "loss": 2.8816, + "step": 32100 }, { - "epoch": 0.96, - "learning_rate": 2.198509331501097e-06, - "loss": 2.3425, - "step": 548220 + "epoch": 0.11, + "learning_rate": 4.425309922149127e-05, + "loss": 2.8752, + "step": 32200 }, { - "epoch": 0.96, - "learning_rate": 2.1976373915742703e-06, - "loss": 2.1319, - "step": 548230 + "epoch": 0.12, + "learning_rate": 4.4235251703545585e-05, + "loss": 2.8947, + "step": 32300 }, { - "epoch": 0.96, - "learning_rate": 2.196765451647443e-06, - "loss": 2.2031, - "step": 548240 + "epoch": 0.12, + "learning_rate": 4.421740418559991e-05, + "loss": 2.8882, + "step": 32400 }, { - "epoch": 0.96, - "learning_rate": 2.1958935117206165e-06, - "loss": 2.2311, - "step": 548250 + "epoch": 0.12, + "learning_rate": 4.419955666765423e-05, + "loss": 2.8851, + "step": 32500 }, { - "epoch": 0.96, - "learning_rate": 2.1950215717937895e-06, - "loss": 2.2964, - "step": 548260 + "epoch": 0.12, + "learning_rate": 4.418170914970855e-05, + "loss": 2.8871, + "step": 32600 }, { - "epoch": 0.96, - "learning_rate": 2.1941496318669632e-06, - "loss": 2.241, - "step": 548270 + "epoch": 0.12, + "learning_rate": 4.416386163176287e-05, + "loss": 2.8999, + "step": 32700 }, { - "epoch": 0.96, - "learning_rate": 2.193277691940136e-06, - "loss": 2.1729, - "step": 548280 + "epoch": 0.12, + "learning_rate": 4.414601411381719e-05, + "loss": 2.8968, + "step": 32800 }, { - "epoch": 0.96, - "learning_rate": 2.1924057520133095e-06, - "loss": 2.1319, - "step": 548290 + "epoch": 0.12, + "learning_rate": 4.412816659587151e-05, + "loss": 2.8961, + "step": 32900 }, { - "epoch": 0.96, - "learning_rate": 2.1915338120864824e-06, - "loss": 2.2774, - "step": 548300 + "epoch": 0.12, + "learning_rate": 4.4110319077925834e-05, + "loss": 2.8843, + "step": 33000 }, { - "epoch": 0.96, - "learning_rate": 2.1906618721596558e-06, - "loss": 2.3251, - "step": 548310 + "epoch": 0.12, + "learning_rate": 4.4092471559980155e-05, + "loss": 2.8937, + "step": 33100 }, { - "epoch": 0.96, - "learning_rate": 2.1897899322328287e-06, - "loss": 2.2287, - "step": 548320 + "epoch": 0.12, + "learning_rate": 4.4074624042034476e-05, + "loss": 2.8943, + "step": 33200 }, { - "epoch": 0.96, - "learning_rate": 2.1889179923060025e-06, - "loss": 2.2735, - "step": 548330 + "epoch": 0.12, + "learning_rate": 4.40567765240888e-05, + "loss": 2.8934, + "step": 33300 }, { - "epoch": 0.96, - "learning_rate": 2.1880460523791754e-06, - "loss": 2.3578, - "step": 548340 + "epoch": 0.12, + "learning_rate": 4.403892900614312e-05, + "loss": 2.8827, + "step": 33400 }, { - "epoch": 0.96, - "learning_rate": 2.1871741124523487e-06, - "loss": 2.3219, - "step": 548350 + "epoch": 0.12, + "learning_rate": 4.402108148819744e-05, + "loss": 2.8842, + "step": 33500 }, { - "epoch": 0.96, - "learning_rate": 2.1863021725255217e-06, - "loss": 2.285, - "step": 548360 + "epoch": 0.12, + "learning_rate": 4.400323397025176e-05, + "loss": 2.897, + "step": 33600 }, { - "epoch": 0.96, - "learning_rate": 2.185430232598695e-06, - "loss": 2.2455, - "step": 548370 + "epoch": 0.12, + "learning_rate": 4.398538645230608e-05, + "loss": 2.8934, + "step": 33700 }, { - "epoch": 0.96, - "learning_rate": 2.184558292671868e-06, - "loss": 2.2134, - "step": 548380 + "epoch": 0.12, + "learning_rate": 4.3967538934360404e-05, + "loss": 2.8872, + "step": 33800 }, { - "epoch": 0.96, - "learning_rate": 2.1836863527450413e-06, - "loss": 2.3495, - "step": 548390 + "epoch": 0.12, + "learning_rate": 4.3949691416414725e-05, + "loss": 2.8913, + "step": 33900 }, { - "epoch": 0.96, - "learning_rate": 2.1828144128182146e-06, - "loss": 2.2239, - "step": 548400 + "epoch": 0.12, + "learning_rate": 4.3931843898469046e-05, + "loss": 2.8967, + "step": 34000 }, { - "epoch": 0.96, - "learning_rate": 2.181942472891388e-06, - "loss": 2.2084, - "step": 548410 + "epoch": 0.12, + "learning_rate": 4.391399638052337e-05, + "loss": 2.8891, + "step": 34100 }, { - "epoch": 0.96, - "learning_rate": 2.181070532964561e-06, - "loss": 2.2495, - "step": 548420 + "epoch": 0.12, + "learning_rate": 4.389614886257769e-05, + "loss": 2.8905, + "step": 34200 }, { - "epoch": 0.96, - "learning_rate": 2.1801985930377342e-06, - "loss": 2.2749, - "step": 548430 + "epoch": 0.12, + "learning_rate": 4.3878301344632e-05, + "loss": 2.8873, + "step": 34300 }, { - "epoch": 0.96, - "learning_rate": 2.179326653110907e-06, - "loss": 2.2085, - "step": 548440 + "epoch": 0.12, + "learning_rate": 4.3860453826686324e-05, + "loss": 2.8666, + "step": 34400 }, { - "epoch": 0.96, - "learning_rate": 2.1784547131840805e-06, - "loss": 2.2028, - "step": 548450 + "epoch": 0.12, + "learning_rate": 4.3842606308740645e-05, + "loss": 2.8838, + "step": 34500 }, { - "epoch": 0.96, - "learning_rate": 2.1775827732572534e-06, - "loss": 2.2778, - "step": 548460 + "epoch": 0.12, + "learning_rate": 4.3824758790794967e-05, + "loss": 2.8856, + "step": 34600 }, { - "epoch": 0.96, - "learning_rate": 2.176710833330427e-06, - "loss": 2.3775, - "step": 548470 + "epoch": 0.12, + "learning_rate": 4.380691127284929e-05, + "loss": 2.8823, + "step": 34700 }, { - "epoch": 0.96, - "learning_rate": 2.1758388934036e-06, - "loss": 2.1392, - "step": 548480 + "epoch": 0.12, + "learning_rate": 4.378906375490361e-05, + "loss": 2.8862, + "step": 34800 }, { - "epoch": 0.96, - "learning_rate": 2.1749669534767735e-06, - "loss": 2.2315, - "step": 548490 + "epoch": 0.12, + "learning_rate": 4.377121623695793e-05, + "loss": 2.8845, + "step": 34900 }, { - "epoch": 0.96, - "learning_rate": 2.1740950135499464e-06, - "loss": 2.3304, - "step": 548500 + "epoch": 0.12, + "learning_rate": 4.375336871901225e-05, + "loss": 2.8771, + "step": 35000 }, { - "epoch": 0.96, - "learning_rate": 2.1732230736231197e-06, - "loss": 2.2791, - "step": 548510 + "epoch": 0.13, + "learning_rate": 4.373552120106657e-05, + "loss": 2.8801, + "step": 35100 }, { - "epoch": 0.96, - "learning_rate": 2.1723511336962927e-06, - "loss": 2.2093, - "step": 548520 + "epoch": 0.13, + "learning_rate": 4.3717673683120894e-05, + "loss": 2.8853, + "step": 35200 }, { - "epoch": 0.96, - "learning_rate": 2.1714791937694664e-06, - "loss": 2.2383, - "step": 548530 + "epoch": 0.13, + "learning_rate": 4.369982616517521e-05, + "loss": 2.8846, + "step": 35300 }, { - "epoch": 0.96, - "learning_rate": 2.1706072538426394e-06, - "loss": 2.4283, - "step": 548540 + "epoch": 0.13, + "learning_rate": 4.368197864722953e-05, + "loss": 2.8738, + "step": 35400 }, { - "epoch": 0.96, - "learning_rate": 2.1697353139158127e-06, - "loss": 2.2694, - "step": 548550 + "epoch": 0.13, + "learning_rate": 4.366413112928385e-05, + "loss": 2.8921, + "step": 35500 }, { - "epoch": 0.96, - "learning_rate": 2.1688633739889856e-06, - "loss": 2.1701, - "step": 548560 + "epoch": 0.13, + "learning_rate": 4.364628361133817e-05, + "loss": 2.8795, + "step": 35600 }, { - "epoch": 0.96, - "learning_rate": 2.167991434062159e-06, - "loss": 2.2412, - "step": 548570 + "epoch": 0.13, + "learning_rate": 4.362843609339249e-05, + "loss": 2.8811, + "step": 35700 }, { - "epoch": 0.96, - "learning_rate": 2.167119494135332e-06, - "loss": 2.2505, - "step": 548580 + "epoch": 0.13, + "learning_rate": 4.3610588575446814e-05, + "loss": 2.8788, + "step": 35800 }, { - "epoch": 0.96, - "learning_rate": 2.1662475542085052e-06, - "loss": 2.2266, - "step": 548590 + "epoch": 0.13, + "learning_rate": 4.3592741057501136e-05, + "loss": 2.8811, + "step": 35900 }, { - "epoch": 0.96, - "learning_rate": 2.1653756142816786e-06, - "loss": 2.3442, - "step": 548600 + "epoch": 0.13, + "learning_rate": 4.357489353955546e-05, + "loss": 2.8831, + "step": 36000 }, { - "epoch": 0.96, - "learning_rate": 2.164503674354852e-06, - "loss": 2.3059, - "step": 548610 + "epoch": 0.13, + "learning_rate": 4.355704602160978e-05, + "loss": 2.8804, + "step": 36100 }, { - "epoch": 0.96, - "learning_rate": 2.163631734428025e-06, - "loss": 2.3164, - "step": 548620 + "epoch": 0.13, + "learning_rate": 4.35391985036641e-05, + "loss": 2.8745, + "step": 36200 }, { - "epoch": 0.96, - "learning_rate": 2.162759794501198e-06, - "loss": 2.4074, - "step": 548630 + "epoch": 0.13, + "learning_rate": 4.352135098571842e-05, + "loss": 2.8806, + "step": 36300 }, { - "epoch": 0.96, - "learning_rate": 2.161887854574371e-06, - "loss": 2.3199, - "step": 548640 + "epoch": 0.13, + "learning_rate": 4.3503503467772735e-05, + "loss": 2.889, + "step": 36400 }, { - "epoch": 0.96, - "learning_rate": 2.1610159146475445e-06, - "loss": 2.1971, - "step": 548650 + "epoch": 0.13, + "learning_rate": 4.3485655949827056e-05, + "loss": 2.8757, + "step": 36500 }, { - "epoch": 0.96, - "learning_rate": 2.160143974720718e-06, - "loss": 2.2494, - "step": 548660 + "epoch": 0.13, + "learning_rate": 4.346780843188138e-05, + "loss": 2.8937, + "step": 36600 }, { - "epoch": 0.96, - "learning_rate": 2.159272034793891e-06, - "loss": 2.3235, - "step": 548670 + "epoch": 0.13, + "learning_rate": 4.34499609139357e-05, + "loss": 2.8649, + "step": 36700 }, { - "epoch": 0.96, - "learning_rate": 2.158400094867064e-06, - "loss": 2.3405, - "step": 548680 + "epoch": 0.13, + "learning_rate": 4.343211339599002e-05, + "loss": 2.8782, + "step": 36800 }, { - "epoch": 0.96, - "learning_rate": 2.1575281549402374e-06, - "loss": 2.2133, - "step": 548690 + "epoch": 0.13, + "learning_rate": 4.341426587804434e-05, + "loss": 2.8843, + "step": 36900 }, { - "epoch": 0.96, - "learning_rate": 2.1566562150134104e-06, - "loss": 2.3514, - "step": 548700 + "epoch": 0.13, + "learning_rate": 4.339641836009866e-05, + "loss": 2.8823, + "step": 37000 }, { - "epoch": 0.96, - "learning_rate": 2.1557842750865837e-06, - "loss": 2.2337, - "step": 548710 + "epoch": 0.13, + "learning_rate": 4.3378570842152983e-05, + "loss": 2.8677, + "step": 37100 }, { - "epoch": 0.96, - "learning_rate": 2.1549123351597566e-06, - "loss": 2.2102, - "step": 548720 + "epoch": 0.13, + "learning_rate": 4.3360723324207305e-05, + "loss": 2.8788, + "step": 37200 }, { - "epoch": 0.96, - "learning_rate": 2.1540403952329304e-06, - "loss": 2.2615, - "step": 548730 + "epoch": 0.13, + "learning_rate": 4.3342875806261626e-05, + "loss": 2.8773, + "step": 37300 }, { - "epoch": 0.96, - "learning_rate": 2.1531684553061033e-06, - "loss": 2.2055, - "step": 548740 + "epoch": 0.13, + "learning_rate": 4.332502828831595e-05, + "loss": 2.8774, + "step": 37400 }, { - "epoch": 0.96, - "learning_rate": 2.1522965153792767e-06, - "loss": 2.2878, - "step": 548750 + "epoch": 0.13, + "learning_rate": 4.330718077037026e-05, + "loss": 2.8756, + "step": 37500 }, { - "epoch": 0.96, - "learning_rate": 2.1514245754524496e-06, - "loss": 2.3249, - "step": 548760 + "epoch": 0.13, + "learning_rate": 4.328933325242458e-05, + "loss": 2.8975, + "step": 37600 }, { - "epoch": 0.96, - "learning_rate": 2.150552635525623e-06, - "loss": 2.3096, - "step": 548770 + "epoch": 0.13, + "learning_rate": 4.3271485734478904e-05, + "loss": 2.8696, + "step": 37700 }, { - "epoch": 0.96, - "learning_rate": 2.149680695598796e-06, - "loss": 2.3044, - "step": 548780 + "epoch": 0.13, + "learning_rate": 4.3253638216533225e-05, + "loss": 2.8816, + "step": 37800 }, { - "epoch": 0.96, - "learning_rate": 2.148808755671969e-06, - "loss": 2.2532, - "step": 548790 + "epoch": 0.14, + "learning_rate": 4.3235790698587546e-05, + "loss": 2.8705, + "step": 37900 }, { - "epoch": 0.96, - "learning_rate": 2.1479368157451425e-06, - "loss": 2.2492, - "step": 548800 + "epoch": 0.14, + "learning_rate": 4.321794318064187e-05, + "loss": 2.8702, + "step": 38000 }, { - "epoch": 0.96, - "learning_rate": 2.147064875818316e-06, - "loss": 2.161, - "step": 548810 + "epoch": 0.14, + "learning_rate": 4.320009566269619e-05, + "loss": 2.8791, + "step": 38100 }, { - "epoch": 0.96, - "learning_rate": 2.146192935891489e-06, - "loss": 2.2425, - "step": 548820 + "epoch": 0.14, + "learning_rate": 4.318224814475051e-05, + "loss": 2.8812, + "step": 38200 }, { - "epoch": 0.96, - "learning_rate": 2.145320995964662e-06, - "loss": 2.2544, - "step": 548830 + "epoch": 0.14, + "learning_rate": 4.316440062680484e-05, + "loss": 2.868, + "step": 38300 }, { - "epoch": 0.96, - "learning_rate": 2.144449056037835e-06, - "loss": 2.2085, - "step": 548840 + "epoch": 0.14, + "learning_rate": 4.314655310885915e-05, + "loss": 2.881, + "step": 38400 }, { - "epoch": 0.96, - "learning_rate": 2.1435771161110084e-06, - "loss": 2.1969, - "step": 548850 + "epoch": 0.14, + "learning_rate": 4.3128705590913474e-05, + "loss": 2.8783, + "step": 38500 }, { - "epoch": 0.96, - "learning_rate": 2.1427051761841818e-06, - "loss": 2.2056, - "step": 548860 + "epoch": 0.14, + "learning_rate": 4.3110858072967795e-05, + "loss": 2.8848, + "step": 38600 }, { - "epoch": 0.96, - "learning_rate": 2.141833236257355e-06, - "loss": 2.1675, - "step": 548870 + "epoch": 0.14, + "learning_rate": 4.3093010555022116e-05, + "loss": 2.8771, + "step": 38700 }, { - "epoch": 0.96, - "learning_rate": 2.140961296330528e-06, - "loss": 2.3683, - "step": 548880 + "epoch": 0.14, + "learning_rate": 4.307516303707644e-05, + "loss": 2.8584, + "step": 38800 }, { - "epoch": 0.96, - "learning_rate": 2.1400893564037014e-06, - "loss": 2.2568, - "step": 548890 + "epoch": 0.14, + "learning_rate": 4.305731551913076e-05, + "loss": 2.8824, + "step": 38900 }, { - "epoch": 0.96, - "learning_rate": 2.1392174164768743e-06, - "loss": 2.2644, - "step": 548900 + "epoch": 0.14, + "learning_rate": 4.303946800118508e-05, + "loss": 2.879, + "step": 39000 }, { - "epoch": 0.96, - "learning_rate": 2.1383454765500477e-06, - "loss": 2.2656, - "step": 548910 + "epoch": 0.14, + "learning_rate": 4.30216204832394e-05, + "loss": 2.8753, + "step": 39100 }, { - "epoch": 0.96, - "learning_rate": 2.1374735366232206e-06, - "loss": 2.2273, - "step": 548920 + "epoch": 0.14, + "learning_rate": 4.300377296529372e-05, + "loss": 2.8864, + "step": 39200 }, { - "epoch": 0.96, - "learning_rate": 2.1366015966963944e-06, - "loss": 2.2378, - "step": 548930 + "epoch": 0.14, + "learning_rate": 4.298592544734804e-05, + "loss": 2.8741, + "step": 39300 }, { - "epoch": 0.96, - "learning_rate": 2.1357296567695673e-06, - "loss": 2.2276, - "step": 548940 + "epoch": 0.14, + "learning_rate": 4.2968077929402365e-05, + "loss": 2.8719, + "step": 39400 }, { - "epoch": 0.96, - "learning_rate": 2.1348577168427406e-06, - "loss": 2.3637, - "step": 548950 + "epoch": 0.14, + "learning_rate": 4.295023041145668e-05, + "loss": 2.8661, + "step": 39500 }, { - "epoch": 0.96, - "learning_rate": 2.1339857769159136e-06, - "loss": 2.2605, - "step": 548960 + "epoch": 0.14, + "learning_rate": 4.2932382893511e-05, + "loss": 2.8768, + "step": 39600 }, { - "epoch": 0.96, - "learning_rate": 2.133113836989087e-06, - "loss": 2.232, - "step": 548970 + "epoch": 0.14, + "learning_rate": 4.291453537556532e-05, + "loss": 2.858, + "step": 39700 }, { - "epoch": 0.96, - "learning_rate": 2.13224189706226e-06, - "loss": 2.2656, - "step": 548980 + "epoch": 0.14, + "learning_rate": 4.289668785761964e-05, + "loss": 2.8816, + "step": 39800 }, { - "epoch": 0.96, - "learning_rate": 2.131369957135433e-06, - "loss": 2.3304, - "step": 548990 + "epoch": 0.14, + "learning_rate": 4.2878840339673964e-05, + "loss": 2.8814, + "step": 39900 }, { - "epoch": 0.96, - "learning_rate": 2.1304980172086065e-06, - "loss": 2.1228, - "step": 549000 + "epoch": 0.14, + "learning_rate": 4.2860992821728285e-05, + "loss": 2.8632, + "step": 40000 }, { - "epoch": 0.96, - "learning_rate": 2.12962607728178e-06, - "loss": 2.3305, - "step": 549010 + "epoch": 0.14, + "learning_rate": 4.2843145303782606e-05, + "loss": 2.8693, + "step": 40100 }, { - "epoch": 0.96, - "learning_rate": 2.1287541373549528e-06, - "loss": 2.308, - "step": 549020 + "epoch": 0.14, + "learning_rate": 4.282529778583693e-05, + "loss": 2.8715, + "step": 40200 }, { - "epoch": 0.96, - "learning_rate": 2.127882197428126e-06, - "loss": 2.2958, - "step": 549030 + "epoch": 0.14, + "learning_rate": 4.280745026789125e-05, + "loss": 2.8737, + "step": 40300 }, { - "epoch": 0.96, - "learning_rate": 2.127010257501299e-06, - "loss": 2.2719, - "step": 549040 + "epoch": 0.14, + "learning_rate": 4.278960274994557e-05, + "loss": 2.8663, + "step": 40400 }, { - "epoch": 0.96, - "learning_rate": 2.1261383175744724e-06, - "loss": 2.3376, - "step": 549050 + "epoch": 0.14, + "learning_rate": 4.277175523199989e-05, + "loss": 2.8713, + "step": 40500 }, { - "epoch": 0.96, - "learning_rate": 2.1252663776476457e-06, - "loss": 2.2011, - "step": 549060 + "epoch": 0.14, + "learning_rate": 4.2753907714054206e-05, + "loss": 2.869, + "step": 40600 }, { - "epoch": 0.96, - "learning_rate": 2.124394437720819e-06, - "loss": 2.2153, - "step": 549070 + "epoch": 0.15, + "learning_rate": 4.273606019610853e-05, + "loss": 2.8638, + "step": 40700 }, { - "epoch": 0.96, - "learning_rate": 2.123522497793992e-06, - "loss": 2.2211, - "step": 549080 + "epoch": 0.15, + "learning_rate": 4.271821267816285e-05, + "loss": 2.8783, + "step": 40800 }, { - "epoch": 0.96, - "learning_rate": 2.1226505578671654e-06, - "loss": 2.2413, - "step": 549090 + "epoch": 0.15, + "learning_rate": 4.270036516021717e-05, + "loss": 2.8704, + "step": 40900 }, { - "epoch": 0.96, - "learning_rate": 2.1217786179403383e-06, - "loss": 2.2932, - "step": 549100 + "epoch": 0.15, + "learning_rate": 4.268251764227149e-05, + "loss": 2.8665, + "step": 41000 }, { - "epoch": 0.96, - "learning_rate": 2.1209066780135116e-06, - "loss": 2.2626, - "step": 549110 + "epoch": 0.15, + "learning_rate": 4.266467012432581e-05, + "loss": 2.8649, + "step": 41100 }, { - "epoch": 0.96, - "learning_rate": 2.1200347380866846e-06, - "loss": 2.2682, - "step": 549120 + "epoch": 0.15, + "learning_rate": 4.264682260638013e-05, + "loss": 2.8722, + "step": 41200 }, { - "epoch": 0.96, - "learning_rate": 2.1191627981598583e-06, - "loss": 2.3554, - "step": 549130 + "epoch": 0.15, + "learning_rate": 4.2628975088434454e-05, + "loss": 2.8696, + "step": 41300 }, { - "epoch": 0.96, - "learning_rate": 2.1182908582330312e-06, - "loss": 2.2765, - "step": 549140 + "epoch": 0.15, + "learning_rate": 4.2611127570488775e-05, + "loss": 2.8669, + "step": 41400 }, { - "epoch": 0.96, - "learning_rate": 2.1174189183062046e-06, - "loss": 2.3049, - "step": 549150 + "epoch": 0.15, + "learning_rate": 4.2593280052543097e-05, + "loss": 2.8631, + "step": 41500 }, { - "epoch": 0.96, - "learning_rate": 2.1165469783793775e-06, - "loss": 2.3702, - "step": 549160 + "epoch": 0.15, + "learning_rate": 4.257543253459742e-05, + "loss": 2.8778, + "step": 41600 }, { - "epoch": 0.96, - "learning_rate": 2.115675038452551e-06, - "loss": 2.1818, - "step": 549170 + "epoch": 0.15, + "learning_rate": 4.255758501665173e-05, + "loss": 2.8643, + "step": 41700 }, { - "epoch": 0.96, - "learning_rate": 2.1148030985257238e-06, - "loss": 2.2866, - "step": 549180 + "epoch": 0.15, + "learning_rate": 4.2539737498706053e-05, + "loss": 2.854, + "step": 41800 }, { - "epoch": 0.96, - "learning_rate": 2.113931158598897e-06, - "loss": 2.3641, - "step": 549190 + "epoch": 0.15, + "learning_rate": 4.2521889980760375e-05, + "loss": 2.8628, + "step": 41900 }, { - "epoch": 0.96, - "learning_rate": 2.1130592186720705e-06, - "loss": 2.2369, - "step": 549200 + "epoch": 0.15, + "learning_rate": 4.2504042462814696e-05, + "loss": 2.8594, + "step": 42000 }, { - "epoch": 0.96, - "learning_rate": 2.112187278745244e-06, - "loss": 2.3028, - "step": 549210 + "epoch": 0.15, + "learning_rate": 4.248619494486902e-05, + "loss": 2.8626, + "step": 42100 }, { - "epoch": 0.96, - "learning_rate": 2.1113153388184167e-06, - "loss": 2.3245, - "step": 549220 + "epoch": 0.15, + "learning_rate": 4.246834742692334e-05, + "loss": 2.8617, + "step": 42200 }, { - "epoch": 0.96, - "learning_rate": 2.11044339889159e-06, - "loss": 2.1161, - "step": 549230 + "epoch": 0.15, + "learning_rate": 4.245049990897766e-05, + "loss": 2.8608, + "step": 42300 }, { - "epoch": 0.96, - "learning_rate": 2.109571458964763e-06, - "loss": 2.3191, - "step": 549240 + "epoch": 0.15, + "learning_rate": 4.243265239103198e-05, + "loss": 2.8686, + "step": 42400 }, { - "epoch": 0.96, - "learning_rate": 2.1086995190379364e-06, - "loss": 2.2109, - "step": 549250 + "epoch": 0.15, + "learning_rate": 4.24148048730863e-05, + "loss": 2.8715, + "step": 42500 }, { - "epoch": 0.96, - "learning_rate": 2.1078275791111097e-06, - "loss": 2.1694, - "step": 549260 + "epoch": 0.15, + "learning_rate": 4.239695735514062e-05, + "loss": 2.8743, + "step": 42600 }, { - "epoch": 0.96, - "learning_rate": 2.106955639184283e-06, - "loss": 2.3058, - "step": 549270 + "epoch": 0.15, + "learning_rate": 4.2379109837194944e-05, + "loss": 2.8715, + "step": 42700 }, { - "epoch": 0.96, - "learning_rate": 2.106083699257456e-06, - "loss": 2.3565, - "step": 549280 + "epoch": 0.15, + "learning_rate": 4.236126231924926e-05, + "loss": 2.8652, + "step": 42800 }, { - "epoch": 0.96, - "learning_rate": 2.1052117593306293e-06, - "loss": 2.2459, - "step": 549290 + "epoch": 0.15, + "learning_rate": 4.234341480130358e-05, + "loss": 2.8489, + "step": 42900 }, { - "epoch": 0.96, - "learning_rate": 2.1043398194038022e-06, - "loss": 2.3758, - "step": 549300 + "epoch": 0.15, + "learning_rate": 4.23255672833579e-05, + "loss": 2.8605, + "step": 43000 }, { - "epoch": 0.96, - "learning_rate": 2.1034678794769756e-06, - "loss": 2.252, - "step": 549310 + "epoch": 0.15, + "learning_rate": 4.230771976541222e-05, + "loss": 2.8606, + "step": 43100 }, { - "epoch": 0.96, - "learning_rate": 2.1025959395501485e-06, - "loss": 2.2538, - "step": 549320 + "epoch": 0.15, + "learning_rate": 4.2289872247466544e-05, + "loss": 2.8656, + "step": 43200 }, { - "epoch": 0.96, - "learning_rate": 2.1017239996233223e-06, - "loss": 2.2192, - "step": 549330 + "epoch": 0.15, + "learning_rate": 4.2272024729520865e-05, + "loss": 2.8607, + "step": 43300 }, { - "epoch": 0.96, - "learning_rate": 2.100852059696495e-06, - "loss": 2.2591, - "step": 549340 + "epoch": 0.15, + "learning_rate": 4.2254177211575186e-05, + "loss": 2.8614, + "step": 43400 }, { - "epoch": 0.96, - "learning_rate": 2.0999801197696686e-06, - "loss": 2.2811, - "step": 549350 + "epoch": 0.16, + "learning_rate": 4.2236329693629514e-05, + "loss": 2.858, + "step": 43500 }, { - "epoch": 0.96, - "learning_rate": 2.0991081798428415e-06, - "loss": 2.2203, - "step": 549360 + "epoch": 0.16, + "learning_rate": 4.2218482175683835e-05, + "loss": 2.8582, + "step": 43600 }, { - "epoch": 0.96, - "learning_rate": 2.098236239916015e-06, - "loss": 2.2842, - "step": 549370 + "epoch": 0.16, + "learning_rate": 4.220063465773815e-05, + "loss": 2.8664, + "step": 43700 }, { - "epoch": 0.96, - "learning_rate": 2.0973642999891877e-06, - "loss": 2.314, - "step": 549380 + "epoch": 0.16, + "learning_rate": 4.218278713979247e-05, + "loss": 2.867, + "step": 43800 }, { - "epoch": 0.96, - "learning_rate": 2.096492360062361e-06, - "loss": 2.2475, - "step": 549390 + "epoch": 0.16, + "learning_rate": 4.216493962184679e-05, + "loss": 2.8731, + "step": 43900 }, { - "epoch": 0.96, - "learning_rate": 2.0956204201355344e-06, - "loss": 2.3045, - "step": 549400 + "epoch": 0.16, + "learning_rate": 4.214709210390111e-05, + "loss": 2.8612, + "step": 44000 }, { - "epoch": 0.96, - "learning_rate": 2.0947484802087078e-06, - "loss": 2.3666, - "step": 549410 + "epoch": 0.16, + "learning_rate": 4.2129244585955435e-05, + "loss": 2.8553, + "step": 44100 }, { - "epoch": 0.96, - "learning_rate": 2.0938765402818807e-06, - "loss": 2.2596, - "step": 549420 + "epoch": 0.16, + "learning_rate": 4.2111397068009756e-05, + "loss": 2.8642, + "step": 44200 }, { - "epoch": 0.96, - "learning_rate": 2.093004600355054e-06, - "loss": 2.2387, - "step": 549430 + "epoch": 0.16, + "learning_rate": 4.209354955006408e-05, + "loss": 2.8693, + "step": 44300 }, { - "epoch": 0.96, - "learning_rate": 2.092132660428227e-06, - "loss": 2.224, - "step": 549440 + "epoch": 0.16, + "learning_rate": 4.20757020321184e-05, + "loss": 2.8573, + "step": 44400 }, { - "epoch": 0.96, - "learning_rate": 2.0912607205014003e-06, - "loss": 2.3323, - "step": 549450 + "epoch": 0.16, + "learning_rate": 4.205785451417272e-05, + "loss": 2.8646, + "step": 44500 }, { - "epoch": 0.96, - "learning_rate": 2.0903887805745737e-06, - "loss": 2.2351, - "step": 549460 + "epoch": 0.16, + "learning_rate": 4.204000699622704e-05, + "loss": 2.863, + "step": 44600 }, { - "epoch": 0.96, - "learning_rate": 2.089516840647747e-06, - "loss": 2.2693, - "step": 549470 + "epoch": 0.16, + "learning_rate": 4.202215947828136e-05, + "loss": 2.8674, + "step": 44700 }, { - "epoch": 0.96, - "learning_rate": 2.08864490072092e-06, - "loss": 2.193, - "step": 549480 + "epoch": 0.16, + "learning_rate": 4.2004311960335676e-05, + "loss": 2.8609, + "step": 44800 }, { - "epoch": 0.96, - "learning_rate": 2.0877729607940933e-06, - "loss": 2.3525, - "step": 549490 + "epoch": 0.16, + "learning_rate": 4.198646444239e-05, + "loss": 2.8604, + "step": 44900 }, { - "epoch": 0.96, - "learning_rate": 2.086901020867266e-06, - "loss": 2.272, - "step": 549500 + "epoch": 0.16, + "learning_rate": 4.196861692444432e-05, + "loss": 2.8587, + "step": 45000 }, { - "epoch": 0.96, - "learning_rate": 2.0860290809404396e-06, - "loss": 2.2348, - "step": 549510 + "epoch": 0.16, + "learning_rate": 4.195076940649864e-05, + "loss": 2.8611, + "step": 45100 }, { - "epoch": 0.96, - "learning_rate": 2.0851571410136125e-06, - "loss": 2.2678, - "step": 549520 + "epoch": 0.16, + "learning_rate": 4.193292188855296e-05, + "loss": 2.8605, + "step": 45200 }, { - "epoch": 0.96, - "learning_rate": 2.0842852010867862e-06, - "loss": 2.1919, - "step": 549530 + "epoch": 0.16, + "learning_rate": 4.191507437060728e-05, + "loss": 2.8599, + "step": 45300 }, { - "epoch": 0.96, - "learning_rate": 2.083413261159959e-06, - "loss": 2.2756, - "step": 549540 + "epoch": 0.16, + "learning_rate": 4.1897226852661604e-05, + "loss": 2.8597, + "step": 45400 }, { - "epoch": 0.96, - "learning_rate": 2.0825413212331325e-06, - "loss": 2.3498, - "step": 549550 + "epoch": 0.16, + "learning_rate": 4.1879379334715925e-05, + "loss": 2.8613, + "step": 45500 }, { - "epoch": 0.96, - "learning_rate": 2.0816693813063054e-06, - "loss": 2.199, - "step": 549560 + "epoch": 0.16, + "learning_rate": 4.1861531816770246e-05, + "loss": 2.8523, + "step": 45600 }, { - "epoch": 0.96, - "learning_rate": 2.0807974413794788e-06, - "loss": 2.2142, - "step": 549570 + "epoch": 0.16, + "learning_rate": 4.184368429882457e-05, + "loss": 2.8463, + "step": 45700 }, { - "epoch": 0.96, - "learning_rate": 2.0799255014526517e-06, - "loss": 2.0132, - "step": 549580 + "epoch": 0.16, + "learning_rate": 4.182583678087889e-05, + "loss": 2.8558, + "step": 45800 }, { - "epoch": 0.96, - "learning_rate": 2.079053561525825e-06, - "loss": 2.2042, - "step": 549590 + "epoch": 0.16, + "learning_rate": 4.18079892629332e-05, + "loss": 2.854, + "step": 45900 }, { - "epoch": 0.96, - "learning_rate": 2.0781816215989984e-06, - "loss": 2.2316, - "step": 549600 + "epoch": 0.16, + "learning_rate": 4.1790141744987524e-05, + "loss": 2.8539, + "step": 46000 }, { - "epoch": 0.96, - "learning_rate": 2.0773096816721717e-06, - "loss": 2.297, - "step": 549610 + "epoch": 0.16, + "learning_rate": 4.1772294227041845e-05, + "loss": 2.8612, + "step": 46100 }, { - "epoch": 0.96, - "learning_rate": 2.0764377417453447e-06, - "loss": 2.1572, - "step": 549620 + "epoch": 0.16, + "learning_rate": 4.1754446709096167e-05, + "loss": 2.8571, + "step": 46200 }, { - "epoch": 0.96, - "learning_rate": 2.075565801818518e-06, - "loss": 2.1747, - "step": 549630 + "epoch": 0.17, + "learning_rate": 4.173659919115049e-05, + "loss": 2.8656, + "step": 46300 }, { - "epoch": 0.96, - "learning_rate": 2.074693861891691e-06, - "loss": 2.2471, - "step": 549640 + "epoch": 0.17, + "learning_rate": 4.171875167320481e-05, + "loss": 2.8571, + "step": 46400 }, { - "epoch": 0.96, - "learning_rate": 2.0738219219648643e-06, - "loss": 2.2145, - "step": 549650 + "epoch": 0.17, + "learning_rate": 4.170090415525913e-05, + "loss": 2.8538, + "step": 46500 }, { - "epoch": 0.96, - "learning_rate": 2.0729499820380376e-06, - "loss": 2.2956, - "step": 549660 + "epoch": 0.17, + "learning_rate": 4.168305663731345e-05, + "loss": 2.8643, + "step": 46600 }, { - "epoch": 0.96, - "learning_rate": 2.072078042111211e-06, - "loss": 2.2143, - "step": 549670 + "epoch": 0.17, + "learning_rate": 4.166520911936777e-05, + "loss": 2.8593, + "step": 46700 }, { - "epoch": 0.96, - "learning_rate": 2.071206102184384e-06, - "loss": 2.211, - "step": 549680 + "epoch": 0.17, + "learning_rate": 4.1647361601422094e-05, + "loss": 2.8608, + "step": 46800 }, { - "epoch": 0.96, - "learning_rate": 2.0703341622575572e-06, - "loss": 2.2311, - "step": 549690 + "epoch": 0.17, + "learning_rate": 4.1629514083476415e-05, + "loss": 2.8656, + "step": 46900 }, { - "epoch": 0.96, - "learning_rate": 2.06946222233073e-06, - "loss": 2.2775, - "step": 549700 + "epoch": 0.17, + "learning_rate": 4.161166656553073e-05, + "loss": 2.8556, + "step": 47000 }, { - "epoch": 0.96, - "learning_rate": 2.0685902824039035e-06, - "loss": 2.313, - "step": 549710 + "epoch": 0.17, + "learning_rate": 4.159381904758505e-05, + "loss": 2.8533, + "step": 47100 }, { - "epoch": 0.96, - "learning_rate": 2.0677183424770764e-06, - "loss": 2.2429, - "step": 549720 + "epoch": 0.17, + "learning_rate": 4.157597152963937e-05, + "loss": 2.8573, + "step": 47200 }, { - "epoch": 0.96, - "learning_rate": 2.06684640255025e-06, - "loss": 2.2047, - "step": 549730 + "epoch": 0.17, + "learning_rate": 4.155812401169369e-05, + "loss": 2.8553, + "step": 47300 }, { - "epoch": 0.96, - "learning_rate": 2.065974462623423e-06, - "loss": 2.2742, - "step": 549740 + "epoch": 0.17, + "learning_rate": 4.1540276493748014e-05, + "loss": 2.8608, + "step": 47400 }, { - "epoch": 0.96, - "learning_rate": 2.0651025226965965e-06, - "loss": 2.1623, - "step": 549750 + "epoch": 0.17, + "learning_rate": 4.1522428975802336e-05, + "loss": 2.8571, + "step": 47500 }, { - "epoch": 0.96, - "learning_rate": 2.0642305827697694e-06, - "loss": 2.2385, - "step": 549760 + "epoch": 0.17, + "learning_rate": 4.150458145785666e-05, + "loss": 2.8527, + "step": 47600 }, { - "epoch": 0.96, - "learning_rate": 2.0633586428429427e-06, - "loss": 2.2121, - "step": 549770 + "epoch": 0.17, + "learning_rate": 4.148673393991098e-05, + "loss": 2.8564, + "step": 47700 }, { - "epoch": 0.96, - "learning_rate": 2.0624867029161157e-06, - "loss": 2.2441, - "step": 549780 + "epoch": 0.17, + "learning_rate": 4.14688864219653e-05, + "loss": 2.8488, + "step": 47800 }, { - "epoch": 0.96, - "learning_rate": 2.061614762989289e-06, - "loss": 2.2667, - "step": 549790 + "epoch": 0.17, + "learning_rate": 4.145103890401962e-05, + "loss": 2.8546, + "step": 47900 }, { - "epoch": 0.96, - "learning_rate": 2.0607428230624624e-06, - "loss": 2.3278, - "step": 549800 + "epoch": 0.17, + "learning_rate": 4.143319138607394e-05, + "loss": 2.8542, + "step": 48000 }, { - "epoch": 0.96, - "learning_rate": 2.0598708831356357e-06, - "loss": 2.1885, - "step": 549810 + "epoch": 0.17, + "learning_rate": 4.1415343868128256e-05, + "loss": 2.8474, + "step": 48100 }, { - "epoch": 0.96, - "learning_rate": 2.0589989432088086e-06, - "loss": 2.1507, - "step": 549820 + "epoch": 0.17, + "learning_rate": 4.139749635018258e-05, + "loss": 2.8504, + "step": 48200 }, { - "epoch": 0.96, - "learning_rate": 2.058127003281982e-06, - "loss": 2.2038, - "step": 549830 + "epoch": 0.17, + "learning_rate": 4.13796488322369e-05, + "loss": 2.858, + "step": 48300 }, { - "epoch": 0.96, - "learning_rate": 2.057255063355155e-06, - "loss": 2.1565, - "step": 549840 + "epoch": 0.17, + "learning_rate": 4.136180131429122e-05, + "loss": 2.847, + "step": 48400 }, { - "epoch": 0.96, - "learning_rate": 2.0563831234283283e-06, - "loss": 2.4138, - "step": 549850 + "epoch": 0.17, + "learning_rate": 4.134395379634554e-05, + "loss": 2.8431, + "step": 48500 }, { - "epoch": 0.96, - "learning_rate": 2.0555111835015016e-06, - "loss": 2.2313, - "step": 549860 + "epoch": 0.17, + "learning_rate": 4.132610627839987e-05, + "loss": 2.8534, + "step": 48600 }, { - "epoch": 0.96, - "learning_rate": 2.054639243574675e-06, - "loss": 2.3024, - "step": 549870 + "epoch": 0.17, + "learning_rate": 4.130825876045419e-05, + "loss": 2.8457, + "step": 48700 }, { - "epoch": 0.96, - "learning_rate": 2.053767303647848e-06, - "loss": 2.196, - "step": 549880 + "epoch": 0.17, + "learning_rate": 4.129041124250851e-05, + "loss": 2.8611, + "step": 48800 }, { - "epoch": 0.96, - "learning_rate": 2.0528953637210212e-06, - "loss": 2.2501, - "step": 549890 + "epoch": 0.17, + "learning_rate": 4.127256372456283e-05, + "loss": 2.8424, + "step": 48900 }, { - "epoch": 0.96, - "learning_rate": 2.052023423794194e-06, - "loss": 2.2949, - "step": 549900 + "epoch": 0.17, + "learning_rate": 4.125471620661715e-05, + "loss": 2.8518, + "step": 49000 }, { - "epoch": 0.96, - "learning_rate": 2.0511514838673675e-06, - "loss": 2.2572, - "step": 549910 + "epoch": 0.18, + "learning_rate": 4.123686868867147e-05, + "loss": 2.8601, + "step": 49100 }, { - "epoch": 0.96, - "learning_rate": 2.0502795439405404e-06, - "loss": 2.3009, - "step": 549920 + "epoch": 0.18, + "learning_rate": 4.121902117072579e-05, + "loss": 2.8475, + "step": 49200 }, { - "epoch": 0.96, - "learning_rate": 2.049407604013714e-06, - "loss": 2.1467, - "step": 549930 + "epoch": 0.18, + "learning_rate": 4.120117365278011e-05, + "loss": 2.8561, + "step": 49300 }, { - "epoch": 0.96, - "learning_rate": 2.048535664086887e-06, - "loss": 2.2156, - "step": 549940 + "epoch": 0.18, + "learning_rate": 4.118332613483443e-05, + "loss": 2.8666, + "step": 49400 }, { - "epoch": 0.96, - "learning_rate": 2.0476637241600604e-06, - "loss": 2.2554, - "step": 549950 + "epoch": 0.18, + "learning_rate": 4.116547861688875e-05, + "loss": 2.8522, + "step": 49500 }, { - "epoch": 0.96, - "learning_rate": 2.0467917842332334e-06, - "loss": 2.4111, - "step": 549960 + "epoch": 0.18, + "learning_rate": 4.1147631098943074e-05, + "loss": 2.8481, + "step": 49600 }, { - "epoch": 0.96, - "learning_rate": 2.0459198443064067e-06, - "loss": 2.2792, - "step": 549970 + "epoch": 0.18, + "learning_rate": 4.1129783580997395e-05, + "loss": 2.8584, + "step": 49700 }, { - "epoch": 0.96, - "learning_rate": 2.0450479043795796e-06, - "loss": 2.1987, - "step": 549980 + "epoch": 0.18, + "learning_rate": 4.111193606305172e-05, + "loss": 2.8557, + "step": 49800 }, { - "epoch": 0.96, - "learning_rate": 2.0441759644527534e-06, - "loss": 2.2193, - "step": 549990 + "epoch": 0.18, + "learning_rate": 4.109408854510604e-05, + "loss": 2.8509, + "step": 49900 }, { - "epoch": 0.96, - "learning_rate": 2.0433040245259263e-06, - "loss": 2.233, - "step": 550000 + "epoch": 0.18, + "learning_rate": 4.107624102716036e-05, + "loss": 2.8536, + "step": 50000 }, { - "epoch": 0.96, - "learning_rate": 2.0424320845990997e-06, - "loss": 2.2137, - "step": 550010 + "epoch": 0.18, + "learning_rate": 4.1058393509214674e-05, + "loss": 2.843, + "step": 50100 }, { - "epoch": 0.96, - "learning_rate": 2.0415601446722726e-06, - "loss": 2.224, - "step": 550020 + "epoch": 0.18, + "learning_rate": 4.1040545991268995e-05, + "loss": 2.848, + "step": 50200 }, { - "epoch": 0.96, - "learning_rate": 2.040688204745446e-06, - "loss": 2.2596, - "step": 550030 + "epoch": 0.18, + "learning_rate": 4.1022698473323316e-05, + "loss": 2.8521, + "step": 50300 }, { - "epoch": 0.96, - "learning_rate": 2.039816264818619e-06, - "loss": 2.2274, - "step": 550040 + "epoch": 0.18, + "learning_rate": 4.100485095537764e-05, + "loss": 2.8368, + "step": 50400 }, { - "epoch": 0.96, - "learning_rate": 2.0389443248917922e-06, - "loss": 2.3068, - "step": 550050 + "epoch": 0.18, + "learning_rate": 4.098700343743196e-05, + "loss": 2.8653, + "step": 50500 }, { - "epoch": 0.96, - "learning_rate": 2.0380723849649656e-06, - "loss": 2.2634, - "step": 550060 + "epoch": 0.18, + "learning_rate": 4.096915591948628e-05, + "loss": 2.8587, + "step": 50600 }, { - "epoch": 0.96, - "learning_rate": 2.037200445038139e-06, - "loss": 2.2667, - "step": 550070 + "epoch": 0.18, + "learning_rate": 4.09513084015406e-05, + "loss": 2.8547, + "step": 50700 }, { - "epoch": 0.96, - "learning_rate": 2.036328505111312e-06, - "loss": 2.2477, - "step": 550080 + "epoch": 0.18, + "learning_rate": 4.093346088359492e-05, + "loss": 2.847, + "step": 50800 }, { - "epoch": 0.96, - "learning_rate": 2.035456565184485e-06, - "loss": 2.2404, - "step": 550090 + "epoch": 0.18, + "learning_rate": 4.091561336564924e-05, + "loss": 2.8457, + "step": 50900 }, { - "epoch": 0.96, - "learning_rate": 2.034584625257658e-06, - "loss": 2.3097, - "step": 550100 + "epoch": 0.18, + "learning_rate": 4.0897765847703565e-05, + "loss": 2.8517, + "step": 51000 }, { - "epoch": 0.96, - "learning_rate": 2.0337126853308314e-06, - "loss": 2.2108, - "step": 550110 + "epoch": 0.18, + "learning_rate": 4.0879918329757886e-05, + "loss": 2.8362, + "step": 51100 }, { - "epoch": 0.96, - "learning_rate": 2.032840745404005e-06, - "loss": 2.2717, - "step": 550120 + "epoch": 0.18, + "learning_rate": 4.08620708118122e-05, + "loss": 2.8562, + "step": 51200 }, { - "epoch": 0.96, - "learning_rate": 2.031968805477178e-06, - "loss": 2.18, - "step": 550130 + "epoch": 0.18, + "learning_rate": 4.084422329386652e-05, + "loss": 2.8518, + "step": 51300 }, { - "epoch": 0.96, - "learning_rate": 2.031096865550351e-06, - "loss": 2.2825, - "step": 550140 + "epoch": 0.18, + "learning_rate": 4.082637577592084e-05, + "loss": 2.8371, + "step": 51400 }, { - "epoch": 0.96, - "learning_rate": 2.0302249256235244e-06, - "loss": 2.2011, - "step": 550150 + "epoch": 0.18, + "learning_rate": 4.0808528257975164e-05, + "loss": 2.8484, + "step": 51500 }, { - "epoch": 0.96, - "learning_rate": 2.0293529856966973e-06, - "loss": 2.3342, - "step": 550160 + "epoch": 0.18, + "learning_rate": 4.0790680740029485e-05, + "loss": 2.8457, + "step": 51600 }, { - "epoch": 0.96, - "learning_rate": 2.0284810457698707e-06, - "loss": 2.334, - "step": 550170 + "epoch": 0.18, + "learning_rate": 4.0772833222083806e-05, + "loss": 2.843, + "step": 51700 }, { - "epoch": 0.96, - "learning_rate": 2.0276091058430436e-06, - "loss": 2.3034, - "step": 550180 + "epoch": 0.18, + "learning_rate": 4.075498570413813e-05, + "loss": 2.8378, + "step": 51800 }, { - "epoch": 0.96, - "learning_rate": 2.0267371659162174e-06, - "loss": 2.2741, - "step": 550190 + "epoch": 0.19, + "learning_rate": 4.073713818619245e-05, + "loss": 2.8577, + "step": 51900 }, { - "epoch": 0.96, - "learning_rate": 2.0258652259893903e-06, - "loss": 2.2089, - "step": 550200 + "epoch": 0.19, + "learning_rate": 4.071929066824677e-05, + "loss": 2.8458, + "step": 52000 }, { - "epoch": 0.96, - "learning_rate": 2.0249932860625636e-06, - "loss": 2.2486, - "step": 550210 + "epoch": 0.19, + "learning_rate": 4.070144315030109e-05, + "loss": 2.8408, + "step": 52100 }, { - "epoch": 0.96, - "learning_rate": 2.0241213461357366e-06, - "loss": 2.2691, - "step": 550220 + "epoch": 0.19, + "learning_rate": 4.068359563235541e-05, + "loss": 2.8462, + "step": 52200 }, { - "epoch": 0.96, - "learning_rate": 2.02324940620891e-06, - "loss": 2.2506, - "step": 550230 + "epoch": 0.19, + "learning_rate": 4.066574811440973e-05, + "loss": 2.828, + "step": 52300 }, { - "epoch": 0.96, - "learning_rate": 2.022377466282083e-06, - "loss": 2.2759, - "step": 550240 + "epoch": 0.19, + "learning_rate": 4.064790059646405e-05, + "loss": 2.8387, + "step": 52400 }, { - "epoch": 0.96, - "learning_rate": 2.021505526355256e-06, - "loss": 2.2623, - "step": 550250 + "epoch": 0.19, + "learning_rate": 4.063005307851837e-05, + "loss": 2.8412, + "step": 52500 }, { - "epoch": 0.96, - "learning_rate": 2.0206335864284295e-06, - "loss": 2.3624, - "step": 550260 + "epoch": 0.19, + "learning_rate": 4.061220556057269e-05, + "loss": 2.8409, + "step": 52600 }, { - "epoch": 0.96, - "learning_rate": 2.019761646501603e-06, - "loss": 2.2381, - "step": 550270 + "epoch": 0.19, + "learning_rate": 4.059435804262701e-05, + "loss": 2.8331, + "step": 52700 }, { - "epoch": 0.96, - "learning_rate": 2.018889706574776e-06, - "loss": 2.2783, - "step": 550280 + "epoch": 0.19, + "learning_rate": 4.057651052468133e-05, + "loss": 2.8533, + "step": 52800 }, { - "epoch": 0.96, - "learning_rate": 2.018017766647949e-06, - "loss": 2.2405, - "step": 550290 + "epoch": 0.19, + "learning_rate": 4.0558663006735654e-05, + "loss": 2.8419, + "step": 52900 }, { - "epoch": 0.96, - "learning_rate": 2.017145826721122e-06, - "loss": 2.2536, - "step": 550300 + "epoch": 0.19, + "learning_rate": 4.0540815488789975e-05, + "loss": 2.844, + "step": 53000 }, { - "epoch": 0.96, - "learning_rate": 2.0162738867942954e-06, - "loss": 2.2682, - "step": 550310 + "epoch": 0.19, + "learning_rate": 4.0522967970844296e-05, + "loss": 2.8462, + "step": 53100 }, { - "epoch": 0.96, - "learning_rate": 2.0154019468674688e-06, - "loss": 2.2475, - "step": 550320 + "epoch": 0.19, + "learning_rate": 4.050512045289862e-05, + "loss": 2.8403, + "step": 53200 }, { - "epoch": 0.96, - "learning_rate": 2.014530006940642e-06, - "loss": 2.2928, - "step": 550330 + "epoch": 0.19, + "learning_rate": 4.048727293495294e-05, + "loss": 2.8335, + "step": 53300 }, { - "epoch": 0.96, - "learning_rate": 2.013658067013815e-06, - "loss": 2.2551, - "step": 550340 + "epoch": 0.19, + "learning_rate": 4.046942541700725e-05, + "loss": 2.8462, + "step": 53400 }, { - "epoch": 0.96, - "learning_rate": 2.0127861270869884e-06, - "loss": 2.3168, - "step": 550350 + "epoch": 0.19, + "learning_rate": 4.0451577899061575e-05, + "loss": 2.838, + "step": 53500 }, { - "epoch": 0.96, - "learning_rate": 2.0119141871601613e-06, - "loss": 2.2481, - "step": 550360 + "epoch": 0.19, + "learning_rate": 4.0433730381115896e-05, + "loss": 2.8352, + "step": 53600 }, { - "epoch": 0.96, - "learning_rate": 2.0110422472333346e-06, - "loss": 2.2395, - "step": 550370 + "epoch": 0.19, + "learning_rate": 4.0415882863170224e-05, + "loss": 2.8374, + "step": 53700 }, { - "epoch": 0.96, - "learning_rate": 2.010170307306508e-06, - "loss": 2.2371, - "step": 550380 + "epoch": 0.19, + "learning_rate": 4.0398035345224545e-05, + "loss": 2.8347, + "step": 53800 }, { - "epoch": 0.96, - "learning_rate": 2.0092983673796813e-06, - "loss": 2.1903, - "step": 550390 + "epoch": 0.19, + "learning_rate": 4.0380187827278866e-05, + "loss": 2.8214, + "step": 53900 }, { - "epoch": 0.96, - "learning_rate": 2.0084264274528543e-06, - "loss": 2.1325, - "step": 550400 + "epoch": 0.19, + "learning_rate": 4.036234030933319e-05, + "loss": 2.849, + "step": 54000 }, { - "epoch": 0.96, - "learning_rate": 2.0075544875260276e-06, - "loss": 2.2045, - "step": 550410 + "epoch": 0.19, + "learning_rate": 4.034449279138751e-05, + "loss": 2.8423, + "step": 54100 }, { - "epoch": 0.96, - "learning_rate": 2.0066825475992005e-06, - "loss": 2.2285, - "step": 550420 + "epoch": 0.19, + "learning_rate": 4.032664527344183e-05, + "loss": 2.8396, + "step": 54200 }, { - "epoch": 0.96, - "learning_rate": 2.005810607672374e-06, - "loss": 2.2945, - "step": 550430 + "epoch": 0.19, + "learning_rate": 4.0308797755496144e-05, + "loss": 2.8333, + "step": 54300 }, { - "epoch": 0.96, - "learning_rate": 2.0049386677455472e-06, - "loss": 2.2642, - "step": 550440 + "epoch": 0.19, + "learning_rate": 4.0290950237550465e-05, + "loss": 2.8334, + "step": 54400 }, { - "epoch": 0.96, - "learning_rate": 2.00406672781872e-06, - "loss": 2.2451, - "step": 550450 + "epoch": 0.19, + "learning_rate": 4.027310271960479e-05, + "loss": 2.8289, + "step": 54500 }, { - "epoch": 0.96, - "learning_rate": 2.0031947878918935e-06, - "loss": 2.1505, - "step": 550460 + "epoch": 0.19, + "learning_rate": 4.025525520165911e-05, + "loss": 2.8505, + "step": 54600 }, { - "epoch": 0.96, - "learning_rate": 2.002322847965067e-06, - "loss": 2.2826, - "step": 550470 + "epoch": 0.2, + "learning_rate": 4.023740768371343e-05, + "loss": 2.8387, + "step": 54700 }, { - "epoch": 0.96, - "learning_rate": 2.0014509080382398e-06, - "loss": 2.1626, - "step": 550480 + "epoch": 0.2, + "learning_rate": 4.021956016576775e-05, + "loss": 2.8407, + "step": 54800 }, { - "epoch": 0.96, - "learning_rate": 2.000578968111413e-06, - "loss": 2.2798, - "step": 550490 + "epoch": 0.2, + "learning_rate": 4.020171264782207e-05, + "loss": 2.8396, + "step": 54900 }, { - "epoch": 0.96, - "learning_rate": 1.999707028184586e-06, - "loss": 2.2426, - "step": 550500 + "epoch": 0.2, + "learning_rate": 4.018386512987639e-05, + "loss": 2.8391, + "step": 55000 }, { - "epoch": 0.96, - "learning_rate": 1.9988350882577594e-06, - "loss": 2.2846, - "step": 550510 + "epoch": 0.2, + "learning_rate": 4.0166017611930714e-05, + "loss": 2.8314, + "step": 55100 }, { - "epoch": 0.96, - "learning_rate": 1.9979631483309327e-06, - "loss": 2.2586, - "step": 550520 + "epoch": 0.2, + "learning_rate": 4.0148170093985035e-05, + "loss": 2.8403, + "step": 55200 }, { - "epoch": 0.96, - "learning_rate": 1.997091208404106e-06, - "loss": 2.2094, - "step": 550530 + "epoch": 0.2, + "learning_rate": 4.0130322576039356e-05, + "loss": 2.842, + "step": 55300 }, { - "epoch": 0.96, - "learning_rate": 1.996219268477279e-06, - "loss": 2.1888, - "step": 550540 + "epoch": 0.2, + "learning_rate": 4.011247505809367e-05, + "loss": 2.8382, + "step": 55400 }, { - "epoch": 0.96, - "learning_rate": 1.9953473285504523e-06, - "loss": 2.1734, - "step": 550550 + "epoch": 0.2, + "learning_rate": 4.009462754014799e-05, + "loss": 2.8445, + "step": 55500 }, { - "epoch": 0.96, - "learning_rate": 1.9944753886236253e-06, - "loss": 2.3198, - "step": 550560 + "epoch": 0.2, + "learning_rate": 4.007678002220231e-05, + "loss": 2.8377, + "step": 55600 }, { - "epoch": 0.96, - "learning_rate": 1.9936034486967986e-06, - "loss": 2.1513, - "step": 550570 + "epoch": 0.2, + "learning_rate": 4.0058932504256634e-05, + "loss": 2.8388, + "step": 55700 }, { - "epoch": 0.96, - "learning_rate": 1.992731508769972e-06, - "loss": 2.2692, - "step": 550580 + "epoch": 0.2, + "learning_rate": 4.0041084986310956e-05, + "loss": 2.8286, + "step": 55800 }, { - "epoch": 0.96, - "learning_rate": 1.9918595688431453e-06, - "loss": 2.2369, - "step": 550590 + "epoch": 0.2, + "learning_rate": 4.002323746836528e-05, + "loss": 2.8204, + "step": 55900 }, { - "epoch": 0.96, - "learning_rate": 1.9909876289163182e-06, - "loss": 2.2818, - "step": 550600 + "epoch": 0.2, + "learning_rate": 4.00053899504196e-05, + "loss": 2.8434, + "step": 56000 }, { - "epoch": 0.96, - "learning_rate": 1.9901156889894916e-06, - "loss": 2.2742, - "step": 550610 + "epoch": 0.2, + "learning_rate": 3.998754243247392e-05, + "loss": 2.8375, + "step": 56100 }, { - "epoch": 0.96, - "learning_rate": 1.9892437490626645e-06, - "loss": 2.1107, - "step": 550620 + "epoch": 0.2, + "learning_rate": 3.996969491452824e-05, + "loss": 2.8283, + "step": 56200 }, { - "epoch": 0.96, - "learning_rate": 1.988371809135838e-06, - "loss": 2.2136, - "step": 550630 + "epoch": 0.2, + "learning_rate": 3.995184739658256e-05, + "loss": 2.8268, + "step": 56300 }, { - "epoch": 0.96, - "learning_rate": 1.987499869209011e-06, - "loss": 2.2626, - "step": 550640 + "epoch": 0.2, + "learning_rate": 3.993399987863688e-05, + "loss": 2.8338, + "step": 56400 }, { - "epoch": 0.96, - "learning_rate": 1.986627929282184e-06, - "loss": 2.1764, - "step": 550650 + "epoch": 0.2, + "learning_rate": 3.99161523606912e-05, + "loss": 2.8414, + "step": 56500 }, { - "epoch": 0.96, - "learning_rate": 1.9857559893553574e-06, - "loss": 2.1722, - "step": 550660 + "epoch": 0.2, + "learning_rate": 3.989830484274552e-05, + "loss": 2.8335, + "step": 56600 }, { - "epoch": 0.96, - "learning_rate": 1.984884049428531e-06, - "loss": 2.3007, - "step": 550670 + "epoch": 0.2, + "learning_rate": 3.988045732479984e-05, + "loss": 2.8301, + "step": 56700 }, { - "epoch": 0.96, - "learning_rate": 1.9840121095017037e-06, - "loss": 2.3462, - "step": 550680 + "epoch": 0.2, + "learning_rate": 3.986260980685416e-05, + "loss": 2.8353, + "step": 56800 }, { - "epoch": 0.96, - "learning_rate": 1.983140169574877e-06, - "loss": 2.3655, - "step": 550690 + "epoch": 0.2, + "learning_rate": 3.984476228890848e-05, + "loss": 2.8319, + "step": 56900 }, { - "epoch": 0.96, - "learning_rate": 1.9822682296480504e-06, - "loss": 2.288, - "step": 550700 + "epoch": 0.2, + "learning_rate": 3.9826914770962804e-05, + "loss": 2.8368, + "step": 57000 }, { - "epoch": 0.96, - "learning_rate": 1.9813962897212233e-06, - "loss": 2.3511, - "step": 550710 + "epoch": 0.2, + "learning_rate": 3.9809067253017125e-05, + "loss": 2.8305, + "step": 57100 }, { - "epoch": 0.96, - "learning_rate": 1.9805243497943967e-06, - "loss": 2.1934, - "step": 550720 + "epoch": 0.2, + "learning_rate": 3.9791219735071446e-05, + "loss": 2.8269, + "step": 57200 }, { - "epoch": 0.96, - "learning_rate": 1.97965240986757e-06, - "loss": 2.2678, - "step": 550730 + "epoch": 0.2, + "learning_rate": 3.977337221712577e-05, + "loss": 2.8326, + "step": 57300 }, { - "epoch": 0.96, - "learning_rate": 1.978780469940743e-06, - "loss": 2.3617, - "step": 550740 + "epoch": 0.2, + "learning_rate": 3.975552469918009e-05, + "loss": 2.8347, + "step": 57400 }, { - "epoch": 0.96, - "learning_rate": 1.9779085300139163e-06, - "loss": 2.3644, - "step": 550750 + "epoch": 0.21, + "learning_rate": 3.97376771812344e-05, + "loss": 2.8247, + "step": 57500 }, { - "epoch": 0.96, - "learning_rate": 1.9770365900870892e-06, - "loss": 2.1546, - "step": 550760 + "epoch": 0.21, + "learning_rate": 3.9719829663288724e-05, + "loss": 2.8293, + "step": 57600 }, { - "epoch": 0.96, - "learning_rate": 1.9761646501602626e-06, - "loss": 2.3161, - "step": 550770 + "epoch": 0.21, + "learning_rate": 3.9701982145343045e-05, + "loss": 2.8288, + "step": 57700 }, { - "epoch": 0.96, - "learning_rate": 1.975292710233436e-06, - "loss": 2.3406, - "step": 550780 + "epoch": 0.21, + "learning_rate": 3.9684134627397366e-05, + "loss": 2.8195, + "step": 57800 }, { - "epoch": 0.96, - "learning_rate": 1.9744207703066093e-06, - "loss": 2.2442, - "step": 550790 + "epoch": 0.21, + "learning_rate": 3.966628710945169e-05, + "loss": 2.8307, + "step": 57900 }, { - "epoch": 0.96, - "learning_rate": 1.973548830379782e-06, - "loss": 2.2272, - "step": 550800 + "epoch": 0.21, + "learning_rate": 3.964843959150601e-05, + "loss": 2.8316, + "step": 58000 }, { - "epoch": 0.96, - "learning_rate": 1.9726768904529555e-06, - "loss": 2.2034, - "step": 550810 + "epoch": 0.21, + "learning_rate": 3.963059207356033e-05, + "loss": 2.835, + "step": 58100 }, { - "epoch": 0.96, - "learning_rate": 1.9718049505261285e-06, - "loss": 2.2605, - "step": 550820 + "epoch": 0.21, + "learning_rate": 3.961274455561465e-05, + "loss": 2.8219, + "step": 58200 }, { - "epoch": 0.96, - "learning_rate": 1.970933010599302e-06, - "loss": 2.2596, - "step": 550830 + "epoch": 0.21, + "learning_rate": 3.959489703766897e-05, + "loss": 2.8291, + "step": 58300 }, { - "epoch": 0.96, - "learning_rate": 1.970061070672475e-06, - "loss": 2.3294, - "step": 550840 + "epoch": 0.21, + "learning_rate": 3.9577049519723294e-05, + "loss": 2.8261, + "step": 58400 }, { - "epoch": 0.96, - "learning_rate": 1.969189130745648e-06, - "loss": 2.1313, - "step": 550850 + "epoch": 0.21, + "learning_rate": 3.9559202001777615e-05, + "loss": 2.8232, + "step": 58500 }, { - "epoch": 0.96, - "learning_rate": 1.9683171908188214e-06, - "loss": 2.2056, - "step": 550860 + "epoch": 0.21, + "learning_rate": 3.954135448383193e-05, + "loss": 2.8356, + "step": 58600 }, { - "epoch": 0.96, - "learning_rate": 1.9674452508919948e-06, - "loss": 2.3046, - "step": 550870 + "epoch": 0.21, + "learning_rate": 3.952350696588625e-05, + "loss": 2.8329, + "step": 58700 }, { - "epoch": 0.96, - "learning_rate": 1.9665733109651677e-06, - "loss": 2.3104, - "step": 550880 + "epoch": 0.21, + "learning_rate": 3.950565944794058e-05, + "loss": 2.8351, + "step": 58800 }, { - "epoch": 0.96, - "learning_rate": 1.965701371038341e-06, - "loss": 2.1023, - "step": 550890 + "epoch": 0.21, + "learning_rate": 3.94878119299949e-05, + "loss": 2.8262, + "step": 58900 }, { - "epoch": 0.96, - "learning_rate": 1.9648294311115144e-06, - "loss": 2.2828, - "step": 550900 + "epoch": 0.21, + "learning_rate": 3.946996441204922e-05, + "loss": 2.8217, + "step": 59000 }, { - "epoch": 0.96, - "learning_rate": 1.9639574911846873e-06, - "loss": 2.3221, - "step": 550910 + "epoch": 0.21, + "learning_rate": 3.945211689410354e-05, + "loss": 2.8293, + "step": 59100 }, { - "epoch": 0.96, - "learning_rate": 1.9630855512578606e-06, - "loss": 2.1929, - "step": 550920 + "epoch": 0.21, + "learning_rate": 3.9434269376157863e-05, + "loss": 2.8246, + "step": 59200 }, { - "epoch": 0.96, - "learning_rate": 1.962213611331034e-06, - "loss": 2.189, - "step": 550930 + "epoch": 0.21, + "learning_rate": 3.9416421858212185e-05, + "loss": 2.8263, + "step": 59300 }, { - "epoch": 0.96, - "learning_rate": 1.961341671404207e-06, - "loss": 2.2766, - "step": 550940 + "epoch": 0.21, + "learning_rate": 3.9398574340266506e-05, + "loss": 2.8327, + "step": 59400 }, { - "epoch": 0.96, - "learning_rate": 1.9604697314773803e-06, - "loss": 2.124, - "step": 550950 + "epoch": 0.21, + "learning_rate": 3.938072682232082e-05, + "loss": 2.8302, + "step": 59500 }, { - "epoch": 0.96, - "learning_rate": 1.9595977915505536e-06, - "loss": 2.2524, - "step": 550960 + "epoch": 0.21, + "learning_rate": 3.936287930437514e-05, + "loss": 2.8261, + "step": 59600 }, { - "epoch": 0.96, - "learning_rate": 1.9587258516237265e-06, - "loss": 2.2324, - "step": 550970 + "epoch": 0.21, + "learning_rate": 3.934503178642946e-05, + "loss": 2.8255, + "step": 59700 }, { - "epoch": 0.96, - "learning_rate": 1.9578539116969e-06, - "loss": 2.3051, - "step": 550980 + "epoch": 0.21, + "learning_rate": 3.9327184268483784e-05, + "loss": 2.8291, + "step": 59800 }, { - "epoch": 0.96, - "learning_rate": 1.9569819717700732e-06, - "loss": 2.3175, - "step": 550990 + "epoch": 0.21, + "learning_rate": 3.9309336750538105e-05, + "loss": 2.8335, + "step": 59900 }, { - "epoch": 0.96, - "learning_rate": 1.956110031843246e-06, - "loss": 2.2662, - "step": 551000 + "epoch": 0.21, + "learning_rate": 3.9291489232592426e-05, + "loss": 2.8345, + "step": 60000 }, { - "epoch": 0.96, - "learning_rate": 1.9552380919164195e-06, - "loss": 2.3021, - "step": 551010 + "epoch": 0.21, + "learning_rate": 3.927364171464675e-05, + "loss": 2.8267, + "step": 60100 }, { - "epoch": 0.96, - "learning_rate": 1.9543661519895924e-06, - "loss": 2.2099, - "step": 551020 + "epoch": 0.21, + "learning_rate": 3.925579419670107e-05, + "loss": 2.8294, + "step": 60200 }, { - "epoch": 0.96, - "learning_rate": 1.9534942120627658e-06, - "loss": 2.1783, - "step": 551030 + "epoch": 0.22, + "learning_rate": 3.923794667875539e-05, + "loss": 2.8296, + "step": 60300 }, { - "epoch": 0.96, - "learning_rate": 1.952622272135939e-06, - "loss": 2.2927, - "step": 551040 + "epoch": 0.22, + "learning_rate": 3.922009916080971e-05, + "loss": 2.825, + "step": 60400 }, { - "epoch": 0.96, - "learning_rate": 1.951750332209112e-06, - "loss": 2.3145, - "step": 551050 + "epoch": 0.22, + "learning_rate": 3.920225164286403e-05, + "loss": 2.8255, + "step": 60500 }, { - "epoch": 0.96, - "learning_rate": 1.9508783922822854e-06, - "loss": 2.3566, - "step": 551060 + "epoch": 0.22, + "learning_rate": 3.918440412491835e-05, + "loss": 2.8265, + "step": 60600 }, { - "epoch": 0.96, - "learning_rate": 1.9500064523554587e-06, - "loss": 2.2983, - "step": 551070 + "epoch": 0.22, + "learning_rate": 3.916655660697267e-05, + "loss": 2.824, + "step": 60700 }, { - "epoch": 0.96, - "learning_rate": 1.9491345124286316e-06, - "loss": 2.2202, - "step": 551080 + "epoch": 0.22, + "learning_rate": 3.914870908902699e-05, + "loss": 2.8239, + "step": 60800 }, { - "epoch": 0.96, - "learning_rate": 1.948262572501805e-06, - "loss": 2.1849, - "step": 551090 + "epoch": 0.22, + "learning_rate": 3.913086157108131e-05, + "loss": 2.8292, + "step": 60900 }, { - "epoch": 0.96, - "learning_rate": 1.9473906325749783e-06, - "loss": 2.2116, - "step": 551100 + "epoch": 0.22, + "learning_rate": 3.911301405313563e-05, + "loss": 2.8268, + "step": 61000 }, { - "epoch": 0.96, - "learning_rate": 1.9465186926481513e-06, - "loss": 2.2921, - "step": 551110 + "epoch": 0.22, + "learning_rate": 3.909516653518995e-05, + "loss": 2.8234, + "step": 61100 }, { - "epoch": 0.96, - "learning_rate": 1.9456467527213246e-06, - "loss": 2.4628, - "step": 551120 + "epoch": 0.22, + "learning_rate": 3.9077319017244274e-05, + "loss": 2.8276, + "step": 61200 }, { - "epoch": 0.96, - "learning_rate": 1.944774812794498e-06, - "loss": 2.2863, - "step": 551130 + "epoch": 0.22, + "learning_rate": 3.9059471499298595e-05, + "loss": 2.8208, + "step": 61300 }, { - "epoch": 0.96, - "learning_rate": 1.943902872867671e-06, - "loss": 2.1973, - "step": 551140 + "epoch": 0.22, + "learning_rate": 3.904162398135292e-05, + "loss": 2.8301, + "step": 61400 }, { - "epoch": 0.96, - "learning_rate": 1.9430309329408442e-06, - "loss": 2.3097, - "step": 551150 + "epoch": 0.22, + "learning_rate": 3.902377646340724e-05, + "loss": 2.8209, + "step": 61500 }, { - "epoch": 0.96, - "learning_rate": 1.9421589930140176e-06, - "loss": 2.3081, - "step": 551160 + "epoch": 0.22, + "learning_rate": 3.900592894546156e-05, + "loss": 2.8219, + "step": 61600 }, { - "epoch": 0.96, - "learning_rate": 1.9412870530871905e-06, - "loss": 2.241, - "step": 551170 + "epoch": 0.22, + "learning_rate": 3.8988081427515874e-05, + "loss": 2.8197, + "step": 61700 }, { - "epoch": 0.96, - "learning_rate": 1.940415113160364e-06, - "loss": 2.1982, - "step": 551180 + "epoch": 0.22, + "learning_rate": 3.8970233909570195e-05, + "loss": 2.828, + "step": 61800 }, { - "epoch": 0.96, - "learning_rate": 1.939543173233537e-06, - "loss": 2.2838, - "step": 551190 + "epoch": 0.22, + "learning_rate": 3.8952386391624516e-05, + "loss": 2.8193, + "step": 61900 }, { - "epoch": 0.96, - "learning_rate": 1.93867123330671e-06, - "loss": 2.3082, - "step": 551200 + "epoch": 0.22, + "learning_rate": 3.893453887367884e-05, + "loss": 2.824, + "step": 62000 }, { - "epoch": 0.96, - "learning_rate": 1.9377992933798835e-06, - "loss": 2.2891, - "step": 551210 + "epoch": 0.22, + "learning_rate": 3.891669135573316e-05, + "loss": 2.8243, + "step": 62100 }, { - "epoch": 0.96, - "learning_rate": 1.936927353453057e-06, - "loss": 2.1735, - "step": 551220 + "epoch": 0.22, + "learning_rate": 3.889884383778748e-05, + "loss": 2.8251, + "step": 62200 }, { - "epoch": 0.96, - "learning_rate": 1.9360554135262297e-06, - "loss": 2.2645, - "step": 551230 + "epoch": 0.22, + "learning_rate": 3.88809963198418e-05, + "loss": 2.8178, + "step": 62300 }, { - "epoch": 0.96, - "learning_rate": 1.935183473599403e-06, - "loss": 2.269, - "step": 551240 + "epoch": 0.22, + "learning_rate": 3.886314880189612e-05, + "loss": 2.8137, + "step": 62400 }, { - "epoch": 0.96, - "learning_rate": 1.934311533672576e-06, - "loss": 2.2991, - "step": 551250 + "epoch": 0.22, + "learning_rate": 3.884530128395044e-05, + "loss": 2.8303, + "step": 62500 }, { - "epoch": 0.96, - "learning_rate": 1.9334395937457493e-06, - "loss": 2.2868, - "step": 551260 + "epoch": 0.22, + "learning_rate": 3.8827453766004764e-05, + "loss": 2.8176, + "step": 62600 }, { - "epoch": 0.96, - "learning_rate": 1.9325676538189227e-06, - "loss": 2.3244, - "step": 551270 + "epoch": 0.22, + "learning_rate": 3.8809606248059086e-05, + "loss": 2.8195, + "step": 62700 }, { - "epoch": 0.96, - "learning_rate": 1.9316957138920956e-06, - "loss": 2.2505, - "step": 551280 + "epoch": 0.22, + "learning_rate": 3.87917587301134e-05, + "loss": 2.8333, + "step": 62800 }, { - "epoch": 0.96, - "learning_rate": 1.930823773965269e-06, - "loss": 2.2732, - "step": 551290 + "epoch": 0.22, + "learning_rate": 3.877391121216772e-05, + "loss": 2.8282, + "step": 62900 }, { - "epoch": 0.96, - "learning_rate": 1.9299518340384423e-06, - "loss": 2.1887, - "step": 551300 + "epoch": 0.22, + "learning_rate": 3.875606369422204e-05, + "loss": 2.8149, + "step": 63000 }, { - "epoch": 0.96, - "learning_rate": 1.9290798941116152e-06, - "loss": 2.2848, - "step": 551310 + "epoch": 0.23, + "learning_rate": 3.8738216176276364e-05, + "loss": 2.8329, + "step": 63100 }, { - "epoch": 0.96, - "learning_rate": 1.9282079541847886e-06, - "loss": 2.2294, - "step": 551320 + "epoch": 0.23, + "learning_rate": 3.8720368658330685e-05, + "loss": 2.8254, + "step": 63200 }, { - "epoch": 0.96, - "learning_rate": 1.927336014257962e-06, - "loss": 2.1747, - "step": 551330 + "epoch": 0.23, + "learning_rate": 3.8702521140385006e-05, + "loss": 2.8217, + "step": 63300 }, { - "epoch": 0.96, - "learning_rate": 1.926464074331135e-06, - "loss": 2.33, - "step": 551340 + "epoch": 0.23, + "learning_rate": 3.868467362243933e-05, + "loss": 2.8281, + "step": 63400 }, { - "epoch": 0.96, - "learning_rate": 1.925592134404308e-06, - "loss": 2.1724, - "step": 551350 + "epoch": 0.23, + "learning_rate": 3.866682610449365e-05, + "loss": 2.8274, + "step": 63500 }, { - "epoch": 0.96, - "learning_rate": 1.9247201944774815e-06, - "loss": 2.3032, - "step": 551360 + "epoch": 0.23, + "learning_rate": 3.864897858654797e-05, + "loss": 2.8173, + "step": 63600 }, { - "epoch": 0.96, - "learning_rate": 1.9238482545506545e-06, - "loss": 2.235, - "step": 551370 + "epoch": 0.23, + "learning_rate": 3.863113106860229e-05, + "loss": 2.8199, + "step": 63700 }, { - "epoch": 0.96, - "learning_rate": 1.922976314623828e-06, - "loss": 2.267, - "step": 551380 + "epoch": 0.23, + "learning_rate": 3.861328355065661e-05, + "loss": 2.8304, + "step": 63800 }, { - "epoch": 0.96, - "learning_rate": 1.922104374697001e-06, - "loss": 2.226, - "step": 551390 + "epoch": 0.23, + "learning_rate": 3.8595436032710933e-05, + "loss": 2.8193, + "step": 63900 }, { - "epoch": 0.96, - "learning_rate": 1.921232434770174e-06, - "loss": 2.2197, - "step": 551400 + "epoch": 0.23, + "learning_rate": 3.8577588514765255e-05, + "loss": 2.8193, + "step": 64000 }, { - "epoch": 0.96, - "learning_rate": 1.9203604948433474e-06, - "loss": 2.2292, - "step": 551410 + "epoch": 0.23, + "learning_rate": 3.8559740996819576e-05, + "loss": 2.8161, + "step": 64100 }, { - "epoch": 0.96, - "learning_rate": 1.9194885549165208e-06, - "loss": 2.2012, - "step": 551420 + "epoch": 0.23, + "learning_rate": 3.85418934788739e-05, + "loss": 2.822, + "step": 64200 }, { - "epoch": 0.96, - "learning_rate": 1.9186166149896937e-06, - "loss": 2.2295, - "step": 551430 + "epoch": 0.23, + "learning_rate": 3.852404596092822e-05, + "loss": 2.8195, + "step": 64300 }, { - "epoch": 0.96, - "learning_rate": 1.917744675062867e-06, - "loss": 2.3263, - "step": 551440 + "epoch": 0.23, + "learning_rate": 3.850619844298254e-05, + "loss": 2.836, + "step": 64400 }, { - "epoch": 0.96, - "learning_rate": 1.91687273513604e-06, - "loss": 2.2882, - "step": 551450 + "epoch": 0.23, + "learning_rate": 3.848835092503686e-05, + "loss": 2.8261, + "step": 64500 }, { - "epoch": 0.96, - "learning_rate": 1.9160007952092133e-06, - "loss": 2.2617, - "step": 551460 + "epoch": 0.23, + "learning_rate": 3.847050340709118e-05, + "loss": 2.8232, + "step": 64600 }, { - "epoch": 0.96, - "learning_rate": 1.9151288552823866e-06, - "loss": 2.2816, - "step": 551470 + "epoch": 0.23, + "learning_rate": 3.84526558891455e-05, + "loss": 2.8256, + "step": 64700 }, { - "epoch": 0.96, - "learning_rate": 1.91425691535556e-06, - "loss": 2.243, - "step": 551480 + "epoch": 0.23, + "learning_rate": 3.843480837119982e-05, + "loss": 2.8224, + "step": 64800 }, { - "epoch": 0.96, - "learning_rate": 1.913384975428733e-06, - "loss": 2.2922, - "step": 551490 + "epoch": 0.23, + "learning_rate": 3.841696085325414e-05, + "loss": 2.8168, + "step": 64900 }, { - "epoch": 0.96, - "learning_rate": 1.9125130355019063e-06, - "loss": 2.1378, - "step": 551500 + "epoch": 0.23, + "learning_rate": 3.839911333530846e-05, + "loss": 2.8229, + "step": 65000 }, { - "epoch": 0.96, - "learning_rate": 1.911641095575079e-06, - "loss": 2.3663, - "step": 551510 + "epoch": 0.23, + "learning_rate": 3.838126581736278e-05, + "loss": 2.8128, + "step": 65100 }, { - "epoch": 0.96, - "learning_rate": 1.9107691556482525e-06, - "loss": 2.2003, - "step": 551520 + "epoch": 0.23, + "learning_rate": 3.83634182994171e-05, + "loss": 2.8177, + "step": 65200 }, { - "epoch": 0.96, - "learning_rate": 1.909897215721426e-06, - "loss": 2.1962, - "step": 551530 + "epoch": 0.23, + "learning_rate": 3.8345570781471424e-05, + "loss": 2.8243, + "step": 65300 }, { - "epoch": 0.96, - "learning_rate": 1.909025275794599e-06, - "loss": 2.1229, - "step": 551540 + "epoch": 0.23, + "learning_rate": 3.8327723263525745e-05, + "loss": 2.8253, + "step": 65400 }, { - "epoch": 0.96, - "learning_rate": 1.908153335867772e-06, - "loss": 2.2654, - "step": 551550 + "epoch": 0.23, + "learning_rate": 3.8309875745580066e-05, + "loss": 2.8213, + "step": 65500 }, { - "epoch": 0.96, - "learning_rate": 1.9072813959409453e-06, - "loss": 2.2426, - "step": 551560 + "epoch": 0.23, + "learning_rate": 3.829202822763439e-05, + "loss": 2.8196, + "step": 65600 }, { - "epoch": 0.96, - "learning_rate": 1.9064094560141184e-06, - "loss": 2.2591, - "step": 551570 + "epoch": 0.23, + "learning_rate": 3.827418070968871e-05, + "loss": 2.8226, + "step": 65700 }, { - "epoch": 0.96, - "learning_rate": 1.9055375160872916e-06, - "loss": 2.2525, - "step": 551580 + "epoch": 0.23, + "learning_rate": 3.825633319174303e-05, + "loss": 2.8216, + "step": 65800 }, { - "epoch": 0.96, - "learning_rate": 1.9046655761604651e-06, - "loss": 2.3497, - "step": 551590 + "epoch": 0.24, + "learning_rate": 3.8238485673797344e-05, + "loss": 2.8176, + "step": 65900 }, { - "epoch": 0.96, - "learning_rate": 1.9037936362336382e-06, - "loss": 2.2373, - "step": 551600 + "epoch": 0.24, + "learning_rate": 3.8220638155851665e-05, + "loss": 2.8155, + "step": 66000 }, { - "epoch": 0.96, - "learning_rate": 1.9029216963068114e-06, - "loss": 2.094, - "step": 551610 + "epoch": 0.24, + "learning_rate": 3.820279063790599e-05, + "loss": 2.8205, + "step": 66100 }, { - "epoch": 0.96, - "learning_rate": 1.9020497563799845e-06, - "loss": 2.1656, - "step": 551620 + "epoch": 0.24, + "learning_rate": 3.818494311996031e-05, + "loss": 2.8173, + "step": 66200 }, { - "epoch": 0.96, - "learning_rate": 1.9011778164531577e-06, - "loss": 2.267, - "step": 551630 + "epoch": 0.24, + "learning_rate": 3.816709560201463e-05, + "loss": 2.8177, + "step": 66300 }, { - "epoch": 0.96, - "learning_rate": 1.9003058765263308e-06, - "loss": 2.2511, - "step": 551640 + "epoch": 0.24, + "learning_rate": 3.814924808406895e-05, + "loss": 2.8228, + "step": 66400 }, { - "epoch": 0.96, - "learning_rate": 1.899433936599504e-06, - "loss": 2.3047, - "step": 551650 + "epoch": 0.24, + "learning_rate": 3.813140056612327e-05, + "loss": 2.8189, + "step": 66500 }, { - "epoch": 0.96, - "learning_rate": 1.8985619966726775e-06, - "loss": 2.2751, - "step": 551660 + "epoch": 0.24, + "learning_rate": 3.811355304817759e-05, + "loss": 2.8131, + "step": 66600 }, { - "epoch": 0.96, - "learning_rate": 1.8976900567458506e-06, - "loss": 2.2888, - "step": 551670 + "epoch": 0.24, + "learning_rate": 3.8095705530231914e-05, + "loss": 2.8143, + "step": 66700 }, { - "epoch": 0.96, - "learning_rate": 1.8968181168190237e-06, - "loss": 2.3028, - "step": 551680 + "epoch": 0.24, + "learning_rate": 3.8077858012286235e-05, + "loss": 2.8232, + "step": 66800 }, { - "epoch": 0.96, - "learning_rate": 1.8959461768921969e-06, - "loss": 2.3219, - "step": 551690 + "epoch": 0.24, + "learning_rate": 3.8060010494340556e-05, + "loss": 2.8274, + "step": 66900 }, { - "epoch": 0.96, - "learning_rate": 1.89507423696537e-06, - "loss": 2.3045, - "step": 551700 + "epoch": 0.24, + "learning_rate": 3.804216297639487e-05, + "loss": 2.8239, + "step": 67000 }, { - "epoch": 0.96, - "learning_rate": 1.8942022970385432e-06, - "loss": 2.2194, - "step": 551710 + "epoch": 0.24, + "learning_rate": 3.802431545844919e-05, + "loss": 2.8201, + "step": 67100 }, { - "epoch": 0.96, - "learning_rate": 1.8933303571117167e-06, - "loss": 2.2948, - "step": 551720 + "epoch": 0.24, + "learning_rate": 3.800646794050351e-05, + "loss": 2.8165, + "step": 67200 }, { - "epoch": 0.96, - "learning_rate": 1.8924584171848898e-06, - "loss": 2.2159, - "step": 551730 + "epoch": 0.24, + "learning_rate": 3.7988620422557834e-05, + "loss": 2.8003, + "step": 67300 }, { - "epoch": 0.96, - "learning_rate": 1.891586477258063e-06, - "loss": 2.2528, - "step": 551740 + "epoch": 0.24, + "learning_rate": 3.7970772904612156e-05, + "loss": 2.8125, + "step": 67400 }, { - "epoch": 0.96, - "learning_rate": 1.8907145373312361e-06, - "loss": 2.3496, - "step": 551750 + "epoch": 0.24, + "learning_rate": 3.795292538666648e-05, + "loss": 2.8208, + "step": 67500 }, { - "epoch": 0.96, - "learning_rate": 1.8898425974044092e-06, - "loss": 2.2518, - "step": 551760 + "epoch": 0.24, + "learning_rate": 3.79350778687208e-05, + "loss": 2.8136, + "step": 67600 }, { - "epoch": 0.96, - "learning_rate": 1.8889706574775824e-06, - "loss": 2.1767, - "step": 551770 + "epoch": 0.24, + "learning_rate": 3.791723035077512e-05, + "loss": 2.815, + "step": 67700 }, { - "epoch": 0.96, - "learning_rate": 1.8880987175507555e-06, - "loss": 2.2376, - "step": 551780 + "epoch": 0.24, + "learning_rate": 3.789938283282944e-05, + "loss": 2.8129, + "step": 67800 }, { - "epoch": 0.96, - "learning_rate": 1.887226777623929e-06, - "loss": 2.2406, - "step": 551790 + "epoch": 0.24, + "learning_rate": 3.788153531488376e-05, + "loss": 2.8263, + "step": 67900 }, { - "epoch": 0.96, - "learning_rate": 1.8863548376971022e-06, - "loss": 2.3826, - "step": 551800 + "epoch": 0.24, + "learning_rate": 3.786368779693808e-05, + "loss": 2.8188, + "step": 68000 }, { - "epoch": 0.96, - "learning_rate": 1.8854828977702753e-06, - "loss": 2.1954, - "step": 551810 + "epoch": 0.24, + "learning_rate": 3.78458402789924e-05, + "loss": 2.8157, + "step": 68100 }, { - "epoch": 0.96, - "learning_rate": 1.8846109578434485e-06, - "loss": 2.3046, - "step": 551820 + "epoch": 0.24, + "learning_rate": 3.782799276104672e-05, + "loss": 2.8161, + "step": 68200 }, { - "epoch": 0.96, - "learning_rate": 1.8837390179166216e-06, - "loss": 2.2776, - "step": 551830 + "epoch": 0.24, + "learning_rate": 3.781014524310104e-05, + "loss": 2.8165, + "step": 68300 }, { - "epoch": 0.96, - "learning_rate": 1.8828670779897947e-06, - "loss": 2.3111, - "step": 551840 + "epoch": 0.24, + "learning_rate": 3.779229772515536e-05, + "loss": 2.8123, + "step": 68400 }, { - "epoch": 0.96, - "learning_rate": 1.8819951380629679e-06, - "loss": 2.2894, - "step": 551850 + "epoch": 0.24, + "learning_rate": 3.777445020720968e-05, + "loss": 2.8163, + "step": 68500 }, { - "epoch": 0.96, - "learning_rate": 1.8811231981361414e-06, - "loss": 2.2037, - "step": 551860 + "epoch": 0.24, + "learning_rate": 3.7756602689264003e-05, + "loss": 2.8181, + "step": 68600 }, { - "epoch": 0.96, - "learning_rate": 1.8802512582093146e-06, - "loss": 2.2353, - "step": 551870 + "epoch": 0.25, + "learning_rate": 3.7738755171318325e-05, + "loss": 2.8145, + "step": 68700 }, { - "epoch": 0.96, - "learning_rate": 1.8793793182824877e-06, - "loss": 2.2409, - "step": 551880 + "epoch": 0.25, + "learning_rate": 3.7720907653372646e-05, + "loss": 2.8149, + "step": 68800 }, { - "epoch": 0.96, - "learning_rate": 1.8785073783556608e-06, - "loss": 2.2054, - "step": 551890 + "epoch": 0.25, + "learning_rate": 3.770306013542697e-05, + "loss": 2.811, + "step": 68900 }, { - "epoch": 0.96, - "learning_rate": 1.877635438428834e-06, - "loss": 2.2473, - "step": 551900 + "epoch": 0.25, + "learning_rate": 3.768521261748129e-05, + "loss": 2.8121, + "step": 69000 }, { - "epoch": 0.96, - "learning_rate": 1.8767634985020071e-06, - "loss": 2.3203, - "step": 551910 + "epoch": 0.25, + "learning_rate": 3.766736509953561e-05, + "loss": 2.8145, + "step": 69100 }, { - "epoch": 0.96, - "learning_rate": 1.8758915585751807e-06, - "loss": 2.2967, - "step": 551920 + "epoch": 0.25, + "learning_rate": 3.764951758158993e-05, + "loss": 2.8179, + "step": 69200 }, { - "epoch": 0.96, - "learning_rate": 1.8750196186483538e-06, - "loss": 2.2635, - "step": 551930 + "epoch": 0.25, + "learning_rate": 3.763167006364425e-05, + "loss": 2.8092, + "step": 69300 }, { - "epoch": 0.96, - "learning_rate": 1.874147678721527e-06, - "loss": 2.2932, - "step": 551940 + "epoch": 0.25, + "learning_rate": 3.761382254569857e-05, + "loss": 2.8153, + "step": 69400 }, { - "epoch": 0.96, - "learning_rate": 1.8732757387947e-06, - "loss": 2.2163, - "step": 551950 + "epoch": 0.25, + "learning_rate": 3.7595975027752894e-05, + "loss": 2.8191, + "step": 69500 }, { - "epoch": 0.96, - "learning_rate": 1.8724037988678732e-06, - "loss": 2.2227, - "step": 551960 + "epoch": 0.25, + "learning_rate": 3.7578127509807216e-05, + "loss": 2.8241, + "step": 69600 }, { - "epoch": 0.96, - "learning_rate": 1.8715318589410463e-06, - "loss": 2.274, - "step": 551970 + "epoch": 0.25, + "learning_rate": 3.756027999186154e-05, + "loss": 2.812, + "step": 69700 }, { - "epoch": 0.96, - "learning_rate": 1.8706599190142195e-06, - "loss": 2.3497, - "step": 551980 + "epoch": 0.25, + "learning_rate": 3.754243247391586e-05, + "loss": 2.8149, + "step": 69800 }, { - "epoch": 0.96, - "learning_rate": 1.869787979087393e-06, - "loss": 2.3136, - "step": 551990 + "epoch": 0.25, + "learning_rate": 3.752458495597018e-05, + "loss": 2.8231, + "step": 69900 }, { - "epoch": 0.96, - "learning_rate": 1.8689160391605662e-06, - "loss": 2.2337, - "step": 552000 + "epoch": 0.25, + "learning_rate": 3.75067374380245e-05, + "loss": 2.8172, + "step": 70000 }, { - "epoch": 0.96, - "learning_rate": 1.8680440992337393e-06, - "loss": 2.194, - "step": 552010 + "epoch": 0.25, + "learning_rate": 3.7488889920078815e-05, + "loss": 2.8039, + "step": 70100 }, { - "epoch": 0.96, - "learning_rate": 1.8671721593069124e-06, - "loss": 2.4179, - "step": 552020 + "epoch": 0.25, + "learning_rate": 3.7471042402133136e-05, + "loss": 2.8142, + "step": 70200 }, { - "epoch": 0.96, - "learning_rate": 1.8663002193800856e-06, - "loss": 2.2832, - "step": 552030 + "epoch": 0.25, + "learning_rate": 3.745319488418746e-05, + "loss": 2.8196, + "step": 70300 }, { - "epoch": 0.96, - "learning_rate": 1.8654282794532587e-06, - "loss": 2.2109, - "step": 552040 + "epoch": 0.25, + "learning_rate": 3.743534736624178e-05, + "loss": 2.8097, + "step": 70400 }, { - "epoch": 0.96, - "learning_rate": 1.8645563395264318e-06, - "loss": 2.3328, - "step": 552050 + "epoch": 0.25, + "learning_rate": 3.74174998482961e-05, + "loss": 2.8031, + "step": 70500 }, { - "epoch": 0.96, - "learning_rate": 1.8636843995996054e-06, - "loss": 2.1954, - "step": 552060 + "epoch": 0.25, + "learning_rate": 3.739965233035042e-05, + "loss": 2.8111, + "step": 70600 }, { - "epoch": 0.96, - "learning_rate": 1.8628124596727785e-06, - "loss": 2.1698, - "step": 552070 + "epoch": 0.25, + "learning_rate": 3.738180481240474e-05, + "loss": 2.8112, + "step": 70700 }, { - "epoch": 0.96, - "learning_rate": 1.8619405197459517e-06, - "loss": 2.2372, - "step": 552080 + "epoch": 0.25, + "learning_rate": 3.7363957294459063e-05, + "loss": 2.818, + "step": 70800 }, { - "epoch": 0.96, - "learning_rate": 1.8610685798191248e-06, - "loss": 2.1831, - "step": 552090 + "epoch": 0.25, + "learning_rate": 3.7346109776513385e-05, + "loss": 2.8037, + "step": 70900 }, { - "epoch": 0.96, - "learning_rate": 1.860196639892298e-06, - "loss": 2.3198, - "step": 552100 + "epoch": 0.25, + "learning_rate": 3.7328262258567706e-05, + "loss": 2.8099, + "step": 71000 }, { - "epoch": 0.96, - "learning_rate": 1.859324699965471e-06, - "loss": 2.1868, - "step": 552110 + "epoch": 0.25, + "learning_rate": 3.731041474062203e-05, + "loss": 2.8041, + "step": 71100 }, { - "epoch": 0.96, - "learning_rate": 1.8584527600386446e-06, - "loss": 2.2697, - "step": 552120 + "epoch": 0.25, + "learning_rate": 3.729256722267634e-05, + "loss": 2.8205, + "step": 71200 }, { - "epoch": 0.96, - "learning_rate": 1.8575808201118178e-06, - "loss": 2.1802, - "step": 552130 + "epoch": 0.25, + "learning_rate": 3.727471970473066e-05, + "loss": 2.8189, + "step": 71300 }, { - "epoch": 0.96, - "learning_rate": 1.856708880184991e-06, - "loss": 2.2026, - "step": 552140 + "epoch": 0.25, + "learning_rate": 3.7256872186784984e-05, + "loss": 2.8132, + "step": 71400 }, { - "epoch": 0.96, - "learning_rate": 1.855836940258164e-06, - "loss": 2.2473, - "step": 552150 + "epoch": 0.26, + "learning_rate": 3.7239024668839305e-05, + "loss": 2.8115, + "step": 71500 }, { - "epoch": 0.96, - "learning_rate": 1.8549650003313372e-06, - "loss": 2.3191, - "step": 552160 + "epoch": 0.26, + "learning_rate": 3.7221177150893626e-05, + "loss": 2.8013, + "step": 71600 }, { - "epoch": 0.96, - "learning_rate": 1.8540930604045103e-06, - "loss": 2.4016, - "step": 552170 + "epoch": 0.26, + "learning_rate": 3.720332963294795e-05, + "loss": 2.8026, + "step": 71700 }, { - "epoch": 0.96, - "learning_rate": 1.8532211204776834e-06, - "loss": 2.2182, - "step": 552180 + "epoch": 0.26, + "learning_rate": 3.718548211500227e-05, + "loss": 2.8047, + "step": 71800 }, { - "epoch": 0.96, - "learning_rate": 1.852349180550857e-06, - "loss": 2.2538, - "step": 552190 + "epoch": 0.26, + "learning_rate": 3.716763459705659e-05, + "loss": 2.8157, + "step": 71900 }, { - "epoch": 0.96, - "learning_rate": 1.8514772406240301e-06, - "loss": 2.2405, - "step": 552200 + "epoch": 0.26, + "learning_rate": 3.714978707911091e-05, + "loss": 2.814, + "step": 72000 }, { - "epoch": 0.96, - "learning_rate": 1.8506053006972033e-06, - "loss": 2.2943, - "step": 552210 + "epoch": 0.26, + "learning_rate": 3.713193956116523e-05, + "loss": 2.8161, + "step": 72100 }, { - "epoch": 0.96, - "learning_rate": 1.8497333607703764e-06, - "loss": 2.1779, - "step": 552220 + "epoch": 0.26, + "learning_rate": 3.7114092043219554e-05, + "loss": 2.8115, + "step": 72200 }, { - "epoch": 0.96, - "learning_rate": 1.8488614208435495e-06, - "loss": 2.3304, - "step": 552230 + "epoch": 0.26, + "learning_rate": 3.709624452527387e-05, + "loss": 2.8193, + "step": 72300 }, { - "epoch": 0.96, - "learning_rate": 1.8479894809167227e-06, - "loss": 2.3454, - "step": 552240 + "epoch": 0.26, + "learning_rate": 3.707839700732819e-05, + "loss": 2.8088, + "step": 72400 }, { - "epoch": 0.96, - "learning_rate": 1.8471175409898958e-06, - "loss": 2.1409, - "step": 552250 + "epoch": 0.26, + "learning_rate": 3.706054948938251e-05, + "loss": 2.804, + "step": 72500 }, { - "epoch": 0.96, - "learning_rate": 1.8462456010630694e-06, - "loss": 2.2056, - "step": 552260 + "epoch": 0.26, + "learning_rate": 3.704270197143683e-05, + "loss": 2.798, + "step": 72600 }, { - "epoch": 0.96, - "learning_rate": 1.8453736611362425e-06, - "loss": 2.2273, - "step": 552270 + "epoch": 0.26, + "learning_rate": 3.702485445349115e-05, + "loss": 2.8055, + "step": 72700 }, { - "epoch": 0.96, - "learning_rate": 1.8445017212094156e-06, - "loss": 2.2739, - "step": 552280 + "epoch": 0.26, + "learning_rate": 3.7007006935545474e-05, + "loss": 2.8116, + "step": 72800 }, { - "epoch": 0.96, - "learning_rate": 1.8436297812825888e-06, - "loss": 2.3057, - "step": 552290 + "epoch": 0.26, + "learning_rate": 3.6989159417599795e-05, + "loss": 2.8163, + "step": 72900 }, { - "epoch": 0.96, - "learning_rate": 1.842757841355762e-06, - "loss": 2.2, - "step": 552300 + "epoch": 0.26, + "learning_rate": 3.6971311899654117e-05, + "loss": 2.8096, + "step": 73000 }, { - "epoch": 0.96, - "learning_rate": 1.841885901428935e-06, - "loss": 2.2718, - "step": 552310 + "epoch": 0.26, + "learning_rate": 3.695346438170844e-05, + "loss": 2.8119, + "step": 73100 }, { - "epoch": 0.96, - "learning_rate": 1.8410139615021086e-06, - "loss": 2.1524, - "step": 552320 + "epoch": 0.26, + "learning_rate": 3.693561686376276e-05, + "loss": 2.8193, + "step": 73200 }, { - "epoch": 0.96, - "learning_rate": 1.8401420215752817e-06, - "loss": 2.3101, - "step": 552330 + "epoch": 0.26, + "learning_rate": 3.691776934581708e-05, + "loss": 2.8066, + "step": 73300 }, { - "epoch": 0.96, - "learning_rate": 1.8392700816484549e-06, - "loss": 2.1887, - "step": 552340 + "epoch": 0.26, + "learning_rate": 3.6899921827871395e-05, + "loss": 2.8117, + "step": 73400 }, { - "epoch": 0.96, - "learning_rate": 1.838398141721628e-06, - "loss": 2.3018, - "step": 552350 + "epoch": 0.26, + "learning_rate": 3.6882074309925716e-05, + "loss": 2.8091, + "step": 73500 }, { - "epoch": 0.96, - "learning_rate": 1.8375262017948011e-06, - "loss": 2.2816, - "step": 552360 + "epoch": 0.26, + "learning_rate": 3.686422679198004e-05, + "loss": 2.8075, + "step": 73600 }, { - "epoch": 0.96, - "learning_rate": 1.8366542618679743e-06, - "loss": 2.2158, - "step": 552370 + "epoch": 0.26, + "learning_rate": 3.684637927403436e-05, + "loss": 2.8055, + "step": 73700 }, { - "epoch": 0.96, - "learning_rate": 1.8357823219411474e-06, - "loss": 2.2361, - "step": 552380 + "epoch": 0.26, + "learning_rate": 3.682853175608868e-05, + "loss": 2.8076, + "step": 73800 }, { - "epoch": 0.96, - "learning_rate": 1.834910382014321e-06, - "loss": 2.2731, - "step": 552390 + "epoch": 0.26, + "learning_rate": 3.6810684238143e-05, + "loss": 2.8159, + "step": 73900 }, { - "epoch": 0.96, - "learning_rate": 1.834038442087494e-06, - "loss": 2.2669, - "step": 552400 + "epoch": 0.26, + "learning_rate": 3.679283672019732e-05, + "loss": 2.8066, + "step": 74000 }, { - "epoch": 0.96, - "learning_rate": 1.8331665021606672e-06, - "loss": 2.3504, - "step": 552410 + "epoch": 0.26, + "learning_rate": 3.677498920225165e-05, + "loss": 2.8005, + "step": 74100 }, { - "epoch": 0.96, - "learning_rate": 1.8322945622338404e-06, - "loss": 2.2293, - "step": 552420 + "epoch": 0.26, + "learning_rate": 3.675714168430597e-05, + "loss": 2.809, + "step": 74200 }, { - "epoch": 0.96, - "learning_rate": 1.8314226223070135e-06, - "loss": 2.2698, - "step": 552430 + "epoch": 0.27, + "learning_rate": 3.6739294166360286e-05, + "loss": 2.81, + "step": 74300 }, { - "epoch": 0.96, - "learning_rate": 1.8305506823801866e-06, - "loss": 2.2858, - "step": 552440 + "epoch": 0.27, + "learning_rate": 3.672144664841461e-05, + "loss": 2.7959, + "step": 74400 }, { - "epoch": 0.96, - "learning_rate": 1.8296787424533598e-06, - "loss": 2.2318, - "step": 552450 + "epoch": 0.27, + "learning_rate": 3.670359913046893e-05, + "loss": 2.7977, + "step": 74500 }, { - "epoch": 0.96, - "learning_rate": 1.8288068025265333e-06, - "loss": 2.3177, - "step": 552460 + "epoch": 0.27, + "learning_rate": 3.668575161252325e-05, + "loss": 2.8063, + "step": 74600 }, { - "epoch": 0.96, - "learning_rate": 1.8279348625997065e-06, - "loss": 2.2286, - "step": 552470 + "epoch": 0.27, + "learning_rate": 3.666790409457757e-05, + "loss": 2.811, + "step": 74700 }, { - "epoch": 0.96, - "learning_rate": 1.8270629226728796e-06, - "loss": 2.2512, - "step": 552480 + "epoch": 0.27, + "learning_rate": 3.665005657663189e-05, + "loss": 2.8095, + "step": 74800 }, { - "epoch": 0.96, - "learning_rate": 1.8261909827460527e-06, - "loss": 2.3272, - "step": 552490 + "epoch": 0.27, + "learning_rate": 3.663220905868621e-05, + "loss": 2.81, + "step": 74900 }, { - "epoch": 0.96, - "learning_rate": 1.8253190428192259e-06, - "loss": 2.2255, - "step": 552500 + "epoch": 0.27, + "learning_rate": 3.6614361540740534e-05, + "loss": 2.8034, + "step": 75000 }, { - "epoch": 0.96, - "learning_rate": 1.824447102892399e-06, - "loss": 2.1682, - "step": 552510 + "epoch": 0.27, + "learning_rate": 3.6596514022794855e-05, + "loss": 2.8054, + "step": 75100 }, { - "epoch": 0.96, - "learning_rate": 1.8235751629655726e-06, - "loss": 2.2626, - "step": 552520 + "epoch": 0.27, + "learning_rate": 3.6578666504849177e-05, + "loss": 2.8026, + "step": 75200 }, { - "epoch": 0.96, - "learning_rate": 1.8227032230387457e-06, - "loss": 2.1825, - "step": 552530 + "epoch": 0.27, + "learning_rate": 3.65608189869035e-05, + "loss": 2.8075, + "step": 75300 }, { - "epoch": 0.96, - "learning_rate": 1.8218312831119188e-06, - "loss": 2.3173, - "step": 552540 + "epoch": 0.27, + "learning_rate": 3.654297146895781e-05, + "loss": 2.8087, + "step": 75400 }, { - "epoch": 0.96, - "learning_rate": 1.820959343185092e-06, - "loss": 2.2592, - "step": 552550 + "epoch": 0.27, + "learning_rate": 3.6525123951012133e-05, + "loss": 2.7983, + "step": 75500 }, { - "epoch": 0.96, - "learning_rate": 1.820087403258265e-06, - "loss": 2.3082, - "step": 552560 + "epoch": 0.27, + "learning_rate": 3.6507276433066455e-05, + "loss": 2.8036, + "step": 75600 }, { - "epoch": 0.96, - "learning_rate": 1.8192154633314382e-06, - "loss": 2.2512, - "step": 552570 + "epoch": 0.27, + "learning_rate": 3.6489428915120776e-05, + "loss": 2.8184, + "step": 75700 }, { - "epoch": 0.96, - "learning_rate": 1.8183435234046114e-06, - "loss": 2.2687, - "step": 552580 + "epoch": 0.27, + "learning_rate": 3.64715813971751e-05, + "loss": 2.7996, + "step": 75800 }, { - "epoch": 0.96, - "learning_rate": 1.817471583477785e-06, - "loss": 2.2291, - "step": 552590 + "epoch": 0.27, + "learning_rate": 3.645373387922942e-05, + "loss": 2.8028, + "step": 75900 }, { - "epoch": 0.96, - "learning_rate": 1.816599643550958e-06, - "loss": 2.2665, - "step": 552600 + "epoch": 0.27, + "learning_rate": 3.643588636128374e-05, + "loss": 2.8051, + "step": 76000 }, { - "epoch": 0.96, - "learning_rate": 1.8157277036241312e-06, - "loss": 2.3579, - "step": 552610 + "epoch": 0.27, + "learning_rate": 3.641803884333806e-05, + "loss": 2.7947, + "step": 76100 }, { - "epoch": 0.96, - "learning_rate": 1.8148557636973043e-06, - "loss": 2.2447, - "step": 552620 + "epoch": 0.27, + "learning_rate": 3.640019132539238e-05, + "loss": 2.8027, + "step": 76200 }, { - "epoch": 0.96, - "learning_rate": 1.8139838237704775e-06, - "loss": 2.2538, - "step": 552630 + "epoch": 0.27, + "learning_rate": 3.63823438074467e-05, + "loss": 2.7995, + "step": 76300 }, { - "epoch": 0.96, - "learning_rate": 1.8131118838436506e-06, - "loss": 2.157, - "step": 552640 + "epoch": 0.27, + "learning_rate": 3.6364496289501024e-05, + "loss": 2.8027, + "step": 76400 }, { - "epoch": 0.96, - "learning_rate": 1.8122399439168237e-06, - "loss": 2.3167, - "step": 552650 + "epoch": 0.27, + "learning_rate": 3.634664877155534e-05, + "loss": 2.813, + "step": 76500 }, { - "epoch": 0.96, - "learning_rate": 1.8113680039899973e-06, - "loss": 2.427, - "step": 552660 + "epoch": 0.27, + "learning_rate": 3.632880125360966e-05, + "loss": 2.7952, + "step": 76600 }, { - "epoch": 0.96, - "learning_rate": 1.8104960640631704e-06, - "loss": 2.281, - "step": 552670 + "epoch": 0.27, + "learning_rate": 3.631095373566398e-05, + "loss": 2.8047, + "step": 76700 }, { - "epoch": 0.96, - "learning_rate": 1.8096241241363436e-06, - "loss": 2.2491, - "step": 552680 + "epoch": 0.27, + "learning_rate": 3.62931062177183e-05, + "loss": 2.8081, + "step": 76800 }, { - "epoch": 0.96, - "learning_rate": 1.8087521842095167e-06, - "loss": 2.2694, - "step": 552690 + "epoch": 0.27, + "learning_rate": 3.6275258699772624e-05, + "loss": 2.8098, + "step": 76900 }, { - "epoch": 0.96, - "learning_rate": 1.8078802442826898e-06, - "loss": 2.275, - "step": 552700 + "epoch": 0.27, + "learning_rate": 3.6257411181826945e-05, + "loss": 2.8081, + "step": 77000 }, { - "epoch": 0.96, - "learning_rate": 1.807008304355863e-06, - "loss": 2.3274, - "step": 552710 + "epoch": 0.28, + "learning_rate": 3.6239563663881266e-05, + "loss": 2.8029, + "step": 77100 }, { - "epoch": 0.96, - "learning_rate": 1.8061363644290365e-06, - "loss": 2.3189, - "step": 552720 + "epoch": 0.28, + "learning_rate": 3.622171614593559e-05, + "loss": 2.8009, + "step": 77200 }, { - "epoch": 0.96, - "learning_rate": 1.8052644245022097e-06, - "loss": 2.2287, - "step": 552730 + "epoch": 0.28, + "learning_rate": 3.620386862798991e-05, + "loss": 2.8057, + "step": 77300 }, { - "epoch": 0.96, - "learning_rate": 1.8043924845753828e-06, - "loss": 2.2174, - "step": 552740 + "epoch": 0.28, + "learning_rate": 3.618602111004423e-05, + "loss": 2.8088, + "step": 77400 }, { - "epoch": 0.96, - "learning_rate": 1.803520544648556e-06, - "loss": 2.2923, - "step": 552750 + "epoch": 0.28, + "learning_rate": 3.616817359209855e-05, + "loss": 2.8007, + "step": 77500 }, { - "epoch": 0.96, - "learning_rate": 1.802648604721729e-06, - "loss": 2.2849, - "step": 552760 + "epoch": 0.28, + "learning_rate": 3.6150326074152865e-05, + "loss": 2.8024, + "step": 77600 }, { - "epoch": 0.96, - "learning_rate": 1.8017766647949022e-06, - "loss": 2.2156, - "step": 552770 + "epoch": 0.28, + "learning_rate": 3.6132478556207187e-05, + "loss": 2.7984, + "step": 77700 }, { - "epoch": 0.96, - "learning_rate": 1.8009047248680753e-06, - "loss": 2.1536, - "step": 552780 + "epoch": 0.28, + "learning_rate": 3.611463103826151e-05, + "loss": 2.811, + "step": 77800 }, { - "epoch": 0.96, - "learning_rate": 1.8000327849412489e-06, - "loss": 2.2014, - "step": 552790 + "epoch": 0.28, + "learning_rate": 3.609678352031583e-05, + "loss": 2.7933, + "step": 77900 }, { - "epoch": 0.96, - "learning_rate": 1.799160845014422e-06, - "loss": 2.2737, - "step": 552800 + "epoch": 0.28, + "learning_rate": 3.607893600237015e-05, + "loss": 2.7904, + "step": 78000 }, { - "epoch": 0.96, - "learning_rate": 1.7982889050875952e-06, - "loss": 2.3023, - "step": 552810 + "epoch": 0.28, + "learning_rate": 3.606108848442447e-05, + "loss": 2.8006, + "step": 78100 }, { - "epoch": 0.96, - "learning_rate": 1.7974169651607683e-06, - "loss": 2.2478, - "step": 552820 + "epoch": 0.28, + "learning_rate": 3.604324096647879e-05, + "loss": 2.8043, + "step": 78200 }, { - "epoch": 0.96, - "learning_rate": 1.7965450252339414e-06, - "loss": 2.3029, - "step": 552830 + "epoch": 0.28, + "learning_rate": 3.6025393448533114e-05, + "loss": 2.7954, + "step": 78300 }, { - "epoch": 0.96, - "learning_rate": 1.7956730853071146e-06, - "loss": 2.3484, - "step": 552840 + "epoch": 0.28, + "learning_rate": 3.6007545930587435e-05, + "loss": 2.7991, + "step": 78400 }, { - "epoch": 0.96, - "learning_rate": 1.7948011453802881e-06, - "loss": 2.3055, - "step": 552850 + "epoch": 0.28, + "learning_rate": 3.5989698412641756e-05, + "loss": 2.8027, + "step": 78500 }, { - "epoch": 0.96, - "learning_rate": 1.7939292054534613e-06, - "loss": 2.2635, - "step": 552860 + "epoch": 0.28, + "learning_rate": 3.597185089469608e-05, + "loss": 2.8098, + "step": 78600 }, { - "epoch": 0.96, - "learning_rate": 1.7930572655266344e-06, - "loss": 2.3619, - "step": 552870 + "epoch": 0.28, + "learning_rate": 3.595400337675039e-05, + "loss": 2.8082, + "step": 78700 }, { - "epoch": 0.96, - "learning_rate": 1.7921853255998075e-06, - "loss": 2.1922, - "step": 552880 + "epoch": 0.28, + "learning_rate": 3.593615585880471e-05, + "loss": 2.7968, + "step": 78800 }, { - "epoch": 0.96, - "learning_rate": 1.7913133856729807e-06, - "loss": 2.2854, - "step": 552890 + "epoch": 0.28, + "learning_rate": 3.5918308340859034e-05, + "loss": 2.8025, + "step": 78900 }, { - "epoch": 0.96, - "learning_rate": 1.7904414457461538e-06, - "loss": 2.2297, - "step": 552900 + "epoch": 0.28, + "learning_rate": 3.5900460822913356e-05, + "loss": 2.7976, + "step": 79000 }, { - "epoch": 0.96, - "learning_rate": 1.789569505819327e-06, - "loss": 2.3282, - "step": 552910 + "epoch": 0.28, + "learning_rate": 3.588261330496768e-05, + "loss": 2.8049, + "step": 79100 }, { - "epoch": 0.96, - "learning_rate": 1.7886975658925005e-06, - "loss": 2.3598, - "step": 552920 + "epoch": 0.28, + "learning_rate": 3.5864765787022005e-05, + "loss": 2.8057, + "step": 79200 }, { - "epoch": 0.96, - "learning_rate": 1.7878256259656736e-06, - "loss": 2.3253, - "step": 552930 + "epoch": 0.28, + "learning_rate": 3.5846918269076326e-05, + "loss": 2.8104, + "step": 79300 }, { - "epoch": 0.96, - "learning_rate": 1.7869536860388468e-06, - "loss": 2.2163, - "step": 552940 + "epoch": 0.28, + "learning_rate": 3.582907075113065e-05, + "loss": 2.796, + "step": 79400 }, { - "epoch": 0.96, - "learning_rate": 1.7860817461120199e-06, - "loss": 2.3038, - "step": 552950 + "epoch": 0.28, + "learning_rate": 3.581122323318497e-05, + "loss": 2.8066, + "step": 79500 }, { - "epoch": 0.96, - "learning_rate": 1.785209806185193e-06, - "loss": 2.1539, - "step": 552960 + "epoch": 0.28, + "learning_rate": 3.579337571523928e-05, + "loss": 2.8091, + "step": 79600 }, { - "epoch": 0.96, - "learning_rate": 1.7843378662583662e-06, - "loss": 2.3165, - "step": 552970 + "epoch": 0.28, + "learning_rate": 3.5775528197293604e-05, + "loss": 2.8055, + "step": 79700 }, { - "epoch": 0.96, - "learning_rate": 1.7834659263315393e-06, - "loss": 2.2569, - "step": 552980 + "epoch": 0.28, + "learning_rate": 3.5757680679347925e-05, + "loss": 2.7998, + "step": 79800 }, { - "epoch": 0.96, - "learning_rate": 1.7825939864047129e-06, - "loss": 2.175, - "step": 552990 + "epoch": 0.29, + "learning_rate": 3.5739833161402247e-05, + "loss": 2.7972, + "step": 79900 }, { - "epoch": 0.96, - "learning_rate": 1.781722046477886e-06, - "loss": 2.325, - "step": 553000 + "epoch": 0.29, + "learning_rate": 3.572198564345657e-05, + "loss": 2.8224, + "step": 80000 }, { - "epoch": 0.96, - "learning_rate": 1.7808501065510591e-06, - "loss": 2.2807, - "step": 553010 + "epoch": 0.29, + "learning_rate": 3.570413812551089e-05, + "loss": 2.7974, + "step": 80100 }, { - "epoch": 0.96, - "learning_rate": 1.7799781666242323e-06, - "loss": 2.32, - "step": 553020 + "epoch": 0.29, + "learning_rate": 3.568629060756521e-05, + "loss": 2.803, + "step": 80200 }, { - "epoch": 0.96, - "learning_rate": 1.7791062266974054e-06, - "loss": 2.2674, - "step": 553030 + "epoch": 0.29, + "learning_rate": 3.566844308961953e-05, + "loss": 2.8, + "step": 80300 }, { - "epoch": 0.96, - "learning_rate": 1.7782342867705785e-06, - "loss": 2.3068, - "step": 553040 + "epoch": 0.29, + "learning_rate": 3.565059557167385e-05, + "loss": 2.8029, + "step": 80400 }, { - "epoch": 0.96, - "learning_rate": 1.777362346843752e-06, - "loss": 2.2626, - "step": 553050 + "epoch": 0.29, + "learning_rate": 3.5632748053728174e-05, + "loss": 2.7944, + "step": 80500 }, { - "epoch": 0.96, - "learning_rate": 1.7764904069169252e-06, - "loss": 2.2435, - "step": 553060 + "epoch": 0.29, + "learning_rate": 3.561490053578249e-05, + "loss": 2.7996, + "step": 80600 }, { - "epoch": 0.96, - "learning_rate": 1.7756184669900984e-06, - "loss": 2.2644, - "step": 553070 + "epoch": 0.29, + "learning_rate": 3.559705301783681e-05, + "loss": 2.8045, + "step": 80700 }, { - "epoch": 0.96, - "learning_rate": 1.7747465270632715e-06, - "loss": 2.267, - "step": 553080 + "epoch": 0.29, + "learning_rate": 3.557920549989113e-05, + "loss": 2.8062, + "step": 80800 }, { - "epoch": 0.96, - "learning_rate": 1.7738745871364446e-06, - "loss": 2.3047, - "step": 553090 + "epoch": 0.29, + "learning_rate": 3.556135798194545e-05, + "loss": 2.7918, + "step": 80900 }, { - "epoch": 0.96, - "learning_rate": 1.7730026472096178e-06, - "loss": 2.2573, - "step": 553100 + "epoch": 0.29, + "learning_rate": 3.554351046399977e-05, + "loss": 2.7998, + "step": 81000 }, { - "epoch": 0.96, - "learning_rate": 1.7721307072827909e-06, - "loss": 2.1954, - "step": 553110 + "epoch": 0.29, + "learning_rate": 3.5525662946054094e-05, + "loss": 2.8071, + "step": 81100 }, { - "epoch": 0.96, - "learning_rate": 1.7712587673559645e-06, - "loss": 2.1124, - "step": 553120 + "epoch": 0.29, + "learning_rate": 3.5507815428108416e-05, + "loss": 2.7921, + "step": 81200 }, { - "epoch": 0.96, - "learning_rate": 1.7703868274291376e-06, - "loss": 2.291, - "step": 553130 + "epoch": 0.29, + "learning_rate": 3.548996791016274e-05, + "loss": 2.7935, + "step": 81300 }, { - "epoch": 0.96, - "learning_rate": 1.7695148875023107e-06, - "loss": 2.323, - "step": 553140 + "epoch": 0.29, + "learning_rate": 3.547212039221706e-05, + "loss": 2.7901, + "step": 81400 }, { - "epoch": 0.96, - "learning_rate": 1.7686429475754839e-06, - "loss": 2.1658, - "step": 553150 + "epoch": 0.29, + "learning_rate": 3.545427287427138e-05, + "loss": 2.7961, + "step": 81500 }, { - "epoch": 0.96, - "learning_rate": 1.767771007648657e-06, - "loss": 2.1501, - "step": 553160 + "epoch": 0.29, + "learning_rate": 3.54364253563257e-05, + "loss": 2.8023, + "step": 81600 }, { - "epoch": 0.96, - "learning_rate": 1.7668990677218301e-06, - "loss": 2.241, - "step": 553170 + "epoch": 0.29, + "learning_rate": 3.5418577838380015e-05, + "loss": 2.7976, + "step": 81700 }, { - "epoch": 0.96, - "learning_rate": 1.7660271277950033e-06, - "loss": 2.2042, - "step": 553180 + "epoch": 0.29, + "learning_rate": 3.5400730320434336e-05, + "loss": 2.8003, + "step": 81800 }, { - "epoch": 0.96, - "learning_rate": 1.7651551878681768e-06, - "loss": 2.2815, - "step": 553190 + "epoch": 0.29, + "learning_rate": 3.538288280248866e-05, + "loss": 2.7947, + "step": 81900 }, { - "epoch": 0.96, - "learning_rate": 1.76428324794135e-06, - "loss": 2.2974, - "step": 553200 + "epoch": 0.29, + "learning_rate": 3.536503528454298e-05, + "loss": 2.7876, + "step": 82000 }, { - "epoch": 0.96, - "learning_rate": 1.763411308014523e-06, - "loss": 2.259, - "step": 553210 + "epoch": 0.29, + "learning_rate": 3.53471877665973e-05, + "loss": 2.8015, + "step": 82100 }, { - "epoch": 0.96, - "learning_rate": 1.7625393680876962e-06, - "loss": 2.2552, - "step": 553220 + "epoch": 0.29, + "learning_rate": 3.532934024865162e-05, + "loss": 2.8107, + "step": 82200 }, { - "epoch": 0.96, - "learning_rate": 1.7616674281608694e-06, - "loss": 2.1913, - "step": 553230 + "epoch": 0.29, + "learning_rate": 3.531149273070594e-05, + "loss": 2.7999, + "step": 82300 }, { - "epoch": 0.96, - "learning_rate": 1.7607954882340425e-06, - "loss": 2.211, - "step": 553240 + "epoch": 0.29, + "learning_rate": 3.529364521276026e-05, + "loss": 2.795, + "step": 82400 }, { - "epoch": 0.96, - "learning_rate": 1.759923548307216e-06, - "loss": 2.1047, - "step": 553250 + "epoch": 0.29, + "learning_rate": 3.5275797694814585e-05, + "loss": 2.7994, + "step": 82500 }, { - "epoch": 0.96, - "learning_rate": 1.7590516083803892e-06, - "loss": 2.2718, - "step": 553260 + "epoch": 0.29, + "learning_rate": 3.5257950176868906e-05, + "loss": 2.8099, + "step": 82600 }, { - "epoch": 0.96, - "learning_rate": 1.7581796684535623e-06, - "loss": 2.3275, - "step": 553270 + "epoch": 0.3, + "learning_rate": 3.524010265892323e-05, + "loss": 2.8062, + "step": 82700 }, { - "epoch": 0.96, - "learning_rate": 1.7573077285267355e-06, - "loss": 2.3052, - "step": 553280 + "epoch": 0.3, + "learning_rate": 3.522225514097754e-05, + "loss": 2.795, + "step": 82800 }, { - "epoch": 0.96, - "learning_rate": 1.7564357885999086e-06, - "loss": 2.3094, - "step": 553290 + "epoch": 0.3, + "learning_rate": 3.520440762303186e-05, + "loss": 2.8096, + "step": 82900 }, { - "epoch": 0.96, - "learning_rate": 1.7555638486730817e-06, - "loss": 2.3273, - "step": 553300 + "epoch": 0.3, + "learning_rate": 3.5186560105086184e-05, + "loss": 2.7915, + "step": 83000 }, { - "epoch": 0.96, - "learning_rate": 1.7546919087462549e-06, - "loss": 2.3653, - "step": 553310 + "epoch": 0.3, + "learning_rate": 3.5168712587140505e-05, + "loss": 2.7943, + "step": 83100 }, { - "epoch": 0.96, - "learning_rate": 1.7538199688194284e-06, - "loss": 2.2131, - "step": 553320 + "epoch": 0.3, + "learning_rate": 3.5150865069194826e-05, + "loss": 2.7945, + "step": 83200 }, { - "epoch": 0.96, - "learning_rate": 1.7529480288926015e-06, - "loss": 2.1681, - "step": 553330 + "epoch": 0.3, + "learning_rate": 3.513301755124915e-05, + "loss": 2.796, + "step": 83300 }, { - "epoch": 0.96, - "learning_rate": 1.7520760889657747e-06, - "loss": 2.131, - "step": 553340 + "epoch": 0.3, + "learning_rate": 3.511517003330347e-05, + "loss": 2.8073, + "step": 83400 }, { - "epoch": 0.96, - "learning_rate": 1.7512041490389478e-06, - "loss": 2.3241, - "step": 553350 + "epoch": 0.3, + "learning_rate": 3.509732251535779e-05, + "loss": 2.8, + "step": 83500 }, { - "epoch": 0.96, - "learning_rate": 1.750332209112121e-06, - "loss": 2.3555, - "step": 553360 + "epoch": 0.3, + "learning_rate": 3.507947499741211e-05, + "loss": 2.7775, + "step": 83600 }, { - "epoch": 0.97, - "learning_rate": 1.749460269185294e-06, - "loss": 2.3085, - "step": 553370 + "epoch": 0.3, + "learning_rate": 3.506162747946643e-05, + "loss": 2.8005, + "step": 83700 }, { - "epoch": 0.97, - "learning_rate": 1.7485883292584672e-06, - "loss": 2.2096, - "step": 553380 + "epoch": 0.3, + "learning_rate": 3.5043779961520754e-05, + "loss": 2.7855, + "step": 83800 }, { - "epoch": 0.97, - "learning_rate": 1.7477163893316408e-06, - "loss": 2.1571, - "step": 553390 + "epoch": 0.3, + "learning_rate": 3.502593244357507e-05, + "loss": 2.7942, + "step": 83900 }, { - "epoch": 0.97, - "learning_rate": 1.746844449404814e-06, - "loss": 2.3937, - "step": 553400 + "epoch": 0.3, + "learning_rate": 3.500808492562939e-05, + "loss": 2.7927, + "step": 84000 }, { - "epoch": 0.97, - "learning_rate": 1.745972509477987e-06, - "loss": 2.252, - "step": 553410 + "epoch": 0.3, + "learning_rate": 3.499023740768371e-05, + "loss": 2.7909, + "step": 84100 }, { - "epoch": 0.97, - "learning_rate": 1.7451005695511602e-06, - "loss": 2.2851, - "step": 553420 + "epoch": 0.3, + "learning_rate": 3.497238988973803e-05, + "loss": 2.7891, + "step": 84200 }, { - "epoch": 0.97, - "learning_rate": 1.7442286296243333e-06, - "loss": 2.3478, - "step": 553430 + "epoch": 0.3, + "learning_rate": 3.495454237179236e-05, + "loss": 2.7811, + "step": 84300 }, { - "epoch": 0.97, - "learning_rate": 1.7433566896975065e-06, - "loss": 2.1997, - "step": 553440 + "epoch": 0.3, + "learning_rate": 3.493669485384668e-05, + "loss": 2.7972, + "step": 84400 }, { - "epoch": 0.97, - "learning_rate": 1.74248474977068e-06, - "loss": 2.2476, - "step": 553450 + "epoch": 0.3, + "learning_rate": 3.4918847335901e-05, + "loss": 2.7969, + "step": 84500 }, { - "epoch": 0.97, - "learning_rate": 1.7416128098438531e-06, - "loss": 2.3198, - "step": 553460 + "epoch": 0.3, + "learning_rate": 3.490099981795532e-05, + "loss": 2.786, + "step": 84600 }, { - "epoch": 0.97, - "learning_rate": 1.7407408699170263e-06, - "loss": 2.1941, - "step": 553470 + "epoch": 0.3, + "learning_rate": 3.4883152300009645e-05, + "loss": 2.7791, + "step": 84700 }, { - "epoch": 0.97, - "learning_rate": 1.7398689299901994e-06, - "loss": 2.1799, - "step": 553480 + "epoch": 0.3, + "learning_rate": 3.486530478206396e-05, + "loss": 2.7897, + "step": 84800 }, { - "epoch": 0.97, - "learning_rate": 1.7389969900633726e-06, - "loss": 2.1985, - "step": 553490 + "epoch": 0.3, + "learning_rate": 3.484745726411828e-05, + "loss": 2.7829, + "step": 84900 }, { - "epoch": 0.97, - "learning_rate": 1.7381250501365457e-06, - "loss": 2.1746, - "step": 553500 + "epoch": 0.3, + "learning_rate": 3.48296097461726e-05, + "loss": 2.7877, + "step": 85000 }, { - "epoch": 0.97, - "learning_rate": 1.7372531102097188e-06, - "loss": 2.2752, - "step": 553510 + "epoch": 0.3, + "learning_rate": 3.481176222822692e-05, + "loss": 2.7965, + "step": 85100 }, { - "epoch": 0.97, - "learning_rate": 1.7363811702828924e-06, - "loss": 2.3473, - "step": 553520 + "epoch": 0.3, + "learning_rate": 3.4793914710281244e-05, + "loss": 2.7986, + "step": 85200 }, { - "epoch": 0.97, - "learning_rate": 1.7355092303560655e-06, - "loss": 2.3697, - "step": 553530 + "epoch": 0.3, + "learning_rate": 3.4776067192335565e-05, + "loss": 2.7859, + "step": 85300 }, { - "epoch": 0.97, - "learning_rate": 1.7346372904292386e-06, - "loss": 2.3522, - "step": 553540 + "epoch": 0.3, + "learning_rate": 3.4758219674389886e-05, + "loss": 2.7989, + "step": 85400 }, { - "epoch": 0.97, - "learning_rate": 1.7337653505024118e-06, - "loss": 2.2706, - "step": 553550 + "epoch": 0.31, + "learning_rate": 3.474037215644421e-05, + "loss": 2.7942, + "step": 85500 }, { - "epoch": 0.97, - "learning_rate": 1.732893410575585e-06, - "loss": 2.1929, - "step": 553560 + "epoch": 0.31, + "learning_rate": 3.472252463849853e-05, + "loss": 2.793, + "step": 85600 }, { - "epoch": 0.97, - "learning_rate": 1.732021470648758e-06, - "loss": 2.303, - "step": 553570 + "epoch": 0.31, + "learning_rate": 3.470467712055285e-05, + "loss": 2.7894, + "step": 85700 }, { - "epoch": 0.97, - "learning_rate": 1.7311495307219314e-06, - "loss": 2.1921, - "step": 553580 + "epoch": 0.31, + "learning_rate": 3.468682960260717e-05, + "loss": 2.7974, + "step": 85800 }, { - "epoch": 0.97, - "learning_rate": 1.7302775907951047e-06, - "loss": 2.3248, - "step": 553590 + "epoch": 0.31, + "learning_rate": 3.4668982084661486e-05, + "loss": 2.7912, + "step": 85900 }, { - "epoch": 0.97, - "learning_rate": 1.7294056508682779e-06, - "loss": 2.2501, - "step": 553600 + "epoch": 0.31, + "learning_rate": 3.465113456671581e-05, + "loss": 2.8016, + "step": 86000 }, { - "epoch": 0.97, - "learning_rate": 1.728533710941451e-06, - "loss": 2.2211, - "step": 553610 + "epoch": 0.31, + "learning_rate": 3.463328704877013e-05, + "loss": 2.7912, + "step": 86100 }, { - "epoch": 0.97, - "learning_rate": 1.7276617710146241e-06, - "loss": 2.2948, - "step": 553620 + "epoch": 0.31, + "learning_rate": 3.461543953082445e-05, + "loss": 2.7997, + "step": 86200 }, { - "epoch": 0.97, - "learning_rate": 1.7267898310877973e-06, - "loss": 2.2848, - "step": 553630 + "epoch": 0.31, + "learning_rate": 3.459759201287877e-05, + "loss": 2.7946, + "step": 86300 }, { - "epoch": 0.97, - "learning_rate": 1.7259178911609706e-06, - "loss": 2.181, - "step": 553640 + "epoch": 0.31, + "learning_rate": 3.457974449493309e-05, + "loss": 2.7986, + "step": 86400 }, { - "epoch": 0.97, - "learning_rate": 1.725045951234144e-06, - "loss": 2.3184, - "step": 553650 + "epoch": 0.31, + "learning_rate": 3.456189697698741e-05, + "loss": 2.7806, + "step": 86500 }, { - "epoch": 0.97, - "learning_rate": 1.7241740113073171e-06, - "loss": 2.1916, - "step": 553660 + "epoch": 0.31, + "learning_rate": 3.4544049459041734e-05, + "loss": 2.8009, + "step": 86600 }, { - "epoch": 0.97, - "learning_rate": 1.7233020713804902e-06, - "loss": 2.2737, - "step": 553670 + "epoch": 0.31, + "learning_rate": 3.4526201941096055e-05, + "loss": 2.7881, + "step": 86700 }, { - "epoch": 0.97, - "learning_rate": 1.7224301314536634e-06, - "loss": 2.3077, - "step": 553680 + "epoch": 0.31, + "learning_rate": 3.4508354423150376e-05, + "loss": 2.7896, + "step": 86800 }, { - "epoch": 0.97, - "learning_rate": 1.7215581915268365e-06, - "loss": 2.2741, - "step": 553690 + "epoch": 0.31, + "learning_rate": 3.44905069052047e-05, + "loss": 2.7916, + "step": 86900 }, { - "epoch": 0.97, - "learning_rate": 1.7206862516000096e-06, - "loss": 2.181, - "step": 553700 + "epoch": 0.31, + "learning_rate": 3.447265938725901e-05, + "loss": 2.7909, + "step": 87000 }, { - "epoch": 0.97, - "learning_rate": 1.719814311673183e-06, - "loss": 2.3821, - "step": 553710 + "epoch": 0.31, + "learning_rate": 3.445481186931333e-05, + "loss": 2.7981, + "step": 87100 }, { - "epoch": 0.97, - "learning_rate": 1.7189423717463563e-06, - "loss": 2.1242, - "step": 553720 + "epoch": 0.31, + "learning_rate": 3.4436964351367655e-05, + "loss": 2.7981, + "step": 87200 }, { - "epoch": 0.97, - "learning_rate": 1.7180704318195295e-06, - "loss": 2.1756, - "step": 553730 + "epoch": 0.31, + "learning_rate": 3.4419116833421976e-05, + "loss": 2.7944, + "step": 87300 }, { - "epoch": 0.97, - "learning_rate": 1.7171984918927026e-06, - "loss": 2.2809, - "step": 553740 + "epoch": 0.31, + "learning_rate": 3.44012693154763e-05, + "loss": 2.7774, + "step": 87400 }, { - "epoch": 0.97, - "learning_rate": 1.7163265519658757e-06, - "loss": 2.1752, - "step": 553750 + "epoch": 0.31, + "learning_rate": 3.438342179753062e-05, + "loss": 2.7957, + "step": 87500 }, { - "epoch": 0.97, - "learning_rate": 1.7154546120390489e-06, - "loss": 2.3747, - "step": 553760 + "epoch": 0.31, + "learning_rate": 3.436557427958494e-05, + "loss": 2.7897, + "step": 87600 }, { - "epoch": 0.97, - "learning_rate": 1.7145826721122222e-06, - "loss": 2.2294, - "step": 553770 + "epoch": 0.31, + "learning_rate": 3.434772676163926e-05, + "loss": 2.7931, + "step": 87700 }, { - "epoch": 0.97, - "learning_rate": 1.7137107321853954e-06, - "loss": 2.2404, - "step": 553780 + "epoch": 0.31, + "learning_rate": 3.432987924369358e-05, + "loss": 2.8006, + "step": 87800 }, { - "epoch": 0.97, - "learning_rate": 1.7128387922585687e-06, - "loss": 2.2205, - "step": 553790 + "epoch": 0.31, + "learning_rate": 3.43120317257479e-05, + "loss": 2.7896, + "step": 87900 }, { - "epoch": 0.97, - "learning_rate": 1.7119668523317418e-06, - "loss": 2.1693, - "step": 553800 + "epoch": 0.31, + "learning_rate": 3.4294184207802224e-05, + "loss": 2.7926, + "step": 88000 }, { - "epoch": 0.97, - "learning_rate": 1.711094912404915e-06, - "loss": 2.2301, - "step": 553810 + "epoch": 0.31, + "learning_rate": 3.427633668985654e-05, + "loss": 2.7889, + "step": 88100 }, { - "epoch": 0.97, - "learning_rate": 1.7102229724780881e-06, - "loss": 2.2516, - "step": 553820 + "epoch": 0.31, + "learning_rate": 3.425848917191086e-05, + "loss": 2.7929, + "step": 88200 }, { - "epoch": 0.97, - "learning_rate": 1.7093510325512612e-06, - "loss": 2.2237, - "step": 553830 + "epoch": 0.32, + "learning_rate": 3.424064165396518e-05, + "loss": 2.8003, + "step": 88300 }, { - "epoch": 0.97, - "learning_rate": 1.7084790926244346e-06, - "loss": 2.1335, - "step": 553840 + "epoch": 0.32, + "learning_rate": 3.42227941360195e-05, + "loss": 2.7875, + "step": 88400 }, { - "epoch": 0.97, - "learning_rate": 1.707607152697608e-06, - "loss": 2.2342, - "step": 553850 + "epoch": 0.32, + "learning_rate": 3.4204946618073824e-05, + "loss": 2.7897, + "step": 88500 }, { - "epoch": 0.97, - "learning_rate": 1.706735212770781e-06, - "loss": 2.2849, - "step": 553860 + "epoch": 0.32, + "learning_rate": 3.4187099100128145e-05, + "loss": 2.7913, + "step": 88600 }, { - "epoch": 0.97, - "learning_rate": 1.7058632728439542e-06, - "loss": 2.3399, - "step": 553870 + "epoch": 0.32, + "learning_rate": 3.4169251582182466e-05, + "loss": 2.7967, + "step": 88700 }, { - "epoch": 0.97, - "learning_rate": 1.7049913329171273e-06, - "loss": 2.2417, - "step": 553880 + "epoch": 0.32, + "learning_rate": 3.415140406423679e-05, + "loss": 2.7979, + "step": 88800 }, { - "epoch": 0.97, - "learning_rate": 1.7041193929903005e-06, - "loss": 2.3057, - "step": 553890 + "epoch": 0.32, + "learning_rate": 3.413355654629111e-05, + "loss": 2.7955, + "step": 88900 }, { - "epoch": 0.97, - "learning_rate": 1.7032474530634738e-06, - "loss": 2.4038, - "step": 553900 + "epoch": 0.32, + "learning_rate": 3.411570902834543e-05, + "loss": 2.7939, + "step": 89000 }, { - "epoch": 0.97, - "learning_rate": 1.702375513136647e-06, - "loss": 2.2919, - "step": 553910 + "epoch": 0.32, + "learning_rate": 3.409786151039975e-05, + "loss": 2.7744, + "step": 89100 }, { - "epoch": 0.97, - "learning_rate": 1.7015035732098203e-06, - "loss": 2.3155, - "step": 553920 + "epoch": 0.32, + "learning_rate": 3.4080013992454065e-05, + "loss": 2.7845, + "step": 89200 }, { - "epoch": 0.97, - "learning_rate": 1.7006316332829934e-06, - "loss": 2.2119, - "step": 553930 + "epoch": 0.32, + "learning_rate": 3.4062166474508387e-05, + "loss": 2.7793, + "step": 89300 }, { - "epoch": 0.97, - "learning_rate": 1.6997596933561666e-06, - "loss": 2.3619, - "step": 553940 + "epoch": 0.32, + "learning_rate": 3.4044318956562715e-05, + "loss": 2.7996, + "step": 89400 }, { - "epoch": 0.97, - "learning_rate": 1.6988877534293397e-06, - "loss": 2.294, - "step": 553950 + "epoch": 0.32, + "learning_rate": 3.4026471438617036e-05, + "loss": 2.7876, + "step": 89500 }, { - "epoch": 0.97, - "learning_rate": 1.6980158135025128e-06, - "loss": 2.2218, - "step": 553960 + "epoch": 0.32, + "learning_rate": 3.400862392067136e-05, + "loss": 2.7879, + "step": 89600 }, { - "epoch": 0.97, - "learning_rate": 1.6971438735756862e-06, - "loss": 2.3403, - "step": 553970 + "epoch": 0.32, + "learning_rate": 3.399077640272568e-05, + "loss": 2.7849, + "step": 89700 }, { - "epoch": 0.97, - "learning_rate": 1.6962719336488593e-06, - "loss": 2.2258, - "step": 553980 + "epoch": 0.32, + "learning_rate": 3.397292888478e-05, + "loss": 2.7854, + "step": 89800 }, { - "epoch": 0.97, - "learning_rate": 1.6953999937220327e-06, - "loss": 2.2204, - "step": 553990 + "epoch": 0.32, + "learning_rate": 3.395508136683432e-05, + "loss": 2.7948, + "step": 89900 }, { - "epoch": 0.97, - "learning_rate": 1.6945280537952058e-06, - "loss": 2.1147, - "step": 554000 + "epoch": 0.32, + "learning_rate": 3.393723384888864e-05, + "loss": 2.7837, + "step": 90000 }, { - "epoch": 0.97, - "learning_rate": 1.693656113868379e-06, - "loss": 2.2985, - "step": 554010 + "epoch": 0.32, + "learning_rate": 3.3919386330942956e-05, + "loss": 2.7937, + "step": 90100 }, { - "epoch": 0.97, - "learning_rate": 1.692784173941552e-06, - "loss": 2.252, - "step": 554020 + "epoch": 0.32, + "learning_rate": 3.390153881299728e-05, + "loss": 2.787, + "step": 90200 }, { - "epoch": 0.97, - "learning_rate": 1.6919122340147254e-06, - "loss": 2.2344, - "step": 554030 + "epoch": 0.32, + "learning_rate": 3.38836912950516e-05, + "loss": 2.7907, + "step": 90300 }, { - "epoch": 0.97, - "learning_rate": 1.6910402940878986e-06, - "loss": 2.318, - "step": 554040 + "epoch": 0.32, + "learning_rate": 3.386584377710592e-05, + "loss": 2.7884, + "step": 90400 }, { - "epoch": 0.97, - "learning_rate": 1.690168354161072e-06, - "loss": 2.3401, - "step": 554050 + "epoch": 0.32, + "learning_rate": 3.384799625916024e-05, + "loss": 2.7879, + "step": 90500 }, { - "epoch": 0.97, - "learning_rate": 1.689296414234245e-06, - "loss": 2.2197, - "step": 554060 + "epoch": 0.32, + "learning_rate": 3.383014874121456e-05, + "loss": 2.8006, + "step": 90600 }, { - "epoch": 0.97, - "learning_rate": 1.6884244743074182e-06, - "loss": 2.1917, - "step": 554070 + "epoch": 0.32, + "learning_rate": 3.3812301223268884e-05, + "loss": 2.8, + "step": 90700 }, { - "epoch": 0.97, - "learning_rate": 1.6875525343805913e-06, - "loss": 2.2286, - "step": 554080 + "epoch": 0.32, + "learning_rate": 3.3794453705323205e-05, + "loss": 2.7887, + "step": 90800 }, { - "epoch": 0.97, - "learning_rate": 1.6866805944537644e-06, - "loss": 2.2192, - "step": 554090 + "epoch": 0.32, + "learning_rate": 3.3776606187377526e-05, + "loss": 2.7826, + "step": 90900 }, { - "epoch": 0.97, - "learning_rate": 1.6858086545269378e-06, - "loss": 2.1195, - "step": 554100 + "epoch": 0.32, + "learning_rate": 3.375875866943185e-05, + "loss": 2.7828, + "step": 91000 }, { - "epoch": 0.97, - "learning_rate": 1.684936714600111e-06, - "loss": 2.3637, - "step": 554110 + "epoch": 0.33, + "learning_rate": 3.374091115148617e-05, + "loss": 2.7941, + "step": 91100 }, { - "epoch": 0.97, - "learning_rate": 1.6840647746732843e-06, - "loss": 2.2766, - "step": 554120 + "epoch": 0.33, + "learning_rate": 3.372306363354048e-05, + "loss": 2.7942, + "step": 91200 }, { - "epoch": 0.97, - "learning_rate": 1.6831928347464574e-06, - "loss": 2.3601, - "step": 554130 + "epoch": 0.33, + "learning_rate": 3.3705216115594804e-05, + "loss": 2.7859, + "step": 91300 }, { - "epoch": 0.97, - "learning_rate": 1.6823208948196305e-06, - "loss": 2.1361, - "step": 554140 + "epoch": 0.33, + "learning_rate": 3.3687368597649125e-05, + "loss": 2.7765, + "step": 91400 }, { - "epoch": 0.97, - "learning_rate": 1.6814489548928037e-06, - "loss": 2.1989, - "step": 554150 + "epoch": 0.33, + "learning_rate": 3.3669521079703446e-05, + "loss": 2.7843, + "step": 91500 }, { - "epoch": 0.97, - "learning_rate": 1.680577014965977e-06, - "loss": 2.227, - "step": 554160 + "epoch": 0.33, + "learning_rate": 3.365167356175777e-05, + "loss": 2.7845, + "step": 91600 }, { - "epoch": 0.97, - "learning_rate": 1.6797050750391502e-06, - "loss": 2.2987, - "step": 554170 + "epoch": 0.33, + "learning_rate": 3.363382604381209e-05, + "loss": 2.7959, + "step": 91700 }, { - "epoch": 0.97, - "learning_rate": 1.6788331351123235e-06, - "loss": 2.1902, - "step": 554180 + "epoch": 0.33, + "learning_rate": 3.361597852586641e-05, + "loss": 2.7833, + "step": 91800 }, { - "epoch": 0.97, - "learning_rate": 1.6779611951854966e-06, - "loss": 2.3424, - "step": 554190 + "epoch": 0.33, + "learning_rate": 3.359813100792073e-05, + "loss": 2.7813, + "step": 91900 }, { - "epoch": 0.97, - "learning_rate": 1.6770892552586698e-06, - "loss": 2.301, - "step": 554200 + "epoch": 0.33, + "learning_rate": 3.358028348997505e-05, + "loss": 2.7833, + "step": 92000 }, { - "epoch": 0.97, - "learning_rate": 1.676217315331843e-06, - "loss": 2.1808, - "step": 554210 + "epoch": 0.33, + "learning_rate": 3.3562435972029374e-05, + "loss": 2.7833, + "step": 92100 }, { - "epoch": 0.97, - "learning_rate": 1.675345375405016e-06, - "loss": 2.2922, - "step": 554220 + "epoch": 0.33, + "learning_rate": 3.3544588454083695e-05, + "loss": 2.7922, + "step": 92200 }, { - "epoch": 0.97, - "learning_rate": 1.6744734354781894e-06, - "loss": 2.3374, - "step": 554230 + "epoch": 0.33, + "learning_rate": 3.352674093613801e-05, + "loss": 2.7835, + "step": 92300 }, { - "epoch": 0.97, - "learning_rate": 1.6736014955513625e-06, - "loss": 2.3415, - "step": 554240 + "epoch": 0.33, + "learning_rate": 3.350889341819233e-05, + "loss": 2.7863, + "step": 92400 }, { - "epoch": 0.97, - "learning_rate": 1.6727295556245359e-06, - "loss": 2.2748, - "step": 554250 + "epoch": 0.33, + "learning_rate": 3.349104590024665e-05, + "loss": 2.7915, + "step": 92500 }, { - "epoch": 0.97, - "learning_rate": 1.671857615697709e-06, - "loss": 2.2454, - "step": 554260 + "epoch": 0.33, + "learning_rate": 3.347319838230097e-05, + "loss": 2.7777, + "step": 92600 }, { - "epoch": 0.97, - "learning_rate": 1.6709856757708821e-06, - "loss": 2.2884, - "step": 554270 + "epoch": 0.33, + "learning_rate": 3.3455350864355294e-05, + "loss": 2.7776, + "step": 92700 }, { - "epoch": 0.97, - "learning_rate": 1.6701137358440553e-06, - "loss": 2.2739, - "step": 554280 + "epoch": 0.33, + "learning_rate": 3.3437503346409615e-05, + "loss": 2.7845, + "step": 92800 }, { - "epoch": 0.97, - "learning_rate": 1.6692417959172286e-06, - "loss": 2.1906, - "step": 554290 + "epoch": 0.33, + "learning_rate": 3.341965582846394e-05, + "loss": 2.7885, + "step": 92900 }, { - "epoch": 0.97, - "learning_rate": 1.6683698559904018e-06, - "loss": 2.3138, - "step": 554300 + "epoch": 0.33, + "learning_rate": 3.340180831051826e-05, + "loss": 2.7868, + "step": 93000 }, { - "epoch": 0.97, - "learning_rate": 1.6674979160635749e-06, - "loss": 2.1153, - "step": 554310 + "epoch": 0.33, + "learning_rate": 3.338396079257258e-05, + "loss": 2.7877, + "step": 93100 }, { - "epoch": 0.97, - "learning_rate": 1.6666259761367482e-06, - "loss": 2.2674, - "step": 554320 + "epoch": 0.33, + "learning_rate": 3.33661132746269e-05, + "loss": 2.7766, + "step": 93200 }, { - "epoch": 0.97, - "learning_rate": 1.6657540362099214e-06, - "loss": 2.3433, - "step": 554330 + "epoch": 0.33, + "learning_rate": 3.334826575668122e-05, + "loss": 2.777, + "step": 93300 }, { - "epoch": 0.97, - "learning_rate": 1.6648820962830945e-06, - "loss": 2.3748, - "step": 554340 + "epoch": 0.33, + "learning_rate": 3.3330418238735536e-05, + "loss": 2.7879, + "step": 93400 }, { - "epoch": 0.97, - "learning_rate": 1.6640101563562676e-06, - "loss": 2.2691, - "step": 554350 + "epoch": 0.33, + "learning_rate": 3.331257072078986e-05, + "loss": 2.7862, + "step": 93500 }, { - "epoch": 0.97, - "learning_rate": 1.663138216429441e-06, - "loss": 2.2277, - "step": 554360 + "epoch": 0.33, + "learning_rate": 3.329472320284418e-05, + "loss": 2.7689, + "step": 93600 }, { - "epoch": 0.97, - "learning_rate": 1.6622662765026141e-06, - "loss": 2.3055, - "step": 554370 + "epoch": 0.33, + "learning_rate": 3.32768756848985e-05, + "loss": 2.7883, + "step": 93700 }, { - "epoch": 0.97, - "learning_rate": 1.6613943365757875e-06, - "loss": 2.2573, - "step": 554380 + "epoch": 0.33, + "learning_rate": 3.325902816695282e-05, + "loss": 2.7862, + "step": 93800 }, { - "epoch": 0.97, - "learning_rate": 1.6605223966489606e-06, - "loss": 2.244, - "step": 554390 + "epoch": 0.34, + "learning_rate": 3.324118064900714e-05, + "loss": 2.789, + "step": 93900 }, { - "epoch": 0.97, - "learning_rate": 1.6596504567221337e-06, - "loss": 2.273, - "step": 554400 + "epoch": 0.34, + "learning_rate": 3.322333313106146e-05, + "loss": 2.7981, + "step": 94000 }, { - "epoch": 0.97, - "learning_rate": 1.6587785167953069e-06, - "loss": 2.2629, - "step": 554410 + "epoch": 0.34, + "learning_rate": 3.3205485613115785e-05, + "loss": 2.78, + "step": 94100 }, { - "epoch": 0.97, - "learning_rate": 1.6579065768684802e-06, - "loss": 2.2635, - "step": 554420 + "epoch": 0.34, + "learning_rate": 3.3187638095170106e-05, + "loss": 2.7938, + "step": 94200 }, { - "epoch": 0.97, - "learning_rate": 1.6570346369416533e-06, - "loss": 2.243, - "step": 554430 + "epoch": 0.34, + "learning_rate": 3.316979057722443e-05, + "loss": 2.7848, + "step": 94300 }, { - "epoch": 0.97, - "learning_rate": 1.6561626970148265e-06, - "loss": 2.2626, - "step": 554440 + "epoch": 0.34, + "learning_rate": 3.315194305927875e-05, + "loss": 2.7788, + "step": 94400 }, { - "epoch": 0.97, - "learning_rate": 1.6552907570879998e-06, - "loss": 2.2504, - "step": 554450 + "epoch": 0.34, + "learning_rate": 3.313409554133307e-05, + "loss": 2.7731, + "step": 94500 }, { - "epoch": 0.97, - "learning_rate": 1.654418817161173e-06, - "loss": 2.254, - "step": 554460 + "epoch": 0.34, + "learning_rate": 3.311624802338739e-05, + "loss": 2.7879, + "step": 94600 }, { - "epoch": 0.97, - "learning_rate": 1.653546877234346e-06, - "loss": 2.2493, - "step": 554470 + "epoch": 0.34, + "learning_rate": 3.309840050544171e-05, + "loss": 2.7804, + "step": 94700 }, { - "epoch": 0.97, - "learning_rate": 1.6526749373075192e-06, - "loss": 2.2131, - "step": 554480 + "epoch": 0.34, + "learning_rate": 3.308055298749603e-05, + "loss": 2.7745, + "step": 94800 }, { - "epoch": 0.97, - "learning_rate": 1.6518029973806926e-06, - "loss": 2.2277, - "step": 554490 + "epoch": 0.34, + "learning_rate": 3.3062705469550354e-05, + "loss": 2.7767, + "step": 94900 }, { - "epoch": 0.97, - "learning_rate": 1.6509310574538657e-06, - "loss": 2.1969, - "step": 554500 + "epoch": 0.34, + "learning_rate": 3.3044857951604675e-05, + "loss": 2.7902, + "step": 95000 }, { - "epoch": 0.97, - "learning_rate": 1.6500591175270388e-06, - "loss": 2.2662, - "step": 554510 + "epoch": 0.34, + "learning_rate": 3.3027010433659e-05, + "loss": 2.7728, + "step": 95100 }, { - "epoch": 0.97, - "learning_rate": 1.6491871776002122e-06, - "loss": 2.2429, - "step": 554520 + "epoch": 0.34, + "learning_rate": 3.300916291571332e-05, + "loss": 2.7857, + "step": 95200 }, { - "epoch": 0.97, - "learning_rate": 1.6483152376733853e-06, - "loss": 2.2458, - "step": 554530 + "epoch": 0.34, + "learning_rate": 3.299131539776764e-05, + "loss": 2.7792, + "step": 95300 }, { - "epoch": 0.97, - "learning_rate": 1.6474432977465585e-06, - "loss": 2.264, - "step": 554540 + "epoch": 0.34, + "learning_rate": 3.2973467879821954e-05, + "loss": 2.7858, + "step": 95400 }, { - "epoch": 0.97, - "learning_rate": 1.6465713578197318e-06, - "loss": 2.2421, - "step": 554550 + "epoch": 0.34, + "learning_rate": 3.2955620361876275e-05, + "loss": 2.7917, + "step": 95500 }, { - "epoch": 0.97, - "learning_rate": 1.645699417892905e-06, - "loss": 2.229, - "step": 554560 + "epoch": 0.34, + "learning_rate": 3.2937772843930596e-05, + "loss": 2.7761, + "step": 95600 }, { - "epoch": 0.97, - "learning_rate": 1.644827477966078e-06, - "loss": 2.259, - "step": 554570 + "epoch": 0.34, + "learning_rate": 3.291992532598492e-05, + "loss": 2.7859, + "step": 95700 }, { - "epoch": 0.97, - "learning_rate": 1.6439555380392514e-06, - "loss": 2.3506, - "step": 554580 + "epoch": 0.34, + "learning_rate": 3.290207780803924e-05, + "loss": 2.7807, + "step": 95800 }, { - "epoch": 0.97, - "learning_rate": 1.6430835981124246e-06, - "loss": 2.12, - "step": 554590 + "epoch": 0.34, + "learning_rate": 3.288423029009356e-05, + "loss": 2.7925, + "step": 95900 }, { - "epoch": 0.97, - "learning_rate": 1.6422116581855977e-06, - "loss": 2.1462, - "step": 554600 + "epoch": 0.34, + "learning_rate": 3.286638277214788e-05, + "loss": 2.7724, + "step": 96000 }, { - "epoch": 0.97, - "learning_rate": 1.6413397182587708e-06, - "loss": 2.2328, - "step": 554610 + "epoch": 0.34, + "learning_rate": 3.28485352542022e-05, + "loss": 2.7807, + "step": 96100 }, { - "epoch": 0.97, - "learning_rate": 1.6404677783319442e-06, - "loss": 2.2884, - "step": 554620 + "epoch": 0.34, + "learning_rate": 3.283068773625652e-05, + "loss": 2.7829, + "step": 96200 }, { - "epoch": 0.97, - "learning_rate": 1.6395958384051173e-06, - "loss": 2.3023, - "step": 554630 + "epoch": 0.34, + "learning_rate": 3.2812840218310844e-05, + "loss": 2.7864, + "step": 96300 }, { - "epoch": 0.97, - "learning_rate": 1.6387238984782904e-06, - "loss": 2.2997, - "step": 554640 + "epoch": 0.34, + "learning_rate": 3.2794992700365166e-05, + "loss": 2.7896, + "step": 96400 }, { - "epoch": 0.97, - "learning_rate": 1.6378519585514638e-06, - "loss": 2.2715, - "step": 554650 + "epoch": 0.34, + "learning_rate": 3.277714518241948e-05, + "loss": 2.7769, + "step": 96500 }, { - "epoch": 0.97, - "learning_rate": 1.636980018624637e-06, - "loss": 2.212, - "step": 554660 + "epoch": 0.34, + "learning_rate": 3.27592976644738e-05, + "loss": 2.7887, + "step": 96600 }, { - "epoch": 0.97, - "learning_rate": 1.63610807869781e-06, - "loss": 2.2865, - "step": 554670 + "epoch": 0.35, + "learning_rate": 3.274145014652812e-05, + "loss": 2.7704, + "step": 96700 }, { - "epoch": 0.97, - "learning_rate": 1.6352361387709834e-06, - "loss": 2.2824, - "step": 554680 + "epoch": 0.35, + "learning_rate": 3.2723602628582444e-05, + "loss": 2.784, + "step": 96800 }, { - "epoch": 0.97, - "learning_rate": 1.6343641988441565e-06, - "loss": 2.2597, - "step": 554690 + "epoch": 0.35, + "learning_rate": 3.2705755110636765e-05, + "loss": 2.7876, + "step": 96900 }, { - "epoch": 0.97, - "learning_rate": 1.6334922589173297e-06, - "loss": 2.225, - "step": 554700 + "epoch": 0.35, + "learning_rate": 3.2687907592691086e-05, + "loss": 2.7886, + "step": 97000 }, { - "epoch": 0.97, - "learning_rate": 1.6326203189905028e-06, - "loss": 2.2208, - "step": 554710 + "epoch": 0.35, + "learning_rate": 3.267006007474541e-05, + "loss": 2.7802, + "step": 97100 }, { - "epoch": 0.97, - "learning_rate": 1.6317483790636762e-06, - "loss": 2.251, - "step": 554720 + "epoch": 0.35, + "learning_rate": 3.265221255679973e-05, + "loss": 2.7813, + "step": 97200 }, { - "epoch": 0.97, - "learning_rate": 1.6308764391368493e-06, - "loss": 2.316, - "step": 554730 + "epoch": 0.35, + "learning_rate": 3.263436503885405e-05, + "loss": 2.7827, + "step": 97300 }, { - "epoch": 0.97, - "learning_rate": 1.6300044992100224e-06, - "loss": 2.246, - "step": 554740 + "epoch": 0.35, + "learning_rate": 3.261651752090837e-05, + "loss": 2.7824, + "step": 97400 }, { - "epoch": 0.97, - "learning_rate": 1.6291325592831958e-06, - "loss": 2.1604, - "step": 554750 + "epoch": 0.35, + "learning_rate": 3.259867000296269e-05, + "loss": 2.7709, + "step": 97500 }, { - "epoch": 0.97, - "learning_rate": 1.628260619356369e-06, - "loss": 2.2608, - "step": 554760 + "epoch": 0.35, + "learning_rate": 3.258082248501701e-05, + "loss": 2.7766, + "step": 97600 }, { - "epoch": 0.97, - "learning_rate": 1.627388679429542e-06, - "loss": 2.2199, - "step": 554770 + "epoch": 0.35, + "learning_rate": 3.256297496707133e-05, + "loss": 2.7816, + "step": 97700 }, { - "epoch": 0.97, - "learning_rate": 1.6265167395027154e-06, - "loss": 2.3545, - "step": 554780 + "epoch": 0.35, + "learning_rate": 3.254512744912565e-05, + "loss": 2.774, + "step": 97800 }, { - "epoch": 0.97, - "learning_rate": 1.6256447995758885e-06, - "loss": 2.2729, - "step": 554790 + "epoch": 0.35, + "learning_rate": 3.252727993117997e-05, + "loss": 2.7819, + "step": 97900 }, { - "epoch": 0.97, - "learning_rate": 1.6247728596490617e-06, - "loss": 2.2121, - "step": 554800 + "epoch": 0.35, + "learning_rate": 3.250943241323429e-05, + "loss": 2.7736, + "step": 98000 }, { - "epoch": 0.97, - "learning_rate": 1.623900919722235e-06, - "loss": 2.3864, - "step": 554810 + "epoch": 0.35, + "learning_rate": 3.249158489528861e-05, + "loss": 2.7824, + "step": 98100 }, { - "epoch": 0.97, - "learning_rate": 1.6230289797954081e-06, - "loss": 2.3141, - "step": 554820 + "epoch": 0.35, + "learning_rate": 3.2473737377342934e-05, + "loss": 2.7786, + "step": 98200 }, { - "epoch": 0.97, - "learning_rate": 1.6221570398685813e-06, - "loss": 2.1324, - "step": 554830 + "epoch": 0.35, + "learning_rate": 3.2455889859397255e-05, + "loss": 2.7774, + "step": 98300 }, { - "epoch": 0.97, - "learning_rate": 1.6212850999417544e-06, - "loss": 2.251, - "step": 554840 + "epoch": 0.35, + "learning_rate": 3.2438042341451576e-05, + "loss": 2.7831, + "step": 98400 }, { - "epoch": 0.97, - "learning_rate": 1.6204131600149278e-06, - "loss": 2.2826, - "step": 554850 + "epoch": 0.35, + "learning_rate": 3.24201948235059e-05, + "loss": 2.778, + "step": 98500 }, { - "epoch": 0.97, - "learning_rate": 1.6195412200881009e-06, - "loss": 2.3082, - "step": 554860 + "epoch": 0.35, + "learning_rate": 3.240234730556022e-05, + "loss": 2.7847, + "step": 98600 }, { - "epoch": 0.97, - "learning_rate": 1.618669280161274e-06, - "loss": 2.2582, - "step": 554870 + "epoch": 0.35, + "learning_rate": 3.238449978761453e-05, + "loss": 2.7897, + "step": 98700 }, { - "epoch": 0.97, - "learning_rate": 1.6177973402344474e-06, - "loss": 2.1674, - "step": 554880 + "epoch": 0.35, + "learning_rate": 3.2366652269668855e-05, + "loss": 2.7819, + "step": 98800 }, { - "epoch": 0.97, - "learning_rate": 1.6169254003076205e-06, - "loss": 2.224, - "step": 554890 + "epoch": 0.35, + "learning_rate": 3.2348804751723176e-05, + "loss": 2.777, + "step": 98900 }, { - "epoch": 0.97, - "learning_rate": 1.6160534603807936e-06, - "loss": 2.2808, - "step": 554900 + "epoch": 0.35, + "learning_rate": 3.23309572337775e-05, + "loss": 2.7767, + "step": 99000 }, { - "epoch": 0.97, - "learning_rate": 1.6151815204539668e-06, - "loss": 2.2951, - "step": 554910 + "epoch": 0.35, + "learning_rate": 3.231310971583182e-05, + "loss": 2.7747, + "step": 99100 }, { - "epoch": 0.97, - "learning_rate": 1.6143095805271401e-06, - "loss": 2.2683, - "step": 554920 + "epoch": 0.35, + "learning_rate": 3.229526219788614e-05, + "loss": 2.7872, + "step": 99200 }, { - "epoch": 0.97, - "learning_rate": 1.6134376406003133e-06, - "loss": 2.2188, - "step": 554930 + "epoch": 0.35, + "learning_rate": 3.227741467994046e-05, + "loss": 2.7743, + "step": 99300 }, { - "epoch": 0.97, - "learning_rate": 1.6125657006734866e-06, - "loss": 2.2146, - "step": 554940 + "epoch": 0.35, + "learning_rate": 3.225956716199478e-05, + "loss": 2.7711, + "step": 99400 }, { - "epoch": 0.97, - "learning_rate": 1.6116937607466597e-06, - "loss": 2.3173, - "step": 554950 + "epoch": 0.36, + "learning_rate": 3.22417196440491e-05, + "loss": 2.7764, + "step": 99500 }, { - "epoch": 0.97, - "learning_rate": 1.6108218208198329e-06, - "loss": 2.2339, - "step": 554960 + "epoch": 0.36, + "learning_rate": 3.2223872126103424e-05, + "loss": 2.7801, + "step": 99600 }, { - "epoch": 0.97, - "learning_rate": 1.609949880893006e-06, - "loss": 2.1198, - "step": 554970 + "epoch": 0.36, + "learning_rate": 3.2206024608157745e-05, + "loss": 2.7806, + "step": 99700 }, { - "epoch": 0.97, - "learning_rate": 1.6090779409661794e-06, - "loss": 2.4139, - "step": 554980 + "epoch": 0.36, + "learning_rate": 3.218817709021207e-05, + "loss": 2.7855, + "step": 99800 }, { - "epoch": 0.97, - "learning_rate": 1.6082060010393525e-06, - "loss": 2.3212, - "step": 554990 + "epoch": 0.36, + "learning_rate": 3.217032957226639e-05, + "loss": 2.7787, + "step": 99900 }, { - "epoch": 0.97, - "learning_rate": 1.6073340611125256e-06, - "loss": 2.3449, - "step": 555000 + "epoch": 0.36, + "learning_rate": 3.215248205432071e-05, + "loss": 2.7816, + "step": 100000 }, { - "epoch": 0.97, - "learning_rate": 1.606462121185699e-06, - "loss": 2.2039, - "step": 555010 + "epoch": 0.36, + "learning_rate": 3.213463453637503e-05, + "loss": 2.7644, + "step": 100100 }, { - "epoch": 0.97, - "learning_rate": 1.605590181258872e-06, - "loss": 2.1972, - "step": 555020 + "epoch": 0.36, + "learning_rate": 3.211678701842935e-05, + "loss": 2.7853, + "step": 100200 }, { - "epoch": 0.97, - "learning_rate": 1.6047182413320452e-06, - "loss": 2.2929, - "step": 555030 + "epoch": 0.36, + "learning_rate": 3.209893950048367e-05, + "loss": 2.7787, + "step": 100300 }, { - "epoch": 0.97, - "learning_rate": 1.6038463014052184e-06, - "loss": 2.2426, - "step": 555040 + "epoch": 0.36, + "learning_rate": 3.2081091982537994e-05, + "loss": 2.7706, + "step": 100400 }, { - "epoch": 0.97, - "learning_rate": 1.6029743614783917e-06, - "loss": 2.3362, - "step": 555050 + "epoch": 0.36, + "learning_rate": 3.2063244464592315e-05, + "loss": 2.7756, + "step": 100500 }, { - "epoch": 0.97, - "learning_rate": 1.6021024215515649e-06, - "loss": 2.2201, - "step": 555060 + "epoch": 0.36, + "learning_rate": 3.2045396946646636e-05, + "loss": 2.7726, + "step": 100600 }, { - "epoch": 0.97, - "learning_rate": 1.6012304816247382e-06, - "loss": 2.2887, - "step": 555070 + "epoch": 0.36, + "learning_rate": 3.202754942870095e-05, + "loss": 2.7702, + "step": 100700 }, { - "epoch": 0.97, - "learning_rate": 1.6003585416979113e-06, - "loss": 2.2736, - "step": 555080 + "epoch": 0.36, + "learning_rate": 3.200970191075527e-05, + "loss": 2.7696, + "step": 100800 }, { - "epoch": 0.97, - "learning_rate": 1.5994866017710845e-06, - "loss": 2.257, - "step": 555090 + "epoch": 0.36, + "learning_rate": 3.199185439280959e-05, + "loss": 2.7758, + "step": 100900 }, { - "epoch": 0.97, - "learning_rate": 1.5986146618442576e-06, - "loss": 2.2901, - "step": 555100 + "epoch": 0.36, + "learning_rate": 3.1974006874863914e-05, + "loss": 2.7863, + "step": 101000 }, { - "epoch": 0.97, - "learning_rate": 1.5977427219174307e-06, - "loss": 2.2906, - "step": 555110 + "epoch": 0.36, + "learning_rate": 3.1956159356918236e-05, + "loss": 2.7811, + "step": 101100 }, { - "epoch": 0.97, - "learning_rate": 1.596870781990604e-06, - "loss": 2.129, - "step": 555120 + "epoch": 0.36, + "learning_rate": 3.193831183897256e-05, + "loss": 2.7844, + "step": 101200 }, { - "epoch": 0.97, - "learning_rate": 1.5959988420637772e-06, - "loss": 2.2973, - "step": 555130 + "epoch": 0.36, + "learning_rate": 3.192046432102688e-05, + "loss": 2.781, + "step": 101300 }, { - "epoch": 0.97, - "learning_rate": 1.5951269021369506e-06, - "loss": 2.2271, - "step": 555140 + "epoch": 0.36, + "learning_rate": 3.19026168030812e-05, + "loss": 2.7812, + "step": 101400 }, { - "epoch": 0.97, - "learning_rate": 1.5942549622101237e-06, - "loss": 2.2339, - "step": 555150 + "epoch": 0.36, + "learning_rate": 3.188476928513552e-05, + "loss": 2.7776, + "step": 101500 }, { - "epoch": 0.97, - "learning_rate": 1.5933830222832968e-06, - "loss": 2.3421, - "step": 555160 + "epoch": 0.36, + "learning_rate": 3.186692176718984e-05, + "loss": 2.7818, + "step": 101600 }, { - "epoch": 0.97, - "learning_rate": 1.59251108235647e-06, - "loss": 2.3837, - "step": 555170 + "epoch": 0.36, + "learning_rate": 3.184907424924416e-05, + "loss": 2.7723, + "step": 101700 }, { - "epoch": 0.97, - "learning_rate": 1.5916391424296433e-06, - "loss": 2.2561, - "step": 555180 + "epoch": 0.36, + "learning_rate": 3.183122673129848e-05, + "loss": 2.7708, + "step": 101800 }, { - "epoch": 0.97, - "learning_rate": 1.5907672025028165e-06, - "loss": 2.2621, - "step": 555190 + "epoch": 0.36, + "learning_rate": 3.18133792133528e-05, + "loss": 2.7878, + "step": 101900 }, { - "epoch": 0.97, - "learning_rate": 1.5898952625759898e-06, - "loss": 2.3197, - "step": 555200 + "epoch": 0.36, + "learning_rate": 3.179553169540712e-05, + "loss": 2.7813, + "step": 102000 }, { - "epoch": 0.97, - "learning_rate": 1.589023322649163e-06, - "loss": 2.2127, - "step": 555210 + "epoch": 0.36, + "learning_rate": 3.177768417746144e-05, + "loss": 2.7802, + "step": 102100 }, { - "epoch": 0.97, - "learning_rate": 1.588151382722336e-06, - "loss": 2.2264, - "step": 555220 + "epoch": 0.36, + "learning_rate": 3.175983665951576e-05, + "loss": 2.773, + "step": 102200 }, { - "epoch": 0.97, - "learning_rate": 1.5872794427955092e-06, - "loss": 2.3189, - "step": 555230 + "epoch": 0.37, + "learning_rate": 3.1741989141570083e-05, + "loss": 2.7742, + "step": 102300 }, { - "epoch": 0.97, - "learning_rate": 1.5864075028686823e-06, - "loss": 2.2904, - "step": 555240 + "epoch": 0.37, + "learning_rate": 3.1724141623624405e-05, + "loss": 2.7707, + "step": 102400 }, { - "epoch": 0.97, - "learning_rate": 1.5855355629418557e-06, - "loss": 2.2969, - "step": 555250 + "epoch": 0.37, + "learning_rate": 3.1706294105678726e-05, + "loss": 2.783, + "step": 102500 }, { - "epoch": 0.97, - "learning_rate": 1.584663623015029e-06, - "loss": 2.3153, - "step": 555260 + "epoch": 0.37, + "learning_rate": 3.168844658773305e-05, + "loss": 2.7739, + "step": 102600 }, { - "epoch": 0.97, - "learning_rate": 1.5837916830882022e-06, - "loss": 2.2445, - "step": 555270 + "epoch": 0.37, + "learning_rate": 3.167059906978737e-05, + "loss": 2.7649, + "step": 102700 }, { - "epoch": 0.97, - "learning_rate": 1.5829197431613753e-06, - "loss": 2.2881, - "step": 555280 + "epoch": 0.37, + "learning_rate": 3.165275155184169e-05, + "loss": 2.7831, + "step": 102800 }, { - "epoch": 0.97, - "learning_rate": 1.5820478032345484e-06, - "loss": 2.284, - "step": 555290 + "epoch": 0.37, + "learning_rate": 3.1634904033896004e-05, + "loss": 2.7838, + "step": 102900 }, { - "epoch": 0.97, - "learning_rate": 1.5811758633077216e-06, - "loss": 2.2476, - "step": 555300 + "epoch": 0.37, + "learning_rate": 3.1617056515950325e-05, + "loss": 2.7795, + "step": 103000 }, { - "epoch": 0.97, - "learning_rate": 1.5803039233808947e-06, - "loss": 2.207, - "step": 555310 + "epoch": 0.37, + "learning_rate": 3.1599208998004646e-05, + "loss": 2.7791, + "step": 103100 }, { - "epoch": 0.97, - "learning_rate": 1.579431983454068e-06, - "loss": 2.2626, - "step": 555320 + "epoch": 0.37, + "learning_rate": 3.158136148005897e-05, + "loss": 2.7725, + "step": 103200 }, { - "epoch": 0.97, - "learning_rate": 1.5785600435272414e-06, - "loss": 2.1805, - "step": 555330 + "epoch": 0.37, + "learning_rate": 3.156351396211329e-05, + "loss": 2.7783, + "step": 103300 }, { - "epoch": 0.97, - "learning_rate": 1.5776881036004145e-06, - "loss": 2.2812, - "step": 555340 + "epoch": 0.37, + "learning_rate": 3.154566644416761e-05, + "loss": 2.7832, + "step": 103400 }, { - "epoch": 0.97, - "learning_rate": 1.5768161636735877e-06, - "loss": 2.1062, - "step": 555350 + "epoch": 0.37, + "learning_rate": 3.152781892622193e-05, + "loss": 2.7692, + "step": 103500 }, { - "epoch": 0.97, - "learning_rate": 1.5759442237467608e-06, - "loss": 2.2624, - "step": 555360 + "epoch": 0.37, + "learning_rate": 3.150997140827625e-05, + "loss": 2.7771, + "step": 103600 }, { - "epoch": 0.97, - "learning_rate": 1.575072283819934e-06, - "loss": 2.2567, - "step": 555370 + "epoch": 0.37, + "learning_rate": 3.1492123890330574e-05, + "loss": 2.7737, + "step": 103700 }, { - "epoch": 0.97, - "learning_rate": 1.5742003438931073e-06, - "loss": 2.1279, - "step": 555380 + "epoch": 0.37, + "learning_rate": 3.1474276372384895e-05, + "loss": 2.7709, + "step": 103800 }, { - "epoch": 0.97, - "learning_rate": 1.5733284039662806e-06, - "loss": 2.2571, - "step": 555390 + "epoch": 0.37, + "learning_rate": 3.145642885443921e-05, + "loss": 2.768, + "step": 103900 }, { - "epoch": 0.97, - "learning_rate": 1.5724564640394538e-06, - "loss": 2.2348, - "step": 555400 + "epoch": 0.37, + "learning_rate": 3.143858133649353e-05, + "loss": 2.7733, + "step": 104000 }, { - "epoch": 0.97, - "learning_rate": 1.571584524112627e-06, - "loss": 2.3653, - "step": 555410 + "epoch": 0.37, + "learning_rate": 3.142073381854785e-05, + "loss": 2.7802, + "step": 104100 }, { - "epoch": 0.97, - "learning_rate": 1.5707125841858e-06, - "loss": 2.2842, - "step": 555420 + "epoch": 0.37, + "learning_rate": 3.140288630060217e-05, + "loss": 2.7794, + "step": 104200 }, { - "epoch": 0.97, - "learning_rate": 1.5698406442589732e-06, - "loss": 2.3318, - "step": 555430 + "epoch": 0.37, + "learning_rate": 3.1385038782656494e-05, + "loss": 2.764, + "step": 104300 }, { - "epoch": 0.97, - "learning_rate": 1.5689687043321463e-06, - "loss": 2.3517, - "step": 555440 + "epoch": 0.37, + "learning_rate": 3.1367191264710815e-05, + "loss": 2.7789, + "step": 104400 }, { - "epoch": 0.97, - "learning_rate": 1.5680967644053196e-06, - "loss": 2.2991, - "step": 555450 + "epoch": 0.37, + "learning_rate": 3.134934374676514e-05, + "loss": 2.7717, + "step": 104500 }, { - "epoch": 0.97, - "learning_rate": 1.567224824478493e-06, - "loss": 2.2404, - "step": 555460 + "epoch": 0.37, + "learning_rate": 3.133149622881946e-05, + "loss": 2.7823, + "step": 104600 }, { - "epoch": 0.97, - "learning_rate": 1.5663528845516661e-06, - "loss": 2.2132, - "step": 555470 + "epoch": 0.37, + "learning_rate": 3.1313648710873786e-05, + "loss": 2.7802, + "step": 104700 }, { - "epoch": 0.97, - "learning_rate": 1.5654809446248393e-06, - "loss": 2.2334, - "step": 555480 + "epoch": 0.37, + "learning_rate": 3.12958011929281e-05, + "loss": 2.771, + "step": 104800 }, { - "epoch": 0.97, - "learning_rate": 1.5646090046980124e-06, - "loss": 2.2079, - "step": 555490 + "epoch": 0.37, + "learning_rate": 3.127795367498242e-05, + "loss": 2.7752, + "step": 104900 }, { - "epoch": 0.97, - "learning_rate": 1.5637370647711855e-06, - "loss": 2.2957, - "step": 555500 + "epoch": 0.37, + "learning_rate": 3.126010615703674e-05, + "loss": 2.7721, + "step": 105000 }, { - "epoch": 0.97, - "learning_rate": 1.5628651248443587e-06, - "loss": 2.2932, - "step": 555510 + "epoch": 0.38, + "learning_rate": 3.1242258639091064e-05, + "loss": 2.7679, + "step": 105100 }, { - "epoch": 0.97, - "learning_rate": 1.561993184917532e-06, - "loss": 2.1311, - "step": 555520 + "epoch": 0.38, + "learning_rate": 3.1224411121145385e-05, + "loss": 2.7666, + "step": 105200 }, { - "epoch": 0.97, - "learning_rate": 1.5611212449907054e-06, - "loss": 2.1689, - "step": 555530 + "epoch": 0.38, + "learning_rate": 3.1206563603199706e-05, + "loss": 2.7789, + "step": 105300 }, { - "epoch": 0.97, - "learning_rate": 1.5602493050638785e-06, - "loss": 2.3365, - "step": 555540 + "epoch": 0.38, + "learning_rate": 3.118871608525403e-05, + "loss": 2.7649, + "step": 105400 }, { - "epoch": 0.97, - "learning_rate": 1.5593773651370516e-06, - "loss": 2.2702, - "step": 555550 + "epoch": 0.38, + "learning_rate": 3.117086856730835e-05, + "loss": 2.7786, + "step": 105500 }, { - "epoch": 0.97, - "learning_rate": 1.558505425210225e-06, - "loss": 2.3433, - "step": 555560 + "epoch": 0.38, + "learning_rate": 3.115302104936267e-05, + "loss": 2.7672, + "step": 105600 }, { - "epoch": 0.97, - "learning_rate": 1.5576334852833981e-06, - "loss": 2.3235, - "step": 555570 + "epoch": 0.38, + "learning_rate": 3.113517353141699e-05, + "loss": 2.772, + "step": 105700 }, { - "epoch": 0.97, - "learning_rate": 1.5567615453565712e-06, - "loss": 2.2545, - "step": 555580 + "epoch": 0.38, + "learning_rate": 3.111732601347131e-05, + "loss": 2.7773, + "step": 105800 }, { - "epoch": 0.97, - "learning_rate": 1.5558896054297444e-06, - "loss": 2.3105, - "step": 555590 + "epoch": 0.38, + "learning_rate": 3.109947849552563e-05, + "loss": 2.7653, + "step": 105900 }, { - "epoch": 0.97, - "learning_rate": 1.5550176655029177e-06, - "loss": 2.3016, - "step": 555600 + "epoch": 0.38, + "learning_rate": 3.108163097757995e-05, + "loss": 2.7805, + "step": 106000 }, { - "epoch": 0.97, - "learning_rate": 1.5541457255760909e-06, - "loss": 2.2619, - "step": 555610 + "epoch": 0.38, + "learning_rate": 3.106378345963427e-05, + "loss": 2.7822, + "step": 106100 }, { - "epoch": 0.97, - "learning_rate": 1.553273785649264e-06, - "loss": 2.2994, - "step": 555620 + "epoch": 0.38, + "learning_rate": 3.104593594168859e-05, + "loss": 2.7739, + "step": 106200 }, { - "epoch": 0.97, - "learning_rate": 1.5524018457224373e-06, - "loss": 2.2392, - "step": 555630 + "epoch": 0.38, + "learning_rate": 3.102808842374291e-05, + "loss": 2.7786, + "step": 106300 }, { - "epoch": 0.97, - "learning_rate": 1.5515299057956105e-06, - "loss": 2.3068, - "step": 555640 + "epoch": 0.38, + "learning_rate": 3.101024090579723e-05, + "loss": 2.7724, + "step": 106400 }, { - "epoch": 0.97, - "learning_rate": 1.5506579658687836e-06, - "loss": 2.2707, - "step": 555650 + "epoch": 0.38, + "learning_rate": 3.0992393387851554e-05, + "loss": 2.7703, + "step": 106500 }, { - "epoch": 0.97, - "learning_rate": 1.549786025941957e-06, - "loss": 2.242, - "step": 555660 + "epoch": 0.38, + "learning_rate": 3.0974545869905875e-05, + "loss": 2.7688, + "step": 106600 }, { - "epoch": 0.97, - "learning_rate": 1.54891408601513e-06, - "loss": 2.2699, - "step": 555670 + "epoch": 0.38, + "learning_rate": 3.0956698351960197e-05, + "loss": 2.7611, + "step": 106700 }, { - "epoch": 0.97, - "learning_rate": 1.5480421460883032e-06, - "loss": 2.3619, - "step": 555680 + "epoch": 0.38, + "learning_rate": 3.093885083401452e-05, + "loss": 2.7784, + "step": 106800 }, { - "epoch": 0.97, - "learning_rate": 1.5471702061614764e-06, - "loss": 2.2337, - "step": 555690 + "epoch": 0.38, + "learning_rate": 3.092100331606884e-05, + "loss": 2.7738, + "step": 106900 }, { - "epoch": 0.97, - "learning_rate": 1.5462982662346497e-06, - "loss": 2.2171, - "step": 555700 + "epoch": 0.38, + "learning_rate": 3.0903155798123153e-05, + "loss": 2.7673, + "step": 107000 }, { - "epoch": 0.97, - "learning_rate": 1.5454263263078228e-06, - "loss": 2.2539, - "step": 555710 + "epoch": 0.38, + "learning_rate": 3.0885308280177475e-05, + "loss": 2.7668, + "step": 107100 }, { - "epoch": 0.97, - "learning_rate": 1.544554386380996e-06, - "loss": 2.3429, - "step": 555720 + "epoch": 0.38, + "learning_rate": 3.0867460762231796e-05, + "loss": 2.7788, + "step": 107200 }, { - "epoch": 0.97, - "learning_rate": 1.5436824464541693e-06, - "loss": 2.281, - "step": 555730 + "epoch": 0.38, + "learning_rate": 3.084961324428612e-05, + "loss": 2.767, + "step": 107300 }, { - "epoch": 0.97, - "learning_rate": 1.5428105065273425e-06, - "loss": 2.3049, - "step": 555740 + "epoch": 0.38, + "learning_rate": 3.083176572634044e-05, + "loss": 2.7629, + "step": 107400 }, { - "epoch": 0.97, - "learning_rate": 1.5419385666005156e-06, - "loss": 2.1721, - "step": 555750 + "epoch": 0.38, + "learning_rate": 3.081391820839476e-05, + "loss": 2.7755, + "step": 107500 }, { - "epoch": 0.97, - "learning_rate": 1.541066626673689e-06, - "loss": 2.4376, - "step": 555760 + "epoch": 0.38, + "learning_rate": 3.079607069044908e-05, + "loss": 2.776, + "step": 107600 }, { - "epoch": 0.97, - "learning_rate": 1.540194686746862e-06, - "loss": 2.3109, - "step": 555770 + "epoch": 0.38, + "learning_rate": 3.07782231725034e-05, + "loss": 2.7787, + "step": 107700 }, { - "epoch": 0.97, - "learning_rate": 1.5393227468200352e-06, - "loss": 2.2443, - "step": 555780 + "epoch": 0.38, + "learning_rate": 3.076037565455772e-05, + "loss": 2.772, + "step": 107800 }, { - "epoch": 0.97, - "learning_rate": 1.5384508068932083e-06, - "loss": 2.1826, - "step": 555790 + "epoch": 0.39, + "learning_rate": 3.0742528136612044e-05, + "loss": 2.7732, + "step": 107900 }, { - "epoch": 0.97, - "learning_rate": 1.5375788669663817e-06, - "loss": 2.2966, - "step": 555800 + "epoch": 0.39, + "learning_rate": 3.0724680618666366e-05, + "loss": 2.7695, + "step": 108000 }, { - "epoch": 0.97, - "learning_rate": 1.5367069270395548e-06, - "loss": 2.2749, - "step": 555810 + "epoch": 0.39, + "learning_rate": 3.070683310072068e-05, + "loss": 2.7793, + "step": 108100 }, { - "epoch": 0.97, - "learning_rate": 1.535834987112728e-06, - "loss": 2.2512, - "step": 555820 + "epoch": 0.39, + "learning_rate": 3.0688985582775e-05, + "loss": 2.7695, + "step": 108200 }, { - "epoch": 0.97, - "learning_rate": 1.5349630471859013e-06, - "loss": 2.3076, - "step": 555830 + "epoch": 0.39, + "learning_rate": 3.067113806482932e-05, + "loss": 2.7743, + "step": 108300 }, { - "epoch": 0.97, - "learning_rate": 1.5340911072590744e-06, - "loss": 2.2531, - "step": 555840 + "epoch": 0.39, + "learning_rate": 3.0653290546883644e-05, + "loss": 2.7815, + "step": 108400 }, { - "epoch": 0.97, - "learning_rate": 1.5332191673322476e-06, - "loss": 2.2215, - "step": 555850 + "epoch": 0.39, + "learning_rate": 3.0635443028937965e-05, + "loss": 2.7798, + "step": 108500 }, { - "epoch": 0.97, - "learning_rate": 1.532347227405421e-06, - "loss": 2.2785, - "step": 555860 + "epoch": 0.39, + "learning_rate": 3.0617595510992286e-05, + "loss": 2.7774, + "step": 108600 }, { - "epoch": 0.97, - "learning_rate": 1.531475287478594e-06, - "loss": 2.2501, - "step": 555870 + "epoch": 0.39, + "learning_rate": 3.059974799304661e-05, + "loss": 2.7779, + "step": 108700 }, { - "epoch": 0.97, - "learning_rate": 1.5306033475517672e-06, - "loss": 2.3064, - "step": 555880 + "epoch": 0.39, + "learning_rate": 3.058190047510093e-05, + "loss": 2.7747, + "step": 108800 }, { - "epoch": 0.97, - "learning_rate": 1.5297314076249403e-06, - "loss": 2.2887, - "step": 555890 + "epoch": 0.39, + "learning_rate": 3.056405295715525e-05, + "loss": 2.7721, + "step": 108900 }, { - "epoch": 0.97, - "learning_rate": 1.5288594676981137e-06, - "loss": 2.3909, - "step": 555900 + "epoch": 0.39, + "learning_rate": 3.054620543920957e-05, + "loss": 2.7749, + "step": 109000 }, { - "epoch": 0.97, - "learning_rate": 1.5279875277712868e-06, - "loss": 2.2474, - "step": 555910 + "epoch": 0.39, + "learning_rate": 3.052835792126389e-05, + "loss": 2.767, + "step": 109100 }, { - "epoch": 0.97, - "learning_rate": 1.52711558784446e-06, - "loss": 2.3194, - "step": 555920 + "epoch": 0.39, + "learning_rate": 3.051051040331821e-05, + "loss": 2.7563, + "step": 109200 }, { - "epoch": 0.97, - "learning_rate": 1.5262436479176333e-06, - "loss": 2.1862, - "step": 555930 + "epoch": 0.39, + "learning_rate": 3.049266288537253e-05, + "loss": 2.7759, + "step": 109300 }, { - "epoch": 0.97, - "learning_rate": 1.5253717079908064e-06, - "loss": 2.2852, - "step": 555940 + "epoch": 0.39, + "learning_rate": 3.0474815367426852e-05, + "loss": 2.766, + "step": 109400 }, { - "epoch": 0.97, - "learning_rate": 1.5244997680639796e-06, - "loss": 2.21, - "step": 555950 + "epoch": 0.39, + "learning_rate": 3.045696784948117e-05, + "loss": 2.7694, + "step": 109500 }, { - "epoch": 0.97, - "learning_rate": 1.523627828137153e-06, - "loss": 2.2061, - "step": 555960 + "epoch": 0.39, + "learning_rate": 3.043912033153549e-05, + "loss": 2.7632, + "step": 109600 }, { - "epoch": 0.97, - "learning_rate": 1.522755888210326e-06, - "loss": 2.1962, - "step": 555970 + "epoch": 0.39, + "learning_rate": 3.0421272813589813e-05, + "loss": 2.7565, + "step": 109700 }, { - "epoch": 0.97, - "learning_rate": 1.5218839482834992e-06, - "loss": 2.3278, - "step": 555980 + "epoch": 0.39, + "learning_rate": 3.0403425295644137e-05, + "loss": 2.7679, + "step": 109800 }, { - "epoch": 0.97, - "learning_rate": 1.5210120083566723e-06, - "loss": 2.3555, - "step": 555990 + "epoch": 0.39, + "learning_rate": 3.038557777769846e-05, + "loss": 2.7621, + "step": 109900 }, { - "epoch": 0.97, - "learning_rate": 1.5201400684298456e-06, - "loss": 2.2766, - "step": 556000 + "epoch": 0.39, + "learning_rate": 3.036773025975278e-05, + "loss": 2.7688, + "step": 110000 }, { - "epoch": 0.97, - "learning_rate": 1.5192681285030188e-06, - "loss": 2.2627, - "step": 556010 + "epoch": 0.39, + "learning_rate": 3.03498827418071e-05, + "loss": 2.7615, + "step": 110100 }, { - "epoch": 0.97, - "learning_rate": 1.518396188576192e-06, - "loss": 2.2313, - "step": 556020 + "epoch": 0.39, + "learning_rate": 3.0332035223861422e-05, + "loss": 2.7697, + "step": 110200 }, { - "epoch": 0.97, - "learning_rate": 1.5175242486493653e-06, - "loss": 2.264, - "step": 556030 + "epoch": 0.39, + "learning_rate": 3.0314187705915743e-05, + "loss": 2.7759, + "step": 110300 }, { - "epoch": 0.97, - "learning_rate": 1.5166523087225384e-06, - "loss": 2.2079, - "step": 556040 + "epoch": 0.39, + "learning_rate": 3.029634018797006e-05, + "loss": 2.7709, + "step": 110400 }, { - "epoch": 0.97, - "learning_rate": 1.5157803687957115e-06, - "loss": 2.3158, - "step": 556050 + "epoch": 0.39, + "learning_rate": 3.0278492670024382e-05, + "loss": 2.7642, + "step": 110500 }, { - "epoch": 0.97, - "learning_rate": 1.5149084288688849e-06, - "loss": 2.2848, - "step": 556060 + "epoch": 0.39, + "learning_rate": 3.0260645152078704e-05, + "loss": 2.764, + "step": 110600 }, { - "epoch": 0.97, - "learning_rate": 1.514036488942058e-06, - "loss": 2.2374, - "step": 556070 + "epoch": 0.4, + "learning_rate": 3.0242797634133025e-05, + "loss": 2.7764, + "step": 110700 }, { - "epoch": 0.97, - "learning_rate": 1.5131645490152312e-06, - "loss": 2.2489, - "step": 556080 + "epoch": 0.4, + "learning_rate": 3.0224950116187346e-05, + "loss": 2.7683, + "step": 110800 }, { - "epoch": 0.97, - "learning_rate": 1.5122926090884043e-06, - "loss": 2.2706, - "step": 556090 + "epoch": 0.4, + "learning_rate": 3.0207102598241664e-05, + "loss": 2.7657, + "step": 110900 }, { - "epoch": 0.97, - "learning_rate": 1.5114206691615776e-06, - "loss": 2.3939, - "step": 556100 + "epoch": 0.4, + "learning_rate": 3.0189255080295985e-05, + "loss": 2.7731, + "step": 111000 }, { - "epoch": 0.97, - "learning_rate": 1.5105487292347508e-06, - "loss": 2.3169, - "step": 556110 + "epoch": 0.4, + "learning_rate": 3.0171407562350306e-05, + "loss": 2.7703, + "step": 111100 }, { - "epoch": 0.97, - "learning_rate": 1.509676789307924e-06, - "loss": 2.2499, - "step": 556120 + "epoch": 0.4, + "learning_rate": 3.0153560044404628e-05, + "loss": 2.7718, + "step": 111200 }, { - "epoch": 0.97, - "learning_rate": 1.5088048493810972e-06, - "loss": 2.1636, - "step": 556130 + "epoch": 0.4, + "learning_rate": 3.013571252645895e-05, + "loss": 2.7739, + "step": 111300 }, { - "epoch": 0.97, - "learning_rate": 1.5079329094542704e-06, - "loss": 2.1416, - "step": 556140 + "epoch": 0.4, + "learning_rate": 3.011786500851327e-05, + "loss": 2.7715, + "step": 111400 }, { - "epoch": 0.97, - "learning_rate": 1.5070609695274435e-06, - "loss": 2.2278, - "step": 556150 + "epoch": 0.4, + "learning_rate": 3.0100017490567588e-05, + "loss": 2.7594, + "step": 111500 }, { - "epoch": 0.97, - "learning_rate": 1.5061890296006169e-06, - "loss": 2.1529, - "step": 556160 + "epoch": 0.4, + "learning_rate": 3.008216997262191e-05, + "loss": 2.7705, + "step": 111600 }, { - "epoch": 0.97, - "learning_rate": 1.50531708967379e-06, - "loss": 2.2838, - "step": 556170 + "epoch": 0.4, + "learning_rate": 3.006432245467623e-05, + "loss": 2.7714, + "step": 111700 }, { - "epoch": 0.97, - "learning_rate": 1.5044451497469631e-06, - "loss": 2.2997, - "step": 556180 + "epoch": 0.4, + "learning_rate": 3.004647493673055e-05, + "loss": 2.7601, + "step": 111800 }, { - "epoch": 0.97, - "learning_rate": 1.5035732098201363e-06, - "loss": 2.2549, - "step": 556190 + "epoch": 0.4, + "learning_rate": 3.0028627418784873e-05, + "loss": 2.7659, + "step": 111900 }, { - "epoch": 0.97, - "learning_rate": 1.5027012698933096e-06, - "loss": 2.2632, - "step": 556200 + "epoch": 0.4, + "learning_rate": 3.001077990083919e-05, + "loss": 2.7733, + "step": 112000 }, { - "epoch": 0.97, - "learning_rate": 1.5018293299664827e-06, - "loss": 2.2286, - "step": 556210 + "epoch": 0.4, + "learning_rate": 2.9992932382893512e-05, + "loss": 2.7685, + "step": 112100 }, { - "epoch": 0.97, - "learning_rate": 1.5009573900396559e-06, - "loss": 2.2266, - "step": 556220 + "epoch": 0.4, + "learning_rate": 2.9975084864947833e-05, + "loss": 2.7684, + "step": 112200 }, { - "epoch": 0.97, - "learning_rate": 1.5000854501128292e-06, - "loss": 2.1704, - "step": 556230 + "epoch": 0.4, + "learning_rate": 2.9957237347002154e-05, + "loss": 2.7722, + "step": 112300 }, { - "epoch": 0.97, - "learning_rate": 1.4992135101860024e-06, - "loss": 2.196, - "step": 556240 + "epoch": 0.4, + "learning_rate": 2.9939389829056475e-05, + "loss": 2.7639, + "step": 112400 }, { - "epoch": 0.97, - "learning_rate": 1.4983415702591755e-06, - "loss": 2.0888, - "step": 556250 + "epoch": 0.4, + "learning_rate": 2.9921542311110797e-05, + "loss": 2.7693, + "step": 112500 }, { - "epoch": 0.97, - "learning_rate": 1.4974696303323488e-06, - "loss": 2.346, - "step": 556260 + "epoch": 0.4, + "learning_rate": 2.9903694793165114e-05, + "loss": 2.759, + "step": 112600 }, { - "epoch": 0.97, - "learning_rate": 1.496597690405522e-06, - "loss": 2.2748, - "step": 556270 + "epoch": 0.4, + "learning_rate": 2.9885847275219436e-05, + "loss": 2.7726, + "step": 112700 }, { - "epoch": 0.97, - "learning_rate": 1.4957257504786951e-06, - "loss": 2.3429, - "step": 556280 + "epoch": 0.4, + "learning_rate": 2.9867999757273757e-05, + "loss": 2.7667, + "step": 112800 }, { - "epoch": 0.97, - "learning_rate": 1.4948538105518682e-06, - "loss": 2.2014, - "step": 556290 + "epoch": 0.4, + "learning_rate": 2.9850152239328078e-05, + "loss": 2.7621, + "step": 112900 }, { - "epoch": 0.97, - "learning_rate": 1.4939818706250416e-06, - "loss": 2.2558, - "step": 556300 + "epoch": 0.4, + "learning_rate": 2.98323047213824e-05, + "loss": 2.772, + "step": 113000 }, { - "epoch": 0.97, - "learning_rate": 1.4931099306982147e-06, - "loss": 2.3525, - "step": 556310 + "epoch": 0.4, + "learning_rate": 2.9814457203436717e-05, + "loss": 2.7647, + "step": 113100 }, { - "epoch": 0.97, - "learning_rate": 1.4922379907713879e-06, - "loss": 2.2544, - "step": 556320 + "epoch": 0.4, + "learning_rate": 2.9796609685491038e-05, + "loss": 2.7604, + "step": 113200 }, { - "epoch": 0.97, - "learning_rate": 1.4913660508445612e-06, - "loss": 2.2916, - "step": 556330 + "epoch": 0.4, + "learning_rate": 2.977876216754536e-05, + "loss": 2.7798, + "step": 113300 }, { - "epoch": 0.97, - "learning_rate": 1.4904941109177343e-06, - "loss": 2.231, - "step": 556340 + "epoch": 0.4, + "learning_rate": 2.976091464959968e-05, + "loss": 2.7606, + "step": 113400 }, { - "epoch": 0.97, - "learning_rate": 1.4896221709909075e-06, - "loss": 2.2176, - "step": 556350 + "epoch": 0.41, + "learning_rate": 2.9743067131654002e-05, + "loss": 2.7628, + "step": 113500 }, { - "epoch": 0.97, - "learning_rate": 1.4887502310640808e-06, - "loss": 2.2391, - "step": 556360 + "epoch": 0.41, + "learning_rate": 2.9725219613708323e-05, + "loss": 2.7717, + "step": 113600 }, { - "epoch": 0.97, - "learning_rate": 1.487878291137254e-06, - "loss": 2.2239, - "step": 556370 + "epoch": 0.41, + "learning_rate": 2.970737209576264e-05, + "loss": 2.7719, + "step": 113700 }, { - "epoch": 0.97, - "learning_rate": 1.487006351210427e-06, - "loss": 2.1511, - "step": 556380 + "epoch": 0.41, + "learning_rate": 2.9689524577816962e-05, + "loss": 2.7632, + "step": 113800 }, { - "epoch": 0.97, - "learning_rate": 1.4861344112836002e-06, - "loss": 2.3223, - "step": 556390 + "epoch": 0.41, + "learning_rate": 2.9671677059871283e-05, + "loss": 2.7752, + "step": 113900 }, { - "epoch": 0.97, - "learning_rate": 1.4852624713567736e-06, - "loss": 2.2759, - "step": 556400 + "epoch": 0.41, + "learning_rate": 2.9653829541925605e-05, + "loss": 2.7617, + "step": 114000 }, { - "epoch": 0.97, - "learning_rate": 1.4843905314299467e-06, - "loss": 2.2577, - "step": 556410 + "epoch": 0.41, + "learning_rate": 2.9635982023979926e-05, + "loss": 2.7669, + "step": 114100 }, { - "epoch": 0.97, - "learning_rate": 1.4835185915031198e-06, - "loss": 2.168, - "step": 556420 + "epoch": 0.41, + "learning_rate": 2.9618134506034244e-05, + "loss": 2.7616, + "step": 114200 }, { - "epoch": 0.97, - "learning_rate": 1.4826466515762932e-06, - "loss": 2.2506, - "step": 556430 + "epoch": 0.41, + "learning_rate": 2.9600286988088565e-05, + "loss": 2.7716, + "step": 114300 }, { - "epoch": 0.97, - "learning_rate": 1.4817747116494663e-06, - "loss": 2.2292, - "step": 556440 + "epoch": 0.41, + "learning_rate": 2.9582439470142886e-05, + "loss": 2.7509, + "step": 114400 }, { - "epoch": 0.97, - "learning_rate": 1.4809027717226395e-06, - "loss": 2.2864, - "step": 556450 + "epoch": 0.41, + "learning_rate": 2.9564591952197207e-05, + "loss": 2.7704, + "step": 114500 }, { - "epoch": 0.97, - "learning_rate": 1.4800308317958128e-06, - "loss": 2.1869, - "step": 556460 + "epoch": 0.41, + "learning_rate": 2.954674443425153e-05, + "loss": 2.7653, + "step": 114600 }, { - "epoch": 0.97, - "learning_rate": 1.479158891868986e-06, - "loss": 2.3212, - "step": 556470 + "epoch": 0.41, + "learning_rate": 2.952889691630585e-05, + "loss": 2.7519, + "step": 114700 }, { - "epoch": 0.97, - "learning_rate": 1.478286951942159e-06, - "loss": 2.3397, - "step": 556480 + "epoch": 0.41, + "learning_rate": 2.9511049398360168e-05, + "loss": 2.7644, + "step": 114800 }, { - "epoch": 0.97, - "learning_rate": 1.4774150120153322e-06, - "loss": 2.3069, - "step": 556490 + "epoch": 0.41, + "learning_rate": 2.9493201880414496e-05, + "loss": 2.7755, + "step": 114900 }, { - "epoch": 0.97, - "learning_rate": 1.4765430720885056e-06, - "loss": 2.2283, - "step": 556500 + "epoch": 0.41, + "learning_rate": 2.9475354362468817e-05, + "loss": 2.7644, + "step": 115000 }, { - "epoch": 0.97, - "learning_rate": 1.4756711321616787e-06, - "loss": 2.2471, - "step": 556510 + "epoch": 0.41, + "learning_rate": 2.9457506844523135e-05, + "loss": 2.7642, + "step": 115100 }, { - "epoch": 0.97, - "learning_rate": 1.4747991922348518e-06, - "loss": 2.1821, - "step": 556520 + "epoch": 0.41, + "learning_rate": 2.9439659326577456e-05, + "loss": 2.7685, + "step": 115200 }, { - "epoch": 0.97, - "learning_rate": 1.4739272523080252e-06, - "loss": 2.2605, - "step": 556530 + "epoch": 0.41, + "learning_rate": 2.9421811808631777e-05, + "loss": 2.7611, + "step": 115300 }, { - "epoch": 0.97, - "learning_rate": 1.4730553123811983e-06, - "loss": 2.2762, - "step": 556540 + "epoch": 0.41, + "learning_rate": 2.9403964290686098e-05, + "loss": 2.7727, + "step": 115400 }, { - "epoch": 0.97, - "learning_rate": 1.4721833724543714e-06, - "loss": 2.2054, - "step": 556550 + "epoch": 0.41, + "learning_rate": 2.938611677274042e-05, + "loss": 2.7658, + "step": 115500 }, { - "epoch": 0.97, - "learning_rate": 1.4713114325275448e-06, - "loss": 2.2169, - "step": 556560 + "epoch": 0.41, + "learning_rate": 2.936826925479474e-05, + "loss": 2.7597, + "step": 115600 }, { - "epoch": 0.97, - "learning_rate": 1.470439492600718e-06, - "loss": 2.2147, - "step": 556570 + "epoch": 0.41, + "learning_rate": 2.935042173684906e-05, + "loss": 2.761, + "step": 115700 }, { - "epoch": 0.97, - "learning_rate": 1.469567552673891e-06, - "loss": 2.3589, - "step": 556580 + "epoch": 0.41, + "learning_rate": 2.933257421890338e-05, + "loss": 2.7679, + "step": 115800 }, { - "epoch": 0.97, - "learning_rate": 1.4686956127470642e-06, - "loss": 2.2304, - "step": 556590 + "epoch": 0.41, + "learning_rate": 2.93147267009577e-05, + "loss": 2.7595, + "step": 115900 }, { - "epoch": 0.97, - "learning_rate": 1.4678236728202375e-06, - "loss": 2.2363, - "step": 556600 + "epoch": 0.41, + "learning_rate": 2.9296879183012022e-05, + "loss": 2.7625, + "step": 116000 }, { - "epoch": 0.97, - "learning_rate": 1.4669517328934107e-06, - "loss": 2.2838, - "step": 556610 + "epoch": 0.41, + "learning_rate": 2.9279031665066343e-05, + "loss": 2.7687, + "step": 116100 }, { - "epoch": 0.97, - "learning_rate": 1.4660797929665838e-06, - "loss": 2.2719, - "step": 556620 + "epoch": 0.41, + "learning_rate": 2.926118414712066e-05, + "loss": 2.7706, + "step": 116200 }, { - "epoch": 0.97, - "learning_rate": 1.4652078530397572e-06, - "loss": 2.2487, - "step": 556630 + "epoch": 0.42, + "learning_rate": 2.9243336629174982e-05, + "loss": 2.7599, + "step": 116300 }, { - "epoch": 0.97, - "learning_rate": 1.4643359131129303e-06, - "loss": 2.2318, - "step": 556640 + "epoch": 0.42, + "learning_rate": 2.9225489111229304e-05, + "loss": 2.7678, + "step": 116400 }, { - "epoch": 0.97, - "learning_rate": 1.4634639731861034e-06, - "loss": 2.2873, - "step": 556650 + "epoch": 0.42, + "learning_rate": 2.9207641593283625e-05, + "loss": 2.7669, + "step": 116500 }, { - "epoch": 0.97, - "learning_rate": 1.4625920332592768e-06, - "loss": 2.2771, - "step": 556660 + "epoch": 0.42, + "learning_rate": 2.9189794075337946e-05, + "loss": 2.7563, + "step": 116600 }, { - "epoch": 0.97, - "learning_rate": 1.46172009333245e-06, - "loss": 2.1261, - "step": 556670 + "epoch": 0.42, + "learning_rate": 2.9171946557392267e-05, + "loss": 2.7615, + "step": 116700 }, { - "epoch": 0.97, - "learning_rate": 1.460848153405623e-06, - "loss": 2.3138, - "step": 556680 + "epoch": 0.42, + "learning_rate": 2.9154099039446585e-05, + "loss": 2.7517, + "step": 116800 }, { - "epoch": 0.97, - "learning_rate": 1.4599762134787962e-06, - "loss": 2.1783, - "step": 556690 + "epoch": 0.42, + "learning_rate": 2.9136251521500906e-05, + "loss": 2.7608, + "step": 116900 }, { - "epoch": 0.97, - "learning_rate": 1.4591042735519695e-06, - "loss": 2.2976, - "step": 556700 + "epoch": 0.42, + "learning_rate": 2.9118404003555228e-05, + "loss": 2.769, + "step": 117000 }, { - "epoch": 0.97, - "learning_rate": 1.4582323336251427e-06, - "loss": 2.2825, - "step": 556710 + "epoch": 0.42, + "learning_rate": 2.910055648560955e-05, + "loss": 2.7616, + "step": 117100 }, { - "epoch": 0.97, - "learning_rate": 1.4573603936983158e-06, - "loss": 2.2415, - "step": 556720 + "epoch": 0.42, + "learning_rate": 2.908270896766387e-05, + "loss": 2.7562, + "step": 117200 }, { - "epoch": 0.97, - "learning_rate": 1.4564884537714891e-06, - "loss": 2.2896, - "step": 556730 + "epoch": 0.42, + "learning_rate": 2.9064861449718188e-05, + "loss": 2.7626, + "step": 117300 }, { - "epoch": 0.97, - "learning_rate": 1.4556165138446623e-06, - "loss": 2.2563, - "step": 556740 + "epoch": 0.42, + "learning_rate": 2.904701393177251e-05, + "loss": 2.7589, + "step": 117400 }, { - "epoch": 0.97, - "learning_rate": 1.4547445739178354e-06, - "loss": 2.2992, - "step": 556750 + "epoch": 0.42, + "learning_rate": 2.902916641382683e-05, + "loss": 2.7657, + "step": 117500 }, { - "epoch": 0.97, - "learning_rate": 1.4538726339910088e-06, - "loss": 2.3119, - "step": 556760 + "epoch": 0.42, + "learning_rate": 2.901131889588115e-05, + "loss": 2.7595, + "step": 117600 }, { - "epoch": 0.97, - "learning_rate": 1.4530006940641819e-06, - "loss": 2.3751, - "step": 556770 + "epoch": 0.42, + "learning_rate": 2.8993471377935473e-05, + "loss": 2.7686, + "step": 117700 }, { - "epoch": 0.97, - "learning_rate": 1.452128754137355e-06, - "loss": 2.1475, - "step": 556780 + "epoch": 0.42, + "learning_rate": 2.8975623859989794e-05, + "loss": 2.7624, + "step": 117800 }, { - "epoch": 0.97, - "learning_rate": 1.4512568142105282e-06, - "loss": 2.2757, - "step": 556790 + "epoch": 0.42, + "learning_rate": 2.895777634204411e-05, + "loss": 2.7675, + "step": 117900 }, { - "epoch": 0.97, - "learning_rate": 1.4503848742837015e-06, - "loss": 2.2821, - "step": 556800 + "epoch": 0.42, + "learning_rate": 2.8939928824098433e-05, + "loss": 2.759, + "step": 118000 }, { - "epoch": 0.97, - "learning_rate": 1.4495129343568746e-06, - "loss": 2.1999, - "step": 556810 + "epoch": 0.42, + "learning_rate": 2.8922081306152754e-05, + "loss": 2.7601, + "step": 118100 }, { - "epoch": 0.97, - "learning_rate": 1.4486409944300478e-06, - "loss": 2.3075, - "step": 556820 + "epoch": 0.42, + "learning_rate": 2.8904233788207075e-05, + "loss": 2.7665, + "step": 118200 }, { - "epoch": 0.97, - "learning_rate": 1.4477690545032211e-06, - "loss": 2.1464, - "step": 556830 + "epoch": 0.42, + "learning_rate": 2.8886386270261397e-05, + "loss": 2.7626, + "step": 118300 }, { - "epoch": 0.97, - "learning_rate": 1.4468971145763943e-06, - "loss": 2.3657, - "step": 556840 + "epoch": 0.42, + "learning_rate": 2.8868538752315714e-05, + "loss": 2.7513, + "step": 118400 }, { - "epoch": 0.97, - "learning_rate": 1.4460251746495674e-06, - "loss": 2.2333, - "step": 556850 + "epoch": 0.42, + "learning_rate": 2.8850691234370036e-05, + "loss": 2.7645, + "step": 118500 }, { - "epoch": 0.97, - "learning_rate": 1.4451532347227407e-06, - "loss": 2.2439, - "step": 556860 + "epoch": 0.42, + "learning_rate": 2.8832843716424357e-05, + "loss": 2.7585, + "step": 118600 }, { - "epoch": 0.97, - "learning_rate": 1.4442812947959139e-06, - "loss": 2.1618, - "step": 556870 + "epoch": 0.42, + "learning_rate": 2.8814996198478678e-05, + "loss": 2.7556, + "step": 118700 }, { - "epoch": 0.97, - "learning_rate": 1.443409354869087e-06, - "loss": 2.2677, - "step": 556880 + "epoch": 0.42, + "learning_rate": 2.8797148680533e-05, + "loss": 2.7694, + "step": 118800 }, { - "epoch": 0.97, - "learning_rate": 1.4425374149422601e-06, - "loss": 2.2772, - "step": 556890 + "epoch": 0.42, + "learning_rate": 2.877930116258732e-05, + "loss": 2.7676, + "step": 118900 }, { - "epoch": 0.97, - "learning_rate": 1.4416654750154335e-06, - "loss": 2.2589, - "step": 556900 + "epoch": 0.42, + "learning_rate": 2.8761453644641638e-05, + "loss": 2.7649, + "step": 119000 }, { - "epoch": 0.97, - "learning_rate": 1.4407935350886066e-06, - "loss": 2.2198, - "step": 556910 + "epoch": 0.43, + "learning_rate": 2.874360612669596e-05, + "loss": 2.7552, + "step": 119100 }, { - "epoch": 0.97, - "learning_rate": 1.4399215951617798e-06, - "loss": 2.1906, - "step": 556920 + "epoch": 0.43, + "learning_rate": 2.872575860875028e-05, + "loss": 2.7612, + "step": 119200 }, { - "epoch": 0.97, - "learning_rate": 1.439049655234953e-06, - "loss": 2.3355, - "step": 556930 + "epoch": 0.43, + "learning_rate": 2.8707911090804602e-05, + "loss": 2.7602, + "step": 119300 }, { - "epoch": 0.97, - "learning_rate": 1.4381777153081262e-06, - "loss": 2.1785, - "step": 556940 + "epoch": 0.43, + "learning_rate": 2.8690063572858923e-05, + "loss": 2.7551, + "step": 119400 }, { - "epoch": 0.97, - "learning_rate": 1.4373057753812994e-06, - "loss": 2.2304, - "step": 556950 + "epoch": 0.43, + "learning_rate": 2.867221605491324e-05, + "loss": 2.7676, + "step": 119500 }, { - "epoch": 0.97, - "learning_rate": 1.4364338354544727e-06, - "loss": 2.3393, - "step": 556960 + "epoch": 0.43, + "learning_rate": 2.8654368536967562e-05, + "loss": 2.7624, + "step": 119600 }, { - "epoch": 0.97, - "learning_rate": 1.4355618955276459e-06, - "loss": 2.3296, - "step": 556970 + "epoch": 0.43, + "learning_rate": 2.8636521019021883e-05, + "loss": 2.7723, + "step": 119700 }, { - "epoch": 0.97, - "learning_rate": 1.434689955600819e-06, - "loss": 2.1528, - "step": 556980 + "epoch": 0.43, + "learning_rate": 2.8618673501076205e-05, + "loss": 2.754, + "step": 119800 }, { - "epoch": 0.97, - "learning_rate": 1.4338180156739923e-06, - "loss": 2.1813, - "step": 556990 + "epoch": 0.43, + "learning_rate": 2.8600825983130526e-05, + "loss": 2.763, + "step": 119900 }, { - "epoch": 0.97, - "learning_rate": 1.4329460757471655e-06, - "loss": 2.2529, - "step": 557000 + "epoch": 0.43, + "learning_rate": 2.8582978465184847e-05, + "loss": 2.7562, + "step": 120000 }, { - "epoch": 0.97, - "learning_rate": 1.4320741358203386e-06, - "loss": 2.2411, - "step": 557010 + "epoch": 0.43, + "learning_rate": 2.856513094723917e-05, + "loss": 2.7504, + "step": 120100 }, { - "epoch": 0.97, - "learning_rate": 1.4312021958935117e-06, - "loss": 2.2884, - "step": 557020 + "epoch": 0.43, + "learning_rate": 2.8547283429293493e-05, + "loss": 2.7601, + "step": 120200 }, { - "epoch": 0.97, - "learning_rate": 1.430330255966685e-06, - "loss": 2.2115, - "step": 557030 + "epoch": 0.43, + "learning_rate": 2.8529435911347814e-05, + "loss": 2.7528, + "step": 120300 }, { - "epoch": 0.97, - "learning_rate": 1.4294583160398582e-06, - "loss": 2.1466, - "step": 557040 + "epoch": 0.43, + "learning_rate": 2.8511588393402132e-05, + "loss": 2.7636, + "step": 120400 }, { - "epoch": 0.97, - "learning_rate": 1.4285863761130314e-06, - "loss": 2.3351, - "step": 557050 + "epoch": 0.43, + "learning_rate": 2.8493740875456453e-05, + "loss": 2.7589, + "step": 120500 }, { - "epoch": 0.97, - "learning_rate": 1.4277144361862047e-06, - "loss": 2.2066, - "step": 557060 + "epoch": 0.43, + "learning_rate": 2.8475893357510774e-05, + "loss": 2.7598, + "step": 120600 }, { - "epoch": 0.97, - "learning_rate": 1.4268424962593778e-06, - "loss": 2.3266, - "step": 557070 + "epoch": 0.43, + "learning_rate": 2.8458045839565096e-05, + "loss": 2.7556, + "step": 120700 }, { - "epoch": 0.97, - "learning_rate": 1.425970556332551e-06, - "loss": 2.234, - "step": 557080 + "epoch": 0.43, + "learning_rate": 2.8440198321619417e-05, + "loss": 2.757, + "step": 120800 }, { - "epoch": 0.97, - "learning_rate": 1.4250986164057243e-06, - "loss": 2.2568, - "step": 557090 + "epoch": 0.43, + "learning_rate": 2.8422350803673735e-05, + "loss": 2.7574, + "step": 120900 }, { - "epoch": 0.97, - "learning_rate": 1.4242266764788974e-06, - "loss": 2.232, - "step": 557100 + "epoch": 0.43, + "learning_rate": 2.8404503285728056e-05, + "loss": 2.7673, + "step": 121000 }, { - "epoch": 0.97, - "learning_rate": 1.4233547365520706e-06, - "loss": 2.335, - "step": 557110 + "epoch": 0.43, + "learning_rate": 2.8386655767782377e-05, + "loss": 2.7559, + "step": 121100 }, { - "epoch": 0.97, - "learning_rate": 1.4224827966252437e-06, - "loss": 2.2722, - "step": 557120 + "epoch": 0.43, + "learning_rate": 2.8368808249836698e-05, + "loss": 2.7568, + "step": 121200 }, { - "epoch": 0.97, - "learning_rate": 1.421610856698417e-06, - "loss": 2.366, - "step": 557130 + "epoch": 0.43, + "learning_rate": 2.835096073189102e-05, + "loss": 2.7604, + "step": 121300 }, { - "epoch": 0.97, - "learning_rate": 1.4207389167715902e-06, - "loss": 2.2835, - "step": 557140 + "epoch": 0.43, + "learning_rate": 2.833311321394534e-05, + "loss": 2.7564, + "step": 121400 }, { - "epoch": 0.97, - "learning_rate": 1.4198669768447633e-06, - "loss": 2.3118, - "step": 557150 + "epoch": 0.43, + "learning_rate": 2.831526569599966e-05, + "loss": 2.7626, + "step": 121500 }, { - "epoch": 0.97, - "learning_rate": 1.4189950369179367e-06, - "loss": 2.2839, - "step": 557160 + "epoch": 0.43, + "learning_rate": 2.829741817805398e-05, + "loss": 2.7636, + "step": 121600 }, { - "epoch": 0.97, - "learning_rate": 1.4181230969911098e-06, - "loss": 2.3092, - "step": 557170 + "epoch": 0.43, + "learning_rate": 2.82795706601083e-05, + "loss": 2.7605, + "step": 121700 }, { - "epoch": 0.97, - "learning_rate": 1.417251157064283e-06, - "loss": 2.1787, - "step": 557180 + "epoch": 0.43, + "learning_rate": 2.8261723142162622e-05, + "loss": 2.7583, + "step": 121800 }, { - "epoch": 0.97, - "learning_rate": 1.4163792171374563e-06, - "loss": 2.271, - "step": 557190 + "epoch": 0.44, + "learning_rate": 2.8243875624216943e-05, + "loss": 2.7727, + "step": 121900 }, { - "epoch": 0.97, - "learning_rate": 1.4155072772106294e-06, - "loss": 2.2317, - "step": 557200 + "epoch": 0.44, + "learning_rate": 2.822602810627126e-05, + "loss": 2.7519, + "step": 122000 }, { - "epoch": 0.97, - "learning_rate": 1.4146353372838026e-06, - "loss": 2.2617, - "step": 557210 + "epoch": 0.44, + "learning_rate": 2.8208180588325582e-05, + "loss": 2.7585, + "step": 122100 }, { - "epoch": 0.97, - "learning_rate": 1.4137633973569757e-06, - "loss": 2.3213, - "step": 557220 + "epoch": 0.44, + "learning_rate": 2.8190333070379904e-05, + "loss": 2.7645, + "step": 122200 }, { - "epoch": 0.97, - "learning_rate": 1.412891457430149e-06, - "loss": 2.2165, - "step": 557230 + "epoch": 0.44, + "learning_rate": 2.8172485552434225e-05, + "loss": 2.7689, + "step": 122300 }, { - "epoch": 0.97, - "learning_rate": 1.4120195175033222e-06, - "loss": 2.3584, - "step": 557240 + "epoch": 0.44, + "learning_rate": 2.8154638034488546e-05, + "loss": 2.7523, + "step": 122400 }, { - "epoch": 0.97, - "learning_rate": 1.4111475775764953e-06, - "loss": 2.27, - "step": 557250 + "epoch": 0.44, + "learning_rate": 2.8136790516542867e-05, + "loss": 2.7602, + "step": 122500 }, { - "epoch": 0.97, - "learning_rate": 1.4102756376496687e-06, - "loss": 2.2048, - "step": 557260 + "epoch": 0.44, + "learning_rate": 2.8118942998597185e-05, + "loss": 2.756, + "step": 122600 }, { - "epoch": 0.97, - "learning_rate": 1.4094036977228418e-06, - "loss": 2.2289, - "step": 557270 + "epoch": 0.44, + "learning_rate": 2.8101095480651506e-05, + "loss": 2.7626, + "step": 122700 }, { - "epoch": 0.97, - "learning_rate": 1.408531757796015e-06, - "loss": 2.3524, - "step": 557280 + "epoch": 0.44, + "learning_rate": 2.8083247962705828e-05, + "loss": 2.7616, + "step": 122800 }, { - "epoch": 0.97, - "learning_rate": 1.4076598178691883e-06, - "loss": 2.2002, - "step": 557290 + "epoch": 0.44, + "learning_rate": 2.806540044476015e-05, + "loss": 2.7545, + "step": 122900 }, { - "epoch": 0.97, - "learning_rate": 1.4067878779423614e-06, - "loss": 2.2693, - "step": 557300 + "epoch": 0.44, + "learning_rate": 2.804755292681447e-05, + "loss": 2.7735, + "step": 123000 }, { - "epoch": 0.97, - "learning_rate": 1.4059159380155345e-06, - "loss": 2.2165, - "step": 557310 + "epoch": 0.44, + "learning_rate": 2.8029705408868788e-05, + "loss": 2.761, + "step": 123100 }, { - "epoch": 0.97, - "learning_rate": 1.4050439980887077e-06, - "loss": 2.3103, - "step": 557320 + "epoch": 0.44, + "learning_rate": 2.801185789092311e-05, + "loss": 2.7621, + "step": 123200 }, { - "epoch": 0.97, - "learning_rate": 1.404172058161881e-06, - "loss": 2.3465, - "step": 557330 + "epoch": 0.44, + "learning_rate": 2.799401037297743e-05, + "loss": 2.7577, + "step": 123300 }, { - "epoch": 0.97, - "learning_rate": 1.4033001182350542e-06, - "loss": 2.376, - "step": 557340 + "epoch": 0.44, + "learning_rate": 2.797616285503175e-05, + "loss": 2.7498, + "step": 123400 }, { - "epoch": 0.97, - "learning_rate": 1.4024281783082273e-06, - "loss": 2.3299, - "step": 557350 + "epoch": 0.44, + "learning_rate": 2.7958315337086073e-05, + "loss": 2.7634, + "step": 123500 }, { - "epoch": 0.97, - "learning_rate": 1.4015562383814006e-06, - "loss": 2.2997, - "step": 557360 + "epoch": 0.44, + "learning_rate": 2.7940467819140394e-05, + "loss": 2.764, + "step": 123600 }, { - "epoch": 0.97, - "learning_rate": 1.4006842984545738e-06, - "loss": 2.2071, - "step": 557370 + "epoch": 0.44, + "learning_rate": 2.792262030119471e-05, + "loss": 2.7741, + "step": 123700 }, { - "epoch": 0.97, - "learning_rate": 1.399812358527747e-06, - "loss": 2.2718, - "step": 557380 + "epoch": 0.44, + "learning_rate": 2.7904772783249033e-05, + "loss": 2.7674, + "step": 123800 }, { - "epoch": 0.97, - "learning_rate": 1.3989404186009203e-06, - "loss": 2.2663, - "step": 557390 + "epoch": 0.44, + "learning_rate": 2.7886925265303354e-05, + "loss": 2.748, + "step": 123900 }, { - "epoch": 0.97, - "learning_rate": 1.3980684786740934e-06, - "loss": 2.2225, - "step": 557400 + "epoch": 0.44, + "learning_rate": 2.7869077747357675e-05, + "loss": 2.7595, + "step": 124000 }, { - "epoch": 0.97, - "learning_rate": 1.3971965387472665e-06, - "loss": 2.2257, - "step": 557410 + "epoch": 0.44, + "learning_rate": 2.7851230229411997e-05, + "loss": 2.7542, + "step": 124100 }, { - "epoch": 0.97, - "learning_rate": 1.3963245988204397e-06, - "loss": 2.1495, - "step": 557420 + "epoch": 0.44, + "learning_rate": 2.7833382711466314e-05, + "loss": 2.7677, + "step": 124200 }, { - "epoch": 0.97, - "learning_rate": 1.395452658893613e-06, - "loss": 2.1333, - "step": 557430 + "epoch": 0.44, + "learning_rate": 2.7815535193520636e-05, + "loss": 2.7678, + "step": 124300 }, { - "epoch": 0.97, - "learning_rate": 1.3945807189667861e-06, - "loss": 2.2335, - "step": 557440 + "epoch": 0.44, + "learning_rate": 2.7797687675574957e-05, + "loss": 2.7632, + "step": 124400 }, { - "epoch": 0.97, - "learning_rate": 1.3937087790399593e-06, - "loss": 2.2179, - "step": 557450 + "epoch": 0.44, + "learning_rate": 2.7779840157629278e-05, + "loss": 2.7536, + "step": 124500 }, { - "epoch": 0.97, - "learning_rate": 1.3928368391131326e-06, - "loss": 2.1709, - "step": 557460 + "epoch": 0.44, + "learning_rate": 2.77619926396836e-05, + "loss": 2.7657, + "step": 124600 }, { - "epoch": 0.97, - "learning_rate": 1.3919648991863058e-06, - "loss": 2.2746, - "step": 557470 + "epoch": 0.45, + "learning_rate": 2.774414512173792e-05, + "loss": 2.7621, + "step": 124700 }, { - "epoch": 0.97, - "learning_rate": 1.3910929592594789e-06, - "loss": 2.309, - "step": 557480 + "epoch": 0.45, + "learning_rate": 2.7726297603792238e-05, + "loss": 2.7572, + "step": 124800 }, { - "epoch": 0.97, - "learning_rate": 1.3902210193326522e-06, - "loss": 2.3955, - "step": 557490 + "epoch": 0.45, + "learning_rate": 2.770845008584656e-05, + "loss": 2.759, + "step": 124900 }, { - "epoch": 0.97, - "learning_rate": 1.3893490794058254e-06, - "loss": 2.2406, - "step": 557500 + "epoch": 0.45, + "learning_rate": 2.769060256790088e-05, + "loss": 2.7554, + "step": 125000 }, { - "epoch": 0.97, - "learning_rate": 1.3884771394789985e-06, - "loss": 2.3348, - "step": 557510 + "epoch": 0.45, + "learning_rate": 2.7672755049955202e-05, + "loss": 2.7481, + "step": 125100 }, { - "epoch": 0.97, - "learning_rate": 1.3876051995521716e-06, - "loss": 2.196, - "step": 557520 + "epoch": 0.45, + "learning_rate": 2.7654907532009526e-05, + "loss": 2.7598, + "step": 125200 }, { - "epoch": 0.97, - "learning_rate": 1.386733259625345e-06, - "loss": 2.1193, - "step": 557530 + "epoch": 0.45, + "learning_rate": 2.7637060014063848e-05, + "loss": 2.7662, + "step": 125300 }, { - "epoch": 0.97, - "learning_rate": 1.3858613196985181e-06, - "loss": 2.2508, - "step": 557540 + "epoch": 0.45, + "learning_rate": 2.761921249611817e-05, + "loss": 2.765, + "step": 125400 }, { - "epoch": 0.97, - "learning_rate": 1.3849893797716913e-06, - "loss": 2.306, - "step": 557550 + "epoch": 0.45, + "learning_rate": 2.760136497817249e-05, + "loss": 2.7548, + "step": 125500 }, { - "epoch": 0.97, - "learning_rate": 1.3841174398448646e-06, - "loss": 2.2178, - "step": 557560 + "epoch": 0.45, + "learning_rate": 2.758351746022681e-05, + "loss": 2.7529, + "step": 125600 }, { - "epoch": 0.97, - "learning_rate": 1.3832454999180377e-06, - "loss": 2.2354, - "step": 557570 + "epoch": 0.45, + "learning_rate": 2.756566994228113e-05, + "loss": 2.7479, + "step": 125700 }, { - "epoch": 0.97, - "learning_rate": 1.3823735599912109e-06, - "loss": 2.3524, - "step": 557580 + "epoch": 0.45, + "learning_rate": 2.754782242433545e-05, + "loss": 2.7477, + "step": 125800 }, { - "epoch": 0.97, - "learning_rate": 1.3815016200643842e-06, - "loss": 2.3315, - "step": 557590 + "epoch": 0.45, + "learning_rate": 2.752997490638977e-05, + "loss": 2.745, + "step": 125900 }, { - "epoch": 0.97, - "learning_rate": 1.3806296801375574e-06, - "loss": 2.2657, - "step": 557600 + "epoch": 0.45, + "learning_rate": 2.7512127388444093e-05, + "loss": 2.7561, + "step": 126000 }, { - "epoch": 0.97, - "learning_rate": 1.3797577402107305e-06, - "loss": 2.2192, - "step": 557610 + "epoch": 0.45, + "learning_rate": 2.7494279870498414e-05, + "loss": 2.7503, + "step": 126100 }, { - "epoch": 0.97, - "learning_rate": 1.3788858002839036e-06, - "loss": 2.2569, - "step": 557620 + "epoch": 0.45, + "learning_rate": 2.7476432352552732e-05, + "loss": 2.7533, + "step": 126200 }, { - "epoch": 0.97, - "learning_rate": 1.378013860357077e-06, - "loss": 2.2495, - "step": 557630 + "epoch": 0.45, + "learning_rate": 2.7458584834607053e-05, + "loss": 2.7483, + "step": 126300 }, { - "epoch": 0.97, - "learning_rate": 1.3771419204302501e-06, - "loss": 2.2579, - "step": 557640 + "epoch": 0.45, + "learning_rate": 2.7440737316661374e-05, + "loss": 2.7628, + "step": 126400 }, { - "epoch": 0.97, - "learning_rate": 1.3762699805034232e-06, - "loss": 2.2374, - "step": 557650 + "epoch": 0.45, + "learning_rate": 2.7422889798715696e-05, + "loss": 2.7571, + "step": 126500 }, { - "epoch": 0.97, - "learning_rate": 1.3753980405765966e-06, - "loss": 2.2429, - "step": 557660 + "epoch": 0.45, + "learning_rate": 2.7405042280770017e-05, + "loss": 2.7596, + "step": 126600 }, { - "epoch": 0.97, - "learning_rate": 1.3745261006497697e-06, - "loss": 2.26, - "step": 557670 + "epoch": 0.45, + "learning_rate": 2.7387194762824338e-05, + "loss": 2.7522, + "step": 126700 }, { - "epoch": 0.97, - "learning_rate": 1.3736541607229429e-06, - "loss": 2.3051, - "step": 557680 + "epoch": 0.45, + "learning_rate": 2.7369347244878656e-05, + "loss": 2.7577, + "step": 126800 }, { - "epoch": 0.97, - "learning_rate": 1.3727822207961162e-06, - "loss": 2.2358, - "step": 557690 + "epoch": 0.45, + "learning_rate": 2.7351499726932977e-05, + "loss": 2.7501, + "step": 126900 }, { - "epoch": 0.97, - "learning_rate": 1.3719102808692893e-06, - "loss": 2.2889, - "step": 557700 + "epoch": 0.45, + "learning_rate": 2.7333652208987298e-05, + "loss": 2.7453, + "step": 127000 }, { - "epoch": 0.97, - "learning_rate": 1.3710383409424625e-06, - "loss": 2.1749, - "step": 557710 + "epoch": 0.45, + "learning_rate": 2.731580469104162e-05, + "loss": 2.7565, + "step": 127100 }, { - "epoch": 0.97, - "learning_rate": 1.3701664010156356e-06, - "loss": 2.2625, - "step": 557720 + "epoch": 0.45, + "learning_rate": 2.729795717309594e-05, + "loss": 2.7527, + "step": 127200 }, { - "epoch": 0.97, - "learning_rate": 1.369294461088809e-06, - "loss": 2.2314, - "step": 557730 + "epoch": 0.45, + "learning_rate": 2.728010965515026e-05, + "loss": 2.7426, + "step": 127300 }, { - "epoch": 0.97, - "learning_rate": 1.368422521161982e-06, - "loss": 2.2213, - "step": 557740 + "epoch": 0.45, + "learning_rate": 2.726226213720458e-05, + "loss": 2.7606, + "step": 127400 }, { - "epoch": 0.97, - "learning_rate": 1.3675505812351552e-06, - "loss": 2.2866, - "step": 557750 + "epoch": 0.46, + "learning_rate": 2.72444146192589e-05, + "loss": 2.752, + "step": 127500 }, { - "epoch": 0.97, - "learning_rate": 1.3666786413083286e-06, - "loss": 2.2699, - "step": 557760 + "epoch": 0.46, + "learning_rate": 2.7226567101313222e-05, + "loss": 2.7606, + "step": 127600 }, { - "epoch": 0.97, - "learning_rate": 1.3658067013815017e-06, - "loss": 2.1604, - "step": 557770 + "epoch": 0.46, + "learning_rate": 2.7208719583367543e-05, + "loss": 2.765, + "step": 127700 }, { - "epoch": 0.97, - "learning_rate": 1.3649347614546748e-06, - "loss": 2.2491, - "step": 557780 + "epoch": 0.46, + "learning_rate": 2.7190872065421865e-05, + "loss": 2.7667, + "step": 127800 }, { - "epoch": 0.97, - "learning_rate": 1.3640628215278482e-06, - "loss": 2.2856, - "step": 557790 + "epoch": 0.46, + "learning_rate": 2.7173024547476182e-05, + "loss": 2.7577, + "step": 127900 }, { - "epoch": 0.97, - "learning_rate": 1.3631908816010213e-06, - "loss": 2.2596, - "step": 557800 + "epoch": 0.46, + "learning_rate": 2.7155177029530504e-05, + "loss": 2.7512, + "step": 128000 }, { - "epoch": 0.97, - "learning_rate": 1.3623189416741945e-06, - "loss": 2.2502, - "step": 557810 + "epoch": 0.46, + "learning_rate": 2.7137329511584825e-05, + "loss": 2.7527, + "step": 128100 }, { - "epoch": 0.97, - "learning_rate": 1.3614470017473676e-06, - "loss": 2.2107, - "step": 557820 + "epoch": 0.46, + "learning_rate": 2.7119481993639146e-05, + "loss": 2.7469, + "step": 128200 }, { - "epoch": 0.97, - "learning_rate": 1.360575061820541e-06, - "loss": 2.2273, - "step": 557830 + "epoch": 0.46, + "learning_rate": 2.7101634475693467e-05, + "loss": 2.7507, + "step": 128300 }, { - "epoch": 0.97, - "learning_rate": 1.359703121893714e-06, - "loss": 2.2728, - "step": 557840 + "epoch": 0.46, + "learning_rate": 2.7083786957747785e-05, + "loss": 2.7518, + "step": 128400 }, { - "epoch": 0.97, - "learning_rate": 1.3588311819668872e-06, - "loss": 2.2593, - "step": 557850 + "epoch": 0.46, + "learning_rate": 2.7065939439802106e-05, + "loss": 2.751, + "step": 128500 }, { - "epoch": 0.97, - "learning_rate": 1.3579592420400606e-06, - "loss": 2.2579, - "step": 557860 + "epoch": 0.46, + "learning_rate": 2.7048091921856427e-05, + "loss": 2.7627, + "step": 128600 }, { - "epoch": 0.97, - "learning_rate": 1.3570873021132337e-06, - "loss": 2.2654, - "step": 557870 + "epoch": 0.46, + "learning_rate": 2.703024440391075e-05, + "loss": 2.7516, + "step": 128700 }, { - "epoch": 0.97, - "learning_rate": 1.3562153621864068e-06, - "loss": 2.1041, - "step": 557880 + "epoch": 0.46, + "learning_rate": 2.701239688596507e-05, + "loss": 2.7515, + "step": 128800 }, { - "epoch": 0.97, - "learning_rate": 1.3553434222595802e-06, - "loss": 2.1499, - "step": 557890 + "epoch": 0.46, + "learning_rate": 2.699454936801939e-05, + "loss": 2.7556, + "step": 128900 }, { - "epoch": 0.97, - "learning_rate": 1.3544714823327533e-06, - "loss": 2.222, - "step": 557900 + "epoch": 0.46, + "learning_rate": 2.697670185007371e-05, + "loss": 2.7491, + "step": 129000 }, { - "epoch": 0.97, - "learning_rate": 1.3535995424059264e-06, - "loss": 2.3645, - "step": 557910 + "epoch": 0.46, + "learning_rate": 2.695885433212803e-05, + "loss": 2.7524, + "step": 129100 }, { - "epoch": 0.97, - "learning_rate": 1.3527276024790996e-06, - "loss": 2.2273, - "step": 557920 + "epoch": 0.46, + "learning_rate": 2.694100681418235e-05, + "loss": 2.7487, + "step": 129200 }, { - "epoch": 0.97, - "learning_rate": 1.351855662552273e-06, - "loss": 2.2721, - "step": 557930 + "epoch": 0.46, + "learning_rate": 2.6923159296236673e-05, + "loss": 2.763, + "step": 129300 }, { - "epoch": 0.97, - "learning_rate": 1.350983722625446e-06, - "loss": 2.2276, - "step": 557940 + "epoch": 0.46, + "learning_rate": 2.6905311778290994e-05, + "loss": 2.739, + "step": 129400 }, { - "epoch": 0.97, - "learning_rate": 1.3501117826986192e-06, - "loss": 2.2702, - "step": 557950 + "epoch": 0.46, + "learning_rate": 2.688746426034531e-05, + "loss": 2.7549, + "step": 129500 }, { - "epoch": 0.97, - "learning_rate": 1.3492398427717925e-06, - "loss": 2.3439, - "step": 557960 + "epoch": 0.46, + "learning_rate": 2.6869616742399633e-05, + "loss": 2.761, + "step": 129600 }, { - "epoch": 0.97, - "learning_rate": 1.3483679028449657e-06, - "loss": 2.311, - "step": 557970 + "epoch": 0.46, + "learning_rate": 2.6851769224453954e-05, + "loss": 2.7487, + "step": 129700 }, { - "epoch": 0.97, - "learning_rate": 1.3474959629181388e-06, - "loss": 2.2971, - "step": 557980 + "epoch": 0.46, + "learning_rate": 2.6833921706508275e-05, + "loss": 2.7585, + "step": 129800 }, { - "epoch": 0.97, - "learning_rate": 1.3466240229913121e-06, - "loss": 2.2345, - "step": 557990 + "epoch": 0.46, + "learning_rate": 2.6816074188562596e-05, + "loss": 2.7546, + "step": 129900 }, { - "epoch": 0.97, - "learning_rate": 1.3457520830644853e-06, - "loss": 2.3805, - "step": 558000 + "epoch": 0.46, + "learning_rate": 2.6798226670616918e-05, + "loss": 2.7487, + "step": 130000 }, { - "epoch": 0.97, - "learning_rate": 1.3448801431376584e-06, - "loss": 2.234, - "step": 558010 + "epoch": 0.46, + "learning_rate": 2.6780379152671236e-05, + "loss": 2.7442, + "step": 130100 }, { - "epoch": 0.97, - "learning_rate": 1.3440082032108316e-06, - "loss": 2.2137, - "step": 558020 + "epoch": 0.46, + "learning_rate": 2.6762531634725557e-05, + "loss": 2.7464, + "step": 130200 }, { - "epoch": 0.97, - "learning_rate": 1.343136263284005e-06, - "loss": 2.32, - "step": 558030 + "epoch": 0.47, + "learning_rate": 2.6744684116779885e-05, + "loss": 2.7618, + "step": 130300 }, { - "epoch": 0.97, - "learning_rate": 1.342264323357178e-06, - "loss": 2.1954, - "step": 558040 + "epoch": 0.47, + "learning_rate": 2.6726836598834203e-05, + "loss": 2.7588, + "step": 130400 }, { - "epoch": 0.97, - "learning_rate": 1.3413923834303512e-06, - "loss": 2.0258, - "step": 558050 + "epoch": 0.47, + "learning_rate": 2.6708989080888524e-05, + "loss": 2.7507, + "step": 130500 }, { - "epoch": 0.97, - "learning_rate": 1.3405204435035245e-06, - "loss": 2.2558, - "step": 558060 + "epoch": 0.47, + "learning_rate": 2.6691141562942845e-05, + "loss": 2.7527, + "step": 130600 }, { - "epoch": 0.97, - "learning_rate": 1.3396485035766976e-06, - "loss": 2.1589, - "step": 558070 + "epoch": 0.47, + "learning_rate": 2.6673294044997166e-05, + "loss": 2.7451, + "step": 130700 }, { - "epoch": 0.97, - "learning_rate": 1.3387765636498708e-06, - "loss": 2.3309, - "step": 558080 + "epoch": 0.47, + "learning_rate": 2.6655446527051487e-05, + "loss": 2.747, + "step": 130800 }, { - "epoch": 0.97, - "learning_rate": 1.3379046237230441e-06, - "loss": 2.2468, - "step": 558090 + "epoch": 0.47, + "learning_rate": 2.663759900910581e-05, + "loss": 2.7497, + "step": 130900 }, { - "epoch": 0.97, - "learning_rate": 1.3370326837962173e-06, - "loss": 2.2752, - "step": 558100 + "epoch": 0.47, + "learning_rate": 2.6619751491160126e-05, + "loss": 2.7488, + "step": 131000 }, { - "epoch": 0.97, - "learning_rate": 1.3361607438693904e-06, - "loss": 2.3213, - "step": 558110 + "epoch": 0.47, + "learning_rate": 2.6601903973214448e-05, + "loss": 2.7602, + "step": 131100 }, { - "epoch": 0.97, - "learning_rate": 1.3352888039425635e-06, - "loss": 2.2877, - "step": 558120 + "epoch": 0.47, + "learning_rate": 2.658405645526877e-05, + "loss": 2.7607, + "step": 131200 }, { - "epoch": 0.97, - "learning_rate": 1.3344168640157369e-06, - "loss": 2.2485, - "step": 558130 + "epoch": 0.47, + "learning_rate": 2.656620893732309e-05, + "loss": 2.755, + "step": 131300 }, { - "epoch": 0.97, - "learning_rate": 1.33354492408891e-06, - "loss": 2.3491, - "step": 558140 + "epoch": 0.47, + "learning_rate": 2.654836141937741e-05, + "loss": 2.7475, + "step": 131400 }, { - "epoch": 0.97, - "learning_rate": 1.3326729841620831e-06, - "loss": 2.2751, - "step": 558150 + "epoch": 0.47, + "learning_rate": 2.653051390143173e-05, + "loss": 2.748, + "step": 131500 }, { - "epoch": 0.97, - "learning_rate": 1.3318010442352565e-06, - "loss": 2.3038, - "step": 558160 + "epoch": 0.47, + "learning_rate": 2.651266638348605e-05, + "loss": 2.7503, + "step": 131600 }, { - "epoch": 0.97, - "learning_rate": 1.3309291043084296e-06, - "loss": 2.2789, - "step": 558170 + "epoch": 0.47, + "learning_rate": 2.649481886554037e-05, + "loss": 2.7487, + "step": 131700 }, { - "epoch": 0.97, - "learning_rate": 1.3300571643816028e-06, - "loss": 2.184, - "step": 558180 + "epoch": 0.47, + "learning_rate": 2.6476971347594693e-05, + "loss": 2.7458, + "step": 131800 }, { - "epoch": 0.97, - "learning_rate": 1.3291852244547761e-06, - "loss": 2.165, - "step": 558190 + "epoch": 0.47, + "learning_rate": 2.6459123829649014e-05, + "loss": 2.7588, + "step": 131900 }, { - "epoch": 0.97, - "learning_rate": 1.3283132845279492e-06, - "loss": 2.1944, - "step": 558200 + "epoch": 0.47, + "learning_rate": 2.6441276311703332e-05, + "loss": 2.7382, + "step": 132000 }, { - "epoch": 0.97, - "learning_rate": 1.3274413446011224e-06, - "loss": 2.2595, - "step": 558210 + "epoch": 0.47, + "learning_rate": 2.6423428793757653e-05, + "loss": 2.757, + "step": 132100 }, { - "epoch": 0.97, - "learning_rate": 1.3265694046742955e-06, - "loss": 2.2371, - "step": 558220 + "epoch": 0.47, + "learning_rate": 2.6405581275811974e-05, + "loss": 2.762, + "step": 132200 }, { - "epoch": 0.97, - "learning_rate": 1.3256974647474689e-06, - "loss": 2.3085, - "step": 558230 + "epoch": 0.47, + "learning_rate": 2.6387733757866295e-05, + "loss": 2.7397, + "step": 132300 }, { - "epoch": 0.97, - "learning_rate": 1.324825524820642e-06, - "loss": 2.2845, - "step": 558240 + "epoch": 0.47, + "learning_rate": 2.6369886239920617e-05, + "loss": 2.7499, + "step": 132400 }, { - "epoch": 0.97, - "learning_rate": 1.3239535848938151e-06, - "loss": 2.2287, - "step": 558250 + "epoch": 0.47, + "learning_rate": 2.6352038721974938e-05, + "loss": 2.7543, + "step": 132500 }, { - "epoch": 0.97, - "learning_rate": 1.3230816449669885e-06, - "loss": 2.2292, - "step": 558260 + "epoch": 0.47, + "learning_rate": 2.6334191204029256e-05, + "loss": 2.7473, + "step": 132600 }, { - "epoch": 0.97, - "learning_rate": 1.3222097050401616e-06, - "loss": 2.323, - "step": 558270 + "epoch": 0.47, + "learning_rate": 2.6316343686083577e-05, + "loss": 2.7637, + "step": 132700 }, { - "epoch": 0.97, - "learning_rate": 1.3213377651133347e-06, - "loss": 2.2172, - "step": 558280 + "epoch": 0.47, + "learning_rate": 2.6298496168137898e-05, + "loss": 2.7512, + "step": 132800 }, { - "epoch": 0.97, - "learning_rate": 1.320465825186508e-06, - "loss": 2.2229, - "step": 558290 + "epoch": 0.47, + "learning_rate": 2.628064865019222e-05, + "loss": 2.7512, + "step": 132900 }, { - "epoch": 0.97, - "learning_rate": 1.3195938852596812e-06, - "loss": 2.3149, - "step": 558300 + "epoch": 0.47, + "learning_rate": 2.626280113224654e-05, + "loss": 2.7439, + "step": 133000 }, { - "epoch": 0.97, - "learning_rate": 1.3187219453328544e-06, - "loss": 2.2392, - "step": 558310 + "epoch": 0.48, + "learning_rate": 2.624495361430086e-05, + "loss": 2.7528, + "step": 133100 }, { - "epoch": 0.97, - "learning_rate": 1.3178500054060275e-06, - "loss": 2.219, - "step": 558320 + "epoch": 0.48, + "learning_rate": 2.622710609635518e-05, + "loss": 2.7516, + "step": 133200 }, { - "epoch": 0.97, - "learning_rate": 1.3169780654792008e-06, - "loss": 2.2994, - "step": 558330 + "epoch": 0.48, + "learning_rate": 2.62092585784095e-05, + "loss": 2.7441, + "step": 133300 }, { - "epoch": 0.97, - "learning_rate": 1.316106125552374e-06, - "loss": 2.298, - "step": 558340 + "epoch": 0.48, + "learning_rate": 2.6191411060463822e-05, + "loss": 2.7522, + "step": 133400 }, { - "epoch": 0.97, - "learning_rate": 1.3152341856255471e-06, - "loss": 2.3215, - "step": 558350 + "epoch": 0.48, + "learning_rate": 2.6173563542518143e-05, + "loss": 2.7407, + "step": 133500 }, { - "epoch": 0.97, - "learning_rate": 1.3143622456987205e-06, - "loss": 2.3763, - "step": 558360 + "epoch": 0.48, + "learning_rate": 2.6155716024572465e-05, + "loss": 2.7493, + "step": 133600 }, { - "epoch": 0.97, - "learning_rate": 1.3134903057718936e-06, - "loss": 2.3559, - "step": 558370 + "epoch": 0.48, + "learning_rate": 2.6137868506626782e-05, + "loss": 2.738, + "step": 133700 }, { - "epoch": 0.97, - "learning_rate": 1.3126183658450667e-06, - "loss": 2.129, - "step": 558380 + "epoch": 0.48, + "learning_rate": 2.6120020988681104e-05, + "loss": 2.7546, + "step": 133800 }, { - "epoch": 0.97, - "learning_rate": 1.31174642591824e-06, - "loss": 2.2144, - "step": 558390 + "epoch": 0.48, + "learning_rate": 2.6102173470735425e-05, + "loss": 2.7533, + "step": 133900 }, { - "epoch": 0.97, - "learning_rate": 1.3108744859914132e-06, - "loss": 2.3498, - "step": 558400 + "epoch": 0.48, + "learning_rate": 2.6084325952789746e-05, + "loss": 2.7519, + "step": 134000 }, { - "epoch": 0.97, - "learning_rate": 1.3100025460645863e-06, - "loss": 2.2458, - "step": 558410 + "epoch": 0.48, + "learning_rate": 2.6066478434844067e-05, + "loss": 2.7701, + "step": 134100 }, { - "epoch": 0.97, - "learning_rate": 1.3091306061377597e-06, - "loss": 2.2619, - "step": 558420 + "epoch": 0.48, + "learning_rate": 2.6048630916898385e-05, + "loss": 2.7568, + "step": 134200 }, { - "epoch": 0.97, - "learning_rate": 1.3082586662109328e-06, - "loss": 2.2135, - "step": 558430 + "epoch": 0.48, + "learning_rate": 2.6030783398952706e-05, + "loss": 2.7504, + "step": 134300 }, { - "epoch": 0.97, - "learning_rate": 1.307386726284106e-06, - "loss": 2.2637, - "step": 558440 + "epoch": 0.48, + "learning_rate": 2.6012935881007027e-05, + "loss": 2.7449, + "step": 134400 }, { - "epoch": 0.97, - "learning_rate": 1.306514786357279e-06, - "loss": 2.279, - "step": 558450 + "epoch": 0.48, + "learning_rate": 2.599508836306135e-05, + "loss": 2.7515, + "step": 134500 }, { - "epoch": 0.97, - "learning_rate": 1.3056428464304524e-06, - "loss": 2.139, - "step": 558460 + "epoch": 0.48, + "learning_rate": 2.597724084511567e-05, + "loss": 2.751, + "step": 134600 }, { - "epoch": 0.97, - "learning_rate": 1.3047709065036256e-06, - "loss": 2.2944, - "step": 558470 + "epoch": 0.48, + "learning_rate": 2.595939332716999e-05, + "loss": 2.7471, + "step": 134700 }, { - "epoch": 0.97, - "learning_rate": 1.3038989665767987e-06, - "loss": 2.2057, - "step": 558480 + "epoch": 0.48, + "learning_rate": 2.594154580922431e-05, + "loss": 2.7567, + "step": 134800 }, { - "epoch": 0.97, - "learning_rate": 1.303027026649972e-06, - "loss": 2.1446, - "step": 558490 + "epoch": 0.48, + "learning_rate": 2.592369829127863e-05, + "loss": 2.7525, + "step": 134900 }, { - "epoch": 0.97, - "learning_rate": 1.3021550867231452e-06, - "loss": 2.2854, - "step": 558500 + "epoch": 0.48, + "learning_rate": 2.590585077333295e-05, + "loss": 2.7495, + "step": 135000 }, { - "epoch": 0.97, - "learning_rate": 1.3012831467963183e-06, - "loss": 2.1906, - "step": 558510 + "epoch": 0.48, + "learning_rate": 2.5888003255387273e-05, + "loss": 2.7366, + "step": 135100 }, { - "epoch": 0.97, - "learning_rate": 1.3004112068694917e-06, - "loss": 2.3106, - "step": 558520 + "epoch": 0.48, + "learning_rate": 2.5870155737441594e-05, + "loss": 2.7473, + "step": 135200 }, { - "epoch": 0.97, - "learning_rate": 1.2995392669426648e-06, - "loss": 2.1754, - "step": 558530 + "epoch": 0.48, + "learning_rate": 2.585230821949591e-05, + "loss": 2.7443, + "step": 135300 }, { - "epoch": 0.97, - "learning_rate": 1.298667327015838e-06, - "loss": 2.2834, - "step": 558540 + "epoch": 0.48, + "learning_rate": 2.583446070155024e-05, + "loss": 2.7467, + "step": 135400 }, { - "epoch": 0.97, - "learning_rate": 1.297795387089011e-06, - "loss": 2.3427, - "step": 558550 + "epoch": 0.48, + "learning_rate": 2.581661318360456e-05, + "loss": 2.738, + "step": 135500 }, { - "epoch": 0.97, - "learning_rate": 1.2969234471621844e-06, - "loss": 2.2798, - "step": 558560 + "epoch": 0.48, + "learning_rate": 2.5798765665658882e-05, + "loss": 2.7387, + "step": 135600 }, { - "epoch": 0.97, - "learning_rate": 1.2960515072353576e-06, - "loss": 2.1845, - "step": 558570 + "epoch": 0.48, + "learning_rate": 2.57809181477132e-05, + "loss": 2.7489, + "step": 135700 }, { - "epoch": 0.97, - "learning_rate": 1.2951795673085307e-06, - "loss": 2.2228, - "step": 558580 + "epoch": 0.48, + "learning_rate": 2.576307062976752e-05, + "loss": 2.7453, + "step": 135800 }, { - "epoch": 0.97, - "learning_rate": 1.294307627381704e-06, - "loss": 2.2685, - "step": 558590 + "epoch": 0.49, + "learning_rate": 2.5745223111821842e-05, + "loss": 2.7451, + "step": 135900 }, { - "epoch": 0.97, - "learning_rate": 1.2934356874548772e-06, - "loss": 2.203, - "step": 558600 + "epoch": 0.49, + "learning_rate": 2.5727375593876163e-05, + "loss": 2.7548, + "step": 136000 }, { - "epoch": 0.97, - "learning_rate": 1.2925637475280503e-06, - "loss": 2.3443, - "step": 558610 + "epoch": 0.49, + "learning_rate": 2.5709528075930485e-05, + "loss": 2.7495, + "step": 136100 }, { - "epoch": 0.97, - "learning_rate": 1.2916918076012237e-06, - "loss": 2.1876, - "step": 558620 + "epoch": 0.49, + "learning_rate": 2.5691680557984803e-05, + "loss": 2.7477, + "step": 136200 }, { - "epoch": 0.97, - "learning_rate": 1.2908198676743968e-06, - "loss": 2.3354, - "step": 558630 + "epoch": 0.49, + "learning_rate": 2.5673833040039124e-05, + "loss": 2.7342, + "step": 136300 }, { - "epoch": 0.97, - "learning_rate": 1.28994792774757e-06, - "loss": 2.2132, - "step": 558640 + "epoch": 0.49, + "learning_rate": 2.5655985522093445e-05, + "loss": 2.747, + "step": 136400 }, { - "epoch": 0.97, - "learning_rate": 1.289075987820743e-06, - "loss": 2.2528, - "step": 558650 + "epoch": 0.49, + "learning_rate": 2.5638138004147766e-05, + "loss": 2.7491, + "step": 136500 }, { - "epoch": 0.97, - "learning_rate": 1.2882040478939164e-06, - "loss": 2.2778, - "step": 558660 + "epoch": 0.49, + "learning_rate": 2.5620290486202087e-05, + "loss": 2.7354, + "step": 136600 }, { - "epoch": 0.97, - "learning_rate": 1.2873321079670895e-06, - "loss": 2.3244, - "step": 558670 + "epoch": 0.49, + "learning_rate": 2.560244296825641e-05, + "loss": 2.7453, + "step": 136700 }, { - "epoch": 0.97, - "learning_rate": 1.2864601680402627e-06, - "loss": 2.2474, - "step": 558680 + "epoch": 0.49, + "learning_rate": 2.5584595450310726e-05, + "loss": 2.7476, + "step": 136800 }, { - "epoch": 0.97, - "learning_rate": 1.285588228113436e-06, - "loss": 2.2185, - "step": 558690 + "epoch": 0.49, + "learning_rate": 2.5566747932365048e-05, + "loss": 2.7495, + "step": 136900 }, { - "epoch": 0.97, - "learning_rate": 1.2847162881866092e-06, - "loss": 2.2469, - "step": 558700 + "epoch": 0.49, + "learning_rate": 2.554890041441937e-05, + "loss": 2.7475, + "step": 137000 }, { - "epoch": 0.97, - "learning_rate": 1.2838443482597823e-06, - "loss": 2.2871, - "step": 558710 + "epoch": 0.49, + "learning_rate": 2.553105289647369e-05, + "loss": 2.7538, + "step": 137100 }, { - "epoch": 0.97, - "learning_rate": 1.2829724083329556e-06, - "loss": 2.2921, - "step": 558720 + "epoch": 0.49, + "learning_rate": 2.551320537852801e-05, + "loss": 2.7488, + "step": 137200 }, { - "epoch": 0.97, - "learning_rate": 1.2821004684061288e-06, - "loss": 2.3394, - "step": 558730 + "epoch": 0.49, + "learning_rate": 2.549535786058233e-05, + "loss": 2.7532, + "step": 137300 }, { - "epoch": 0.97, - "learning_rate": 1.281228528479302e-06, - "loss": 2.1689, - "step": 558740 + "epoch": 0.49, + "learning_rate": 2.547751034263665e-05, + "loss": 2.7602, + "step": 137400 }, { - "epoch": 0.97, - "learning_rate": 1.280356588552475e-06, - "loss": 2.1776, - "step": 558750 + "epoch": 0.49, + "learning_rate": 2.545966282469097e-05, + "loss": 2.7702, + "step": 137500 }, { - "epoch": 0.97, - "learning_rate": 1.2794846486256484e-06, - "loss": 2.3054, - "step": 558760 + "epoch": 0.49, + "learning_rate": 2.5441815306745293e-05, + "loss": 2.7445, + "step": 137600 }, { - "epoch": 0.97, - "learning_rate": 1.2786127086988215e-06, - "loss": 2.2465, - "step": 558770 + "epoch": 0.49, + "learning_rate": 2.5423967788799614e-05, + "loss": 2.7486, + "step": 137700 }, { - "epoch": 0.97, - "learning_rate": 1.2777407687719947e-06, - "loss": 2.2158, - "step": 558780 + "epoch": 0.49, + "learning_rate": 2.5406120270853935e-05, + "loss": 2.7399, + "step": 137800 }, { - "epoch": 0.97, - "learning_rate": 1.276868828845168e-06, - "loss": 2.232, - "step": 558790 + "epoch": 0.49, + "learning_rate": 2.5388272752908253e-05, + "loss": 2.7414, + "step": 137900 }, { - "epoch": 0.97, - "learning_rate": 1.2759968889183411e-06, - "loss": 2.1998, - "step": 558800 + "epoch": 0.49, + "learning_rate": 2.5370425234962574e-05, + "loss": 2.7525, + "step": 138000 }, { - "epoch": 0.97, - "learning_rate": 1.2751249489915143e-06, - "loss": 2.2291, - "step": 558810 + "epoch": 0.49, + "learning_rate": 2.5352577717016895e-05, + "loss": 2.7458, + "step": 138100 }, { - "epoch": 0.97, - "learning_rate": 1.2742530090646876e-06, - "loss": 2.2286, - "step": 558820 + "epoch": 0.49, + "learning_rate": 2.5334730199071217e-05, + "loss": 2.752, + "step": 138200 }, { - "epoch": 0.97, - "learning_rate": 1.2733810691378608e-06, - "loss": 2.2935, - "step": 558830 + "epoch": 0.49, + "learning_rate": 2.5316882681125538e-05, + "loss": 2.7483, + "step": 138300 }, { - "epoch": 0.97, - "learning_rate": 1.2725091292110339e-06, - "loss": 2.3482, - "step": 558840 + "epoch": 0.49, + "learning_rate": 2.5299035163179856e-05, + "loss": 2.74, + "step": 138400 }, { - "epoch": 0.97, - "learning_rate": 1.271637189284207e-06, - "loss": 2.2398, - "step": 558850 + "epoch": 0.49, + "learning_rate": 2.5281187645234177e-05, + "loss": 2.7632, + "step": 138500 }, { - "epoch": 0.97, - "learning_rate": 1.2707652493573804e-06, - "loss": 2.3636, - "step": 558860 + "epoch": 0.49, + "learning_rate": 2.5263340127288498e-05, + "loss": 2.7447, + "step": 138600 }, { - "epoch": 0.97, - "learning_rate": 1.2698933094305535e-06, - "loss": 2.2312, - "step": 558870 + "epoch": 0.5, + "learning_rate": 2.524549260934282e-05, + "loss": 2.7355, + "step": 138700 }, { - "epoch": 0.97, - "learning_rate": 1.2690213695037266e-06, - "loss": 2.2623, - "step": 558880 + "epoch": 0.5, + "learning_rate": 2.522764509139714e-05, + "loss": 2.7461, + "step": 138800 }, { - "epoch": 0.97, - "learning_rate": 1.2681494295769e-06, - "loss": 2.2292, - "step": 558890 + "epoch": 0.5, + "learning_rate": 2.5209797573451462e-05, + "loss": 2.7478, + "step": 138900 }, { - "epoch": 0.97, - "learning_rate": 1.2672774896500731e-06, - "loss": 2.3562, - "step": 558900 + "epoch": 0.5, + "learning_rate": 2.519195005550578e-05, + "loss": 2.7389, + "step": 139000 }, { - "epoch": 0.97, - "learning_rate": 1.2664055497232463e-06, - "loss": 2.2337, - "step": 558910 + "epoch": 0.5, + "learning_rate": 2.51741025375601e-05, + "loss": 2.7421, + "step": 139100 }, { - "epoch": 0.97, - "learning_rate": 1.2655336097964196e-06, - "loss": 2.2799, - "step": 558920 + "epoch": 0.5, + "learning_rate": 2.5156255019614422e-05, + "loss": 2.7595, + "step": 139200 }, { - "epoch": 0.97, - "learning_rate": 1.2646616698695927e-06, - "loss": 2.2665, - "step": 558930 + "epoch": 0.5, + "learning_rate": 2.5138407501668743e-05, + "loss": 2.7452, + "step": 139300 }, { - "epoch": 0.97, - "learning_rate": 1.2637897299427659e-06, - "loss": 2.1419, - "step": 558940 + "epoch": 0.5, + "learning_rate": 2.5120559983723064e-05, + "loss": 2.746, + "step": 139400 }, { - "epoch": 0.97, - "learning_rate": 1.262917790015939e-06, - "loss": 2.2718, - "step": 558950 + "epoch": 0.5, + "learning_rate": 2.5102712465777382e-05, + "loss": 2.7434, + "step": 139500 }, { - "epoch": 0.97, - "learning_rate": 1.2620458500891123e-06, - "loss": 2.1522, - "step": 558960 + "epoch": 0.5, + "learning_rate": 2.5084864947831704e-05, + "loss": 2.7466, + "step": 139600 }, { - "epoch": 0.97, - "learning_rate": 1.2611739101622855e-06, - "loss": 2.1907, - "step": 558970 + "epoch": 0.5, + "learning_rate": 2.5067017429886025e-05, + "loss": 2.7494, + "step": 139700 }, { - "epoch": 0.97, - "learning_rate": 1.2603019702354586e-06, - "loss": 2.2259, - "step": 558980 + "epoch": 0.5, + "learning_rate": 2.5049169911940346e-05, + "loss": 2.7442, + "step": 139800 }, { - "epoch": 0.97, - "learning_rate": 1.259430030308632e-06, - "loss": 2.2349, - "step": 558990 + "epoch": 0.5, + "learning_rate": 2.5031322393994667e-05, + "loss": 2.736, + "step": 139900 }, { - "epoch": 0.97, - "learning_rate": 1.258558090381805e-06, - "loss": 2.2312, - "step": 559000 + "epoch": 0.5, + "learning_rate": 2.501347487604899e-05, + "loss": 2.7473, + "step": 140000 }, { - "epoch": 0.97, - "learning_rate": 1.2576861504549782e-06, - "loss": 2.3962, - "step": 559010 + "epoch": 0.5, + "learning_rate": 2.499562735810331e-05, + "loss": 2.7432, + "step": 140100 }, { - "epoch": 0.97, - "learning_rate": 1.2568142105281516e-06, - "loss": 2.196, - "step": 559020 + "epoch": 0.5, + "learning_rate": 2.497777984015763e-05, + "loss": 2.7406, + "step": 140200 }, { - "epoch": 0.97, - "learning_rate": 1.2559422706013247e-06, - "loss": 2.2349, - "step": 559030 + "epoch": 0.5, + "learning_rate": 2.4959932322211952e-05, + "loss": 2.7418, + "step": 140300 }, { - "epoch": 0.97, - "learning_rate": 1.2550703306744978e-06, - "loss": 2.3159, - "step": 559040 + "epoch": 0.5, + "learning_rate": 2.4942084804266273e-05, + "loss": 2.7518, + "step": 140400 }, { - "epoch": 0.97, - "learning_rate": 1.254198390747671e-06, - "loss": 2.2864, - "step": 559050 + "epoch": 0.5, + "learning_rate": 2.492423728632059e-05, + "loss": 2.7358, + "step": 140500 }, { - "epoch": 0.97, - "learning_rate": 1.2533264508208443e-06, - "loss": 2.3125, - "step": 559060 + "epoch": 0.5, + "learning_rate": 2.4906389768374912e-05, + "loss": 2.7471, + "step": 140600 }, { - "epoch": 0.97, - "learning_rate": 1.2524545108940175e-06, - "loss": 2.1632, - "step": 559070 + "epoch": 0.5, + "learning_rate": 2.4888542250429233e-05, + "loss": 2.7565, + "step": 140700 }, { - "epoch": 0.97, - "learning_rate": 1.2515825709671906e-06, - "loss": 2.1982, - "step": 559080 + "epoch": 0.5, + "learning_rate": 2.4870694732483555e-05, + "loss": 2.7375, + "step": 140800 }, { - "epoch": 0.97, - "learning_rate": 1.250710631040364e-06, - "loss": 2.1882, - "step": 559090 + "epoch": 0.5, + "learning_rate": 2.4852847214537876e-05, + "loss": 2.7518, + "step": 140900 }, { - "epoch": 0.98, - "learning_rate": 1.249838691113537e-06, - "loss": 2.303, - "step": 559100 + "epoch": 0.5, + "learning_rate": 2.4834999696592197e-05, + "loss": 2.7417, + "step": 141000 }, { - "epoch": 0.98, - "learning_rate": 1.2489667511867102e-06, - "loss": 2.3185, - "step": 559110 + "epoch": 0.5, + "learning_rate": 2.4817152178646515e-05, + "loss": 2.7378, + "step": 141100 }, { - "epoch": 0.98, - "learning_rate": 1.2480948112598836e-06, - "loss": 2.1983, - "step": 559120 + "epoch": 0.5, + "learning_rate": 2.4799304660700836e-05, + "loss": 2.7404, + "step": 141200 }, { - "epoch": 0.98, - "learning_rate": 1.2472228713330567e-06, - "loss": 2.2022, - "step": 559130 + "epoch": 0.5, + "learning_rate": 2.4781457142755157e-05, + "loss": 2.7438, + "step": 141300 }, { - "epoch": 0.98, - "learning_rate": 1.2463509314062298e-06, - "loss": 2.3166, - "step": 559140 + "epoch": 0.5, + "learning_rate": 2.476360962480948e-05, + "loss": 2.7558, + "step": 141400 }, { - "epoch": 0.98, - "learning_rate": 1.245478991479403e-06, - "loss": 2.2578, - "step": 559150 + "epoch": 0.51, + "learning_rate": 2.47457621068638e-05, + "loss": 2.7436, + "step": 141500 }, { - "epoch": 0.98, - "learning_rate": 1.2446070515525763e-06, - "loss": 2.3798, - "step": 559160 + "epoch": 0.51, + "learning_rate": 2.4727914588918118e-05, + "loss": 2.7479, + "step": 141600 }, { - "epoch": 0.98, - "learning_rate": 1.2437351116257494e-06, - "loss": 2.1052, - "step": 559170 + "epoch": 0.51, + "learning_rate": 2.471006707097244e-05, + "loss": 2.7583, + "step": 141700 }, { - "epoch": 0.98, - "learning_rate": 1.2428631716989226e-06, - "loss": 2.2327, - "step": 559180 + "epoch": 0.51, + "learning_rate": 2.4692219553026763e-05, + "loss": 2.7381, + "step": 141800 }, { - "epoch": 0.98, - "learning_rate": 1.241991231772096e-06, - "loss": 2.3314, - "step": 559190 + "epoch": 0.51, + "learning_rate": 2.4674372035081085e-05, + "loss": 2.7397, + "step": 141900 }, { - "epoch": 0.98, - "learning_rate": 1.241119291845269e-06, - "loss": 2.2306, - "step": 559200 + "epoch": 0.51, + "learning_rate": 2.4656524517135406e-05, + "loss": 2.744, + "step": 142000 }, { - "epoch": 0.98, - "learning_rate": 1.2402473519184422e-06, - "loss": 2.2913, - "step": 559210 + "epoch": 0.51, + "learning_rate": 2.4638676999189724e-05, + "loss": 2.7566, + "step": 142100 }, { - "epoch": 0.98, - "learning_rate": 1.2393754119916155e-06, - "loss": 2.2686, - "step": 559220 + "epoch": 0.51, + "learning_rate": 2.4620829481244045e-05, + "loss": 2.7493, + "step": 142200 }, { - "epoch": 0.98, - "learning_rate": 1.2385034720647887e-06, - "loss": 2.358, - "step": 559230 + "epoch": 0.51, + "learning_rate": 2.4602981963298366e-05, + "loss": 2.7335, + "step": 142300 }, { - "epoch": 0.98, - "learning_rate": 1.2376315321379618e-06, - "loss": 2.2, - "step": 559240 + "epoch": 0.51, + "learning_rate": 2.4585134445352687e-05, + "loss": 2.7386, + "step": 142400 }, { - "epoch": 0.98, - "learning_rate": 1.236759592211135e-06, - "loss": 2.3191, - "step": 559250 + "epoch": 0.51, + "learning_rate": 2.456728692740701e-05, + "loss": 2.7502, + "step": 142500 }, { - "epoch": 0.98, - "learning_rate": 1.2358876522843083e-06, - "loss": 2.2996, - "step": 559260 + "epoch": 0.51, + "learning_rate": 2.4549439409461326e-05, + "loss": 2.7461, + "step": 142600 }, { - "epoch": 0.98, - "learning_rate": 1.2350157123574814e-06, - "loss": 2.2346, - "step": 559270 + "epoch": 0.51, + "learning_rate": 2.4531591891515648e-05, + "loss": 2.7352, + "step": 142700 }, { - "epoch": 0.98, - "learning_rate": 1.2341437724306546e-06, - "loss": 2.196, - "step": 559280 + "epoch": 0.51, + "learning_rate": 2.451374437356997e-05, + "loss": 2.7417, + "step": 142800 }, { - "epoch": 0.98, - "learning_rate": 1.233271832503828e-06, - "loss": 2.28, - "step": 559290 + "epoch": 0.51, + "learning_rate": 2.449589685562429e-05, + "loss": 2.7435, + "step": 142900 }, { - "epoch": 0.98, - "learning_rate": 1.232399892577001e-06, - "loss": 2.3259, - "step": 559300 + "epoch": 0.51, + "learning_rate": 2.447804933767861e-05, + "loss": 2.748, + "step": 143000 }, { - "epoch": 0.98, - "learning_rate": 1.2315279526501742e-06, - "loss": 2.3384, - "step": 559310 + "epoch": 0.51, + "learning_rate": 2.446020181973293e-05, + "loss": 2.7458, + "step": 143100 }, { - "epoch": 0.98, - "learning_rate": 1.2306560127233475e-06, - "loss": 2.2386, - "step": 559320 + "epoch": 0.51, + "learning_rate": 2.444235430178725e-05, + "loss": 2.7492, + "step": 143200 }, { - "epoch": 0.98, - "learning_rate": 1.2297840727965207e-06, - "loss": 2.2795, - "step": 559330 + "epoch": 0.51, + "learning_rate": 2.442450678384157e-05, + "loss": 2.7469, + "step": 143300 }, { - "epoch": 0.98, - "learning_rate": 1.2289121328696938e-06, - "loss": 2.2903, - "step": 559340 + "epoch": 0.51, + "learning_rate": 2.4406659265895893e-05, + "loss": 2.7519, + "step": 143400 }, { - "epoch": 0.98, - "learning_rate": 1.228040192942867e-06, - "loss": 2.2048, - "step": 559350 + "epoch": 0.51, + "learning_rate": 2.4388811747950214e-05, + "loss": 2.7411, + "step": 143500 }, { - "epoch": 0.98, - "learning_rate": 1.2271682530160403e-06, - "loss": 2.2694, - "step": 559360 + "epoch": 0.51, + "learning_rate": 2.4370964230004535e-05, + "loss": 2.7353, + "step": 143600 }, { - "epoch": 0.98, - "learning_rate": 1.2262963130892134e-06, - "loss": 2.1487, - "step": 559370 + "epoch": 0.51, + "learning_rate": 2.4353116712058853e-05, + "loss": 2.7478, + "step": 143700 }, { - "epoch": 0.98, - "learning_rate": 1.2254243731623865e-06, - "loss": 2.1174, - "step": 559380 + "epoch": 0.51, + "learning_rate": 2.4335269194113174e-05, + "loss": 2.7418, + "step": 143800 }, { - "epoch": 0.98, - "learning_rate": 1.2245524332355599e-06, - "loss": 2.2024, - "step": 559390 + "epoch": 0.51, + "learning_rate": 2.4317421676167495e-05, + "loss": 2.7269, + "step": 143900 }, { - "epoch": 0.98, - "learning_rate": 1.223680493308733e-06, - "loss": 2.249, - "step": 559400 + "epoch": 0.51, + "learning_rate": 2.4299574158221817e-05, + "loss": 2.7446, + "step": 144000 }, { - "epoch": 0.98, - "learning_rate": 1.2228085533819062e-06, - "loss": 2.2771, - "step": 559410 + "epoch": 0.51, + "learning_rate": 2.4281726640276138e-05, + "loss": 2.7508, + "step": 144100 }, { - "epoch": 0.98, - "learning_rate": 1.2219366134550795e-06, - "loss": 2.242, - "step": 559420 + "epoch": 0.51, + "learning_rate": 2.4263879122330456e-05, + "loss": 2.7431, + "step": 144200 }, { - "epoch": 0.98, - "learning_rate": 1.2210646735282526e-06, - "loss": 2.1684, - "step": 559430 + "epoch": 0.52, + "learning_rate": 2.424603160438478e-05, + "loss": 2.7478, + "step": 144300 }, { - "epoch": 0.98, - "learning_rate": 1.2201927336014258e-06, - "loss": 2.1752, - "step": 559440 + "epoch": 0.52, + "learning_rate": 2.42281840864391e-05, + "loss": 2.7388, + "step": 144400 }, { - "epoch": 0.98, - "learning_rate": 1.219320793674599e-06, - "loss": 2.4073, - "step": 559450 + "epoch": 0.52, + "learning_rate": 2.4210336568493423e-05, + "loss": 2.7506, + "step": 144500 }, { - "epoch": 0.98, - "learning_rate": 1.2184488537477723e-06, - "loss": 2.3331, - "step": 559460 + "epoch": 0.52, + "learning_rate": 2.4192489050547744e-05, + "loss": 2.7405, + "step": 144600 }, { - "epoch": 0.98, - "learning_rate": 1.2175769138209454e-06, - "loss": 2.1774, - "step": 559470 + "epoch": 0.52, + "learning_rate": 2.4174641532602062e-05, + "loss": 2.7351, + "step": 144700 }, { - "epoch": 0.98, - "learning_rate": 1.2167049738941185e-06, - "loss": 2.1561, - "step": 559480 + "epoch": 0.52, + "learning_rate": 2.4156794014656383e-05, + "loss": 2.7508, + "step": 144800 }, { - "epoch": 0.98, - "learning_rate": 1.2158330339672919e-06, - "loss": 2.2997, - "step": 559490 + "epoch": 0.52, + "learning_rate": 2.4138946496710704e-05, + "loss": 2.7595, + "step": 144900 }, { - "epoch": 0.98, - "learning_rate": 1.214961094040465e-06, - "loss": 2.1782, - "step": 559500 + "epoch": 0.52, + "learning_rate": 2.4121098978765025e-05, + "loss": 2.7456, + "step": 145000 }, { - "epoch": 0.98, - "learning_rate": 1.2140891541136381e-06, - "loss": 2.2278, - "step": 559510 + "epoch": 0.52, + "learning_rate": 2.4103251460819347e-05, + "loss": 2.7487, + "step": 145100 }, { - "epoch": 0.98, - "learning_rate": 1.2132172141868115e-06, - "loss": 2.333, - "step": 559520 + "epoch": 0.52, + "learning_rate": 2.4085403942873664e-05, + "loss": 2.7473, + "step": 145200 }, { - "epoch": 0.98, - "learning_rate": 1.2123452742599846e-06, - "loss": 2.2219, - "step": 559530 + "epoch": 0.52, + "learning_rate": 2.4067556424927986e-05, + "loss": 2.7426, + "step": 145300 }, { - "epoch": 0.98, - "learning_rate": 1.2114733343331578e-06, - "loss": 2.1262, - "step": 559540 + "epoch": 0.52, + "learning_rate": 2.4049708906982307e-05, + "loss": 2.7394, + "step": 145400 }, { - "epoch": 0.98, - "learning_rate": 1.2106013944063309e-06, - "loss": 2.197, - "step": 559550 + "epoch": 0.52, + "learning_rate": 2.4031861389036628e-05, + "loss": 2.7362, + "step": 145500 }, { - "epoch": 0.98, - "learning_rate": 1.2097294544795042e-06, - "loss": 2.2699, - "step": 559560 + "epoch": 0.52, + "learning_rate": 2.401401387109095e-05, + "loss": 2.7418, + "step": 145600 }, { - "epoch": 0.98, - "learning_rate": 1.2088575145526774e-06, - "loss": 2.2473, - "step": 559570 + "epoch": 0.52, + "learning_rate": 2.399616635314527e-05, + "loss": 2.7537, + "step": 145700 }, { - "epoch": 0.98, - "learning_rate": 1.2079855746258505e-06, - "loss": 2.2492, - "step": 559580 + "epoch": 0.52, + "learning_rate": 2.397831883519959e-05, + "loss": 2.7451, + "step": 145800 }, { - "epoch": 0.98, - "learning_rate": 1.2071136346990239e-06, - "loss": 2.2226, - "step": 559590 + "epoch": 0.52, + "learning_rate": 2.396047131725391e-05, + "loss": 2.7504, + "step": 145900 }, { - "epoch": 0.98, - "learning_rate": 1.206241694772197e-06, - "loss": 2.2128, - "step": 559600 + "epoch": 0.52, + "learning_rate": 2.394262379930823e-05, + "loss": 2.7472, + "step": 146000 }, { - "epoch": 0.98, - "learning_rate": 1.2053697548453701e-06, - "loss": 2.2359, - "step": 559610 + "epoch": 0.52, + "learning_rate": 2.3924776281362552e-05, + "loss": 2.7374, + "step": 146100 }, { - "epoch": 0.98, - "learning_rate": 1.2044978149185435e-06, - "loss": 2.2815, - "step": 559620 + "epoch": 0.52, + "learning_rate": 2.3906928763416873e-05, + "loss": 2.7421, + "step": 146200 }, { - "epoch": 0.98, - "learning_rate": 1.2036258749917166e-06, - "loss": 2.2204, - "step": 559630 + "epoch": 0.52, + "learning_rate": 2.388908124547119e-05, + "loss": 2.745, + "step": 146300 }, { - "epoch": 0.98, - "learning_rate": 1.2027539350648897e-06, - "loss": 2.1787, - "step": 559640 + "epoch": 0.52, + "learning_rate": 2.3871233727525512e-05, + "loss": 2.7375, + "step": 146400 }, { - "epoch": 0.98, - "learning_rate": 1.2018819951380629e-06, - "loss": 2.2499, - "step": 559650 + "epoch": 0.52, + "learning_rate": 2.3853386209579833e-05, + "loss": 2.7346, + "step": 146500 }, { - "epoch": 0.98, - "learning_rate": 1.2010100552112362e-06, - "loss": 2.1928, - "step": 559660 + "epoch": 0.52, + "learning_rate": 2.3835538691634155e-05, + "loss": 2.7361, + "step": 146600 }, { - "epoch": 0.98, - "learning_rate": 1.2001381152844094e-06, - "loss": 2.3713, - "step": 559670 + "epoch": 0.52, + "learning_rate": 2.3817691173688476e-05, + "loss": 2.7455, + "step": 146700 }, { - "epoch": 0.98, - "learning_rate": 1.1992661753575825e-06, - "loss": 2.2505, - "step": 559680 + "epoch": 0.52, + "learning_rate": 2.3799843655742797e-05, + "loss": 2.7492, + "step": 146800 }, { - "epoch": 0.98, - "learning_rate": 1.1983942354307558e-06, - "loss": 2.261, - "step": 559690 + "epoch": 0.52, + "learning_rate": 2.378199613779712e-05, + "loss": 2.7403, + "step": 146900 }, { - "epoch": 0.98, - "learning_rate": 1.197522295503929e-06, - "loss": 2.2751, - "step": 559700 + "epoch": 0.52, + "learning_rate": 2.376414861985144e-05, + "loss": 2.739, + "step": 147000 }, { - "epoch": 0.98, - "learning_rate": 1.196650355577102e-06, - "loss": 2.3133, - "step": 559710 + "epoch": 0.53, + "learning_rate": 2.374630110190576e-05, + "loss": 2.7435, + "step": 147100 }, { - "epoch": 0.98, - "learning_rate": 1.1957784156502755e-06, - "loss": 2.3428, - "step": 559720 + "epoch": 0.53, + "learning_rate": 2.3728453583960082e-05, + "loss": 2.7487, + "step": 147200 }, { - "epoch": 0.98, - "learning_rate": 1.1949064757234486e-06, - "loss": 2.1907, - "step": 559730 + "epoch": 0.53, + "learning_rate": 2.37106060660144e-05, + "loss": 2.7402, + "step": 147300 }, { - "epoch": 0.98, - "learning_rate": 1.1940345357966217e-06, - "loss": 2.31, - "step": 559740 + "epoch": 0.53, + "learning_rate": 2.369275854806872e-05, + "loss": 2.7438, + "step": 147400 }, { - "epoch": 0.98, - "learning_rate": 1.193162595869795e-06, - "loss": 2.2414, - "step": 559750 + "epoch": 0.53, + "learning_rate": 2.3674911030123042e-05, + "loss": 2.7439, + "step": 147500 }, { - "epoch": 0.98, - "learning_rate": 1.1922906559429682e-06, - "loss": 2.2894, - "step": 559760 + "epoch": 0.53, + "learning_rate": 2.3657063512177363e-05, + "loss": 2.7467, + "step": 147600 }, { - "epoch": 0.98, - "learning_rate": 1.1914187160161413e-06, - "loss": 2.3549, - "step": 559770 + "epoch": 0.53, + "learning_rate": 2.3639215994231685e-05, + "loss": 2.7309, + "step": 147700 }, { - "epoch": 0.98, - "learning_rate": 1.1905467760893145e-06, - "loss": 2.1604, - "step": 559780 + "epoch": 0.53, + "learning_rate": 2.3621368476286006e-05, + "loss": 2.7259, + "step": 147800 }, { - "epoch": 0.98, - "learning_rate": 1.1896748361624878e-06, - "loss": 2.1888, - "step": 559790 + "epoch": 0.53, + "learning_rate": 2.3603520958340324e-05, + "loss": 2.7411, + "step": 147900 }, { - "epoch": 0.98, - "learning_rate": 1.188802896235661e-06, - "loss": 2.2956, - "step": 559800 + "epoch": 0.53, + "learning_rate": 2.3585673440394645e-05, + "loss": 2.731, + "step": 148000 }, { - "epoch": 0.98, - "learning_rate": 1.187930956308834e-06, - "loss": 2.2489, - "step": 559810 + "epoch": 0.53, + "learning_rate": 2.3567825922448966e-05, + "loss": 2.7355, + "step": 148100 }, { - "epoch": 0.98, - "learning_rate": 1.1870590163820074e-06, - "loss": 2.1996, - "step": 559820 + "epoch": 0.53, + "learning_rate": 2.3549978404503287e-05, + "loss": 2.7483, + "step": 148200 }, { - "epoch": 0.98, - "learning_rate": 1.1861870764551806e-06, - "loss": 2.292, - "step": 559830 + "epoch": 0.53, + "learning_rate": 2.353213088655761e-05, + "loss": 2.7381, + "step": 148300 }, { - "epoch": 0.98, - "learning_rate": 1.1853151365283537e-06, - "loss": 2.275, - "step": 559840 + "epoch": 0.53, + "learning_rate": 2.3514283368611926e-05, + "loss": 2.7356, + "step": 148400 }, { - "epoch": 0.98, - "learning_rate": 1.184443196601527e-06, - "loss": 2.3384, - "step": 559850 + "epoch": 0.53, + "learning_rate": 2.3496435850666248e-05, + "loss": 2.7512, + "step": 148500 }, { - "epoch": 0.98, - "learning_rate": 1.1835712566747002e-06, - "loss": 2.3103, - "step": 559860 + "epoch": 0.53, + "learning_rate": 2.347858833272057e-05, + "loss": 2.7407, + "step": 148600 }, { - "epoch": 0.98, - "learning_rate": 1.1826993167478733e-06, - "loss": 2.2746, - "step": 559870 + "epoch": 0.53, + "learning_rate": 2.346074081477489e-05, + "loss": 2.7338, + "step": 148700 }, { - "epoch": 0.98, - "learning_rate": 1.1818273768210465e-06, - "loss": 2.2354, - "step": 559880 + "epoch": 0.53, + "learning_rate": 2.344289329682921e-05, + "loss": 2.7281, + "step": 148800 }, { - "epoch": 0.98, - "learning_rate": 1.1809554368942198e-06, - "loss": 2.1509, - "step": 559890 + "epoch": 0.53, + "learning_rate": 2.3425045778883532e-05, + "loss": 2.7326, + "step": 148900 }, { - "epoch": 0.98, - "learning_rate": 1.180083496967393e-06, - "loss": 2.2359, - "step": 559900 + "epoch": 0.53, + "learning_rate": 2.340719826093785e-05, + "loss": 2.7227, + "step": 149000 }, { - "epoch": 0.98, - "learning_rate": 1.179211557040566e-06, - "loss": 2.2744, - "step": 559910 + "epoch": 0.53, + "learning_rate": 2.338935074299217e-05, + "loss": 2.7437, + "step": 149100 }, { - "epoch": 0.98, - "learning_rate": 1.1783396171137394e-06, - "loss": 2.2434, - "step": 559920 + "epoch": 0.53, + "learning_rate": 2.3371503225046493e-05, + "loss": 2.739, + "step": 149200 }, { - "epoch": 0.98, - "learning_rate": 1.1774676771869125e-06, - "loss": 2.3005, - "step": 559930 + "epoch": 0.53, + "learning_rate": 2.3353655707100814e-05, + "loss": 2.7323, + "step": 149300 }, { - "epoch": 0.98, - "learning_rate": 1.1765957372600857e-06, - "loss": 2.1885, - "step": 559940 + "epoch": 0.53, + "learning_rate": 2.3335808189155135e-05, + "loss": 2.7362, + "step": 149400 }, { - "epoch": 0.98, - "learning_rate": 1.175723797333259e-06, - "loss": 2.2272, - "step": 559950 + "epoch": 0.53, + "learning_rate": 2.3317960671209456e-05, + "loss": 2.7386, + "step": 149500 }, { - "epoch": 0.98, - "learning_rate": 1.1748518574064322e-06, - "loss": 2.2666, - "step": 559960 + "epoch": 0.53, + "learning_rate": 2.3300113153263778e-05, + "loss": 2.7508, + "step": 149600 }, { - "epoch": 0.98, - "learning_rate": 1.1739799174796053e-06, - "loss": 2.2408, - "step": 559970 + "epoch": 0.53, + "learning_rate": 2.32822656353181e-05, + "loss": 2.7415, + "step": 149700 }, { - "epoch": 0.98, - "learning_rate": 1.1731079775527784e-06, - "loss": 2.2886, - "step": 559980 + "epoch": 0.53, + "learning_rate": 2.326441811737242e-05, + "loss": 2.7551, + "step": 149800 }, { - "epoch": 0.98, - "learning_rate": 1.1722360376259518e-06, - "loss": 2.1221, - "step": 559990 + "epoch": 0.54, + "learning_rate": 2.324657059942674e-05, + "loss": 2.7312, + "step": 149900 }, { - "epoch": 0.98, - "learning_rate": 1.171364097699125e-06, - "loss": 2.2362, - "step": 560000 + "epoch": 0.54, + "learning_rate": 2.322872308148106e-05, + "loss": 2.7526, + "step": 150000 }, { - "epoch": 0.98, - "learning_rate": 1.170492157772298e-06, - "loss": 2.2836, - "step": 560010 + "epoch": 0.54, + "learning_rate": 2.321087556353538e-05, + "loss": 2.7379, + "step": 150100 }, { - "epoch": 0.98, - "learning_rate": 1.1696202178454714e-06, - "loss": 2.2937, - "step": 560020 + "epoch": 0.54, + "learning_rate": 2.31930280455897e-05, + "loss": 2.7416, + "step": 150200 }, { - "epoch": 0.98, - "learning_rate": 1.1687482779186445e-06, - "loss": 2.2424, - "step": 560030 + "epoch": 0.54, + "learning_rate": 2.3175180527644023e-05, + "loss": 2.7331, + "step": 150300 }, { - "epoch": 0.98, - "learning_rate": 1.1678763379918177e-06, - "loss": 2.3813, - "step": 560040 + "epoch": 0.54, + "learning_rate": 2.3157333009698344e-05, + "loss": 2.7272, + "step": 150400 }, { - "epoch": 0.98, - "learning_rate": 1.167004398064991e-06, - "loss": 2.1948, - "step": 560050 + "epoch": 0.54, + "learning_rate": 2.3139485491752662e-05, + "loss": 2.7433, + "step": 150500 }, { - "epoch": 0.98, - "learning_rate": 1.1661324581381641e-06, - "loss": 2.2482, - "step": 560060 + "epoch": 0.54, + "learning_rate": 2.3121637973806983e-05, + "loss": 2.7358, + "step": 150600 }, { - "epoch": 0.98, - "learning_rate": 1.1652605182113373e-06, - "loss": 2.2512, - "step": 560070 + "epoch": 0.54, + "learning_rate": 2.3103790455861304e-05, + "loss": 2.7218, + "step": 150700 }, { - "epoch": 0.98, - "learning_rate": 1.1643885782845104e-06, - "loss": 2.3467, - "step": 560080 + "epoch": 0.54, + "learning_rate": 2.3085942937915625e-05, + "loss": 2.73, + "step": 150800 }, { - "epoch": 0.98, - "learning_rate": 1.1635166383576838e-06, - "loss": 2.1642, - "step": 560090 + "epoch": 0.54, + "learning_rate": 2.3068095419969947e-05, + "loss": 2.734, + "step": 150900 }, { - "epoch": 0.98, - "learning_rate": 1.162644698430857e-06, - "loss": 2.2601, - "step": 560100 + "epoch": 0.54, + "learning_rate": 2.3050247902024268e-05, + "loss": 2.7469, + "step": 151000 }, { - "epoch": 0.98, - "learning_rate": 1.16177275850403e-06, - "loss": 2.1966, - "step": 560110 + "epoch": 0.54, + "learning_rate": 2.3032400384078586e-05, + "loss": 2.7356, + "step": 151100 }, { - "epoch": 0.98, - "learning_rate": 1.1609008185772034e-06, - "loss": 2.1497, - "step": 560120 + "epoch": 0.54, + "learning_rate": 2.3014552866132907e-05, + "loss": 2.7421, + "step": 151200 }, { - "epoch": 0.98, - "learning_rate": 1.1600288786503765e-06, - "loss": 2.1988, - "step": 560130 + "epoch": 0.54, + "learning_rate": 2.2996705348187228e-05, + "loss": 2.7388, + "step": 151300 }, { - "epoch": 0.98, - "learning_rate": 1.1591569387235496e-06, - "loss": 2.2529, - "step": 560140 + "epoch": 0.54, + "learning_rate": 2.297885783024155e-05, + "loss": 2.7337, + "step": 151400 }, { - "epoch": 0.98, - "learning_rate": 1.158284998796723e-06, - "loss": 2.1327, - "step": 560150 + "epoch": 0.54, + "learning_rate": 2.296101031229587e-05, + "loss": 2.74, + "step": 151500 }, { - "epoch": 0.98, - "learning_rate": 1.1574130588698961e-06, - "loss": 2.3862, - "step": 560160 + "epoch": 0.54, + "learning_rate": 2.294316279435019e-05, + "loss": 2.7336, + "step": 151600 }, { - "epoch": 0.98, - "learning_rate": 1.1565411189430693e-06, - "loss": 2.2971, - "step": 560170 + "epoch": 0.54, + "learning_rate": 2.292531527640451e-05, + "loss": 2.7438, + "step": 151700 }, { - "epoch": 0.98, - "learning_rate": 1.1556691790162424e-06, - "loss": 2.2394, - "step": 560180 + "epoch": 0.54, + "learning_rate": 2.290746775845883e-05, + "loss": 2.7376, + "step": 151800 }, { - "epoch": 0.98, - "learning_rate": 1.1547972390894157e-06, - "loss": 2.2354, - "step": 560190 + "epoch": 0.54, + "learning_rate": 2.2889620240513152e-05, + "loss": 2.7321, + "step": 151900 }, { - "epoch": 0.98, - "learning_rate": 1.1539252991625889e-06, - "loss": 2.1403, - "step": 560200 + "epoch": 0.54, + "learning_rate": 2.2871772722567477e-05, + "loss": 2.7423, + "step": 152000 }, { - "epoch": 0.98, - "learning_rate": 1.153053359235762e-06, - "loss": 2.2891, - "step": 560210 + "epoch": 0.54, + "learning_rate": 2.2853925204621794e-05, + "loss": 2.7312, + "step": 152100 }, { - "epoch": 0.98, - "learning_rate": 1.1521814193089354e-06, - "loss": 2.2835, - "step": 560220 + "epoch": 0.54, + "learning_rate": 2.2836077686676116e-05, + "loss": 2.7442, + "step": 152200 }, { - "epoch": 0.98, - "learning_rate": 1.1513094793821085e-06, - "loss": 2.2729, - "step": 560230 + "epoch": 0.54, + "learning_rate": 2.2818230168730437e-05, + "loss": 2.7308, + "step": 152300 }, { - "epoch": 0.98, - "learning_rate": 1.1504375394552816e-06, - "loss": 2.3164, - "step": 560240 + "epoch": 0.54, + "learning_rate": 2.2800382650784758e-05, + "loss": 2.7277, + "step": 152400 }, { - "epoch": 0.98, - "learning_rate": 1.149565599528455e-06, - "loss": 2.1026, - "step": 560250 + "epoch": 0.54, + "learning_rate": 2.278253513283908e-05, + "loss": 2.7335, + "step": 152500 }, { - "epoch": 0.98, - "learning_rate": 1.1486936596016281e-06, - "loss": 2.2854, - "step": 560260 + "epoch": 0.54, + "learning_rate": 2.2764687614893397e-05, + "loss": 2.7382, + "step": 152600 }, { - "epoch": 0.98, - "learning_rate": 1.1478217196748012e-06, - "loss": 2.2539, - "step": 560270 + "epoch": 0.55, + "learning_rate": 2.2746840096947718e-05, + "loss": 2.7324, + "step": 152700 }, { - "epoch": 0.98, - "learning_rate": 1.1469497797479744e-06, - "loss": 2.1666, - "step": 560280 + "epoch": 0.55, + "learning_rate": 2.272899257900204e-05, + "loss": 2.7361, + "step": 152800 }, { - "epoch": 0.98, - "learning_rate": 1.1460778398211477e-06, - "loss": 2.2243, - "step": 560290 + "epoch": 0.55, + "learning_rate": 2.271114506105636e-05, + "loss": 2.7301, + "step": 152900 }, { - "epoch": 0.98, - "learning_rate": 1.1452058998943209e-06, - "loss": 2.3096, - "step": 560300 + "epoch": 0.55, + "learning_rate": 2.2693297543110682e-05, + "loss": 2.7327, + "step": 153000 }, { - "epoch": 0.98, - "learning_rate": 1.144333959967494e-06, - "loss": 2.2344, - "step": 560310 + "epoch": 0.55, + "learning_rate": 2.2675450025165003e-05, + "loss": 2.7254, + "step": 153100 }, { - "epoch": 0.98, - "learning_rate": 1.1434620200406673e-06, - "loss": 2.1954, - "step": 560320 + "epoch": 0.55, + "learning_rate": 2.265760250721932e-05, + "loss": 2.7393, + "step": 153200 }, { - "epoch": 0.98, - "learning_rate": 1.1425900801138405e-06, - "loss": 2.2445, - "step": 560330 + "epoch": 0.55, + "learning_rate": 2.2639754989273642e-05, + "loss": 2.7282, + "step": 153300 }, { - "epoch": 0.98, - "learning_rate": 1.1417181401870136e-06, - "loss": 2.1848, - "step": 560340 + "epoch": 0.55, + "learning_rate": 2.2621907471327963e-05, + "loss": 2.7323, + "step": 153400 }, { - "epoch": 0.98, - "learning_rate": 1.140846200260187e-06, - "loss": 2.364, - "step": 560350 + "epoch": 0.55, + "learning_rate": 2.2604059953382285e-05, + "loss": 2.7472, + "step": 153500 }, { - "epoch": 0.98, - "learning_rate": 1.13997426033336e-06, - "loss": 2.2378, - "step": 560360 + "epoch": 0.55, + "learning_rate": 2.2586212435436606e-05, + "loss": 2.7348, + "step": 153600 }, { - "epoch": 0.98, - "learning_rate": 1.1391023204065332e-06, - "loss": 2.3023, - "step": 560370 + "epoch": 0.55, + "learning_rate": 2.2568364917490924e-05, + "loss": 2.7405, + "step": 153700 }, { - "epoch": 0.98, - "learning_rate": 1.1382303804797064e-06, - "loss": 2.2514, - "step": 560380 + "epoch": 0.55, + "learning_rate": 2.2550517399545245e-05, + "loss": 2.7285, + "step": 153800 }, { - "epoch": 0.98, - "learning_rate": 1.1373584405528797e-06, - "loss": 2.2346, - "step": 560390 + "epoch": 0.55, + "learning_rate": 2.2532669881599566e-05, + "loss": 2.7314, + "step": 153900 }, { - "epoch": 0.98, - "learning_rate": 1.1364865006260528e-06, - "loss": 2.212, - "step": 560400 + "epoch": 0.55, + "learning_rate": 2.2514822363653887e-05, + "loss": 2.737, + "step": 154000 }, { - "epoch": 0.98, - "learning_rate": 1.135614560699226e-06, - "loss": 2.2476, - "step": 560410 + "epoch": 0.55, + "learning_rate": 2.249697484570821e-05, + "loss": 2.7351, + "step": 154100 }, { - "epoch": 0.98, - "learning_rate": 1.1347426207723993e-06, - "loss": 2.2794, - "step": 560420 + "epoch": 0.55, + "learning_rate": 2.247912732776253e-05, + "loss": 2.7373, + "step": 154200 }, { - "epoch": 0.98, - "learning_rate": 1.1338706808455725e-06, - "loss": 2.3437, - "step": 560430 + "epoch": 0.55, + "learning_rate": 2.2461279809816848e-05, + "loss": 2.7375, + "step": 154300 }, { - "epoch": 0.98, - "learning_rate": 1.1329987409187456e-06, - "loss": 2.1432, - "step": 560440 + "epoch": 0.55, + "learning_rate": 2.244343229187117e-05, + "loss": 2.7319, + "step": 154400 }, { - "epoch": 0.98, - "learning_rate": 1.132126800991919e-06, - "loss": 2.1399, - "step": 560450 + "epoch": 0.55, + "learning_rate": 2.2425584773925493e-05, + "loss": 2.7364, + "step": 154500 }, { - "epoch": 0.98, - "learning_rate": 1.131254861065092e-06, - "loss": 2.2166, - "step": 560460 + "epoch": 0.55, + "learning_rate": 2.2407737255979815e-05, + "loss": 2.74, + "step": 154600 }, { - "epoch": 0.98, - "learning_rate": 1.1303829211382652e-06, - "loss": 2.2856, - "step": 560470 + "epoch": 0.55, + "learning_rate": 2.2389889738034132e-05, + "loss": 2.7392, + "step": 154700 }, { - "epoch": 0.98, - "learning_rate": 1.1295109812114383e-06, - "loss": 2.2547, - "step": 560480 + "epoch": 0.55, + "learning_rate": 2.2372042220088454e-05, + "loss": 2.7344, + "step": 154800 }, { - "epoch": 0.98, - "learning_rate": 1.1286390412846117e-06, - "loss": 2.278, - "step": 560490 + "epoch": 0.55, + "learning_rate": 2.2354194702142775e-05, + "loss": 2.7385, + "step": 154900 }, { - "epoch": 0.98, - "learning_rate": 1.1277671013577848e-06, - "loss": 2.2243, - "step": 560500 + "epoch": 0.55, + "learning_rate": 2.2336347184197096e-05, + "loss": 2.7381, + "step": 155000 }, { - "epoch": 0.98, - "learning_rate": 1.126895161430958e-06, - "loss": 2.3362, - "step": 560510 + "epoch": 0.55, + "learning_rate": 2.2318499666251417e-05, + "loss": 2.7338, + "step": 155100 }, { - "epoch": 0.98, - "learning_rate": 1.1260232215041313e-06, - "loss": 2.3506, - "step": 560520 + "epoch": 0.55, + "learning_rate": 2.2300652148305735e-05, + "loss": 2.735, + "step": 155200 }, { - "epoch": 0.98, - "learning_rate": 1.1251512815773044e-06, - "loss": 2.2223, - "step": 560530 + "epoch": 0.55, + "learning_rate": 2.2282804630360056e-05, + "loss": 2.7421, + "step": 155300 }, { - "epoch": 0.98, - "learning_rate": 1.1242793416504776e-06, - "loss": 2.2848, - "step": 560540 + "epoch": 0.55, + "learning_rate": 2.2264957112414378e-05, + "loss": 2.7342, + "step": 155400 }, { - "epoch": 0.98, - "learning_rate": 1.123407401723651e-06, - "loss": 2.2239, - "step": 560550 + "epoch": 0.56, + "learning_rate": 2.22471095944687e-05, + "loss": 2.7246, + "step": 155500 }, { - "epoch": 0.98, - "learning_rate": 1.122535461796824e-06, - "loss": 2.1378, - "step": 560560 + "epoch": 0.56, + "learning_rate": 2.222926207652302e-05, + "loss": 2.7373, + "step": 155600 }, { - "epoch": 0.98, - "learning_rate": 1.1216635218699972e-06, - "loss": 2.3284, - "step": 560570 + "epoch": 0.56, + "learning_rate": 2.221141455857734e-05, + "loss": 2.7279, + "step": 155700 }, { - "epoch": 0.98, - "learning_rate": 1.1207915819431703e-06, - "loss": 2.2218, - "step": 560580 + "epoch": 0.56, + "learning_rate": 2.219356704063166e-05, + "loss": 2.7401, + "step": 155800 }, { - "epoch": 0.98, - "learning_rate": 1.1199196420163437e-06, - "loss": 2.3705, - "step": 560590 + "epoch": 0.56, + "learning_rate": 2.217571952268598e-05, + "loss": 2.7328, + "step": 155900 }, { - "epoch": 0.98, - "learning_rate": 1.1190477020895168e-06, - "loss": 2.2129, - "step": 560600 + "epoch": 0.56, + "learning_rate": 2.21578720047403e-05, + "loss": 2.7382, + "step": 156000 }, { - "epoch": 0.98, - "learning_rate": 1.11817576216269e-06, - "loss": 2.2863, - "step": 560610 + "epoch": 0.56, + "learning_rate": 2.2140024486794623e-05, + "loss": 2.7401, + "step": 156100 }, { - "epoch": 0.98, - "learning_rate": 1.1173038222358633e-06, - "loss": 2.3711, - "step": 560620 + "epoch": 0.56, + "learning_rate": 2.2122176968848944e-05, + "loss": 2.7447, + "step": 156200 }, { - "epoch": 0.98, - "learning_rate": 1.1164318823090364e-06, - "loss": 2.2838, - "step": 560630 + "epoch": 0.56, + "learning_rate": 2.2104329450903262e-05, + "loss": 2.7364, + "step": 156300 }, { - "epoch": 0.98, - "learning_rate": 1.1155599423822096e-06, - "loss": 2.3096, - "step": 560640 + "epoch": 0.56, + "learning_rate": 2.2086481932957583e-05, + "loss": 2.7355, + "step": 156400 }, { - "epoch": 0.98, - "learning_rate": 1.114688002455383e-06, - "loss": 2.1327, - "step": 560650 + "epoch": 0.56, + "learning_rate": 2.2068634415011904e-05, + "loss": 2.7373, + "step": 156500 }, { - "epoch": 0.98, - "learning_rate": 1.113816062528556e-06, - "loss": 2.1761, - "step": 560660 + "epoch": 0.56, + "learning_rate": 2.2050786897066225e-05, + "loss": 2.7383, + "step": 156600 }, { - "epoch": 0.98, - "learning_rate": 1.1129441226017292e-06, - "loss": 2.2696, - "step": 560670 + "epoch": 0.56, + "learning_rate": 2.2032939379120547e-05, + "loss": 2.7296, + "step": 156700 }, { - "epoch": 0.98, - "learning_rate": 1.1120721826749023e-06, - "loss": 2.2596, - "step": 560680 + "epoch": 0.56, + "learning_rate": 2.2015091861174868e-05, + "loss": 2.742, + "step": 156800 }, { - "epoch": 0.98, - "learning_rate": 1.1112002427480757e-06, - "loss": 2.1831, - "step": 560690 + "epoch": 0.56, + "learning_rate": 2.1997244343229186e-05, + "loss": 2.7389, + "step": 156900 }, { - "epoch": 0.98, - "learning_rate": 1.1103283028212488e-06, - "loss": 2.2795, - "step": 560700 + "epoch": 0.56, + "learning_rate": 2.1979396825283507e-05, + "loss": 2.7347, + "step": 157000 }, { - "epoch": 0.98, - "learning_rate": 1.109456362894422e-06, - "loss": 2.2092, - "step": 560710 + "epoch": 0.56, + "learning_rate": 2.196154930733783e-05, + "loss": 2.7319, + "step": 157100 }, { - "epoch": 0.98, - "learning_rate": 1.1085844229675953e-06, - "loss": 2.206, - "step": 560720 + "epoch": 0.56, + "learning_rate": 2.1943701789392153e-05, + "loss": 2.7376, + "step": 157200 }, { - "epoch": 0.98, - "learning_rate": 1.1077124830407684e-06, - "loss": 2.32, - "step": 560730 + "epoch": 0.56, + "learning_rate": 2.192585427144647e-05, + "loss": 2.7379, + "step": 157300 }, { - "epoch": 0.98, - "learning_rate": 1.1068405431139415e-06, - "loss": 2.3078, - "step": 560740 + "epoch": 0.56, + "learning_rate": 2.190800675350079e-05, + "loss": 2.7259, + "step": 157400 }, { - "epoch": 0.98, - "learning_rate": 1.1059686031871149e-06, - "loss": 2.342, - "step": 560750 + "epoch": 0.56, + "learning_rate": 2.1890159235555113e-05, + "loss": 2.7286, + "step": 157500 }, { - "epoch": 0.98, - "learning_rate": 1.105096663260288e-06, - "loss": 2.2596, - "step": 560760 + "epoch": 0.56, + "learning_rate": 2.1872311717609434e-05, + "loss": 2.7355, + "step": 157600 }, { - "epoch": 0.98, - "learning_rate": 1.1042247233334612e-06, - "loss": 2.3602, - "step": 560770 + "epoch": 0.56, + "learning_rate": 2.1854464199663755e-05, + "loss": 2.7356, + "step": 157700 }, { - "epoch": 0.98, - "learning_rate": 1.1033527834066343e-06, - "loss": 2.2678, - "step": 560780 + "epoch": 0.56, + "learning_rate": 2.1836616681718077e-05, + "loss": 2.74, + "step": 157800 }, { - "epoch": 0.98, - "learning_rate": 1.1024808434798076e-06, - "loss": 2.2437, - "step": 560790 + "epoch": 0.56, + "learning_rate": 2.1818769163772394e-05, + "loss": 2.7324, + "step": 157900 }, { - "epoch": 0.98, - "learning_rate": 1.1016089035529808e-06, - "loss": 2.2969, - "step": 560800 + "epoch": 0.56, + "learning_rate": 2.1800921645826716e-05, + "loss": 2.7417, + "step": 158000 }, { - "epoch": 0.98, - "learning_rate": 1.100736963626154e-06, - "loss": 2.1401, - "step": 560810 + "epoch": 0.56, + "learning_rate": 2.1783074127881037e-05, + "loss": 2.7372, + "step": 158100 }, { - "epoch": 0.98, - "learning_rate": 1.0998650236993272e-06, - "loss": 2.2128, - "step": 560820 + "epoch": 0.56, + "learning_rate": 2.1765226609935358e-05, + "loss": 2.7353, + "step": 158200 }, { - "epoch": 0.98, - "learning_rate": 1.0989930837725004e-06, - "loss": 2.2287, - "step": 560830 + "epoch": 0.57, + "learning_rate": 2.174737909198968e-05, + "loss": 2.7333, + "step": 158300 }, { - "epoch": 0.98, - "learning_rate": 1.0981211438456735e-06, - "loss": 2.1963, - "step": 560840 + "epoch": 0.57, + "learning_rate": 2.1729531574043997e-05, + "loss": 2.7282, + "step": 158400 }, { - "epoch": 0.98, - "learning_rate": 1.0972492039188469e-06, - "loss": 2.1909, - "step": 560850 + "epoch": 0.57, + "learning_rate": 2.1711684056098318e-05, + "loss": 2.7233, + "step": 158500 }, { - "epoch": 0.98, - "learning_rate": 1.09637726399202e-06, - "loss": 2.3629, - "step": 560860 + "epoch": 0.57, + "learning_rate": 2.169383653815264e-05, + "loss": 2.7364, + "step": 158600 }, { - "epoch": 0.98, - "learning_rate": 1.0955053240651931e-06, - "loss": 2.3116, - "step": 560870 + "epoch": 0.57, + "learning_rate": 2.167598902020696e-05, + "loss": 2.7266, + "step": 158700 }, { - "epoch": 0.98, - "learning_rate": 1.0946333841383663e-06, - "loss": 2.1741, - "step": 560880 + "epoch": 0.57, + "learning_rate": 2.1658141502261282e-05, + "loss": 2.7387, + "step": 158800 }, { - "epoch": 0.98, - "learning_rate": 1.0937614442115396e-06, - "loss": 2.1977, - "step": 560890 + "epoch": 0.57, + "learning_rate": 2.1640293984315603e-05, + "loss": 2.7276, + "step": 158900 }, { - "epoch": 0.98, - "learning_rate": 1.0928895042847127e-06, - "loss": 2.2809, - "step": 560900 + "epoch": 0.57, + "learning_rate": 2.162244646636992e-05, + "loss": 2.731, + "step": 159000 }, { - "epoch": 0.98, - "learning_rate": 1.0920175643578859e-06, - "loss": 2.1329, - "step": 560910 + "epoch": 0.57, + "learning_rate": 2.1604598948424242e-05, + "loss": 2.7318, + "step": 159100 }, { - "epoch": 0.98, - "learning_rate": 1.0911456244310592e-06, - "loss": 2.3361, - "step": 560920 + "epoch": 0.57, + "learning_rate": 2.1586751430478563e-05, + "loss": 2.7236, + "step": 159200 }, { - "epoch": 0.98, - "learning_rate": 1.0902736845042324e-06, - "loss": 2.1677, - "step": 560930 + "epoch": 0.57, + "learning_rate": 2.1568903912532885e-05, + "loss": 2.7312, + "step": 159300 }, { - "epoch": 0.98, - "learning_rate": 1.0894017445774055e-06, - "loss": 2.1659, - "step": 560940 + "epoch": 0.57, + "learning_rate": 2.1551056394587206e-05, + "loss": 2.731, + "step": 159400 }, { - "epoch": 0.98, - "learning_rate": 1.0885298046505788e-06, - "loss": 2.2684, - "step": 560950 + "epoch": 0.57, + "learning_rate": 2.1533208876641524e-05, + "loss": 2.731, + "step": 159500 }, { - "epoch": 0.98, - "learning_rate": 1.087657864723752e-06, - "loss": 2.3013, - "step": 560960 + "epoch": 0.57, + "learning_rate": 2.1515361358695848e-05, + "loss": 2.7295, + "step": 159600 }, { - "epoch": 0.98, - "learning_rate": 1.0867859247969251e-06, - "loss": 2.3516, - "step": 560970 + "epoch": 0.57, + "learning_rate": 2.149751384075017e-05, + "loss": 2.7353, + "step": 159700 }, { - "epoch": 0.98, - "learning_rate": 1.0859139848700985e-06, - "loss": 2.3725, - "step": 560980 + "epoch": 0.57, + "learning_rate": 2.147966632280449e-05, + "loss": 2.7237, + "step": 159800 }, { - "epoch": 0.98, - "learning_rate": 1.0850420449432716e-06, - "loss": 2.2086, - "step": 560990 + "epoch": 0.57, + "learning_rate": 2.1461818804858812e-05, + "loss": 2.7234, + "step": 159900 }, { - "epoch": 0.98, - "learning_rate": 1.0841701050164447e-06, - "loss": 2.3558, - "step": 561000 + "epoch": 0.57, + "learning_rate": 2.144397128691313e-05, + "loss": 2.7391, + "step": 160000 }, { - "epoch": 0.98, - "learning_rate": 1.0832981650896179e-06, - "loss": 2.3488, - "step": 561010 + "epoch": 0.57, + "learning_rate": 2.142612376896745e-05, + "loss": 2.7354, + "step": 160100 }, { - "epoch": 0.98, - "learning_rate": 1.0824262251627912e-06, - "loss": 2.2939, - "step": 561020 + "epoch": 0.57, + "learning_rate": 2.1408276251021772e-05, + "loss": 2.7322, + "step": 160200 }, { - "epoch": 0.98, - "learning_rate": 1.0815542852359643e-06, - "loss": 2.1998, - "step": 561030 + "epoch": 0.57, + "learning_rate": 2.1390428733076093e-05, + "loss": 2.734, + "step": 160300 }, { - "epoch": 0.98, - "learning_rate": 1.0806823453091375e-06, - "loss": 2.3013, - "step": 561040 + "epoch": 0.57, + "learning_rate": 2.1372581215130415e-05, + "loss": 2.7288, + "step": 160400 }, { - "epoch": 0.98, - "learning_rate": 1.0798104053823108e-06, - "loss": 2.2287, - "step": 561050 + "epoch": 0.57, + "learning_rate": 2.1354733697184732e-05, + "loss": 2.7248, + "step": 160500 }, { - "epoch": 0.98, - "learning_rate": 1.078938465455484e-06, - "loss": 2.2175, - "step": 561060 + "epoch": 0.57, + "learning_rate": 2.1336886179239054e-05, + "loss": 2.7324, + "step": 160600 }, { - "epoch": 0.98, - "learning_rate": 1.078066525528657e-06, - "loss": 2.279, - "step": 561070 + "epoch": 0.57, + "learning_rate": 2.1319038661293375e-05, + "loss": 2.7315, + "step": 160700 }, { - "epoch": 0.98, - "learning_rate": 1.0771945856018304e-06, - "loss": 2.207, - "step": 561080 + "epoch": 0.57, + "learning_rate": 2.1301191143347696e-05, + "loss": 2.7247, + "step": 160800 }, { - "epoch": 0.98, - "learning_rate": 1.0763226456750036e-06, - "loss": 2.2057, - "step": 561090 + "epoch": 0.57, + "learning_rate": 2.1283343625402017e-05, + "loss": 2.7203, + "step": 160900 }, { - "epoch": 0.98, - "learning_rate": 1.0754507057481767e-06, - "loss": 2.3825, - "step": 561100 + "epoch": 0.57, + "learning_rate": 2.126549610745634e-05, + "loss": 2.7303, + "step": 161000 }, { - "epoch": 0.98, - "learning_rate": 1.07457876582135e-06, - "loss": 2.2906, - "step": 561110 + "epoch": 0.58, + "learning_rate": 2.1247648589510656e-05, + "loss": 2.7359, + "step": 161100 }, { - "epoch": 0.98, - "learning_rate": 1.0737068258945232e-06, - "loss": 2.2422, - "step": 561120 + "epoch": 0.58, + "learning_rate": 2.1229801071564978e-05, + "loss": 2.7361, + "step": 161200 }, { - "epoch": 0.98, - "learning_rate": 1.0728348859676963e-06, - "loss": 2.2374, - "step": 561130 + "epoch": 0.58, + "learning_rate": 2.12119535536193e-05, + "loss": 2.7247, + "step": 161300 }, { - "epoch": 0.98, - "learning_rate": 1.0719629460408695e-06, - "loss": 2.1227, - "step": 561140 + "epoch": 0.58, + "learning_rate": 2.119410603567362e-05, + "loss": 2.7246, + "step": 161400 }, { - "epoch": 0.98, - "learning_rate": 1.0710910061140428e-06, - "loss": 2.3305, - "step": 561150 + "epoch": 0.58, + "learning_rate": 2.117625851772794e-05, + "loss": 2.7382, + "step": 161500 }, { - "epoch": 0.98, - "learning_rate": 1.070219066187216e-06, - "loss": 2.3062, - "step": 561160 + "epoch": 0.58, + "learning_rate": 2.115841099978226e-05, + "loss": 2.7319, + "step": 161600 }, { - "epoch": 0.98, - "learning_rate": 1.069347126260389e-06, - "loss": 2.375, - "step": 561170 + "epoch": 0.58, + "learning_rate": 2.114056348183658e-05, + "loss": 2.7361, + "step": 161700 }, { - "epoch": 0.98, - "learning_rate": 1.0684751863335624e-06, - "loss": 2.3366, - "step": 561180 + "epoch": 0.58, + "learning_rate": 2.11227159638909e-05, + "loss": 2.7345, + "step": 161800 }, { - "epoch": 0.98, - "learning_rate": 1.0676032464067356e-06, - "loss": 2.1475, - "step": 561190 + "epoch": 0.58, + "learning_rate": 2.1104868445945223e-05, + "loss": 2.7344, + "step": 161900 }, { - "epoch": 0.98, - "learning_rate": 1.0667313064799087e-06, - "loss": 2.3217, - "step": 561200 + "epoch": 0.58, + "learning_rate": 2.1087020927999544e-05, + "loss": 2.7123, + "step": 162000 }, { - "epoch": 0.98, - "learning_rate": 1.065859366553082e-06, - "loss": 2.1556, - "step": 561210 + "epoch": 0.58, + "learning_rate": 2.1069173410053865e-05, + "loss": 2.7427, + "step": 162100 }, { - "epoch": 0.98, - "learning_rate": 1.0649874266262552e-06, - "loss": 2.2612, - "step": 561220 + "epoch": 0.58, + "learning_rate": 2.1051325892108186e-05, + "loss": 2.7383, + "step": 162200 }, { - "epoch": 0.98, - "learning_rate": 1.0641154866994283e-06, - "loss": 2.3734, - "step": 561230 + "epoch": 0.58, + "learning_rate": 2.1033478374162507e-05, + "loss": 2.7346, + "step": 162300 }, { - "epoch": 0.98, - "learning_rate": 1.0632435467726017e-06, - "loss": 2.2656, - "step": 561240 + "epoch": 0.58, + "learning_rate": 2.101563085621683e-05, + "loss": 2.7368, + "step": 162400 }, { - "epoch": 0.98, - "learning_rate": 1.0623716068457748e-06, - "loss": 2.2837, - "step": 561250 + "epoch": 0.58, + "learning_rate": 2.099778333827115e-05, + "loss": 2.7379, + "step": 162500 }, { - "epoch": 0.98, - "learning_rate": 1.061499666918948e-06, - "loss": 2.315, - "step": 561260 + "epoch": 0.58, + "learning_rate": 2.0979935820325468e-05, + "loss": 2.7412, + "step": 162600 }, { - "epoch": 0.98, - "learning_rate": 1.060627726992121e-06, - "loss": 2.1716, - "step": 561270 + "epoch": 0.58, + "learning_rate": 2.096208830237979e-05, + "loss": 2.7277, + "step": 162700 }, { - "epoch": 0.98, - "learning_rate": 1.0597557870652944e-06, - "loss": 2.2645, - "step": 561280 + "epoch": 0.58, + "learning_rate": 2.094424078443411e-05, + "loss": 2.7263, + "step": 162800 }, { - "epoch": 0.98, - "learning_rate": 1.0588838471384675e-06, - "loss": 2.2822, - "step": 561290 + "epoch": 0.58, + "learning_rate": 2.092639326648843e-05, + "loss": 2.743, + "step": 162900 }, { - "epoch": 0.98, - "learning_rate": 1.0580119072116407e-06, - "loss": 2.3514, - "step": 561300 + "epoch": 0.58, + "learning_rate": 2.0908545748542753e-05, + "loss": 2.7327, + "step": 163000 }, { - "epoch": 0.98, - "learning_rate": 1.057139967284814e-06, - "loss": 2.2571, - "step": 561310 + "epoch": 0.58, + "learning_rate": 2.0890698230597074e-05, + "loss": 2.7256, + "step": 163100 }, { - "epoch": 0.98, - "learning_rate": 1.0562680273579872e-06, - "loss": 2.2039, - "step": 561320 + "epoch": 0.58, + "learning_rate": 2.087285071265139e-05, + "loss": 2.7262, + "step": 163200 }, { - "epoch": 0.98, - "learning_rate": 1.0553960874311603e-06, - "loss": 2.2091, - "step": 561330 + "epoch": 0.58, + "learning_rate": 2.0855003194705713e-05, + "loss": 2.7296, + "step": 163300 }, { - "epoch": 0.98, - "learning_rate": 1.0545241475043336e-06, - "loss": 2.2877, - "step": 561340 + "epoch": 0.58, + "learning_rate": 2.0837155676760034e-05, + "loss": 2.7268, + "step": 163400 }, { - "epoch": 0.98, - "learning_rate": 1.0536522075775068e-06, - "loss": 2.2743, - "step": 561350 + "epoch": 0.58, + "learning_rate": 2.0819308158814355e-05, + "loss": 2.7389, + "step": 163500 }, { - "epoch": 0.98, - "learning_rate": 1.05278026765068e-06, - "loss": 2.2122, - "step": 561360 + "epoch": 0.58, + "learning_rate": 2.0801460640868677e-05, + "loss": 2.7382, + "step": 163600 }, { - "epoch": 0.98, - "learning_rate": 1.0519083277238533e-06, - "loss": 2.2259, - "step": 561370 + "epoch": 0.58, + "learning_rate": 2.0783613122922994e-05, + "loss": 2.7265, + "step": 163700 }, { - "epoch": 0.98, - "learning_rate": 1.0510363877970264e-06, - "loss": 2.1938, - "step": 561380 + "epoch": 0.58, + "learning_rate": 2.0765765604977316e-05, + "loss": 2.7362, + "step": 163800 }, { - "epoch": 0.98, - "learning_rate": 1.0501644478701995e-06, - "loss": 2.3835, - "step": 561390 + "epoch": 0.59, + "learning_rate": 2.0747918087031637e-05, + "loss": 2.7381, + "step": 163900 }, { - "epoch": 0.98, - "learning_rate": 1.0492925079433727e-06, - "loss": 2.235, - "step": 561400 + "epoch": 0.59, + "learning_rate": 2.0730070569085958e-05, + "loss": 2.7294, + "step": 164000 }, { - "epoch": 0.98, - "learning_rate": 1.048420568016546e-06, - "loss": 2.191, - "step": 561410 + "epoch": 0.59, + "learning_rate": 2.071222305114028e-05, + "loss": 2.734, + "step": 164100 }, { - "epoch": 0.98, - "learning_rate": 1.0475486280897191e-06, - "loss": 2.2837, - "step": 561420 + "epoch": 0.59, + "learning_rate": 2.06943755331946e-05, + "loss": 2.7334, + "step": 164200 }, { - "epoch": 0.98, - "learning_rate": 1.0466766881628923e-06, - "loss": 2.2419, - "step": 561430 + "epoch": 0.59, + "learning_rate": 2.0676528015248918e-05, + "loss": 2.7351, + "step": 164300 }, { - "epoch": 0.98, - "learning_rate": 1.0458047482360656e-06, - "loss": 2.2102, - "step": 561440 + "epoch": 0.59, + "learning_rate": 2.065868049730324e-05, + "loss": 2.7395, + "step": 164400 }, { - "epoch": 0.98, - "learning_rate": 1.0449328083092388e-06, - "loss": 2.2566, - "step": 561450 + "epoch": 0.59, + "learning_rate": 2.064083297935756e-05, + "loss": 2.7273, + "step": 164500 }, { - "epoch": 0.98, - "learning_rate": 1.0440608683824119e-06, - "loss": 2.2947, - "step": 561460 + "epoch": 0.59, + "learning_rate": 2.0622985461411882e-05, + "loss": 2.7393, + "step": 164600 }, { - "epoch": 0.98, - "learning_rate": 1.0431889284555852e-06, - "loss": 2.2382, - "step": 561470 + "epoch": 0.59, + "learning_rate": 2.0605137943466203e-05, + "loss": 2.7142, + "step": 164700 }, { - "epoch": 0.98, - "learning_rate": 1.0423169885287584e-06, - "loss": 2.226, - "step": 561480 + "epoch": 0.59, + "learning_rate": 2.0587290425520524e-05, + "loss": 2.7215, + "step": 164800 }, { - "epoch": 0.98, - "learning_rate": 1.0414450486019315e-06, - "loss": 2.2959, - "step": 561490 + "epoch": 0.59, + "learning_rate": 2.0569442907574846e-05, + "loss": 2.7487, + "step": 164900 }, { - "epoch": 0.98, - "learning_rate": 1.0405731086751049e-06, - "loss": 2.2731, - "step": 561500 + "epoch": 0.59, + "learning_rate": 2.0551595389629167e-05, + "loss": 2.7345, + "step": 165000 }, { - "epoch": 0.98, - "learning_rate": 1.039701168748278e-06, - "loss": 2.2655, - "step": 561510 + "epoch": 0.59, + "learning_rate": 2.0533747871683488e-05, + "loss": 2.7379, + "step": 165100 }, { - "epoch": 0.98, - "learning_rate": 1.0388292288214511e-06, - "loss": 2.2094, - "step": 561520 + "epoch": 0.59, + "learning_rate": 2.051590035373781e-05, + "loss": 2.7307, + "step": 165200 }, { - "epoch": 0.98, - "learning_rate": 1.0379572888946243e-06, - "loss": 2.2075, - "step": 561530 + "epoch": 0.59, + "learning_rate": 2.0498052835792127e-05, + "loss": 2.7303, + "step": 165300 }, { - "epoch": 0.98, - "learning_rate": 1.0370853489677976e-06, - "loss": 2.2398, - "step": 561540 + "epoch": 0.59, + "learning_rate": 2.0480205317846448e-05, + "loss": 2.7239, + "step": 165400 }, { - "epoch": 0.98, - "learning_rate": 1.0362134090409707e-06, - "loss": 2.3226, - "step": 561550 + "epoch": 0.59, + "learning_rate": 2.046235779990077e-05, + "loss": 2.7309, + "step": 165500 }, { - "epoch": 0.98, - "learning_rate": 1.0353414691141439e-06, - "loss": 2.2867, - "step": 561560 + "epoch": 0.59, + "learning_rate": 2.044451028195509e-05, + "loss": 2.7322, + "step": 165600 }, { - "epoch": 0.98, - "learning_rate": 1.0344695291873172e-06, - "loss": 2.2684, - "step": 561570 + "epoch": 0.59, + "learning_rate": 2.0426662764009412e-05, + "loss": 2.733, + "step": 165700 }, { - "epoch": 0.98, - "learning_rate": 1.0335975892604904e-06, - "loss": 2.2569, - "step": 561580 + "epoch": 0.59, + "learning_rate": 2.040881524606373e-05, + "loss": 2.7296, + "step": 165800 }, { - "epoch": 0.98, - "learning_rate": 1.0327256493336635e-06, - "loss": 2.2437, - "step": 561590 + "epoch": 0.59, + "learning_rate": 2.039096772811805e-05, + "loss": 2.7305, + "step": 165900 }, { - "epoch": 0.98, - "learning_rate": 1.0318537094068368e-06, - "loss": 2.2257, - "step": 561600 + "epoch": 0.59, + "learning_rate": 2.0373120210172372e-05, + "loss": 2.7323, + "step": 166000 }, { - "epoch": 0.98, - "learning_rate": 1.03098176948001e-06, - "loss": 2.2769, - "step": 561610 + "epoch": 0.59, + "learning_rate": 2.0355272692226693e-05, + "loss": 2.7186, + "step": 166100 }, { - "epoch": 0.98, - "learning_rate": 1.030109829553183e-06, - "loss": 2.3251, - "step": 561620 + "epoch": 0.59, + "learning_rate": 2.0337425174281015e-05, + "loss": 2.7257, + "step": 166200 }, { - "epoch": 0.98, - "learning_rate": 1.0292378896263564e-06, - "loss": 2.3117, - "step": 561630 + "epoch": 0.59, + "learning_rate": 2.0319577656335332e-05, + "loss": 2.724, + "step": 166300 }, { - "epoch": 0.98, - "learning_rate": 1.0283659496995296e-06, - "loss": 2.2348, - "step": 561640 + "epoch": 0.59, + "learning_rate": 2.0301730138389654e-05, + "loss": 2.744, + "step": 166400 }, { - "epoch": 0.98, - "learning_rate": 1.0274940097727027e-06, - "loss": 2.2728, - "step": 561650 + "epoch": 0.59, + "learning_rate": 2.0283882620443975e-05, + "loss": 2.7325, + "step": 166500 }, { - "epoch": 0.98, - "learning_rate": 1.026622069845876e-06, - "loss": 2.1051, - "step": 561660 + "epoch": 0.59, + "learning_rate": 2.0266035102498296e-05, + "loss": 2.7355, + "step": 166600 }, { - "epoch": 0.98, - "learning_rate": 1.0257501299190492e-06, - "loss": 2.214, - "step": 561670 + "epoch": 0.6, + "learning_rate": 2.0248187584552617e-05, + "loss": 2.7348, + "step": 166700 }, { - "epoch": 0.98, - "learning_rate": 1.0248781899922223e-06, - "loss": 2.2584, - "step": 561680 + "epoch": 0.6, + "learning_rate": 2.023034006660694e-05, + "loss": 2.7232, + "step": 166800 }, { - "epoch": 0.98, - "learning_rate": 1.0240062500653955e-06, - "loss": 2.1876, - "step": 561690 + "epoch": 0.6, + "learning_rate": 2.0212492548661256e-05, + "loss": 2.7342, + "step": 166900 }, { - "epoch": 0.98, - "learning_rate": 1.0231343101385688e-06, - "loss": 2.2276, - "step": 561700 + "epoch": 0.6, + "learning_rate": 2.0194645030715577e-05, + "loss": 2.736, + "step": 167000 }, { - "epoch": 0.98, - "learning_rate": 1.022262370211742e-06, - "loss": 2.3318, - "step": 561710 + "epoch": 0.6, + "learning_rate": 2.01767975127699e-05, + "loss": 2.7335, + "step": 167100 }, { - "epoch": 0.98, - "learning_rate": 1.021390430284915e-06, - "loss": 2.2341, - "step": 561720 + "epoch": 0.6, + "learning_rate": 2.015894999482422e-05, + "loss": 2.7272, + "step": 167200 }, { - "epoch": 0.98, - "learning_rate": 1.0205184903580884e-06, - "loss": 2.3171, - "step": 561730 + "epoch": 0.6, + "learning_rate": 2.014110247687854e-05, + "loss": 2.7345, + "step": 167300 }, { - "epoch": 0.98, - "learning_rate": 1.0196465504312616e-06, - "loss": 2.2509, - "step": 561740 + "epoch": 0.6, + "learning_rate": 2.0123254958932862e-05, + "loss": 2.7304, + "step": 167400 }, { - "epoch": 0.98, - "learning_rate": 1.0187746105044347e-06, - "loss": 2.42, - "step": 561750 + "epoch": 0.6, + "learning_rate": 2.0105407440987184e-05, + "loss": 2.7237, + "step": 167500 }, { - "epoch": 0.98, - "learning_rate": 1.017902670577608e-06, - "loss": 2.1528, - "step": 561760 + "epoch": 0.6, + "learning_rate": 2.0087559923041505e-05, + "loss": 2.7293, + "step": 167600 }, { - "epoch": 0.98, - "learning_rate": 1.0170307306507812e-06, - "loss": 2.2868, - "step": 561770 + "epoch": 0.6, + "learning_rate": 2.0069712405095826e-05, + "loss": 2.7264, + "step": 167700 }, { - "epoch": 0.98, - "learning_rate": 1.0161587907239543e-06, - "loss": 2.3448, - "step": 561780 + "epoch": 0.6, + "learning_rate": 2.0051864887150147e-05, + "loss": 2.7075, + "step": 167800 }, { - "epoch": 0.98, - "learning_rate": 1.0152868507971277e-06, - "loss": 2.2158, - "step": 561790 + "epoch": 0.6, + "learning_rate": 2.0034017369204465e-05, + "loss": 2.736, + "step": 167900 }, { - "epoch": 0.98, - "learning_rate": 1.0144149108703008e-06, - "loss": 2.2836, - "step": 561800 + "epoch": 0.6, + "learning_rate": 2.0016169851258786e-05, + "loss": 2.7302, + "step": 168000 }, { - "epoch": 0.98, - "learning_rate": 1.013542970943474e-06, - "loss": 2.4156, - "step": 561810 + "epoch": 0.6, + "learning_rate": 1.9998322333313107e-05, + "loss": 2.7386, + "step": 168100 }, { - "epoch": 0.98, - "learning_rate": 1.012671031016647e-06, - "loss": 2.2206, - "step": 561820 + "epoch": 0.6, + "learning_rate": 1.998047481536743e-05, + "loss": 2.7324, + "step": 168200 }, { - "epoch": 0.98, - "learning_rate": 1.0117990910898204e-06, - "loss": 2.1765, - "step": 561830 + "epoch": 0.6, + "learning_rate": 1.996262729742175e-05, + "loss": 2.7342, + "step": 168300 }, { - "epoch": 0.98, - "learning_rate": 1.0109271511629935e-06, - "loss": 2.231, - "step": 561840 + "epoch": 0.6, + "learning_rate": 1.9944779779476068e-05, + "loss": 2.7263, + "step": 168400 }, { - "epoch": 0.98, - "learning_rate": 1.0100552112361667e-06, - "loss": 2.274, - "step": 561850 + "epoch": 0.6, + "learning_rate": 1.992693226153039e-05, + "loss": 2.728, + "step": 168500 }, { - "epoch": 0.98, - "learning_rate": 1.00918327130934e-06, - "loss": 2.2393, - "step": 561860 + "epoch": 0.6, + "learning_rate": 1.990908474358471e-05, + "loss": 2.7226, + "step": 168600 }, { - "epoch": 0.98, - "learning_rate": 1.0083113313825132e-06, - "loss": 2.3253, - "step": 561870 + "epoch": 0.6, + "learning_rate": 1.989123722563903e-05, + "loss": 2.7231, + "step": 168700 }, { - "epoch": 0.98, - "learning_rate": 1.0074393914556863e-06, - "loss": 2.1912, - "step": 561880 + "epoch": 0.6, + "learning_rate": 1.9873389707693353e-05, + "loss": 2.7286, + "step": 168800 }, { - "epoch": 0.98, - "learning_rate": 1.0065674515288596e-06, - "loss": 2.2858, - "step": 561890 + "epoch": 0.6, + "learning_rate": 1.9855542189747674e-05, + "loss": 2.7298, + "step": 168900 }, { - "epoch": 0.98, - "learning_rate": 1.0056955116020328e-06, - "loss": 2.2749, - "step": 561900 + "epoch": 0.6, + "learning_rate": 1.983769467180199e-05, + "loss": 2.727, + "step": 169000 }, { - "epoch": 0.98, - "learning_rate": 1.004823571675206e-06, - "loss": 2.2418, - "step": 561910 + "epoch": 0.6, + "learning_rate": 1.9819847153856313e-05, + "loss": 2.728, + "step": 169100 }, { - "epoch": 0.98, - "learning_rate": 1.0039516317483793e-06, - "loss": 2.3366, - "step": 561920 + "epoch": 0.6, + "learning_rate": 1.9801999635910634e-05, + "loss": 2.7248, + "step": 169200 }, { - "epoch": 0.98, - "learning_rate": 1.0030796918215524e-06, - "loss": 2.2901, - "step": 561930 + "epoch": 0.6, + "learning_rate": 1.9784152117964955e-05, + "loss": 2.7209, + "step": 169300 }, { - "epoch": 0.98, - "learning_rate": 1.0022077518947255e-06, - "loss": 2.2997, - "step": 561940 + "epoch": 0.6, + "learning_rate": 1.9766304600019276e-05, + "loss": 2.7347, + "step": 169400 }, { - "epoch": 0.98, - "learning_rate": 1.0013358119678987e-06, - "loss": 2.3353, - "step": 561950 + "epoch": 0.61, + "learning_rate": 1.9748457082073594e-05, + "loss": 2.723, + "step": 169500 }, { - "epoch": 0.98, - "learning_rate": 1.000463872041072e-06, - "loss": 2.217, - "step": 561960 + "epoch": 0.61, + "learning_rate": 1.9730609564127916e-05, + "loss": 2.7269, + "step": 169600 }, { - "epoch": 0.98, - "learning_rate": 9.995919321142451e-07, - "loss": 2.3019, - "step": 561970 + "epoch": 0.61, + "learning_rate": 1.9712762046182237e-05, + "loss": 2.7281, + "step": 169700 }, { - "epoch": 0.98, - "learning_rate": 9.987199921874183e-07, - "loss": 2.2875, - "step": 561980 + "epoch": 0.61, + "learning_rate": 1.969491452823656e-05, + "loss": 2.7226, + "step": 169800 }, { - "epoch": 0.98, - "learning_rate": 9.978480522605916e-07, - "loss": 2.2951, - "step": 561990 + "epoch": 0.61, + "learning_rate": 1.9677067010290883e-05, + "loss": 2.7264, + "step": 169900 }, { - "epoch": 0.98, - "learning_rate": 9.969761123337648e-07, - "loss": 2.1514, - "step": 562000 + "epoch": 0.61, + "learning_rate": 1.96592194923452e-05, + "loss": 2.7239, + "step": 170000 }, { - "epoch": 0.98, - "learning_rate": 9.961041724069379e-07, - "loss": 2.264, - "step": 562010 + "epoch": 0.61, + "learning_rate": 1.964137197439952e-05, + "loss": 2.7346, + "step": 170100 }, { - "epoch": 0.98, - "learning_rate": 9.952322324801112e-07, - "loss": 2.2657, - "step": 562020 + "epoch": 0.61, + "learning_rate": 1.9623524456453843e-05, + "loss": 2.7238, + "step": 170200 }, { - "epoch": 0.98, - "learning_rate": 9.943602925532844e-07, - "loss": 2.3328, - "step": 562030 + "epoch": 0.61, + "learning_rate": 1.9605676938508164e-05, + "loss": 2.7189, + "step": 170300 }, { - "epoch": 0.98, - "learning_rate": 9.934883526264575e-07, - "loss": 2.3698, - "step": 562040 + "epoch": 0.61, + "learning_rate": 1.9587829420562485e-05, + "loss": 2.71, + "step": 170400 }, { - "epoch": 0.98, - "learning_rate": 9.926164126996309e-07, - "loss": 2.2118, - "step": 562050 + "epoch": 0.61, + "learning_rate": 1.9569981902616803e-05, + "loss": 2.7351, + "step": 170500 }, { - "epoch": 0.98, - "learning_rate": 9.91744472772804e-07, - "loss": 2.3477, - "step": 562060 + "epoch": 0.61, + "learning_rate": 1.9552134384671124e-05, + "loss": 2.7317, + "step": 170600 }, { - "epoch": 0.98, - "learning_rate": 9.908725328459771e-07, - "loss": 2.2331, - "step": 562070 + "epoch": 0.61, + "learning_rate": 1.9534286866725445e-05, + "loss": 2.7294, + "step": 170700 }, { - "epoch": 0.98, - "learning_rate": 9.900005929191503e-07, - "loss": 2.3357, - "step": 562080 + "epoch": 0.61, + "learning_rate": 1.9516439348779767e-05, + "loss": 2.7275, + "step": 170800 }, { - "epoch": 0.98, - "learning_rate": 9.891286529923236e-07, - "loss": 2.285, - "step": 562090 + "epoch": 0.61, + "learning_rate": 1.9498591830834088e-05, + "loss": 2.7257, + "step": 170900 }, { - "epoch": 0.98, - "learning_rate": 9.882567130654967e-07, - "loss": 2.3814, - "step": 562100 + "epoch": 0.61, + "learning_rate": 1.948074431288841e-05, + "loss": 2.7292, + "step": 171000 }, { - "epoch": 0.98, - "learning_rate": 9.873847731386699e-07, - "loss": 2.3199, - "step": 562110 + "epoch": 0.61, + "learning_rate": 1.9462896794942727e-05, + "loss": 2.7256, + "step": 171100 }, { - "epoch": 0.98, - "learning_rate": 9.865128332118432e-07, - "loss": 2.1881, - "step": 562120 + "epoch": 0.61, + "learning_rate": 1.9445049276997048e-05, + "loss": 2.7299, + "step": 171200 }, { - "epoch": 0.98, - "learning_rate": 9.856408932850164e-07, - "loss": 2.3348, - "step": 562130 + "epoch": 0.61, + "learning_rate": 1.942720175905137e-05, + "loss": 2.7187, + "step": 171300 }, { - "epoch": 0.98, - "learning_rate": 9.847689533581895e-07, - "loss": 2.349, - "step": 562140 + "epoch": 0.61, + "learning_rate": 1.940935424110569e-05, + "loss": 2.7382, + "step": 171400 }, { - "epoch": 0.98, - "learning_rate": 9.838970134313628e-07, - "loss": 2.2428, - "step": 562150 + "epoch": 0.61, + "learning_rate": 1.9391506723160012e-05, + "loss": 2.7323, + "step": 171500 }, { - "epoch": 0.98, - "learning_rate": 9.83025073504536e-07, - "loss": 2.2607, - "step": 562160 + "epoch": 0.61, + "learning_rate": 1.937365920521433e-05, + "loss": 2.7233, + "step": 171600 }, { - "epoch": 0.98, - "learning_rate": 9.821531335777091e-07, - "loss": 2.3305, - "step": 562170 + "epoch": 0.61, + "learning_rate": 1.935581168726865e-05, + "loss": 2.7148, + "step": 171700 }, { - "epoch": 0.98, - "learning_rate": 9.812811936508825e-07, - "loss": 2.3528, - "step": 562180 + "epoch": 0.61, + "learning_rate": 1.9337964169322972e-05, + "loss": 2.727, + "step": 171800 }, { - "epoch": 0.98, - "learning_rate": 9.804092537240556e-07, - "loss": 2.3714, - "step": 562190 + "epoch": 0.61, + "learning_rate": 1.9320116651377293e-05, + "loss": 2.731, + "step": 171900 }, { - "epoch": 0.98, - "learning_rate": 9.795373137972287e-07, - "loss": 2.331, - "step": 562200 + "epoch": 0.61, + "learning_rate": 1.9302269133431615e-05, + "loss": 2.7285, + "step": 172000 }, { - "epoch": 0.98, - "learning_rate": 9.786653738704019e-07, - "loss": 2.187, - "step": 562210 + "epoch": 0.61, + "learning_rate": 1.9284421615485936e-05, + "loss": 2.7351, + "step": 172100 }, { - "epoch": 0.98, - "learning_rate": 9.777934339435752e-07, - "loss": 2.3204, - "step": 562220 + "epoch": 0.61, + "learning_rate": 1.9266574097540254e-05, + "loss": 2.7242, + "step": 172200 }, { - "epoch": 0.98, - "learning_rate": 9.769214940167483e-07, - "loss": 2.2534, - "step": 562230 + "epoch": 0.62, + "learning_rate": 1.9248726579594575e-05, + "loss": 2.7252, + "step": 172300 }, { - "epoch": 0.98, - "learning_rate": 9.760495540899215e-07, - "loss": 2.1692, - "step": 562240 + "epoch": 0.62, + "learning_rate": 1.92308790616489e-05, + "loss": 2.7327, + "step": 172400 }, { - "epoch": 0.98, - "learning_rate": 9.751776141630948e-07, - "loss": 2.2021, - "step": 562250 + "epoch": 0.62, + "learning_rate": 1.921303154370322e-05, + "loss": 2.7288, + "step": 172500 }, { - "epoch": 0.98, - "learning_rate": 9.74305674236268e-07, - "loss": 2.3338, - "step": 562260 + "epoch": 0.62, + "learning_rate": 1.919518402575754e-05, + "loss": 2.7168, + "step": 172600 }, { - "epoch": 0.98, - "learning_rate": 9.73433734309441e-07, - "loss": 2.1877, - "step": 562270 + "epoch": 0.62, + "learning_rate": 1.917733650781186e-05, + "loss": 2.7302, + "step": 172700 }, { - "epoch": 0.98, - "learning_rate": 9.725617943826144e-07, - "loss": 2.1975, - "step": 562280 + "epoch": 0.62, + "learning_rate": 1.915948898986618e-05, + "loss": 2.7306, + "step": 172800 }, { - "epoch": 0.98, - "learning_rate": 9.716898544557876e-07, - "loss": 2.2767, - "step": 562290 + "epoch": 0.62, + "learning_rate": 1.9141641471920502e-05, + "loss": 2.7166, + "step": 172900 }, { - "epoch": 0.98, - "learning_rate": 9.708179145289607e-07, - "loss": 2.2955, - "step": 562300 + "epoch": 0.62, + "learning_rate": 1.9123793953974823e-05, + "loss": 2.7168, + "step": 173000 }, { - "epoch": 0.98, - "learning_rate": 9.699459746021338e-07, - "loss": 2.3001, - "step": 562310 + "epoch": 0.62, + "learning_rate": 1.9105946436029144e-05, + "loss": 2.736, + "step": 173100 }, { - "epoch": 0.98, - "learning_rate": 9.690740346753072e-07, - "loss": 2.2813, - "step": 562320 + "epoch": 0.62, + "learning_rate": 1.9088098918083462e-05, + "loss": 2.724, + "step": 173200 }, { - "epoch": 0.98, - "learning_rate": 9.682020947484803e-07, - "loss": 2.2731, - "step": 562330 + "epoch": 0.62, + "learning_rate": 1.9070251400137784e-05, + "loss": 2.7258, + "step": 173300 }, { - "epoch": 0.98, - "learning_rate": 9.673301548216535e-07, - "loss": 2.2692, - "step": 562340 + "epoch": 0.62, + "learning_rate": 1.9052403882192105e-05, + "loss": 2.723, + "step": 173400 }, { - "epoch": 0.98, - "learning_rate": 9.664582148948268e-07, - "loss": 2.2259, - "step": 562350 + "epoch": 0.62, + "learning_rate": 1.9034556364246426e-05, + "loss": 2.7322, + "step": 173500 }, { - "epoch": 0.98, - "learning_rate": 9.65586274968e-07, - "loss": 2.3122, - "step": 562360 + "epoch": 0.62, + "learning_rate": 1.9016708846300747e-05, + "loss": 2.7307, + "step": 173600 }, { - "epoch": 0.98, - "learning_rate": 9.64714335041173e-07, - "loss": 2.3276, - "step": 562370 + "epoch": 0.62, + "learning_rate": 1.8998861328355065e-05, + "loss": 2.7214, + "step": 173700 }, { - "epoch": 0.98, - "learning_rate": 9.638423951143464e-07, - "loss": 2.2612, - "step": 562380 + "epoch": 0.62, + "learning_rate": 1.8981013810409386e-05, + "loss": 2.7123, + "step": 173800 }, { - "epoch": 0.98, - "learning_rate": 9.629704551875196e-07, - "loss": 2.2987, - "step": 562390 + "epoch": 0.62, + "learning_rate": 1.8963166292463707e-05, + "loss": 2.731, + "step": 173900 }, { - "epoch": 0.98, - "learning_rate": 9.620985152606927e-07, - "loss": 2.2785, - "step": 562400 + "epoch": 0.62, + "learning_rate": 1.894531877451803e-05, + "loss": 2.7262, + "step": 174000 }, { - "epoch": 0.98, - "learning_rate": 9.612265753338658e-07, - "loss": 2.1792, - "step": 562410 + "epoch": 0.62, + "learning_rate": 1.892747125657235e-05, + "loss": 2.7263, + "step": 174100 }, { - "epoch": 0.98, - "learning_rate": 9.603546354070392e-07, - "loss": 2.1427, - "step": 562420 + "epoch": 0.62, + "learning_rate": 1.890962373862667e-05, + "loss": 2.7317, + "step": 174200 }, { - "epoch": 0.98, - "learning_rate": 9.594826954802123e-07, - "loss": 2.2518, - "step": 562430 + "epoch": 0.62, + "learning_rate": 1.889177622068099e-05, + "loss": 2.7196, + "step": 174300 }, { - "epoch": 0.98, - "learning_rate": 9.586107555533854e-07, - "loss": 2.3458, - "step": 562440 + "epoch": 0.62, + "learning_rate": 1.887392870273531e-05, + "loss": 2.7145, + "step": 174400 }, { - "epoch": 0.98, - "learning_rate": 9.577388156265588e-07, - "loss": 2.2893, - "step": 562450 + "epoch": 0.62, + "learning_rate": 1.885608118478963e-05, + "loss": 2.731, + "step": 174500 }, { - "epoch": 0.98, - "learning_rate": 9.56866875699732e-07, - "loss": 2.2465, - "step": 562460 + "epoch": 0.62, + "learning_rate": 1.8838233666843953e-05, + "loss": 2.7168, + "step": 174600 }, { - "epoch": 0.98, - "learning_rate": 9.55994935772905e-07, - "loss": 2.3136, - "step": 562470 + "epoch": 0.62, + "learning_rate": 1.8820386148898274e-05, + "loss": 2.7146, + "step": 174700 }, { - "epoch": 0.98, - "learning_rate": 9.551229958460784e-07, - "loss": 2.2978, - "step": 562480 + "epoch": 0.62, + "learning_rate": 1.880253863095259e-05, + "loss": 2.7292, + "step": 174800 }, { - "epoch": 0.98, - "learning_rate": 9.542510559192515e-07, - "loss": 2.3661, - "step": 562490 + "epoch": 0.62, + "learning_rate": 1.8784691113006913e-05, + "loss": 2.7264, + "step": 174900 }, { - "epoch": 0.98, - "learning_rate": 9.533791159924246e-07, - "loss": 2.2757, - "step": 562500 + "epoch": 0.62, + "learning_rate": 1.8766843595061237e-05, + "loss": 2.7189, + "step": 175000 }, { - "epoch": 0.98, - "learning_rate": 9.525071760655977e-07, - "loss": 2.2476, - "step": 562510 + "epoch": 0.63, + "learning_rate": 1.874899607711556e-05, + "loss": 2.7263, + "step": 175100 }, { - "epoch": 0.98, - "learning_rate": 9.51635236138771e-07, - "loss": 2.2354, - "step": 562520 + "epoch": 0.63, + "learning_rate": 1.873114855916988e-05, + "loss": 2.7316, + "step": 175200 }, { - "epoch": 0.98, - "learning_rate": 9.507632962119442e-07, - "loss": 2.2733, - "step": 562530 + "epoch": 0.63, + "learning_rate": 1.8713301041224198e-05, + "loss": 2.7149, + "step": 175300 }, { - "epoch": 0.98, - "learning_rate": 9.498913562851173e-07, - "loss": 2.3437, - "step": 562540 + "epoch": 0.63, + "learning_rate": 1.869545352327852e-05, + "loss": 2.7134, + "step": 175400 }, { - "epoch": 0.98, - "learning_rate": 9.490194163582907e-07, - "loss": 2.2418, - "step": 562550 + "epoch": 0.63, + "learning_rate": 1.867760600533284e-05, + "loss": 2.7276, + "step": 175500 }, { - "epoch": 0.98, - "learning_rate": 9.481474764314638e-07, - "loss": 2.1783, - "step": 562560 + "epoch": 0.63, + "learning_rate": 1.865975848738716e-05, + "loss": 2.7289, + "step": 175600 }, { - "epoch": 0.98, - "learning_rate": 9.472755365046369e-07, - "loss": 2.3158, - "step": 562570 + "epoch": 0.63, + "learning_rate": 1.8641910969441483e-05, + "loss": 2.7301, + "step": 175700 }, { - "epoch": 0.98, - "learning_rate": 9.464035965778103e-07, - "loss": 2.2304, - "step": 562580 + "epoch": 0.63, + "learning_rate": 1.86240634514958e-05, + "loss": 2.7229, + "step": 175800 }, { - "epoch": 0.98, - "learning_rate": 9.455316566509834e-07, - "loss": 2.1899, - "step": 562590 + "epoch": 0.63, + "learning_rate": 1.860621593355012e-05, + "loss": 2.7207, + "step": 175900 }, { - "epoch": 0.98, - "learning_rate": 9.446597167241565e-07, - "loss": 2.1701, - "step": 562600 + "epoch": 0.63, + "learning_rate": 1.8588368415604443e-05, + "loss": 2.7187, + "step": 176000 }, { - "epoch": 0.98, - "learning_rate": 9.437877767973299e-07, - "loss": 2.2597, - "step": 562610 + "epoch": 0.63, + "learning_rate": 1.8570520897658764e-05, + "loss": 2.7242, + "step": 176100 }, { - "epoch": 0.98, - "learning_rate": 9.42915836870503e-07, - "loss": 2.3538, - "step": 562620 + "epoch": 0.63, + "learning_rate": 1.8552673379713085e-05, + "loss": 2.7331, + "step": 176200 }, { - "epoch": 0.98, - "learning_rate": 9.420438969436762e-07, - "loss": 2.1842, - "step": 562630 + "epoch": 0.63, + "learning_rate": 1.8534825861767406e-05, + "loss": 2.728, + "step": 176300 }, { - "epoch": 0.98, - "learning_rate": 9.411719570168493e-07, - "loss": 2.1564, - "step": 562640 + "epoch": 0.63, + "learning_rate": 1.8516978343821724e-05, + "loss": 2.7247, + "step": 176400 }, { - "epoch": 0.98, - "learning_rate": 9.403000170900226e-07, - "loss": 2.2102, - "step": 562650 + "epoch": 0.63, + "learning_rate": 1.8499130825876045e-05, + "loss": 2.7274, + "step": 176500 }, { - "epoch": 0.98, - "learning_rate": 9.394280771631958e-07, - "loss": 2.2827, - "step": 562660 + "epoch": 0.63, + "learning_rate": 1.8481283307930367e-05, + "loss": 2.7342, + "step": 176600 }, { - "epoch": 0.98, - "learning_rate": 9.385561372363689e-07, - "loss": 2.2028, - "step": 562670 + "epoch": 0.63, + "learning_rate": 1.8463435789984688e-05, + "loss": 2.7282, + "step": 176700 }, { - "epoch": 0.98, - "learning_rate": 9.376841973095423e-07, - "loss": 2.2833, - "step": 562680 + "epoch": 0.63, + "learning_rate": 1.844558827203901e-05, + "loss": 2.7143, + "step": 176800 }, { - "epoch": 0.98, - "learning_rate": 9.368122573827154e-07, - "loss": 2.3622, - "step": 562690 + "epoch": 0.63, + "learning_rate": 1.8427740754093327e-05, + "loss": 2.7194, + "step": 176900 }, { - "epoch": 0.98, - "learning_rate": 9.359403174558885e-07, - "loss": 2.2367, - "step": 562700 + "epoch": 0.63, + "learning_rate": 1.8409893236147648e-05, + "loss": 2.7324, + "step": 177000 }, { - "epoch": 0.98, - "learning_rate": 9.350683775290619e-07, - "loss": 2.2848, - "step": 562710 + "epoch": 0.63, + "learning_rate": 1.839204571820197e-05, + "loss": 2.7307, + "step": 177100 }, { - "epoch": 0.98, - "learning_rate": 9.34196437602235e-07, - "loss": 2.2458, - "step": 562720 + "epoch": 0.63, + "learning_rate": 1.837419820025629e-05, + "loss": 2.7296, + "step": 177200 }, { - "epoch": 0.98, - "learning_rate": 9.333244976754081e-07, - "loss": 2.2344, - "step": 562730 + "epoch": 0.63, + "learning_rate": 1.8356350682310612e-05, + "loss": 2.7236, + "step": 177300 }, { - "epoch": 0.98, - "learning_rate": 9.324525577485813e-07, - "loss": 2.3331, - "step": 562740 + "epoch": 0.63, + "learning_rate": 1.833850316436493e-05, + "loss": 2.7156, + "step": 177400 }, { - "epoch": 0.98, - "learning_rate": 9.315806178217546e-07, - "loss": 2.1674, - "step": 562750 + "epoch": 0.63, + "learning_rate": 1.8320655646419254e-05, + "loss": 2.7224, + "step": 177500 }, { - "epoch": 0.98, - "learning_rate": 9.307086778949278e-07, - "loss": 2.2783, - "step": 562760 + "epoch": 0.63, + "learning_rate": 1.8302808128473575e-05, + "loss": 2.7156, + "step": 177600 }, { - "epoch": 0.98, - "learning_rate": 9.298367379681009e-07, - "loss": 2.3326, - "step": 562770 + "epoch": 0.63, + "learning_rate": 1.8284960610527897e-05, + "loss": 2.724, + "step": 177700 }, { - "epoch": 0.98, - "learning_rate": 9.289647980412742e-07, - "loss": 2.3818, - "step": 562780 + "epoch": 0.63, + "learning_rate": 1.8267113092582218e-05, + "loss": 2.7244, + "step": 177800 }, { - "epoch": 0.98, - "learning_rate": 9.280928581144474e-07, - "loss": 2.2422, - "step": 562790 + "epoch": 0.64, + "learning_rate": 1.8249265574636536e-05, + "loss": 2.7247, + "step": 177900 }, { - "epoch": 0.98, - "learning_rate": 9.272209181876205e-07, - "loss": 2.3358, - "step": 562800 + "epoch": 0.64, + "learning_rate": 1.8231418056690857e-05, + "loss": 2.7214, + "step": 178000 }, { - "epoch": 0.98, - "learning_rate": 9.263489782607939e-07, - "loss": 2.2369, - "step": 562810 + "epoch": 0.64, + "learning_rate": 1.8213570538745178e-05, + "loss": 2.7257, + "step": 178100 }, { - "epoch": 0.98, - "learning_rate": 9.25477038333967e-07, - "loss": 2.2468, - "step": 562820 + "epoch": 0.64, + "learning_rate": 1.81957230207995e-05, + "loss": 2.7253, + "step": 178200 }, { - "epoch": 0.98, - "learning_rate": 9.246050984071401e-07, - "loss": 2.3564, - "step": 562830 + "epoch": 0.64, + "learning_rate": 1.817787550285382e-05, + "loss": 2.7244, + "step": 178300 }, { - "epoch": 0.98, - "learning_rate": 9.237331584803134e-07, - "loss": 2.2635, - "step": 562840 + "epoch": 0.64, + "learning_rate": 1.816002798490814e-05, + "loss": 2.7392, + "step": 178400 }, { - "epoch": 0.98, - "learning_rate": 9.228612185534866e-07, - "loss": 2.31, - "step": 562850 + "epoch": 0.64, + "learning_rate": 1.814218046696246e-05, + "loss": 2.7217, + "step": 178500 }, { - "epoch": 0.98, - "learning_rate": 9.219892786266597e-07, - "loss": 2.1726, - "step": 562860 + "epoch": 0.64, + "learning_rate": 1.812433294901678e-05, + "loss": 2.7255, + "step": 178600 }, { - "epoch": 0.98, - "learning_rate": 9.211173386998329e-07, - "loss": 2.2974, - "step": 562870 + "epoch": 0.64, + "learning_rate": 1.8106485431071102e-05, + "loss": 2.7261, + "step": 178700 }, { - "epoch": 0.98, - "learning_rate": 9.202453987730062e-07, - "loss": 2.3372, - "step": 562880 + "epoch": 0.64, + "learning_rate": 1.8088637913125423e-05, + "loss": 2.7218, + "step": 178800 }, { - "epoch": 0.98, - "learning_rate": 9.193734588461794e-07, - "loss": 2.1252, - "step": 562890 + "epoch": 0.64, + "learning_rate": 1.8070790395179744e-05, + "loss": 2.7325, + "step": 178900 }, { - "epoch": 0.98, - "learning_rate": 9.185015189193525e-07, - "loss": 2.1867, - "step": 562900 + "epoch": 0.64, + "learning_rate": 1.8052942877234062e-05, + "loss": 2.7252, + "step": 179000 }, { - "epoch": 0.98, - "learning_rate": 9.176295789925258e-07, - "loss": 2.2259, - "step": 562910 + "epoch": 0.64, + "learning_rate": 1.8035095359288384e-05, + "loss": 2.7204, + "step": 179100 }, { - "epoch": 0.98, - "learning_rate": 9.16757639065699e-07, - "loss": 2.2098, - "step": 562920 + "epoch": 0.64, + "learning_rate": 1.8017247841342705e-05, + "loss": 2.7163, + "step": 179200 }, { - "epoch": 0.98, - "learning_rate": 9.158856991388721e-07, - "loss": 2.3059, - "step": 562930 + "epoch": 0.64, + "learning_rate": 1.7999400323397026e-05, + "loss": 2.7288, + "step": 179300 }, { - "epoch": 0.98, - "learning_rate": 9.150137592120453e-07, - "loss": 2.2977, - "step": 562940 + "epoch": 0.64, + "learning_rate": 1.7981552805451347e-05, + "loss": 2.7302, + "step": 179400 }, { - "epoch": 0.98, - "learning_rate": 9.141418192852186e-07, - "loss": 2.2685, - "step": 562950 + "epoch": 0.64, + "learning_rate": 1.7963705287505665e-05, + "loss": 2.7141, + "step": 179500 }, { - "epoch": 0.98, - "learning_rate": 9.132698793583917e-07, - "loss": 2.1683, - "step": 562960 + "epoch": 0.64, + "learning_rate": 1.7945857769559986e-05, + "loss": 2.7133, + "step": 179600 }, { - "epoch": 0.98, - "learning_rate": 9.12397939431565e-07, - "loss": 2.1839, - "step": 562970 + "epoch": 0.64, + "learning_rate": 1.7928010251614307e-05, + "loss": 2.7207, + "step": 179700 }, { - "epoch": 0.98, - "learning_rate": 9.115259995047382e-07, - "loss": 2.2489, - "step": 562980 + "epoch": 0.64, + "learning_rate": 1.791016273366863e-05, + "loss": 2.7191, + "step": 179800 }, { - "epoch": 0.98, - "learning_rate": 9.106540595779113e-07, - "loss": 2.2183, - "step": 562990 + "epoch": 0.64, + "learning_rate": 1.789231521572295e-05, + "loss": 2.7188, + "step": 179900 }, { - "epoch": 0.98, - "learning_rate": 9.097821196510845e-07, - "loss": 2.2668, - "step": 563000 + "epoch": 0.64, + "learning_rate": 1.787446769777727e-05, + "loss": 2.7159, + "step": 180000 }, { - "epoch": 0.98, - "learning_rate": 9.089101797242578e-07, - "loss": 2.2331, - "step": 563010 + "epoch": 0.64, + "learning_rate": 1.7856620179831592e-05, + "loss": 2.7176, + "step": 180100 }, { - "epoch": 0.98, - "learning_rate": 9.08038239797431e-07, - "loss": 2.2943, - "step": 563020 + "epoch": 0.64, + "learning_rate": 1.7838772661885913e-05, + "loss": 2.7271, + "step": 180200 }, { - "epoch": 0.98, - "learning_rate": 9.071662998706041e-07, - "loss": 2.3451, - "step": 563030 + "epoch": 0.64, + "learning_rate": 1.7820925143940235e-05, + "loss": 2.7298, + "step": 180300 }, { - "epoch": 0.98, - "learning_rate": 9.062943599437773e-07, - "loss": 2.168, - "step": 563040 + "epoch": 0.64, + "learning_rate": 1.7803077625994556e-05, + "loss": 2.7158, + "step": 180400 }, { - "epoch": 0.98, - "learning_rate": 9.054224200169506e-07, - "loss": 2.253, - "step": 563050 + "epoch": 0.64, + "learning_rate": 1.7785230108048874e-05, + "loss": 2.733, + "step": 180500 }, { - "epoch": 0.98, - "learning_rate": 9.045504800901237e-07, - "loss": 2.2498, - "step": 563060 + "epoch": 0.64, + "learning_rate": 1.7767382590103195e-05, + "loss": 2.7242, + "step": 180600 }, { - "epoch": 0.98, - "learning_rate": 9.036785401632969e-07, - "loss": 2.1895, - "step": 563070 + "epoch": 0.65, + "learning_rate": 1.7749535072157516e-05, + "loss": 2.7177, + "step": 180700 }, { - "epoch": 0.98, - "learning_rate": 9.028066002364702e-07, - "loss": 2.2042, - "step": 563080 + "epoch": 0.65, + "learning_rate": 1.7731687554211837e-05, + "loss": 2.7187, + "step": 180800 }, { - "epoch": 0.98, - "learning_rate": 9.019346603096433e-07, - "loss": 2.3531, - "step": 563090 + "epoch": 0.65, + "learning_rate": 1.771384003626616e-05, + "loss": 2.7196, + "step": 180900 }, { - "epoch": 0.98, - "learning_rate": 9.010627203828166e-07, - "loss": 2.1927, - "step": 563100 + "epoch": 0.65, + "learning_rate": 1.769599251832048e-05, + "loss": 2.7254, + "step": 181000 }, { - "epoch": 0.98, - "learning_rate": 9.001907804559898e-07, - "loss": 2.178, - "step": 563110 + "epoch": 0.65, + "learning_rate": 1.7678145000374798e-05, + "loss": 2.717, + "step": 181100 }, { - "epoch": 0.98, - "learning_rate": 8.993188405291629e-07, - "loss": 2.2787, - "step": 563120 + "epoch": 0.65, + "learning_rate": 1.766029748242912e-05, + "loss": 2.7162, + "step": 181200 }, { - "epoch": 0.98, - "learning_rate": 8.984469006023361e-07, - "loss": 2.3142, - "step": 563130 + "epoch": 0.65, + "learning_rate": 1.764244996448344e-05, + "loss": 2.7167, + "step": 181300 }, { - "epoch": 0.98, - "learning_rate": 8.975749606755093e-07, - "loss": 2.3551, - "step": 563140 + "epoch": 0.65, + "learning_rate": 1.762460244653776e-05, + "loss": 2.7216, + "step": 181400 }, { - "epoch": 0.98, - "learning_rate": 8.967030207486825e-07, - "loss": 2.2375, - "step": 563150 + "epoch": 0.65, + "learning_rate": 1.7606754928592082e-05, + "loss": 2.7254, + "step": 181500 }, { - "epoch": 0.98, - "learning_rate": 8.958310808218557e-07, - "loss": 2.3814, - "step": 563160 + "epoch": 0.65, + "learning_rate": 1.75889074106464e-05, + "loss": 2.72, + "step": 181600 }, { - "epoch": 0.98, - "learning_rate": 8.949591408950289e-07, - "loss": 2.2586, - "step": 563170 + "epoch": 0.65, + "learning_rate": 1.757105989270072e-05, + "loss": 2.7132, + "step": 181700 }, { - "epoch": 0.98, - "learning_rate": 8.940872009682022e-07, - "loss": 2.2952, - "step": 563180 + "epoch": 0.65, + "learning_rate": 1.7553212374755043e-05, + "loss": 2.723, + "step": 181800 }, { - "epoch": 0.98, - "learning_rate": 8.932152610413753e-07, - "loss": 2.2833, - "step": 563190 + "epoch": 0.65, + "learning_rate": 1.7535364856809364e-05, + "loss": 2.7191, + "step": 181900 }, { - "epoch": 0.98, - "learning_rate": 8.923433211145485e-07, - "loss": 2.23, - "step": 563200 + "epoch": 0.65, + "learning_rate": 1.7517517338863685e-05, + "loss": 2.7216, + "step": 182000 }, { - "epoch": 0.98, - "learning_rate": 8.914713811877218e-07, - "loss": 2.1484, - "step": 563210 + "epoch": 0.65, + "learning_rate": 1.7499669820918006e-05, + "loss": 2.7184, + "step": 182100 }, { - "epoch": 0.98, - "learning_rate": 8.905994412608949e-07, - "loss": 2.167, - "step": 563220 + "epoch": 0.65, + "learning_rate": 1.7481822302972324e-05, + "loss": 2.7303, + "step": 182200 }, { - "epoch": 0.98, - "learning_rate": 8.897275013340682e-07, - "loss": 2.3548, - "step": 563230 + "epoch": 0.65, + "learning_rate": 1.7463974785026645e-05, + "loss": 2.7074, + "step": 182300 }, { - "epoch": 0.98, - "learning_rate": 8.888555614072413e-07, - "loss": 2.2475, - "step": 563240 + "epoch": 0.65, + "learning_rate": 1.7446127267080967e-05, + "loss": 2.7286, + "step": 182400 }, { - "epoch": 0.98, - "learning_rate": 8.879836214804145e-07, - "loss": 2.2569, - "step": 563250 + "epoch": 0.65, + "learning_rate": 1.7428279749135288e-05, + "loss": 2.7204, + "step": 182500 }, { - "epoch": 0.98, - "learning_rate": 8.871116815535878e-07, - "loss": 2.269, - "step": 563260 + "epoch": 0.65, + "learning_rate": 1.741043223118961e-05, + "loss": 2.7159, + "step": 182600 }, { - "epoch": 0.98, - "learning_rate": 8.862397416267609e-07, - "loss": 2.2654, - "step": 563270 + "epoch": 0.65, + "learning_rate": 1.739258471324393e-05, + "loss": 2.7101, + "step": 182700 }, { - "epoch": 0.98, - "learning_rate": 8.853678016999341e-07, - "loss": 2.3581, - "step": 563280 + "epoch": 0.65, + "learning_rate": 1.737473719529825e-05, + "loss": 2.7151, + "step": 182800 }, { - "epoch": 0.98, - "learning_rate": 8.844958617731073e-07, - "loss": 2.1809, - "step": 563290 + "epoch": 0.65, + "learning_rate": 1.7356889677352573e-05, + "loss": 2.7056, + "step": 182900 }, { - "epoch": 0.98, - "learning_rate": 8.836239218462805e-07, - "loss": 2.3118, - "step": 563300 + "epoch": 0.65, + "learning_rate": 1.7339042159406894e-05, + "loss": 2.7251, + "step": 183000 }, { - "epoch": 0.98, - "learning_rate": 8.827519819194538e-07, - "loss": 2.2944, - "step": 563310 + "epoch": 0.65, + "learning_rate": 1.7321194641461215e-05, + "loss": 2.7264, + "step": 183100 }, { - "epoch": 0.98, - "learning_rate": 8.818800419926269e-07, - "loss": 2.2478, - "step": 563320 + "epoch": 0.65, + "learning_rate": 1.7303347123515533e-05, + "loss": 2.7249, + "step": 183200 }, { - "epoch": 0.98, - "learning_rate": 8.810081020658001e-07, - "loss": 2.2749, - "step": 563330 + "epoch": 0.65, + "learning_rate": 1.7285499605569854e-05, + "loss": 2.7095, + "step": 183300 }, { - "epoch": 0.98, - "learning_rate": 8.801361621389733e-07, - "loss": 2.2952, - "step": 563340 + "epoch": 0.65, + "learning_rate": 1.7267652087624175e-05, + "loss": 2.7235, + "step": 183400 }, { - "epoch": 0.98, - "learning_rate": 8.792642222121465e-07, - "loss": 2.3279, - "step": 563350 + "epoch": 0.66, + "learning_rate": 1.7249804569678497e-05, + "loss": 2.7213, + "step": 183500 }, { - "epoch": 0.98, - "learning_rate": 8.783922822853198e-07, - "loss": 2.2535, - "step": 563360 + "epoch": 0.66, + "learning_rate": 1.7231957051732818e-05, + "loss": 2.7328, + "step": 183600 }, { - "epoch": 0.98, - "learning_rate": 8.775203423584929e-07, - "loss": 2.3122, - "step": 563370 + "epoch": 0.66, + "learning_rate": 1.7214109533787136e-05, + "loss": 2.7092, + "step": 183700 }, { - "epoch": 0.98, - "learning_rate": 8.766484024316661e-07, - "loss": 2.0859, - "step": 563380 + "epoch": 0.66, + "learning_rate": 1.7196262015841457e-05, + "loss": 2.7146, + "step": 183800 }, { - "epoch": 0.98, - "learning_rate": 8.757764625048394e-07, - "loss": 2.2589, - "step": 563390 + "epoch": 0.66, + "learning_rate": 1.7178414497895778e-05, + "loss": 2.7208, + "step": 183900 }, { - "epoch": 0.98, - "learning_rate": 8.749045225780125e-07, - "loss": 2.2846, - "step": 563400 + "epoch": 0.66, + "learning_rate": 1.71605669799501e-05, + "loss": 2.723, + "step": 184000 }, { - "epoch": 0.98, - "learning_rate": 8.740325826511857e-07, - "loss": 2.2639, - "step": 563410 + "epoch": 0.66, + "learning_rate": 1.714271946200442e-05, + "loss": 2.7104, + "step": 184100 }, { - "epoch": 0.98, - "learning_rate": 8.731606427243589e-07, - "loss": 2.2425, - "step": 563420 + "epoch": 0.66, + "learning_rate": 1.7124871944058742e-05, + "loss": 2.7221, + "step": 184200 }, { - "epoch": 0.98, - "learning_rate": 8.722887027975321e-07, - "loss": 2.3136, - "step": 563430 + "epoch": 0.66, + "learning_rate": 1.710702442611306e-05, + "loss": 2.7253, + "step": 184300 }, { - "epoch": 0.98, - "learning_rate": 8.714167628707053e-07, - "loss": 2.2165, - "step": 563440 + "epoch": 0.66, + "learning_rate": 1.708917690816738e-05, + "loss": 2.712, + "step": 184400 }, { - "epoch": 0.98, - "learning_rate": 8.705448229438785e-07, - "loss": 2.2748, - "step": 563450 + "epoch": 0.66, + "learning_rate": 1.7071329390221702e-05, + "loss": 2.723, + "step": 184500 }, { - "epoch": 0.98, - "learning_rate": 8.696728830170517e-07, - "loss": 2.3063, - "step": 563460 + "epoch": 0.66, + "learning_rate": 1.7053481872276023e-05, + "loss": 2.7147, + "step": 184600 }, { - "epoch": 0.98, - "learning_rate": 8.688009430902249e-07, - "loss": 2.2266, - "step": 563470 + "epoch": 0.66, + "learning_rate": 1.7035634354330344e-05, + "loss": 2.7115, + "step": 184700 }, { - "epoch": 0.98, - "learning_rate": 8.679290031633981e-07, - "loss": 2.3787, - "step": 563480 + "epoch": 0.66, + "learning_rate": 1.7017786836384662e-05, + "loss": 2.7187, + "step": 184800 }, { - "epoch": 0.98, - "learning_rate": 8.670570632365713e-07, - "loss": 2.2116, - "step": 563490 + "epoch": 0.66, + "learning_rate": 1.6999939318438983e-05, + "loss": 2.7232, + "step": 184900 }, { - "epoch": 0.98, - "learning_rate": 8.661851233097445e-07, - "loss": 2.3504, - "step": 563500 + "epoch": 0.66, + "learning_rate": 1.6982091800493305e-05, + "loss": 2.7248, + "step": 185000 }, { - "epoch": 0.98, - "learning_rate": 8.653131833829177e-07, - "loss": 2.2168, - "step": 563510 + "epoch": 0.66, + "learning_rate": 1.6964244282547626e-05, + "loss": 2.7092, + "step": 185100 }, { - "epoch": 0.98, - "learning_rate": 8.64441243456091e-07, - "loss": 2.1993, - "step": 563520 + "epoch": 0.66, + "learning_rate": 1.694639676460195e-05, + "loss": 2.7228, + "step": 185200 }, { - "epoch": 0.98, - "learning_rate": 8.635693035292641e-07, - "loss": 2.2392, - "step": 563530 + "epoch": 0.66, + "learning_rate": 1.692854924665627e-05, + "loss": 2.7268, + "step": 185300 }, { - "epoch": 0.98, - "learning_rate": 8.626973636024372e-07, - "loss": 2.2469, - "step": 563540 + "epoch": 0.66, + "learning_rate": 1.691070172871059e-05, + "loss": 2.7142, + "step": 185400 }, { - "epoch": 0.98, - "learning_rate": 8.618254236756105e-07, - "loss": 2.2169, - "step": 563550 + "epoch": 0.66, + "learning_rate": 1.689285421076491e-05, + "loss": 2.7131, + "step": 185500 }, { - "epoch": 0.98, - "learning_rate": 8.609534837487837e-07, - "loss": 2.1682, - "step": 563560 + "epoch": 0.66, + "learning_rate": 1.6875006692819232e-05, + "loss": 2.7241, + "step": 185600 }, { - "epoch": 0.98, - "learning_rate": 8.600815438219568e-07, - "loss": 2.1782, - "step": 563570 + "epoch": 0.66, + "learning_rate": 1.6857159174873553e-05, + "loss": 2.7147, + "step": 185700 }, { - "epoch": 0.98, - "learning_rate": 8.592096038951301e-07, - "loss": 2.2642, - "step": 563580 + "epoch": 0.66, + "learning_rate": 1.683931165692787e-05, + "loss": 2.7145, + "step": 185800 }, { - "epoch": 0.98, - "learning_rate": 8.583376639683033e-07, - "loss": 2.2717, - "step": 563590 + "epoch": 0.66, + "learning_rate": 1.6821464138982192e-05, + "loss": 2.7177, + "step": 185900 }, { - "epoch": 0.98, - "learning_rate": 8.574657240414765e-07, - "loss": 2.1521, - "step": 563600 + "epoch": 0.66, + "learning_rate": 1.6803616621036513e-05, + "loss": 2.7221, + "step": 186000 }, { - "epoch": 0.98, - "learning_rate": 8.565937841146497e-07, - "loss": 2.2407, - "step": 563610 + "epoch": 0.66, + "learning_rate": 1.6785769103090835e-05, + "loss": 2.7218, + "step": 186100 }, { - "epoch": 0.98, - "learning_rate": 8.557218441878229e-07, - "loss": 2.2709, - "step": 563620 + "epoch": 0.66, + "learning_rate": 1.6767921585145156e-05, + "loss": 2.7185, + "step": 186200 }, { - "epoch": 0.98, - "learning_rate": 8.548499042609961e-07, - "loss": 2.3894, - "step": 563630 + "epoch": 0.66, + "learning_rate": 1.6750074067199477e-05, + "loss": 2.7084, + "step": 186300 }, { - "epoch": 0.98, - "learning_rate": 8.539779643341692e-07, - "loss": 2.2594, - "step": 563640 + "epoch": 0.67, + "learning_rate": 1.6732226549253795e-05, + "loss": 2.7109, + "step": 186400 }, { - "epoch": 0.98, - "learning_rate": 8.531060244073426e-07, - "loss": 2.1642, - "step": 563650 + "epoch": 0.67, + "learning_rate": 1.6714379031308116e-05, + "loss": 2.7236, + "step": 186500 }, { - "epoch": 0.98, - "learning_rate": 8.522340844805157e-07, - "loss": 2.3587, - "step": 563660 + "epoch": 0.67, + "learning_rate": 1.6696531513362437e-05, + "loss": 2.732, + "step": 186600 }, { - "epoch": 0.98, - "learning_rate": 8.513621445536888e-07, - "loss": 2.1569, - "step": 563670 + "epoch": 0.67, + "learning_rate": 1.667868399541676e-05, + "loss": 2.7222, + "step": 186700 }, { - "epoch": 0.98, - "learning_rate": 8.504902046268621e-07, - "loss": 2.2474, - "step": 563680 + "epoch": 0.67, + "learning_rate": 1.666083647747108e-05, + "loss": 2.7112, + "step": 186800 }, { - "epoch": 0.98, - "learning_rate": 8.496182647000353e-07, - "loss": 2.2394, - "step": 563690 + "epoch": 0.67, + "learning_rate": 1.6642988959525398e-05, + "loss": 2.7275, + "step": 186900 }, { - "epoch": 0.98, - "learning_rate": 8.487463247732084e-07, - "loss": 2.3289, - "step": 563700 + "epoch": 0.67, + "learning_rate": 1.662514144157972e-05, + "loss": 2.7227, + "step": 187000 }, { - "epoch": 0.98, - "learning_rate": 8.478743848463817e-07, - "loss": 2.2337, - "step": 563710 + "epoch": 0.67, + "learning_rate": 1.660729392363404e-05, + "loss": 2.723, + "step": 187100 }, { - "epoch": 0.98, - "learning_rate": 8.470024449195549e-07, - "loss": 2.1952, - "step": 563720 + "epoch": 0.67, + "learning_rate": 1.658944640568836e-05, + "loss": 2.732, + "step": 187200 }, { - "epoch": 0.98, - "learning_rate": 8.461305049927281e-07, - "loss": 2.1816, - "step": 563730 + "epoch": 0.67, + "learning_rate": 1.6571598887742682e-05, + "loss": 2.7154, + "step": 187300 }, { - "epoch": 0.98, - "learning_rate": 8.452585650659012e-07, - "loss": 2.2365, - "step": 563740 + "epoch": 0.67, + "learning_rate": 1.6553751369797004e-05, + "loss": 2.7151, + "step": 187400 }, { - "epoch": 0.98, - "learning_rate": 8.443866251390745e-07, - "loss": 2.2146, - "step": 563750 + "epoch": 0.67, + "learning_rate": 1.653590385185132e-05, + "loss": 2.7072, + "step": 187500 }, { - "epoch": 0.98, - "learning_rate": 8.435146852122477e-07, - "loss": 2.2649, - "step": 563760 + "epoch": 0.67, + "learning_rate": 1.6518056333905643e-05, + "loss": 2.7216, + "step": 187600 }, { - "epoch": 0.98, - "learning_rate": 8.426427452854208e-07, - "loss": 2.2548, - "step": 563770 + "epoch": 0.67, + "learning_rate": 1.6500208815959967e-05, + "loss": 2.7015, + "step": 187700 }, { - "epoch": 0.98, - "learning_rate": 8.417708053585942e-07, - "loss": 2.229, - "step": 563780 + "epoch": 0.67, + "learning_rate": 1.648236129801429e-05, + "loss": 2.7158, + "step": 187800 }, { - "epoch": 0.98, - "learning_rate": 8.408988654317673e-07, - "loss": 2.2489, - "step": 563790 + "epoch": 0.67, + "learning_rate": 1.6464513780068606e-05, + "loss": 2.7235, + "step": 187900 }, { - "epoch": 0.98, - "learning_rate": 8.400269255049404e-07, - "loss": 2.1303, - "step": 563800 + "epoch": 0.67, + "learning_rate": 1.6446666262122928e-05, + "loss": 2.7088, + "step": 188000 }, { - "epoch": 0.98, - "learning_rate": 8.391549855781137e-07, - "loss": 2.2409, - "step": 563810 + "epoch": 0.67, + "learning_rate": 1.642881874417725e-05, + "loss": 2.7184, + "step": 188100 }, { - "epoch": 0.98, - "learning_rate": 8.382830456512869e-07, - "loss": 2.2933, - "step": 563820 + "epoch": 0.67, + "learning_rate": 1.641097122623157e-05, + "loss": 2.7156, + "step": 188200 }, { - "epoch": 0.98, - "learning_rate": 8.3741110572446e-07, - "loss": 2.3089, - "step": 563830 + "epoch": 0.67, + "learning_rate": 1.639312370828589e-05, + "loss": 2.7184, + "step": 188300 }, { - "epoch": 0.98, - "learning_rate": 8.365391657976332e-07, - "loss": 2.3019, - "step": 563840 + "epoch": 0.67, + "learning_rate": 1.6375276190340212e-05, + "loss": 2.7243, + "step": 188400 }, { - "epoch": 0.98, - "learning_rate": 8.356672258708065e-07, - "loss": 2.1981, - "step": 563850 + "epoch": 0.67, + "learning_rate": 1.635742867239453e-05, + "loss": 2.7248, + "step": 188500 }, { - "epoch": 0.98, - "learning_rate": 8.347952859439797e-07, - "loss": 2.199, - "step": 563860 + "epoch": 0.67, + "learning_rate": 1.633958115444885e-05, + "loss": 2.7154, + "step": 188600 }, { - "epoch": 0.98, - "learning_rate": 8.339233460171528e-07, - "loss": 2.355, - "step": 563870 + "epoch": 0.67, + "learning_rate": 1.6321733636503173e-05, + "loss": 2.7176, + "step": 188700 }, { - "epoch": 0.98, - "learning_rate": 8.330514060903261e-07, - "loss": 2.2595, - "step": 563880 + "epoch": 0.67, + "learning_rate": 1.6303886118557494e-05, + "loss": 2.7134, + "step": 188800 }, { - "epoch": 0.98, - "learning_rate": 8.321794661634993e-07, - "loss": 2.0383, - "step": 563890 + "epoch": 0.67, + "learning_rate": 1.6286038600611815e-05, + "loss": 2.7259, + "step": 188900 }, { - "epoch": 0.98, - "learning_rate": 8.313075262366724e-07, - "loss": 2.3561, - "step": 563900 + "epoch": 0.67, + "learning_rate": 1.6268191082666133e-05, + "loss": 2.7226, + "step": 189000 }, { - "epoch": 0.98, - "learning_rate": 8.304355863098458e-07, - "loss": 2.2996, - "step": 563910 + "epoch": 0.67, + "learning_rate": 1.6250343564720454e-05, + "loss": 2.7062, + "step": 189100 }, { - "epoch": 0.98, - "learning_rate": 8.295636463830189e-07, - "loss": 2.2617, - "step": 563920 + "epoch": 0.68, + "learning_rate": 1.6232496046774775e-05, + "loss": 2.7082, + "step": 189200 }, { - "epoch": 0.98, - "learning_rate": 8.28691706456192e-07, - "loss": 2.2765, - "step": 563930 + "epoch": 0.68, + "learning_rate": 1.6214648528829097e-05, + "loss": 2.712, + "step": 189300 }, { - "epoch": 0.98, - "learning_rate": 8.278197665293653e-07, - "loss": 2.2632, - "step": 563940 + "epoch": 0.68, + "learning_rate": 1.6196801010883418e-05, + "loss": 2.7137, + "step": 189400 }, { - "epoch": 0.98, - "learning_rate": 8.269478266025385e-07, - "loss": 2.2946, - "step": 563950 + "epoch": 0.68, + "learning_rate": 1.6178953492937736e-05, + "loss": 2.7242, + "step": 189500 }, { - "epoch": 0.98, - "learning_rate": 8.260758866757116e-07, - "loss": 2.2306, - "step": 563960 + "epoch": 0.68, + "learning_rate": 1.6161105974992057e-05, + "loss": 2.7074, + "step": 189600 }, { - "epoch": 0.98, - "learning_rate": 8.252039467488848e-07, - "loss": 2.3172, - "step": 563970 + "epoch": 0.68, + "learning_rate": 1.6143258457046378e-05, + "loss": 2.7128, + "step": 189700 }, { - "epoch": 0.98, - "learning_rate": 8.243320068220581e-07, - "loss": 2.2092, - "step": 563980 + "epoch": 0.68, + "learning_rate": 1.61254109391007e-05, + "loss": 2.726, + "step": 189800 }, { - "epoch": 0.98, - "learning_rate": 8.234600668952313e-07, - "loss": 2.3072, - "step": 563990 + "epoch": 0.68, + "learning_rate": 1.610756342115502e-05, + "loss": 2.7125, + "step": 189900 }, { - "epoch": 0.98, - "learning_rate": 8.225881269684044e-07, - "loss": 2.1649, - "step": 564000 + "epoch": 0.68, + "learning_rate": 1.6089715903209342e-05, + "loss": 2.7131, + "step": 190000 }, { - "epoch": 0.98, - "learning_rate": 8.217161870415777e-07, - "loss": 2.3146, - "step": 564010 + "epoch": 0.68, + "learning_rate": 1.607186838526366e-05, + "loss": 2.7301, + "step": 190100 }, { - "epoch": 0.98, - "learning_rate": 8.208442471147509e-07, - "loss": 2.2742, - "step": 564020 + "epoch": 0.68, + "learning_rate": 1.605402086731798e-05, + "loss": 2.7243, + "step": 190200 }, { - "epoch": 0.98, - "learning_rate": 8.19972307187924e-07, - "loss": 2.2596, - "step": 564030 + "epoch": 0.68, + "learning_rate": 1.6036173349372305e-05, + "loss": 2.715, + "step": 190300 }, { - "epoch": 0.98, - "learning_rate": 8.191003672610974e-07, - "loss": 2.2809, - "step": 564040 + "epoch": 0.68, + "learning_rate": 1.6018325831426627e-05, + "loss": 2.7066, + "step": 190400 }, { - "epoch": 0.98, - "learning_rate": 8.182284273342705e-07, - "loss": 2.303, - "step": 564050 + "epoch": 0.68, + "learning_rate": 1.6000478313480944e-05, + "loss": 2.7182, + "step": 190500 }, { - "epoch": 0.98, - "learning_rate": 8.173564874074436e-07, - "loss": 2.3044, - "step": 564060 + "epoch": 0.68, + "learning_rate": 1.5982630795535266e-05, + "loss": 2.7147, + "step": 190600 }, { - "epoch": 0.98, - "learning_rate": 8.164845474806168e-07, - "loss": 2.2742, - "step": 564070 + "epoch": 0.68, + "learning_rate": 1.5964783277589587e-05, + "loss": 2.7144, + "step": 190700 }, { - "epoch": 0.98, - "learning_rate": 8.156126075537901e-07, - "loss": 2.2303, - "step": 564080 + "epoch": 0.68, + "learning_rate": 1.5946935759643908e-05, + "loss": 2.7222, + "step": 190800 }, { - "epoch": 0.98, - "learning_rate": 8.147406676269632e-07, - "loss": 2.1893, - "step": 564090 + "epoch": 0.68, + "learning_rate": 1.592908824169823e-05, + "loss": 2.7202, + "step": 190900 }, { - "epoch": 0.98, - "learning_rate": 8.138687277001364e-07, - "loss": 2.2682, - "step": 564100 + "epoch": 0.68, + "learning_rate": 1.591124072375255e-05, + "loss": 2.7086, + "step": 191000 }, { - "epoch": 0.98, - "learning_rate": 8.129967877733097e-07, - "loss": 2.2967, - "step": 564110 + "epoch": 0.68, + "learning_rate": 1.589339320580687e-05, + "loss": 2.7141, + "step": 191100 }, { - "epoch": 0.98, - "learning_rate": 8.121248478464829e-07, - "loss": 2.2862, - "step": 564120 + "epoch": 0.68, + "learning_rate": 1.587554568786119e-05, + "loss": 2.7148, + "step": 191200 }, { - "epoch": 0.98, - "learning_rate": 8.11252907919656e-07, - "loss": 2.2666, - "step": 564130 + "epoch": 0.68, + "learning_rate": 1.585769816991551e-05, + "loss": 2.7037, + "step": 191300 }, { - "epoch": 0.98, - "learning_rate": 8.103809679928293e-07, - "loss": 2.1685, - "step": 564140 + "epoch": 0.68, + "learning_rate": 1.5839850651969832e-05, + "loss": 2.7298, + "step": 191400 }, { - "epoch": 0.98, - "learning_rate": 8.095090280660025e-07, - "loss": 2.2236, - "step": 564150 + "epoch": 0.68, + "learning_rate": 1.5822003134024153e-05, + "loss": 2.7071, + "step": 191500 }, { - "epoch": 0.98, - "learning_rate": 8.086370881391756e-07, - "loss": 2.319, - "step": 564160 + "epoch": 0.68, + "learning_rate": 1.580415561607847e-05, + "loss": 2.71, + "step": 191600 }, { - "epoch": 0.98, - "learning_rate": 8.077651482123487e-07, - "loss": 2.2707, - "step": 564170 + "epoch": 0.68, + "learning_rate": 1.5786308098132792e-05, + "loss": 2.7058, + "step": 191700 }, { - "epoch": 0.98, - "learning_rate": 8.068932082855221e-07, - "loss": 2.1779, - "step": 564180 + "epoch": 0.68, + "learning_rate": 1.5768460580187113e-05, + "loss": 2.7256, + "step": 191800 }, { - "epoch": 0.98, - "learning_rate": 8.060212683586952e-07, - "loss": 2.3288, - "step": 564190 + "epoch": 0.68, + "learning_rate": 1.5750613062241435e-05, + "loss": 2.7194, + "step": 191900 }, { - "epoch": 0.98, - "learning_rate": 8.051493284318684e-07, - "loss": 2.2389, - "step": 564200 + "epoch": 0.69, + "learning_rate": 1.5732765544295756e-05, + "loss": 2.7117, + "step": 192000 }, { - "epoch": 0.98, - "learning_rate": 8.042773885050417e-07, - "loss": 2.1754, - "step": 564210 + "epoch": 0.69, + "learning_rate": 1.5714918026350077e-05, + "loss": 2.7162, + "step": 192100 }, { - "epoch": 0.98, - "learning_rate": 8.034054485782148e-07, - "loss": 2.3098, - "step": 564220 + "epoch": 0.69, + "learning_rate": 1.5697070508404395e-05, + "loss": 2.7219, + "step": 192200 }, { - "epoch": 0.98, - "learning_rate": 8.02533508651388e-07, - "loss": 2.3338, - "step": 564230 + "epoch": 0.69, + "learning_rate": 1.5679222990458716e-05, + "loss": 2.716, + "step": 192300 }, { - "epoch": 0.98, - "learning_rate": 8.016615687245613e-07, - "loss": 2.2843, - "step": 564240 + "epoch": 0.69, + "learning_rate": 1.5661375472513037e-05, + "loss": 2.7156, + "step": 192400 }, { - "epoch": 0.98, - "learning_rate": 8.007896287977345e-07, - "loss": 2.3562, - "step": 564250 + "epoch": 0.69, + "learning_rate": 1.564352795456736e-05, + "loss": 2.7103, + "step": 192500 }, { - "epoch": 0.98, - "learning_rate": 7.999176888709076e-07, - "loss": 2.204, - "step": 564260 + "epoch": 0.69, + "learning_rate": 1.562568043662168e-05, + "loss": 2.7085, + "step": 192600 }, { - "epoch": 0.98, - "learning_rate": 7.990457489440807e-07, - "loss": 2.1956, - "step": 564270 + "epoch": 0.69, + "learning_rate": 1.5607832918675998e-05, + "loss": 2.7151, + "step": 192700 }, { - "epoch": 0.98, - "learning_rate": 7.981738090172541e-07, - "loss": 2.3456, - "step": 564280 + "epoch": 0.69, + "learning_rate": 1.5589985400730322e-05, + "loss": 2.711, + "step": 192800 }, { - "epoch": 0.98, - "learning_rate": 7.973018690904272e-07, - "loss": 2.179, - "step": 564290 + "epoch": 0.69, + "learning_rate": 1.5572137882784643e-05, + "loss": 2.7089, + "step": 192900 }, { - "epoch": 0.98, - "learning_rate": 7.964299291636003e-07, - "loss": 2.1896, - "step": 564300 + "epoch": 0.69, + "learning_rate": 1.5554290364838965e-05, + "loss": 2.7197, + "step": 193000 }, { - "epoch": 0.98, - "learning_rate": 7.955579892367737e-07, - "loss": 2.3574, - "step": 564310 + "epoch": 0.69, + "learning_rate": 1.5536442846893286e-05, + "loss": 2.7035, + "step": 193100 }, { - "epoch": 0.98, - "learning_rate": 7.946860493099468e-07, - "loss": 2.1898, - "step": 564320 + "epoch": 0.69, + "learning_rate": 1.5518595328947604e-05, + "loss": 2.724, + "step": 193200 }, { - "epoch": 0.98, - "learning_rate": 7.9381410938312e-07, - "loss": 2.2799, - "step": 564330 + "epoch": 0.69, + "learning_rate": 1.5500747811001925e-05, + "loss": 2.721, + "step": 193300 }, { - "epoch": 0.98, - "learning_rate": 7.929421694562933e-07, - "loss": 2.2201, - "step": 564340 + "epoch": 0.69, + "learning_rate": 1.5482900293056246e-05, + "loss": 2.7175, + "step": 193400 }, { - "epoch": 0.98, - "learning_rate": 7.920702295294664e-07, - "loss": 2.2473, - "step": 564350 + "epoch": 0.69, + "learning_rate": 1.5465052775110567e-05, + "loss": 2.7098, + "step": 193500 }, { - "epoch": 0.98, - "learning_rate": 7.911982896026396e-07, - "loss": 2.2674, - "step": 564360 + "epoch": 0.69, + "learning_rate": 1.544720525716489e-05, + "loss": 2.7112, + "step": 193600 }, { - "epoch": 0.98, - "learning_rate": 7.903263496758127e-07, - "loss": 2.3348, - "step": 564370 + "epoch": 0.69, + "learning_rate": 1.5429357739219206e-05, + "loss": 2.7137, + "step": 193700 }, { - "epoch": 0.98, - "learning_rate": 7.89454409748986e-07, - "loss": 2.3759, - "step": 564380 + "epoch": 0.69, + "learning_rate": 1.5411510221273528e-05, + "loss": 2.7177, + "step": 193800 }, { - "epoch": 0.98, - "learning_rate": 7.885824698221592e-07, - "loss": 2.271, - "step": 564390 + "epoch": 0.69, + "learning_rate": 1.539366270332785e-05, + "loss": 2.7109, + "step": 193900 }, { - "epoch": 0.98, - "learning_rate": 7.877105298953323e-07, - "loss": 2.3301, - "step": 564400 + "epoch": 0.69, + "learning_rate": 1.537581518538217e-05, + "loss": 2.7027, + "step": 194000 }, { - "epoch": 0.98, - "learning_rate": 7.868385899685057e-07, - "loss": 2.357, - "step": 564410 + "epoch": 0.69, + "learning_rate": 1.535796766743649e-05, + "loss": 2.7139, + "step": 194100 }, { - "epoch": 0.98, - "learning_rate": 7.859666500416788e-07, - "loss": 2.2438, - "step": 564420 + "epoch": 0.69, + "learning_rate": 1.5340120149490812e-05, + "loss": 2.7126, + "step": 194200 }, { - "epoch": 0.98, - "learning_rate": 7.850947101148519e-07, - "loss": 2.1113, - "step": 564430 + "epoch": 0.69, + "learning_rate": 1.532227263154513e-05, + "loss": 2.7025, + "step": 194300 }, { - "epoch": 0.98, - "learning_rate": 7.842227701880253e-07, - "loss": 2.2355, - "step": 564440 + "epoch": 0.69, + "learning_rate": 1.530442511359945e-05, + "loss": 2.7097, + "step": 194400 }, { - "epoch": 0.98, - "learning_rate": 7.833508302611984e-07, - "loss": 2.236, - "step": 564450 + "epoch": 0.69, + "learning_rate": 1.5286577595653773e-05, + "loss": 2.7117, + "step": 194500 }, { - "epoch": 0.98, - "learning_rate": 7.824788903343715e-07, - "loss": 2.3107, - "step": 564460 + "epoch": 0.69, + "learning_rate": 1.5268730077708094e-05, + "loss": 2.7228, + "step": 194600 }, { - "epoch": 0.98, - "learning_rate": 7.816069504075447e-07, - "loss": 2.1796, - "step": 564470 + "epoch": 0.69, + "learning_rate": 1.5250882559762413e-05, + "loss": 2.7108, + "step": 194700 }, { - "epoch": 0.98, - "learning_rate": 7.807350104807179e-07, - "loss": 2.1674, - "step": 564480 + "epoch": 0.7, + "learning_rate": 1.5233035041816735e-05, + "loss": 2.6974, + "step": 194800 }, { - "epoch": 0.98, - "learning_rate": 7.798630705538912e-07, - "loss": 2.2377, - "step": 564490 + "epoch": 0.7, + "learning_rate": 1.5215187523871056e-05, + "loss": 2.7131, + "step": 194900 }, { - "epoch": 0.98, - "learning_rate": 7.789911306270644e-07, - "loss": 2.1686, - "step": 564500 + "epoch": 0.7, + "learning_rate": 1.5197340005925375e-05, + "loss": 2.7097, + "step": 195000 }, { - "epoch": 0.98, - "learning_rate": 7.781191907002375e-07, - "loss": 2.2091, - "step": 564510 + "epoch": 0.7, + "learning_rate": 1.5179492487979697e-05, + "loss": 2.7097, + "step": 195100 }, { - "epoch": 0.98, - "learning_rate": 7.772472507734108e-07, - "loss": 2.2464, - "step": 564520 + "epoch": 0.7, + "learning_rate": 1.5161644970034016e-05, + "loss": 2.7182, + "step": 195200 }, { - "epoch": 0.98, - "learning_rate": 7.763753108465839e-07, - "loss": 2.2199, - "step": 564530 + "epoch": 0.7, + "learning_rate": 1.5143797452088337e-05, + "loss": 2.7113, + "step": 195300 }, { - "epoch": 0.98, - "learning_rate": 7.755033709197572e-07, - "loss": 2.2362, - "step": 564540 + "epoch": 0.7, + "learning_rate": 1.512594993414266e-05, + "loss": 2.7196, + "step": 195400 }, { - "epoch": 0.98, - "learning_rate": 7.746314309929304e-07, - "loss": 2.2365, - "step": 564550 + "epoch": 0.7, + "learning_rate": 1.5108102416196981e-05, + "loss": 2.7211, + "step": 195500 }, { - "epoch": 0.98, - "learning_rate": 7.737594910661035e-07, - "loss": 2.2101, - "step": 564560 + "epoch": 0.7, + "learning_rate": 1.5090254898251303e-05, + "loss": 2.7129, + "step": 195600 }, { - "epoch": 0.98, - "learning_rate": 7.728875511392768e-07, - "loss": 2.2937, - "step": 564570 + "epoch": 0.7, + "learning_rate": 1.5072407380305622e-05, + "loss": 2.7124, + "step": 195700 }, { - "epoch": 0.98, - "learning_rate": 7.720156112124499e-07, - "loss": 2.2002, - "step": 564580 + "epoch": 0.7, + "learning_rate": 1.5054559862359943e-05, + "loss": 2.7142, + "step": 195800 }, { - "epoch": 0.98, - "learning_rate": 7.711436712856231e-07, - "loss": 2.0609, - "step": 564590 + "epoch": 0.7, + "learning_rate": 1.5036712344414265e-05, + "loss": 2.71, + "step": 195900 }, { - "epoch": 0.98, - "learning_rate": 7.702717313587964e-07, - "loss": 2.1932, - "step": 564600 + "epoch": 0.7, + "learning_rate": 1.5018864826468584e-05, + "loss": 2.7202, + "step": 196000 }, { - "epoch": 0.98, - "learning_rate": 7.693997914319695e-07, - "loss": 2.3044, - "step": 564610 + "epoch": 0.7, + "learning_rate": 1.5001017308522905e-05, + "loss": 2.7147, + "step": 196100 }, { - "epoch": 0.98, - "learning_rate": 7.685278515051428e-07, - "loss": 2.2504, - "step": 564620 + "epoch": 0.7, + "learning_rate": 1.4983169790577225e-05, + "loss": 2.705, + "step": 196200 }, { - "epoch": 0.98, - "learning_rate": 7.67655911578316e-07, - "loss": 2.1779, - "step": 564630 + "epoch": 0.7, + "learning_rate": 1.4965322272631546e-05, + "loss": 2.7123, + "step": 196300 }, { - "epoch": 0.98, - "learning_rate": 7.667839716514891e-07, - "loss": 2.1509, - "step": 564640 + "epoch": 0.7, + "learning_rate": 1.4947474754685867e-05, + "loss": 2.7156, + "step": 196400 }, { - "epoch": 0.98, - "learning_rate": 7.659120317246624e-07, - "loss": 2.222, - "step": 564650 + "epoch": 0.7, + "learning_rate": 1.4929627236740187e-05, + "loss": 2.716, + "step": 196500 }, { - "epoch": 0.98, - "learning_rate": 7.650400917978355e-07, - "loss": 2.3494, - "step": 564660 + "epoch": 0.7, + "learning_rate": 1.4911779718794508e-05, + "loss": 2.7234, + "step": 196600 }, { - "epoch": 0.98, - "learning_rate": 7.641681518710088e-07, - "loss": 2.3317, - "step": 564670 + "epoch": 0.7, + "learning_rate": 1.489393220084883e-05, + "loss": 2.7084, + "step": 196700 }, { - "epoch": 0.98, - "learning_rate": 7.63296211944182e-07, - "loss": 2.3167, - "step": 564680 + "epoch": 0.7, + "learning_rate": 1.4876084682903149e-05, + "loss": 2.7275, + "step": 196800 }, { - "epoch": 0.98, - "learning_rate": 7.624242720173551e-07, - "loss": 2.315, - "step": 564690 + "epoch": 0.7, + "learning_rate": 1.485823716495747e-05, + "loss": 2.7241, + "step": 196900 }, { - "epoch": 0.98, - "learning_rate": 7.615523320905284e-07, - "loss": 2.3124, - "step": 564700 + "epoch": 0.7, + "learning_rate": 1.4840389647011791e-05, + "loss": 2.7109, + "step": 197000 }, { - "epoch": 0.98, - "learning_rate": 7.606803921637015e-07, - "loss": 2.2515, - "step": 564710 + "epoch": 0.7, + "learning_rate": 1.482254212906611e-05, + "loss": 2.7211, + "step": 197100 }, { - "epoch": 0.98, - "learning_rate": 7.598084522368747e-07, - "loss": 2.3442, - "step": 564720 + "epoch": 0.7, + "learning_rate": 1.4804694611120432e-05, + "loss": 2.717, + "step": 197200 }, { - "epoch": 0.98, - "learning_rate": 7.58936512310048e-07, - "loss": 2.2467, - "step": 564730 + "epoch": 0.7, + "learning_rate": 1.4786847093174751e-05, + "loss": 2.7164, + "step": 197300 }, { - "epoch": 0.98, - "learning_rate": 7.580645723832211e-07, - "loss": 2.228, - "step": 564740 + "epoch": 0.7, + "learning_rate": 1.4768999575229073e-05, + "loss": 2.7071, + "step": 197400 }, { - "epoch": 0.98, - "learning_rate": 7.571926324563944e-07, - "loss": 2.2962, - "step": 564750 + "epoch": 0.7, + "learning_rate": 1.4751152057283394e-05, + "loss": 2.7143, + "step": 197500 }, { - "epoch": 0.98, - "learning_rate": 7.563206925295675e-07, - "loss": 2.333, - "step": 564760 + "epoch": 0.71, + "learning_rate": 1.4733304539337713e-05, + "loss": 2.7101, + "step": 197600 }, { - "epoch": 0.98, - "learning_rate": 7.554487526027407e-07, - "loss": 2.2435, - "step": 564770 + "epoch": 0.71, + "learning_rate": 1.4715457021392035e-05, + "loss": 2.703, + "step": 197700 }, { - "epoch": 0.98, - "learning_rate": 7.54576812675914e-07, - "loss": 2.2097, - "step": 564780 + "epoch": 0.71, + "learning_rate": 1.4697609503446356e-05, + "loss": 2.7191, + "step": 197800 }, { - "epoch": 0.98, - "learning_rate": 7.537048727490871e-07, - "loss": 2.2659, - "step": 564790 + "epoch": 0.71, + "learning_rate": 1.4679761985500679e-05, + "loss": 2.6988, + "step": 197900 }, { - "epoch": 0.98, - "learning_rate": 7.528329328222604e-07, - "loss": 2.2521, - "step": 564800 + "epoch": 0.71, + "learning_rate": 1.4661914467554998e-05, + "loss": 2.7139, + "step": 198000 }, { - "epoch": 0.98, - "learning_rate": 7.519609928954335e-07, - "loss": 2.3104, - "step": 564810 + "epoch": 0.71, + "learning_rate": 1.464406694960932e-05, + "loss": 2.7126, + "step": 198100 }, { - "epoch": 0.98, - "learning_rate": 7.510890529686067e-07, - "loss": 2.3152, - "step": 564820 + "epoch": 0.71, + "learning_rate": 1.462621943166364e-05, + "loss": 2.7098, + "step": 198200 }, { - "epoch": 0.98, - "learning_rate": 7.5021711304178e-07, - "loss": 2.2084, - "step": 564830 + "epoch": 0.71, + "learning_rate": 1.460837191371796e-05, + "loss": 2.7169, + "step": 198300 }, { - "epoch": 0.99, - "learning_rate": 7.493451731149531e-07, - "loss": 2.2544, - "step": 564840 + "epoch": 0.71, + "learning_rate": 1.4590524395772281e-05, + "loss": 2.7155, + "step": 198400 }, { - "epoch": 0.99, - "learning_rate": 7.484732331881263e-07, - "loss": 2.2766, - "step": 564850 + "epoch": 0.71, + "learning_rate": 1.4572676877826603e-05, + "loss": 2.7074, + "step": 198500 }, { - "epoch": 0.99, - "learning_rate": 7.476012932612995e-07, - "loss": 2.3273, - "step": 564860 + "epoch": 0.71, + "learning_rate": 1.4554829359880922e-05, + "loss": 2.7125, + "step": 198600 }, { - "epoch": 0.99, - "learning_rate": 7.467293533344727e-07, - "loss": 2.3189, - "step": 564870 + "epoch": 0.71, + "learning_rate": 1.4536981841935243e-05, + "loss": 2.7075, + "step": 198700 }, { - "epoch": 0.99, - "learning_rate": 7.45857413407646e-07, - "loss": 2.0952, - "step": 564880 + "epoch": 0.71, + "learning_rate": 1.4519134323989565e-05, + "loss": 2.7093, + "step": 198800 }, { - "epoch": 0.99, - "learning_rate": 7.449854734808191e-07, - "loss": 2.1253, - "step": 564890 + "epoch": 0.71, + "learning_rate": 1.4501286806043884e-05, + "loss": 2.723, + "step": 198900 }, { - "epoch": 0.99, - "learning_rate": 7.441135335539923e-07, - "loss": 2.3869, - "step": 564900 + "epoch": 0.71, + "learning_rate": 1.4483439288098205e-05, + "loss": 2.7153, + "step": 199000 }, { - "epoch": 0.99, - "learning_rate": 7.432415936271655e-07, - "loss": 2.2481, - "step": 564910 + "epoch": 0.71, + "learning_rate": 1.4465591770152525e-05, + "loss": 2.722, + "step": 199100 }, { - "epoch": 0.99, - "learning_rate": 7.423696537003387e-07, - "loss": 2.1201, - "step": 564920 + "epoch": 0.71, + "learning_rate": 1.4447744252206846e-05, + "loss": 2.7141, + "step": 199200 }, { - "epoch": 0.99, - "learning_rate": 7.41497713773512e-07, - "loss": 2.2553, - "step": 564930 + "epoch": 0.71, + "learning_rate": 1.4429896734261167e-05, + "loss": 2.7116, + "step": 199300 }, { - "epoch": 0.99, - "learning_rate": 7.406257738466851e-07, - "loss": 2.2527, - "step": 564940 + "epoch": 0.71, + "learning_rate": 1.4412049216315487e-05, + "loss": 2.7091, + "step": 199400 }, { - "epoch": 0.99, - "learning_rate": 7.397538339198583e-07, - "loss": 2.2273, - "step": 564950 + "epoch": 0.71, + "learning_rate": 1.4394201698369808e-05, + "loss": 2.7091, + "step": 199500 }, { - "epoch": 0.99, - "learning_rate": 7.388818939930315e-07, - "loss": 2.2804, - "step": 564960 + "epoch": 0.71, + "learning_rate": 1.437635418042413e-05, + "loss": 2.7183, + "step": 199600 }, { - "epoch": 0.99, - "learning_rate": 7.380099540662047e-07, - "loss": 2.2636, - "step": 564970 + "epoch": 0.71, + "learning_rate": 1.4358506662478449e-05, + "loss": 2.7198, + "step": 199700 }, { - "epoch": 0.99, - "learning_rate": 7.371380141393779e-07, - "loss": 2.2305, - "step": 564980 + "epoch": 0.71, + "learning_rate": 1.434065914453277e-05, + "loss": 2.7075, + "step": 199800 }, { - "epoch": 0.99, - "learning_rate": 7.362660742125511e-07, - "loss": 2.1349, - "step": 564990 + "epoch": 0.71, + "learning_rate": 1.4322811626587091e-05, + "loss": 2.7077, + "step": 199900 }, { - "epoch": 0.99, - "learning_rate": 7.353941342857243e-07, - "loss": 2.1725, - "step": 565000 + "epoch": 0.71, + "learning_rate": 1.430496410864141e-05, + "loss": 2.7082, + "step": 200000 }, { - "epoch": 0.99, - "learning_rate": 7.345221943588974e-07, - "loss": 2.3944, - "step": 565010 + "epoch": 0.71, + "learning_rate": 1.4287116590695732e-05, + "loss": 2.7021, + "step": 200100 }, { - "epoch": 0.99, - "learning_rate": 7.336502544320707e-07, - "loss": 2.3278, - "step": 565020 + "epoch": 0.71, + "learning_rate": 1.4269269072750051e-05, + "loss": 2.7069, + "step": 200200 }, { - "epoch": 0.99, - "learning_rate": 7.327783145052439e-07, - "loss": 2.2342, - "step": 565030 + "epoch": 0.71, + "learning_rate": 1.4251421554804373e-05, + "loss": 2.7115, + "step": 200300 }, { - "epoch": 0.99, - "learning_rate": 7.319063745784171e-07, - "loss": 2.2451, - "step": 565040 + "epoch": 0.72, + "learning_rate": 1.4233574036858694e-05, + "loss": 2.721, + "step": 200400 }, { - "epoch": 0.99, - "learning_rate": 7.310344346515903e-07, - "loss": 2.1649, - "step": 565050 + "epoch": 0.72, + "learning_rate": 1.4215726518913017e-05, + "loss": 2.7126, + "step": 200500 }, { - "epoch": 0.99, - "learning_rate": 7.301624947247634e-07, - "loss": 2.3163, - "step": 565060 + "epoch": 0.72, + "learning_rate": 1.4197879000967338e-05, + "loss": 2.71, + "step": 200600 }, { - "epoch": 0.99, - "learning_rate": 7.292905547979367e-07, - "loss": 2.3208, - "step": 565070 + "epoch": 0.72, + "learning_rate": 1.4180031483021658e-05, + "loss": 2.7111, + "step": 200700 }, { - "epoch": 0.99, - "learning_rate": 7.284186148711099e-07, - "loss": 2.2829, - "step": 565080 + "epoch": 0.72, + "learning_rate": 1.4162183965075979e-05, + "loss": 2.7108, + "step": 200800 }, { - "epoch": 0.99, - "learning_rate": 7.275466749442831e-07, - "loss": 2.3568, - "step": 565090 + "epoch": 0.72, + "learning_rate": 1.41443364471303e-05, + "loss": 2.7228, + "step": 200900 }, { - "epoch": 0.99, - "learning_rate": 7.266747350174563e-07, - "loss": 2.2269, - "step": 565100 + "epoch": 0.72, + "learning_rate": 1.412648892918462e-05, + "loss": 2.7085, + "step": 201000 }, { - "epoch": 0.99, - "learning_rate": 7.258027950906294e-07, - "loss": 2.2657, - "step": 565110 + "epoch": 0.72, + "learning_rate": 1.410864141123894e-05, + "loss": 2.7095, + "step": 201100 }, { - "epoch": 0.99, - "learning_rate": 7.249308551638027e-07, - "loss": 2.2955, - "step": 565120 + "epoch": 0.72, + "learning_rate": 1.409079389329326e-05, + "loss": 2.7077, + "step": 201200 }, { - "epoch": 0.99, - "learning_rate": 7.240589152369759e-07, - "loss": 2.2948, - "step": 565130 + "epoch": 0.72, + "learning_rate": 1.4072946375347581e-05, + "loss": 2.7039, + "step": 201300 }, { - "epoch": 0.99, - "learning_rate": 7.23186975310149e-07, - "loss": 2.3701, - "step": 565140 + "epoch": 0.72, + "learning_rate": 1.4055098857401903e-05, + "loss": 2.7041, + "step": 201400 }, { - "epoch": 0.99, - "learning_rate": 7.223150353833223e-07, - "loss": 2.1348, - "step": 565150 + "epoch": 0.72, + "learning_rate": 1.4037251339456222e-05, + "loss": 2.7023, + "step": 201500 }, { - "epoch": 0.99, - "learning_rate": 7.214430954564954e-07, - "loss": 2.1794, - "step": 565160 + "epoch": 0.72, + "learning_rate": 1.4019403821510543e-05, + "loss": 2.7144, + "step": 201600 }, { - "epoch": 0.99, - "learning_rate": 7.205711555296687e-07, - "loss": 2.2437, - "step": 565170 + "epoch": 0.72, + "learning_rate": 1.4001556303564865e-05, + "loss": 2.7156, + "step": 201700 }, { - "epoch": 0.99, - "learning_rate": 7.196992156028419e-07, - "loss": 2.2745, - "step": 565180 + "epoch": 0.72, + "learning_rate": 1.3983708785619184e-05, + "loss": 2.7142, + "step": 201800 }, { - "epoch": 0.99, - "learning_rate": 7.18827275676015e-07, - "loss": 2.3191, - "step": 565190 + "epoch": 0.72, + "learning_rate": 1.3965861267673505e-05, + "loss": 2.7201, + "step": 201900 }, { - "epoch": 0.99, - "learning_rate": 7.179553357491883e-07, - "loss": 2.229, - "step": 565200 + "epoch": 0.72, + "learning_rate": 1.3948013749727827e-05, + "loss": 2.6971, + "step": 202000 }, { - "epoch": 0.99, - "learning_rate": 7.170833958223614e-07, - "loss": 2.2031, - "step": 565210 + "epoch": 0.72, + "learning_rate": 1.3930166231782146e-05, + "loss": 2.7061, + "step": 202100 }, { - "epoch": 0.99, - "learning_rate": 7.162114558955347e-07, - "loss": 2.187, - "step": 565220 + "epoch": 0.72, + "learning_rate": 1.3912318713836467e-05, + "loss": 2.6988, + "step": 202200 }, { - "epoch": 0.99, - "learning_rate": 7.153395159687079e-07, - "loss": 2.338, - "step": 565230 + "epoch": 0.72, + "learning_rate": 1.3894471195890787e-05, + "loss": 2.6982, + "step": 202300 }, { - "epoch": 0.99, - "learning_rate": 7.14467576041881e-07, - "loss": 2.1543, - "step": 565240 + "epoch": 0.72, + "learning_rate": 1.3876623677945108e-05, + "loss": 2.7014, + "step": 202400 }, { - "epoch": 0.99, - "learning_rate": 7.135956361150543e-07, - "loss": 2.2273, - "step": 565250 + "epoch": 0.72, + "learning_rate": 1.385877615999943e-05, + "loss": 2.7116, + "step": 202500 }, { - "epoch": 0.99, - "learning_rate": 7.127236961882274e-07, - "loss": 2.2736, - "step": 565260 + "epoch": 0.72, + "learning_rate": 1.3840928642053749e-05, + "loss": 2.7166, + "step": 202600 }, { - "epoch": 0.99, - "learning_rate": 7.118517562614006e-07, - "loss": 2.2796, - "step": 565270 + "epoch": 0.72, + "learning_rate": 1.382308112410807e-05, + "loss": 2.7059, + "step": 202700 }, { - "epoch": 0.99, - "learning_rate": 7.109798163345739e-07, - "loss": 2.2559, - "step": 565280 + "epoch": 0.72, + "learning_rate": 1.3805233606162391e-05, + "loss": 2.7062, + "step": 202800 }, { - "epoch": 0.99, - "learning_rate": 7.10107876407747e-07, - "loss": 2.2563, - "step": 565290 + "epoch": 0.72, + "learning_rate": 1.378738608821671e-05, + "loss": 2.7098, + "step": 202900 }, { - "epoch": 0.99, - "learning_rate": 7.092359364809203e-07, - "loss": 2.2775, - "step": 565300 + "epoch": 0.72, + "learning_rate": 1.3769538570271035e-05, + "loss": 2.7037, + "step": 203000 }, { - "epoch": 0.99, - "learning_rate": 7.083639965540934e-07, - "loss": 2.2039, - "step": 565310 + "epoch": 0.72, + "learning_rate": 1.3751691052325355e-05, + "loss": 2.6999, + "step": 203100 }, { - "epoch": 0.99, - "learning_rate": 7.074920566272666e-07, - "loss": 2.2327, - "step": 565320 + "epoch": 0.73, + "learning_rate": 1.3733843534379676e-05, + "loss": 2.7086, + "step": 203200 }, { - "epoch": 0.99, - "learning_rate": 7.066201167004399e-07, - "loss": 2.3388, - "step": 565330 + "epoch": 0.73, + "learning_rate": 1.3715996016433996e-05, + "loss": 2.6995, + "step": 203300 }, { - "epoch": 0.99, - "learning_rate": 7.05748176773613e-07, - "loss": 2.2131, - "step": 565340 + "epoch": 0.73, + "learning_rate": 1.3698148498488317e-05, + "loss": 2.711, + "step": 203400 }, { - "epoch": 0.99, - "learning_rate": 7.048762368467862e-07, - "loss": 2.2595, - "step": 565350 + "epoch": 0.73, + "learning_rate": 1.3680300980542638e-05, + "loss": 2.7133, + "step": 203500 }, { - "epoch": 0.99, - "learning_rate": 7.040042969199594e-07, - "loss": 2.1787, - "step": 565360 + "epoch": 0.73, + "learning_rate": 1.3662453462596957e-05, + "loss": 2.7038, + "step": 203600 }, { - "epoch": 0.99, - "learning_rate": 7.031323569931326e-07, - "loss": 2.2854, - "step": 565370 + "epoch": 0.73, + "learning_rate": 1.3644605944651279e-05, + "loss": 2.7063, + "step": 203700 }, { - "epoch": 0.99, - "learning_rate": 7.022604170663059e-07, - "loss": 2.2124, - "step": 565380 + "epoch": 0.73, + "learning_rate": 1.36267584267056e-05, + "loss": 2.7157, + "step": 203800 }, { - "epoch": 0.99, - "learning_rate": 7.01388477139479e-07, - "loss": 2.1589, - "step": 565390 + "epoch": 0.73, + "learning_rate": 1.360891090875992e-05, + "loss": 2.7108, + "step": 203900 }, { - "epoch": 0.99, - "learning_rate": 7.005165372126522e-07, - "loss": 2.2644, - "step": 565400 + "epoch": 0.73, + "learning_rate": 1.359106339081424e-05, + "loss": 2.7191, + "step": 204000 }, { - "epoch": 0.99, - "learning_rate": 6.996445972858254e-07, - "loss": 2.4313, - "step": 565410 + "epoch": 0.73, + "learning_rate": 1.357321587286856e-05, + "loss": 2.7154, + "step": 204100 }, { - "epoch": 0.99, - "learning_rate": 6.987726573589986e-07, - "loss": 2.2437, - "step": 565420 + "epoch": 0.73, + "learning_rate": 1.3555368354922881e-05, + "loss": 2.7079, + "step": 204200 }, { - "epoch": 0.99, - "learning_rate": 6.979007174321719e-07, - "loss": 2.2907, - "step": 565430 + "epoch": 0.73, + "learning_rate": 1.3537520836977203e-05, + "loss": 2.7155, + "step": 204300 }, { - "epoch": 0.99, - "learning_rate": 6.97028777505345e-07, - "loss": 2.2222, - "step": 565440 + "epoch": 0.73, + "learning_rate": 1.3519673319031522e-05, + "loss": 2.7104, + "step": 204400 }, { - "epoch": 0.99, - "learning_rate": 6.961568375785182e-07, - "loss": 2.3191, - "step": 565450 + "epoch": 0.73, + "learning_rate": 1.3501825801085843e-05, + "loss": 2.7177, + "step": 204500 }, { - "epoch": 0.99, - "learning_rate": 6.952848976516914e-07, - "loss": 2.1629, - "step": 565460 + "epoch": 0.73, + "learning_rate": 1.3483978283140165e-05, + "loss": 2.7027, + "step": 204600 }, { - "epoch": 0.99, - "learning_rate": 6.944129577248646e-07, - "loss": 2.1649, - "step": 565470 + "epoch": 0.73, + "learning_rate": 1.3466130765194484e-05, + "loss": 2.7069, + "step": 204700 }, { - "epoch": 0.99, - "learning_rate": 6.935410177980378e-07, - "loss": 2.1814, - "step": 565480 + "epoch": 0.73, + "learning_rate": 1.3448283247248805e-05, + "loss": 2.7113, + "step": 204800 }, { - "epoch": 0.99, - "learning_rate": 6.92669077871211e-07, - "loss": 2.1859, - "step": 565490 + "epoch": 0.73, + "learning_rate": 1.3430435729303127e-05, + "loss": 2.7089, + "step": 204900 }, { - "epoch": 0.99, - "learning_rate": 6.917971379443842e-07, - "loss": 2.2481, - "step": 565500 + "epoch": 0.73, + "learning_rate": 1.3412588211357446e-05, + "loss": 2.7084, + "step": 205000 }, { - "epoch": 0.99, - "learning_rate": 6.909251980175574e-07, - "loss": 2.2751, - "step": 565510 + "epoch": 0.73, + "learning_rate": 1.3394740693411767e-05, + "loss": 2.7063, + "step": 205100 }, { - "epoch": 0.99, - "learning_rate": 6.900532580907306e-07, - "loss": 2.1521, - "step": 565520 + "epoch": 0.73, + "learning_rate": 1.3376893175466087e-05, + "loss": 2.7047, + "step": 205200 }, { - "epoch": 0.99, - "learning_rate": 6.891813181639038e-07, - "loss": 2.3292, - "step": 565530 + "epoch": 0.73, + "learning_rate": 1.3359045657520408e-05, + "loss": 2.7045, + "step": 205300 }, { - "epoch": 0.99, - "learning_rate": 6.88309378237077e-07, - "loss": 2.2744, - "step": 565540 + "epoch": 0.73, + "learning_rate": 1.334119813957473e-05, + "loss": 2.7003, + "step": 205400 }, { - "epoch": 0.99, - "learning_rate": 6.874374383102502e-07, - "loss": 2.311, - "step": 565550 + "epoch": 0.73, + "learning_rate": 1.3323350621629049e-05, + "loss": 2.7127, + "step": 205500 }, { - "epoch": 0.99, - "learning_rate": 6.865654983834233e-07, - "loss": 2.3417, - "step": 565560 + "epoch": 0.73, + "learning_rate": 1.3305503103683373e-05, + "loss": 2.706, + "step": 205600 }, { - "epoch": 0.99, - "learning_rate": 6.856935584565966e-07, - "loss": 2.2685, - "step": 565570 + "epoch": 0.73, + "learning_rate": 1.3287655585737693e-05, + "loss": 2.7087, + "step": 205700 }, { - "epoch": 0.99, - "learning_rate": 6.848216185297698e-07, - "loss": 2.1714, - "step": 565580 + "epoch": 0.73, + "learning_rate": 1.3269808067792014e-05, + "loss": 2.7042, + "step": 205800 }, { - "epoch": 0.99, - "learning_rate": 6.83949678602943e-07, - "loss": 2.2941, - "step": 565590 + "epoch": 0.73, + "learning_rate": 1.3251960549846335e-05, + "loss": 2.7102, + "step": 205900 }, { - "epoch": 0.99, - "learning_rate": 6.830777386761162e-07, - "loss": 2.2803, - "step": 565600 + "epoch": 0.74, + "learning_rate": 1.3234113031900655e-05, + "loss": 2.7052, + "step": 206000 }, { - "epoch": 0.99, - "learning_rate": 6.822057987492893e-07, - "loss": 2.2903, - "step": 565610 + "epoch": 0.74, + "learning_rate": 1.3216265513954976e-05, + "loss": 2.7132, + "step": 206100 }, { - "epoch": 0.99, - "learning_rate": 6.813338588224626e-07, - "loss": 2.246, - "step": 565620 + "epoch": 0.74, + "learning_rate": 1.3198417996009296e-05, + "loss": 2.7066, + "step": 206200 }, { - "epoch": 0.99, - "learning_rate": 6.804619188956358e-07, - "loss": 2.3149, - "step": 565630 + "epoch": 0.74, + "learning_rate": 1.3180570478063617e-05, + "loss": 2.7044, + "step": 206300 }, { - "epoch": 0.99, - "learning_rate": 6.79589978968809e-07, - "loss": 2.2535, - "step": 565640 + "epoch": 0.74, + "learning_rate": 1.3162722960117938e-05, + "loss": 2.7034, + "step": 206400 }, { - "epoch": 0.99, - "learning_rate": 6.787180390419822e-07, - "loss": 2.3071, - "step": 565650 + "epoch": 0.74, + "learning_rate": 1.3144875442172257e-05, + "loss": 2.7098, + "step": 206500 }, { - "epoch": 0.99, - "learning_rate": 6.778460991151553e-07, - "loss": 2.1893, - "step": 565660 + "epoch": 0.74, + "learning_rate": 1.3127027924226579e-05, + "loss": 2.7157, + "step": 206600 }, { - "epoch": 0.99, - "learning_rate": 6.769741591883286e-07, - "loss": 2.2613, - "step": 565670 + "epoch": 0.74, + "learning_rate": 1.31091804062809e-05, + "loss": 2.7046, + "step": 206700 }, { - "epoch": 0.99, - "learning_rate": 6.761022192615018e-07, - "loss": 2.3175, - "step": 565680 + "epoch": 0.74, + "learning_rate": 1.309133288833522e-05, + "loss": 2.7127, + "step": 206800 }, { - "epoch": 0.99, - "learning_rate": 6.752302793346749e-07, - "loss": 2.2578, - "step": 565690 + "epoch": 0.74, + "learning_rate": 1.307348537038954e-05, + "loss": 2.7212, + "step": 206900 }, { - "epoch": 0.99, - "learning_rate": 6.743583394078482e-07, - "loss": 2.2987, - "step": 565700 + "epoch": 0.74, + "learning_rate": 1.3055637852443862e-05, + "loss": 2.7121, + "step": 207000 }, { - "epoch": 0.99, - "learning_rate": 6.734863994810213e-07, - "loss": 2.2943, - "step": 565710 + "epoch": 0.74, + "learning_rate": 1.3037790334498181e-05, + "loss": 2.7047, + "step": 207100 }, { - "epoch": 0.99, - "learning_rate": 6.726144595541946e-07, - "loss": 2.3093, - "step": 565720 + "epoch": 0.74, + "learning_rate": 1.3019942816552503e-05, + "loss": 2.7158, + "step": 207200 }, { - "epoch": 0.99, - "learning_rate": 6.717425196273678e-07, - "loss": 2.3023, - "step": 565730 + "epoch": 0.74, + "learning_rate": 1.3002095298606822e-05, + "loss": 2.7122, + "step": 207300 }, { - "epoch": 0.99, - "learning_rate": 6.708705797005409e-07, - "loss": 2.3029, - "step": 565740 + "epoch": 0.74, + "learning_rate": 1.2984247780661143e-05, + "loss": 2.7048, + "step": 207400 }, { - "epoch": 0.99, - "learning_rate": 6.699986397737142e-07, - "loss": 2.2944, - "step": 565750 + "epoch": 0.74, + "learning_rate": 1.2966400262715465e-05, + "loss": 2.6977, + "step": 207500 }, { - "epoch": 0.99, - "learning_rate": 6.691266998468873e-07, - "loss": 2.3321, - "step": 565760 + "epoch": 0.74, + "learning_rate": 1.2948552744769784e-05, + "loss": 2.7032, + "step": 207600 }, { - "epoch": 0.99, - "learning_rate": 6.682547599200606e-07, - "loss": 2.1969, - "step": 565770 + "epoch": 0.74, + "learning_rate": 1.2930705226824105e-05, + "loss": 2.7065, + "step": 207700 }, { - "epoch": 0.99, - "learning_rate": 6.673828199932338e-07, - "loss": 2.2164, - "step": 565780 + "epoch": 0.74, + "learning_rate": 1.2912857708878426e-05, + "loss": 2.7104, + "step": 207800 }, { - "epoch": 0.99, - "learning_rate": 6.665108800664069e-07, - "loss": 2.3573, - "step": 565790 + "epoch": 0.74, + "learning_rate": 1.2895010190932746e-05, + "loss": 2.7086, + "step": 207900 }, { - "epoch": 0.99, - "learning_rate": 6.656389401395802e-07, - "loss": 2.2565, - "step": 565800 + "epoch": 0.74, + "learning_rate": 1.2877162672987067e-05, + "loss": 2.7076, + "step": 208000 }, { - "epoch": 0.99, - "learning_rate": 6.647670002127533e-07, - "loss": 2.0959, - "step": 565810 + "epoch": 0.74, + "learning_rate": 1.285931515504139e-05, + "loss": 2.7008, + "step": 208100 }, { - "epoch": 0.99, - "learning_rate": 6.638950602859265e-07, - "loss": 2.2382, - "step": 565820 + "epoch": 0.74, + "learning_rate": 1.2841467637095711e-05, + "loss": 2.712, + "step": 208200 }, { - "epoch": 0.99, - "learning_rate": 6.630231203590998e-07, - "loss": 2.2548, - "step": 565830 + "epoch": 0.74, + "learning_rate": 1.2823620119150031e-05, + "loss": 2.7053, + "step": 208300 }, { - "epoch": 0.99, - "learning_rate": 6.621511804322729e-07, - "loss": 2.3389, - "step": 565840 + "epoch": 0.74, + "learning_rate": 1.2805772601204352e-05, + "loss": 2.7051, + "step": 208400 }, { - "epoch": 0.99, - "learning_rate": 6.612792405054462e-07, - "loss": 2.2666, - "step": 565850 + "epoch": 0.74, + "learning_rate": 1.2787925083258673e-05, + "loss": 2.7001, + "step": 208500 }, { - "epoch": 0.99, - "learning_rate": 6.604073005786193e-07, - "loss": 2.2959, - "step": 565860 + "epoch": 0.74, + "learning_rate": 1.2770077565312993e-05, + "loss": 2.697, + "step": 208600 }, { - "epoch": 0.99, - "learning_rate": 6.595353606517925e-07, - "loss": 2.0676, - "step": 565870 + "epoch": 0.74, + "learning_rate": 1.2752230047367314e-05, + "loss": 2.7099, + "step": 208700 }, { - "epoch": 0.99, - "learning_rate": 6.586634207249658e-07, - "loss": 2.2161, - "step": 565880 + "epoch": 0.75, + "learning_rate": 1.2734382529421635e-05, + "loss": 2.7105, + "step": 208800 }, { - "epoch": 0.99, - "learning_rate": 6.577914807981389e-07, - "loss": 2.1892, - "step": 565890 + "epoch": 0.75, + "learning_rate": 1.2716535011475955e-05, + "loss": 2.7111, + "step": 208900 }, { - "epoch": 0.99, - "learning_rate": 6.569195408713121e-07, - "loss": 2.2233, - "step": 565900 + "epoch": 0.75, + "learning_rate": 1.2698687493530276e-05, + "loss": 2.7154, + "step": 209000 }, { - "epoch": 0.99, - "learning_rate": 6.560476009444853e-07, - "loss": 2.4397, - "step": 565910 + "epoch": 0.75, + "learning_rate": 1.2680839975584596e-05, + "loss": 2.7073, + "step": 209100 }, { - "epoch": 0.99, - "learning_rate": 6.551756610176585e-07, - "loss": 2.2185, - "step": 565920 + "epoch": 0.75, + "learning_rate": 1.2662992457638917e-05, + "loss": 2.7087, + "step": 209200 }, { - "epoch": 0.99, - "learning_rate": 6.543037210908318e-07, - "loss": 2.2773, - "step": 565930 + "epoch": 0.75, + "learning_rate": 1.2645144939693238e-05, + "loss": 2.7062, + "step": 209300 }, { - "epoch": 0.99, - "learning_rate": 6.534317811640049e-07, - "loss": 2.2584, - "step": 565940 + "epoch": 0.75, + "learning_rate": 1.2627297421747557e-05, + "loss": 2.7118, + "step": 209400 }, { - "epoch": 0.99, - "learning_rate": 6.525598412371781e-07, - "loss": 2.2271, - "step": 565950 + "epoch": 0.75, + "learning_rate": 1.2609449903801879e-05, + "loss": 2.7088, + "step": 209500 }, { - "epoch": 0.99, - "learning_rate": 6.516879013103513e-07, - "loss": 2.3018, - "step": 565960 + "epoch": 0.75, + "learning_rate": 1.25916023858562e-05, + "loss": 2.7063, + "step": 209600 }, { - "epoch": 0.99, - "learning_rate": 6.508159613835245e-07, - "loss": 2.2351, - "step": 565970 + "epoch": 0.75, + "learning_rate": 1.257375486791052e-05, + "loss": 2.6977, + "step": 209700 }, { - "epoch": 0.99, - "learning_rate": 6.499440214566978e-07, - "loss": 2.3005, - "step": 565980 + "epoch": 0.75, + "learning_rate": 1.255590734996484e-05, + "loss": 2.704, + "step": 209800 }, { - "epoch": 0.99, - "learning_rate": 6.490720815298709e-07, - "loss": 2.304, - "step": 565990 + "epoch": 0.75, + "learning_rate": 1.2538059832019162e-05, + "loss": 2.7019, + "step": 209900 }, { - "epoch": 0.99, - "learning_rate": 6.482001416030441e-07, - "loss": 2.2917, - "step": 566000 + "epoch": 0.75, + "learning_rate": 1.2520212314073481e-05, + "loss": 2.7064, + "step": 210000 }, { - "epoch": 0.99, - "learning_rate": 6.473282016762173e-07, - "loss": 2.3166, - "step": 566010 + "epoch": 0.75, + "learning_rate": 1.2502364796127803e-05, + "loss": 2.7135, + "step": 210100 }, { - "epoch": 0.99, - "learning_rate": 6.464562617493905e-07, - "loss": 2.1891, - "step": 566020 + "epoch": 0.75, + "learning_rate": 1.2484517278182124e-05, + "loss": 2.699, + "step": 210200 }, { - "epoch": 0.99, - "learning_rate": 6.455843218225637e-07, - "loss": 2.2635, - "step": 566030 + "epoch": 0.75, + "learning_rate": 1.2466669760236445e-05, + "loss": 2.6967, + "step": 210300 }, { - "epoch": 0.99, - "learning_rate": 6.447123818957369e-07, - "loss": 2.2639, - "step": 566040 + "epoch": 0.75, + "learning_rate": 1.2448822242290766e-05, + "loss": 2.6995, + "step": 210400 }, { - "epoch": 0.99, - "learning_rate": 6.438404419689101e-07, - "loss": 2.1587, - "step": 566050 + "epoch": 0.75, + "learning_rate": 1.2430974724345086e-05, + "loss": 2.7137, + "step": 210500 }, { - "epoch": 0.99, - "learning_rate": 6.429685020420834e-07, - "loss": 2.3593, - "step": 566060 + "epoch": 0.75, + "learning_rate": 1.2413127206399407e-05, + "loss": 2.7117, + "step": 210600 }, { - "epoch": 0.99, - "learning_rate": 6.420965621152565e-07, - "loss": 2.231, - "step": 566070 + "epoch": 0.75, + "learning_rate": 1.2395279688453726e-05, + "loss": 2.7145, + "step": 210700 }, { - "epoch": 0.99, - "learning_rate": 6.412246221884297e-07, - "loss": 2.2201, - "step": 566080 + "epoch": 0.75, + "learning_rate": 1.2377432170508048e-05, + "loss": 2.7083, + "step": 210800 }, { - "epoch": 0.99, - "learning_rate": 6.403526822616029e-07, - "loss": 2.3107, - "step": 566090 + "epoch": 0.75, + "learning_rate": 1.2359584652562369e-05, + "loss": 2.7017, + "step": 210900 }, { - "epoch": 0.99, - "learning_rate": 6.394807423347761e-07, - "loss": 2.0938, - "step": 566100 + "epoch": 0.75, + "learning_rate": 1.2341737134616688e-05, + "loss": 2.7052, + "step": 211000 }, { - "epoch": 0.99, - "learning_rate": 6.386088024079494e-07, - "loss": 2.1503, - "step": 566110 + "epoch": 0.75, + "learning_rate": 1.232388961667101e-05, + "loss": 2.7031, + "step": 211100 }, { - "epoch": 0.99, - "learning_rate": 6.377368624811225e-07, - "loss": 2.2791, - "step": 566120 + "epoch": 0.75, + "learning_rate": 1.2306042098725331e-05, + "loss": 2.6986, + "step": 211200 }, { - "epoch": 0.99, - "learning_rate": 6.368649225542957e-07, - "loss": 2.2775, - "step": 566130 + "epoch": 0.75, + "learning_rate": 1.2288194580779652e-05, + "loss": 2.7134, + "step": 211300 }, { - "epoch": 0.99, - "learning_rate": 6.359929826274689e-07, - "loss": 2.2487, - "step": 566140 + "epoch": 0.75, + "learning_rate": 1.2270347062833973e-05, + "loss": 2.7121, + "step": 211400 }, { - "epoch": 0.99, - "learning_rate": 6.351210427006421e-07, - "loss": 2.3185, - "step": 566150 + "epoch": 0.75, + "learning_rate": 1.2252499544888293e-05, + "loss": 2.6999, + "step": 211500 }, { - "epoch": 0.99, - "learning_rate": 6.342491027738153e-07, - "loss": 2.3706, - "step": 566160 + "epoch": 0.76, + "learning_rate": 1.2234652026942614e-05, + "loss": 2.7063, + "step": 211600 }, { - "epoch": 0.99, - "learning_rate": 6.333771628469885e-07, - "loss": 2.2743, - "step": 566170 + "epoch": 0.76, + "learning_rate": 1.2216804508996935e-05, + "loss": 2.7068, + "step": 211700 }, { - "epoch": 0.99, - "learning_rate": 6.325052229201617e-07, - "loss": 2.2395, - "step": 566180 + "epoch": 0.76, + "learning_rate": 1.2198956991051255e-05, + "loss": 2.711, + "step": 211800 }, { - "epoch": 0.99, - "learning_rate": 6.316332829933349e-07, - "loss": 2.151, - "step": 566190 + "epoch": 0.76, + "learning_rate": 1.2181109473105576e-05, + "loss": 2.7179, + "step": 211900 }, { - "epoch": 0.99, - "learning_rate": 6.307613430665081e-07, - "loss": 2.266, - "step": 566200 + "epoch": 0.76, + "learning_rate": 1.2163261955159897e-05, + "loss": 2.7077, + "step": 212000 }, { - "epoch": 0.99, - "learning_rate": 6.298894031396813e-07, - "loss": 2.1623, - "step": 566210 + "epoch": 0.76, + "learning_rate": 1.2145414437214217e-05, + "loss": 2.703, + "step": 212100 }, { - "epoch": 0.99, - "learning_rate": 6.290174632128545e-07, - "loss": 2.2844, - "step": 566220 + "epoch": 0.76, + "learning_rate": 1.2127566919268538e-05, + "loss": 2.709, + "step": 212200 }, { - "epoch": 0.99, - "learning_rate": 6.281455232860277e-07, - "loss": 2.2503, - "step": 566230 + "epoch": 0.76, + "learning_rate": 1.2109719401322857e-05, + "loss": 2.703, + "step": 212300 }, { - "epoch": 0.99, - "learning_rate": 6.272735833592008e-07, - "loss": 2.3142, - "step": 566240 + "epoch": 0.76, + "learning_rate": 1.2091871883377179e-05, + "loss": 2.7035, + "step": 212400 }, { - "epoch": 0.99, - "learning_rate": 6.264016434323741e-07, - "loss": 2.2609, - "step": 566250 + "epoch": 0.76, + "learning_rate": 1.20740243654315e-05, + "loss": 2.6925, + "step": 212500 }, { - "epoch": 0.99, - "learning_rate": 6.255297035055473e-07, - "loss": 2.2132, - "step": 566260 + "epoch": 0.76, + "learning_rate": 1.2056176847485821e-05, + "loss": 2.7145, + "step": 212600 }, { - "epoch": 0.99, - "learning_rate": 6.246577635787205e-07, - "loss": 2.2403, - "step": 566270 + "epoch": 0.76, + "learning_rate": 1.2038329329540142e-05, + "loss": 2.7073, + "step": 212700 }, { - "epoch": 0.99, - "learning_rate": 6.237858236518937e-07, - "loss": 2.2105, - "step": 566280 + "epoch": 0.76, + "learning_rate": 1.2020481811594462e-05, + "loss": 2.7192, + "step": 212800 }, { - "epoch": 0.99, - "learning_rate": 6.229138837250668e-07, - "loss": 2.3248, - "step": 566290 + "epoch": 0.76, + "learning_rate": 1.2002634293648783e-05, + "loss": 2.7103, + "step": 212900 }, { - "epoch": 0.99, - "learning_rate": 6.220419437982401e-07, - "loss": 2.2775, - "step": 566300 + "epoch": 0.76, + "learning_rate": 1.1984786775703104e-05, + "loss": 2.7006, + "step": 213000 }, { - "epoch": 0.99, - "learning_rate": 6.211700038714133e-07, - "loss": 2.191, - "step": 566310 + "epoch": 0.76, + "learning_rate": 1.1966939257757424e-05, + "loss": 2.7086, + "step": 213100 }, { - "epoch": 0.99, - "learning_rate": 6.202980639445865e-07, - "loss": 2.3746, - "step": 566320 + "epoch": 0.76, + "learning_rate": 1.1949091739811745e-05, + "loss": 2.7046, + "step": 213200 }, { - "epoch": 0.99, - "learning_rate": 6.194261240177597e-07, - "loss": 2.3063, - "step": 566330 + "epoch": 0.76, + "learning_rate": 1.1931244221866066e-05, + "loss": 2.7126, + "step": 213300 }, { - "epoch": 0.99, - "learning_rate": 6.185541840909328e-07, - "loss": 2.242, - "step": 566340 + "epoch": 0.76, + "learning_rate": 1.1913396703920386e-05, + "loss": 2.6996, + "step": 213400 }, { - "epoch": 0.99, - "learning_rate": 6.176822441641061e-07, - "loss": 2.3349, - "step": 566350 + "epoch": 0.76, + "learning_rate": 1.1895549185974707e-05, + "loss": 2.7086, + "step": 213500 }, { - "epoch": 0.99, - "learning_rate": 6.168103042372793e-07, - "loss": 2.1948, - "step": 566360 + "epoch": 0.76, + "learning_rate": 1.1877701668029028e-05, + "loss": 2.7119, + "step": 213600 }, { - "epoch": 0.99, - "learning_rate": 6.159383643104524e-07, - "loss": 2.2015, - "step": 566370 + "epoch": 0.76, + "learning_rate": 1.1859854150083348e-05, + "loss": 2.6988, + "step": 213700 }, { - "epoch": 0.99, - "learning_rate": 6.150664243836257e-07, - "loss": 1.924, - "step": 566380 + "epoch": 0.76, + "learning_rate": 1.1842006632137669e-05, + "loss": 2.7048, + "step": 213800 }, { - "epoch": 0.99, - "learning_rate": 6.141944844567988e-07, - "loss": 2.2269, - "step": 566390 + "epoch": 0.76, + "learning_rate": 1.182415911419199e-05, + "loss": 2.7112, + "step": 213900 }, { - "epoch": 0.99, - "learning_rate": 6.133225445299721e-07, - "loss": 2.2264, - "step": 566400 + "epoch": 0.76, + "learning_rate": 1.1806311596246311e-05, + "loss": 2.7044, + "step": 214000 }, { - "epoch": 0.99, - "learning_rate": 6.124506046031453e-07, - "loss": 2.2052, - "step": 566410 + "epoch": 0.76, + "learning_rate": 1.1788464078300633e-05, + "loss": 2.7009, + "step": 214100 }, { - "epoch": 0.99, - "learning_rate": 6.115786646763184e-07, - "loss": 2.2907, - "step": 566420 + "epoch": 0.76, + "learning_rate": 1.1770616560354952e-05, + "loss": 2.7011, + "step": 214200 }, { - "epoch": 0.99, - "learning_rate": 6.107067247494917e-07, - "loss": 2.1831, - "step": 566430 + "epoch": 0.76, + "learning_rate": 1.1752769042409273e-05, + "loss": 2.7038, + "step": 214300 }, { - "epoch": 0.99, - "learning_rate": 6.098347848226648e-07, - "loss": 2.2179, - "step": 566440 + "epoch": 0.77, + "learning_rate": 1.1734921524463593e-05, + "loss": 2.6994, + "step": 214400 }, { - "epoch": 0.99, - "learning_rate": 6.08962844895838e-07, - "loss": 2.2396, - "step": 566450 + "epoch": 0.77, + "learning_rate": 1.1717074006517914e-05, + "loss": 2.7019, + "step": 214500 }, { - "epoch": 0.99, - "learning_rate": 6.080909049690113e-07, - "loss": 2.2669, - "step": 566460 + "epoch": 0.77, + "learning_rate": 1.1699226488572235e-05, + "loss": 2.7028, + "step": 214600 }, { - "epoch": 0.99, - "learning_rate": 6.072189650421844e-07, - "loss": 2.283, - "step": 566470 + "epoch": 0.77, + "learning_rate": 1.1681378970626555e-05, + "loss": 2.7122, + "step": 214700 }, { - "epoch": 0.99, - "learning_rate": 6.063470251153577e-07, - "loss": 2.2969, - "step": 566480 + "epoch": 0.77, + "learning_rate": 1.1663531452680876e-05, + "loss": 2.7032, + "step": 214800 }, { - "epoch": 0.99, - "learning_rate": 6.054750851885308e-07, - "loss": 2.29, - "step": 566490 + "epoch": 0.77, + "learning_rate": 1.1645683934735197e-05, + "loss": 2.6944, + "step": 214900 }, { - "epoch": 0.99, - "learning_rate": 6.04603145261704e-07, - "loss": 2.1918, - "step": 566500 + "epoch": 0.77, + "learning_rate": 1.1627836416789517e-05, + "loss": 2.7105, + "step": 215000 }, { - "epoch": 0.99, - "learning_rate": 6.037312053348773e-07, - "loss": 2.3284, - "step": 566510 + "epoch": 0.77, + "learning_rate": 1.1609988898843838e-05, + "loss": 2.6958, + "step": 215100 }, { - "epoch": 0.99, - "learning_rate": 6.028592654080504e-07, - "loss": 2.1954, - "step": 566520 + "epoch": 0.77, + "learning_rate": 1.1592141380898159e-05, + "loss": 2.701, + "step": 215200 }, { - "epoch": 0.99, - "learning_rate": 6.019873254812237e-07, - "loss": 2.1641, - "step": 566530 + "epoch": 0.77, + "learning_rate": 1.157429386295248e-05, + "loss": 2.7047, + "step": 215300 }, { - "epoch": 0.99, - "learning_rate": 6.011153855543968e-07, - "loss": 2.235, - "step": 566540 + "epoch": 0.77, + "learning_rate": 1.1556446345006802e-05, + "loss": 2.7097, + "step": 215400 }, { - "epoch": 0.99, - "learning_rate": 6.0024344562757e-07, - "loss": 2.3208, - "step": 566550 + "epoch": 0.77, + "learning_rate": 1.1538598827061121e-05, + "loss": 2.6957, + "step": 215500 }, { - "epoch": 0.99, - "learning_rate": 5.993715057007433e-07, - "loss": 2.1548, - "step": 566560 + "epoch": 0.77, + "learning_rate": 1.1520751309115442e-05, + "loss": 2.7055, + "step": 215600 }, { - "epoch": 0.99, - "learning_rate": 5.984995657739164e-07, - "loss": 2.2539, - "step": 566570 + "epoch": 0.77, + "learning_rate": 1.1502903791169762e-05, + "loss": 2.7012, + "step": 215700 }, { - "epoch": 0.99, - "learning_rate": 5.976276258470896e-07, - "loss": 2.2403, - "step": 566580 + "epoch": 0.77, + "learning_rate": 1.1485056273224083e-05, + "loss": 2.7047, + "step": 215800 }, { - "epoch": 0.99, - "learning_rate": 5.967556859202629e-07, - "loss": 2.2822, - "step": 566590 + "epoch": 0.77, + "learning_rate": 1.1467208755278404e-05, + "loss": 2.6991, + "step": 215900 }, { - "epoch": 0.99, - "learning_rate": 5.95883745993436e-07, - "loss": 2.1449, - "step": 566600 + "epoch": 0.77, + "learning_rate": 1.1449361237332724e-05, + "loss": 2.7148, + "step": 216000 }, { - "epoch": 0.99, - "learning_rate": 5.950118060666093e-07, - "loss": 2.2834, - "step": 566610 + "epoch": 0.77, + "learning_rate": 1.1431513719387045e-05, + "loss": 2.6978, + "step": 216100 }, { - "epoch": 0.99, - "learning_rate": 5.941398661397824e-07, - "loss": 2.2029, - "step": 566620 + "epoch": 0.77, + "learning_rate": 1.1413666201441366e-05, + "loss": 2.6998, + "step": 216200 }, { - "epoch": 0.99, - "learning_rate": 5.932679262129556e-07, - "loss": 2.1913, - "step": 566630 + "epoch": 0.77, + "learning_rate": 1.1395818683495686e-05, + "loss": 2.7136, + "step": 216300 }, { - "epoch": 0.99, - "learning_rate": 5.923959862861289e-07, - "loss": 2.3106, - "step": 566640 + "epoch": 0.77, + "learning_rate": 1.1377971165550009e-05, + "loss": 2.6882, + "step": 216400 }, { - "epoch": 0.99, - "learning_rate": 5.91524046359302e-07, - "loss": 2.2313, - "step": 566650 + "epoch": 0.77, + "learning_rate": 1.1360123647604328e-05, + "loss": 2.7058, + "step": 216500 }, { - "epoch": 0.99, - "learning_rate": 5.906521064324753e-07, - "loss": 2.3769, - "step": 566660 + "epoch": 0.77, + "learning_rate": 1.134227612965865e-05, + "loss": 2.7071, + "step": 216600 }, { - "epoch": 0.99, - "learning_rate": 5.897801665056484e-07, - "loss": 2.3259, - "step": 566670 + "epoch": 0.77, + "learning_rate": 1.132442861171297e-05, + "loss": 2.6967, + "step": 216700 }, { - "epoch": 0.99, - "learning_rate": 5.889082265788216e-07, - "loss": 2.2012, - "step": 566680 + "epoch": 0.77, + "learning_rate": 1.130658109376729e-05, + "loss": 2.6981, + "step": 216800 }, { - "epoch": 0.99, - "learning_rate": 5.880362866519949e-07, - "loss": 2.3323, - "step": 566690 + "epoch": 0.77, + "learning_rate": 1.1288733575821611e-05, + "loss": 2.6987, + "step": 216900 }, { - "epoch": 0.99, - "learning_rate": 5.87164346725168e-07, - "loss": 2.1371, - "step": 566700 + "epoch": 0.77, + "learning_rate": 1.1270886057875933e-05, + "loss": 2.7027, + "step": 217000 }, { - "epoch": 0.99, - "learning_rate": 5.862924067983412e-07, - "loss": 2.274, - "step": 566710 + "epoch": 0.77, + "learning_rate": 1.1253038539930252e-05, + "loss": 2.7022, + "step": 217100 }, { - "epoch": 0.99, - "learning_rate": 5.854204668715145e-07, - "loss": 2.2591, - "step": 566720 + "epoch": 0.78, + "learning_rate": 1.1235191021984573e-05, + "loss": 2.7012, + "step": 217200 }, { - "epoch": 0.99, - "learning_rate": 5.845485269446876e-07, - "loss": 2.2483, - "step": 566730 + "epoch": 0.78, + "learning_rate": 1.1217343504038893e-05, + "loss": 2.6959, + "step": 217300 }, { - "epoch": 0.99, - "learning_rate": 5.836765870178609e-07, - "loss": 2.3488, - "step": 566740 + "epoch": 0.78, + "learning_rate": 1.1199495986093214e-05, + "loss": 2.7083, + "step": 217400 }, { - "epoch": 0.99, - "learning_rate": 5.82804647091034e-07, - "loss": 2.3975, - "step": 566750 + "epoch": 0.78, + "learning_rate": 1.1181648468147535e-05, + "loss": 2.705, + "step": 217500 }, { - "epoch": 0.99, - "learning_rate": 5.819327071642072e-07, - "loss": 2.2501, - "step": 566760 + "epoch": 0.78, + "learning_rate": 1.1163800950201855e-05, + "loss": 2.7049, + "step": 217600 }, { - "epoch": 0.99, - "learning_rate": 5.810607672373805e-07, - "loss": 2.2656, - "step": 566770 + "epoch": 0.78, + "learning_rate": 1.1145953432256178e-05, + "loss": 2.7069, + "step": 217700 }, { - "epoch": 0.99, - "learning_rate": 5.801888273105536e-07, - "loss": 2.1918, - "step": 566780 + "epoch": 0.78, + "learning_rate": 1.1128105914310497e-05, + "loss": 2.7007, + "step": 217800 }, { - "epoch": 0.99, - "learning_rate": 5.793168873837268e-07, - "loss": 2.1489, - "step": 566790 + "epoch": 0.78, + "learning_rate": 1.1110258396364818e-05, + "loss": 2.7038, + "step": 217900 }, { - "epoch": 0.99, - "learning_rate": 5.784449474569001e-07, - "loss": 2.3233, - "step": 566800 + "epoch": 0.78, + "learning_rate": 1.109241087841914e-05, + "loss": 2.7036, + "step": 218000 }, { - "epoch": 0.99, - "learning_rate": 5.775730075300732e-07, - "loss": 2.2854, - "step": 566810 + "epoch": 0.78, + "learning_rate": 1.1074563360473459e-05, + "loss": 2.7045, + "step": 218100 }, { - "epoch": 0.99, - "learning_rate": 5.767010676032465e-07, - "loss": 2.4082, - "step": 566820 + "epoch": 0.78, + "learning_rate": 1.105671584252778e-05, + "loss": 2.7068, + "step": 218200 }, { - "epoch": 0.99, - "learning_rate": 5.758291276764196e-07, - "loss": 2.3313, - "step": 566830 + "epoch": 0.78, + "learning_rate": 1.1038868324582102e-05, + "loss": 2.6995, + "step": 218300 }, { - "epoch": 0.99, - "learning_rate": 5.749571877495928e-07, - "loss": 2.2422, - "step": 566840 + "epoch": 0.78, + "learning_rate": 1.1021020806636421e-05, + "loss": 2.7003, + "step": 218400 }, { - "epoch": 0.99, - "learning_rate": 5.740852478227661e-07, - "loss": 2.2496, - "step": 566850 + "epoch": 0.78, + "learning_rate": 1.1003173288690742e-05, + "loss": 2.7071, + "step": 218500 }, { - "epoch": 0.99, - "learning_rate": 5.732133078959392e-07, - "loss": 2.1388, - "step": 566860 + "epoch": 0.78, + "learning_rate": 1.0985325770745063e-05, + "loss": 2.7033, + "step": 218600 }, { - "epoch": 0.99, - "learning_rate": 5.723413679691125e-07, - "loss": 2.2519, - "step": 566870 + "epoch": 0.78, + "learning_rate": 1.0967478252799383e-05, + "loss": 2.7064, + "step": 218700 }, { - "epoch": 0.99, - "learning_rate": 5.714694280422856e-07, - "loss": 2.2346, - "step": 566880 + "epoch": 0.78, + "learning_rate": 1.0949630734853704e-05, + "loss": 2.6959, + "step": 218800 }, { - "epoch": 0.99, - "learning_rate": 5.705974881154588e-07, - "loss": 2.249, - "step": 566890 + "epoch": 0.78, + "learning_rate": 1.0931783216908024e-05, + "loss": 2.6931, + "step": 218900 }, { - "epoch": 0.99, - "learning_rate": 5.697255481886321e-07, - "loss": 2.2889, - "step": 566900 + "epoch": 0.78, + "learning_rate": 1.0913935698962347e-05, + "loss": 2.7059, + "step": 219000 }, { - "epoch": 0.99, - "learning_rate": 5.688536082618052e-07, - "loss": 2.2548, - "step": 566910 + "epoch": 0.78, + "learning_rate": 1.0896088181016668e-05, + "loss": 2.6962, + "step": 219100 }, { - "epoch": 0.99, - "learning_rate": 5.679816683349784e-07, - "loss": 2.1983, - "step": 566920 + "epoch": 0.78, + "learning_rate": 1.0878240663070987e-05, + "loss": 2.7064, + "step": 219200 }, { - "epoch": 0.99, - "learning_rate": 5.671097284081517e-07, - "loss": 2.3803, - "step": 566930 + "epoch": 0.78, + "learning_rate": 1.0860393145125309e-05, + "loss": 2.7002, + "step": 219300 }, { - "epoch": 0.99, - "learning_rate": 5.662377884813248e-07, - "loss": 2.1307, - "step": 566940 + "epoch": 0.78, + "learning_rate": 1.0842545627179628e-05, + "loss": 2.7041, + "step": 219400 }, { - "epoch": 0.99, - "learning_rate": 5.653658485544981e-07, - "loss": 2.2152, - "step": 566950 + "epoch": 0.78, + "learning_rate": 1.082469810923395e-05, + "loss": 2.7046, + "step": 219500 }, { - "epoch": 0.99, - "learning_rate": 5.644939086276712e-07, - "loss": 2.3433, - "step": 566960 + "epoch": 0.78, + "learning_rate": 1.080685059128827e-05, + "loss": 2.6958, + "step": 219600 }, { - "epoch": 0.99, - "learning_rate": 5.636219687008444e-07, - "loss": 2.2037, - "step": 566970 + "epoch": 0.78, + "learning_rate": 1.078900307334259e-05, + "loss": 2.7129, + "step": 219700 }, { - "epoch": 0.99, - "learning_rate": 5.627500287740177e-07, - "loss": 2.2483, - "step": 566980 + "epoch": 0.78, + "learning_rate": 1.0771155555396911e-05, + "loss": 2.7022, + "step": 219800 }, { - "epoch": 0.99, - "learning_rate": 5.618780888471908e-07, - "loss": 2.2732, - "step": 566990 + "epoch": 0.78, + "learning_rate": 1.0753308037451233e-05, + "loss": 2.7013, + "step": 219900 }, { - "epoch": 0.99, - "learning_rate": 5.61006148920364e-07, - "loss": 2.2291, - "step": 567000 + "epoch": 0.79, + "learning_rate": 1.0735460519505552e-05, + "loss": 2.6996, + "step": 220000 }, { - "epoch": 0.99, - "learning_rate": 5.601342089935372e-07, - "loss": 2.2342, - "step": 567010 + "epoch": 0.79, + "learning_rate": 1.0717613001559873e-05, + "loss": 2.7058, + "step": 220100 }, { - "epoch": 0.99, - "learning_rate": 5.592622690667104e-07, - "loss": 2.1306, - "step": 567020 + "epoch": 0.79, + "learning_rate": 1.0699765483614194e-05, + "loss": 2.7006, + "step": 220200 }, { - "epoch": 0.99, - "learning_rate": 5.583903291398837e-07, - "loss": 2.2656, - "step": 567030 + "epoch": 0.79, + "learning_rate": 1.0681917965668516e-05, + "loss": 2.7022, + "step": 220300 }, { - "epoch": 0.99, - "learning_rate": 5.575183892130568e-07, - "loss": 2.245, - "step": 567040 + "epoch": 0.79, + "learning_rate": 1.0664070447722837e-05, + "loss": 2.7062, + "step": 220400 }, { - "epoch": 0.99, - "learning_rate": 5.5664644928623e-07, - "loss": 2.218, - "step": 567050 + "epoch": 0.79, + "learning_rate": 1.0646222929777156e-05, + "loss": 2.6988, + "step": 220500 }, { - "epoch": 0.99, - "learning_rate": 5.557745093594033e-07, - "loss": 2.2285, - "step": 567060 + "epoch": 0.79, + "learning_rate": 1.0628375411831478e-05, + "loss": 2.7036, + "step": 220600 }, { - "epoch": 0.99, - "learning_rate": 5.549025694325764e-07, - "loss": 2.2467, - "step": 567070 + "epoch": 0.79, + "learning_rate": 1.0610527893885797e-05, + "loss": 2.6986, + "step": 220700 }, { - "epoch": 0.99, - "learning_rate": 5.540306295057497e-07, - "loss": 2.251, - "step": 567080 + "epoch": 0.79, + "learning_rate": 1.0592680375940118e-05, + "loss": 2.7137, + "step": 220800 }, { - "epoch": 0.99, - "learning_rate": 5.531586895789228e-07, - "loss": 2.2466, - "step": 567090 + "epoch": 0.79, + "learning_rate": 1.057483285799444e-05, + "loss": 2.7025, + "step": 220900 }, { - "epoch": 0.99, - "learning_rate": 5.52286749652096e-07, - "loss": 2.244, - "step": 567100 + "epoch": 0.79, + "learning_rate": 1.0556985340048759e-05, + "loss": 2.7126, + "step": 221000 }, { - "epoch": 0.99, - "learning_rate": 5.514148097252693e-07, - "loss": 2.2837, - "step": 567110 + "epoch": 0.79, + "learning_rate": 1.053913782210308e-05, + "loss": 2.7058, + "step": 221100 }, { - "epoch": 0.99, - "learning_rate": 5.505428697984424e-07, - "loss": 2.3508, - "step": 567120 + "epoch": 0.79, + "learning_rate": 1.0521290304157402e-05, + "loss": 2.7087, + "step": 221200 }, { - "epoch": 0.99, - "learning_rate": 5.496709298716156e-07, - "loss": 2.2921, - "step": 567130 + "epoch": 0.79, + "learning_rate": 1.0503442786211721e-05, + "loss": 2.6998, + "step": 221300 }, { - "epoch": 0.99, - "learning_rate": 5.487989899447888e-07, - "loss": 2.2045, - "step": 567140 + "epoch": 0.79, + "learning_rate": 1.0485595268266042e-05, + "loss": 2.7031, + "step": 221400 }, { - "epoch": 0.99, - "learning_rate": 5.47927050017962e-07, - "loss": 2.1769, - "step": 567150 + "epoch": 0.79, + "learning_rate": 1.0467747750320363e-05, + "loss": 2.7069, + "step": 221500 }, { - "epoch": 0.99, - "learning_rate": 5.470551100911353e-07, - "loss": 2.2698, - "step": 567160 + "epoch": 0.79, + "learning_rate": 1.0449900232374685e-05, + "loss": 2.708, + "step": 221600 }, { - "epoch": 0.99, - "learning_rate": 5.461831701643084e-07, - "loss": 2.2596, - "step": 567170 + "epoch": 0.79, + "learning_rate": 1.0432052714429006e-05, + "loss": 2.7032, + "step": 221700 }, { - "epoch": 0.99, - "learning_rate": 5.453112302374816e-07, - "loss": 2.3036, - "step": 567180 + "epoch": 0.79, + "learning_rate": 1.0414205196483325e-05, + "loss": 2.7039, + "step": 221800 }, { - "epoch": 0.99, - "learning_rate": 5.444392903106548e-07, - "loss": 2.2852, - "step": 567190 + "epoch": 0.79, + "learning_rate": 1.0396357678537647e-05, + "loss": 2.6945, + "step": 221900 }, { - "epoch": 0.99, - "learning_rate": 5.43567350383828e-07, - "loss": 2.3892, - "step": 567200 + "epoch": 0.79, + "learning_rate": 1.0378510160591968e-05, + "loss": 2.6955, + "step": 222000 }, { - "epoch": 0.99, - "learning_rate": 5.426954104570013e-07, - "loss": 2.2412, - "step": 567210 + "epoch": 0.79, + "learning_rate": 1.0360662642646287e-05, + "loss": 2.6966, + "step": 222100 }, { - "epoch": 0.99, - "learning_rate": 5.418234705301744e-07, - "loss": 2.232, - "step": 567220 + "epoch": 0.79, + "learning_rate": 1.0342815124700609e-05, + "loss": 2.6987, + "step": 222200 }, { - "epoch": 0.99, - "learning_rate": 5.409515306033476e-07, - "loss": 2.2865, - "step": 567230 + "epoch": 0.79, + "learning_rate": 1.0324967606754928e-05, + "loss": 2.6986, + "step": 222300 }, { - "epoch": 0.99, - "learning_rate": 5.400795906765208e-07, - "loss": 2.2369, - "step": 567240 + "epoch": 0.79, + "learning_rate": 1.030712008880925e-05, + "loss": 2.7068, + "step": 222400 }, { - "epoch": 0.99, - "learning_rate": 5.39207650749694e-07, - "loss": 2.1936, - "step": 567250 + "epoch": 0.79, + "learning_rate": 1.028927257086357e-05, + "loss": 2.7002, + "step": 222500 }, { - "epoch": 0.99, - "learning_rate": 5.383357108228672e-07, - "loss": 2.2252, - "step": 567260 + "epoch": 0.79, + "learning_rate": 1.027142505291789e-05, + "loss": 2.6913, + "step": 222600 }, { - "epoch": 0.99, - "learning_rate": 5.374637708960404e-07, - "loss": 2.214, - "step": 567270 + "epoch": 0.79, + "learning_rate": 1.0253577534972211e-05, + "loss": 2.6961, + "step": 222700 }, { - "epoch": 0.99, - "learning_rate": 5.365918309692136e-07, - "loss": 2.2131, - "step": 567280 + "epoch": 0.8, + "learning_rate": 1.0235730017026532e-05, + "loss": 2.6971, + "step": 222800 }, { - "epoch": 0.99, - "learning_rate": 5.357198910423868e-07, - "loss": 2.2423, - "step": 567290 + "epoch": 0.8, + "learning_rate": 1.0217882499080854e-05, + "loss": 2.7025, + "step": 222900 }, { - "epoch": 0.99, - "learning_rate": 5.3484795111556e-07, - "loss": 2.1948, - "step": 567300 + "epoch": 0.8, + "learning_rate": 1.0200034981135175e-05, + "loss": 2.7009, + "step": 223000 }, { - "epoch": 0.99, - "learning_rate": 5.339760111887332e-07, - "loss": 2.2632, - "step": 567310 + "epoch": 0.8, + "learning_rate": 1.0182187463189494e-05, + "loss": 2.698, + "step": 223100 }, { - "epoch": 0.99, - "learning_rate": 5.331040712619064e-07, - "loss": 2.322, - "step": 567320 + "epoch": 0.8, + "learning_rate": 1.0164339945243816e-05, + "loss": 2.6932, + "step": 223200 }, { - "epoch": 0.99, - "learning_rate": 5.322321313350796e-07, - "loss": 2.251, - "step": 567330 + "epoch": 0.8, + "learning_rate": 1.0146492427298137e-05, + "loss": 2.6892, + "step": 223300 }, { - "epoch": 0.99, - "learning_rate": 5.313601914082527e-07, - "loss": 2.3405, - "step": 567340 + "epoch": 0.8, + "learning_rate": 1.0128644909352456e-05, + "loss": 2.7013, + "step": 223400 }, { - "epoch": 0.99, - "learning_rate": 5.30488251481426e-07, - "loss": 2.157, - "step": 567350 + "epoch": 0.8, + "learning_rate": 1.0110797391406778e-05, + "loss": 2.6979, + "step": 223500 }, { - "epoch": 0.99, - "learning_rate": 5.296163115545992e-07, - "loss": 2.1394, - "step": 567360 + "epoch": 0.8, + "learning_rate": 1.0092949873461099e-05, + "loss": 2.6968, + "step": 223600 }, { - "epoch": 0.99, - "learning_rate": 5.287443716277724e-07, - "loss": 2.2781, - "step": 567370 + "epoch": 0.8, + "learning_rate": 1.0075102355515418e-05, + "loss": 2.7025, + "step": 223700 }, { - "epoch": 0.99, - "learning_rate": 5.278724317009456e-07, - "loss": 2.274, - "step": 567380 + "epoch": 0.8, + "learning_rate": 1.005725483756974e-05, + "loss": 2.7071, + "step": 223800 }, { - "epoch": 0.99, - "learning_rate": 5.270004917741187e-07, - "loss": 2.3699, - "step": 567390 + "epoch": 0.8, + "learning_rate": 1.0039407319624059e-05, + "loss": 2.7038, + "step": 223900 }, { - "epoch": 0.99, - "learning_rate": 5.26128551847292e-07, - "loss": 2.2243, - "step": 567400 + "epoch": 0.8, + "learning_rate": 1.002155980167838e-05, + "loss": 2.6933, + "step": 224000 }, { - "epoch": 0.99, - "learning_rate": 5.252566119204652e-07, - "loss": 2.2209, - "step": 567410 + "epoch": 0.8, + "learning_rate": 1.0003712283732703e-05, + "loss": 2.6946, + "step": 224100 }, { - "epoch": 0.99, - "learning_rate": 5.243846719936384e-07, - "loss": 2.2952, - "step": 567420 + "epoch": 0.8, + "learning_rate": 9.985864765787023e-06, + "loss": 2.7156, + "step": 224200 }, { - "epoch": 0.99, - "learning_rate": 5.235127320668116e-07, - "loss": 2.3311, - "step": 567430 + "epoch": 0.8, + "learning_rate": 9.968017247841344e-06, + "loss": 2.7014, + "step": 224300 }, { - "epoch": 0.99, - "learning_rate": 5.226407921399848e-07, - "loss": 2.2642, - "step": 567440 + "epoch": 0.8, + "learning_rate": 9.950169729895663e-06, + "loss": 2.7004, + "step": 224400 }, { - "epoch": 0.99, - "learning_rate": 5.21768852213158e-07, - "loss": 2.2899, - "step": 567450 + "epoch": 0.8, + "learning_rate": 9.932322211949985e-06, + "loss": 2.7012, + "step": 224500 }, { - "epoch": 0.99, - "learning_rate": 5.208969122863312e-07, - "loss": 2.2738, - "step": 567460 + "epoch": 0.8, + "learning_rate": 9.914474694004306e-06, + "loss": 2.7054, + "step": 224600 }, { - "epoch": 0.99, - "learning_rate": 5.200249723595043e-07, - "loss": 2.1831, - "step": 567470 + "epoch": 0.8, + "learning_rate": 9.896627176058625e-06, + "loss": 2.6914, + "step": 224700 }, { - "epoch": 0.99, - "learning_rate": 5.191530324326776e-07, - "loss": 2.2717, - "step": 567480 + "epoch": 0.8, + "learning_rate": 9.878779658112947e-06, + "loss": 2.7055, + "step": 224800 }, { - "epoch": 0.99, - "learning_rate": 5.182810925058508e-07, - "loss": 2.3013, - "step": 567490 + "epoch": 0.8, + "learning_rate": 9.860932140167268e-06, + "loss": 2.6997, + "step": 224900 }, { - "epoch": 0.99, - "learning_rate": 5.17409152579024e-07, - "loss": 2.1975, - "step": 567500 + "epoch": 0.8, + "learning_rate": 9.843084622221587e-06, + "loss": 2.7085, + "step": 225000 }, { - "epoch": 0.99, - "learning_rate": 5.165372126521972e-07, - "loss": 2.2462, - "step": 567510 + "epoch": 0.8, + "learning_rate": 9.825237104275909e-06, + "loss": 2.6912, + "step": 225100 }, { - "epoch": 0.99, - "learning_rate": 5.156652727253703e-07, - "loss": 2.208, - "step": 567520 + "epoch": 0.8, + "learning_rate": 9.80738958633023e-06, + "loss": 2.7002, + "step": 225200 }, { - "epoch": 0.99, - "learning_rate": 5.147933327985436e-07, - "loss": 2.2867, - "step": 567530 + "epoch": 0.8, + "learning_rate": 9.78954206838455e-06, + "loss": 2.6993, + "step": 225300 }, { - "epoch": 0.99, - "learning_rate": 5.139213928717168e-07, - "loss": 2.1761, - "step": 567540 + "epoch": 0.8, + "learning_rate": 9.771694550438872e-06, + "loss": 2.6978, + "step": 225400 }, { - "epoch": 0.99, - "learning_rate": 5.1304945294489e-07, - "loss": 2.2264, - "step": 567550 + "epoch": 0.8, + "learning_rate": 9.753847032493192e-06, + "loss": 2.7073, + "step": 225500 }, { - "epoch": 0.99, - "learning_rate": 5.121775130180632e-07, - "loss": 2.2636, - "step": 567560 + "epoch": 0.81, + "learning_rate": 9.735999514547513e-06, + "loss": 2.6984, + "step": 225600 }, { - "epoch": 0.99, - "learning_rate": 5.113055730912363e-07, - "loss": 2.2454, - "step": 567570 + "epoch": 0.81, + "learning_rate": 9.718151996601834e-06, + "loss": 2.6929, + "step": 225700 }, { - "epoch": 0.99, - "learning_rate": 5.104336331644096e-07, - "loss": 2.2504, - "step": 567580 + "epoch": 0.81, + "learning_rate": 9.700304478656154e-06, + "loss": 2.6988, + "step": 225800 }, { - "epoch": 0.99, - "learning_rate": 5.095616932375828e-07, - "loss": 2.2308, - "step": 567590 + "epoch": 0.81, + "learning_rate": 9.682456960710475e-06, + "loss": 2.6957, + "step": 225900 }, { - "epoch": 0.99, - "learning_rate": 5.086897533107559e-07, - "loss": 2.3036, - "step": 567600 + "epoch": 0.81, + "learning_rate": 9.664609442764794e-06, + "loss": 2.7019, + "step": 226000 }, { - "epoch": 0.99, - "learning_rate": 5.078178133839292e-07, - "loss": 2.3239, - "step": 567610 + "epoch": 0.81, + "learning_rate": 9.646761924819116e-06, + "loss": 2.7073, + "step": 226100 }, { - "epoch": 0.99, - "learning_rate": 5.069458734571023e-07, - "loss": 2.1471, - "step": 567620 + "epoch": 0.81, + "learning_rate": 9.628914406873437e-06, + "loss": 2.7022, + "step": 226200 }, { - "epoch": 0.99, - "learning_rate": 5.060739335302756e-07, - "loss": 2.2312, - "step": 567630 + "epoch": 0.81, + "learning_rate": 9.611066888927756e-06, + "loss": 2.7146, + "step": 226300 }, { - "epoch": 0.99, - "learning_rate": 5.052019936034488e-07, - "loss": 2.2732, - "step": 567640 + "epoch": 0.81, + "learning_rate": 9.593219370982078e-06, + "loss": 2.6932, + "step": 226400 }, { - "epoch": 0.99, - "learning_rate": 5.043300536766219e-07, - "loss": 2.2422, - "step": 567650 + "epoch": 0.81, + "learning_rate": 9.575371853036399e-06, + "loss": 2.6939, + "step": 226500 }, { - "epoch": 0.99, - "learning_rate": 5.034581137497952e-07, - "loss": 2.2932, - "step": 567660 + "epoch": 0.81, + "learning_rate": 9.557524335090718e-06, + "loss": 2.6955, + "step": 226600 }, { - "epoch": 0.99, - "learning_rate": 5.025861738229683e-07, - "loss": 2.3347, - "step": 567670 + "epoch": 0.81, + "learning_rate": 9.539676817145041e-06, + "loss": 2.6939, + "step": 226700 }, { - "epoch": 0.99, - "learning_rate": 5.017142338961415e-07, - "loss": 2.3001, - "step": 567680 + "epoch": 0.81, + "learning_rate": 9.52182929919936e-06, + "loss": 2.6939, + "step": 226800 }, { - "epoch": 0.99, - "learning_rate": 5.008422939693148e-07, - "loss": 2.4094, - "step": 567690 + "epoch": 0.81, + "learning_rate": 9.503981781253682e-06, + "loss": 2.7074, + "step": 226900 }, { - "epoch": 0.99, - "learning_rate": 4.999703540424879e-07, - "loss": 2.2282, - "step": 567700 + "epoch": 0.81, + "learning_rate": 9.486134263308003e-06, + "loss": 2.7026, + "step": 227000 }, { - "epoch": 0.99, - "learning_rate": 4.990984141156612e-07, - "loss": 2.1282, - "step": 567710 + "epoch": 0.81, + "learning_rate": 9.468286745362323e-06, + "loss": 2.7055, + "step": 227100 }, { - "epoch": 0.99, - "learning_rate": 4.982264741888343e-07, - "loss": 2.3119, - "step": 567720 + "epoch": 0.81, + "learning_rate": 9.450439227416644e-06, + "loss": 2.6944, + "step": 227200 }, { - "epoch": 0.99, - "learning_rate": 4.973545342620075e-07, - "loss": 2.2459, - "step": 567730 + "epoch": 0.81, + "learning_rate": 9.432591709470963e-06, + "loss": 2.6982, + "step": 227300 }, { - "epoch": 0.99, - "learning_rate": 4.964825943351808e-07, - "loss": 2.3325, - "step": 567740 + "epoch": 0.81, + "learning_rate": 9.414744191525285e-06, + "loss": 2.6879, + "step": 227400 }, { - "epoch": 0.99, - "learning_rate": 4.956106544083539e-07, - "loss": 2.2282, - "step": 567750 + "epoch": 0.81, + "learning_rate": 9.396896673579606e-06, + "loss": 2.7001, + "step": 227500 }, { - "epoch": 0.99, - "learning_rate": 4.947387144815272e-07, - "loss": 2.1311, - "step": 567760 + "epoch": 0.81, + "learning_rate": 9.379049155633925e-06, + "loss": 2.704, + "step": 227600 }, { - "epoch": 0.99, - "learning_rate": 4.938667745547003e-07, - "loss": 2.2202, - "step": 567770 + "epoch": 0.81, + "learning_rate": 9.361201637688247e-06, + "loss": 2.6901, + "step": 227700 }, { - "epoch": 0.99, - "learning_rate": 4.929948346278735e-07, - "loss": 2.2096, - "step": 567780 + "epoch": 0.81, + "learning_rate": 9.343354119742568e-06, + "loss": 2.7065, + "step": 227800 }, { - "epoch": 0.99, - "learning_rate": 4.921228947010468e-07, - "loss": 2.1934, - "step": 567790 + "epoch": 0.81, + "learning_rate": 9.325506601796889e-06, + "loss": 2.696, + "step": 227900 }, { - "epoch": 0.99, - "learning_rate": 4.912509547742199e-07, - "loss": 2.1147, - "step": 567800 + "epoch": 0.81, + "learning_rate": 9.30765908385121e-06, + "loss": 2.7024, + "step": 228000 }, { - "epoch": 0.99, - "learning_rate": 4.903790148473931e-07, - "loss": 2.375, - "step": 567810 + "epoch": 0.81, + "learning_rate": 9.28981156590553e-06, + "loss": 2.7057, + "step": 228100 }, { - "epoch": 0.99, - "learning_rate": 4.895070749205663e-07, - "loss": 2.344, - "step": 567820 + "epoch": 0.81, + "learning_rate": 9.271964047959851e-06, + "loss": 2.6975, + "step": 228200 }, { - "epoch": 0.99, - "learning_rate": 4.886351349937395e-07, - "loss": 2.3063, - "step": 567830 + "epoch": 0.81, + "learning_rate": 9.254116530014172e-06, + "loss": 2.7037, + "step": 228300 }, { - "epoch": 0.99, - "learning_rate": 4.877631950669128e-07, - "loss": 2.3823, - "step": 567840 + "epoch": 0.82, + "learning_rate": 9.236269012068492e-06, + "loss": 2.6997, + "step": 228400 }, { - "epoch": 0.99, - "learning_rate": 4.868912551400859e-07, - "loss": 2.2679, - "step": 567850 + "epoch": 0.82, + "learning_rate": 9.218421494122813e-06, + "loss": 2.6944, + "step": 228500 }, { - "epoch": 0.99, - "learning_rate": 4.860193152132591e-07, - "loss": 2.2819, - "step": 567860 + "epoch": 0.82, + "learning_rate": 9.200573976177134e-06, + "loss": 2.6946, + "step": 228600 }, { - "epoch": 0.99, - "learning_rate": 4.851473752864323e-07, - "loss": 2.2344, - "step": 567870 + "epoch": 0.82, + "learning_rate": 9.182726458231454e-06, + "loss": 2.7034, + "step": 228700 }, { - "epoch": 0.99, - "learning_rate": 4.842754353596055e-07, - "loss": 2.1929, - "step": 567880 + "epoch": 0.82, + "learning_rate": 9.164878940285775e-06, + "loss": 2.7105, + "step": 228800 }, { - "epoch": 0.99, - "learning_rate": 4.834034954327788e-07, - "loss": 2.3466, - "step": 567890 + "epoch": 0.82, + "learning_rate": 9.147031422340094e-06, + "loss": 2.6954, + "step": 228900 }, { - "epoch": 0.99, - "learning_rate": 4.825315555059519e-07, - "loss": 2.2778, - "step": 567900 + "epoch": 0.82, + "learning_rate": 9.129183904394416e-06, + "loss": 2.6991, + "step": 229000 }, { - "epoch": 0.99, - "learning_rate": 4.816596155791251e-07, - "loss": 2.1532, - "step": 567910 + "epoch": 0.82, + "learning_rate": 9.111336386448737e-06, + "loss": 2.7004, + "step": 229100 }, { - "epoch": 0.99, - "learning_rate": 4.807876756522983e-07, - "loss": 2.3015, - "step": 567920 + "epoch": 0.82, + "learning_rate": 9.093488868503058e-06, + "loss": 2.6985, + "step": 229200 }, { - "epoch": 0.99, - "learning_rate": 4.799157357254715e-07, - "loss": 2.2469, - "step": 567930 + "epoch": 0.82, + "learning_rate": 9.07564135055738e-06, + "loss": 2.7126, + "step": 229300 }, { - "epoch": 0.99, - "learning_rate": 4.790437957986447e-07, - "loss": 2.3165, - "step": 567940 + "epoch": 0.82, + "learning_rate": 9.057793832611699e-06, + "loss": 2.7081, + "step": 229400 }, { - "epoch": 0.99, - "learning_rate": 4.781718558718179e-07, - "loss": 2.1923, - "step": 567950 + "epoch": 0.82, + "learning_rate": 9.03994631466602e-06, + "loss": 2.6968, + "step": 229500 }, { - "epoch": 0.99, - "learning_rate": 4.772999159449911e-07, - "loss": 2.2006, - "step": 567960 + "epoch": 0.82, + "learning_rate": 9.022098796720341e-06, + "loss": 2.6953, + "step": 229600 }, { - "epoch": 0.99, - "learning_rate": 4.7642797601816425e-07, - "loss": 2.1696, - "step": 567970 + "epoch": 0.82, + "learning_rate": 9.00425127877466e-06, + "loss": 2.7023, + "step": 229700 }, { - "epoch": 0.99, - "learning_rate": 4.755560360913375e-07, - "loss": 2.1114, - "step": 567980 + "epoch": 0.82, + "learning_rate": 8.986403760828982e-06, + "loss": 2.6988, + "step": 229800 }, { - "epoch": 0.99, - "learning_rate": 4.7468409616451073e-07, - "loss": 2.2594, - "step": 567990 + "epoch": 0.82, + "learning_rate": 8.968556242883303e-06, + "loss": 2.7011, + "step": 229900 }, { - "epoch": 0.99, - "learning_rate": 4.7381215623768387e-07, - "loss": 2.2817, - "step": 568000 + "epoch": 0.82, + "learning_rate": 8.950708724937623e-06, + "loss": 2.7062, + "step": 230000 }, { - "epoch": 0.99, - "learning_rate": 4.729402163108571e-07, - "loss": 2.1544, - "step": 568010 + "epoch": 0.82, + "learning_rate": 8.932861206991944e-06, + "loss": 2.6967, + "step": 230100 }, { - "epoch": 0.99, - "learning_rate": 4.7206827638403024e-07, - "loss": 2.1606, - "step": 568020 + "epoch": 0.82, + "learning_rate": 8.915013689046265e-06, + "loss": 2.6912, + "step": 230200 }, { - "epoch": 0.99, - "learning_rate": 4.711963364572035e-07, - "loss": 2.2792, - "step": 568030 + "epoch": 0.82, + "learning_rate": 8.897166171100585e-06, + "loss": 2.7043, + "step": 230300 }, { - "epoch": 0.99, - "learning_rate": 4.703243965303767e-07, - "loss": 2.2426, - "step": 568040 + "epoch": 0.82, + "learning_rate": 8.879318653154906e-06, + "loss": 2.6933, + "step": 230400 }, { - "epoch": 0.99, - "learning_rate": 4.6945245660354986e-07, - "loss": 2.2039, - "step": 568050 + "epoch": 0.82, + "learning_rate": 8.861471135209227e-06, + "loss": 2.7098, + "step": 230500 }, { - "epoch": 0.99, - "learning_rate": 4.685805166767231e-07, - "loss": 2.4092, - "step": 568060 + "epoch": 0.82, + "learning_rate": 8.843623617263548e-06, + "loss": 2.6921, + "step": 230600 }, { - "epoch": 0.99, - "learning_rate": 4.6770857674989623e-07, - "loss": 2.3315, - "step": 568070 + "epoch": 0.82, + "learning_rate": 8.82577609931787e-06, + "loss": 2.6961, + "step": 230700 }, { - "epoch": 0.99, - "learning_rate": 4.668366368230695e-07, - "loss": 2.2655, - "step": 568080 + "epoch": 0.82, + "learning_rate": 8.807928581372189e-06, + "loss": 2.6977, + "step": 230800 }, { - "epoch": 0.99, - "learning_rate": 4.659646968962427e-07, - "loss": 2.1789, - "step": 568090 + "epoch": 0.82, + "learning_rate": 8.79008106342651e-06, + "loss": 2.7012, + "step": 230900 }, { - "epoch": 0.99, - "learning_rate": 4.6509275696941585e-07, - "loss": 2.2498, - "step": 568100 + "epoch": 0.82, + "learning_rate": 8.77223354548083e-06, + "loss": 2.7062, + "step": 231000 }, { - "epoch": 0.99, - "learning_rate": 4.642208170425891e-07, - "loss": 2.3675, - "step": 568110 + "epoch": 0.82, + "learning_rate": 8.754386027535151e-06, + "loss": 2.7066, + "step": 231100 }, { - "epoch": 0.99, - "learning_rate": 4.633488771157622e-07, - "loss": 2.25, - "step": 568120 + "epoch": 0.83, + "learning_rate": 8.736538509589472e-06, + "loss": 2.6948, + "step": 231200 }, { - "epoch": 0.99, - "learning_rate": 4.6247693718893547e-07, - "loss": 2.1755, - "step": 568130 + "epoch": 0.83, + "learning_rate": 8.718690991643792e-06, + "loss": 2.7013, + "step": 231300 }, { - "epoch": 0.99, - "learning_rate": 4.616049972621087e-07, - "loss": 2.2111, - "step": 568140 + "epoch": 0.83, + "learning_rate": 8.700843473698113e-06, + "loss": 2.7004, + "step": 231400 }, { - "epoch": 0.99, - "learning_rate": 4.6073305733528184e-07, - "loss": 2.1776, - "step": 568150 + "epoch": 0.83, + "learning_rate": 8.682995955752434e-06, + "loss": 2.6943, + "step": 231500 }, { - "epoch": 0.99, - "learning_rate": 4.598611174084551e-07, - "loss": 2.2407, - "step": 568160 + "epoch": 0.83, + "learning_rate": 8.665148437806754e-06, + "loss": 2.6959, + "step": 231600 }, { - "epoch": 0.99, - "learning_rate": 4.589891774816282e-07, - "loss": 2.113, - "step": 568170 + "epoch": 0.83, + "learning_rate": 8.647300919861075e-06, + "loss": 2.6993, + "step": 231700 }, { - "epoch": 0.99, - "learning_rate": 4.5811723755480146e-07, - "loss": 2.3497, - "step": 568180 + "epoch": 0.83, + "learning_rate": 8.629453401915396e-06, + "loss": 2.6986, + "step": 231800 }, { - "epoch": 0.99, - "learning_rate": 4.572452976279747e-07, - "loss": 2.3144, - "step": 568190 + "epoch": 0.83, + "learning_rate": 8.611605883969717e-06, + "loss": 2.7002, + "step": 231900 }, { - "epoch": 0.99, - "learning_rate": 4.5637335770114783e-07, - "loss": 2.2142, - "step": 568200 + "epoch": 0.83, + "learning_rate": 8.593758366024039e-06, + "loss": 2.6978, + "step": 232000 }, { - "epoch": 0.99, - "learning_rate": 4.5550141777432107e-07, - "loss": 2.1791, - "step": 568210 + "epoch": 0.83, + "learning_rate": 8.575910848078358e-06, + "loss": 2.6906, + "step": 232100 }, { - "epoch": 0.99, - "learning_rate": 4.546294778474942e-07, - "loss": 2.2732, - "step": 568220 + "epoch": 0.83, + "learning_rate": 8.55806333013268e-06, + "loss": 2.6979, + "step": 232200 }, { - "epoch": 0.99, - "learning_rate": 4.5375753792066745e-07, - "loss": 2.3126, - "step": 568230 + "epoch": 0.83, + "learning_rate": 8.540215812186999e-06, + "loss": 2.7052, + "step": 232300 }, { - "epoch": 0.99, - "learning_rate": 4.528855979938407e-07, - "loss": 2.3021, - "step": 568240 + "epoch": 0.83, + "learning_rate": 8.52236829424132e-06, + "loss": 2.6965, + "step": 232400 }, { - "epoch": 0.99, - "learning_rate": 4.520136580670138e-07, - "loss": 2.2609, - "step": 568250 + "epoch": 0.83, + "learning_rate": 8.504520776295641e-06, + "loss": 2.6953, + "step": 232500 }, { - "epoch": 0.99, - "learning_rate": 4.5114171814018706e-07, - "loss": 2.2906, - "step": 568260 + "epoch": 0.83, + "learning_rate": 8.48667325834996e-06, + "loss": 2.6928, + "step": 232600 }, { - "epoch": 0.99, - "learning_rate": 4.502697782133602e-07, - "loss": 2.2645, - "step": 568270 + "epoch": 0.83, + "learning_rate": 8.468825740404282e-06, + "loss": 2.7064, + "step": 232700 }, { - "epoch": 0.99, - "learning_rate": 4.4939783828653344e-07, - "loss": 2.324, - "step": 568280 + "epoch": 0.83, + "learning_rate": 8.450978222458603e-06, + "loss": 2.6998, + "step": 232800 }, { - "epoch": 0.99, - "learning_rate": 4.485258983597067e-07, - "loss": 2.2306, - "step": 568290 + "epoch": 0.83, + "learning_rate": 8.433130704512923e-06, + "loss": 2.6953, + "step": 232900 }, { - "epoch": 0.99, - "learning_rate": 4.476539584328798e-07, - "loss": 2.1467, - "step": 568300 + "epoch": 0.83, + "learning_rate": 8.415283186567246e-06, + "loss": 2.691, + "step": 233000 }, { - "epoch": 0.99, - "learning_rate": 4.4678201850605305e-07, - "loss": 2.297, - "step": 568310 + "epoch": 0.83, + "learning_rate": 8.397435668621565e-06, + "loss": 2.6897, + "step": 233100 }, { - "epoch": 0.99, - "learning_rate": 4.459100785792262e-07, - "loss": 2.3768, - "step": 568320 + "epoch": 0.83, + "learning_rate": 8.379588150675886e-06, + "loss": 2.7072, + "step": 233200 }, { - "epoch": 0.99, - "learning_rate": 4.4503813865239943e-07, - "loss": 2.2327, - "step": 568330 + "epoch": 0.83, + "learning_rate": 8.361740632730208e-06, + "loss": 2.6961, + "step": 233300 }, { - "epoch": 0.99, - "learning_rate": 4.4416619872557267e-07, - "loss": 2.2578, - "step": 568340 + "epoch": 0.83, + "learning_rate": 8.343893114784527e-06, + "loss": 2.7006, + "step": 233400 }, { - "epoch": 0.99, - "learning_rate": 4.432942587987458e-07, - "loss": 2.3469, - "step": 568350 + "epoch": 0.83, + "learning_rate": 8.326045596838848e-06, + "loss": 2.695, + "step": 233500 }, { - "epoch": 0.99, - "learning_rate": 4.4242231887191904e-07, - "loss": 2.1666, - "step": 568360 + "epoch": 0.83, + "learning_rate": 8.30819807889317e-06, + "loss": 2.6959, + "step": 233600 }, { - "epoch": 0.99, - "learning_rate": 4.415503789450922e-07, - "loss": 2.3078, - "step": 568370 + "epoch": 0.83, + "learning_rate": 8.290350560947489e-06, + "loss": 2.685, + "step": 233700 }, { - "epoch": 0.99, - "learning_rate": 4.406784390182654e-07, - "loss": 2.2391, - "step": 568380 + "epoch": 0.83, + "learning_rate": 8.27250304300181e-06, + "loss": 2.701, + "step": 233800 }, { - "epoch": 0.99, - "learning_rate": 4.3980649909143866e-07, - "loss": 2.3258, - "step": 568390 + "epoch": 0.83, + "learning_rate": 8.25465552505613e-06, + "loss": 2.7057, + "step": 233900 }, { - "epoch": 0.99, - "learning_rate": 4.389345591646118e-07, - "loss": 2.3915, - "step": 568400 + "epoch": 0.84, + "learning_rate": 8.236808007110451e-06, + "loss": 2.6963, + "step": 234000 }, { - "epoch": 0.99, - "learning_rate": 4.3806261923778504e-07, - "loss": 2.1886, - "step": 568410 + "epoch": 0.84, + "learning_rate": 8.218960489164772e-06, + "loss": 2.6934, + "step": 234100 }, { - "epoch": 0.99, - "learning_rate": 4.3719067931095817e-07, - "loss": 2.3464, - "step": 568420 + "epoch": 0.84, + "learning_rate": 8.201112971219092e-06, + "loss": 2.7008, + "step": 234200 }, { - "epoch": 0.99, - "learning_rate": 4.363187393841314e-07, - "loss": 2.2475, - "step": 568430 + "epoch": 0.84, + "learning_rate": 8.183265453273415e-06, + "loss": 2.7019, + "step": 234300 }, { - "epoch": 0.99, - "learning_rate": 4.3544679945730465e-07, - "loss": 2.2958, - "step": 568440 + "epoch": 0.84, + "learning_rate": 8.165417935327734e-06, + "loss": 2.6915, + "step": 234400 }, { - "epoch": 0.99, - "learning_rate": 4.345748595304778e-07, - "loss": 2.2589, - "step": 568450 + "epoch": 0.84, + "learning_rate": 8.147570417382055e-06, + "loss": 2.702, + "step": 234500 }, { - "epoch": 0.99, - "learning_rate": 4.33702919603651e-07, - "loss": 2.241, - "step": 568460 + "epoch": 0.84, + "learning_rate": 8.129722899436377e-06, + "loss": 2.6931, + "step": 234600 }, { - "epoch": 0.99, - "learning_rate": 4.3283097967682416e-07, - "loss": 2.2717, - "step": 568470 + "epoch": 0.84, + "learning_rate": 8.111875381490696e-06, + "loss": 2.6943, + "step": 234700 }, { - "epoch": 0.99, - "learning_rate": 4.319590397499974e-07, - "loss": 2.2042, - "step": 568480 + "epoch": 0.84, + "learning_rate": 8.094027863545017e-06, + "loss": 2.6886, + "step": 234800 }, { - "epoch": 0.99, - "learning_rate": 4.3108709982317064e-07, - "loss": 2.2261, - "step": 568490 + "epoch": 0.84, + "learning_rate": 8.076180345599339e-06, + "loss": 2.6973, + "step": 234900 }, { - "epoch": 0.99, - "learning_rate": 4.302151598963438e-07, - "loss": 2.2556, - "step": 568500 + "epoch": 0.84, + "learning_rate": 8.058332827653658e-06, + "loss": 2.6945, + "step": 235000 }, { - "epoch": 0.99, - "learning_rate": 4.29343219969517e-07, - "loss": 2.2345, - "step": 568510 + "epoch": 0.84, + "learning_rate": 8.04048530970798e-06, + "loss": 2.6986, + "step": 235100 }, { - "epoch": 0.99, - "learning_rate": 4.2847128004269015e-07, - "loss": 2.3172, - "step": 568520 + "epoch": 0.84, + "learning_rate": 8.0226377917623e-06, + "loss": 2.6973, + "step": 235200 }, { - "epoch": 0.99, - "learning_rate": 4.275993401158634e-07, - "loss": 2.2696, - "step": 568530 + "epoch": 0.84, + "learning_rate": 8.00479027381662e-06, + "loss": 2.6908, + "step": 235300 }, { - "epoch": 0.99, - "learning_rate": 4.2672740018903663e-07, - "loss": 2.2107, - "step": 568540 + "epoch": 0.84, + "learning_rate": 7.986942755870941e-06, + "loss": 2.6937, + "step": 235400 }, { - "epoch": 0.99, - "learning_rate": 4.2585546026220977e-07, - "loss": 2.2489, - "step": 568550 + "epoch": 0.84, + "learning_rate": 7.96909523792526e-06, + "loss": 2.7081, + "step": 235500 }, { - "epoch": 0.99, - "learning_rate": 4.24983520335383e-07, - "loss": 2.1769, - "step": 568560 + "epoch": 0.84, + "learning_rate": 7.951247719979584e-06, + "loss": 2.6974, + "step": 235600 }, { - "epoch": 0.99, - "learning_rate": 4.2411158040855614e-07, - "loss": 2.2242, - "step": 568570 + "epoch": 0.84, + "learning_rate": 7.933400202033905e-06, + "loss": 2.6976, + "step": 235700 }, { - "epoch": 0.99, - "learning_rate": 4.232396404817294e-07, - "loss": 2.3399, - "step": 568580 + "epoch": 0.84, + "learning_rate": 7.915552684088224e-06, + "loss": 2.6937, + "step": 235800 }, { - "epoch": 0.99, - "learning_rate": 4.223677005549026e-07, - "loss": 2.2864, - "step": 568590 + "epoch": 0.84, + "learning_rate": 7.897705166142546e-06, + "loss": 2.6938, + "step": 235900 }, { - "epoch": 0.99, - "learning_rate": 4.2149576062807576e-07, - "loss": 2.284, - "step": 568600 + "epoch": 0.84, + "learning_rate": 7.879857648196865e-06, + "loss": 2.6963, + "step": 236000 }, { - "epoch": 0.99, - "learning_rate": 4.20623820701249e-07, - "loss": 2.2034, - "step": 568610 + "epoch": 0.84, + "learning_rate": 7.862010130251186e-06, + "loss": 2.6978, + "step": 236100 }, { - "epoch": 0.99, - "learning_rate": 4.1975188077442213e-07, - "loss": 2.2895, - "step": 568620 + "epoch": 0.84, + "learning_rate": 7.844162612305508e-06, + "loss": 2.6944, + "step": 236200 }, { - "epoch": 0.99, - "learning_rate": 4.188799408475954e-07, - "loss": 2.2859, - "step": 568630 + "epoch": 0.84, + "learning_rate": 7.826315094359827e-06, + "loss": 2.6979, + "step": 236300 }, { - "epoch": 0.99, - "learning_rate": 4.180080009207686e-07, - "loss": 2.2077, - "step": 568640 + "epoch": 0.84, + "learning_rate": 7.808467576414148e-06, + "loss": 2.6917, + "step": 236400 }, { - "epoch": 0.99, - "learning_rate": 4.1713606099394175e-07, - "loss": 2.2646, - "step": 568650 + "epoch": 0.84, + "learning_rate": 7.79062005846847e-06, + "loss": 2.6964, + "step": 236500 }, { - "epoch": 0.99, - "learning_rate": 4.16264121067115e-07, - "loss": 2.3594, - "step": 568660 + "epoch": 0.84, + "learning_rate": 7.772772540522789e-06, + "loss": 2.6937, + "step": 236600 }, { - "epoch": 0.99, - "learning_rate": 4.153921811402881e-07, - "loss": 2.2671, - "step": 568670 + "epoch": 0.84, + "learning_rate": 7.75492502257711e-06, + "loss": 2.7025, + "step": 236700 }, { - "epoch": 0.99, - "learning_rate": 4.1452024121346136e-07, - "loss": 2.2002, - "step": 568680 + "epoch": 0.85, + "learning_rate": 7.737077504631431e-06, + "loss": 2.6998, + "step": 236800 }, { - "epoch": 0.99, - "learning_rate": 4.136483012866346e-07, - "loss": 2.3326, - "step": 568690 + "epoch": 0.85, + "learning_rate": 7.719229986685753e-06, + "loss": 2.6884, + "step": 236900 }, { - "epoch": 0.99, - "learning_rate": 4.1277636135980774e-07, - "loss": 2.2986, - "step": 568700 + "epoch": 0.85, + "learning_rate": 7.701382468740074e-06, + "loss": 2.7001, + "step": 237000 }, { - "epoch": 0.99, - "learning_rate": 4.11904421432981e-07, - "loss": 2.2526, - "step": 568710 + "epoch": 0.85, + "learning_rate": 7.683534950794393e-06, + "loss": 2.6938, + "step": 237100 }, { - "epoch": 0.99, - "learning_rate": 4.110324815061541e-07, - "loss": 2.233, - "step": 568720 + "epoch": 0.85, + "learning_rate": 7.665687432848715e-06, + "loss": 2.6937, + "step": 237200 }, { - "epoch": 0.99, - "learning_rate": 4.1016054157932736e-07, - "loss": 2.1782, - "step": 568730 + "epoch": 0.85, + "learning_rate": 7.647839914903036e-06, + "loss": 2.6936, + "step": 237300 }, { - "epoch": 0.99, - "learning_rate": 4.092886016525006e-07, - "loss": 2.3242, - "step": 568740 + "epoch": 0.85, + "learning_rate": 7.629992396957355e-06, + "loss": 2.6893, + "step": 237400 }, { - "epoch": 0.99, - "learning_rate": 4.0841666172567373e-07, - "loss": 2.2947, - "step": 568750 + "epoch": 0.85, + "learning_rate": 7.6121448790116766e-06, + "loss": 2.687, + "step": 237500 }, { - "epoch": 0.99, - "learning_rate": 4.0754472179884697e-07, - "loss": 2.2963, - "step": 568760 + "epoch": 0.85, + "learning_rate": 7.594297361065997e-06, + "loss": 2.6948, + "step": 237600 }, { - "epoch": 0.99, - "learning_rate": 4.066727818720201e-07, - "loss": 2.1796, - "step": 568770 + "epoch": 0.85, + "learning_rate": 7.576449843120317e-06, + "loss": 2.6913, + "step": 237700 }, { - "epoch": 0.99, - "learning_rate": 4.0580084194519335e-07, - "loss": 2.1004, - "step": 568780 + "epoch": 0.85, + "learning_rate": 7.558602325174638e-06, + "loss": 2.6908, + "step": 237800 }, { - "epoch": 0.99, - "learning_rate": 4.049289020183666e-07, - "loss": 2.263, - "step": 568790 + "epoch": 0.85, + "learning_rate": 7.540754807228959e-06, + "loss": 2.6938, + "step": 237900 }, { - "epoch": 0.99, - "learning_rate": 4.040569620915397e-07, - "loss": 2.1829, - "step": 568800 + "epoch": 0.85, + "learning_rate": 7.522907289283279e-06, + "loss": 2.6906, + "step": 238000 }, { - "epoch": 0.99, - "learning_rate": 4.0318502216471296e-07, - "loss": 2.2935, - "step": 568810 + "epoch": 0.85, + "learning_rate": 7.505059771337601e-06, + "loss": 2.6924, + "step": 238100 }, { - "epoch": 0.99, - "learning_rate": 4.023130822378862e-07, - "loss": 2.208, - "step": 568820 + "epoch": 0.85, + "learning_rate": 7.487212253391922e-06, + "loss": 2.7051, + "step": 238200 }, { - "epoch": 0.99, - "learning_rate": 4.0144114231105934e-07, - "loss": 2.2732, - "step": 568830 + "epoch": 0.85, + "learning_rate": 7.469364735446242e-06, + "loss": 2.6969, + "step": 238300 }, { - "epoch": 0.99, - "learning_rate": 4.005692023842326e-07, - "loss": 2.1925, - "step": 568840 + "epoch": 0.85, + "learning_rate": 7.451517217500563e-06, + "loss": 2.6976, + "step": 238400 }, { - "epoch": 0.99, - "learning_rate": 3.996972624574057e-07, - "loss": 2.3269, - "step": 568850 + "epoch": 0.85, + "learning_rate": 7.433669699554884e-06, + "loss": 2.6947, + "step": 238500 }, { - "epoch": 0.99, - "learning_rate": 3.9882532253057895e-07, - "loss": 2.1633, - "step": 568860 + "epoch": 0.85, + "learning_rate": 7.415822181609204e-06, + "loss": 2.6945, + "step": 238600 }, { - "epoch": 0.99, - "learning_rate": 3.979533826037522e-07, - "loss": 2.3015, - "step": 568870 + "epoch": 0.85, + "learning_rate": 7.397974663663524e-06, + "loss": 2.6951, + "step": 238700 }, { - "epoch": 0.99, - "learning_rate": 3.9708144267692533e-07, - "loss": 2.2691, - "step": 568880 + "epoch": 0.85, + "learning_rate": 7.3801271457178456e-06, + "loss": 2.6876, + "step": 238800 }, { - "epoch": 0.99, - "learning_rate": 3.9620950275009857e-07, - "loss": 2.2864, - "step": 568890 + "epoch": 0.85, + "learning_rate": 7.362279627772166e-06, + "loss": 2.6975, + "step": 238900 }, { - "epoch": 0.99, - "learning_rate": 3.953375628232717e-07, - "loss": 2.228, - "step": 568900 + "epoch": 0.85, + "learning_rate": 7.344432109826486e-06, + "loss": 2.6884, + "step": 239000 }, { - "epoch": 0.99, - "learning_rate": 3.9446562289644494e-07, - "loss": 2.2239, - "step": 568910 + "epoch": 0.85, + "learning_rate": 7.326584591880807e-06, + "loss": 2.6911, + "step": 239100 }, { - "epoch": 0.99, - "learning_rate": 3.935936829696182e-07, - "loss": 2.2473, - "step": 568920 + "epoch": 0.85, + "learning_rate": 7.308737073935128e-06, + "loss": 2.696, + "step": 239200 }, { - "epoch": 0.99, - "learning_rate": 3.927217430427913e-07, - "loss": 2.2274, - "step": 568930 + "epoch": 0.85, + "learning_rate": 7.290889555989448e-06, + "loss": 2.6989, + "step": 239300 }, { - "epoch": 0.99, - "learning_rate": 3.9184980311596456e-07, - "loss": 2.331, - "step": 568940 + "epoch": 0.85, + "learning_rate": 7.27304203804377e-06, + "loss": 2.6914, + "step": 239400 }, { - "epoch": 0.99, - "learning_rate": 3.909778631891377e-07, - "loss": 2.2807, - "step": 568950 + "epoch": 0.85, + "learning_rate": 7.255194520098091e-06, + "loss": 2.6928, + "step": 239500 }, { - "epoch": 0.99, - "learning_rate": 3.9010592326231093e-07, - "loss": 2.1732, - "step": 568960 + "epoch": 0.86, + "learning_rate": 7.237347002152411e-06, + "loss": 2.6887, + "step": 239600 }, { - "epoch": 0.99, - "learning_rate": 3.892339833354841e-07, - "loss": 2.2017, - "step": 568970 + "epoch": 0.86, + "learning_rate": 7.219499484206732e-06, + "loss": 2.7037, + "step": 239700 }, { - "epoch": 0.99, - "learning_rate": 3.883620434086573e-07, - "loss": 2.2332, - "step": 568980 + "epoch": 0.86, + "learning_rate": 7.201651966261053e-06, + "loss": 2.6903, + "step": 239800 }, { - "epoch": 0.99, - "learning_rate": 3.874901034818305e-07, - "loss": 2.3286, - "step": 568990 + "epoch": 0.86, + "learning_rate": 7.183804448315373e-06, + "loss": 2.6958, + "step": 239900 }, { - "epoch": 0.99, - "learning_rate": 3.8661816355500374e-07, - "loss": 2.2917, - "step": 569000 + "epoch": 0.86, + "learning_rate": 7.165956930369694e-06, + "loss": 2.6902, + "step": 240000 }, { - "epoch": 0.99, - "learning_rate": 3.857462236281769e-07, - "loss": 2.1798, - "step": 569010 + "epoch": 0.86, + "learning_rate": 7.148109412424015e-06, + "loss": 2.6947, + "step": 240100 }, { - "epoch": 0.99, - "learning_rate": 3.848742837013501e-07, - "loss": 2.2473, - "step": 569020 + "epoch": 0.86, + "learning_rate": 7.130261894478335e-06, + "loss": 2.7103, + "step": 240200 }, { - "epoch": 0.99, - "learning_rate": 3.840023437745233e-07, - "loss": 2.2214, - "step": 569030 + "epoch": 0.86, + "learning_rate": 7.112414376532655e-06, + "loss": 2.7019, + "step": 240300 }, { - "epoch": 0.99, - "learning_rate": 3.831304038476965e-07, - "loss": 2.1391, - "step": 569040 + "epoch": 0.86, + "learning_rate": 7.0945668585869765e-06, + "loss": 2.7102, + "step": 240400 }, { - "epoch": 0.99, - "learning_rate": 3.8225846392086973e-07, - "loss": 2.3303, - "step": 569050 + "epoch": 0.86, + "learning_rate": 7.076719340641297e-06, + "loss": 2.6914, + "step": 240500 }, { - "epoch": 0.99, - "learning_rate": 3.813865239940429e-07, - "loss": 2.1754, - "step": 569060 + "epoch": 0.86, + "learning_rate": 7.058871822695617e-06, + "loss": 2.6956, + "step": 240600 }, { - "epoch": 0.99, - "learning_rate": 3.805145840672161e-07, - "loss": 2.2982, - "step": 569070 + "epoch": 0.86, + "learning_rate": 7.041024304749939e-06, + "loss": 2.6888, + "step": 240700 }, { - "epoch": 0.99, - "learning_rate": 3.796426441403893e-07, - "loss": 2.3022, - "step": 569080 + "epoch": 0.86, + "learning_rate": 7.02317678680426e-06, + "loss": 2.6916, + "step": 240800 }, { - "epoch": 0.99, - "learning_rate": 3.787707042135625e-07, - "loss": 2.2288, - "step": 569090 + "epoch": 0.86, + "learning_rate": 7.005329268858581e-06, + "loss": 2.6881, + "step": 240900 }, { - "epoch": 0.99, - "learning_rate": 3.778987642867357e-07, - "loss": 2.1857, - "step": 569100 + "epoch": 0.86, + "learning_rate": 6.987481750912901e-06, + "loss": 2.6921, + "step": 241000 }, { - "epoch": 0.99, - "learning_rate": 3.770268243599089e-07, - "loss": 2.2683, - "step": 569110 + "epoch": 0.86, + "learning_rate": 6.969634232967222e-06, + "loss": 2.7049, + "step": 241100 }, { - "epoch": 0.99, - "learning_rate": 3.761548844330821e-07, - "loss": 2.2357, - "step": 569120 + "epoch": 0.86, + "learning_rate": 6.951786715021542e-06, + "loss": 2.6928, + "step": 241200 }, { - "epoch": 0.99, - "learning_rate": 3.752829445062553e-07, - "loss": 2.1678, - "step": 569130 + "epoch": 0.86, + "learning_rate": 6.933939197075863e-06, + "loss": 2.6975, + "step": 241300 }, { - "epoch": 0.99, - "learning_rate": 3.7441100457942847e-07, - "loss": 2.2751, - "step": 569140 + "epoch": 0.86, + "learning_rate": 6.916091679130184e-06, + "loss": 2.6956, + "step": 241400 }, { - "epoch": 0.99, - "learning_rate": 3.735390646526017e-07, - "loss": 2.1905, - "step": 569150 + "epoch": 0.86, + "learning_rate": 6.898244161184504e-06, + "loss": 2.6812, + "step": 241500 }, { - "epoch": 0.99, - "learning_rate": 3.726671247257749e-07, - "loss": 2.3222, - "step": 569160 + "epoch": 0.86, + "learning_rate": 6.880396643238825e-06, + "loss": 2.6887, + "step": 241600 }, { - "epoch": 0.99, - "learning_rate": 3.717951847989481e-07, - "loss": 2.1932, - "step": 569170 + "epoch": 0.86, + "learning_rate": 6.8625491252931456e-06, + "loss": 2.6962, + "step": 241700 }, { - "epoch": 0.99, - "learning_rate": 3.7092324487212127e-07, - "loss": 2.3227, - "step": 569180 + "epoch": 0.86, + "learning_rate": 6.844701607347466e-06, + "loss": 2.689, + "step": 241800 }, { - "epoch": 0.99, - "learning_rate": 3.700513049452945e-07, - "loss": 2.253, - "step": 569190 + "epoch": 0.86, + "learning_rate": 6.826854089401786e-06, + "loss": 2.689, + "step": 241900 }, { - "epoch": 0.99, - "learning_rate": 3.691793650184677e-07, - "loss": 2.3658, - "step": 569200 + "epoch": 0.86, + "learning_rate": 6.809006571456108e-06, + "loss": 2.6999, + "step": 242000 }, { - "epoch": 0.99, - "learning_rate": 3.683074250916409e-07, - "loss": 2.1946, - "step": 569210 + "epoch": 0.86, + "learning_rate": 6.791159053510429e-06, + "loss": 2.6883, + "step": 242100 }, { - "epoch": 0.99, - "learning_rate": 3.674354851648141e-07, - "loss": 2.3671, - "step": 569220 + "epoch": 0.86, + "learning_rate": 6.77331153556475e-06, + "loss": 2.6956, + "step": 242200 }, { - "epoch": 0.99, - "learning_rate": 3.6656354523798726e-07, - "loss": 2.183, - "step": 569230 + "epoch": 0.86, + "learning_rate": 6.75546401761907e-06, + "loss": 2.7015, + "step": 242300 }, { - "epoch": 0.99, - "learning_rate": 3.656916053111605e-07, - "loss": 2.2535, - "step": 569240 + "epoch": 0.87, + "learning_rate": 6.737616499673391e-06, + "loss": 2.688, + "step": 242400 }, { - "epoch": 0.99, - "learning_rate": 3.648196653843337e-07, - "loss": 2.2648, - "step": 569250 + "epoch": 0.87, + "learning_rate": 6.719768981727712e-06, + "loss": 2.694, + "step": 242500 }, { - "epoch": 0.99, - "learning_rate": 3.639477254575069e-07, - "loss": 2.2397, - "step": 569260 + "epoch": 0.87, + "learning_rate": 6.701921463782032e-06, + "loss": 2.688, + "step": 242600 }, { - "epoch": 0.99, - "learning_rate": 3.6307578553068007e-07, - "loss": 2.399, - "step": 569270 + "epoch": 0.87, + "learning_rate": 6.684073945836353e-06, + "loss": 2.6889, + "step": 242700 }, { - "epoch": 0.99, - "learning_rate": 3.6220384560385325e-07, - "loss": 2.3223, - "step": 569280 + "epoch": 0.87, + "learning_rate": 6.666226427890673e-06, + "loss": 2.6904, + "step": 242800 }, { - "epoch": 0.99, - "learning_rate": 3.613319056770265e-07, - "loss": 2.2022, - "step": 569290 + "epoch": 0.87, + "learning_rate": 6.648378909944994e-06, + "loss": 2.6881, + "step": 242900 }, { - "epoch": 0.99, - "learning_rate": 3.604599657501997e-07, - "loss": 2.3358, - "step": 569300 + "epoch": 0.87, + "learning_rate": 6.6305313919993146e-06, + "loss": 2.689, + "step": 243000 }, { - "epoch": 0.99, - "learning_rate": 3.5958802582337287e-07, - "loss": 2.3096, - "step": 569310 + "epoch": 0.87, + "learning_rate": 6.612683874053635e-06, + "loss": 2.6946, + "step": 243100 }, { - "epoch": 0.99, - "learning_rate": 3.5871608589654606e-07, - "loss": 2.3705, - "step": 569320 + "epoch": 0.87, + "learning_rate": 6.594836356107955e-06, + "loss": 2.6888, + "step": 243200 }, { - "epoch": 0.99, - "learning_rate": 3.578441459697193e-07, - "loss": 2.2649, - "step": 569330 + "epoch": 0.87, + "learning_rate": 6.576988838162277e-06, + "loss": 2.6866, + "step": 243300 }, { - "epoch": 0.99, - "learning_rate": 3.569722060428925e-07, - "loss": 2.266, - "step": 569340 + "epoch": 0.87, + "learning_rate": 6.559141320216599e-06, + "loss": 2.7064, + "step": 243400 }, { - "epoch": 0.99, - "learning_rate": 3.5610026611606567e-07, - "loss": 2.286, - "step": 569350 + "epoch": 0.87, + "learning_rate": 6.541293802270919e-06, + "loss": 2.6871, + "step": 243500 }, { - "epoch": 0.99, - "learning_rate": 3.5522832618923886e-07, - "loss": 2.2132, - "step": 569360 + "epoch": 0.87, + "learning_rate": 6.523446284325239e-06, + "loss": 2.6867, + "step": 243600 }, { - "epoch": 0.99, - "learning_rate": 3.5435638626241205e-07, - "loss": 2.3126, - "step": 569370 + "epoch": 0.87, + "learning_rate": 6.50559876637956e-06, + "loss": 2.6865, + "step": 243700 }, { - "epoch": 0.99, - "learning_rate": 3.534844463355853e-07, - "loss": 2.3538, - "step": 569380 + "epoch": 0.87, + "learning_rate": 6.487751248433881e-06, + "loss": 2.6934, + "step": 243800 }, { - "epoch": 0.99, - "learning_rate": 3.526125064087585e-07, - "loss": 2.2871, - "step": 569390 + "epoch": 0.87, + "learning_rate": 6.469903730488201e-06, + "loss": 2.6892, + "step": 243900 }, { - "epoch": 0.99, - "learning_rate": 3.5174056648193166e-07, - "loss": 2.2556, - "step": 569400 + "epoch": 0.87, + "learning_rate": 6.452056212542522e-06, + "loss": 2.7051, + "step": 244000 }, { - "epoch": 0.99, - "learning_rate": 3.5086862655510485e-07, - "loss": 2.2022, - "step": 569410 + "epoch": 0.87, + "learning_rate": 6.434208694596843e-06, + "loss": 2.6944, + "step": 244100 }, { - "epoch": 0.99, - "learning_rate": 3.499966866282781e-07, - "loss": 2.3677, - "step": 569420 + "epoch": 0.87, + "learning_rate": 6.416361176651163e-06, + "loss": 2.7003, + "step": 244200 }, { - "epoch": 0.99, - "learning_rate": 3.491247467014513e-07, - "loss": 2.3194, - "step": 569430 + "epoch": 0.87, + "learning_rate": 6.398513658705484e-06, + "loss": 2.6952, + "step": 244300 }, { - "epoch": 0.99, - "learning_rate": 3.4825280677462447e-07, - "loss": 2.1762, - "step": 569440 + "epoch": 0.87, + "learning_rate": 6.380666140759804e-06, + "loss": 2.6977, + "step": 244400 }, { - "epoch": 0.99, - "learning_rate": 3.4738086684779766e-07, - "loss": 2.1846, - "step": 569450 + "epoch": 0.87, + "learning_rate": 6.362818622814126e-06, + "loss": 2.6896, + "step": 244500 }, { - "epoch": 0.99, - "learning_rate": 3.465089269209709e-07, - "loss": 2.1851, - "step": 569460 + "epoch": 0.87, + "learning_rate": 6.344971104868447e-06, + "loss": 2.6967, + "step": 244600 }, { - "epoch": 0.99, - "learning_rate": 3.456369869941441e-07, - "loss": 2.3105, - "step": 569470 + "epoch": 0.87, + "learning_rate": 6.327123586922768e-06, + "loss": 2.6798, + "step": 244700 }, { - "epoch": 0.99, - "learning_rate": 3.4476504706731727e-07, - "loss": 2.2982, - "step": 569480 + "epoch": 0.87, + "learning_rate": 6.309276068977088e-06, + "loss": 2.6945, + "step": 244800 }, { - "epoch": 0.99, - "learning_rate": 3.4389310714049046e-07, - "loss": 2.264, - "step": 569490 + "epoch": 0.87, + "learning_rate": 6.291428551031408e-06, + "loss": 2.6842, + "step": 244900 }, { - "epoch": 0.99, - "learning_rate": 3.430211672136637e-07, - "loss": 2.1563, - "step": 569500 + "epoch": 0.87, + "learning_rate": 6.2735810330857296e-06, + "loss": 2.6888, + "step": 245000 }, { - "epoch": 0.99, - "learning_rate": 3.421492272868369e-07, - "loss": 2.286, - "step": 569510 + "epoch": 0.87, + "learning_rate": 6.25573351514005e-06, + "loss": 2.6997, + "step": 245100 }, { - "epoch": 0.99, - "learning_rate": 3.412772873600101e-07, - "loss": 2.2276, - "step": 569520 + "epoch": 0.88, + "learning_rate": 6.23788599719437e-06, + "loss": 2.6885, + "step": 245200 }, { - "epoch": 0.99, - "learning_rate": 3.4040534743318326e-07, - "loss": 2.1809, - "step": 569530 + "epoch": 0.88, + "learning_rate": 6.220038479248691e-06, + "loss": 2.7027, + "step": 245300 }, { - "epoch": 0.99, - "learning_rate": 3.3953340750635645e-07, - "loss": 2.2671, - "step": 569540 + "epoch": 0.88, + "learning_rate": 6.202190961303012e-06, + "loss": 2.6942, + "step": 245400 }, { - "epoch": 0.99, - "learning_rate": 3.386614675795297e-07, - "loss": 2.2493, - "step": 569550 + "epoch": 0.88, + "learning_rate": 6.184343443357333e-06, + "loss": 2.6893, + "step": 245500 }, { - "epoch": 0.99, - "learning_rate": 3.377895276527029e-07, - "loss": 2.2679, - "step": 569560 + "epoch": 0.88, + "learning_rate": 6.1664959254116535e-06, + "loss": 2.7014, + "step": 245600 }, { - "epoch": 0.99, - "learning_rate": 3.3691758772587606e-07, - "loss": 2.3518, - "step": 569570 + "epoch": 0.88, + "learning_rate": 6.148648407465974e-06, + "loss": 2.6891, + "step": 245700 }, { - "epoch": 0.99, - "learning_rate": 3.3604564779904925e-07, - "loss": 2.1933, - "step": 569580 + "epoch": 0.88, + "learning_rate": 6.130800889520295e-06, + "loss": 2.702, + "step": 245800 }, { - "epoch": 0.99, - "learning_rate": 3.351737078722225e-07, - "loss": 2.4105, - "step": 569590 + "epoch": 0.88, + "learning_rate": 6.112953371574615e-06, + "loss": 2.6909, + "step": 245900 }, { - "epoch": 0.99, - "learning_rate": 3.343017679453957e-07, - "loss": 2.2636, - "step": 569600 + "epoch": 0.88, + "learning_rate": 6.095105853628936e-06, + "loss": 2.6906, + "step": 246000 }, { - "epoch": 0.99, - "learning_rate": 3.3342982801856887e-07, - "loss": 2.3085, - "step": 569610 + "epoch": 0.88, + "learning_rate": 6.077258335683257e-06, + "loss": 2.6964, + "step": 246100 }, { - "epoch": 0.99, - "learning_rate": 3.3255788809174206e-07, - "loss": 2.3475, - "step": 569620 + "epoch": 0.88, + "learning_rate": 6.059410817737577e-06, + "loss": 2.7003, + "step": 246200 }, { - "epoch": 0.99, - "learning_rate": 3.3168594816491524e-07, - "loss": 2.3363, - "step": 569630 + "epoch": 0.88, + "learning_rate": 6.0415632997918986e-06, + "loss": 2.6929, + "step": 246300 }, { - "epoch": 0.99, - "learning_rate": 3.308140082380885e-07, - "loss": 2.3511, - "step": 569640 + "epoch": 0.88, + "learning_rate": 6.023715781846219e-06, + "loss": 2.6888, + "step": 246400 }, { - "epoch": 0.99, - "learning_rate": 3.2994206831126167e-07, - "loss": 2.269, - "step": 569650 + "epoch": 0.88, + "learning_rate": 6.005868263900539e-06, + "loss": 2.701, + "step": 246500 }, { - "epoch": 0.99, - "learning_rate": 3.2907012838443486e-07, - "loss": 2.2817, - "step": 569660 + "epoch": 0.88, + "learning_rate": 5.9880207459548605e-06, + "loss": 2.6993, + "step": 246600 }, { - "epoch": 0.99, - "learning_rate": 3.2819818845760805e-07, - "loss": 2.1899, - "step": 569670 + "epoch": 0.88, + "learning_rate": 5.970173228009181e-06, + "loss": 2.6882, + "step": 246700 }, { - "epoch": 0.99, - "learning_rate": 3.2732624853078123e-07, - "loss": 2.2339, - "step": 569680 + "epoch": 0.88, + "learning_rate": 5.952325710063502e-06, + "loss": 2.6969, + "step": 246800 }, { - "epoch": 0.99, - "learning_rate": 3.264543086039545e-07, - "loss": 2.2488, - "step": 569690 + "epoch": 0.88, + "learning_rate": 5.9344781921178225e-06, + "loss": 2.7008, + "step": 246900 }, { - "epoch": 0.99, - "learning_rate": 3.2558236867712766e-07, - "loss": 2.2322, - "step": 569700 + "epoch": 0.88, + "learning_rate": 5.916630674172143e-06, + "loss": 2.6964, + "step": 247000 }, { - "epoch": 0.99, - "learning_rate": 3.2471042875030085e-07, - "loss": 2.1889, - "step": 569710 + "epoch": 0.88, + "learning_rate": 5.898783156226464e-06, + "loss": 2.6921, + "step": 247100 }, { - "epoch": 0.99, - "learning_rate": 3.2383848882347404e-07, - "loss": 2.2424, - "step": 569720 + "epoch": 0.88, + "learning_rate": 5.8809356382807844e-06, + "loss": 2.6875, + "step": 247200 }, { - "epoch": 0.99, - "learning_rate": 3.229665488966472e-07, - "loss": 2.2317, - "step": 569730 + "epoch": 0.88, + "learning_rate": 5.863088120335105e-06, + "loss": 2.6913, + "step": 247300 }, { - "epoch": 0.99, - "learning_rate": 3.2209460896982047e-07, - "loss": 2.3667, - "step": 569740 + "epoch": 0.88, + "learning_rate": 5.845240602389426e-06, + "loss": 2.7004, + "step": 247400 }, { - "epoch": 0.99, - "learning_rate": 3.2122266904299365e-07, - "loss": 2.2508, - "step": 569750 + "epoch": 0.88, + "learning_rate": 5.827393084443747e-06, + "loss": 2.6947, + "step": 247500 }, { - "epoch": 0.99, - "learning_rate": 3.2035072911616684e-07, - "loss": 2.2583, - "step": 569760 + "epoch": 0.88, + "learning_rate": 5.809545566498068e-06, + "loss": 2.6968, + "step": 247600 }, { - "epoch": 0.99, - "learning_rate": 3.1947878918934003e-07, - "loss": 2.1606, - "step": 569770 + "epoch": 0.88, + "learning_rate": 5.791698048552388e-06, + "loss": 2.6929, + "step": 247700 }, { - "epoch": 0.99, - "learning_rate": 3.186068492625132e-07, - "loss": 2.2784, - "step": 569780 + "epoch": 0.88, + "learning_rate": 5.773850530606708e-06, + "loss": 2.686, + "step": 247800 }, { - "epoch": 0.99, - "learning_rate": 3.1773490933568646e-07, - "loss": 2.2699, - "step": 569790 + "epoch": 0.88, + "learning_rate": 5.7560030126610295e-06, + "loss": 2.6899, + "step": 247900 }, { - "epoch": 0.99, - "learning_rate": 3.1686296940885964e-07, - "loss": 2.2515, - "step": 569800 + "epoch": 0.89, + "learning_rate": 5.738155494715351e-06, + "loss": 2.6949, + "step": 248000 }, { - "epoch": 0.99, - "learning_rate": 3.1599102948203283e-07, - "loss": 2.3212, - "step": 569810 + "epoch": 0.89, + "learning_rate": 5.720307976769671e-06, + "loss": 2.6969, + "step": 248100 }, { - "epoch": 0.99, - "learning_rate": 3.15119089555206e-07, - "loss": 2.2474, - "step": 569820 + "epoch": 0.89, + "learning_rate": 5.7024604588239915e-06, + "loss": 2.691, + "step": 248200 }, { - "epoch": 0.99, - "learning_rate": 3.142471496283792e-07, - "loss": 2.3037, - "step": 569830 + "epoch": 0.89, + "learning_rate": 5.684612940878313e-06, + "loss": 2.6885, + "step": 248300 }, { - "epoch": 0.99, - "learning_rate": 3.1337520970155245e-07, - "loss": 2.159, - "step": 569840 + "epoch": 0.89, + "learning_rate": 5.666765422932633e-06, + "loss": 2.69, + "step": 248400 }, { - "epoch": 0.99, - "learning_rate": 3.1250326977472563e-07, - "loss": 2.2192, - "step": 569850 + "epoch": 0.89, + "learning_rate": 5.6489179049869534e-06, + "loss": 2.6909, + "step": 248500 }, { - "epoch": 0.99, - "learning_rate": 3.116313298478988e-07, - "loss": 2.2066, - "step": 569860 + "epoch": 0.89, + "learning_rate": 5.631070387041274e-06, + "loss": 2.7055, + "step": 248600 }, { - "epoch": 0.99, - "learning_rate": 3.10759389921072e-07, - "loss": 2.2416, - "step": 569870 + "epoch": 0.89, + "learning_rate": 5.613222869095595e-06, + "loss": 2.6838, + "step": 248700 }, { - "epoch": 0.99, - "learning_rate": 3.0988744999424525e-07, - "loss": 2.2599, - "step": 569880 + "epoch": 0.89, + "learning_rate": 5.595375351149916e-06, + "loss": 2.6962, + "step": 248800 }, { - "epoch": 0.99, - "learning_rate": 3.0901551006741844e-07, - "loss": 2.2891, - "step": 569890 + "epoch": 0.89, + "learning_rate": 5.577527833204237e-06, + "loss": 2.6954, + "step": 248900 }, { - "epoch": 0.99, - "learning_rate": 3.081435701405916e-07, - "loss": 2.2971, - "step": 569900 + "epoch": 0.89, + "learning_rate": 5.559680315258557e-06, + "loss": 2.6933, + "step": 249000 }, { - "epoch": 0.99, - "learning_rate": 3.072716302137648e-07, - "loss": 2.2429, - "step": 569910 + "epoch": 0.89, + "learning_rate": 5.541832797312878e-06, + "loss": 2.6939, + "step": 249100 }, { - "epoch": 0.99, - "learning_rate": 3.06399690286938e-07, - "loss": 2.1869, - "step": 569920 + "epoch": 0.89, + "learning_rate": 5.5239852793671986e-06, + "loss": 2.6894, + "step": 249200 }, { - "epoch": 0.99, - "learning_rate": 3.0552775036011124e-07, - "loss": 2.1962, - "step": 569930 + "epoch": 0.89, + "learning_rate": 5.50613776142152e-06, + "loss": 2.6872, + "step": 249300 }, { - "epoch": 0.99, - "learning_rate": 3.0465581043328443e-07, - "loss": 2.242, - "step": 569940 + "epoch": 0.89, + "learning_rate": 5.48829024347584e-06, + "loss": 2.6983, + "step": 249400 }, { - "epoch": 0.99, - "learning_rate": 3.037838705064576e-07, - "loss": 2.3744, - "step": 569950 + "epoch": 0.89, + "learning_rate": 5.4704427255301605e-06, + "loss": 2.6958, + "step": 249500 }, { - "epoch": 0.99, - "learning_rate": 3.029119305796308e-07, - "loss": 2.2076, - "step": 569960 + "epoch": 0.89, + "learning_rate": 5.452595207584482e-06, + "loss": 2.6866, + "step": 249600 }, { - "epoch": 0.99, - "learning_rate": 3.02039990652804e-07, - "loss": 2.399, - "step": 569970 + "epoch": 0.89, + "learning_rate": 5.434747689638802e-06, + "loss": 2.6886, + "step": 249700 }, { - "epoch": 0.99, - "learning_rate": 3.0116805072597723e-07, - "loss": 2.1036, - "step": 569980 + "epoch": 0.89, + "learning_rate": 5.4169001716931225e-06, + "loss": 2.6916, + "step": 249800 }, { - "epoch": 0.99, - "learning_rate": 3.002961107991504e-07, - "loss": 2.3789, - "step": 569990 + "epoch": 0.89, + "learning_rate": 5.399052653747444e-06, + "loss": 2.6907, + "step": 249900 }, { - "epoch": 0.99, - "learning_rate": 2.994241708723236e-07, - "loss": 2.3943, - "step": 570000 + "epoch": 0.89, + "learning_rate": 5.381205135801765e-06, + "loss": 2.6826, + "step": 250000 }, { - "epoch": 0.99, - "learning_rate": 2.985522309454968e-07, - "loss": 2.2626, - "step": 570010 + "epoch": 0.89, + "learning_rate": 5.363357617856085e-06, + "loss": 2.6888, + "step": 250100 }, { - "epoch": 0.99, - "learning_rate": 2.9768029101867e-07, - "loss": 2.2144, - "step": 570020 + "epoch": 0.89, + "learning_rate": 5.345510099910406e-06, + "loss": 2.6791, + "step": 250200 }, { - "epoch": 0.99, - "learning_rate": 2.968083510918432e-07, - "loss": 2.1759, - "step": 570030 + "epoch": 0.89, + "learning_rate": 5.327662581964726e-06, + "loss": 2.6788, + "step": 250300 }, { - "epoch": 0.99, - "learning_rate": 2.959364111650164e-07, - "loss": 2.3283, - "step": 570040 + "epoch": 0.89, + "learning_rate": 5.309815064019047e-06, + "loss": 2.7038, + "step": 250400 }, { - "epoch": 0.99, - "learning_rate": 2.950644712381896e-07, - "loss": 2.2905, - "step": 570050 + "epoch": 0.89, + "learning_rate": 5.2919675460733676e-06, + "loss": 2.6972, + "step": 250500 }, { - "epoch": 0.99, - "learning_rate": 2.941925313113628e-07, - "loss": 2.2766, - "step": 570060 + "epoch": 0.89, + "learning_rate": 5.274120028127689e-06, + "loss": 2.6859, + "step": 250600 }, { - "epoch": 0.99, - "learning_rate": 2.9332059138453597e-07, - "loss": 2.2118, - "step": 570070 + "epoch": 0.89, + "learning_rate": 5.256272510182009e-06, + "loss": 2.6911, + "step": 250700 }, { - "epoch": 0.99, - "learning_rate": 2.924486514577092e-07, - "loss": 2.3283, - "step": 570080 + "epoch": 0.9, + "learning_rate": 5.23842499223633e-06, + "loss": 2.6862, + "step": 250800 }, { - "epoch": 0.99, - "learning_rate": 2.915767115308824e-07, - "loss": 2.3458, - "step": 570090 + "epoch": 0.9, + "learning_rate": 5.220577474290651e-06, + "loss": 2.6866, + "step": 250900 }, { - "epoch": 0.99, - "learning_rate": 2.907047716040556e-07, - "loss": 2.2024, - "step": 570100 + "epoch": 0.9, + "learning_rate": 5.202729956344971e-06, + "loss": 2.676, + "step": 251000 }, { - "epoch": 0.99, - "learning_rate": 2.898328316772288e-07, - "loss": 2.1396, - "step": 570110 + "epoch": 0.9, + "learning_rate": 5.1848824383992915e-06, + "loss": 2.6817, + "step": 251100 }, { - "epoch": 0.99, - "learning_rate": 2.8896089175040196e-07, - "loss": 2.1422, - "step": 570120 + "epoch": 0.9, + "learning_rate": 5.167034920453613e-06, + "loss": 2.6998, + "step": 251200 }, { - "epoch": 0.99, - "learning_rate": 2.880889518235752e-07, - "loss": 2.2124, - "step": 570130 + "epoch": 0.9, + "learning_rate": 5.149187402507934e-06, + "loss": 2.6946, + "step": 251300 }, { - "epoch": 0.99, - "learning_rate": 2.872170118967484e-07, - "loss": 2.2138, - "step": 570140 + "epoch": 0.9, + "learning_rate": 5.131339884562254e-06, + "loss": 2.6848, + "step": 251400 }, { - "epoch": 0.99, - "learning_rate": 2.863450719699216e-07, - "loss": 2.2987, - "step": 570150 + "epoch": 0.9, + "learning_rate": 5.113492366616575e-06, + "loss": 2.7021, + "step": 251500 }, { - "epoch": 0.99, - "learning_rate": 2.8547313204309477e-07, - "loss": 2.3429, - "step": 570160 + "epoch": 0.9, + "learning_rate": 5.095644848670896e-06, + "loss": 2.695, + "step": 251600 }, { - "epoch": 0.99, - "learning_rate": 2.8460119211626795e-07, - "loss": 2.2576, - "step": 570170 + "epoch": 0.9, + "learning_rate": 5.077797330725216e-06, + "loss": 2.6968, + "step": 251700 }, { - "epoch": 0.99, - "learning_rate": 2.837292521894412e-07, - "loss": 2.3013, - "step": 570180 + "epoch": 0.9, + "learning_rate": 5.059949812779537e-06, + "loss": 2.6969, + "step": 251800 }, { - "epoch": 0.99, - "learning_rate": 2.828573122626144e-07, - "loss": 2.2701, - "step": 570190 + "epoch": 0.9, + "learning_rate": 5.042102294833858e-06, + "loss": 2.6867, + "step": 251900 }, { - "epoch": 0.99, - "learning_rate": 2.8198537233578757e-07, - "loss": 2.2244, - "step": 570200 + "epoch": 0.9, + "learning_rate": 5.024254776888178e-06, + "loss": 2.6927, + "step": 252000 }, { - "epoch": 0.99, - "learning_rate": 2.8111343240896076e-07, - "loss": 2.206, - "step": 570210 + "epoch": 0.9, + "learning_rate": 5.006407258942499e-06, + "loss": 2.692, + "step": 252100 }, { - "epoch": 0.99, - "learning_rate": 2.8024149248213395e-07, - "loss": 2.3379, - "step": 570220 + "epoch": 0.9, + "learning_rate": 4.98855974099682e-06, + "loss": 2.6792, + "step": 252200 }, { - "epoch": 0.99, - "learning_rate": 2.793695525553072e-07, - "loss": 2.2151, - "step": 570230 + "epoch": 0.9, + "learning_rate": 4.97071222305114e-06, + "loss": 2.6827, + "step": 252300 }, { - "epoch": 0.99, - "learning_rate": 2.7849761262848037e-07, - "loss": 2.166, - "step": 570240 + "epoch": 0.9, + "learning_rate": 4.952864705105461e-06, + "loss": 2.6947, + "step": 252400 }, { - "epoch": 0.99, - "learning_rate": 2.7762567270165356e-07, - "loss": 2.2287, - "step": 570250 + "epoch": 0.9, + "learning_rate": 4.9350171871597826e-06, + "loss": 2.7035, + "step": 252500 }, { - "epoch": 0.99, - "learning_rate": 2.7675373277482675e-07, - "loss": 2.277, - "step": 570260 + "epoch": 0.9, + "learning_rate": 4.917169669214103e-06, + "loss": 2.6853, + "step": 252600 }, { - "epoch": 0.99, - "learning_rate": 2.7588179284799994e-07, - "loss": 2.1623, - "step": 570270 + "epoch": 0.9, + "learning_rate": 4.899322151268423e-06, + "loss": 2.689, + "step": 252700 }, { - "epoch": 0.99, - "learning_rate": 2.750098529211732e-07, - "loss": 2.3518, - "step": 570280 + "epoch": 0.9, + "learning_rate": 4.881474633322744e-06, + "loss": 2.6917, + "step": 252800 }, { - "epoch": 0.99, - "learning_rate": 2.7413791299434636e-07, - "loss": 2.1459, - "step": 570290 + "epoch": 0.9, + "learning_rate": 4.863627115377065e-06, + "loss": 2.6907, + "step": 252900 }, { - "epoch": 0.99, - "learning_rate": 2.7326597306751955e-07, - "loss": 2.2724, - "step": 570300 + "epoch": 0.9, + "learning_rate": 4.845779597431385e-06, + "loss": 2.6849, + "step": 253000 }, { - "epoch": 0.99, - "learning_rate": 2.7239403314069274e-07, - "loss": 2.1716, - "step": 570310 + "epoch": 0.9, + "learning_rate": 4.8279320794857065e-06, + "loss": 2.6868, + "step": 253100 }, { - "epoch": 0.99, - "learning_rate": 2.7152209321386593e-07, - "loss": 2.2358, - "step": 570320 + "epoch": 0.9, + "learning_rate": 4.810084561540027e-06, + "loss": 2.6929, + "step": 253200 }, { - "epoch": 0.99, - "learning_rate": 2.7065015328703917e-07, - "loss": 2.1858, - "step": 570330 + "epoch": 0.9, + "learning_rate": 4.792237043594348e-06, + "loss": 2.6968, + "step": 253300 }, { - "epoch": 0.99, - "learning_rate": 2.6977821336021236e-07, - "loss": 2.1741, - "step": 570340 + "epoch": 0.9, + "learning_rate": 4.774389525648668e-06, + "loss": 2.683, + "step": 253400 }, { - "epoch": 0.99, - "learning_rate": 2.6890627343338554e-07, - "loss": 2.2891, - "step": 570350 + "epoch": 0.9, + "learning_rate": 4.756542007702989e-06, + "loss": 2.6751, + "step": 253500 }, { - "epoch": 0.99, - "learning_rate": 2.6803433350655873e-07, - "loss": 2.3151, - "step": 570360 + "epoch": 0.91, + "learning_rate": 4.738694489757309e-06, + "loss": 2.6998, + "step": 253600 }, { - "epoch": 0.99, - "learning_rate": 2.671623935797319e-07, - "loss": 2.308, - "step": 570370 + "epoch": 0.91, + "learning_rate": 4.72084697181163e-06, + "loss": 2.7031, + "step": 253700 }, { - "epoch": 0.99, - "learning_rate": 2.6629045365290516e-07, - "loss": 2.2182, - "step": 570380 + "epoch": 0.91, + "learning_rate": 4.7029994538659516e-06, + "loss": 2.6882, + "step": 253800 }, { - "epoch": 0.99, - "learning_rate": 2.6541851372607835e-07, - "loss": 2.1339, - "step": 570390 + "epoch": 0.91, + "learning_rate": 4.685151935920272e-06, + "loss": 2.6885, + "step": 253900 }, { - "epoch": 0.99, - "learning_rate": 2.6454657379925153e-07, - "loss": 2.2786, - "step": 570400 + "epoch": 0.91, + "learning_rate": 4.667304417974592e-06, + "loss": 2.6818, + "step": 254000 }, { - "epoch": 0.99, - "learning_rate": 2.636746338724247e-07, - "loss": 2.2791, - "step": 570410 + "epoch": 0.91, + "learning_rate": 4.6494569000289135e-06, + "loss": 2.6897, + "step": 254100 }, { - "epoch": 0.99, - "learning_rate": 2.628026939455979e-07, - "loss": 2.3565, - "step": 570420 + "epoch": 0.91, + "learning_rate": 4.631609382083234e-06, + "loss": 2.6905, + "step": 254200 }, { - "epoch": 0.99, - "learning_rate": 2.6193075401877115e-07, - "loss": 2.3134, - "step": 570430 + "epoch": 0.91, + "learning_rate": 4.613761864137554e-06, + "loss": 2.6938, + "step": 254300 }, { - "epoch": 0.99, - "learning_rate": 2.6105881409194434e-07, - "loss": 2.2277, - "step": 570440 + "epoch": 0.91, + "learning_rate": 4.5959143461918755e-06, + "loss": 2.6965, + "step": 254400 }, { - "epoch": 0.99, - "learning_rate": 2.601868741651175e-07, - "loss": 2.2907, - "step": 570450 + "epoch": 0.91, + "learning_rate": 4.578066828246196e-06, + "loss": 2.6999, + "step": 254500 }, { - "epoch": 0.99, - "learning_rate": 2.593149342382907e-07, - "loss": 2.2832, - "step": 570460 + "epoch": 0.91, + "learning_rate": 4.560219310300517e-06, + "loss": 2.6905, + "step": 254600 }, { - "epoch": 0.99, - "learning_rate": 2.584429943114639e-07, - "loss": 2.1163, - "step": 570470 + "epoch": 0.91, + "learning_rate": 4.5423717923548374e-06, + "loss": 2.6768, + "step": 254700 }, { - "epoch": 0.99, - "learning_rate": 2.5757105438463714e-07, - "loss": 2.3437, - "step": 570480 + "epoch": 0.91, + "learning_rate": 4.524524274409158e-06, + "loss": 2.6879, + "step": 254800 }, { - "epoch": 0.99, - "learning_rate": 2.5669911445781033e-07, - "loss": 2.3424, - "step": 570490 + "epoch": 0.91, + "learning_rate": 4.506676756463479e-06, + "loss": 2.6928, + "step": 254900 }, { - "epoch": 0.99, - "learning_rate": 2.558271745309835e-07, - "loss": 2.1433, - "step": 570500 + "epoch": 0.91, + "learning_rate": 4.488829238517799e-06, + "loss": 2.6959, + "step": 255000 }, { - "epoch": 0.99, - "learning_rate": 2.549552346041567e-07, - "loss": 2.2962, - "step": 570510 + "epoch": 0.91, + "learning_rate": 4.470981720572121e-06, + "loss": 2.6813, + "step": 255100 }, { - "epoch": 0.99, - "learning_rate": 2.540832946773299e-07, - "loss": 2.3742, - "step": 570520 + "epoch": 0.91, + "learning_rate": 4.453134202626441e-06, + "loss": 2.6957, + "step": 255200 }, { - "epoch": 0.99, - "learning_rate": 2.5321135475050313e-07, - "loss": 2.2036, - "step": 570530 + "epoch": 0.91, + "learning_rate": 4.435286684680761e-06, + "loss": 2.6822, + "step": 255300 }, { - "epoch": 0.99, - "learning_rate": 2.523394148236763e-07, - "loss": 2.1495, - "step": 570540 + "epoch": 0.91, + "learning_rate": 4.4174391667350825e-06, + "loss": 2.695, + "step": 255400 }, { - "epoch": 0.99, - "learning_rate": 2.514674748968495e-07, - "loss": 2.2853, - "step": 570550 + "epoch": 0.91, + "learning_rate": 4.399591648789403e-06, + "loss": 2.6949, + "step": 255500 }, { - "epoch": 0.99, - "learning_rate": 2.505955349700227e-07, - "loss": 2.2481, - "step": 570560 + "epoch": 0.91, + "learning_rate": 4.381744130843723e-06, + "loss": 2.6821, + "step": 255600 }, { - "epoch": 1.0, - "learning_rate": 2.4972359504319593e-07, - "loss": 2.2966, - "step": 570570 + "epoch": 0.91, + "learning_rate": 4.3638966128980445e-06, + "loss": 2.6904, + "step": 255700 }, { - "epoch": 1.0, - "learning_rate": 2.488516551163691e-07, - "loss": 2.2475, - "step": 570580 + "epoch": 0.91, + "learning_rate": 4.346049094952366e-06, + "loss": 2.6912, + "step": 255800 }, { - "epoch": 1.0, - "learning_rate": 2.479797151895423e-07, - "loss": 2.2644, - "step": 570590 + "epoch": 0.91, + "learning_rate": 4.328201577006686e-06, + "loss": 2.6931, + "step": 255900 }, { - "epoch": 1.0, - "learning_rate": 2.471077752627155e-07, - "loss": 2.2854, - "step": 570600 + "epoch": 0.91, + "learning_rate": 4.3103540590610064e-06, + "loss": 2.686, + "step": 256000 }, { - "epoch": 1.0, - "learning_rate": 2.462358353358887e-07, - "loss": 2.3998, - "step": 570610 + "epoch": 0.91, + "learning_rate": 4.292506541115327e-06, + "loss": 2.6957, + "step": 256100 }, { - "epoch": 1.0, - "learning_rate": 2.453638954090619e-07, - "loss": 2.2439, - "step": 570620 + "epoch": 0.91, + "learning_rate": 4.274659023169648e-06, + "loss": 2.6824, + "step": 256200 }, { - "epoch": 1.0, - "learning_rate": 2.444919554822351e-07, - "loss": 2.255, - "step": 570630 + "epoch": 0.91, + "learning_rate": 4.256811505223969e-06, + "loss": 2.6841, + "step": 256300 }, { - "epoch": 1.0, - "learning_rate": 2.436200155554083e-07, - "loss": 2.1877, - "step": 570640 + "epoch": 0.92, + "learning_rate": 4.23896398727829e-06, + "loss": 2.6876, + "step": 256400 }, { - "epoch": 1.0, - "learning_rate": 2.427480756285815e-07, - "loss": 2.3246, - "step": 570650 + "epoch": 0.92, + "learning_rate": 4.22111646933261e-06, + "loss": 2.6932, + "step": 256500 }, { - "epoch": 1.0, - "learning_rate": 2.418761357017547e-07, - "loss": 2.3867, - "step": 570660 + "epoch": 0.92, + "learning_rate": 4.203268951386931e-06, + "loss": 2.6916, + "step": 256600 }, { - "epoch": 1.0, - "learning_rate": 2.410041957749279e-07, - "loss": 2.3208, - "step": 570670 + "epoch": 0.92, + "learning_rate": 4.1854214334412516e-06, + "loss": 2.6874, + "step": 256700 }, { - "epoch": 1.0, - "learning_rate": 2.401322558481011e-07, - "loss": 2.2254, - "step": 570680 + "epoch": 0.92, + "learning_rate": 4.167573915495572e-06, + "loss": 2.6823, + "step": 256800 }, { - "epoch": 1.0, - "learning_rate": 2.392603159212743e-07, - "loss": 2.2459, - "step": 570690 + "epoch": 0.92, + "learning_rate": 4.149726397549892e-06, + "loss": 2.687, + "step": 256900 }, { - "epoch": 1.0, - "learning_rate": 2.383883759944475e-07, - "loss": 2.3352, - "step": 570700 + "epoch": 0.92, + "learning_rate": 4.1318788796042135e-06, + "loss": 2.6951, + "step": 257000 }, { - "epoch": 1.0, - "learning_rate": 2.375164360676207e-07, - "loss": 2.1953, - "step": 570710 + "epoch": 0.92, + "learning_rate": 4.114031361658535e-06, + "loss": 2.6977, + "step": 257100 }, { - "epoch": 1.0, - "learning_rate": 2.366444961407939e-07, - "loss": 2.2773, - "step": 570720 + "epoch": 0.92, + "learning_rate": 4.096183843712855e-06, + "loss": 2.6904, + "step": 257200 }, { - "epoch": 1.0, - "learning_rate": 2.357725562139671e-07, - "loss": 2.2529, - "step": 570730 + "epoch": 0.92, + "learning_rate": 4.0783363257671755e-06, + "loss": 2.6816, + "step": 257300 }, { - "epoch": 1.0, - "learning_rate": 2.3490061628714028e-07, - "loss": 2.2226, - "step": 570740 + "epoch": 0.92, + "learning_rate": 4.060488807821497e-06, + "loss": 2.6873, + "step": 257400 }, { - "epoch": 1.0, - "learning_rate": 2.340286763603135e-07, - "loss": 2.1657, - "step": 570750 + "epoch": 0.92, + "learning_rate": 4.042641289875817e-06, + "loss": 2.6894, + "step": 257500 }, { - "epoch": 1.0, - "learning_rate": 2.3315673643348668e-07, - "loss": 2.2381, - "step": 570760 + "epoch": 0.92, + "learning_rate": 4.024793771930138e-06, + "loss": 2.6893, + "step": 257600 }, { - "epoch": 1.0, - "learning_rate": 2.322847965066599e-07, - "loss": 2.1947, - "step": 570770 + "epoch": 0.92, + "learning_rate": 4.006946253984459e-06, + "loss": 2.6965, + "step": 257700 }, { - "epoch": 1.0, - "learning_rate": 2.3141285657983308e-07, - "loss": 2.2158, - "step": 570780 + "epoch": 0.92, + "learning_rate": 3.989098736038779e-06, + "loss": 2.685, + "step": 257800 }, { - "epoch": 1.0, - "learning_rate": 2.305409166530063e-07, - "loss": 2.1701, - "step": 570790 + "epoch": 0.92, + "learning_rate": 3.9712512180931e-06, + "loss": 2.6865, + "step": 257900 }, { - "epoch": 1.0, - "learning_rate": 2.2966897672617949e-07, - "loss": 2.0989, - "step": 570800 + "epoch": 0.92, + "learning_rate": 3.953403700147421e-06, + "loss": 2.6911, + "step": 258000 }, { - "epoch": 1.0, - "learning_rate": 2.2879703679935267e-07, - "loss": 2.3187, - "step": 570810 + "epoch": 0.92, + "learning_rate": 3.935556182201741e-06, + "loss": 2.6885, + "step": 258100 }, { - "epoch": 1.0, - "learning_rate": 2.279250968725259e-07, - "loss": 2.289, - "step": 570820 + "epoch": 0.92, + "learning_rate": 3.917708664256062e-06, + "loss": 2.6951, + "step": 258200 }, { - "epoch": 1.0, - "learning_rate": 2.270531569456991e-07, - "loss": 2.3191, - "step": 570830 + "epoch": 0.92, + "learning_rate": 3.899861146310383e-06, + "loss": 2.6964, + "step": 258300 }, { - "epoch": 1.0, - "learning_rate": 2.261812170188723e-07, - "loss": 2.1839, - "step": 570840 + "epoch": 0.92, + "learning_rate": 3.882013628364704e-06, + "loss": 2.6863, + "step": 258400 }, { - "epoch": 1.0, - "learning_rate": 2.2530927709204548e-07, - "loss": 2.2369, - "step": 570850 + "epoch": 0.92, + "learning_rate": 3.864166110419024e-06, + "loss": 2.6828, + "step": 258500 }, { - "epoch": 1.0, - "learning_rate": 2.2443733716521866e-07, - "loss": 2.2265, - "step": 570860 + "epoch": 0.92, + "learning_rate": 3.8463185924733445e-06, + "loss": 2.6844, + "step": 258600 }, { - "epoch": 1.0, - "learning_rate": 2.235653972383919e-07, - "loss": 2.2467, - "step": 570870 + "epoch": 0.92, + "learning_rate": 3.828471074527666e-06, + "loss": 2.6863, + "step": 258700 }, { - "epoch": 1.0, - "learning_rate": 2.226934573115651e-07, - "loss": 2.2648, - "step": 570880 + "epoch": 0.92, + "learning_rate": 3.810623556581986e-06, + "loss": 2.6983, + "step": 258800 }, { - "epoch": 1.0, - "learning_rate": 2.2182151738473828e-07, - "loss": 2.3264, - "step": 570890 + "epoch": 0.92, + "learning_rate": 3.7927760386363073e-06, + "loss": 2.6873, + "step": 258900 }, { - "epoch": 1.0, - "learning_rate": 2.2094957745791147e-07, - "loss": 2.3239, - "step": 570900 + "epoch": 0.92, + "learning_rate": 3.774928520690628e-06, + "loss": 2.6917, + "step": 259000 }, { - "epoch": 1.0, - "learning_rate": 2.2007763753108466e-07, - "loss": 2.2935, - "step": 570910 + "epoch": 0.92, + "learning_rate": 3.7570810027449484e-06, + "loss": 2.6926, + "step": 259100 }, { - "epoch": 1.0, - "learning_rate": 2.192056976042579e-07, - "loss": 2.2595, - "step": 570920 + "epoch": 0.93, + "learning_rate": 3.7392334847992692e-06, + "loss": 2.688, + "step": 259200 }, { - "epoch": 1.0, - "learning_rate": 2.1833375767743108e-07, - "loss": 2.2326, - "step": 570930 + "epoch": 0.93, + "learning_rate": 3.7213859668535896e-06, + "loss": 2.6805, + "step": 259300 }, { - "epoch": 1.0, - "learning_rate": 2.1746181775060427e-07, - "loss": 2.3095, - "step": 570940 + "epoch": 0.93, + "learning_rate": 3.7035384489079104e-06, + "loss": 2.6856, + "step": 259400 }, { - "epoch": 1.0, - "learning_rate": 2.1658987782377746e-07, - "loss": 2.236, - "step": 570950 + "epoch": 0.93, + "learning_rate": 3.6856909309622316e-06, + "loss": 2.6907, + "step": 259500 }, { - "epoch": 1.0, - "learning_rate": 2.1571793789695065e-07, - "loss": 2.2673, - "step": 570960 + "epoch": 0.93, + "learning_rate": 3.6678434130165524e-06, + "loss": 2.6858, + "step": 259600 }, { - "epoch": 1.0, - "learning_rate": 2.148459979701239e-07, - "loss": 2.2999, - "step": 570970 + "epoch": 0.93, + "learning_rate": 3.6499958950708728e-06, + "loss": 2.6867, + "step": 259700 }, { - "epoch": 1.0, - "learning_rate": 2.1397405804329707e-07, - "loss": 2.2222, - "step": 570980 + "epoch": 0.93, + "learning_rate": 3.6321483771251936e-06, + "loss": 2.688, + "step": 259800 }, { - "epoch": 1.0, - "learning_rate": 2.1310211811647026e-07, - "loss": 2.1431, - "step": 570990 + "epoch": 0.93, + "learning_rate": 3.614300859179514e-06, + "loss": 2.689, + "step": 259900 }, { - "epoch": 1.0, - "learning_rate": 2.1223017818964345e-07, - "loss": 2.2585, - "step": 571000 + "epoch": 0.93, + "learning_rate": 3.5964533412338347e-06, + "loss": 2.6853, + "step": 260000 }, { - "epoch": 1.0, - "learning_rate": 2.1135823826281664e-07, - "loss": 2.2673, - "step": 571010 + "epoch": 0.93, + "learning_rate": 3.578605823288155e-06, + "loss": 2.6822, + "step": 260100 }, { - "epoch": 1.0, - "learning_rate": 2.1048629833598988e-07, - "loss": 2.2994, - "step": 571020 + "epoch": 0.93, + "learning_rate": 3.5607583053424763e-06, + "loss": 2.6965, + "step": 260200 }, { - "epoch": 1.0, - "learning_rate": 2.0961435840916307e-07, - "loss": 2.2457, - "step": 571030 + "epoch": 0.93, + "learning_rate": 3.542910787396797e-06, + "loss": 2.6966, + "step": 260300 }, { - "epoch": 1.0, - "learning_rate": 2.0874241848233625e-07, - "loss": 2.2806, - "step": 571040 + "epoch": 0.93, + "learning_rate": 3.5250632694511175e-06, + "loss": 2.6908, + "step": 260400 }, { - "epoch": 1.0, - "learning_rate": 2.0787047855550944e-07, - "loss": 2.2804, - "step": 571050 + "epoch": 0.93, + "learning_rate": 3.5072157515054382e-06, + "loss": 2.6828, + "step": 260500 }, { - "epoch": 1.0, - "learning_rate": 2.0699853862868263e-07, - "loss": 2.456, - "step": 571060 + "epoch": 0.93, + "learning_rate": 3.489368233559759e-06, + "loss": 2.6718, + "step": 260600 }, { - "epoch": 1.0, - "learning_rate": 2.0612659870185587e-07, - "loss": 2.2934, - "step": 571070 + "epoch": 0.93, + "learning_rate": 3.4715207156140794e-06, + "loss": 2.686, + "step": 260700 }, { - "epoch": 1.0, - "learning_rate": 2.0525465877502906e-07, - "loss": 2.2359, - "step": 571080 + "epoch": 0.93, + "learning_rate": 3.4536731976684006e-06, + "loss": 2.6885, + "step": 260800 }, { - "epoch": 1.0, - "learning_rate": 2.0438271884820224e-07, - "loss": 2.2754, - "step": 571090 + "epoch": 0.93, + "learning_rate": 3.4358256797227214e-06, + "loss": 2.6732, + "step": 260900 }, { - "epoch": 1.0, - "learning_rate": 2.0351077892137543e-07, - "loss": 2.3558, - "step": 571100 + "epoch": 0.93, + "learning_rate": 3.4179781617770418e-06, + "loss": 2.68, + "step": 261000 }, { - "epoch": 1.0, - "learning_rate": 2.0263883899454862e-07, - "loss": 2.2218, - "step": 571110 + "epoch": 0.93, + "learning_rate": 3.4001306438313626e-06, + "loss": 2.6809, + "step": 261100 }, { - "epoch": 1.0, - "learning_rate": 2.0176689906772186e-07, - "loss": 2.2544, - "step": 571120 + "epoch": 0.93, + "learning_rate": 3.382283125885683e-06, + "loss": 2.6972, + "step": 261200 }, { - "epoch": 1.0, - "learning_rate": 2.0089495914089505e-07, - "loss": 2.2827, - "step": 571130 + "epoch": 0.93, + "learning_rate": 3.3644356079400037e-06, + "loss": 2.6898, + "step": 261300 }, { - "epoch": 1.0, - "learning_rate": 2.0002301921406823e-07, - "loss": 2.1714, - "step": 571140 + "epoch": 0.93, + "learning_rate": 3.346588089994325e-06, + "loss": 2.6904, + "step": 261400 }, { - "epoch": 1.0, - "learning_rate": 1.9915107928724142e-07, - "loss": 2.2969, - "step": 571150 + "epoch": 0.93, + "learning_rate": 3.3287405720486457e-06, + "loss": 2.6834, + "step": 261500 }, { - "epoch": 1.0, - "learning_rate": 1.982791393604146e-07, - "loss": 2.3732, - "step": 571160 + "epoch": 0.93, + "learning_rate": 3.310893054102966e-06, + "loss": 2.6889, + "step": 261600 }, { - "epoch": 1.0, - "learning_rate": 1.9740719943358785e-07, - "loss": 2.3197, - "step": 571170 + "epoch": 0.93, + "learning_rate": 3.293045536157287e-06, + "loss": 2.6897, + "step": 261700 }, { - "epoch": 1.0, - "learning_rate": 1.9653525950676104e-07, - "loss": 2.281, - "step": 571180 + "epoch": 0.93, + "learning_rate": 3.2751980182116073e-06, + "loss": 2.6902, + "step": 261800 }, { - "epoch": 1.0, - "learning_rate": 1.9566331957993423e-07, - "loss": 2.3257, - "step": 571190 + "epoch": 0.93, + "learning_rate": 3.257350500265928e-06, + "loss": 2.7015, + "step": 261900 }, { - "epoch": 1.0, - "learning_rate": 1.9479137965310744e-07, - "loss": 2.2665, - "step": 571200 + "epoch": 0.94, + "learning_rate": 3.2395029823202484e-06, + "loss": 2.6892, + "step": 262000 }, { - "epoch": 1.0, - "learning_rate": 1.9391943972628063e-07, - "loss": 2.3043, - "step": 571210 + "epoch": 0.94, + "learning_rate": 3.22165546437457e-06, + "loss": 2.6933, + "step": 262100 }, { - "epoch": 1.0, - "learning_rate": 1.9304749979945381e-07, - "loss": 2.2255, - "step": 571220 + "epoch": 0.94, + "learning_rate": 3.2038079464288904e-06, + "loss": 2.6754, + "step": 262200 }, { - "epoch": 1.0, - "learning_rate": 1.9217555987262703e-07, - "loss": 2.1702, - "step": 571230 + "epoch": 0.94, + "learning_rate": 3.1859604284832112e-06, + "loss": 2.6942, + "step": 262300 }, { - "epoch": 1.0, - "learning_rate": 1.9130361994580022e-07, - "loss": 2.2863, - "step": 571240 + "epoch": 0.94, + "learning_rate": 3.1681129105375316e-06, + "loss": 2.6842, + "step": 262400 }, { - "epoch": 1.0, - "learning_rate": 1.9043168001897343e-07, - "loss": 2.2577, - "step": 571250 + "epoch": 0.94, + "learning_rate": 3.1502653925918524e-06, + "loss": 2.676, + "step": 262500 }, { - "epoch": 1.0, - "learning_rate": 1.8955974009214662e-07, - "loss": 2.2701, - "step": 571260 + "epoch": 0.94, + "learning_rate": 3.1324178746461727e-06, + "loss": 2.6829, + "step": 262600 }, { - "epoch": 1.0, - "learning_rate": 1.886878001653198e-07, - "loss": 2.1525, - "step": 571270 + "epoch": 0.94, + "learning_rate": 3.114570356700494e-06, + "loss": 2.6774, + "step": 262700 }, { - "epoch": 1.0, - "learning_rate": 1.8781586023849302e-07, - "loss": 2.1675, - "step": 571280 + "epoch": 0.94, + "learning_rate": 3.0967228387548143e-06, + "loss": 2.6876, + "step": 262800 }, { - "epoch": 1.0, - "learning_rate": 1.869439203116662e-07, - "loss": 2.2049, - "step": 571290 + "epoch": 0.94, + "learning_rate": 3.078875320809135e-06, + "loss": 2.6815, + "step": 262900 }, { - "epoch": 1.0, - "learning_rate": 1.8607198038483942e-07, - "loss": 2.264, - "step": 571300 + "epoch": 0.94, + "learning_rate": 3.061027802863456e-06, + "loss": 2.6745, + "step": 263000 }, { - "epoch": 1.0, - "learning_rate": 1.852000404580126e-07, - "loss": 2.3672, - "step": 571310 + "epoch": 0.94, + "learning_rate": 3.0431802849177767e-06, + "loss": 2.6781, + "step": 263100 }, { - "epoch": 1.0, - "learning_rate": 1.843281005311858e-07, - "loss": 2.084, - "step": 571320 + "epoch": 0.94, + "learning_rate": 3.0253327669720975e-06, + "loss": 2.6946, + "step": 263200 }, { - "epoch": 1.0, - "learning_rate": 1.83456160604359e-07, - "loss": 2.3284, - "step": 571330 + "epoch": 0.94, + "learning_rate": 3.007485249026418e-06, + "loss": 2.6873, + "step": 263300 }, { - "epoch": 1.0, - "learning_rate": 1.825842206775322e-07, - "loss": 2.3041, - "step": 571340 + "epoch": 0.94, + "learning_rate": 2.9896377310807387e-06, + "loss": 2.6945, + "step": 263400 }, { - "epoch": 1.0, - "learning_rate": 1.817122807507054e-07, - "loss": 2.2113, - "step": 571350 + "epoch": 0.94, + "learning_rate": 2.9717902131350594e-06, + "loss": 2.6972, + "step": 263500 }, { - "epoch": 1.0, - "learning_rate": 1.808403408238786e-07, - "loss": 2.3083, - "step": 571360 + "epoch": 0.94, + "learning_rate": 2.9539426951893802e-06, + "loss": 2.6925, + "step": 263600 }, { - "epoch": 1.0, - "learning_rate": 1.799684008970518e-07, - "loss": 2.2247, - "step": 571370 + "epoch": 0.94, + "learning_rate": 2.9360951772437006e-06, + "loss": 2.6725, + "step": 263700 }, { - "epoch": 1.0, - "learning_rate": 1.79096460970225e-07, - "loss": 2.2277, - "step": 571380 + "epoch": 0.94, + "learning_rate": 2.918247659298022e-06, + "loss": 2.6786, + "step": 263800 }, { - "epoch": 1.0, - "learning_rate": 1.782245210433982e-07, - "loss": 2.1567, - "step": 571390 + "epoch": 0.94, + "learning_rate": 2.900400141352342e-06, + "loss": 2.6985, + "step": 263900 }, { - "epoch": 1.0, - "learning_rate": 1.773525811165714e-07, - "loss": 2.3178, - "step": 571400 + "epoch": 0.94, + "learning_rate": 2.882552623406663e-06, + "loss": 2.6911, + "step": 264000 }, { - "epoch": 1.0, - "learning_rate": 1.764806411897446e-07, - "loss": 2.226, - "step": 571410 + "epoch": 0.94, + "learning_rate": 2.8647051054609833e-06, + "loss": 2.6892, + "step": 264100 }, { - "epoch": 1.0, - "learning_rate": 1.7560870126291778e-07, - "loss": 2.2858, - "step": 571420 + "epoch": 0.94, + "learning_rate": 2.8468575875153046e-06, + "loss": 2.6764, + "step": 264200 }, { - "epoch": 1.0, - "learning_rate": 1.74736761336091e-07, - "loss": 2.203, - "step": 571430 + "epoch": 0.94, + "learning_rate": 2.829010069569625e-06, + "loss": 2.6838, + "step": 264300 }, { - "epoch": 1.0, - "learning_rate": 1.7386482140926418e-07, - "loss": 2.2729, - "step": 571440 + "epoch": 0.94, + "learning_rate": 2.8111625516239457e-06, + "loss": 2.6867, + "step": 264400 }, { - "epoch": 1.0, - "learning_rate": 1.729928814824374e-07, - "loss": 2.1332, - "step": 571450 + "epoch": 0.94, + "learning_rate": 2.7933150336782665e-06, + "loss": 2.6797, + "step": 264500 }, { - "epoch": 1.0, - "learning_rate": 1.7212094155561058e-07, - "loss": 2.2319, - "step": 571460 + "epoch": 0.94, + "learning_rate": 2.7754675157325873e-06, + "loss": 2.6744, + "step": 264600 }, { - "epoch": 1.0, - "learning_rate": 1.712490016287838e-07, - "loss": 2.2906, - "step": 571470 + "epoch": 0.94, + "learning_rate": 2.7576199977869077e-06, + "loss": 2.6841, + "step": 264700 }, { - "epoch": 1.0, - "learning_rate": 1.7037706170195698e-07, - "loss": 2.1907, - "step": 571480 + "epoch": 0.95, + "learning_rate": 2.739772479841229e-06, + "loss": 2.6936, + "step": 264800 }, { - "epoch": 1.0, - "learning_rate": 1.6950512177513017e-07, - "loss": 2.2036, - "step": 571490 + "epoch": 0.95, + "learning_rate": 2.7219249618955493e-06, + "loss": 2.6896, + "step": 264900 }, { - "epoch": 1.0, - "learning_rate": 1.6863318184830338e-07, - "loss": 2.2807, - "step": 571500 + "epoch": 0.95, + "learning_rate": 2.70407744394987e-06, + "loss": 2.6804, + "step": 265000 }, { - "epoch": 1.0, - "learning_rate": 1.6776124192147657e-07, - "loss": 2.3081, - "step": 571510 + "epoch": 0.95, + "learning_rate": 2.686229926004191e-06, + "loss": 2.6878, + "step": 265100 }, { - "epoch": 1.0, - "learning_rate": 1.6688930199464979e-07, - "loss": 2.2331, - "step": 571520 + "epoch": 0.95, + "learning_rate": 2.6683824080585116e-06, + "loss": 2.6837, + "step": 265200 }, { - "epoch": 1.0, - "learning_rate": 1.6601736206782297e-07, - "loss": 2.1752, - "step": 571530 + "epoch": 0.95, + "learning_rate": 2.650534890112832e-06, + "loss": 2.6931, + "step": 265300 }, { - "epoch": 1.0, - "learning_rate": 1.6514542214099616e-07, - "loss": 2.3517, - "step": 571540 + "epoch": 0.95, + "learning_rate": 2.6326873721671528e-06, + "loss": 2.6771, + "step": 265400 }, { - "epoch": 1.0, - "learning_rate": 1.6427348221416938e-07, - "loss": 2.2649, - "step": 571550 + "epoch": 0.95, + "learning_rate": 2.6148398542214736e-06, + "loss": 2.6959, + "step": 265500 }, { - "epoch": 1.0, - "learning_rate": 1.6340154228734256e-07, - "loss": 2.2415, - "step": 571560 + "epoch": 0.95, + "learning_rate": 2.5969923362757944e-06, + "loss": 2.6821, + "step": 265600 }, { - "epoch": 1.0, - "learning_rate": 1.6252960236051578e-07, - "loss": 2.2963, - "step": 571570 + "epoch": 0.95, + "learning_rate": 2.5791448183301147e-06, + "loss": 2.6785, + "step": 265700 }, { - "epoch": 1.0, - "learning_rate": 1.6165766243368896e-07, - "loss": 2.2559, - "step": 571580 + "epoch": 0.95, + "learning_rate": 2.5612973003844355e-06, + "loss": 2.6831, + "step": 265800 }, { - "epoch": 1.0, - "learning_rate": 1.6078572250686218e-07, - "loss": 2.2868, - "step": 571590 + "epoch": 0.95, + "learning_rate": 2.5434497824387563e-06, + "loss": 2.6949, + "step": 265900 }, { - "epoch": 1.0, - "learning_rate": 1.5991378258003537e-07, - "loss": 2.1464, - "step": 571600 + "epoch": 0.95, + "learning_rate": 2.525602264493077e-06, + "loss": 2.7065, + "step": 266000 }, { - "epoch": 1.0, - "learning_rate": 1.5904184265320858e-07, - "loss": 2.3577, - "step": 571610 + "epoch": 0.95, + "learning_rate": 2.507754746547398e-06, + "loss": 2.6873, + "step": 266100 }, { - "epoch": 1.0, - "learning_rate": 1.5816990272638177e-07, - "loss": 2.0768, - "step": 571620 + "epoch": 0.95, + "learning_rate": 2.4899072286017183e-06, + "loss": 2.688, + "step": 266200 }, { - "epoch": 1.0, - "learning_rate": 1.5729796279955498e-07, - "loss": 2.2744, - "step": 571630 + "epoch": 0.95, + "learning_rate": 2.472059710656039e-06, + "loss": 2.697, + "step": 266300 }, { - "epoch": 1.0, - "learning_rate": 1.5642602287272817e-07, - "loss": 2.1728, - "step": 571640 + "epoch": 0.95, + "learning_rate": 2.45421219271036e-06, + "loss": 2.6867, + "step": 266400 }, { - "epoch": 1.0, - "learning_rate": 1.5555408294590138e-07, - "loss": 2.3516, - "step": 571650 + "epoch": 0.95, + "learning_rate": 2.4363646747646806e-06, + "loss": 2.6913, + "step": 266500 }, { - "epoch": 1.0, - "learning_rate": 1.5468214301907457e-07, - "loss": 2.2486, - "step": 571660 + "epoch": 0.95, + "learning_rate": 2.418517156819001e-06, + "loss": 2.6789, + "step": 266600 }, { - "epoch": 1.0, - "learning_rate": 1.5381020309224778e-07, - "loss": 2.394, - "step": 571670 + "epoch": 0.95, + "learning_rate": 2.4006696388733222e-06, + "loss": 2.6866, + "step": 266700 }, { - "epoch": 1.0, - "learning_rate": 1.5293826316542097e-07, - "loss": 2.1967, - "step": 571680 + "epoch": 0.95, + "learning_rate": 2.3828221209276426e-06, + "loss": 2.6865, + "step": 266800 }, { - "epoch": 1.0, - "learning_rate": 1.5206632323859416e-07, - "loss": 2.2046, - "step": 571690 + "epoch": 0.95, + "learning_rate": 2.3649746029819634e-06, + "loss": 2.6802, + "step": 266900 }, { - "epoch": 1.0, - "learning_rate": 1.5119438331176737e-07, - "loss": 2.2563, - "step": 571700 + "epoch": 0.95, + "learning_rate": 2.347127085036284e-06, + "loss": 2.6881, + "step": 267000 }, { - "epoch": 1.0, - "learning_rate": 1.5032244338494056e-07, - "loss": 2.293, - "step": 571710 + "epoch": 0.95, + "learning_rate": 2.329279567090605e-06, + "loss": 2.6901, + "step": 267100 }, { - "epoch": 1.0, - "learning_rate": 1.4945050345811378e-07, - "loss": 2.3405, - "step": 571720 + "epoch": 0.95, + "learning_rate": 2.3114320491449253e-06, + "loss": 2.6825, + "step": 267200 }, { - "epoch": 1.0, - "learning_rate": 1.4857856353128696e-07, - "loss": 2.2204, - "step": 571730 + "epoch": 0.95, + "learning_rate": 2.293584531199246e-06, + "loss": 2.6923, + "step": 267300 }, { - "epoch": 1.0, - "learning_rate": 1.4770662360446015e-07, - "loss": 2.2555, - "step": 571740 + "epoch": 0.95, + "learning_rate": 2.275737013253567e-06, + "loss": 2.6966, + "step": 267400 }, { - "epoch": 1.0, - "learning_rate": 1.4683468367763336e-07, - "loss": 2.3056, - "step": 571750 + "epoch": 0.95, + "learning_rate": 2.2578894953078877e-06, + "loss": 2.6804, + "step": 267500 }, { - "epoch": 1.0, - "learning_rate": 1.4596274375080655e-07, - "loss": 2.2958, - "step": 571760 + "epoch": 0.96, + "learning_rate": 2.240041977362208e-06, + "loss": 2.69, + "step": 267600 }, { - "epoch": 1.0, - "learning_rate": 1.4509080382397977e-07, - "loss": 2.2775, - "step": 571770 + "epoch": 0.96, + "learning_rate": 2.2221944594165293e-06, + "loss": 2.6876, + "step": 267700 }, { - "epoch": 1.0, - "learning_rate": 1.4421886389715295e-07, - "loss": 2.2433, - "step": 571780 + "epoch": 0.96, + "learning_rate": 2.2043469414708497e-06, + "loss": 2.6957, + "step": 267800 }, { - "epoch": 1.0, - "learning_rate": 1.4334692397032617e-07, - "loss": 2.2202, - "step": 571790 + "epoch": 0.96, + "learning_rate": 2.1864994235251705e-06, + "loss": 2.6904, + "step": 267900 }, { - "epoch": 1.0, - "learning_rate": 1.4247498404349936e-07, - "loss": 2.2256, - "step": 571800 + "epoch": 0.96, + "learning_rate": 2.1686519055794912e-06, + "loss": 2.6903, + "step": 268000 }, { - "epoch": 1.0, - "learning_rate": 1.4160304411667254e-07, - "loss": 2.3036, - "step": 571810 + "epoch": 0.96, + "learning_rate": 2.150804387633812e-06, + "loss": 2.6769, + "step": 268100 }, { - "epoch": 1.0, - "learning_rate": 1.4073110418984576e-07, - "loss": 2.2836, - "step": 571820 + "epoch": 0.96, + "learning_rate": 2.1329568696881324e-06, + "loss": 2.6971, + "step": 268200 }, { - "epoch": 1.0, - "learning_rate": 1.3985916426301894e-07, - "loss": 2.3317, - "step": 571830 + "epoch": 0.96, + "learning_rate": 2.115109351742453e-06, + "loss": 2.6879, + "step": 268300 }, { - "epoch": 1.0, - "learning_rate": 1.3898722433619216e-07, - "loss": 2.2606, - "step": 571840 + "epoch": 0.96, + "learning_rate": 2.097261833796774e-06, + "loss": 2.68, + "step": 268400 }, { - "epoch": 1.0, - "learning_rate": 1.3811528440936535e-07, - "loss": 2.2207, - "step": 571850 + "epoch": 0.96, + "learning_rate": 2.0794143158510948e-06, + "loss": 2.6877, + "step": 268500 }, { - "epoch": 1.0, - "learning_rate": 1.3724334448253853e-07, - "loss": 2.0733, - "step": 571860 + "epoch": 0.96, + "learning_rate": 2.0615667979054156e-06, + "loss": 2.686, + "step": 268600 }, { - "epoch": 1.0, - "learning_rate": 1.3637140455571175e-07, - "loss": 2.342, - "step": 571870 + "epoch": 0.96, + "learning_rate": 2.043719279959736e-06, + "loss": 2.6775, + "step": 268700 }, { - "epoch": 1.0, - "learning_rate": 1.3549946462888494e-07, - "loss": 2.2708, - "step": 571880 + "epoch": 0.96, + "learning_rate": 2.0258717620140567e-06, + "loss": 2.6828, + "step": 268800 }, { - "epoch": 1.0, - "learning_rate": 1.3462752470205815e-07, - "loss": 2.3228, - "step": 571890 + "epoch": 0.96, + "learning_rate": 2.0080242440683775e-06, + "loss": 2.6877, + "step": 268900 }, { - "epoch": 1.0, - "learning_rate": 1.3375558477523134e-07, - "loss": 2.2903, - "step": 571900 + "epoch": 0.96, + "learning_rate": 1.9901767261226983e-06, + "loss": 2.6853, + "step": 269000 }, { - "epoch": 1.0, - "learning_rate": 1.3288364484840452e-07, - "loss": 2.2413, - "step": 571910 + "epoch": 0.96, + "learning_rate": 1.9723292081770187e-06, + "loss": 2.6961, + "step": 269100 }, { - "epoch": 1.0, - "learning_rate": 1.3201170492157774e-07, - "loss": 2.2956, - "step": 571920 + "epoch": 0.96, + "learning_rate": 1.9544816902313395e-06, + "loss": 2.6897, + "step": 269200 }, { - "epoch": 1.0, - "learning_rate": 1.3113976499475093e-07, - "loss": 2.2222, - "step": 571930 + "epoch": 0.96, + "learning_rate": 1.9366341722856603e-06, + "loss": 2.7004, + "step": 269300 }, { - "epoch": 1.0, - "learning_rate": 1.3026782506792414e-07, - "loss": 2.3066, - "step": 571940 + "epoch": 0.96, + "learning_rate": 1.918786654339981e-06, + "loss": 2.6924, + "step": 269400 }, { - "epoch": 1.0, - "learning_rate": 1.2939588514109733e-07, - "loss": 2.1829, - "step": 571950 + "epoch": 0.96, + "learning_rate": 1.9009391363943016e-06, + "loss": 2.6848, + "step": 269500 }, { - "epoch": 1.0, - "learning_rate": 1.2852394521427052e-07, - "loss": 2.1684, - "step": 571960 + "epoch": 0.96, + "learning_rate": 1.8830916184486226e-06, + "loss": 2.6926, + "step": 269600 }, { - "epoch": 1.0, - "learning_rate": 1.2765200528744373e-07, - "loss": 2.2244, - "step": 571970 + "epoch": 0.96, + "learning_rate": 1.8652441005029432e-06, + "loss": 2.6867, + "step": 269700 }, { - "epoch": 1.0, - "learning_rate": 1.2678006536061692e-07, - "loss": 2.3193, - "step": 571980 + "epoch": 0.96, + "learning_rate": 1.8473965825572638e-06, + "loss": 2.6938, + "step": 269800 }, { - "epoch": 1.0, - "learning_rate": 1.2590812543379013e-07, - "loss": 2.3487, - "step": 571990 + "epoch": 0.96, + "learning_rate": 1.8295490646115846e-06, + "loss": 2.6975, + "step": 269900 }, { - "epoch": 1.0, - "learning_rate": 1.2503618550696332e-07, - "loss": 2.2199, - "step": 572000 + "epoch": 0.96, + "learning_rate": 1.8117015466659054e-06, + "loss": 2.687, + "step": 270000 }, { - "epoch": 1.0, - "learning_rate": 1.241642455801365e-07, - "loss": 2.3133, - "step": 572010 + "epoch": 0.96, + "learning_rate": 1.793854028720226e-06, + "loss": 2.6801, + "step": 270100 }, { - "epoch": 1.0, - "learning_rate": 1.2329230565330972e-07, - "loss": 2.2798, - "step": 572020 + "epoch": 0.96, + "learning_rate": 1.7760065107745468e-06, + "loss": 2.6872, + "step": 270200 }, { - "epoch": 1.0, - "learning_rate": 1.224203657264829e-07, - "loss": 2.2046, - "step": 572030 + "epoch": 0.96, + "learning_rate": 1.7581589928288673e-06, + "loss": 2.6981, + "step": 270300 }, { - "epoch": 1.0, - "learning_rate": 1.2154842579965612e-07, - "loss": 2.3744, - "step": 572040 + "epoch": 0.97, + "learning_rate": 1.740311474883188e-06, + "loss": 2.6815, + "step": 270400 }, { - "epoch": 1.0, - "learning_rate": 1.206764858728293e-07, - "loss": 2.4191, - "step": 572050 + "epoch": 0.97, + "learning_rate": 1.722463956937509e-06, + "loss": 2.685, + "step": 270500 }, { - "epoch": 1.0, - "learning_rate": 1.198045459460025e-07, - "loss": 2.2782, - "step": 572060 + "epoch": 0.97, + "learning_rate": 1.7046164389918295e-06, + "loss": 2.6959, + "step": 270600 }, { - "epoch": 1.0, - "learning_rate": 1.1893260601917571e-07, - "loss": 2.2361, - "step": 572070 + "epoch": 0.97, + "learning_rate": 1.68676892104615e-06, + "loss": 2.6866, + "step": 270700 }, { - "epoch": 1.0, - "learning_rate": 1.180606660923489e-07, - "loss": 2.2564, - "step": 572080 + "epoch": 0.97, + "learning_rate": 1.6689214031004707e-06, + "loss": 2.6828, + "step": 270800 }, { - "epoch": 1.0, - "learning_rate": 1.1718872616552211e-07, - "loss": 2.3162, - "step": 572090 + "epoch": 0.97, + "learning_rate": 1.6510738851547917e-06, + "loss": 2.6883, + "step": 270900 }, { - "epoch": 1.0, - "learning_rate": 1.163167862386953e-07, - "loss": 2.0648, - "step": 572100 + "epoch": 0.97, + "learning_rate": 1.6332263672091122e-06, + "loss": 2.6851, + "step": 271000 }, { - "epoch": 1.0, - "learning_rate": 1.1544484631186849e-07, - "loss": 2.2619, - "step": 572110 + "epoch": 0.97, + "learning_rate": 1.6153788492634328e-06, + "loss": 2.6877, + "step": 271100 }, { - "epoch": 1.0, - "learning_rate": 1.145729063850417e-07, - "loss": 2.2279, - "step": 572120 + "epoch": 0.97, + "learning_rate": 1.5975313313177538e-06, + "loss": 2.6836, + "step": 271200 }, { - "epoch": 1.0, - "learning_rate": 1.1370096645821489e-07, - "loss": 2.2867, - "step": 572130 + "epoch": 0.97, + "learning_rate": 1.5796838133720744e-06, + "loss": 2.6864, + "step": 271300 }, { - "epoch": 1.0, - "learning_rate": 1.128290265313881e-07, - "loss": 2.2815, - "step": 572140 + "epoch": 0.97, + "learning_rate": 1.5618362954263952e-06, + "loss": 2.68, + "step": 271400 }, { - "epoch": 1.0, - "learning_rate": 1.1195708660456129e-07, - "loss": 2.2185, - "step": 572150 + "epoch": 0.97, + "learning_rate": 1.5439887774807158e-06, + "loss": 2.6907, + "step": 271500 }, { - "epoch": 1.0, - "learning_rate": 1.110851466777345e-07, - "loss": 2.2817, - "step": 572160 + "epoch": 0.97, + "learning_rate": 1.5261412595350366e-06, + "loss": 2.6813, + "step": 271600 }, { - "epoch": 1.0, - "learning_rate": 1.1021320675090769e-07, - "loss": 2.3216, - "step": 572170 + "epoch": 0.97, + "learning_rate": 1.5082937415893574e-06, + "loss": 2.682, + "step": 271700 }, { - "epoch": 1.0, - "learning_rate": 1.0934126682408088e-07, - "loss": 2.2245, - "step": 572180 + "epoch": 0.97, + "learning_rate": 1.490446223643678e-06, + "loss": 2.6878, + "step": 271800 }, { - "epoch": 1.0, - "learning_rate": 1.084693268972541e-07, - "loss": 2.1478, - "step": 572190 + "epoch": 0.97, + "learning_rate": 1.4725987056979987e-06, + "loss": 2.6864, + "step": 271900 }, { - "epoch": 1.0, - "learning_rate": 1.0759738697042728e-07, - "loss": 2.262, - "step": 572200 + "epoch": 0.97, + "learning_rate": 1.4547511877523193e-06, + "loss": 2.6798, + "step": 272000 }, { - "epoch": 1.0, - "learning_rate": 1.067254470436005e-07, - "loss": 2.2436, - "step": 572210 + "epoch": 0.97, + "learning_rate": 1.43690366980664e-06, + "loss": 2.6884, + "step": 272100 }, { - "epoch": 1.0, - "learning_rate": 1.0585350711677368e-07, - "loss": 2.1952, - "step": 572220 + "epoch": 0.97, + "learning_rate": 1.4190561518609609e-06, + "loss": 2.6844, + "step": 272200 }, { - "epoch": 1.0, - "learning_rate": 1.0498156718994688e-07, - "loss": 2.1884, - "step": 572230 + "epoch": 0.97, + "learning_rate": 1.4012086339152815e-06, + "loss": 2.6828, + "step": 272300 }, { - "epoch": 1.0, - "learning_rate": 1.0410962726312009e-07, - "loss": 2.296, - "step": 572240 + "epoch": 0.97, + "learning_rate": 1.3833611159696023e-06, + "loss": 2.6909, + "step": 272400 }, { - "epoch": 1.0, - "learning_rate": 1.0323768733629329e-07, - "loss": 2.4044, - "step": 572250 + "epoch": 0.97, + "learning_rate": 1.365513598023923e-06, + "loss": 2.6864, + "step": 272500 }, { - "epoch": 1.0, - "learning_rate": 1.0236574740946649e-07, - "loss": 2.2555, - "step": 572260 + "epoch": 0.97, + "learning_rate": 1.3476660800782436e-06, + "loss": 2.6834, + "step": 272600 }, { - "epoch": 1.0, - "learning_rate": 1.0149380748263969e-07, - "loss": 2.3379, - "step": 572270 + "epoch": 0.97, + "learning_rate": 1.3298185621325644e-06, + "loss": 2.6892, + "step": 272700 }, { - "epoch": 1.0, - "learning_rate": 1.0062186755581288e-07, - "loss": 2.2583, - "step": 572280 + "epoch": 0.97, + "learning_rate": 1.311971044186885e-06, + "loss": 2.6802, + "step": 272800 }, { - "epoch": 1.0, - "learning_rate": 9.974992762898608e-08, - "loss": 2.2032, - "step": 572290 + "epoch": 0.97, + "learning_rate": 1.2941235262412056e-06, + "loss": 2.684, + "step": 272900 }, { - "epoch": 1.0, - "learning_rate": 9.887798770215928e-08, - "loss": 2.3011, - "step": 572300 + "epoch": 0.97, + "learning_rate": 1.2762760082955264e-06, + "loss": 2.6775, + "step": 273000 }, { - "epoch": 1.0, - "learning_rate": 9.800604777533248e-08, - "loss": 2.2918, - "step": 572310 + "epoch": 0.97, + "learning_rate": 1.258428490349847e-06, + "loss": 2.6922, + "step": 273100 }, { - "epoch": 1.0, - "learning_rate": 9.713410784850568e-08, - "loss": 2.2356, - "step": 572320 + "epoch": 0.98, + "learning_rate": 1.2405809724041677e-06, + "loss": 2.6803, + "step": 273200 }, { - "epoch": 1.0, - "learning_rate": 9.626216792167888e-08, - "loss": 2.2875, - "step": 572330 + "epoch": 0.98, + "learning_rate": 1.2227334544584885e-06, + "loss": 2.6858, + "step": 273300 }, { - "epoch": 1.0, - "learning_rate": 9.539022799485208e-08, - "loss": 2.2941, - "step": 572340 + "epoch": 0.98, + "learning_rate": 1.2048859365128091e-06, + "loss": 2.6886, + "step": 273400 }, { - "epoch": 1.0, - "learning_rate": 9.451828806802527e-08, - "loss": 2.3867, - "step": 572350 + "epoch": 0.98, + "learning_rate": 1.18703841856713e-06, + "loss": 2.6808, + "step": 273500 }, { - "epoch": 1.0, - "learning_rate": 9.364634814119847e-08, - "loss": 2.2459, - "step": 572360 + "epoch": 0.98, + "learning_rate": 1.1691909006214505e-06, + "loss": 2.6876, + "step": 273600 }, { - "epoch": 1.0, - "learning_rate": 9.277440821437167e-08, - "loss": 2.2183, - "step": 572370 + "epoch": 0.98, + "learning_rate": 1.1513433826757713e-06, + "loss": 2.6869, + "step": 273700 }, { - "epoch": 1.0, - "learning_rate": 9.190246828754487e-08, - "loss": 2.2926, - "step": 572380 + "epoch": 0.98, + "learning_rate": 1.133495864730092e-06, + "loss": 2.6812, + "step": 273800 }, { - "epoch": 1.0, - "learning_rate": 9.103052836071807e-08, - "loss": 2.2461, - "step": 572390 + "epoch": 0.98, + "learning_rate": 1.1156483467844126e-06, + "loss": 2.6768, + "step": 273900 }, { - "epoch": 1.0, - "learning_rate": 9.015858843389126e-08, - "loss": 2.172, - "step": 572400 + "epoch": 0.98, + "learning_rate": 1.0978008288387334e-06, + "loss": 2.6939, + "step": 274000 }, { - "epoch": 1.0, - "learning_rate": 8.928664850706446e-08, - "loss": 2.2275, - "step": 572410 + "epoch": 0.98, + "learning_rate": 1.0799533108930542e-06, + "loss": 2.6957, + "step": 274100 }, { - "epoch": 1.0, - "learning_rate": 8.841470858023766e-08, - "loss": 2.2887, - "step": 572420 + "epoch": 0.98, + "learning_rate": 1.0621057929473748e-06, + "loss": 2.6826, + "step": 274200 }, { - "epoch": 1.0, - "learning_rate": 8.754276865341086e-08, - "loss": 2.2779, - "step": 572430 + "epoch": 0.98, + "learning_rate": 1.0442582750016956e-06, + "loss": 2.681, + "step": 274300 }, { - "epoch": 1.0, - "learning_rate": 8.667082872658406e-08, - "loss": 2.3215, - "step": 572440 + "epoch": 0.98, + "learning_rate": 1.0264107570560162e-06, + "loss": 2.6763, + "step": 274400 }, { - "epoch": 1.0, - "learning_rate": 8.579888879975726e-08, - "loss": 2.2636, - "step": 572450 + "epoch": 0.98, + "learning_rate": 1.008563239110337e-06, + "loss": 2.6828, + "step": 274500 }, { - "epoch": 1.0, - "learning_rate": 8.492694887293045e-08, - "loss": 2.2799, - "step": 572460 + "epoch": 0.98, + "learning_rate": 9.907157211646578e-07, + "loss": 2.6802, + "step": 274600 }, { - "epoch": 1.0, - "learning_rate": 8.405500894610365e-08, - "loss": 2.346, - "step": 572470 + "epoch": 0.98, + "learning_rate": 9.728682032189783e-07, + "loss": 2.6733, + "step": 274700 }, { - "epoch": 1.0, - "learning_rate": 8.318306901927685e-08, - "loss": 2.231, - "step": 572480 + "epoch": 0.98, + "learning_rate": 9.550206852732991e-07, + "loss": 2.6931, + "step": 274800 }, { - "epoch": 1.0, - "learning_rate": 8.231112909245005e-08, - "loss": 2.2112, - "step": 572490 + "epoch": 0.98, + "learning_rate": 9.371731673276198e-07, + "loss": 2.6864, + "step": 274900 }, { - "epoch": 1.0, - "learning_rate": 8.143918916562325e-08, - "loss": 2.1321, - "step": 572500 + "epoch": 0.98, + "learning_rate": 9.193256493819405e-07, + "loss": 2.6891, + "step": 275000 }, { - "epoch": 1.0, - "learning_rate": 8.056724923879644e-08, - "loss": 2.2999, - "step": 572510 + "epoch": 0.98, + "learning_rate": 9.014781314362612e-07, + "loss": 2.686, + "step": 275100 }, { - "epoch": 1.0, - "learning_rate": 7.969530931196964e-08, - "loss": 2.2748, - "step": 572520 + "epoch": 0.98, + "learning_rate": 8.836306134905818e-07, + "loss": 2.6796, + "step": 275200 }, { - "epoch": 1.0, - "learning_rate": 7.882336938514284e-08, - "loss": 2.2668, - "step": 572530 + "epoch": 0.98, + "learning_rate": 8.657830955449026e-07, + "loss": 2.6936, + "step": 275300 }, { - "epoch": 1.0, - "learning_rate": 7.795142945831604e-08, - "loss": 2.2804, - "step": 572540 + "epoch": 0.98, + "learning_rate": 8.479355775992234e-07, + "loss": 2.6868, + "step": 275400 }, { - "epoch": 1.0, - "learning_rate": 7.707948953148924e-08, - "loss": 2.1993, - "step": 572550 + "epoch": 0.98, + "learning_rate": 8.300880596535439e-07, + "loss": 2.6777, + "step": 275500 }, { - "epoch": 1.0, - "learning_rate": 7.620754960466243e-08, - "loss": 2.2971, - "step": 572560 + "epoch": 0.98, + "learning_rate": 8.122405417078647e-07, + "loss": 2.6859, + "step": 275600 }, { - "epoch": 1.0, - "learning_rate": 7.533560967783563e-08, - "loss": 2.1637, - "step": 572570 + "epoch": 0.98, + "learning_rate": 7.943930237621855e-07, + "loss": 2.6915, + "step": 275700 }, { - "epoch": 1.0, - "learning_rate": 7.446366975100883e-08, - "loss": 2.1807, - "step": 572580 + "epoch": 0.98, + "learning_rate": 7.765455058165062e-07, + "loss": 2.6764, + "step": 275800 }, { - "epoch": 1.0, - "learning_rate": 7.359172982418203e-08, - "loss": 2.3349, - "step": 572590 + "epoch": 0.98, + "learning_rate": 7.586979878708269e-07, + "loss": 2.6742, + "step": 275900 }, { - "epoch": 1.0, - "learning_rate": 7.271978989735524e-08, - "loss": 2.2716, - "step": 572600 + "epoch": 0.99, + "learning_rate": 7.408504699251476e-07, + "loss": 2.6871, + "step": 276000 }, { - "epoch": 1.0, - "learning_rate": 7.184784997052844e-08, - "loss": 2.2836, - "step": 572610 + "epoch": 0.99, + "learning_rate": 7.230029519794683e-07, + "loss": 2.6726, + "step": 276100 }, { - "epoch": 1.0, - "learning_rate": 7.097591004370162e-08, - "loss": 2.1811, - "step": 572620 + "epoch": 0.99, + "learning_rate": 7.05155434033789e-07, + "loss": 2.6765, + "step": 276200 }, { - "epoch": 1.0, - "learning_rate": 7.010397011687482e-08, - "loss": 2.3288, - "step": 572630 + "epoch": 0.99, + "learning_rate": 6.873079160881096e-07, + "loss": 2.6749, + "step": 276300 }, { - "epoch": 1.0, - "learning_rate": 6.923203019004803e-08, - "loss": 2.263, - "step": 572640 + "epoch": 0.99, + "learning_rate": 6.694603981424303e-07, + "loss": 2.685, + "step": 276400 }, { - "epoch": 1.0, - "learning_rate": 6.836009026322123e-08, - "loss": 2.3822, - "step": 572650 + "epoch": 0.99, + "learning_rate": 6.51612880196751e-07, + "loss": 2.6819, + "step": 276500 }, { - "epoch": 1.0, - "learning_rate": 6.748815033639443e-08, - "loss": 2.2203, - "step": 572660 + "epoch": 0.99, + "learning_rate": 6.337653622510718e-07, + "loss": 2.6861, + "step": 276600 }, { - "epoch": 1.0, - "learning_rate": 6.661621040956763e-08, - "loss": 2.3216, - "step": 572670 + "epoch": 0.99, + "learning_rate": 6.159178443053925e-07, + "loss": 2.6946, + "step": 276700 }, { - "epoch": 1.0, - "learning_rate": 6.574427048274083e-08, - "loss": 2.3593, - "step": 572680 + "epoch": 0.99, + "learning_rate": 5.980703263597132e-07, + "loss": 2.6903, + "step": 276800 }, { - "epoch": 1.0, - "learning_rate": 6.487233055591402e-08, - "loss": 2.2006, - "step": 572690 + "epoch": 0.99, + "learning_rate": 5.802228084140338e-07, + "loss": 2.6886, + "step": 276900 }, { - "epoch": 1.0, - "learning_rate": 6.400039062908722e-08, - "loss": 2.2267, - "step": 572700 + "epoch": 0.99, + "learning_rate": 5.623752904683546e-07, + "loss": 2.6833, + "step": 277000 }, { - "epoch": 1.0, - "learning_rate": 6.312845070226042e-08, - "loss": 2.3224, - "step": 572710 + "epoch": 0.99, + "learning_rate": 5.445277725226753e-07, + "loss": 2.6829, + "step": 277100 }, { - "epoch": 1.0, - "learning_rate": 6.225651077543362e-08, - "loss": 2.2104, - "step": 572720 + "epoch": 0.99, + "learning_rate": 5.26680254576996e-07, + "loss": 2.69, + "step": 277200 }, { - "epoch": 1.0, - "learning_rate": 6.138457084860682e-08, - "loss": 2.2341, - "step": 572730 + "epoch": 0.99, + "learning_rate": 5.088327366313167e-07, + "loss": 2.6866, + "step": 277300 }, { - "epoch": 1.0, - "learning_rate": 6.051263092178002e-08, - "loss": 2.2437, - "step": 572740 + "epoch": 0.99, + "learning_rate": 4.909852186856375e-07, + "loss": 2.6755, + "step": 277400 }, { - "epoch": 1.0, - "learning_rate": 5.964069099495322e-08, - "loss": 2.2385, - "step": 572750 + "epoch": 0.99, + "learning_rate": 4.731377007399581e-07, + "loss": 2.6973, + "step": 277500 }, { - "epoch": 1.0, - "learning_rate": 5.8768751068126415e-08, - "loss": 2.1971, - "step": 572760 + "epoch": 0.99, + "learning_rate": 4.552901827942788e-07, + "loss": 2.6872, + "step": 277600 }, { - "epoch": 1.0, - "learning_rate": 5.7896811141299616e-08, - "loss": 2.2889, - "step": 572770 + "epoch": 0.99, + "learning_rate": 4.374426648485995e-07, + "loss": 2.6886, + "step": 277700 }, { - "epoch": 1.0, - "learning_rate": 5.702487121447281e-08, - "loss": 2.2758, - "step": 572780 + "epoch": 0.99, + "learning_rate": 4.195951469029203e-07, + "loss": 2.697, + "step": 277800 }, { - "epoch": 1.0, - "learning_rate": 5.6152931287646004e-08, - "loss": 2.3389, - "step": 572790 + "epoch": 0.99, + "learning_rate": 4.0174762895724097e-07, + "loss": 2.6859, + "step": 277900 }, { - "epoch": 1.0, - "learning_rate": 5.5280991360819205e-08, - "loss": 2.255, - "step": 572800 + "epoch": 0.99, + "learning_rate": 3.8390011101156165e-07, + "loss": 2.7017, + "step": 278000 }, { - "epoch": 1.0, - "learning_rate": 5.4409051433992406e-08, - "loss": 2.2077, - "step": 572810 + "epoch": 0.99, + "learning_rate": 3.6605259306588234e-07, + "loss": 2.6748, + "step": 278100 }, { - "epoch": 1.0, - "learning_rate": 5.3537111507165607e-08, - "loss": 2.2487, - "step": 572820 + "epoch": 0.99, + "learning_rate": 3.48205075120203e-07, + "loss": 2.6919, + "step": 278200 }, { - "epoch": 1.0, - "learning_rate": 5.26651715803388e-08, - "loss": 2.3189, - "step": 572830 + "epoch": 0.99, + "learning_rate": 3.3035755717452376e-07, + "loss": 2.6853, + "step": 278300 }, { - "epoch": 1.0, - "learning_rate": 5.1793231653512e-08, - "loss": 2.1325, - "step": 572840 + "epoch": 0.99, + "learning_rate": 3.1251003922884445e-07, + "loss": 2.6843, + "step": 278400 }, { - "epoch": 1.0, - "learning_rate": 5.09212917266852e-08, - "loss": 2.0689, - "step": 572850 + "epoch": 0.99, + "learning_rate": 2.946625212831652e-07, + "loss": 2.6747, + "step": 278500 }, { - "epoch": 1.0, - "learning_rate": 5.00493517998584e-08, - "loss": 2.4129, - "step": 572860 + "epoch": 0.99, + "learning_rate": 2.7681500333748587e-07, + "loss": 2.6838, + "step": 278600 }, { - "epoch": 1.0, - "learning_rate": 4.9177411873031604e-08, - "loss": 2.2581, - "step": 572870 + "epoch": 0.99, + "learning_rate": 2.589674853918066e-07, + "loss": 2.6912, + "step": 278700 }, { "epoch": 1.0, - "learning_rate": 4.83054719462048e-08, - "loss": 2.1987, - "step": 572880 + "learning_rate": 2.411199674461273e-07, + "loss": 2.6809, + "step": 278800 }, { "epoch": 1.0, - "learning_rate": 4.7433532019378e-08, - "loss": 2.2559, - "step": 572890 + "learning_rate": 2.23272449500448e-07, + "loss": 2.6763, + "step": 278900 }, { "epoch": 1.0, - "learning_rate": 4.656159209255119e-08, - "loss": 2.332, - "step": 572900 + "learning_rate": 2.0542493155476867e-07, + "loss": 2.6928, + "step": 279000 }, { "epoch": 1.0, - "learning_rate": 4.5689652165724394e-08, - "loss": 2.3371, - "step": 572910 + "learning_rate": 1.8757741360908938e-07, + "loss": 2.6839, + "step": 279100 }, { "epoch": 1.0, - "learning_rate": 4.481771223889759e-08, - "loss": 2.1172, - "step": 572920 + "learning_rate": 1.697298956634101e-07, + "loss": 2.6872, + "step": 279200 }, { "epoch": 1.0, - "learning_rate": 4.394577231207079e-08, - "loss": 2.3212, - "step": 572930 + "learning_rate": 1.518823777177308e-07, + "loss": 2.6973, + "step": 279300 }, { "epoch": 1.0, - "learning_rate": 4.307383238524399e-08, - "loss": 2.1773, - "step": 572940 + "learning_rate": 1.340348597720515e-07, + "loss": 2.706, + "step": 279400 }, { "epoch": 1.0, - "learning_rate": 4.2201892458417184e-08, - "loss": 2.2615, - "step": 572950 + "learning_rate": 1.1618734182637223e-07, + "loss": 2.6818, + "step": 279500 }, { "epoch": 1.0, - "learning_rate": 4.1329952531590385e-08, - "loss": 2.3336, - "step": 572960 + "learning_rate": 9.833982388069292e-08, + "loss": 2.6777, + "step": 279600 }, { "epoch": 1.0, - "learning_rate": 4.045801260476358e-08, - "loss": 2.3124, - "step": 572970 + "learning_rate": 8.049230593501362e-08, + "loss": 2.692, + "step": 279700 }, { "epoch": 1.0, - "learning_rate": 3.958607267793678e-08, - "loss": 2.254, - "step": 572980 + "learning_rate": 6.264478798933432e-08, + "loss": 2.6734, + "step": 279800 }, { "epoch": 1.0, - "learning_rate": 3.871413275110998e-08, - "loss": 2.1415, - "step": 572990 + "learning_rate": 4.4797270043655027e-08, + "loss": 2.6892, + "step": 279900 }, { "epoch": 1.0, - "learning_rate": 3.7842192824283175e-08, - "loss": 2.2239, - "step": 573000 + "learning_rate": 2.6949752097975735e-08, + "loss": 2.6823, + "step": 280000 } ], - "max_steps": 573434, + "max_steps": 280151, "num_train_epochs": 1, - "total_flos": 4.504923244855296e+18, + "total_flos": 7.58820243932971e+18, "trial_name": null, "trial_params": null }