{ "best_metric": null, "best_model_checkpoint": null, "epoch": 0.12815255279885177, "eval_steps": 500, "global_step": 5000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 1.7079419299743807e-09, "loss": 2.8359, "step": 1 }, { "epoch": 0.0, "learning_rate": 3.4158838599487614e-09, "loss": 2.4531, "step": 2 }, { "epoch": 0.0, "learning_rate": 5.123825789923143e-09, "loss": 2.2266, "step": 3 }, { "epoch": 0.0, "learning_rate": 6.831767719897523e-09, "loss": 2.5566, "step": 4 }, { "epoch": 0.0, "learning_rate": 8.539709649871904e-09, "loss": 2.7461, "step": 5 }, { "epoch": 0.0, "learning_rate": 1.0247651579846285e-08, "loss": 2.5, "step": 6 }, { "epoch": 0.0, "learning_rate": 1.1955593509820665e-08, "loss": 2.4414, "step": 7 }, { "epoch": 0.0, "learning_rate": 1.3663535439795045e-08, "loss": 2.5781, "step": 8 }, { "epoch": 0.0, "learning_rate": 1.5371477369769426e-08, "loss": 2.8516, "step": 9 }, { "epoch": 0.0, "learning_rate": 1.707941929974381e-08, "loss": 2.3164, "step": 10 }, { "epoch": 0.0, "learning_rate": 1.8787361229718188e-08, "loss": 2.6289, "step": 11 }, { "epoch": 0.0, "learning_rate": 2.049530315969257e-08, "loss": 2.1953, "step": 12 }, { "epoch": 0.0, "learning_rate": 2.220324508966695e-08, "loss": 2.8398, "step": 13 }, { "epoch": 0.0, "learning_rate": 2.391118701964133e-08, "loss": 2.748, "step": 14 }, { "epoch": 0.0, "learning_rate": 2.561912894961571e-08, "loss": 2.5137, "step": 15 }, { "epoch": 0.0, "learning_rate": 2.732707087959009e-08, "loss": 2.5234, "step": 16 }, { "epoch": 0.0, "learning_rate": 2.9035012809564473e-08, "loss": 3.0508, "step": 17 }, { "epoch": 0.0, "learning_rate": 3.074295473953885e-08, "loss": 2.9062, "step": 18 }, { "epoch": 0.0, "learning_rate": 3.2450896669513235e-08, "loss": 2.25, "step": 19 }, { "epoch": 0.0, "learning_rate": 3.415883859948762e-08, "loss": 2.2539, "step": 20 }, { "epoch": 0.0, "learning_rate": 3.5866780529461994e-08, "loss": 2.1191, "step": 21 }, { "epoch": 0.0, "learning_rate": 3.7574722459436376e-08, "loss": 2.3359, "step": 22 }, { "epoch": 0.0, "learning_rate": 3.928266438941076e-08, "loss": 2.041, "step": 23 }, { "epoch": 0.0, "learning_rate": 4.099060631938514e-08, "loss": 2.2305, "step": 24 }, { "epoch": 0.0, "learning_rate": 4.269854824935952e-08, "loss": 2.4023, "step": 25 }, { "epoch": 0.0, "learning_rate": 4.44064901793339e-08, "loss": 3.2969, "step": 26 }, { "epoch": 0.0, "learning_rate": 4.611443210930828e-08, "loss": 2.0156, "step": 27 }, { "epoch": 0.0, "learning_rate": 4.782237403928266e-08, "loss": 2.4844, "step": 28 }, { "epoch": 0.0, "learning_rate": 4.953031596925705e-08, "loss": 2.8926, "step": 29 }, { "epoch": 0.0, "learning_rate": 5.123825789923142e-08, "loss": 2.2285, "step": 30 }, { "epoch": 0.0, "learning_rate": 5.2946199829205806e-08, "loss": 2.832, "step": 31 }, { "epoch": 0.0, "learning_rate": 5.465414175918018e-08, "loss": 2.7812, "step": 32 }, { "epoch": 0.0, "learning_rate": 5.6362083689154564e-08, "loss": 1.9473, "step": 33 }, { "epoch": 0.0, "learning_rate": 5.807002561912895e-08, "loss": 2.3086, "step": 34 }, { "epoch": 0.0, "learning_rate": 5.977796754910333e-08, "loss": 2.4219, "step": 35 }, { "epoch": 0.0, "learning_rate": 6.14859094790777e-08, "loss": 2.8789, "step": 36 }, { "epoch": 0.0, "learning_rate": 6.31938514090521e-08, "loss": 2.0215, "step": 37 }, { "epoch": 0.0, "learning_rate": 6.490179333902647e-08, "loss": 2.2305, "step": 38 }, { "epoch": 0.0, "learning_rate": 6.660973526900085e-08, "loss": 2.3164, "step": 39 }, { "epoch": 0.0, "learning_rate": 6.831767719897524e-08, "loss": 2.2891, "step": 40 }, { "epoch": 0.0, "learning_rate": 7.002561912894961e-08, "loss": 2.0488, "step": 41 }, { "epoch": 0.0, "learning_rate": 7.173356105892399e-08, "loss": 2.1172, "step": 42 }, { "epoch": 0.0, "learning_rate": 7.344150298889836e-08, "loss": 2.4062, "step": 43 }, { "epoch": 0.0, "learning_rate": 7.514944491887275e-08, "loss": 2.1133, "step": 44 }, { "epoch": 0.0, "learning_rate": 7.685738684884714e-08, "loss": 2.084, "step": 45 }, { "epoch": 0.0, "learning_rate": 7.856532877882152e-08, "loss": 2.0781, "step": 46 }, { "epoch": 0.0, "learning_rate": 8.02732707087959e-08, "loss": 1.7383, "step": 47 }, { "epoch": 0.0, "learning_rate": 8.198121263877028e-08, "loss": 1.9531, "step": 48 }, { "epoch": 0.0, "learning_rate": 8.368915456874466e-08, "loss": 1.916, "step": 49 }, { "epoch": 0.0, "learning_rate": 8.539709649871903e-08, "loss": 1.9609, "step": 50 }, { "epoch": 0.0, "learning_rate": 8.710503842869342e-08, "loss": 2.1758, "step": 51 }, { "epoch": 0.0, "learning_rate": 8.88129803586678e-08, "loss": 2.0781, "step": 52 }, { "epoch": 0.0, "learning_rate": 9.052092228864218e-08, "loss": 2.0742, "step": 53 }, { "epoch": 0.0, "learning_rate": 9.222886421861656e-08, "loss": 1.9629, "step": 54 }, { "epoch": 0.0, "learning_rate": 9.393680614859094e-08, "loss": 1.9492, "step": 55 }, { "epoch": 0.0, "learning_rate": 9.564474807856532e-08, "loss": 1.75, "step": 56 }, { "epoch": 0.0, "learning_rate": 9.73526900085397e-08, "loss": 1.7578, "step": 57 }, { "epoch": 0.0, "learning_rate": 9.90606319385141e-08, "loss": 1.707, "step": 58 }, { "epoch": 0.0, "learning_rate": 1.0076857386848847e-07, "loss": 1.9395, "step": 59 }, { "epoch": 0.0, "learning_rate": 1.0247651579846285e-07, "loss": 1.6738, "step": 60 }, { "epoch": 0.0, "learning_rate": 1.0418445772843724e-07, "loss": 1.8789, "step": 61 }, { "epoch": 0.0, "learning_rate": 1.0589239965841161e-07, "loss": 1.7871, "step": 62 }, { "epoch": 0.0, "learning_rate": 1.0760034158838599e-07, "loss": 1.6641, "step": 63 }, { "epoch": 0.0, "learning_rate": 1.0930828351836036e-07, "loss": 1.6641, "step": 64 }, { "epoch": 0.0, "learning_rate": 1.1101622544833475e-07, "loss": 1.7539, "step": 65 }, { "epoch": 0.0, "learning_rate": 1.1272416737830913e-07, "loss": 1.6777, "step": 66 }, { "epoch": 0.0, "learning_rate": 1.144321093082835e-07, "loss": 1.4297, "step": 67 }, { "epoch": 0.0, "learning_rate": 1.161400512382579e-07, "loss": 1.5352, "step": 68 }, { "epoch": 0.0, "learning_rate": 1.1784799316823227e-07, "loss": 1.6836, "step": 69 }, { "epoch": 0.0, "learning_rate": 1.1955593509820666e-07, "loss": 1.373, "step": 70 }, { "epoch": 0.0, "learning_rate": 1.2126387702818105e-07, "loss": 1.4453, "step": 71 }, { "epoch": 0.0, "learning_rate": 1.229718189581554e-07, "loss": 1.5762, "step": 72 }, { "epoch": 0.0, "learning_rate": 1.246797608881298e-07, "loss": 1.7363, "step": 73 }, { "epoch": 0.0, "learning_rate": 1.263877028181042e-07, "loss": 1.54, "step": 74 }, { "epoch": 0.0, "learning_rate": 1.2809564474807855e-07, "loss": 1.4727, "step": 75 }, { "epoch": 0.0, "learning_rate": 1.2980358667805294e-07, "loss": 1.5723, "step": 76 }, { "epoch": 0.0, "learning_rate": 1.3151152860802733e-07, "loss": 1.5781, "step": 77 }, { "epoch": 0.0, "learning_rate": 1.332194705380017e-07, "loss": 1.8008, "step": 78 }, { "epoch": 0.0, "learning_rate": 1.3492741246797608e-07, "loss": 1.4004, "step": 79 }, { "epoch": 0.0, "learning_rate": 1.3663535439795047e-07, "loss": 1.6807, "step": 80 }, { "epoch": 0.0, "learning_rate": 1.3834329632792486e-07, "loss": 1.4199, "step": 81 }, { "epoch": 0.0, "learning_rate": 1.4005123825789922e-07, "loss": 1.2354, "step": 82 }, { "epoch": 0.0, "learning_rate": 1.417591801878736e-07, "loss": 1.2344, "step": 83 }, { "epoch": 0.0, "learning_rate": 1.4346712211784797e-07, "loss": 1.6914, "step": 84 }, { "epoch": 0.0, "learning_rate": 1.4517506404782236e-07, "loss": 1.5156, "step": 85 }, { "epoch": 0.0, "learning_rate": 1.4688300597779673e-07, "loss": 1.3789, "step": 86 }, { "epoch": 0.0, "learning_rate": 1.4859094790777114e-07, "loss": 1.6191, "step": 87 }, { "epoch": 0.0, "learning_rate": 1.502988898377455e-07, "loss": 1.4922, "step": 88 }, { "epoch": 0.0, "learning_rate": 1.520068317677199e-07, "loss": 1.4766, "step": 89 }, { "epoch": 0.0, "learning_rate": 1.5371477369769428e-07, "loss": 1.165, "step": 90 }, { "epoch": 0.0, "learning_rate": 1.5542271562766865e-07, "loss": 1.3555, "step": 91 }, { "epoch": 0.0, "learning_rate": 1.5713065755764303e-07, "loss": 1.3516, "step": 92 }, { "epoch": 0.0, "learning_rate": 1.588385994876174e-07, "loss": 1.543, "step": 93 }, { "epoch": 0.0, "learning_rate": 1.605465414175918e-07, "loss": 1.416, "step": 94 }, { "epoch": 0.0, "learning_rate": 1.6225448334756618e-07, "loss": 1.4863, "step": 95 }, { "epoch": 0.0, "learning_rate": 1.6396242527754057e-07, "loss": 1.4414, "step": 96 }, { "epoch": 0.0, "learning_rate": 1.6567036720751493e-07, "loss": 1.3887, "step": 97 }, { "epoch": 0.0, "learning_rate": 1.6737830913748932e-07, "loss": 1.4336, "step": 98 }, { "epoch": 0.0, "learning_rate": 1.6908625106746368e-07, "loss": 1.3652, "step": 99 }, { "epoch": 0.0, "learning_rate": 1.7079419299743807e-07, "loss": 1.4316, "step": 100 }, { "epoch": 0.0, "learning_rate": 1.7250213492741248e-07, "loss": 1.0703, "step": 101 }, { "epoch": 0.0, "learning_rate": 1.7421007685738685e-07, "loss": 1.4082, "step": 102 }, { "epoch": 0.0, "learning_rate": 1.7591801878736124e-07, "loss": 1.1934, "step": 103 }, { "epoch": 0.0, "learning_rate": 1.776259607173356e-07, "loss": 1.4219, "step": 104 }, { "epoch": 0.0, "learning_rate": 1.7933390264731e-07, "loss": 1.3633, "step": 105 }, { "epoch": 0.0, "learning_rate": 1.8104184457728435e-07, "loss": 1.4551, "step": 106 }, { "epoch": 0.0, "learning_rate": 1.8274978650725874e-07, "loss": 1.0342, "step": 107 }, { "epoch": 0.0, "learning_rate": 1.8445772843723313e-07, "loss": 1.0078, "step": 108 }, { "epoch": 0.0, "learning_rate": 1.8616567036720752e-07, "loss": 1.3086, "step": 109 }, { "epoch": 0.0, "learning_rate": 1.8787361229718188e-07, "loss": 1.3477, "step": 110 }, { "epoch": 0.0, "learning_rate": 1.8958155422715627e-07, "loss": 1.2305, "step": 111 }, { "epoch": 0.0, "learning_rate": 1.9128949615713063e-07, "loss": 1.3457, "step": 112 }, { "epoch": 0.0, "learning_rate": 1.9299743808710502e-07, "loss": 1.2266, "step": 113 }, { "epoch": 0.0, "learning_rate": 1.947053800170794e-07, "loss": 0.9448, "step": 114 }, { "epoch": 0.0, "learning_rate": 1.964133219470538e-07, "loss": 1.0908, "step": 115 }, { "epoch": 0.0, "learning_rate": 1.981212638770282e-07, "loss": 1.1914, "step": 116 }, { "epoch": 0.0, "learning_rate": 1.9982920580700255e-07, "loss": 1.2041, "step": 117 }, { "epoch": 0.0, "learning_rate": 2.0153714773697694e-07, "loss": 1.498, "step": 118 }, { "epoch": 0.0, "learning_rate": 2.032450896669513e-07, "loss": 1.5176, "step": 119 }, { "epoch": 0.0, "learning_rate": 2.049530315969257e-07, "loss": 1.4189, "step": 120 }, { "epoch": 0.0, "learning_rate": 2.0666097352690006e-07, "loss": 1.3984, "step": 121 }, { "epoch": 0.0, "learning_rate": 2.0836891545687447e-07, "loss": 1.3066, "step": 122 }, { "epoch": 0.0, "learning_rate": 2.1007685738684883e-07, "loss": 1.1553, "step": 123 }, { "epoch": 0.0, "learning_rate": 2.1178479931682322e-07, "loss": 1.3281, "step": 124 }, { "epoch": 0.0, "learning_rate": 2.1349274124679759e-07, "loss": 1.1719, "step": 125 }, { "epoch": 0.0, "learning_rate": 2.1520068317677198e-07, "loss": 1.0166, "step": 126 }, { "epoch": 0.0, "learning_rate": 2.1690862510674636e-07, "loss": 1.0801, "step": 127 }, { "epoch": 0.0, "learning_rate": 2.1861656703672073e-07, "loss": 1.2656, "step": 128 }, { "epoch": 0.0, "learning_rate": 2.2032450896669514e-07, "loss": 1.1465, "step": 129 }, { "epoch": 0.0, "learning_rate": 2.220324508966695e-07, "loss": 1.0635, "step": 130 }, { "epoch": 0.0, "learning_rate": 2.237403928266439e-07, "loss": 1.2129, "step": 131 }, { "epoch": 0.0, "learning_rate": 2.2544833475661826e-07, "loss": 1.126, "step": 132 }, { "epoch": 0.0, "learning_rate": 2.2715627668659265e-07, "loss": 1.2422, "step": 133 }, { "epoch": 0.0, "learning_rate": 2.28864218616567e-07, "loss": 1.1582, "step": 134 }, { "epoch": 0.0, "learning_rate": 2.305721605465414e-07, "loss": 1.0537, "step": 135 }, { "epoch": 0.0, "learning_rate": 2.322801024765158e-07, "loss": 1.2129, "step": 136 }, { "epoch": 0.0, "learning_rate": 2.3398804440649018e-07, "loss": 1.1875, "step": 137 }, { "epoch": 0.0, "learning_rate": 2.3569598633646454e-07, "loss": 0.9678, "step": 138 }, { "epoch": 0.0, "learning_rate": 2.3740392826643893e-07, "loss": 1.2578, "step": 139 }, { "epoch": 0.0, "learning_rate": 2.391118701964133e-07, "loss": 1.1621, "step": 140 }, { "epoch": 0.0, "learning_rate": 2.408198121263877e-07, "loss": 1.2871, "step": 141 }, { "epoch": 0.0, "learning_rate": 2.425277540563621e-07, "loss": 1.0742, "step": 142 }, { "epoch": 0.0, "learning_rate": 2.4423569598633643e-07, "loss": 1.0781, "step": 143 }, { "epoch": 0.0, "learning_rate": 2.459436379163108e-07, "loss": 1.1885, "step": 144 }, { "epoch": 0.0, "learning_rate": 2.476515798462852e-07, "loss": 1.1855, "step": 145 }, { "epoch": 0.0, "learning_rate": 2.493595217762596e-07, "loss": 1.2354, "step": 146 }, { "epoch": 0.0, "learning_rate": 2.51067463706234e-07, "loss": 1.0176, "step": 147 }, { "epoch": 0.0, "learning_rate": 2.527754056362084e-07, "loss": 1.0557, "step": 148 }, { "epoch": 0.0, "learning_rate": 2.544833475661827e-07, "loss": 1.1113, "step": 149 }, { "epoch": 0.0, "learning_rate": 2.561912894961571e-07, "loss": 1.4492, "step": 150 }, { "epoch": 0.0, "learning_rate": 2.578992314261315e-07, "loss": 1.1611, "step": 151 }, { "epoch": 0.0, "learning_rate": 2.596071733561059e-07, "loss": 1.1807, "step": 152 }, { "epoch": 0.0, "learning_rate": 2.6131511528608027e-07, "loss": 1.25, "step": 153 }, { "epoch": 0.0, "learning_rate": 2.6302305721605466e-07, "loss": 1.1367, "step": 154 }, { "epoch": 0.0, "learning_rate": 2.6473099914602905e-07, "loss": 1.2207, "step": 155 }, { "epoch": 0.0, "learning_rate": 2.664389410760034e-07, "loss": 1.2891, "step": 156 }, { "epoch": 0.0, "learning_rate": 2.681468830059778e-07, "loss": 1.2412, "step": 157 }, { "epoch": 0.0, "learning_rate": 2.6985482493595216e-07, "loss": 0.9463, "step": 158 }, { "epoch": 0.0, "learning_rate": 2.7156276686592655e-07, "loss": 1.2891, "step": 159 }, { "epoch": 0.0, "learning_rate": 2.7327070879590094e-07, "loss": 1.2041, "step": 160 }, { "epoch": 0.0, "learning_rate": 2.749786507258753e-07, "loss": 1.0771, "step": 161 }, { "epoch": 0.0, "learning_rate": 2.766865926558497e-07, "loss": 1.2969, "step": 162 }, { "epoch": 0.0, "learning_rate": 2.7839453458582406e-07, "loss": 1.4609, "step": 163 }, { "epoch": 0.0, "learning_rate": 2.8010247651579845e-07, "loss": 0.9658, "step": 164 }, { "epoch": 0.0, "learning_rate": 2.8181041844577283e-07, "loss": 1.0439, "step": 165 }, { "epoch": 0.0, "learning_rate": 2.835183603757472e-07, "loss": 1.1113, "step": 166 }, { "epoch": 0.0, "learning_rate": 2.852263023057216e-07, "loss": 1.3906, "step": 167 }, { "epoch": 0.0, "learning_rate": 2.8693424423569595e-07, "loss": 1.0508, "step": 168 }, { "epoch": 0.0, "learning_rate": 2.886421861656704e-07, "loss": 1.1279, "step": 169 }, { "epoch": 0.0, "learning_rate": 2.9035012809564473e-07, "loss": 1.2852, "step": 170 }, { "epoch": 0.0, "learning_rate": 2.920580700256191e-07, "loss": 0.8525, "step": 171 }, { "epoch": 0.0, "learning_rate": 2.9376601195559345e-07, "loss": 1.25, "step": 172 }, { "epoch": 0.0, "learning_rate": 2.954739538855679e-07, "loss": 1.0869, "step": 173 }, { "epoch": 0.0, "learning_rate": 2.971818958155423e-07, "loss": 1.2266, "step": 174 }, { "epoch": 0.0, "learning_rate": 2.988898377455166e-07, "loss": 1.4424, "step": 175 }, { "epoch": 0.0, "learning_rate": 3.00597779675491e-07, "loss": 0.9077, "step": 176 }, { "epoch": 0.0, "learning_rate": 3.023057216054654e-07, "loss": 1.1211, "step": 177 }, { "epoch": 0.0, "learning_rate": 3.040136635354398e-07, "loss": 1.252, "step": 178 }, { "epoch": 0.0, "learning_rate": 3.057216054654141e-07, "loss": 1.0664, "step": 179 }, { "epoch": 0.0, "learning_rate": 3.0742954739538857e-07, "loss": 1.0996, "step": 180 }, { "epoch": 0.0, "learning_rate": 3.0913748932536296e-07, "loss": 1.1709, "step": 181 }, { "epoch": 0.0, "learning_rate": 3.108454312553373e-07, "loss": 0.8936, "step": 182 }, { "epoch": 0.0, "learning_rate": 3.125533731853117e-07, "loss": 1.2891, "step": 183 }, { "epoch": 0.0, "learning_rate": 3.1426131511528607e-07, "loss": 1.0977, "step": 184 }, { "epoch": 0.0, "learning_rate": 3.1596925704526046e-07, "loss": 1.4473, "step": 185 }, { "epoch": 0.0, "learning_rate": 3.176771989752348e-07, "loss": 1.3115, "step": 186 }, { "epoch": 0.0, "learning_rate": 3.193851409052092e-07, "loss": 1.0586, "step": 187 }, { "epoch": 0.0, "learning_rate": 3.210930828351836e-07, "loss": 1.3301, "step": 188 }, { "epoch": 0.0, "learning_rate": 3.2280102476515796e-07, "loss": 1.126, "step": 189 }, { "epoch": 0.0, "learning_rate": 3.2450896669513235e-07, "loss": 0.9668, "step": 190 }, { "epoch": 0.0, "learning_rate": 3.2621690862510674e-07, "loss": 1.1221, "step": 191 }, { "epoch": 0.0, "learning_rate": 3.2792485055508113e-07, "loss": 1.291, "step": 192 }, { "epoch": 0.0, "learning_rate": 3.2963279248505547e-07, "loss": 1.1934, "step": 193 }, { "epoch": 0.0, "learning_rate": 3.3134073441502986e-07, "loss": 1.1357, "step": 194 }, { "epoch": 0.0, "learning_rate": 3.330486763450043e-07, "loss": 1.1934, "step": 195 }, { "epoch": 0.01, "learning_rate": 3.3475661827497863e-07, "loss": 1.2578, "step": 196 }, { "epoch": 0.01, "learning_rate": 3.36464560204953e-07, "loss": 1.1631, "step": 197 }, { "epoch": 0.01, "learning_rate": 3.3817250213492736e-07, "loss": 1.1602, "step": 198 }, { "epoch": 0.01, "learning_rate": 3.398804440649018e-07, "loss": 1.248, "step": 199 }, { "epoch": 0.01, "learning_rate": 3.4158838599487614e-07, "loss": 1.1162, "step": 200 }, { "epoch": 0.01, "learning_rate": 3.4329632792485053e-07, "loss": 1.1123, "step": 201 }, { "epoch": 0.01, "learning_rate": 3.4500426985482497e-07, "loss": 1.1084, "step": 202 }, { "epoch": 0.01, "learning_rate": 3.467122117847993e-07, "loss": 1.2285, "step": 203 }, { "epoch": 0.01, "learning_rate": 3.484201537147737e-07, "loss": 1.1211, "step": 204 }, { "epoch": 0.01, "learning_rate": 3.5012809564474803e-07, "loss": 1.0586, "step": 205 }, { "epoch": 0.01, "learning_rate": 3.5183603757472247e-07, "loss": 1.1143, "step": 206 }, { "epoch": 0.01, "learning_rate": 3.535439795046968e-07, "loss": 1.2773, "step": 207 }, { "epoch": 0.01, "learning_rate": 3.552519214346712e-07, "loss": 1.0332, "step": 208 }, { "epoch": 0.01, "learning_rate": 3.569598633646456e-07, "loss": 1.0371, "step": 209 }, { "epoch": 0.01, "learning_rate": 3.5866780529462e-07, "loss": 0.8853, "step": 210 }, { "epoch": 0.01, "learning_rate": 3.6037574722459437e-07, "loss": 1.1816, "step": 211 }, { "epoch": 0.01, "learning_rate": 3.620836891545687e-07, "loss": 1.1865, "step": 212 }, { "epoch": 0.01, "learning_rate": 3.637916310845431e-07, "loss": 1.2402, "step": 213 }, { "epoch": 0.01, "learning_rate": 3.654995730145175e-07, "loss": 1.1846, "step": 214 }, { "epoch": 0.01, "learning_rate": 3.6720751494449187e-07, "loss": 1.2129, "step": 215 }, { "epoch": 0.01, "learning_rate": 3.6891545687446626e-07, "loss": 1.1211, "step": 216 }, { "epoch": 0.01, "learning_rate": 3.7062339880444065e-07, "loss": 1.002, "step": 217 }, { "epoch": 0.01, "learning_rate": 3.7233134073441504e-07, "loss": 0.915, "step": 218 }, { "epoch": 0.01, "learning_rate": 3.7403928266438937e-07, "loss": 1.1201, "step": 219 }, { "epoch": 0.01, "learning_rate": 3.7574722459436376e-07, "loss": 1.0869, "step": 220 }, { "epoch": 0.01, "learning_rate": 3.7745516652433815e-07, "loss": 1.0088, "step": 221 }, { "epoch": 0.01, "learning_rate": 3.7916310845431254e-07, "loss": 0.9395, "step": 222 }, { "epoch": 0.01, "learning_rate": 3.8087105038428693e-07, "loss": 1.1514, "step": 223 }, { "epoch": 0.01, "learning_rate": 3.8257899231426127e-07, "loss": 0.9434, "step": 224 }, { "epoch": 0.01, "learning_rate": 3.842869342442357e-07, "loss": 0.9873, "step": 225 }, { "epoch": 0.01, "learning_rate": 3.8599487617421004e-07, "loss": 1.1006, "step": 226 }, { "epoch": 0.01, "learning_rate": 3.8770281810418443e-07, "loss": 1.0166, "step": 227 }, { "epoch": 0.01, "learning_rate": 3.894107600341588e-07, "loss": 1.2129, "step": 228 }, { "epoch": 0.01, "learning_rate": 3.911187019641332e-07, "loss": 1.1572, "step": 229 }, { "epoch": 0.01, "learning_rate": 3.928266438941076e-07, "loss": 0.9033, "step": 230 }, { "epoch": 0.01, "learning_rate": 3.9453458582408194e-07, "loss": 0.959, "step": 231 }, { "epoch": 0.01, "learning_rate": 3.962425277540564e-07, "loss": 1.1064, "step": 232 }, { "epoch": 0.01, "learning_rate": 3.979504696840307e-07, "loss": 1.1416, "step": 233 }, { "epoch": 0.01, "learning_rate": 3.996584116140051e-07, "loss": 1.3711, "step": 234 }, { "epoch": 0.01, "learning_rate": 4.0136635354397944e-07, "loss": 1.043, "step": 235 }, { "epoch": 0.01, "learning_rate": 4.030742954739539e-07, "loss": 1.0303, "step": 236 }, { "epoch": 0.01, "learning_rate": 4.0478223740392827e-07, "loss": 0.8579, "step": 237 }, { "epoch": 0.01, "learning_rate": 4.064901793339026e-07, "loss": 1.1992, "step": 238 }, { "epoch": 0.01, "learning_rate": 4.08198121263877e-07, "loss": 0.8105, "step": 239 }, { "epoch": 0.01, "learning_rate": 4.099060631938514e-07, "loss": 1.0303, "step": 240 }, { "epoch": 0.01, "learning_rate": 4.116140051238258e-07, "loss": 1.0039, "step": 241 }, { "epoch": 0.01, "learning_rate": 4.133219470538001e-07, "loss": 1.3086, "step": 242 }, { "epoch": 0.01, "learning_rate": 4.1502988898377455e-07, "loss": 1.1338, "step": 243 }, { "epoch": 0.01, "learning_rate": 4.1673783091374894e-07, "loss": 1.0273, "step": 244 }, { "epoch": 0.01, "learning_rate": 4.184457728437233e-07, "loss": 0.9795, "step": 245 }, { "epoch": 0.01, "learning_rate": 4.2015371477369767e-07, "loss": 0.9775, "step": 246 }, { "epoch": 0.01, "learning_rate": 4.2186165670367206e-07, "loss": 1.1836, "step": 247 }, { "epoch": 0.01, "learning_rate": 4.2356959863364645e-07, "loss": 1.1309, "step": 248 }, { "epoch": 0.01, "learning_rate": 4.252775405636208e-07, "loss": 1.1484, "step": 249 }, { "epoch": 0.01, "learning_rate": 4.2698548249359517e-07, "loss": 0.7554, "step": 250 }, { "epoch": 0.01, "learning_rate": 4.286934244235696e-07, "loss": 0.9375, "step": 251 }, { "epoch": 0.01, "learning_rate": 4.3040136635354395e-07, "loss": 1.1152, "step": 252 }, { "epoch": 0.01, "learning_rate": 4.3210930828351834e-07, "loss": 0.9209, "step": 253 }, { "epoch": 0.01, "learning_rate": 4.3381725021349273e-07, "loss": 0.9922, "step": 254 }, { "epoch": 0.01, "learning_rate": 4.355251921434671e-07, "loss": 1.0566, "step": 255 }, { "epoch": 0.01, "learning_rate": 4.3723313407344145e-07, "loss": 1.0693, "step": 256 }, { "epoch": 0.01, "learning_rate": 4.3894107600341584e-07, "loss": 1.0098, "step": 257 }, { "epoch": 0.01, "learning_rate": 4.406490179333903e-07, "loss": 1.2002, "step": 258 }, { "epoch": 0.01, "learning_rate": 4.423569598633646e-07, "loss": 1.0488, "step": 259 }, { "epoch": 0.01, "learning_rate": 4.44064901793339e-07, "loss": 1.1133, "step": 260 }, { "epoch": 0.01, "learning_rate": 4.4577284372331335e-07, "loss": 1.0498, "step": 261 }, { "epoch": 0.01, "learning_rate": 4.474807856532878e-07, "loss": 0.9395, "step": 262 }, { "epoch": 0.01, "learning_rate": 4.491887275832621e-07, "loss": 1.0898, "step": 263 }, { "epoch": 0.01, "learning_rate": 4.508966695132365e-07, "loss": 1.3242, "step": 264 }, { "epoch": 0.01, "learning_rate": 4.5260461144321096e-07, "loss": 0.8994, "step": 265 }, { "epoch": 0.01, "learning_rate": 4.543125533731853e-07, "loss": 1.0664, "step": 266 }, { "epoch": 0.01, "learning_rate": 4.560204953031597e-07, "loss": 0.8447, "step": 267 }, { "epoch": 0.01, "learning_rate": 4.57728437233134e-07, "loss": 0.9893, "step": 268 }, { "epoch": 0.01, "learning_rate": 4.5943637916310846e-07, "loss": 1.0898, "step": 269 }, { "epoch": 0.01, "learning_rate": 4.611443210930828e-07, "loss": 1.2002, "step": 270 }, { "epoch": 0.01, "learning_rate": 4.628522630230572e-07, "loss": 0.9106, "step": 271 }, { "epoch": 0.01, "learning_rate": 4.645602049530316e-07, "loss": 1.2363, "step": 272 }, { "epoch": 0.01, "learning_rate": 4.6626814688300596e-07, "loss": 1.3057, "step": 273 }, { "epoch": 0.01, "learning_rate": 4.6797608881298035e-07, "loss": 0.9131, "step": 274 }, { "epoch": 0.01, "learning_rate": 4.696840307429547e-07, "loss": 1.0869, "step": 275 }, { "epoch": 0.01, "learning_rate": 4.713919726729291e-07, "loss": 1.0244, "step": 276 }, { "epoch": 0.01, "learning_rate": 4.730999146029035e-07, "loss": 1.0195, "step": 277 }, { "epoch": 0.01, "learning_rate": 4.7480785653287786e-07, "loss": 1.0977, "step": 278 }, { "epoch": 0.01, "learning_rate": 4.7651579846285225e-07, "loss": 0.9365, "step": 279 }, { "epoch": 0.01, "learning_rate": 4.782237403928266e-07, "loss": 1.2754, "step": 280 }, { "epoch": 0.01, "learning_rate": 4.79931682322801e-07, "loss": 1.0928, "step": 281 }, { "epoch": 0.01, "learning_rate": 4.816396242527754e-07, "loss": 1.1465, "step": 282 }, { "epoch": 0.01, "learning_rate": 4.833475661827497e-07, "loss": 0.856, "step": 283 }, { "epoch": 0.01, "learning_rate": 4.850555081127242e-07, "loss": 1.1621, "step": 284 }, { "epoch": 0.01, "learning_rate": 4.867634500426985e-07, "loss": 1.0645, "step": 285 }, { "epoch": 0.01, "learning_rate": 4.884713919726729e-07, "loss": 1.0635, "step": 286 }, { "epoch": 0.01, "learning_rate": 4.901793339026473e-07, "loss": 1.1826, "step": 287 }, { "epoch": 0.01, "learning_rate": 4.918872758326216e-07, "loss": 0.9922, "step": 288 }, { "epoch": 0.01, "learning_rate": 4.935952177625961e-07, "loss": 1.2051, "step": 289 }, { "epoch": 0.01, "learning_rate": 4.953031596925704e-07, "loss": 1.0996, "step": 290 }, { "epoch": 0.01, "learning_rate": 4.970111016225449e-07, "loss": 1.1465, "step": 291 }, { "epoch": 0.01, "learning_rate": 4.987190435525192e-07, "loss": 0.959, "step": 292 }, { "epoch": 0.01, "learning_rate": 5.004269854824936e-07, "loss": 1.0752, "step": 293 }, { "epoch": 0.01, "learning_rate": 5.02134927412468e-07, "loss": 1.0166, "step": 294 }, { "epoch": 0.01, "learning_rate": 5.038428693424423e-07, "loss": 1.1826, "step": 295 }, { "epoch": 0.01, "learning_rate": 5.055508112724168e-07, "loss": 1.1201, "step": 296 }, { "epoch": 0.01, "learning_rate": 5.072587532023911e-07, "loss": 1.1641, "step": 297 }, { "epoch": 0.01, "learning_rate": 5.089666951323654e-07, "loss": 0.9453, "step": 298 }, { "epoch": 0.01, "learning_rate": 5.106746370623399e-07, "loss": 1.1025, "step": 299 }, { "epoch": 0.01, "learning_rate": 5.123825789923142e-07, "loss": 1.1543, "step": 300 }, { "epoch": 0.01, "learning_rate": 5.140905209222886e-07, "loss": 1.0498, "step": 301 }, { "epoch": 0.01, "learning_rate": 5.15798462852263e-07, "loss": 0.9502, "step": 302 }, { "epoch": 0.01, "learning_rate": 5.175064047822374e-07, "loss": 1.1162, "step": 303 }, { "epoch": 0.01, "learning_rate": 5.192143467122118e-07, "loss": 0.8975, "step": 304 }, { "epoch": 0.01, "learning_rate": 5.209222886421861e-07, "loss": 1.4521, "step": 305 }, { "epoch": 0.01, "learning_rate": 5.226302305721605e-07, "loss": 1.1406, "step": 306 }, { "epoch": 0.01, "learning_rate": 5.243381725021349e-07, "loss": 1.1289, "step": 307 }, { "epoch": 0.01, "learning_rate": 5.260461144321093e-07, "loss": 1.064, "step": 308 }, { "epoch": 0.01, "learning_rate": 5.277540563620837e-07, "loss": 0.9507, "step": 309 }, { "epoch": 0.01, "learning_rate": 5.294619982920581e-07, "loss": 1.1094, "step": 310 }, { "epoch": 0.01, "learning_rate": 5.311699402220324e-07, "loss": 0.9355, "step": 311 }, { "epoch": 0.01, "learning_rate": 5.328778821520068e-07, "loss": 1.1289, "step": 312 }, { "epoch": 0.01, "learning_rate": 5.345858240819812e-07, "loss": 1.2461, "step": 313 }, { "epoch": 0.01, "learning_rate": 5.362937660119555e-07, "loss": 1.1348, "step": 314 }, { "epoch": 0.01, "learning_rate": 5.3800170794193e-07, "loss": 0.9053, "step": 315 }, { "epoch": 0.01, "learning_rate": 5.397096498719043e-07, "loss": 1.1006, "step": 316 }, { "epoch": 0.01, "learning_rate": 5.414175918018788e-07, "loss": 1.0391, "step": 317 }, { "epoch": 0.01, "learning_rate": 5.431255337318531e-07, "loss": 0.9883, "step": 318 }, { "epoch": 0.01, "learning_rate": 5.448334756618274e-07, "loss": 1.1436, "step": 319 }, { "epoch": 0.01, "learning_rate": 5.465414175918019e-07, "loss": 1.0342, "step": 320 }, { "epoch": 0.01, "learning_rate": 5.482493595217762e-07, "loss": 0.8926, "step": 321 }, { "epoch": 0.01, "learning_rate": 5.499573014517506e-07, "loss": 0.9258, "step": 322 }, { "epoch": 0.01, "learning_rate": 5.51665243381725e-07, "loss": 0.9902, "step": 323 }, { "epoch": 0.01, "learning_rate": 5.533731853116994e-07, "loss": 0.9766, "step": 324 }, { "epoch": 0.01, "learning_rate": 5.550811272416738e-07, "loss": 1.0791, "step": 325 }, { "epoch": 0.01, "learning_rate": 5.567890691716481e-07, "loss": 0.8574, "step": 326 }, { "epoch": 0.01, "learning_rate": 5.584970111016226e-07, "loss": 1.1416, "step": 327 }, { "epoch": 0.01, "learning_rate": 5.602049530315969e-07, "loss": 1.0605, "step": 328 }, { "epoch": 0.01, "learning_rate": 5.619128949615712e-07, "loss": 0.9629, "step": 329 }, { "epoch": 0.01, "learning_rate": 5.636208368915457e-07, "loss": 1.3828, "step": 330 }, { "epoch": 0.01, "learning_rate": 5.653287788215201e-07, "loss": 1.0889, "step": 331 }, { "epoch": 0.01, "learning_rate": 5.670367207514944e-07, "loss": 1.0586, "step": 332 }, { "epoch": 0.01, "learning_rate": 5.687446626814688e-07, "loss": 1.0518, "step": 333 }, { "epoch": 0.01, "learning_rate": 5.704526046114432e-07, "loss": 0.9277, "step": 334 }, { "epoch": 0.01, "learning_rate": 5.721605465414176e-07, "loss": 1.1211, "step": 335 }, { "epoch": 0.01, "learning_rate": 5.738684884713919e-07, "loss": 1.084, "step": 336 }, { "epoch": 0.01, "learning_rate": 5.755764304013662e-07, "loss": 0.9268, "step": 337 }, { "epoch": 0.01, "learning_rate": 5.772843723313408e-07, "loss": 1.1348, "step": 338 }, { "epoch": 0.01, "learning_rate": 5.789923142613151e-07, "loss": 1.0332, "step": 339 }, { "epoch": 0.01, "learning_rate": 5.807002561912895e-07, "loss": 0.8828, "step": 340 }, { "epoch": 0.01, "learning_rate": 5.824081981212639e-07, "loss": 0.8628, "step": 341 }, { "epoch": 0.01, "learning_rate": 5.841161400512382e-07, "loss": 1.0225, "step": 342 }, { "epoch": 0.01, "learning_rate": 5.858240819812126e-07, "loss": 0.6987, "step": 343 }, { "epoch": 0.01, "learning_rate": 5.875320239111869e-07, "loss": 0.9922, "step": 344 }, { "epoch": 0.01, "learning_rate": 5.892399658411615e-07, "loss": 0.9609, "step": 345 }, { "epoch": 0.01, "learning_rate": 5.909479077711358e-07, "loss": 1.0303, "step": 346 }, { "epoch": 0.01, "learning_rate": 5.926558497011101e-07, "loss": 1.0186, "step": 347 }, { "epoch": 0.01, "learning_rate": 5.943637916310846e-07, "loss": 0.9668, "step": 348 }, { "epoch": 0.01, "learning_rate": 5.960717335610589e-07, "loss": 1.0811, "step": 349 }, { "epoch": 0.01, "learning_rate": 5.977796754910332e-07, "loss": 1.0498, "step": 350 }, { "epoch": 0.01, "learning_rate": 5.994876174210076e-07, "loss": 1.2266, "step": 351 }, { "epoch": 0.01, "learning_rate": 6.01195559350982e-07, "loss": 1.1455, "step": 352 }, { "epoch": 0.01, "learning_rate": 6.029035012809565e-07, "loss": 0.8936, "step": 353 }, { "epoch": 0.01, "learning_rate": 6.046114432109308e-07, "loss": 0.9014, "step": 354 }, { "epoch": 0.01, "learning_rate": 6.063193851409052e-07, "loss": 0.9902, "step": 355 }, { "epoch": 0.01, "learning_rate": 6.080273270708796e-07, "loss": 1.1016, "step": 356 }, { "epoch": 0.01, "learning_rate": 6.097352690008539e-07, "loss": 0.9785, "step": 357 }, { "epoch": 0.01, "learning_rate": 6.114432109308282e-07, "loss": 0.9844, "step": 358 }, { "epoch": 0.01, "learning_rate": 6.131511528608027e-07, "loss": 1.0771, "step": 359 }, { "epoch": 0.01, "learning_rate": 6.148590947907771e-07, "loss": 0.9385, "step": 360 }, { "epoch": 0.01, "learning_rate": 6.165670367207515e-07, "loss": 0.9951, "step": 361 }, { "epoch": 0.01, "learning_rate": 6.182749786507259e-07, "loss": 1.0596, "step": 362 }, { "epoch": 0.01, "learning_rate": 6.199829205807002e-07, "loss": 0.8716, "step": 363 }, { "epoch": 0.01, "learning_rate": 6.216908625106746e-07, "loss": 0.9834, "step": 364 }, { "epoch": 0.01, "learning_rate": 6.233988044406489e-07, "loss": 1.1426, "step": 365 }, { "epoch": 0.01, "learning_rate": 6.251067463706234e-07, "loss": 1.0342, "step": 366 }, { "epoch": 0.01, "learning_rate": 6.268146883005978e-07, "loss": 1.1494, "step": 367 }, { "epoch": 0.01, "learning_rate": 6.285226302305721e-07, "loss": 1.1699, "step": 368 }, { "epoch": 0.01, "learning_rate": 6.302305721605466e-07, "loss": 1.1826, "step": 369 }, { "epoch": 0.01, "learning_rate": 6.319385140905209e-07, "loss": 0.9854, "step": 370 }, { "epoch": 0.01, "learning_rate": 6.336464560204953e-07, "loss": 0.8887, "step": 371 }, { "epoch": 0.01, "learning_rate": 6.353543979504696e-07, "loss": 0.7451, "step": 372 }, { "epoch": 0.01, "learning_rate": 6.37062339880444e-07, "loss": 0.9766, "step": 373 }, { "epoch": 0.01, "learning_rate": 6.387702818104184e-07, "loss": 1.3242, "step": 374 }, { "epoch": 0.01, "learning_rate": 6.404782237403928e-07, "loss": 1.0547, "step": 375 }, { "epoch": 0.01, "learning_rate": 6.421861656703673e-07, "loss": 0.9727, "step": 376 }, { "epoch": 0.01, "learning_rate": 6.438941076003416e-07, "loss": 0.6865, "step": 377 }, { "epoch": 0.01, "learning_rate": 6.456020495303159e-07, "loss": 0.9463, "step": 378 }, { "epoch": 0.01, "learning_rate": 6.473099914602903e-07, "loss": 0.9258, "step": 379 }, { "epoch": 0.01, "learning_rate": 6.490179333902647e-07, "loss": 1.1016, "step": 380 }, { "epoch": 0.01, "learning_rate": 6.50725875320239e-07, "loss": 0.9629, "step": 381 }, { "epoch": 0.01, "learning_rate": 6.524338172502135e-07, "loss": 0.9453, "step": 382 }, { "epoch": 0.01, "learning_rate": 6.541417591801879e-07, "loss": 0.8516, "step": 383 }, { "epoch": 0.01, "learning_rate": 6.558497011101623e-07, "loss": 0.9092, "step": 384 }, { "epoch": 0.01, "learning_rate": 6.575576430401366e-07, "loss": 1.1934, "step": 385 }, { "epoch": 0.01, "learning_rate": 6.592655849701109e-07, "loss": 1.0176, "step": 386 }, { "epoch": 0.01, "learning_rate": 6.609735269000854e-07, "loss": 0.9209, "step": 387 }, { "epoch": 0.01, "learning_rate": 6.626814688300597e-07, "loss": 0.8428, "step": 388 }, { "epoch": 0.01, "learning_rate": 6.64389410760034e-07, "loss": 1.083, "step": 389 }, { "epoch": 0.01, "learning_rate": 6.660973526900086e-07, "loss": 1.0059, "step": 390 }, { "epoch": 0.01, "learning_rate": 6.678052946199829e-07, "loss": 0.9551, "step": 391 }, { "epoch": 0.01, "learning_rate": 6.695132365499573e-07, "loss": 1.2363, "step": 392 }, { "epoch": 0.01, "learning_rate": 6.712211784799316e-07, "loss": 0.8877, "step": 393 }, { "epoch": 0.01, "learning_rate": 6.72929120409906e-07, "loss": 1.2549, "step": 394 }, { "epoch": 0.01, "learning_rate": 6.746370623398804e-07, "loss": 1.0254, "step": 395 }, { "epoch": 0.01, "learning_rate": 6.763450042698547e-07, "loss": 0.9619, "step": 396 }, { "epoch": 0.01, "learning_rate": 6.780529461998293e-07, "loss": 0.8408, "step": 397 }, { "epoch": 0.01, "learning_rate": 6.797608881298036e-07, "loss": 0.8213, "step": 398 }, { "epoch": 0.01, "learning_rate": 6.814688300597779e-07, "loss": 0.9805, "step": 399 }, { "epoch": 0.01, "learning_rate": 6.831767719897523e-07, "loss": 1.1094, "step": 400 }, { "epoch": 0.01, "learning_rate": 6.848847139197267e-07, "loss": 0.9609, "step": 401 }, { "epoch": 0.01, "learning_rate": 6.865926558497011e-07, "loss": 1.1543, "step": 402 }, { "epoch": 0.01, "learning_rate": 6.883005977796754e-07, "loss": 0.8228, "step": 403 }, { "epoch": 0.01, "learning_rate": 6.900085397096499e-07, "loss": 0.957, "step": 404 }, { "epoch": 0.01, "learning_rate": 6.917164816396243e-07, "loss": 0.9033, "step": 405 }, { "epoch": 0.01, "learning_rate": 6.934244235695986e-07, "loss": 1.1436, "step": 406 }, { "epoch": 0.01, "learning_rate": 6.951323654995729e-07, "loss": 1.1338, "step": 407 }, { "epoch": 0.01, "learning_rate": 6.968403074295474e-07, "loss": 0.9258, "step": 408 }, { "epoch": 0.01, "learning_rate": 6.985482493595217e-07, "loss": 1.0791, "step": 409 }, { "epoch": 0.01, "learning_rate": 7.002561912894961e-07, "loss": 1.166, "step": 410 }, { "epoch": 0.01, "learning_rate": 7.019641332194705e-07, "loss": 1.021, "step": 411 }, { "epoch": 0.01, "learning_rate": 7.036720751494449e-07, "loss": 1.0732, "step": 412 }, { "epoch": 0.01, "learning_rate": 7.053800170794193e-07, "loss": 1.0522, "step": 413 }, { "epoch": 0.01, "learning_rate": 7.070879590093936e-07, "loss": 1.0146, "step": 414 }, { "epoch": 0.01, "learning_rate": 7.087959009393681e-07, "loss": 0.9131, "step": 415 }, { "epoch": 0.01, "learning_rate": 7.105038428693424e-07, "loss": 1.0723, "step": 416 }, { "epoch": 0.01, "learning_rate": 7.122117847993167e-07, "loss": 0.814, "step": 417 }, { "epoch": 0.01, "learning_rate": 7.139197267292912e-07, "loss": 1.2051, "step": 418 }, { "epoch": 0.01, "learning_rate": 7.156276686592656e-07, "loss": 0.9053, "step": 419 }, { "epoch": 0.01, "learning_rate": 7.1733561058924e-07, "loss": 0.8457, "step": 420 }, { "epoch": 0.01, "learning_rate": 7.190435525192143e-07, "loss": 1.0205, "step": 421 }, { "epoch": 0.01, "learning_rate": 7.207514944491887e-07, "loss": 1.1445, "step": 422 }, { "epoch": 0.01, "learning_rate": 7.224594363791631e-07, "loss": 0.9727, "step": 423 }, { "epoch": 0.01, "learning_rate": 7.241673783091374e-07, "loss": 1.2812, "step": 424 }, { "epoch": 0.01, "learning_rate": 7.258753202391118e-07, "loss": 1.1436, "step": 425 }, { "epoch": 0.01, "learning_rate": 7.275832621690862e-07, "loss": 1.0098, "step": 426 }, { "epoch": 0.01, "learning_rate": 7.292912040990606e-07, "loss": 0.9795, "step": 427 }, { "epoch": 0.01, "learning_rate": 7.30999146029035e-07, "loss": 1.0107, "step": 428 }, { "epoch": 0.01, "learning_rate": 7.327070879590094e-07, "loss": 0.9326, "step": 429 }, { "epoch": 0.01, "learning_rate": 7.344150298889837e-07, "loss": 0.811, "step": 430 }, { "epoch": 0.01, "learning_rate": 7.361229718189581e-07, "loss": 1.0801, "step": 431 }, { "epoch": 0.01, "learning_rate": 7.378309137489325e-07, "loss": 1.0322, "step": 432 }, { "epoch": 0.01, "learning_rate": 7.395388556789069e-07, "loss": 0.8447, "step": 433 }, { "epoch": 0.01, "learning_rate": 7.412467976088813e-07, "loss": 0.916, "step": 434 }, { "epoch": 0.01, "learning_rate": 7.429547395388556e-07, "loss": 1.0225, "step": 435 }, { "epoch": 0.01, "learning_rate": 7.446626814688301e-07, "loss": 0.8467, "step": 436 }, { "epoch": 0.01, "learning_rate": 7.463706233988044e-07, "loss": 1.0645, "step": 437 }, { "epoch": 0.01, "learning_rate": 7.480785653287787e-07, "loss": 1.2012, "step": 438 }, { "epoch": 0.01, "learning_rate": 7.497865072587532e-07, "loss": 1.2334, "step": 439 }, { "epoch": 0.01, "learning_rate": 7.514944491887275e-07, "loss": 0.9316, "step": 440 }, { "epoch": 0.01, "learning_rate": 7.53202391118702e-07, "loss": 0.9658, "step": 441 }, { "epoch": 0.01, "learning_rate": 7.549103330486763e-07, "loss": 0.9922, "step": 442 }, { "epoch": 0.01, "learning_rate": 7.566182749786507e-07, "loss": 1.0156, "step": 443 }, { "epoch": 0.01, "learning_rate": 7.583262169086251e-07, "loss": 1.0127, "step": 444 }, { "epoch": 0.01, "learning_rate": 7.600341588385994e-07, "loss": 0.918, "step": 445 }, { "epoch": 0.01, "learning_rate": 7.617421007685739e-07, "loss": 1.0498, "step": 446 }, { "epoch": 0.01, "learning_rate": 7.634500426985482e-07, "loss": 0.959, "step": 447 }, { "epoch": 0.01, "learning_rate": 7.651579846285225e-07, "loss": 0.9277, "step": 448 }, { "epoch": 0.01, "learning_rate": 7.66865926558497e-07, "loss": 0.9609, "step": 449 }, { "epoch": 0.01, "learning_rate": 7.685738684884714e-07, "loss": 0.7563, "step": 450 }, { "epoch": 0.01, "learning_rate": 7.702818104184458e-07, "loss": 1.3008, "step": 451 }, { "epoch": 0.01, "learning_rate": 7.719897523484201e-07, "loss": 1.2383, "step": 452 }, { "epoch": 0.01, "learning_rate": 7.736976942783945e-07, "loss": 0.9932, "step": 453 }, { "epoch": 0.01, "learning_rate": 7.754056362083689e-07, "loss": 1.0752, "step": 454 }, { "epoch": 0.01, "learning_rate": 7.771135781383432e-07, "loss": 0.9736, "step": 455 }, { "epoch": 0.01, "learning_rate": 7.788215200683176e-07, "loss": 1.2686, "step": 456 }, { "epoch": 0.01, "learning_rate": 7.805294619982921e-07, "loss": 1.0439, "step": 457 }, { "epoch": 0.01, "learning_rate": 7.822374039282664e-07, "loss": 1.0811, "step": 458 }, { "epoch": 0.01, "learning_rate": 7.839453458582408e-07, "loss": 1.1406, "step": 459 }, { "epoch": 0.01, "learning_rate": 7.856532877882152e-07, "loss": 1.0122, "step": 460 }, { "epoch": 0.01, "learning_rate": 7.873612297181895e-07, "loss": 1.1104, "step": 461 }, { "epoch": 0.01, "learning_rate": 7.890691716481639e-07, "loss": 1.0459, "step": 462 }, { "epoch": 0.01, "learning_rate": 7.907771135781382e-07, "loss": 0.9883, "step": 463 }, { "epoch": 0.01, "learning_rate": 7.924850555081128e-07, "loss": 1.207, "step": 464 }, { "epoch": 0.01, "learning_rate": 7.941929974380871e-07, "loss": 0.9541, "step": 465 }, { "epoch": 0.01, "learning_rate": 7.959009393680614e-07, "loss": 1.0352, "step": 466 }, { "epoch": 0.01, "learning_rate": 7.976088812980359e-07, "loss": 0.9136, "step": 467 }, { "epoch": 0.01, "learning_rate": 7.993168232280102e-07, "loss": 1.0059, "step": 468 }, { "epoch": 0.01, "learning_rate": 8.010247651579845e-07, "loss": 0.8223, "step": 469 }, { "epoch": 0.01, "learning_rate": 8.027327070879589e-07, "loss": 0.8262, "step": 470 }, { "epoch": 0.01, "learning_rate": 8.044406490179334e-07, "loss": 1.0186, "step": 471 }, { "epoch": 0.01, "learning_rate": 8.061485909479078e-07, "loss": 0.7524, "step": 472 }, { "epoch": 0.01, "learning_rate": 8.078565328778821e-07, "loss": 0.8809, "step": 473 }, { "epoch": 0.01, "learning_rate": 8.095644748078565e-07, "loss": 0.8242, "step": 474 }, { "epoch": 0.01, "learning_rate": 8.112724167378309e-07, "loss": 1.0674, "step": 475 }, { "epoch": 0.01, "learning_rate": 8.129803586678052e-07, "loss": 1.0117, "step": 476 }, { "epoch": 0.01, "learning_rate": 8.146883005977796e-07, "loss": 1.0762, "step": 477 }, { "epoch": 0.01, "learning_rate": 8.16396242527754e-07, "loss": 0.9668, "step": 478 }, { "epoch": 0.01, "learning_rate": 8.181041844577284e-07, "loss": 1.0527, "step": 479 }, { "epoch": 0.01, "learning_rate": 8.198121263877028e-07, "loss": 1.0928, "step": 480 }, { "epoch": 0.01, "learning_rate": 8.215200683176772e-07, "loss": 1.1113, "step": 481 }, { "epoch": 0.01, "learning_rate": 8.232280102476516e-07, "loss": 0.8477, "step": 482 }, { "epoch": 0.01, "learning_rate": 8.249359521776259e-07, "loss": 0.9634, "step": 483 }, { "epoch": 0.01, "learning_rate": 8.266438941076002e-07, "loss": 0.9795, "step": 484 }, { "epoch": 0.01, "learning_rate": 8.283518360375747e-07, "loss": 1.0674, "step": 485 }, { "epoch": 0.01, "learning_rate": 8.300597779675491e-07, "loss": 1.0791, "step": 486 }, { "epoch": 0.01, "learning_rate": 8.317677198975234e-07, "loss": 1.0176, "step": 487 }, { "epoch": 0.01, "learning_rate": 8.334756618274979e-07, "loss": 0.9053, "step": 488 }, { "epoch": 0.01, "learning_rate": 8.351836037574722e-07, "loss": 0.9131, "step": 489 }, { "epoch": 0.01, "learning_rate": 8.368915456874466e-07, "loss": 1.2344, "step": 490 }, { "epoch": 0.01, "learning_rate": 8.385994876174209e-07, "loss": 1.0029, "step": 491 }, { "epoch": 0.01, "learning_rate": 8.403074295473953e-07, "loss": 1.0283, "step": 492 }, { "epoch": 0.01, "learning_rate": 8.420153714773698e-07, "loss": 0.9668, "step": 493 }, { "epoch": 0.01, "learning_rate": 8.437233134073441e-07, "loss": 1.2949, "step": 494 }, { "epoch": 0.01, "learning_rate": 8.454312553373186e-07, "loss": 1.0537, "step": 495 }, { "epoch": 0.01, "learning_rate": 8.471391972672929e-07, "loss": 1.0264, "step": 496 }, { "epoch": 0.01, "learning_rate": 8.488471391972672e-07, "loss": 0.9355, "step": 497 }, { "epoch": 0.01, "learning_rate": 8.505550811272416e-07, "loss": 1.123, "step": 498 }, { "epoch": 0.01, "learning_rate": 8.52263023057216e-07, "loss": 0.9248, "step": 499 }, { "epoch": 0.01, "learning_rate": 8.539709649871903e-07, "loss": 1.0684, "step": 500 }, { "epoch": 0.01, "learning_rate": 8.556789069171648e-07, "loss": 0.9834, "step": 501 }, { "epoch": 0.01, "learning_rate": 8.573868488471392e-07, "loss": 0.9893, "step": 502 }, { "epoch": 0.01, "learning_rate": 8.590947907771136e-07, "loss": 1.1426, "step": 503 }, { "epoch": 0.01, "learning_rate": 8.608027327070879e-07, "loss": 0.8242, "step": 504 }, { "epoch": 0.01, "learning_rate": 8.625106746370622e-07, "loss": 1.1387, "step": 505 }, { "epoch": 0.01, "learning_rate": 8.642186165670367e-07, "loss": 0.833, "step": 506 }, { "epoch": 0.01, "learning_rate": 8.65926558497011e-07, "loss": 1.1562, "step": 507 }, { "epoch": 0.01, "learning_rate": 8.676345004269855e-07, "loss": 0.9736, "step": 508 }, { "epoch": 0.01, "learning_rate": 8.693424423569599e-07, "loss": 1.168, "step": 509 }, { "epoch": 0.01, "learning_rate": 8.710503842869342e-07, "loss": 1.0205, "step": 510 }, { "epoch": 0.01, "learning_rate": 8.727583262169086e-07, "loss": 0.9839, "step": 511 }, { "epoch": 0.01, "learning_rate": 8.744662681468829e-07, "loss": 0.9004, "step": 512 }, { "epoch": 0.01, "learning_rate": 8.761742100768573e-07, "loss": 1.1885, "step": 513 }, { "epoch": 0.01, "learning_rate": 8.778821520068317e-07, "loss": 1.1719, "step": 514 }, { "epoch": 0.01, "learning_rate": 8.79590093936806e-07, "loss": 1.1523, "step": 515 }, { "epoch": 0.01, "learning_rate": 8.812980358667806e-07, "loss": 1.084, "step": 516 }, { "epoch": 0.01, "learning_rate": 8.830059777967549e-07, "loss": 1.209, "step": 517 }, { "epoch": 0.01, "learning_rate": 8.847139197267292e-07, "loss": 0.8115, "step": 518 }, { "epoch": 0.01, "learning_rate": 8.864218616567036e-07, "loss": 1.0215, "step": 519 }, { "epoch": 0.01, "learning_rate": 8.88129803586678e-07, "loss": 1.042, "step": 520 }, { "epoch": 0.01, "learning_rate": 8.898377455166524e-07, "loss": 1.0703, "step": 521 }, { "epoch": 0.01, "learning_rate": 8.915456874466267e-07, "loss": 0.9746, "step": 522 }, { "epoch": 0.01, "learning_rate": 8.932536293766012e-07, "loss": 0.9473, "step": 523 }, { "epoch": 0.01, "learning_rate": 8.949615713065756e-07, "loss": 0.9346, "step": 524 }, { "epoch": 0.01, "learning_rate": 8.966695132365499e-07, "loss": 0.9453, "step": 525 }, { "epoch": 0.01, "learning_rate": 8.983774551665242e-07, "loss": 1.0654, "step": 526 }, { "epoch": 0.01, "learning_rate": 9.000853970964987e-07, "loss": 1.0488, "step": 527 }, { "epoch": 0.01, "learning_rate": 9.01793339026473e-07, "loss": 0.9424, "step": 528 }, { "epoch": 0.01, "learning_rate": 9.035012809564474e-07, "loss": 0.8389, "step": 529 }, { "epoch": 0.01, "learning_rate": 9.052092228864219e-07, "loss": 1.1895, "step": 530 }, { "epoch": 0.01, "learning_rate": 9.069171648163962e-07, "loss": 1.0527, "step": 531 }, { "epoch": 0.01, "learning_rate": 9.086251067463706e-07, "loss": 0.9111, "step": 532 }, { "epoch": 0.01, "learning_rate": 9.103330486763449e-07, "loss": 0.9941, "step": 533 }, { "epoch": 0.01, "learning_rate": 9.120409906063194e-07, "loss": 1.0127, "step": 534 }, { "epoch": 0.01, "learning_rate": 9.137489325362937e-07, "loss": 1.0547, "step": 535 }, { "epoch": 0.01, "learning_rate": 9.15456874466268e-07, "loss": 0.9854, "step": 536 }, { "epoch": 0.01, "learning_rate": 9.171648163962425e-07, "loss": 0.9316, "step": 537 }, { "epoch": 0.01, "learning_rate": 9.188727583262169e-07, "loss": 0.9326, "step": 538 }, { "epoch": 0.01, "learning_rate": 9.205807002561913e-07, "loss": 1.0537, "step": 539 }, { "epoch": 0.01, "learning_rate": 9.222886421861656e-07, "loss": 0.917, "step": 540 }, { "epoch": 0.01, "learning_rate": 9.2399658411614e-07, "loss": 0.9658, "step": 541 }, { "epoch": 0.01, "learning_rate": 9.257045260461144e-07, "loss": 1.0029, "step": 542 }, { "epoch": 0.01, "learning_rate": 9.274124679760887e-07, "loss": 0.9424, "step": 543 }, { "epoch": 0.01, "learning_rate": 9.291204099060631e-07, "loss": 0.8638, "step": 544 }, { "epoch": 0.01, "learning_rate": 9.308283518360376e-07, "loss": 1.0195, "step": 545 }, { "epoch": 0.01, "learning_rate": 9.325362937660119e-07, "loss": 1.0195, "step": 546 }, { "epoch": 0.01, "learning_rate": 9.342442356959863e-07, "loss": 0.9619, "step": 547 }, { "epoch": 0.01, "learning_rate": 9.359521776259607e-07, "loss": 1.2627, "step": 548 }, { "epoch": 0.01, "learning_rate": 9.37660119555935e-07, "loss": 1.0508, "step": 549 }, { "epoch": 0.01, "learning_rate": 9.393680614859094e-07, "loss": 0.7354, "step": 550 }, { "epoch": 0.01, "learning_rate": 9.410760034158838e-07, "loss": 1.0186, "step": 551 }, { "epoch": 0.01, "learning_rate": 9.427839453458582e-07, "loss": 1.0352, "step": 552 }, { "epoch": 0.01, "learning_rate": 9.444918872758326e-07, "loss": 0.9785, "step": 553 }, { "epoch": 0.01, "learning_rate": 9.46199829205807e-07, "loss": 0.9395, "step": 554 }, { "epoch": 0.01, "learning_rate": 9.479077711357814e-07, "loss": 0.959, "step": 555 }, { "epoch": 0.01, "learning_rate": 9.496157130657557e-07, "loss": 0.9268, "step": 556 }, { "epoch": 0.01, "learning_rate": 9.5132365499573e-07, "loss": 0.9746, "step": 557 }, { "epoch": 0.01, "learning_rate": 9.530315969257045e-07, "loss": 0.7124, "step": 558 }, { "epoch": 0.01, "learning_rate": 9.547395388556788e-07, "loss": 0.8438, "step": 559 }, { "epoch": 0.01, "learning_rate": 9.564474807856533e-07, "loss": 1.1055, "step": 560 }, { "epoch": 0.01, "learning_rate": 9.581554227156277e-07, "loss": 0.8066, "step": 561 }, { "epoch": 0.01, "learning_rate": 9.59863364645602e-07, "loss": 0.8984, "step": 562 }, { "epoch": 0.01, "learning_rate": 9.615713065755764e-07, "loss": 0.9697, "step": 563 }, { "epoch": 0.01, "learning_rate": 9.632792485055508e-07, "loss": 0.9766, "step": 564 }, { "epoch": 0.01, "learning_rate": 9.64987190435525e-07, "loss": 1.0391, "step": 565 }, { "epoch": 0.01, "learning_rate": 9.666951323654995e-07, "loss": 0.8633, "step": 566 }, { "epoch": 0.01, "learning_rate": 9.68403074295474e-07, "loss": 1.002, "step": 567 }, { "epoch": 0.01, "learning_rate": 9.701110162254484e-07, "loss": 0.9912, "step": 568 }, { "epoch": 0.01, "learning_rate": 9.718189581554226e-07, "loss": 1.0107, "step": 569 }, { "epoch": 0.01, "learning_rate": 9.73526900085397e-07, "loss": 0.9365, "step": 570 }, { "epoch": 0.01, "learning_rate": 9.752348420153715e-07, "loss": 0.9604, "step": 571 }, { "epoch": 0.01, "learning_rate": 9.769427839453457e-07, "loss": 0.709, "step": 572 }, { "epoch": 0.01, "learning_rate": 9.786507258753202e-07, "loss": 0.8633, "step": 573 }, { "epoch": 0.01, "learning_rate": 9.803586678052946e-07, "loss": 1.0596, "step": 574 }, { "epoch": 0.01, "learning_rate": 9.82066609735269e-07, "loss": 1.1348, "step": 575 }, { "epoch": 0.01, "learning_rate": 9.837745516652433e-07, "loss": 1.0977, "step": 576 }, { "epoch": 0.01, "learning_rate": 9.854824935952177e-07, "loss": 0.7944, "step": 577 }, { "epoch": 0.01, "learning_rate": 9.871904355251922e-07, "loss": 0.9824, "step": 578 }, { "epoch": 0.01, "learning_rate": 9.888983774551664e-07, "loss": 1.0898, "step": 579 }, { "epoch": 0.01, "learning_rate": 9.906063193851408e-07, "loss": 0.8818, "step": 580 }, { "epoch": 0.01, "learning_rate": 9.923142613151153e-07, "loss": 1.1143, "step": 581 }, { "epoch": 0.01, "learning_rate": 9.940222032450897e-07, "loss": 0.8672, "step": 582 }, { "epoch": 0.01, "learning_rate": 9.95730145175064e-07, "loss": 1.0283, "step": 583 }, { "epoch": 0.01, "learning_rate": 9.974380871050384e-07, "loss": 0.8799, "step": 584 }, { "epoch": 0.01, "learning_rate": 9.991460290350128e-07, "loss": 1.1914, "step": 585 }, { "epoch": 0.02, "learning_rate": 1.0008539709649873e-06, "loss": 0.8599, "step": 586 }, { "epoch": 0.02, "learning_rate": 1.0025619128949615e-06, "loss": 1.0684, "step": 587 }, { "epoch": 0.02, "learning_rate": 1.004269854824936e-06, "loss": 1.001, "step": 588 }, { "epoch": 0.02, "learning_rate": 1.0059777967549104e-06, "loss": 0.9033, "step": 589 }, { "epoch": 0.02, "learning_rate": 1.0076857386848846e-06, "loss": 1.1318, "step": 590 }, { "epoch": 0.02, "learning_rate": 1.009393680614859e-06, "loss": 0.8853, "step": 591 }, { "epoch": 0.02, "learning_rate": 1.0111016225448335e-06, "loss": 0.9932, "step": 592 }, { "epoch": 0.02, "learning_rate": 1.0128095644748077e-06, "loss": 0.873, "step": 593 }, { "epoch": 0.02, "learning_rate": 1.0145175064047822e-06, "loss": 1.0547, "step": 594 }, { "epoch": 0.02, "learning_rate": 1.0162254483347566e-06, "loss": 0.9053, "step": 595 }, { "epoch": 0.02, "learning_rate": 1.0179333902647309e-06, "loss": 0.9551, "step": 596 }, { "epoch": 0.02, "learning_rate": 1.0196413321947053e-06, "loss": 1.0186, "step": 597 }, { "epoch": 0.02, "learning_rate": 1.0213492741246797e-06, "loss": 0.9121, "step": 598 }, { "epoch": 0.02, "learning_rate": 1.023057216054654e-06, "loss": 1.0146, "step": 599 }, { "epoch": 0.02, "learning_rate": 1.0247651579846284e-06, "loss": 1.1279, "step": 600 }, { "epoch": 0.02, "learning_rate": 1.0264730999146029e-06, "loss": 0.9238, "step": 601 }, { "epoch": 0.02, "learning_rate": 1.0281810418445773e-06, "loss": 1.0566, "step": 602 }, { "epoch": 0.02, "learning_rate": 1.0298889837745517e-06, "loss": 0.897, "step": 603 }, { "epoch": 0.02, "learning_rate": 1.031596925704526e-06, "loss": 0.9668, "step": 604 }, { "epoch": 0.02, "learning_rate": 1.0333048676345004e-06, "loss": 0.8691, "step": 605 }, { "epoch": 0.02, "learning_rate": 1.0350128095644749e-06, "loss": 0.8613, "step": 606 }, { "epoch": 0.02, "learning_rate": 1.036720751494449e-06, "loss": 1.1328, "step": 607 }, { "epoch": 0.02, "learning_rate": 1.0384286934244235e-06, "loss": 1.043, "step": 608 }, { "epoch": 0.02, "learning_rate": 1.040136635354398e-06, "loss": 0.7407, "step": 609 }, { "epoch": 0.02, "learning_rate": 1.0418445772843722e-06, "loss": 1.1055, "step": 610 }, { "epoch": 0.02, "learning_rate": 1.0435525192143466e-06, "loss": 1.042, "step": 611 }, { "epoch": 0.02, "learning_rate": 1.045260461144321e-06, "loss": 1.0234, "step": 612 }, { "epoch": 0.02, "learning_rate": 1.0469684030742953e-06, "loss": 1.0381, "step": 613 }, { "epoch": 0.02, "learning_rate": 1.0486763450042698e-06, "loss": 0.9014, "step": 614 }, { "epoch": 0.02, "learning_rate": 1.050384286934244e-06, "loss": 0.9463, "step": 615 }, { "epoch": 0.02, "learning_rate": 1.0520922288642186e-06, "loss": 1.1914, "step": 616 }, { "epoch": 0.02, "learning_rate": 1.053800170794193e-06, "loss": 0.9873, "step": 617 }, { "epoch": 0.02, "learning_rate": 1.0555081127241673e-06, "loss": 0.9131, "step": 618 }, { "epoch": 0.02, "learning_rate": 1.0572160546541418e-06, "loss": 1.1064, "step": 619 }, { "epoch": 0.02, "learning_rate": 1.0589239965841162e-06, "loss": 1.1885, "step": 620 }, { "epoch": 0.02, "learning_rate": 1.0606319385140904e-06, "loss": 0.9678, "step": 621 }, { "epoch": 0.02, "learning_rate": 1.0623398804440649e-06, "loss": 0.9121, "step": 622 }, { "epoch": 0.02, "learning_rate": 1.0640478223740393e-06, "loss": 0.9619, "step": 623 }, { "epoch": 0.02, "learning_rate": 1.0657557643040135e-06, "loss": 1.1855, "step": 624 }, { "epoch": 0.02, "learning_rate": 1.067463706233988e-06, "loss": 1.0947, "step": 625 }, { "epoch": 0.02, "learning_rate": 1.0691716481639624e-06, "loss": 1.0938, "step": 626 }, { "epoch": 0.02, "learning_rate": 1.0708795900939367e-06, "loss": 0.6758, "step": 627 }, { "epoch": 0.02, "learning_rate": 1.072587532023911e-06, "loss": 0.9932, "step": 628 }, { "epoch": 0.02, "learning_rate": 1.0742954739538853e-06, "loss": 0.9453, "step": 629 }, { "epoch": 0.02, "learning_rate": 1.07600341588386e-06, "loss": 0.9561, "step": 630 }, { "epoch": 0.02, "learning_rate": 1.0777113578138344e-06, "loss": 0.7319, "step": 631 }, { "epoch": 0.02, "learning_rate": 1.0794192997438087e-06, "loss": 0.9922, "step": 632 }, { "epoch": 0.02, "learning_rate": 1.081127241673783e-06, "loss": 1.0449, "step": 633 }, { "epoch": 0.02, "learning_rate": 1.0828351836037575e-06, "loss": 1.0742, "step": 634 }, { "epoch": 0.02, "learning_rate": 1.0845431255337318e-06, "loss": 1.1143, "step": 635 }, { "epoch": 0.02, "learning_rate": 1.0862510674637062e-06, "loss": 1.1494, "step": 636 }, { "epoch": 0.02, "learning_rate": 1.0879590093936807e-06, "loss": 0.8838, "step": 637 }, { "epoch": 0.02, "learning_rate": 1.0896669513236549e-06, "loss": 0.9619, "step": 638 }, { "epoch": 0.02, "learning_rate": 1.0913748932536293e-06, "loss": 0.915, "step": 639 }, { "epoch": 0.02, "learning_rate": 1.0930828351836038e-06, "loss": 0.9707, "step": 640 }, { "epoch": 0.02, "learning_rate": 1.094790777113578e-06, "loss": 1.0088, "step": 641 }, { "epoch": 0.02, "learning_rate": 1.0964987190435524e-06, "loss": 1.1182, "step": 642 }, { "epoch": 0.02, "learning_rate": 1.0982066609735267e-06, "loss": 1.1133, "step": 643 }, { "epoch": 0.02, "learning_rate": 1.0999146029035011e-06, "loss": 1.0312, "step": 644 }, { "epoch": 0.02, "learning_rate": 1.1016225448334758e-06, "loss": 0.9873, "step": 645 }, { "epoch": 0.02, "learning_rate": 1.10333048676345e-06, "loss": 1.1318, "step": 646 }, { "epoch": 0.02, "learning_rate": 1.1050384286934244e-06, "loss": 0.9844, "step": 647 }, { "epoch": 0.02, "learning_rate": 1.1067463706233989e-06, "loss": 0.9072, "step": 648 }, { "epoch": 0.02, "learning_rate": 1.1084543125533731e-06, "loss": 1.0332, "step": 649 }, { "epoch": 0.02, "learning_rate": 1.1101622544833476e-06, "loss": 0.8164, "step": 650 }, { "epoch": 0.02, "learning_rate": 1.111870196413322e-06, "loss": 0.9629, "step": 651 }, { "epoch": 0.02, "learning_rate": 1.1135781383432962e-06, "loss": 0.6284, "step": 652 }, { "epoch": 0.02, "learning_rate": 1.1152860802732707e-06, "loss": 0.8906, "step": 653 }, { "epoch": 0.02, "learning_rate": 1.1169940222032451e-06, "loss": 1.0557, "step": 654 }, { "epoch": 0.02, "learning_rate": 1.1187019641332193e-06, "loss": 1.0605, "step": 655 }, { "epoch": 0.02, "learning_rate": 1.1204099060631938e-06, "loss": 1.2363, "step": 656 }, { "epoch": 0.02, "learning_rate": 1.122117847993168e-06, "loss": 1.0537, "step": 657 }, { "epoch": 0.02, "learning_rate": 1.1238257899231425e-06, "loss": 0.9785, "step": 658 }, { "epoch": 0.02, "learning_rate": 1.125533731853117e-06, "loss": 0.9521, "step": 659 }, { "epoch": 0.02, "learning_rate": 1.1272416737830913e-06, "loss": 1.0654, "step": 660 }, { "epoch": 0.02, "learning_rate": 1.1289496157130658e-06, "loss": 0.6738, "step": 661 }, { "epoch": 0.02, "learning_rate": 1.1306575576430402e-06, "loss": 0.7402, "step": 662 }, { "epoch": 0.02, "learning_rate": 1.1323654995730145e-06, "loss": 1.084, "step": 663 }, { "epoch": 0.02, "learning_rate": 1.134073441502989e-06, "loss": 0.9072, "step": 664 }, { "epoch": 0.02, "learning_rate": 1.1357813834329633e-06, "loss": 1.0918, "step": 665 }, { "epoch": 0.02, "learning_rate": 1.1374893253629376e-06, "loss": 0.8584, "step": 666 }, { "epoch": 0.02, "learning_rate": 1.139197267292912e-06, "loss": 1.1641, "step": 667 }, { "epoch": 0.02, "learning_rate": 1.1409052092228865e-06, "loss": 0.8535, "step": 668 }, { "epoch": 0.02, "learning_rate": 1.1426131511528607e-06, "loss": 0.9209, "step": 669 }, { "epoch": 0.02, "learning_rate": 1.1443210930828351e-06, "loss": 0.9756, "step": 670 }, { "epoch": 0.02, "learning_rate": 1.1460290350128094e-06, "loss": 1.1562, "step": 671 }, { "epoch": 0.02, "learning_rate": 1.1477369769427838e-06, "loss": 0.9678, "step": 672 }, { "epoch": 0.02, "learning_rate": 1.1494449188727582e-06, "loss": 0.8994, "step": 673 }, { "epoch": 0.02, "learning_rate": 1.1511528608027325e-06, "loss": 0.9141, "step": 674 }, { "epoch": 0.02, "learning_rate": 1.1528608027327071e-06, "loss": 0.8994, "step": 675 }, { "epoch": 0.02, "learning_rate": 1.1545687446626816e-06, "loss": 1.166, "step": 676 }, { "epoch": 0.02, "learning_rate": 1.1562766865926558e-06, "loss": 0.9707, "step": 677 }, { "epoch": 0.02, "learning_rate": 1.1579846285226302e-06, "loss": 1.1758, "step": 678 }, { "epoch": 0.02, "learning_rate": 1.1596925704526047e-06, "loss": 0.9434, "step": 679 }, { "epoch": 0.02, "learning_rate": 1.161400512382579e-06, "loss": 1.0176, "step": 680 }, { "epoch": 0.02, "learning_rate": 1.1631084543125534e-06, "loss": 1.2666, "step": 681 }, { "epoch": 0.02, "learning_rate": 1.1648163962425278e-06, "loss": 1.0596, "step": 682 }, { "epoch": 0.02, "learning_rate": 1.166524338172502e-06, "loss": 0.9473, "step": 683 }, { "epoch": 0.02, "learning_rate": 1.1682322801024765e-06, "loss": 1.0088, "step": 684 }, { "epoch": 0.02, "learning_rate": 1.1699402220324507e-06, "loss": 0.9141, "step": 685 }, { "epoch": 0.02, "learning_rate": 1.1716481639624251e-06, "loss": 1.0713, "step": 686 }, { "epoch": 0.02, "learning_rate": 1.1733561058923996e-06, "loss": 0.9824, "step": 687 }, { "epoch": 0.02, "learning_rate": 1.1750640478223738e-06, "loss": 0.9385, "step": 688 }, { "epoch": 0.02, "learning_rate": 1.1767719897523483e-06, "loss": 1.0166, "step": 689 }, { "epoch": 0.02, "learning_rate": 1.178479931682323e-06, "loss": 0.8662, "step": 690 }, { "epoch": 0.02, "learning_rate": 1.1801878736122971e-06, "loss": 0.9346, "step": 691 }, { "epoch": 0.02, "learning_rate": 1.1818958155422716e-06, "loss": 0.7891, "step": 692 }, { "epoch": 0.02, "learning_rate": 1.183603757472246e-06, "loss": 1.0342, "step": 693 }, { "epoch": 0.02, "learning_rate": 1.1853116994022203e-06, "loss": 0.8042, "step": 694 }, { "epoch": 0.02, "learning_rate": 1.1870196413321947e-06, "loss": 1.0547, "step": 695 }, { "epoch": 0.02, "learning_rate": 1.1887275832621691e-06, "loss": 1.0205, "step": 696 }, { "epoch": 0.02, "learning_rate": 1.1904355251921434e-06, "loss": 0.9878, "step": 697 }, { "epoch": 0.02, "learning_rate": 1.1921434671221178e-06, "loss": 0.9795, "step": 698 }, { "epoch": 0.02, "learning_rate": 1.193851409052092e-06, "loss": 0.9092, "step": 699 }, { "epoch": 0.02, "learning_rate": 1.1955593509820665e-06, "loss": 0.8379, "step": 700 }, { "epoch": 0.02, "learning_rate": 1.197267292912041e-06, "loss": 0.9785, "step": 701 }, { "epoch": 0.02, "learning_rate": 1.1989752348420152e-06, "loss": 1.0195, "step": 702 }, { "epoch": 0.02, "learning_rate": 1.2006831767719896e-06, "loss": 0.8945, "step": 703 }, { "epoch": 0.02, "learning_rate": 1.202391118701964e-06, "loss": 1.0625, "step": 704 }, { "epoch": 0.02, "learning_rate": 1.2040990606319385e-06, "loss": 0.8818, "step": 705 }, { "epoch": 0.02, "learning_rate": 1.205807002561913e-06, "loss": 0.7749, "step": 706 }, { "epoch": 0.02, "learning_rate": 1.2075149444918874e-06, "loss": 1.0859, "step": 707 }, { "epoch": 0.02, "learning_rate": 1.2092228864218616e-06, "loss": 1.1035, "step": 708 }, { "epoch": 0.02, "learning_rate": 1.210930828351836e-06, "loss": 1.083, "step": 709 }, { "epoch": 0.02, "learning_rate": 1.2126387702818105e-06, "loss": 1.1172, "step": 710 }, { "epoch": 0.02, "learning_rate": 1.2143467122117847e-06, "loss": 0.8496, "step": 711 }, { "epoch": 0.02, "learning_rate": 1.2160546541417592e-06, "loss": 0.8213, "step": 712 }, { "epoch": 0.02, "learning_rate": 1.2177625960717334e-06, "loss": 1.0283, "step": 713 }, { "epoch": 0.02, "learning_rate": 1.2194705380017078e-06, "loss": 1.0127, "step": 714 }, { "epoch": 0.02, "learning_rate": 1.2211784799316823e-06, "loss": 0.998, "step": 715 }, { "epoch": 0.02, "learning_rate": 1.2228864218616565e-06, "loss": 1.0264, "step": 716 }, { "epoch": 0.02, "learning_rate": 1.224594363791631e-06, "loss": 0.9131, "step": 717 }, { "epoch": 0.02, "learning_rate": 1.2263023057216054e-06, "loss": 0.9854, "step": 718 }, { "epoch": 0.02, "learning_rate": 1.2280102476515798e-06, "loss": 0.9233, "step": 719 }, { "epoch": 0.02, "learning_rate": 1.2297181895815543e-06, "loss": 1.0811, "step": 720 }, { "epoch": 0.02, "learning_rate": 1.2314261315115287e-06, "loss": 0.8799, "step": 721 }, { "epoch": 0.02, "learning_rate": 1.233134073441503e-06, "loss": 1.0508, "step": 722 }, { "epoch": 0.02, "learning_rate": 1.2348420153714774e-06, "loss": 1.0869, "step": 723 }, { "epoch": 0.02, "learning_rate": 1.2365499573014518e-06, "loss": 1.002, "step": 724 }, { "epoch": 0.02, "learning_rate": 1.238257899231426e-06, "loss": 1.0117, "step": 725 }, { "epoch": 0.02, "learning_rate": 1.2399658411614005e-06, "loss": 0.8574, "step": 726 }, { "epoch": 0.02, "learning_rate": 1.2416737830913747e-06, "loss": 1.3379, "step": 727 }, { "epoch": 0.02, "learning_rate": 1.2433817250213492e-06, "loss": 0.9717, "step": 728 }, { "epoch": 0.02, "learning_rate": 1.2450896669513236e-06, "loss": 0.8809, "step": 729 }, { "epoch": 0.02, "learning_rate": 1.2467976088812978e-06, "loss": 0.8301, "step": 730 }, { "epoch": 0.02, "learning_rate": 1.2485055508112723e-06, "loss": 0.7637, "step": 731 }, { "epoch": 0.02, "learning_rate": 1.2502134927412467e-06, "loss": 0.6958, "step": 732 }, { "epoch": 0.02, "learning_rate": 1.251921434671221e-06, "loss": 1.1045, "step": 733 }, { "epoch": 0.02, "learning_rate": 1.2536293766011956e-06, "loss": 0.8911, "step": 734 }, { "epoch": 0.02, "learning_rate": 1.25533731853117e-06, "loss": 0.8438, "step": 735 }, { "epoch": 0.02, "learning_rate": 1.2570452604611443e-06, "loss": 1.1592, "step": 736 }, { "epoch": 0.02, "learning_rate": 1.2587532023911187e-06, "loss": 0.8154, "step": 737 }, { "epoch": 0.02, "learning_rate": 1.2604611443210932e-06, "loss": 0.9756, "step": 738 }, { "epoch": 0.02, "learning_rate": 1.2621690862510674e-06, "loss": 1.0635, "step": 739 }, { "epoch": 0.02, "learning_rate": 1.2638770281810418e-06, "loss": 0.9199, "step": 740 }, { "epoch": 0.02, "learning_rate": 1.265584970111016e-06, "loss": 0.7734, "step": 741 }, { "epoch": 0.02, "learning_rate": 1.2672929120409905e-06, "loss": 1.0293, "step": 742 }, { "epoch": 0.02, "learning_rate": 1.269000853970965e-06, "loss": 0.9814, "step": 743 }, { "epoch": 0.02, "learning_rate": 1.2707087959009392e-06, "loss": 0.9409, "step": 744 }, { "epoch": 0.02, "learning_rate": 1.2724167378309136e-06, "loss": 0.998, "step": 745 }, { "epoch": 0.02, "learning_rate": 1.274124679760888e-06, "loss": 1.0283, "step": 746 }, { "epoch": 0.02, "learning_rate": 1.2758326216908623e-06, "loss": 1.1074, "step": 747 }, { "epoch": 0.02, "learning_rate": 1.2775405636208367e-06, "loss": 0.6064, "step": 748 }, { "epoch": 0.02, "learning_rate": 1.2792485055508114e-06, "loss": 0.8022, "step": 749 }, { "epoch": 0.02, "learning_rate": 1.2809564474807856e-06, "loss": 1.0547, "step": 750 }, { "epoch": 0.02, "learning_rate": 1.28266438941076e-06, "loss": 0.9316, "step": 751 }, { "epoch": 0.02, "learning_rate": 1.2843723313407345e-06, "loss": 1.085, "step": 752 }, { "epoch": 0.02, "learning_rate": 1.2860802732707087e-06, "loss": 0.8472, "step": 753 }, { "epoch": 0.02, "learning_rate": 1.2877882152006832e-06, "loss": 1.0645, "step": 754 }, { "epoch": 0.02, "learning_rate": 1.2894961571306574e-06, "loss": 1.0449, "step": 755 }, { "epoch": 0.02, "learning_rate": 1.2912040990606319e-06, "loss": 1.0264, "step": 756 }, { "epoch": 0.02, "learning_rate": 1.2929120409906063e-06, "loss": 1.0244, "step": 757 }, { "epoch": 0.02, "learning_rate": 1.2946199829205805e-06, "loss": 0.8545, "step": 758 }, { "epoch": 0.02, "learning_rate": 1.296327924850555e-06, "loss": 1.1943, "step": 759 }, { "epoch": 0.02, "learning_rate": 1.2980358667805294e-06, "loss": 0.998, "step": 760 }, { "epoch": 0.02, "learning_rate": 1.2997438087105036e-06, "loss": 0.9805, "step": 761 }, { "epoch": 0.02, "learning_rate": 1.301451750640478e-06, "loss": 1.1426, "step": 762 }, { "epoch": 0.02, "learning_rate": 1.3031596925704525e-06, "loss": 1.1133, "step": 763 }, { "epoch": 0.02, "learning_rate": 1.304867634500427e-06, "loss": 1.1699, "step": 764 }, { "epoch": 0.02, "learning_rate": 1.3065755764304014e-06, "loss": 0.9077, "step": 765 }, { "epoch": 0.02, "learning_rate": 1.3082835183603758e-06, "loss": 0.8193, "step": 766 }, { "epoch": 0.02, "learning_rate": 1.30999146029035e-06, "loss": 0.7754, "step": 767 }, { "epoch": 0.02, "learning_rate": 1.3116994022203245e-06, "loss": 1.376, "step": 768 }, { "epoch": 0.02, "learning_rate": 1.313407344150299e-06, "loss": 1.0488, "step": 769 }, { "epoch": 0.02, "learning_rate": 1.3151152860802732e-06, "loss": 1.043, "step": 770 }, { "epoch": 0.02, "learning_rate": 1.3168232280102476e-06, "loss": 0.9512, "step": 771 }, { "epoch": 0.02, "learning_rate": 1.3185311699402219e-06, "loss": 0.9775, "step": 772 }, { "epoch": 0.02, "learning_rate": 1.3202391118701963e-06, "loss": 1.0596, "step": 773 }, { "epoch": 0.02, "learning_rate": 1.3219470538001707e-06, "loss": 1.1182, "step": 774 }, { "epoch": 0.02, "learning_rate": 1.323654995730145e-06, "loss": 0.9014, "step": 775 }, { "epoch": 0.02, "learning_rate": 1.3253629376601194e-06, "loss": 1.0137, "step": 776 }, { "epoch": 0.02, "learning_rate": 1.3270708795900939e-06, "loss": 1.1074, "step": 777 }, { "epoch": 0.02, "learning_rate": 1.328778821520068e-06, "loss": 0.8018, "step": 778 }, { "epoch": 0.02, "learning_rate": 1.3304867634500427e-06, "loss": 1.0273, "step": 779 }, { "epoch": 0.02, "learning_rate": 1.3321947053800172e-06, "loss": 1.123, "step": 780 }, { "epoch": 0.02, "learning_rate": 1.3339026473099914e-06, "loss": 1.1133, "step": 781 }, { "epoch": 0.02, "learning_rate": 1.3356105892399659e-06, "loss": 1.0449, "step": 782 }, { "epoch": 0.02, "learning_rate": 1.3373185311699403e-06, "loss": 1.001, "step": 783 }, { "epoch": 0.02, "learning_rate": 1.3390264730999145e-06, "loss": 0.8457, "step": 784 }, { "epoch": 0.02, "learning_rate": 1.340734415029889e-06, "loss": 1.0039, "step": 785 }, { "epoch": 0.02, "learning_rate": 1.3424423569598632e-06, "loss": 0.959, "step": 786 }, { "epoch": 0.02, "learning_rate": 1.3441502988898376e-06, "loss": 1.0107, "step": 787 }, { "epoch": 0.02, "learning_rate": 1.345858240819812e-06, "loss": 0.8447, "step": 788 }, { "epoch": 0.02, "learning_rate": 1.3475661827497863e-06, "loss": 1.0781, "step": 789 }, { "epoch": 0.02, "learning_rate": 1.3492741246797608e-06, "loss": 0.9902, "step": 790 }, { "epoch": 0.02, "learning_rate": 1.3509820666097352e-06, "loss": 1.0771, "step": 791 }, { "epoch": 0.02, "learning_rate": 1.3526900085397094e-06, "loss": 1.0342, "step": 792 }, { "epoch": 0.02, "learning_rate": 1.3543979504696839e-06, "loss": 1.0869, "step": 793 }, { "epoch": 0.02, "learning_rate": 1.3561058923996585e-06, "loss": 0.9365, "step": 794 }, { "epoch": 0.02, "learning_rate": 1.3578138343296328e-06, "loss": 1.0195, "step": 795 }, { "epoch": 0.02, "learning_rate": 1.3595217762596072e-06, "loss": 1.04, "step": 796 }, { "epoch": 0.02, "learning_rate": 1.3612297181895816e-06, "loss": 0.9233, "step": 797 }, { "epoch": 0.02, "learning_rate": 1.3629376601195559e-06, "loss": 1.1133, "step": 798 }, { "epoch": 0.02, "learning_rate": 1.3646456020495303e-06, "loss": 0.9268, "step": 799 }, { "epoch": 0.02, "learning_rate": 1.3663535439795045e-06, "loss": 1.1152, "step": 800 }, { "epoch": 0.02, "learning_rate": 1.368061485909479e-06, "loss": 0.9072, "step": 801 }, { "epoch": 0.02, "learning_rate": 1.3697694278394534e-06, "loss": 0.9512, "step": 802 }, { "epoch": 0.02, "learning_rate": 1.3714773697694277e-06, "loss": 1.0371, "step": 803 }, { "epoch": 0.02, "learning_rate": 1.3731853116994021e-06, "loss": 0.8809, "step": 804 }, { "epoch": 0.02, "learning_rate": 1.3748932536293765e-06, "loss": 0.7393, "step": 805 }, { "epoch": 0.02, "learning_rate": 1.3766011955593508e-06, "loss": 1.1621, "step": 806 }, { "epoch": 0.02, "learning_rate": 1.3783091374893252e-06, "loss": 0.9854, "step": 807 }, { "epoch": 0.02, "learning_rate": 1.3800170794192999e-06, "loss": 0.728, "step": 808 }, { "epoch": 0.02, "learning_rate": 1.381725021349274e-06, "loss": 0.8242, "step": 809 }, { "epoch": 0.02, "learning_rate": 1.3834329632792485e-06, "loss": 0.8809, "step": 810 }, { "epoch": 0.02, "learning_rate": 1.385140905209223e-06, "loss": 0.834, "step": 811 }, { "epoch": 0.02, "learning_rate": 1.3868488471391972e-06, "loss": 0.8906, "step": 812 }, { "epoch": 0.02, "learning_rate": 1.3885567890691717e-06, "loss": 0.9229, "step": 813 }, { "epoch": 0.02, "learning_rate": 1.3902647309991459e-06, "loss": 0.9111, "step": 814 }, { "epoch": 0.02, "learning_rate": 1.3919726729291203e-06, "loss": 0.9824, "step": 815 }, { "epoch": 0.02, "learning_rate": 1.3936806148590948e-06, "loss": 1.04, "step": 816 }, { "epoch": 0.02, "learning_rate": 1.395388556789069e-06, "loss": 0.8945, "step": 817 }, { "epoch": 0.02, "learning_rate": 1.3970964987190434e-06, "loss": 1.0371, "step": 818 }, { "epoch": 0.02, "learning_rate": 1.3988044406490179e-06, "loss": 1.0391, "step": 819 }, { "epoch": 0.02, "learning_rate": 1.4005123825789921e-06, "loss": 0.9834, "step": 820 }, { "epoch": 0.02, "learning_rate": 1.4022203245089666e-06, "loss": 1.0117, "step": 821 }, { "epoch": 0.02, "learning_rate": 1.403928266438941e-06, "loss": 1.1016, "step": 822 }, { "epoch": 0.02, "learning_rate": 1.4056362083689154e-06, "loss": 0.9141, "step": 823 }, { "epoch": 0.02, "learning_rate": 1.4073441502988899e-06, "loss": 0.8418, "step": 824 }, { "epoch": 0.02, "learning_rate": 1.4090520922288643e-06, "loss": 0.8779, "step": 825 }, { "epoch": 0.02, "learning_rate": 1.4107600341588386e-06, "loss": 0.9258, "step": 826 }, { "epoch": 0.02, "learning_rate": 1.412467976088813e-06, "loss": 1.0723, "step": 827 }, { "epoch": 0.02, "learning_rate": 1.4141759180187872e-06, "loss": 1.0674, "step": 828 }, { "epoch": 0.02, "learning_rate": 1.4158838599487617e-06, "loss": 1.2344, "step": 829 }, { "epoch": 0.02, "learning_rate": 1.4175918018787361e-06, "loss": 0.8555, "step": 830 }, { "epoch": 0.02, "learning_rate": 1.4192997438087103e-06, "loss": 1.168, "step": 831 }, { "epoch": 0.02, "learning_rate": 1.4210076857386848e-06, "loss": 0.8145, "step": 832 }, { "epoch": 0.02, "learning_rate": 1.4227156276686592e-06, "loss": 1.208, "step": 833 }, { "epoch": 0.02, "learning_rate": 1.4244235695986335e-06, "loss": 0.9678, "step": 834 }, { "epoch": 0.02, "learning_rate": 1.426131511528608e-06, "loss": 1.0273, "step": 835 }, { "epoch": 0.02, "learning_rate": 1.4278394534585823e-06, "loss": 1.0703, "step": 836 }, { "epoch": 0.02, "learning_rate": 1.4295473953885566e-06, "loss": 1.1152, "step": 837 }, { "epoch": 0.02, "learning_rate": 1.4312553373185312e-06, "loss": 1.001, "step": 838 }, { "epoch": 0.02, "learning_rate": 1.4329632792485057e-06, "loss": 1.0566, "step": 839 }, { "epoch": 0.02, "learning_rate": 1.43467122117848e-06, "loss": 0.8623, "step": 840 }, { "epoch": 0.02, "learning_rate": 1.4363791631084543e-06, "loss": 0.9131, "step": 841 }, { "epoch": 0.02, "learning_rate": 1.4380871050384286e-06, "loss": 1.0273, "step": 842 }, { "epoch": 0.02, "learning_rate": 1.439795046968403e-06, "loss": 0.9912, "step": 843 }, { "epoch": 0.02, "learning_rate": 1.4415029888983775e-06, "loss": 1.0156, "step": 844 }, { "epoch": 0.02, "learning_rate": 1.4432109308283517e-06, "loss": 0.7725, "step": 845 }, { "epoch": 0.02, "learning_rate": 1.4449188727583261e-06, "loss": 0.9414, "step": 846 }, { "epoch": 0.02, "learning_rate": 1.4466268146883006e-06, "loss": 0.8857, "step": 847 }, { "epoch": 0.02, "learning_rate": 1.4483347566182748e-06, "loss": 0.7764, "step": 848 }, { "epoch": 0.02, "learning_rate": 1.4500426985482492e-06, "loss": 1.0166, "step": 849 }, { "epoch": 0.02, "learning_rate": 1.4517506404782237e-06, "loss": 0.8965, "step": 850 }, { "epoch": 0.02, "learning_rate": 1.453458582408198e-06, "loss": 0.9111, "step": 851 }, { "epoch": 0.02, "learning_rate": 1.4551665243381724e-06, "loss": 0.9004, "step": 852 }, { "epoch": 0.02, "learning_rate": 1.456874466268147e-06, "loss": 1.082, "step": 853 }, { "epoch": 0.02, "learning_rate": 1.4585824081981212e-06, "loss": 0.8086, "step": 854 }, { "epoch": 0.02, "learning_rate": 1.4602903501280957e-06, "loss": 0.9932, "step": 855 }, { "epoch": 0.02, "learning_rate": 1.46199829205807e-06, "loss": 0.9355, "step": 856 }, { "epoch": 0.02, "learning_rate": 1.4637062339880444e-06, "loss": 1.0879, "step": 857 }, { "epoch": 0.02, "learning_rate": 1.4654141759180188e-06, "loss": 1.082, "step": 858 }, { "epoch": 0.02, "learning_rate": 1.467122117847993e-06, "loss": 0.834, "step": 859 }, { "epoch": 0.02, "learning_rate": 1.4688300597779675e-06, "loss": 0.8706, "step": 860 }, { "epoch": 0.02, "learning_rate": 1.470538001707942e-06, "loss": 1.0312, "step": 861 }, { "epoch": 0.02, "learning_rate": 1.4722459436379161e-06, "loss": 0.9141, "step": 862 }, { "epoch": 0.02, "learning_rate": 1.4739538855678906e-06, "loss": 1.3086, "step": 863 }, { "epoch": 0.02, "learning_rate": 1.475661827497865e-06, "loss": 0.9463, "step": 864 }, { "epoch": 0.02, "learning_rate": 1.4773697694278393e-06, "loss": 1.0088, "step": 865 }, { "epoch": 0.02, "learning_rate": 1.4790777113578137e-06, "loss": 1.1201, "step": 866 }, { "epoch": 0.02, "learning_rate": 1.480785653287788e-06, "loss": 1.0791, "step": 867 }, { "epoch": 0.02, "learning_rate": 1.4824935952177626e-06, "loss": 0.8369, "step": 868 }, { "epoch": 0.02, "learning_rate": 1.484201537147737e-06, "loss": 0.9839, "step": 869 }, { "epoch": 0.02, "learning_rate": 1.4859094790777113e-06, "loss": 0.9873, "step": 870 }, { "epoch": 0.02, "learning_rate": 1.4876174210076857e-06, "loss": 0.9912, "step": 871 }, { "epoch": 0.02, "learning_rate": 1.4893253629376601e-06, "loss": 1.0078, "step": 872 }, { "epoch": 0.02, "learning_rate": 1.4910333048676344e-06, "loss": 0.9521, "step": 873 }, { "epoch": 0.02, "learning_rate": 1.4927412467976088e-06, "loss": 1.0254, "step": 874 }, { "epoch": 0.02, "learning_rate": 1.4944491887275833e-06, "loss": 1.04, "step": 875 }, { "epoch": 0.02, "learning_rate": 1.4961571306575575e-06, "loss": 0.8369, "step": 876 }, { "epoch": 0.02, "learning_rate": 1.497865072587532e-06, "loss": 1.1191, "step": 877 }, { "epoch": 0.02, "learning_rate": 1.4995730145175064e-06, "loss": 0.9336, "step": 878 }, { "epoch": 0.02, "learning_rate": 1.5012809564474806e-06, "loss": 0.957, "step": 879 }, { "epoch": 0.02, "learning_rate": 1.502988898377455e-06, "loss": 0.8203, "step": 880 }, { "epoch": 0.02, "learning_rate": 1.5046968403074293e-06, "loss": 0.9077, "step": 881 }, { "epoch": 0.02, "learning_rate": 1.506404782237404e-06, "loss": 1.0049, "step": 882 }, { "epoch": 0.02, "learning_rate": 1.5081127241673784e-06, "loss": 1.0254, "step": 883 }, { "epoch": 0.02, "learning_rate": 1.5098206660973526e-06, "loss": 1.085, "step": 884 }, { "epoch": 0.02, "learning_rate": 1.511528608027327e-06, "loss": 0.8916, "step": 885 }, { "epoch": 0.02, "learning_rate": 1.5132365499573015e-06, "loss": 1.1279, "step": 886 }, { "epoch": 0.02, "learning_rate": 1.5149444918872757e-06, "loss": 1.1855, "step": 887 }, { "epoch": 0.02, "learning_rate": 1.5166524338172502e-06, "loss": 1.0742, "step": 888 }, { "epoch": 0.02, "learning_rate": 1.5183603757472246e-06, "loss": 1.0605, "step": 889 }, { "epoch": 0.02, "learning_rate": 1.5200683176771988e-06, "loss": 0.9053, "step": 890 }, { "epoch": 0.02, "learning_rate": 1.5217762596071733e-06, "loss": 1.0137, "step": 891 }, { "epoch": 0.02, "learning_rate": 1.5234842015371477e-06, "loss": 0.8271, "step": 892 }, { "epoch": 0.02, "learning_rate": 1.525192143467122e-06, "loss": 0.9521, "step": 893 }, { "epoch": 0.02, "learning_rate": 1.5269000853970964e-06, "loss": 1.1836, "step": 894 }, { "epoch": 0.02, "learning_rate": 1.5286080273270708e-06, "loss": 1.1328, "step": 895 }, { "epoch": 0.02, "learning_rate": 1.530315969257045e-06, "loss": 1.1211, "step": 896 }, { "epoch": 0.02, "learning_rate": 1.5320239111870197e-06, "loss": 0.8066, "step": 897 }, { "epoch": 0.02, "learning_rate": 1.533731853116994e-06, "loss": 1.124, "step": 898 }, { "epoch": 0.02, "learning_rate": 1.5354397950469684e-06, "loss": 0.9336, "step": 899 }, { "epoch": 0.02, "learning_rate": 1.5371477369769428e-06, "loss": 1.0684, "step": 900 }, { "epoch": 0.02, "learning_rate": 1.538855678906917e-06, "loss": 0.8394, "step": 901 }, { "epoch": 0.02, "learning_rate": 1.5405636208368915e-06, "loss": 0.7148, "step": 902 }, { "epoch": 0.02, "learning_rate": 1.542271562766866e-06, "loss": 0.8916, "step": 903 }, { "epoch": 0.02, "learning_rate": 1.5439795046968402e-06, "loss": 0.8721, "step": 904 }, { "epoch": 0.02, "learning_rate": 1.5456874466268146e-06, "loss": 1.0615, "step": 905 }, { "epoch": 0.02, "learning_rate": 1.547395388556789e-06, "loss": 1.0742, "step": 906 }, { "epoch": 0.02, "learning_rate": 1.5491033304867633e-06, "loss": 1.106, "step": 907 }, { "epoch": 0.02, "learning_rate": 1.5508112724167377e-06, "loss": 0.6533, "step": 908 }, { "epoch": 0.02, "learning_rate": 1.5525192143467122e-06, "loss": 0.8271, "step": 909 }, { "epoch": 0.02, "learning_rate": 1.5542271562766864e-06, "loss": 0.957, "step": 910 }, { "epoch": 0.02, "learning_rate": 1.5559350982066608e-06, "loss": 0.939, "step": 911 }, { "epoch": 0.02, "learning_rate": 1.5576430401366353e-06, "loss": 1.1309, "step": 912 }, { "epoch": 0.02, "learning_rate": 1.5593509820666097e-06, "loss": 0.9258, "step": 913 }, { "epoch": 0.02, "learning_rate": 1.5610589239965842e-06, "loss": 0.8096, "step": 914 }, { "epoch": 0.02, "learning_rate": 1.5627668659265584e-06, "loss": 0.9619, "step": 915 }, { "epoch": 0.02, "learning_rate": 1.5644748078565328e-06, "loss": 0.9287, "step": 916 }, { "epoch": 0.02, "learning_rate": 1.5661827497865073e-06, "loss": 0.8394, "step": 917 }, { "epoch": 0.02, "learning_rate": 1.5678906917164815e-06, "loss": 1.0352, "step": 918 }, { "epoch": 0.02, "learning_rate": 1.569598633646456e-06, "loss": 0.7988, "step": 919 }, { "epoch": 0.02, "learning_rate": 1.5713065755764304e-06, "loss": 1.0566, "step": 920 }, { "epoch": 0.02, "learning_rate": 1.5730145175064046e-06, "loss": 0.9941, "step": 921 }, { "epoch": 0.02, "learning_rate": 1.574722459436379e-06, "loss": 0.9443, "step": 922 }, { "epoch": 0.02, "learning_rate": 1.5764304013663535e-06, "loss": 1.1211, "step": 923 }, { "epoch": 0.02, "learning_rate": 1.5781383432963277e-06, "loss": 0.8564, "step": 924 }, { "epoch": 0.02, "learning_rate": 1.5798462852263022e-06, "loss": 1.1045, "step": 925 }, { "epoch": 0.02, "learning_rate": 1.5815542271562764e-06, "loss": 0.8726, "step": 926 }, { "epoch": 0.02, "learning_rate": 1.583262169086251e-06, "loss": 1.0859, "step": 927 }, { "epoch": 0.02, "learning_rate": 1.5849701110162255e-06, "loss": 1.3301, "step": 928 }, { "epoch": 0.02, "learning_rate": 1.5866780529461997e-06, "loss": 1.2305, "step": 929 }, { "epoch": 0.02, "learning_rate": 1.5883859948761742e-06, "loss": 0.9453, "step": 930 }, { "epoch": 0.02, "learning_rate": 1.5900939368061486e-06, "loss": 1.1299, "step": 931 }, { "epoch": 0.02, "learning_rate": 1.5918018787361229e-06, "loss": 0.8857, "step": 932 }, { "epoch": 0.02, "learning_rate": 1.5935098206660973e-06, "loss": 0.9326, "step": 933 }, { "epoch": 0.02, "learning_rate": 1.5952177625960717e-06, "loss": 0.8394, "step": 934 }, { "epoch": 0.02, "learning_rate": 1.596925704526046e-06, "loss": 1.1836, "step": 935 }, { "epoch": 0.02, "learning_rate": 1.5986336464560204e-06, "loss": 1.0166, "step": 936 }, { "epoch": 0.02, "learning_rate": 1.6003415883859949e-06, "loss": 1.0518, "step": 937 }, { "epoch": 0.02, "learning_rate": 1.602049530315969e-06, "loss": 0.9209, "step": 938 }, { "epoch": 0.02, "learning_rate": 1.6037574722459435e-06, "loss": 0.8721, "step": 939 }, { "epoch": 0.02, "learning_rate": 1.6054654141759178e-06, "loss": 1.1602, "step": 940 }, { "epoch": 0.02, "learning_rate": 1.6071733561058922e-06, "loss": 1.0078, "step": 941 }, { "epoch": 0.02, "learning_rate": 1.6088812980358669e-06, "loss": 0.8848, "step": 942 }, { "epoch": 0.02, "learning_rate": 1.610589239965841e-06, "loss": 0.833, "step": 943 }, { "epoch": 0.02, "learning_rate": 1.6122971818958155e-06, "loss": 0.8809, "step": 944 }, { "epoch": 0.02, "learning_rate": 1.61400512382579e-06, "loss": 0.9521, "step": 945 }, { "epoch": 0.02, "learning_rate": 1.6157130657557642e-06, "loss": 0.8433, "step": 946 }, { "epoch": 0.02, "learning_rate": 1.6174210076857386e-06, "loss": 0.6768, "step": 947 }, { "epoch": 0.02, "learning_rate": 1.619128949615713e-06, "loss": 0.9404, "step": 948 }, { "epoch": 0.02, "learning_rate": 1.6208368915456873e-06, "loss": 0.8823, "step": 949 }, { "epoch": 0.02, "learning_rate": 1.6225448334756618e-06, "loss": 0.9521, "step": 950 }, { "epoch": 0.02, "learning_rate": 1.6242527754056362e-06, "loss": 1.1934, "step": 951 }, { "epoch": 0.02, "learning_rate": 1.6259607173356104e-06, "loss": 1.041, "step": 952 }, { "epoch": 0.02, "learning_rate": 1.6276686592655849e-06, "loss": 1.0215, "step": 953 }, { "epoch": 0.02, "learning_rate": 1.629376601195559e-06, "loss": 0.8281, "step": 954 }, { "epoch": 0.02, "learning_rate": 1.6310845431255335e-06, "loss": 1.0557, "step": 955 }, { "epoch": 0.02, "learning_rate": 1.632792485055508e-06, "loss": 1.2266, "step": 956 }, { "epoch": 0.02, "learning_rate": 1.6345004269854824e-06, "loss": 1.0703, "step": 957 }, { "epoch": 0.02, "learning_rate": 1.6362083689154569e-06, "loss": 0.8506, "step": 958 }, { "epoch": 0.02, "learning_rate": 1.6379163108454313e-06, "loss": 1.1279, "step": 959 }, { "epoch": 0.02, "learning_rate": 1.6396242527754055e-06, "loss": 0.9316, "step": 960 }, { "epoch": 0.02, "learning_rate": 1.64133219470538e-06, "loss": 1.0254, "step": 961 }, { "epoch": 0.02, "learning_rate": 1.6430401366353544e-06, "loss": 0.8682, "step": 962 }, { "epoch": 0.02, "learning_rate": 1.6447480785653287e-06, "loss": 1.1543, "step": 963 }, { "epoch": 0.02, "learning_rate": 1.646456020495303e-06, "loss": 0.8853, "step": 964 }, { "epoch": 0.02, "learning_rate": 1.6481639624252775e-06, "loss": 0.9795, "step": 965 }, { "epoch": 0.02, "learning_rate": 1.6498719043552518e-06, "loss": 1.0537, "step": 966 }, { "epoch": 0.02, "learning_rate": 1.6515798462852262e-06, "loss": 1.0938, "step": 967 }, { "epoch": 0.02, "learning_rate": 1.6532877882152004e-06, "loss": 1.0791, "step": 968 }, { "epoch": 0.02, "learning_rate": 1.6549957301451749e-06, "loss": 0.7156, "step": 969 }, { "epoch": 0.02, "learning_rate": 1.6567036720751493e-06, "loss": 1.0244, "step": 970 }, { "epoch": 0.02, "learning_rate": 1.6584116140051238e-06, "loss": 1.0127, "step": 971 }, { "epoch": 0.02, "learning_rate": 1.6601195559350982e-06, "loss": 0.958, "step": 972 }, { "epoch": 0.02, "learning_rate": 1.6618274978650727e-06, "loss": 1.126, "step": 973 }, { "epoch": 0.02, "learning_rate": 1.6635354397950469e-06, "loss": 1.1924, "step": 974 }, { "epoch": 0.02, "learning_rate": 1.6652433817250213e-06, "loss": 1.1172, "step": 975 }, { "epoch": 0.03, "learning_rate": 1.6669513236549958e-06, "loss": 0.9131, "step": 976 }, { "epoch": 0.03, "learning_rate": 1.66865926558497e-06, "loss": 0.9766, "step": 977 }, { "epoch": 0.03, "learning_rate": 1.6703672075149444e-06, "loss": 0.7871, "step": 978 }, { "epoch": 0.03, "learning_rate": 1.6720751494449189e-06, "loss": 1.085, "step": 979 }, { "epoch": 0.03, "learning_rate": 1.6737830913748931e-06, "loss": 0.9561, "step": 980 }, { "epoch": 0.03, "learning_rate": 1.6754910333048676e-06, "loss": 0.7715, "step": 981 }, { "epoch": 0.03, "learning_rate": 1.6771989752348418e-06, "loss": 0.8154, "step": 982 }, { "epoch": 0.03, "learning_rate": 1.6789069171648162e-06, "loss": 1.0205, "step": 983 }, { "epoch": 0.03, "learning_rate": 1.6806148590947907e-06, "loss": 1.1289, "step": 984 }, { "epoch": 0.03, "learning_rate": 1.682322801024765e-06, "loss": 1.0391, "step": 985 }, { "epoch": 0.03, "learning_rate": 1.6840307429547396e-06, "loss": 1.0186, "step": 986 }, { "epoch": 0.03, "learning_rate": 1.685738684884714e-06, "loss": 0.959, "step": 987 }, { "epoch": 0.03, "learning_rate": 1.6874466268146882e-06, "loss": 1.0381, "step": 988 }, { "epoch": 0.03, "learning_rate": 1.6891545687446627e-06, "loss": 0.9844, "step": 989 }, { "epoch": 0.03, "learning_rate": 1.6908625106746371e-06, "loss": 1.123, "step": 990 }, { "epoch": 0.03, "learning_rate": 1.6925704526046113e-06, "loss": 1.1426, "step": 991 }, { "epoch": 0.03, "learning_rate": 1.6942783945345858e-06, "loss": 0.9521, "step": 992 }, { "epoch": 0.03, "learning_rate": 1.6959863364645602e-06, "loss": 0.7764, "step": 993 }, { "epoch": 0.03, "learning_rate": 1.6976942783945345e-06, "loss": 1.0537, "step": 994 }, { "epoch": 0.03, "learning_rate": 1.699402220324509e-06, "loss": 1.1094, "step": 995 }, { "epoch": 0.03, "learning_rate": 1.7011101622544831e-06, "loss": 0.9736, "step": 996 }, { "epoch": 0.03, "learning_rate": 1.7028181041844576e-06, "loss": 0.9883, "step": 997 }, { "epoch": 0.03, "learning_rate": 1.704526046114432e-06, "loss": 0.999, "step": 998 }, { "epoch": 0.03, "learning_rate": 1.7062339880444062e-06, "loss": 0.9941, "step": 999 }, { "epoch": 0.03, "learning_rate": 1.7079419299743807e-06, "loss": 0.9629, "step": 1000 }, { "epoch": 0.03, "learning_rate": 1.7096498719043553e-06, "loss": 0.9141, "step": 1001 }, { "epoch": 0.03, "learning_rate": 1.7113578138343296e-06, "loss": 0.759, "step": 1002 }, { "epoch": 0.03, "learning_rate": 1.713065755764304e-06, "loss": 1.0723, "step": 1003 }, { "epoch": 0.03, "learning_rate": 1.7147736976942785e-06, "loss": 0.8672, "step": 1004 }, { "epoch": 0.03, "learning_rate": 1.7164816396242527e-06, "loss": 1.1592, "step": 1005 }, { "epoch": 0.03, "learning_rate": 1.7181895815542271e-06, "loss": 1.0557, "step": 1006 }, { "epoch": 0.03, "learning_rate": 1.7198975234842016e-06, "loss": 0.8232, "step": 1007 }, { "epoch": 0.03, "learning_rate": 1.7216054654141758e-06, "loss": 0.8516, "step": 1008 }, { "epoch": 0.03, "learning_rate": 1.7233134073441502e-06, "loss": 0.8926, "step": 1009 }, { "epoch": 0.03, "learning_rate": 1.7250213492741245e-06, "loss": 0.8789, "step": 1010 }, { "epoch": 0.03, "learning_rate": 1.726729291204099e-06, "loss": 1.1182, "step": 1011 }, { "epoch": 0.03, "learning_rate": 1.7284372331340734e-06, "loss": 0.8672, "step": 1012 }, { "epoch": 0.03, "learning_rate": 1.7301451750640476e-06, "loss": 1.0625, "step": 1013 }, { "epoch": 0.03, "learning_rate": 1.731853116994022e-06, "loss": 1.0449, "step": 1014 }, { "epoch": 0.03, "learning_rate": 1.7335610589239965e-06, "loss": 0.8184, "step": 1015 }, { "epoch": 0.03, "learning_rate": 1.735269000853971e-06, "loss": 1.082, "step": 1016 }, { "epoch": 0.03, "learning_rate": 1.7369769427839454e-06, "loss": 1.1465, "step": 1017 }, { "epoch": 0.03, "learning_rate": 1.7386848847139198e-06, "loss": 0.6377, "step": 1018 }, { "epoch": 0.03, "learning_rate": 1.740392826643894e-06, "loss": 0.915, "step": 1019 }, { "epoch": 0.03, "learning_rate": 1.7421007685738685e-06, "loss": 1.0547, "step": 1020 }, { "epoch": 0.03, "learning_rate": 1.743808710503843e-06, "loss": 1.2793, "step": 1021 }, { "epoch": 0.03, "learning_rate": 1.7455166524338171e-06, "loss": 0.8604, "step": 1022 }, { "epoch": 0.03, "learning_rate": 1.7472245943637916e-06, "loss": 0.9111, "step": 1023 }, { "epoch": 0.03, "learning_rate": 1.7489325362937658e-06, "loss": 0.9062, "step": 1024 }, { "epoch": 0.03, "learning_rate": 1.7506404782237403e-06, "loss": 1.0752, "step": 1025 }, { "epoch": 0.03, "learning_rate": 1.7523484201537147e-06, "loss": 1.123, "step": 1026 }, { "epoch": 0.03, "learning_rate": 1.754056362083689e-06, "loss": 1.0762, "step": 1027 }, { "epoch": 0.03, "learning_rate": 1.7557643040136634e-06, "loss": 0.8467, "step": 1028 }, { "epoch": 0.03, "learning_rate": 1.7574722459436378e-06, "loss": 1.0283, "step": 1029 }, { "epoch": 0.03, "learning_rate": 1.759180187873612e-06, "loss": 0.9092, "step": 1030 }, { "epoch": 0.03, "learning_rate": 1.7608881298035867e-06, "loss": 0.8926, "step": 1031 }, { "epoch": 0.03, "learning_rate": 1.7625960717335611e-06, "loss": 0.9033, "step": 1032 }, { "epoch": 0.03, "learning_rate": 1.7643040136635354e-06, "loss": 0.8647, "step": 1033 }, { "epoch": 0.03, "learning_rate": 1.7660119555935098e-06, "loss": 1.1143, "step": 1034 }, { "epoch": 0.03, "learning_rate": 1.7677198975234843e-06, "loss": 0.9775, "step": 1035 }, { "epoch": 0.03, "learning_rate": 1.7694278394534585e-06, "loss": 0.9717, "step": 1036 }, { "epoch": 0.03, "learning_rate": 1.771135781383433e-06, "loss": 0.9805, "step": 1037 }, { "epoch": 0.03, "learning_rate": 1.7728437233134072e-06, "loss": 0.8062, "step": 1038 }, { "epoch": 0.03, "learning_rate": 1.7745516652433816e-06, "loss": 0.7954, "step": 1039 }, { "epoch": 0.03, "learning_rate": 1.776259607173356e-06, "loss": 0.9238, "step": 1040 }, { "epoch": 0.03, "learning_rate": 1.7779675491033303e-06, "loss": 0.9883, "step": 1041 }, { "epoch": 0.03, "learning_rate": 1.7796754910333047e-06, "loss": 1.0879, "step": 1042 }, { "epoch": 0.03, "learning_rate": 1.7813834329632792e-06, "loss": 1.127, "step": 1043 }, { "epoch": 0.03, "learning_rate": 1.7830913748932534e-06, "loss": 0.8008, "step": 1044 }, { "epoch": 0.03, "learning_rate": 1.7847993168232278e-06, "loss": 0.9463, "step": 1045 }, { "epoch": 0.03, "learning_rate": 1.7865072587532025e-06, "loss": 0.96, "step": 1046 }, { "epoch": 0.03, "learning_rate": 1.7882152006831767e-06, "loss": 1.0117, "step": 1047 }, { "epoch": 0.03, "learning_rate": 1.7899231426131512e-06, "loss": 0.8945, "step": 1048 }, { "epoch": 0.03, "learning_rate": 1.7916310845431256e-06, "loss": 0.7495, "step": 1049 }, { "epoch": 0.03, "learning_rate": 1.7933390264730998e-06, "loss": 1.0996, "step": 1050 }, { "epoch": 0.03, "learning_rate": 1.7950469684030743e-06, "loss": 1.1709, "step": 1051 }, { "epoch": 0.03, "learning_rate": 1.7967549103330485e-06, "loss": 1.0645, "step": 1052 }, { "epoch": 0.03, "learning_rate": 1.798462852263023e-06, "loss": 0.9971, "step": 1053 }, { "epoch": 0.03, "learning_rate": 1.8001707941929974e-06, "loss": 1.0469, "step": 1054 }, { "epoch": 0.03, "learning_rate": 1.8018787361229716e-06, "loss": 0.937, "step": 1055 }, { "epoch": 0.03, "learning_rate": 1.803586678052946e-06, "loss": 0.8828, "step": 1056 }, { "epoch": 0.03, "learning_rate": 1.8052946199829205e-06, "loss": 0.9277, "step": 1057 }, { "epoch": 0.03, "learning_rate": 1.8070025619128947e-06, "loss": 0.9805, "step": 1058 }, { "epoch": 0.03, "learning_rate": 1.8087105038428692e-06, "loss": 0.9165, "step": 1059 }, { "epoch": 0.03, "learning_rate": 1.8104184457728438e-06, "loss": 0.9912, "step": 1060 }, { "epoch": 0.03, "learning_rate": 1.812126387702818e-06, "loss": 0.7705, "step": 1061 }, { "epoch": 0.03, "learning_rate": 1.8138343296327925e-06, "loss": 0.8242, "step": 1062 }, { "epoch": 0.03, "learning_rate": 1.815542271562767e-06, "loss": 0.8877, "step": 1063 }, { "epoch": 0.03, "learning_rate": 1.8172502134927412e-06, "loss": 0.7451, "step": 1064 }, { "epoch": 0.03, "learning_rate": 1.8189581554227156e-06, "loss": 0.8818, "step": 1065 }, { "epoch": 0.03, "learning_rate": 1.8206660973526898e-06, "loss": 0.8135, "step": 1066 }, { "epoch": 0.03, "learning_rate": 1.8223740392826643e-06, "loss": 1.0557, "step": 1067 }, { "epoch": 0.03, "learning_rate": 1.8240819812126387e-06, "loss": 0.9028, "step": 1068 }, { "epoch": 0.03, "learning_rate": 1.825789923142613e-06, "loss": 0.6206, "step": 1069 }, { "epoch": 0.03, "learning_rate": 1.8274978650725874e-06, "loss": 1.1514, "step": 1070 }, { "epoch": 0.03, "learning_rate": 1.8292058070025618e-06, "loss": 0.9014, "step": 1071 }, { "epoch": 0.03, "learning_rate": 1.830913748932536e-06, "loss": 1.042, "step": 1072 }, { "epoch": 0.03, "learning_rate": 1.8326216908625105e-06, "loss": 0.9893, "step": 1073 }, { "epoch": 0.03, "learning_rate": 1.834329632792485e-06, "loss": 0.8906, "step": 1074 }, { "epoch": 0.03, "learning_rate": 1.8360375747224594e-06, "loss": 0.9561, "step": 1075 }, { "epoch": 0.03, "learning_rate": 1.8377455166524338e-06, "loss": 0.9414, "step": 1076 }, { "epoch": 0.03, "learning_rate": 1.8394534585824083e-06, "loss": 1.0771, "step": 1077 }, { "epoch": 0.03, "learning_rate": 1.8411614005123825e-06, "loss": 1.0557, "step": 1078 }, { "epoch": 0.03, "learning_rate": 1.842869342442357e-06, "loss": 1.0293, "step": 1079 }, { "epoch": 0.03, "learning_rate": 1.8445772843723312e-06, "loss": 0.9072, "step": 1080 }, { "epoch": 0.03, "learning_rate": 1.8462852263023056e-06, "loss": 1.0332, "step": 1081 }, { "epoch": 0.03, "learning_rate": 1.84799316823228e-06, "loss": 0.9111, "step": 1082 }, { "epoch": 0.03, "learning_rate": 1.8497011101622543e-06, "loss": 0.9839, "step": 1083 }, { "epoch": 0.03, "learning_rate": 1.8514090520922287e-06, "loss": 1.0654, "step": 1084 }, { "epoch": 0.03, "learning_rate": 1.8531169940222032e-06, "loss": 0.8013, "step": 1085 }, { "epoch": 0.03, "learning_rate": 1.8548249359521774e-06, "loss": 1.0381, "step": 1086 }, { "epoch": 0.03, "learning_rate": 1.8565328778821519e-06, "loss": 1.082, "step": 1087 }, { "epoch": 0.03, "learning_rate": 1.8582408198121263e-06, "loss": 0.9414, "step": 1088 }, { "epoch": 0.03, "learning_rate": 1.8599487617421005e-06, "loss": 1.0918, "step": 1089 }, { "epoch": 0.03, "learning_rate": 1.8616567036720752e-06, "loss": 0.8799, "step": 1090 }, { "epoch": 0.03, "learning_rate": 1.8633646456020496e-06, "loss": 0.9521, "step": 1091 }, { "epoch": 0.03, "learning_rate": 1.8650725875320239e-06, "loss": 1.0879, "step": 1092 }, { "epoch": 0.03, "learning_rate": 1.8667805294619983e-06, "loss": 1.041, "step": 1093 }, { "epoch": 0.03, "learning_rate": 1.8684884713919725e-06, "loss": 0.7607, "step": 1094 }, { "epoch": 0.03, "learning_rate": 1.870196413321947e-06, "loss": 0.9458, "step": 1095 }, { "epoch": 0.03, "learning_rate": 1.8719043552519214e-06, "loss": 1.0664, "step": 1096 }, { "epoch": 0.03, "learning_rate": 1.8736122971818956e-06, "loss": 1.0898, "step": 1097 }, { "epoch": 0.03, "learning_rate": 1.87532023911187e-06, "loss": 0.8857, "step": 1098 }, { "epoch": 0.03, "learning_rate": 1.8770281810418445e-06, "loss": 1.0527, "step": 1099 }, { "epoch": 0.03, "learning_rate": 1.8787361229718188e-06, "loss": 0.876, "step": 1100 }, { "epoch": 0.03, "learning_rate": 1.8804440649017932e-06, "loss": 1.0801, "step": 1101 }, { "epoch": 0.03, "learning_rate": 1.8821520068317676e-06, "loss": 0.8174, "step": 1102 }, { "epoch": 0.03, "learning_rate": 1.8838599487617419e-06, "loss": 0.9844, "step": 1103 }, { "epoch": 0.03, "learning_rate": 1.8855678906917163e-06, "loss": 1.2305, "step": 1104 }, { "epoch": 0.03, "learning_rate": 1.887275832621691e-06, "loss": 1.0312, "step": 1105 }, { "epoch": 0.03, "learning_rate": 1.8889837745516652e-06, "loss": 0.8306, "step": 1106 }, { "epoch": 0.03, "learning_rate": 1.8906917164816396e-06, "loss": 0.7549, "step": 1107 }, { "epoch": 0.03, "learning_rate": 1.892399658411614e-06, "loss": 0.9272, "step": 1108 }, { "epoch": 0.03, "learning_rate": 1.8941076003415883e-06, "loss": 0.8765, "step": 1109 }, { "epoch": 0.03, "learning_rate": 1.8958155422715628e-06, "loss": 1.0986, "step": 1110 }, { "epoch": 0.03, "learning_rate": 1.897523484201537e-06, "loss": 1.1367, "step": 1111 }, { "epoch": 0.03, "learning_rate": 1.8992314261315114e-06, "loss": 0.9619, "step": 1112 }, { "epoch": 0.03, "learning_rate": 1.9009393680614859e-06, "loss": 1.0088, "step": 1113 }, { "epoch": 0.03, "learning_rate": 1.90264730999146e-06, "loss": 1.0298, "step": 1114 }, { "epoch": 0.03, "learning_rate": 1.9043552519214345e-06, "loss": 0.9512, "step": 1115 }, { "epoch": 0.03, "learning_rate": 1.906063193851409e-06, "loss": 1.0615, "step": 1116 }, { "epoch": 0.03, "learning_rate": 1.9077711357813834e-06, "loss": 0.9092, "step": 1117 }, { "epoch": 0.03, "learning_rate": 1.9094790777113577e-06, "loss": 1.209, "step": 1118 }, { "epoch": 0.03, "learning_rate": 1.911187019641332e-06, "loss": 1.1641, "step": 1119 }, { "epoch": 0.03, "learning_rate": 1.9128949615713065e-06, "loss": 1.0791, "step": 1120 }, { "epoch": 0.03, "learning_rate": 1.9146029035012808e-06, "loss": 0.7524, "step": 1121 }, { "epoch": 0.03, "learning_rate": 1.9163108454312554e-06, "loss": 0.8574, "step": 1122 }, { "epoch": 0.03, "learning_rate": 1.9180187873612297e-06, "loss": 0.9902, "step": 1123 }, { "epoch": 0.03, "learning_rate": 1.919726729291204e-06, "loss": 1.2393, "step": 1124 }, { "epoch": 0.03, "learning_rate": 1.9214346712211785e-06, "loss": 0.958, "step": 1125 }, { "epoch": 0.03, "learning_rate": 1.9231426131511528e-06, "loss": 1.1992, "step": 1126 }, { "epoch": 0.03, "learning_rate": 1.924850555081127e-06, "loss": 0.9814, "step": 1127 }, { "epoch": 0.03, "learning_rate": 1.9265584970111017e-06, "loss": 1.0049, "step": 1128 }, { "epoch": 0.03, "learning_rate": 1.928266438941076e-06, "loss": 1.1299, "step": 1129 }, { "epoch": 0.03, "learning_rate": 1.92997438087105e-06, "loss": 0.8892, "step": 1130 }, { "epoch": 0.03, "learning_rate": 1.9316823228010248e-06, "loss": 0.9189, "step": 1131 }, { "epoch": 0.03, "learning_rate": 1.933390264730999e-06, "loss": 0.7764, "step": 1132 }, { "epoch": 0.03, "learning_rate": 1.9350982066609732e-06, "loss": 0.9619, "step": 1133 }, { "epoch": 0.03, "learning_rate": 1.936806148590948e-06, "loss": 0.9346, "step": 1134 }, { "epoch": 0.03, "learning_rate": 1.938514090520922e-06, "loss": 1.084, "step": 1135 }, { "epoch": 0.03, "learning_rate": 1.9402220324508968e-06, "loss": 0.9355, "step": 1136 }, { "epoch": 0.03, "learning_rate": 1.941929974380871e-06, "loss": 1.1738, "step": 1137 }, { "epoch": 0.03, "learning_rate": 1.9436379163108452e-06, "loss": 1.1045, "step": 1138 }, { "epoch": 0.03, "learning_rate": 1.94534585824082e-06, "loss": 0.9688, "step": 1139 }, { "epoch": 0.03, "learning_rate": 1.947053800170794e-06, "loss": 0.9932, "step": 1140 }, { "epoch": 0.03, "learning_rate": 1.9487617421007683e-06, "loss": 0.9414, "step": 1141 }, { "epoch": 0.03, "learning_rate": 1.950469684030743e-06, "loss": 1.0459, "step": 1142 }, { "epoch": 0.03, "learning_rate": 1.9521776259607172e-06, "loss": 1.126, "step": 1143 }, { "epoch": 0.03, "learning_rate": 1.9538855678906915e-06, "loss": 0.7808, "step": 1144 }, { "epoch": 0.03, "learning_rate": 1.955593509820666e-06, "loss": 0.916, "step": 1145 }, { "epoch": 0.03, "learning_rate": 1.9573014517506403e-06, "loss": 1.1494, "step": 1146 }, { "epoch": 0.03, "learning_rate": 1.9590093936806146e-06, "loss": 0.9453, "step": 1147 }, { "epoch": 0.03, "learning_rate": 1.9607173356105892e-06, "loss": 1.0137, "step": 1148 }, { "epoch": 0.03, "learning_rate": 1.9624252775405635e-06, "loss": 0.9766, "step": 1149 }, { "epoch": 0.03, "learning_rate": 1.964133219470538e-06, "loss": 1.1035, "step": 1150 }, { "epoch": 0.03, "learning_rate": 1.9658411614005123e-06, "loss": 1.1084, "step": 1151 }, { "epoch": 0.03, "learning_rate": 1.9675491033304866e-06, "loss": 0.9346, "step": 1152 }, { "epoch": 0.03, "learning_rate": 1.9692570452604612e-06, "loss": 1.0039, "step": 1153 }, { "epoch": 0.03, "learning_rate": 1.9709649871904355e-06, "loss": 1.1416, "step": 1154 }, { "epoch": 0.03, "learning_rate": 1.9726729291204097e-06, "loss": 0.957, "step": 1155 }, { "epoch": 0.03, "learning_rate": 1.9743808710503843e-06, "loss": 0.9189, "step": 1156 }, { "epoch": 0.03, "learning_rate": 1.9760888129803586e-06, "loss": 0.7988, "step": 1157 }, { "epoch": 0.03, "learning_rate": 1.977796754910333e-06, "loss": 0.9365, "step": 1158 }, { "epoch": 0.03, "learning_rate": 1.9795046968403075e-06, "loss": 0.6909, "step": 1159 }, { "epoch": 0.03, "learning_rate": 1.9812126387702817e-06, "loss": 1.2227, "step": 1160 }, { "epoch": 0.03, "learning_rate": 1.982920580700256e-06, "loss": 1.0127, "step": 1161 }, { "epoch": 0.03, "learning_rate": 1.9846285226302306e-06, "loss": 1.0625, "step": 1162 }, { "epoch": 0.03, "learning_rate": 1.986336464560205e-06, "loss": 1.0898, "step": 1163 }, { "epoch": 0.03, "learning_rate": 1.9880444064901795e-06, "loss": 0.9346, "step": 1164 }, { "epoch": 0.03, "learning_rate": 1.9897523484201537e-06, "loss": 0.9248, "step": 1165 }, { "epoch": 0.03, "learning_rate": 1.991460290350128e-06, "loss": 0.9502, "step": 1166 }, { "epoch": 0.03, "learning_rate": 1.9931682322801026e-06, "loss": 0.7476, "step": 1167 }, { "epoch": 0.03, "learning_rate": 1.994876174210077e-06, "loss": 1.0654, "step": 1168 }, { "epoch": 0.03, "learning_rate": 1.996584116140051e-06, "loss": 0.998, "step": 1169 }, { "epoch": 0.03, "learning_rate": 1.9982920580700257e-06, "loss": 1.2603, "step": 1170 }, { "epoch": 0.03, "learning_rate": 2e-06, "loss": 0.9443, "step": 1171 }, { "epoch": 0.03, "learning_rate": 1.999999996554496e-06, "loss": 0.918, "step": 1172 }, { "epoch": 0.03, "learning_rate": 1.999999986217985e-06, "loss": 0.9023, "step": 1173 }, { "epoch": 0.03, "learning_rate": 1.999999968990466e-06, "loss": 1.0205, "step": 1174 }, { "epoch": 0.03, "learning_rate": 1.99999994487194e-06, "loss": 0.7886, "step": 1175 }, { "epoch": 0.03, "learning_rate": 1.9999999138624065e-06, "loss": 1.0078, "step": 1176 }, { "epoch": 0.03, "learning_rate": 1.9999998759618665e-06, "loss": 0.9609, "step": 1177 }, { "epoch": 0.03, "learning_rate": 1.9999998311703195e-06, "loss": 0.959, "step": 1178 }, { "epoch": 0.03, "learning_rate": 1.999999779487766e-06, "loss": 0.8906, "step": 1179 }, { "epoch": 0.03, "learning_rate": 1.9999997209142066e-06, "loss": 1.1406, "step": 1180 }, { "epoch": 0.03, "learning_rate": 1.999999655449642e-06, "loss": 1.041, "step": 1181 }, { "epoch": 0.03, "learning_rate": 1.9999995830940713e-06, "loss": 0.9463, "step": 1182 }, { "epoch": 0.03, "learning_rate": 1.999999503847497e-06, "loss": 0.8613, "step": 1183 }, { "epoch": 0.03, "learning_rate": 1.9999994177099176e-06, "loss": 1.0049, "step": 1184 }, { "epoch": 0.03, "learning_rate": 1.9999993246813355e-06, "loss": 0.9443, "step": 1185 }, { "epoch": 0.03, "learning_rate": 1.99999922476175e-06, "loss": 1.1504, "step": 1186 }, { "epoch": 0.03, "learning_rate": 1.999999117951162e-06, "loss": 0.9932, "step": 1187 }, { "epoch": 0.03, "learning_rate": 1.999999004249573e-06, "loss": 1.0068, "step": 1188 }, { "epoch": 0.03, "learning_rate": 1.999998883656983e-06, "loss": 1.0723, "step": 1189 }, { "epoch": 0.03, "learning_rate": 1.9999987561733936e-06, "loss": 0.9795, "step": 1190 }, { "epoch": 0.03, "learning_rate": 1.999998621798805e-06, "loss": 1.0098, "step": 1191 }, { "epoch": 0.03, "learning_rate": 1.999998480533218e-06, "loss": 1.0654, "step": 1192 }, { "epoch": 0.03, "learning_rate": 1.9999983323766343e-06, "loss": 0.7603, "step": 1193 }, { "epoch": 0.03, "learning_rate": 1.9999981773290545e-06, "loss": 1.1143, "step": 1194 }, { "epoch": 0.03, "learning_rate": 1.9999980153904797e-06, "loss": 0.8125, "step": 1195 }, { "epoch": 0.03, "learning_rate": 1.999997846560911e-06, "loss": 0.999, "step": 1196 }, { "epoch": 0.03, "learning_rate": 1.9999976708403496e-06, "loss": 0.9111, "step": 1197 }, { "epoch": 0.03, "learning_rate": 1.9999974882287964e-06, "loss": 1.0264, "step": 1198 }, { "epoch": 0.03, "learning_rate": 1.9999972987262533e-06, "loss": 1.1074, "step": 1199 }, { "epoch": 0.03, "learning_rate": 1.9999971023327215e-06, "loss": 1.0342, "step": 1200 }, { "epoch": 0.03, "learning_rate": 1.9999968990482015e-06, "loss": 0.7637, "step": 1201 }, { "epoch": 0.03, "learning_rate": 1.9999966888726957e-06, "loss": 1.0762, "step": 1202 }, { "epoch": 0.03, "learning_rate": 1.999996471806205e-06, "loss": 1.0103, "step": 1203 }, { "epoch": 0.03, "learning_rate": 1.999996247848731e-06, "loss": 0.9541, "step": 1204 }, { "epoch": 0.03, "learning_rate": 1.9999960170002755e-06, "loss": 1.1533, "step": 1205 }, { "epoch": 0.03, "learning_rate": 1.99999577926084e-06, "loss": 0.6733, "step": 1206 }, { "epoch": 0.03, "learning_rate": 1.9999955346304255e-06, "loss": 0.9844, "step": 1207 }, { "epoch": 0.03, "learning_rate": 1.9999952831090346e-06, "loss": 0.7695, "step": 1208 }, { "epoch": 0.03, "learning_rate": 1.999995024696669e-06, "loss": 0.916, "step": 1209 }, { "epoch": 0.03, "learning_rate": 1.9999947593933296e-06, "loss": 0.9863, "step": 1210 }, { "epoch": 0.03, "learning_rate": 1.9999944871990188e-06, "loss": 0.9697, "step": 1211 }, { "epoch": 0.03, "learning_rate": 1.9999942081137384e-06, "loss": 0.7896, "step": 1212 }, { "epoch": 0.03, "learning_rate": 1.9999939221374905e-06, "loss": 1.0518, "step": 1213 }, { "epoch": 0.03, "learning_rate": 1.999993629270277e-06, "loss": 0.8398, "step": 1214 }, { "epoch": 0.03, "learning_rate": 1.9999933295120998e-06, "loss": 0.894, "step": 1215 }, { "epoch": 0.03, "learning_rate": 1.9999930228629608e-06, "loss": 0.6821, "step": 1216 }, { "epoch": 0.03, "learning_rate": 1.9999927093228627e-06, "loss": 1.0898, "step": 1217 }, { "epoch": 0.03, "learning_rate": 1.999992388891807e-06, "loss": 1.0723, "step": 1218 }, { "epoch": 0.03, "learning_rate": 1.9999920615697963e-06, "loss": 0.8779, "step": 1219 }, { "epoch": 0.03, "learning_rate": 1.9999917273568326e-06, "loss": 0.877, "step": 1220 }, { "epoch": 0.03, "learning_rate": 1.9999913862529183e-06, "loss": 1.0771, "step": 1221 }, { "epoch": 0.03, "learning_rate": 1.9999910382580564e-06, "loss": 0.8574, "step": 1222 }, { "epoch": 0.03, "learning_rate": 1.999990683372248e-06, "loss": 0.9736, "step": 1223 }, { "epoch": 0.03, "learning_rate": 1.9999903215954966e-06, "loss": 0.9453, "step": 1224 }, { "epoch": 0.03, "learning_rate": 1.999989952927804e-06, "loss": 0.8955, "step": 1225 }, { "epoch": 0.03, "learning_rate": 1.999989577369174e-06, "loss": 1.0928, "step": 1226 }, { "epoch": 0.03, "learning_rate": 1.9999891949196075e-06, "loss": 0.9648, "step": 1227 }, { "epoch": 0.03, "learning_rate": 1.999988805579108e-06, "loss": 0.833, "step": 1228 }, { "epoch": 0.03, "learning_rate": 1.999988409347678e-06, "loss": 1.0234, "step": 1229 }, { "epoch": 0.03, "learning_rate": 1.9999880062253203e-06, "loss": 0.8438, "step": 1230 }, { "epoch": 0.03, "learning_rate": 1.999987596212038e-06, "loss": 1.0664, "step": 1231 }, { "epoch": 0.03, "learning_rate": 1.9999871793078335e-06, "loss": 0.8477, "step": 1232 }, { "epoch": 0.03, "learning_rate": 1.9999867555127097e-06, "loss": 0.8809, "step": 1233 }, { "epoch": 0.03, "learning_rate": 1.9999863248266697e-06, "loss": 1.1553, "step": 1234 }, { "epoch": 0.03, "learning_rate": 1.9999858872497164e-06, "loss": 1.0635, "step": 1235 }, { "epoch": 0.03, "learning_rate": 1.9999854427818527e-06, "loss": 0.8882, "step": 1236 }, { "epoch": 0.03, "learning_rate": 1.9999849914230817e-06, "loss": 0.9727, "step": 1237 }, { "epoch": 0.03, "learning_rate": 1.9999845331734067e-06, "loss": 1.084, "step": 1238 }, { "epoch": 0.03, "learning_rate": 1.9999840680328307e-06, "loss": 1.1387, "step": 1239 }, { "epoch": 0.03, "learning_rate": 1.999983596001357e-06, "loss": 1.0928, "step": 1240 }, { "epoch": 0.03, "learning_rate": 1.9999831170789888e-06, "loss": 1.1201, "step": 1241 }, { "epoch": 0.03, "learning_rate": 1.999982631265729e-06, "loss": 1.0059, "step": 1242 }, { "epoch": 0.03, "learning_rate": 1.9999821385615817e-06, "loss": 0.7881, "step": 1243 }, { "epoch": 0.03, "learning_rate": 1.99998163896655e-06, "loss": 1.0986, "step": 1244 }, { "epoch": 0.03, "learning_rate": 1.999981132480637e-06, "loss": 0.9883, "step": 1245 }, { "epoch": 0.03, "learning_rate": 1.9999806191038467e-06, "loss": 0.8926, "step": 1246 }, { "epoch": 0.03, "learning_rate": 1.9999800988361824e-06, "loss": 1.0127, "step": 1247 }, { "epoch": 0.03, "learning_rate": 1.9999795716776476e-06, "loss": 1.0391, "step": 1248 }, { "epoch": 0.03, "learning_rate": 1.999979037628246e-06, "loss": 0.9375, "step": 1249 }, { "epoch": 0.03, "learning_rate": 1.999978496687981e-06, "loss": 0.8613, "step": 1250 }, { "epoch": 0.03, "learning_rate": 1.9999779488568572e-06, "loss": 0.7905, "step": 1251 }, { "epoch": 0.03, "learning_rate": 1.9999773941348776e-06, "loss": 1.0049, "step": 1252 }, { "epoch": 0.03, "learning_rate": 1.999976832522046e-06, "loss": 1.0547, "step": 1253 }, { "epoch": 0.03, "learning_rate": 1.9999762640183664e-06, "loss": 0.9321, "step": 1254 }, { "epoch": 0.03, "learning_rate": 1.9999756886238434e-06, "loss": 1.0684, "step": 1255 }, { "epoch": 0.03, "learning_rate": 1.99997510633848e-06, "loss": 1.0352, "step": 1256 }, { "epoch": 0.03, "learning_rate": 1.9999745171622806e-06, "loss": 1.0361, "step": 1257 }, { "epoch": 0.03, "learning_rate": 1.999973921095249e-06, "loss": 0.9629, "step": 1258 }, { "epoch": 0.03, "learning_rate": 1.99997331813739e-06, "loss": 0.96, "step": 1259 }, { "epoch": 0.03, "learning_rate": 1.9999727082887074e-06, "loss": 0.9287, "step": 1260 }, { "epoch": 0.03, "learning_rate": 1.9999720915492047e-06, "loss": 0.9653, "step": 1261 }, { "epoch": 0.03, "learning_rate": 1.9999714679188874e-06, "loss": 0.8271, "step": 1262 }, { "epoch": 0.03, "learning_rate": 1.999970837397759e-06, "loss": 0.8311, "step": 1263 }, { "epoch": 0.03, "learning_rate": 1.9999701999858234e-06, "loss": 1.1191, "step": 1264 }, { "epoch": 0.03, "learning_rate": 1.999969555683086e-06, "loss": 1.1191, "step": 1265 }, { "epoch": 0.03, "learning_rate": 1.999968904489551e-06, "loss": 1.0583, "step": 1266 }, { "epoch": 0.03, "learning_rate": 1.999968246405223e-06, "loss": 1.0273, "step": 1267 }, { "epoch": 0.03, "learning_rate": 1.9999675814301055e-06, "loss": 0.769, "step": 1268 }, { "epoch": 0.03, "learning_rate": 1.9999669095642045e-06, "loss": 0.7451, "step": 1269 }, { "epoch": 0.03, "learning_rate": 1.999966230807524e-06, "loss": 0.9219, "step": 1270 }, { "epoch": 0.03, "learning_rate": 1.9999655451600682e-06, "loss": 1.041, "step": 1271 }, { "epoch": 0.03, "learning_rate": 1.9999648526218424e-06, "loss": 1.1357, "step": 1272 }, { "epoch": 0.03, "learning_rate": 1.999964153192851e-06, "loss": 1.0693, "step": 1273 }, { "epoch": 0.03, "learning_rate": 1.9999634468730996e-06, "loss": 0.6895, "step": 1274 }, { "epoch": 0.03, "learning_rate": 1.999962733662592e-06, "loss": 1.1719, "step": 1275 }, { "epoch": 0.03, "learning_rate": 1.9999620135613343e-06, "loss": 1.0264, "step": 1276 }, { "epoch": 0.03, "learning_rate": 1.99996128656933e-06, "loss": 0.9707, "step": 1277 }, { "epoch": 0.03, "learning_rate": 1.9999605526865854e-06, "loss": 1.2891, "step": 1278 }, { "epoch": 0.03, "learning_rate": 1.9999598119131052e-06, "loss": 0.9844, "step": 1279 }, { "epoch": 0.03, "learning_rate": 1.9999590642488943e-06, "loss": 0.8994, "step": 1280 }, { "epoch": 0.03, "learning_rate": 1.9999583096939578e-06, "loss": 1.1836, "step": 1281 }, { "epoch": 0.03, "learning_rate": 1.999957548248301e-06, "loss": 0.9238, "step": 1282 }, { "epoch": 0.03, "learning_rate": 1.9999567799119296e-06, "loss": 1.0645, "step": 1283 }, { "epoch": 0.03, "learning_rate": 1.999956004684848e-06, "loss": 0.9746, "step": 1284 }, { "epoch": 0.03, "learning_rate": 1.999955222567062e-06, "loss": 0.9033, "step": 1285 }, { "epoch": 0.03, "learning_rate": 1.9999544335585773e-06, "loss": 0.9121, "step": 1286 }, { "epoch": 0.03, "learning_rate": 1.9999536376593992e-06, "loss": 1.125, "step": 1287 }, { "epoch": 0.03, "learning_rate": 1.9999528348695324e-06, "loss": 0.793, "step": 1288 }, { "epoch": 0.03, "learning_rate": 1.9999520251889835e-06, "loss": 0.9561, "step": 1289 }, { "epoch": 0.03, "learning_rate": 1.9999512086177576e-06, "loss": 0.9316, "step": 1290 }, { "epoch": 0.03, "learning_rate": 1.9999503851558602e-06, "loss": 0.9229, "step": 1291 }, { "epoch": 0.03, "learning_rate": 1.9999495548032973e-06, "loss": 0.9355, "step": 1292 }, { "epoch": 0.03, "learning_rate": 1.9999487175600744e-06, "loss": 1.207, "step": 1293 }, { "epoch": 0.03, "learning_rate": 1.9999478734261974e-06, "loss": 0.9131, "step": 1294 }, { "epoch": 0.03, "learning_rate": 1.999947022401672e-06, "loss": 0.7646, "step": 1295 }, { "epoch": 0.03, "learning_rate": 1.9999461644865042e-06, "loss": 0.7559, "step": 1296 }, { "epoch": 0.03, "learning_rate": 1.9999452996806996e-06, "loss": 1.0391, "step": 1297 }, { "epoch": 0.03, "learning_rate": 1.9999444279842646e-06, "loss": 0.8662, "step": 1298 }, { "epoch": 0.03, "learning_rate": 1.999943549397205e-06, "loss": 0.9121, "step": 1299 }, { "epoch": 0.03, "learning_rate": 1.9999426639195267e-06, "loss": 1.0693, "step": 1300 }, { "epoch": 0.03, "learning_rate": 1.999941771551236e-06, "loss": 0.8398, "step": 1301 }, { "epoch": 0.03, "learning_rate": 1.999940872292339e-06, "loss": 0.9824, "step": 1302 }, { "epoch": 0.03, "learning_rate": 1.999939966142842e-06, "loss": 1.1318, "step": 1303 }, { "epoch": 0.03, "learning_rate": 1.9999390531027512e-06, "loss": 0.8726, "step": 1304 }, { "epoch": 0.03, "learning_rate": 1.9999381331720725e-06, "loss": 1.002, "step": 1305 }, { "epoch": 0.03, "learning_rate": 1.999937206350813e-06, "loss": 0.8428, "step": 1306 }, { "epoch": 0.03, "learning_rate": 1.9999362726389783e-06, "loss": 1.001, "step": 1307 }, { "epoch": 0.03, "learning_rate": 1.9999353320365753e-06, "loss": 0.7402, "step": 1308 }, { "epoch": 0.03, "learning_rate": 1.9999343845436104e-06, "loss": 0.9736, "step": 1309 }, { "epoch": 0.03, "learning_rate": 1.99993343016009e-06, "loss": 0.8823, "step": 1310 }, { "epoch": 0.03, "learning_rate": 1.9999324688860208e-06, "loss": 0.9863, "step": 1311 }, { "epoch": 0.03, "learning_rate": 1.9999315007214095e-06, "loss": 0.9883, "step": 1312 }, { "epoch": 0.03, "learning_rate": 1.9999305256662628e-06, "loss": 1.1133, "step": 1313 }, { "epoch": 0.03, "learning_rate": 1.9999295437205873e-06, "loss": 0.916, "step": 1314 }, { "epoch": 0.03, "learning_rate": 1.9999285548843898e-06, "loss": 0.998, "step": 1315 }, { "epoch": 0.03, "learning_rate": 1.9999275591576767e-06, "loss": 0.7402, "step": 1316 }, { "epoch": 0.03, "learning_rate": 1.999926556540455e-06, "loss": 1.0215, "step": 1317 }, { "epoch": 0.03, "learning_rate": 1.9999255470327325e-06, "loss": 1.0527, "step": 1318 }, { "epoch": 0.03, "learning_rate": 1.9999245306345153e-06, "loss": 0.7427, "step": 1319 }, { "epoch": 0.03, "learning_rate": 1.9999235073458105e-06, "loss": 1.0127, "step": 1320 }, { "epoch": 0.03, "learning_rate": 1.9999224771666256e-06, "loss": 1.1123, "step": 1321 }, { "epoch": 0.03, "learning_rate": 1.999921440096967e-06, "loss": 0.728, "step": 1322 }, { "epoch": 0.03, "learning_rate": 1.9999203961368424e-06, "loss": 0.9824, "step": 1323 }, { "epoch": 0.03, "learning_rate": 1.9999193452862585e-06, "loss": 0.6914, "step": 1324 }, { "epoch": 0.03, "learning_rate": 1.999918287545223e-06, "loss": 0.8369, "step": 1325 }, { "epoch": 0.03, "learning_rate": 1.999917222913743e-06, "loss": 1.0996, "step": 1326 }, { "epoch": 0.03, "learning_rate": 1.999916151391826e-06, "loss": 0.8389, "step": 1327 }, { "epoch": 0.03, "learning_rate": 1.999915072979479e-06, "loss": 0.9609, "step": 1328 }, { "epoch": 0.03, "learning_rate": 1.99991398767671e-06, "loss": 0.7471, "step": 1329 }, { "epoch": 0.03, "learning_rate": 1.999912895483526e-06, "loss": 1.0107, "step": 1330 }, { "epoch": 0.03, "learning_rate": 1.9999117963999348e-06, "loss": 0.9326, "step": 1331 }, { "epoch": 0.03, "learning_rate": 1.9999106904259434e-06, "loss": 0.876, "step": 1332 }, { "epoch": 0.03, "learning_rate": 1.9999095775615604e-06, "loss": 1.207, "step": 1333 }, { "epoch": 0.03, "learning_rate": 1.9999084578067927e-06, "loss": 0.9746, "step": 1334 }, { "epoch": 0.03, "learning_rate": 1.9999073311616483e-06, "loss": 1.1729, "step": 1335 }, { "epoch": 0.03, "learning_rate": 1.9999061976261353e-06, "loss": 1.0996, "step": 1336 }, { "epoch": 0.03, "learning_rate": 1.9999050572002603e-06, "loss": 0.9258, "step": 1337 }, { "epoch": 0.03, "learning_rate": 1.999903909884033e-06, "loss": 0.9727, "step": 1338 }, { "epoch": 0.03, "learning_rate": 1.9999027556774595e-06, "loss": 1.0723, "step": 1339 }, { "epoch": 0.03, "learning_rate": 1.999901594580549e-06, "loss": 0.7607, "step": 1340 }, { "epoch": 0.03, "learning_rate": 1.9999004265933086e-06, "loss": 0.9971, "step": 1341 }, { "epoch": 0.03, "learning_rate": 1.9998992517157475e-06, "loss": 0.916, "step": 1342 }, { "epoch": 0.03, "learning_rate": 1.9998980699478724e-06, "loss": 1.124, "step": 1343 }, { "epoch": 0.03, "learning_rate": 1.9998968812896926e-06, "loss": 0.6675, "step": 1344 }, { "epoch": 0.03, "learning_rate": 1.9998956857412157e-06, "loss": 0.9834, "step": 1345 }, { "epoch": 0.03, "learning_rate": 1.99989448330245e-06, "loss": 0.7178, "step": 1346 }, { "epoch": 0.03, "learning_rate": 1.999893273973404e-06, "loss": 0.8975, "step": 1347 }, { "epoch": 0.03, "learning_rate": 1.999892057754086e-06, "loss": 0.916, "step": 1348 }, { "epoch": 0.03, "learning_rate": 1.999890834644504e-06, "loss": 0.9346, "step": 1349 }, { "epoch": 0.03, "learning_rate": 1.9998896046446667e-06, "loss": 1.1758, "step": 1350 }, { "epoch": 0.03, "learning_rate": 1.9998883677545826e-06, "loss": 0.9658, "step": 1351 }, { "epoch": 0.03, "learning_rate": 1.9998871239742604e-06, "loss": 0.8965, "step": 1352 }, { "epoch": 0.03, "learning_rate": 1.9998858733037083e-06, "loss": 0.8799, "step": 1353 }, { "epoch": 0.03, "learning_rate": 1.9998846157429355e-06, "loss": 1.085, "step": 1354 }, { "epoch": 0.03, "learning_rate": 1.9998833512919498e-06, "loss": 0.9307, "step": 1355 }, { "epoch": 0.03, "learning_rate": 1.9998820799507606e-06, "loss": 0.8916, "step": 1356 }, { "epoch": 0.03, "learning_rate": 1.9998808017193764e-06, "loss": 1.0518, "step": 1357 }, { "epoch": 0.03, "learning_rate": 1.9998795165978057e-06, "loss": 1.1328, "step": 1358 }, { "epoch": 0.03, "learning_rate": 1.999878224586058e-06, "loss": 0.9863, "step": 1359 }, { "epoch": 0.03, "learning_rate": 1.9998769256841423e-06, "loss": 0.8193, "step": 1360 }, { "epoch": 0.03, "learning_rate": 1.9998756198920666e-06, "loss": 0.7339, "step": 1361 }, { "epoch": 0.03, "learning_rate": 1.9998743072098403e-06, "loss": 1.0117, "step": 1362 }, { "epoch": 0.03, "learning_rate": 1.999872987637473e-06, "loss": 0.7773, "step": 1363 }, { "epoch": 0.03, "learning_rate": 1.9998716611749734e-06, "loss": 1.0908, "step": 1364 }, { "epoch": 0.03, "learning_rate": 1.9998703278223506e-06, "loss": 1.0107, "step": 1365 }, { "epoch": 0.04, "learning_rate": 1.9998689875796136e-06, "loss": 0.8828, "step": 1366 }, { "epoch": 0.04, "learning_rate": 1.9998676404467722e-06, "loss": 0.8174, "step": 1367 }, { "epoch": 0.04, "learning_rate": 1.9998662864238345e-06, "loss": 1.1143, "step": 1368 }, { "epoch": 0.04, "learning_rate": 1.9998649255108115e-06, "loss": 0.9473, "step": 1369 }, { "epoch": 0.04, "learning_rate": 1.9998635577077116e-06, "loss": 0.9541, "step": 1370 }, { "epoch": 0.04, "learning_rate": 1.9998621830145442e-06, "loss": 1.043, "step": 1371 }, { "epoch": 0.04, "learning_rate": 1.999860801431319e-06, "loss": 1.0986, "step": 1372 }, { "epoch": 0.04, "learning_rate": 1.9998594129580458e-06, "loss": 1.0469, "step": 1373 }, { "epoch": 0.04, "learning_rate": 1.9998580175947334e-06, "loss": 1.0, "step": 1374 }, { "epoch": 0.04, "learning_rate": 1.999856615341392e-06, "loss": 1.0068, "step": 1375 }, { "epoch": 0.04, "learning_rate": 1.9998552061980313e-06, "loss": 0.8867, "step": 1376 }, { "epoch": 0.04, "learning_rate": 1.9998537901646607e-06, "loss": 0.9561, "step": 1377 }, { "epoch": 0.04, "learning_rate": 1.99985236724129e-06, "loss": 0.8076, "step": 1378 }, { "epoch": 0.04, "learning_rate": 1.999850937427929e-06, "loss": 0.8545, "step": 1379 }, { "epoch": 0.04, "learning_rate": 1.999849500724588e-06, "loss": 0.9077, "step": 1380 }, { "epoch": 0.04, "learning_rate": 1.9998480571312758e-06, "loss": 0.8906, "step": 1381 }, { "epoch": 0.04, "learning_rate": 1.9998466066480037e-06, "loss": 0.9248, "step": 1382 }, { "epoch": 0.04, "learning_rate": 1.999845149274781e-06, "loss": 0.9844, "step": 1383 }, { "epoch": 0.04, "learning_rate": 1.9998436850116173e-06, "loss": 0.7305, "step": 1384 }, { "epoch": 0.04, "learning_rate": 1.999842213858524e-06, "loss": 1.2217, "step": 1385 }, { "epoch": 0.04, "learning_rate": 1.99984073581551e-06, "loss": 0.5537, "step": 1386 }, { "epoch": 0.04, "learning_rate": 1.999839250882586e-06, "loss": 0.9404, "step": 1387 }, { "epoch": 0.04, "learning_rate": 1.9998377590597626e-06, "loss": 0.8486, "step": 1388 }, { "epoch": 0.04, "learning_rate": 1.999836260347049e-06, "loss": 0.833, "step": 1389 }, { "epoch": 0.04, "learning_rate": 1.9998347547444564e-06, "loss": 1.1914, "step": 1390 }, { "epoch": 0.04, "learning_rate": 1.999833242251995e-06, "loss": 0.9512, "step": 1391 }, { "epoch": 0.04, "learning_rate": 1.999831722869675e-06, "loss": 1.084, "step": 1392 }, { "epoch": 0.04, "learning_rate": 1.9998301965975074e-06, "loss": 0.9863, "step": 1393 }, { "epoch": 0.04, "learning_rate": 1.999828663435502e-06, "loss": 1.0908, "step": 1394 }, { "epoch": 0.04, "learning_rate": 1.99982712338367e-06, "loss": 1.0332, "step": 1395 }, { "epoch": 0.04, "learning_rate": 1.9998255764420215e-06, "loss": 0.877, "step": 1396 }, { "epoch": 0.04, "learning_rate": 1.9998240226105676e-06, "loss": 0.8955, "step": 1397 }, { "epoch": 0.04, "learning_rate": 1.999822461889319e-06, "loss": 1.0156, "step": 1398 }, { "epoch": 0.04, "learning_rate": 1.999820894278286e-06, "loss": 0.8506, "step": 1399 }, { "epoch": 0.04, "learning_rate": 1.9998193197774795e-06, "loss": 0.873, "step": 1400 }, { "epoch": 0.04, "learning_rate": 1.9998177383869108e-06, "loss": 0.9932, "step": 1401 }, { "epoch": 0.04, "learning_rate": 1.9998161501065904e-06, "loss": 1.0742, "step": 1402 }, { "epoch": 0.04, "learning_rate": 1.999814554936529e-06, "loss": 0.9756, "step": 1403 }, { "epoch": 0.04, "learning_rate": 1.9998129528767387e-06, "loss": 0.9453, "step": 1404 }, { "epoch": 0.04, "learning_rate": 1.9998113439272297e-06, "loss": 0.9238, "step": 1405 }, { "epoch": 0.04, "learning_rate": 1.9998097280880123e-06, "loss": 1.0498, "step": 1406 }, { "epoch": 0.04, "learning_rate": 1.9998081053590996e-06, "loss": 1.04, "step": 1407 }, { "epoch": 0.04, "learning_rate": 1.999806475740501e-06, "loss": 1.165, "step": 1408 }, { "epoch": 0.04, "learning_rate": 1.9998048392322287e-06, "loss": 0.9717, "step": 1409 }, { "epoch": 0.04, "learning_rate": 1.9998031958342937e-06, "loss": 0.9297, "step": 1410 }, { "epoch": 0.04, "learning_rate": 1.999801545546707e-06, "loss": 0.9258, "step": 1411 }, { "epoch": 0.04, "learning_rate": 1.9997998883694803e-06, "loss": 1.0537, "step": 1412 }, { "epoch": 0.04, "learning_rate": 1.9997982243026256e-06, "loss": 1.0371, "step": 1413 }, { "epoch": 0.04, "learning_rate": 1.999796553346153e-06, "loss": 1.0371, "step": 1414 }, { "epoch": 0.04, "learning_rate": 1.9997948755000756e-06, "loss": 1.0049, "step": 1415 }, { "epoch": 0.04, "learning_rate": 1.9997931907644036e-06, "loss": 0.9893, "step": 1416 }, { "epoch": 0.04, "learning_rate": 1.9997914991391494e-06, "loss": 0.9556, "step": 1417 }, { "epoch": 0.04, "learning_rate": 1.9997898006243244e-06, "loss": 1.1875, "step": 1418 }, { "epoch": 0.04, "learning_rate": 1.9997880952199406e-06, "loss": 0.6499, "step": 1419 }, { "epoch": 0.04, "learning_rate": 1.999786382926009e-06, "loss": 0.7822, "step": 1420 }, { "epoch": 0.04, "learning_rate": 1.9997846637425424e-06, "loss": 1.0264, "step": 1421 }, { "epoch": 0.04, "learning_rate": 1.9997829376695513e-06, "loss": 0.8823, "step": 1422 }, { "epoch": 0.04, "learning_rate": 1.9997812047070492e-06, "loss": 1.0352, "step": 1423 }, { "epoch": 0.04, "learning_rate": 1.999779464855047e-06, "loss": 0.7891, "step": 1424 }, { "epoch": 0.04, "learning_rate": 1.999777718113557e-06, "loss": 1.0459, "step": 1425 }, { "epoch": 0.04, "learning_rate": 1.999775964482591e-06, "loss": 0.8213, "step": 1426 }, { "epoch": 0.04, "learning_rate": 1.9997742039621613e-06, "loss": 1.0518, "step": 1427 }, { "epoch": 0.04, "learning_rate": 1.99977243655228e-06, "loss": 1.042, "step": 1428 }, { "epoch": 0.04, "learning_rate": 1.9997706622529596e-06, "loss": 0.6528, "step": 1429 }, { "epoch": 0.04, "learning_rate": 1.999768881064212e-06, "loss": 1.2793, "step": 1430 }, { "epoch": 0.04, "learning_rate": 1.9997670929860492e-06, "loss": 1.0957, "step": 1431 }, { "epoch": 0.04, "learning_rate": 1.999765298018484e-06, "loss": 0.8369, "step": 1432 }, { "epoch": 0.04, "learning_rate": 1.9997634961615284e-06, "loss": 1.1738, "step": 1433 }, { "epoch": 0.04, "learning_rate": 1.999761687415195e-06, "loss": 1.0186, "step": 1434 }, { "epoch": 0.04, "learning_rate": 1.9997598717794966e-06, "loss": 1.1865, "step": 1435 }, { "epoch": 0.04, "learning_rate": 1.9997580492544454e-06, "loss": 0.9385, "step": 1436 }, { "epoch": 0.04, "learning_rate": 1.9997562198400534e-06, "loss": 1.0156, "step": 1437 }, { "epoch": 0.04, "learning_rate": 1.9997543835363338e-06, "loss": 1.127, "step": 1438 }, { "epoch": 0.04, "learning_rate": 1.9997525403432996e-06, "loss": 0.9453, "step": 1439 }, { "epoch": 0.04, "learning_rate": 1.999750690260963e-06, "loss": 1.0527, "step": 1440 }, { "epoch": 0.04, "learning_rate": 1.999748833289337e-06, "loss": 1.0205, "step": 1441 }, { "epoch": 0.04, "learning_rate": 1.9997469694284336e-06, "loss": 1.3848, "step": 1442 }, { "epoch": 0.04, "learning_rate": 1.9997450986782667e-06, "loss": 0.9551, "step": 1443 }, { "epoch": 0.04, "learning_rate": 1.999743221038849e-06, "loss": 1.127, "step": 1444 }, { "epoch": 0.04, "learning_rate": 1.9997413365101926e-06, "loss": 0.9561, "step": 1445 }, { "epoch": 0.04, "learning_rate": 1.9997394450923117e-06, "loss": 1.1621, "step": 1446 }, { "epoch": 0.04, "learning_rate": 1.9997375467852183e-06, "loss": 0.9551, "step": 1447 }, { "epoch": 0.04, "learning_rate": 1.999735641588926e-06, "loss": 1.041, "step": 1448 }, { "epoch": 0.04, "learning_rate": 1.999733729503448e-06, "loss": 1.04, "step": 1449 }, { "epoch": 0.04, "learning_rate": 1.9997318105287972e-06, "loss": 0.9551, "step": 1450 }, { "epoch": 0.04, "learning_rate": 1.999729884664987e-06, "loss": 0.7969, "step": 1451 }, { "epoch": 0.04, "learning_rate": 1.9997279519120304e-06, "loss": 0.7788, "step": 1452 }, { "epoch": 0.04, "learning_rate": 1.9997260122699414e-06, "loss": 1.0234, "step": 1453 }, { "epoch": 0.04, "learning_rate": 1.9997240657387326e-06, "loss": 1.0186, "step": 1454 }, { "epoch": 0.04, "learning_rate": 1.9997221123184177e-06, "loss": 0.9375, "step": 1455 }, { "epoch": 0.04, "learning_rate": 1.9997201520090102e-06, "loss": 1.1514, "step": 1456 }, { "epoch": 0.04, "learning_rate": 1.9997181848105237e-06, "loss": 0.9395, "step": 1457 }, { "epoch": 0.04, "learning_rate": 1.9997162107229717e-06, "loss": 0.8613, "step": 1458 }, { "epoch": 0.04, "learning_rate": 1.9997142297463673e-06, "loss": 0.9316, "step": 1459 }, { "epoch": 0.04, "learning_rate": 1.999712241880725e-06, "loss": 0.8242, "step": 1460 }, { "epoch": 0.04, "learning_rate": 1.9997102471260577e-06, "loss": 1.0547, "step": 1461 }, { "epoch": 0.04, "learning_rate": 1.99970824548238e-06, "loss": 0.8408, "step": 1462 }, { "epoch": 0.04, "learning_rate": 1.999706236949705e-06, "loss": 0.8994, "step": 1463 }, { "epoch": 0.04, "learning_rate": 1.9997042215280467e-06, "loss": 0.7217, "step": 1464 }, { "epoch": 0.04, "learning_rate": 1.999702199217419e-06, "loss": 0.7227, "step": 1465 }, { "epoch": 0.04, "learning_rate": 1.999700170017836e-06, "loss": 0.7627, "step": 1466 }, { "epoch": 0.04, "learning_rate": 1.9996981339293116e-06, "loss": 0.9014, "step": 1467 }, { "epoch": 0.04, "learning_rate": 1.9996960909518597e-06, "loss": 1.0273, "step": 1468 }, { "epoch": 0.04, "learning_rate": 1.999694041085495e-06, "loss": 0.8245, "step": 1469 }, { "epoch": 0.04, "learning_rate": 1.9996919843302304e-06, "loss": 0.9795, "step": 1470 }, { "epoch": 0.04, "learning_rate": 1.9996899206860814e-06, "loss": 0.9043, "step": 1471 }, { "epoch": 0.04, "learning_rate": 1.9996878501530613e-06, "loss": 0.8486, "step": 1472 }, { "epoch": 0.04, "learning_rate": 1.999685772731185e-06, "loss": 0.8555, "step": 1473 }, { "epoch": 0.04, "learning_rate": 1.9996836884204657e-06, "loss": 0.8545, "step": 1474 }, { "epoch": 0.04, "learning_rate": 1.999681597220919e-06, "loss": 0.9551, "step": 1475 }, { "epoch": 0.04, "learning_rate": 1.999679499132559e-06, "loss": 0.8506, "step": 1476 }, { "epoch": 0.04, "learning_rate": 1.9996773941554e-06, "loss": 0.8989, "step": 1477 }, { "epoch": 0.04, "learning_rate": 1.999675282289456e-06, "loss": 0.8877, "step": 1478 }, { "epoch": 0.04, "learning_rate": 1.9996731635347427e-06, "loss": 0.6934, "step": 1479 }, { "epoch": 0.04, "learning_rate": 1.999671037891274e-06, "loss": 1.0088, "step": 1480 }, { "epoch": 0.04, "learning_rate": 1.9996689053590643e-06, "loss": 0.8633, "step": 1481 }, { "epoch": 0.04, "learning_rate": 1.999666765938129e-06, "loss": 0.8779, "step": 1482 }, { "epoch": 0.04, "learning_rate": 1.999664619628482e-06, "loss": 1.0723, "step": 1483 }, { "epoch": 0.04, "learning_rate": 1.999662466430139e-06, "loss": 1.0791, "step": 1484 }, { "epoch": 0.04, "learning_rate": 1.9996603063431143e-06, "loss": 1.0684, "step": 1485 }, { "epoch": 0.04, "learning_rate": 1.999658139367423e-06, "loss": 0.8223, "step": 1486 }, { "epoch": 0.04, "learning_rate": 1.9996559655030795e-06, "loss": 1.0176, "step": 1487 }, { "epoch": 0.04, "learning_rate": 1.9996537847500995e-06, "loss": 1.0225, "step": 1488 }, { "epoch": 0.04, "learning_rate": 1.999651597108498e-06, "loss": 0.9043, "step": 1489 }, { "epoch": 0.04, "learning_rate": 1.999649402578289e-06, "loss": 0.8159, "step": 1490 }, { "epoch": 0.04, "learning_rate": 1.999647201159489e-06, "loss": 1.0518, "step": 1491 }, { "epoch": 0.04, "learning_rate": 1.9996449928521122e-06, "loss": 1.0391, "step": 1492 }, { "epoch": 0.04, "learning_rate": 1.9996427776561748e-06, "loss": 1.0928, "step": 1493 }, { "epoch": 0.04, "learning_rate": 1.999640555571691e-06, "loss": 0.8594, "step": 1494 }, { "epoch": 0.04, "learning_rate": 1.9996383265986763e-06, "loss": 1.124, "step": 1495 }, { "epoch": 0.04, "learning_rate": 1.9996360907371467e-06, "loss": 1.0605, "step": 1496 }, { "epoch": 0.04, "learning_rate": 1.9996338479871177e-06, "loss": 0.8867, "step": 1497 }, { "epoch": 0.04, "learning_rate": 1.999631598348604e-06, "loss": 1.0967, "step": 1498 }, { "epoch": 0.04, "learning_rate": 1.9996293418216206e-06, "loss": 0.7886, "step": 1499 }, { "epoch": 0.04, "learning_rate": 1.999627078406185e-06, "loss": 1.166, "step": 1500 }, { "epoch": 0.04, "learning_rate": 1.999624808102311e-06, "loss": 1.1758, "step": 1501 }, { "epoch": 0.04, "learning_rate": 1.999622530910015e-06, "loss": 0.9106, "step": 1502 }, { "epoch": 0.04, "learning_rate": 1.999620246829313e-06, "loss": 0.8818, "step": 1503 }, { "epoch": 0.04, "learning_rate": 1.99961795586022e-06, "loss": 1.0947, "step": 1504 }, { "epoch": 0.04, "learning_rate": 1.9996156580027517e-06, "loss": 0.8105, "step": 1505 }, { "epoch": 0.04, "learning_rate": 1.999613353256925e-06, "loss": 1.0605, "step": 1506 }, { "epoch": 0.04, "learning_rate": 1.9996110416227547e-06, "loss": 0.8506, "step": 1507 }, { "epoch": 0.04, "learning_rate": 1.9996087231002576e-06, "loss": 0.877, "step": 1508 }, { "epoch": 0.04, "learning_rate": 1.999606397689449e-06, "loss": 0.958, "step": 1509 }, { "epoch": 0.04, "learning_rate": 1.999604065390345e-06, "loss": 0.959, "step": 1510 }, { "epoch": 0.04, "learning_rate": 1.999601726202962e-06, "loss": 0.9902, "step": 1511 }, { "epoch": 0.04, "learning_rate": 1.999599380127316e-06, "loss": 1.1445, "step": 1512 }, { "epoch": 0.04, "learning_rate": 1.999597027163423e-06, "loss": 0.915, "step": 1513 }, { "epoch": 0.04, "learning_rate": 1.9995946673112996e-06, "loss": 1.0547, "step": 1514 }, { "epoch": 0.04, "learning_rate": 1.9995923005709615e-06, "loss": 0.8569, "step": 1515 }, { "epoch": 0.04, "learning_rate": 1.9995899269424253e-06, "loss": 0.9375, "step": 1516 }, { "epoch": 0.04, "learning_rate": 1.9995875464257076e-06, "loss": 1.0537, "step": 1517 }, { "epoch": 0.04, "learning_rate": 1.9995851590208242e-06, "loss": 0.9463, "step": 1518 }, { "epoch": 0.04, "learning_rate": 1.9995827647277923e-06, "loss": 1.0273, "step": 1519 }, { "epoch": 0.04, "learning_rate": 1.9995803635466275e-06, "loss": 0.835, "step": 1520 }, { "epoch": 0.04, "learning_rate": 1.9995779554773476e-06, "loss": 1.1064, "step": 1521 }, { "epoch": 0.04, "learning_rate": 1.9995755405199678e-06, "loss": 0.9014, "step": 1522 }, { "epoch": 0.04, "learning_rate": 1.999573118674506e-06, "loss": 0.8662, "step": 1523 }, { "epoch": 0.04, "learning_rate": 1.999570689940978e-06, "loss": 1.1318, "step": 1524 }, { "epoch": 0.04, "learning_rate": 1.9995682543194006e-06, "loss": 0.8418, "step": 1525 }, { "epoch": 0.04, "learning_rate": 1.999565811809791e-06, "loss": 1.0977, "step": 1526 }, { "epoch": 0.04, "learning_rate": 1.999563362412166e-06, "loss": 0.9766, "step": 1527 }, { "epoch": 0.04, "learning_rate": 1.999560906126542e-06, "loss": 1.0645, "step": 1528 }, { "epoch": 0.04, "learning_rate": 1.9995584429529363e-06, "loss": 0.9307, "step": 1529 }, { "epoch": 0.04, "learning_rate": 1.999555972891366e-06, "loss": 0.9482, "step": 1530 }, { "epoch": 0.04, "learning_rate": 1.999553495941848e-06, "loss": 0.8428, "step": 1531 }, { "epoch": 0.04, "learning_rate": 1.999551012104399e-06, "loss": 1.1367, "step": 1532 }, { "epoch": 0.04, "learning_rate": 1.9995485213790365e-06, "loss": 0.9805, "step": 1533 }, { "epoch": 0.04, "learning_rate": 1.9995460237657778e-06, "loss": 0.9844, "step": 1534 }, { "epoch": 0.04, "learning_rate": 1.99954351926464e-06, "loss": 1.0449, "step": 1535 }, { "epoch": 0.04, "learning_rate": 1.9995410078756397e-06, "loss": 0.7256, "step": 1536 }, { "epoch": 0.04, "learning_rate": 1.9995384895987954e-06, "loss": 1.0244, "step": 1537 }, { "epoch": 0.04, "learning_rate": 1.9995359644341235e-06, "loss": 1.1416, "step": 1538 }, { "epoch": 0.04, "learning_rate": 1.999533432381642e-06, "loss": 0.9023, "step": 1539 }, { "epoch": 0.04, "learning_rate": 1.9995308934413675e-06, "loss": 0.9844, "step": 1540 }, { "epoch": 0.04, "learning_rate": 1.9995283476133184e-06, "loss": 0.9971, "step": 1541 }, { "epoch": 0.04, "learning_rate": 1.999525794897512e-06, "loss": 0.9946, "step": 1542 }, { "epoch": 0.04, "learning_rate": 1.9995232352939655e-06, "loss": 0.8398, "step": 1543 }, { "epoch": 0.04, "learning_rate": 1.9995206688026972e-06, "loss": 0.7612, "step": 1544 }, { "epoch": 0.04, "learning_rate": 1.999518095423724e-06, "loss": 1.0303, "step": 1545 }, { "epoch": 0.04, "learning_rate": 1.9995155151570646e-06, "loss": 1.043, "step": 1546 }, { "epoch": 0.04, "learning_rate": 1.999512928002736e-06, "loss": 0.7935, "step": 1547 }, { "epoch": 0.04, "learning_rate": 1.9995103339607558e-06, "loss": 0.9727, "step": 1548 }, { "epoch": 0.04, "learning_rate": 1.999507733031143e-06, "loss": 1.0918, "step": 1549 }, { "epoch": 0.04, "learning_rate": 1.9995051252139147e-06, "loss": 0.9775, "step": 1550 }, { "epoch": 0.04, "learning_rate": 1.999502510509089e-06, "loss": 1.0801, "step": 1551 }, { "epoch": 0.04, "learning_rate": 1.9994998889166837e-06, "loss": 0.9668, "step": 1552 }, { "epoch": 0.04, "learning_rate": 1.9994972604367174e-06, "loss": 0.8999, "step": 1553 }, { "epoch": 0.04, "learning_rate": 1.9994946250692076e-06, "loss": 1.0742, "step": 1554 }, { "epoch": 0.04, "learning_rate": 1.999491982814173e-06, "loss": 1.0664, "step": 1555 }, { "epoch": 0.04, "learning_rate": 1.9994893336716317e-06, "loss": 0.9912, "step": 1556 }, { "epoch": 0.04, "learning_rate": 1.9994866776416016e-06, "loss": 1.0098, "step": 1557 }, { "epoch": 0.04, "learning_rate": 1.9994840147241013e-06, "loss": 1.0605, "step": 1558 }, { "epoch": 0.04, "learning_rate": 1.9994813449191495e-06, "loss": 0.9033, "step": 1559 }, { "epoch": 0.04, "learning_rate": 1.999478668226764e-06, "loss": 1.2324, "step": 1560 }, { "epoch": 0.04, "learning_rate": 1.999475984646963e-06, "loss": 1.1172, "step": 1561 }, { "epoch": 0.04, "learning_rate": 1.9994732941797658e-06, "loss": 0.918, "step": 1562 }, { "epoch": 0.04, "learning_rate": 1.9994705968251907e-06, "loss": 0.7783, "step": 1563 }, { "epoch": 0.04, "learning_rate": 1.9994678925832564e-06, "loss": 1.1055, "step": 1564 }, { "epoch": 0.04, "learning_rate": 1.9994651814539803e-06, "loss": 0.8374, "step": 1565 }, { "epoch": 0.04, "learning_rate": 1.999462463437383e-06, "loss": 1.0898, "step": 1566 }, { "epoch": 0.04, "learning_rate": 1.999459738533482e-06, "loss": 1.1279, "step": 1567 }, { "epoch": 0.04, "learning_rate": 1.9994570067422962e-06, "loss": 1.1543, "step": 1568 }, { "epoch": 0.04, "learning_rate": 1.9994542680638453e-06, "loss": 0.8213, "step": 1569 }, { "epoch": 0.04, "learning_rate": 1.999451522498147e-06, "loss": 1.0059, "step": 1570 }, { "epoch": 0.04, "learning_rate": 1.999448770045221e-06, "loss": 1.1279, "step": 1571 }, { "epoch": 0.04, "learning_rate": 1.9994460107050856e-06, "loss": 0.8525, "step": 1572 }, { "epoch": 0.04, "learning_rate": 1.99944324447776e-06, "loss": 1.1152, "step": 1573 }, { "epoch": 0.04, "learning_rate": 1.999440471363264e-06, "loss": 0.8008, "step": 1574 }, { "epoch": 0.04, "learning_rate": 1.9994376913616156e-06, "loss": 0.9697, "step": 1575 }, { "epoch": 0.04, "learning_rate": 1.9994349044728352e-06, "loss": 0.7773, "step": 1576 }, { "epoch": 0.04, "learning_rate": 1.999432110696941e-06, "loss": 0.9307, "step": 1577 }, { "epoch": 0.04, "learning_rate": 1.999429310033952e-06, "loss": 1.0098, "step": 1578 }, { "epoch": 0.04, "learning_rate": 1.9994265024838892e-06, "loss": 1.125, "step": 1579 }, { "epoch": 0.04, "learning_rate": 1.99942368804677e-06, "loss": 1.125, "step": 1580 }, { "epoch": 0.04, "learning_rate": 1.999420866722615e-06, "loss": 1.1309, "step": 1581 }, { "epoch": 0.04, "learning_rate": 1.999418038511443e-06, "loss": 0.8936, "step": 1582 }, { "epoch": 0.04, "learning_rate": 1.9994152034132742e-06, "loss": 0.7495, "step": 1583 }, { "epoch": 0.04, "learning_rate": 1.999412361428127e-06, "loss": 0.6406, "step": 1584 }, { "epoch": 0.04, "learning_rate": 1.999409512556022e-06, "loss": 1.0166, "step": 1585 }, { "epoch": 0.04, "learning_rate": 1.9994066567969787e-06, "loss": 0.8389, "step": 1586 }, { "epoch": 0.04, "learning_rate": 1.9994037941510165e-06, "loss": 0.8076, "step": 1587 }, { "epoch": 0.04, "learning_rate": 1.9994009246181547e-06, "loss": 0.7783, "step": 1588 }, { "epoch": 0.04, "learning_rate": 1.9993980481984145e-06, "loss": 0.9165, "step": 1589 }, { "epoch": 0.04, "learning_rate": 1.999395164891814e-06, "loss": 1.1572, "step": 1590 }, { "epoch": 0.04, "learning_rate": 1.9993922746983744e-06, "loss": 0.7473, "step": 1591 }, { "epoch": 0.04, "learning_rate": 1.999389377618115e-06, "loss": 0.7969, "step": 1592 }, { "epoch": 0.04, "learning_rate": 1.999386473651055e-06, "loss": 0.9785, "step": 1593 }, { "epoch": 0.04, "learning_rate": 1.999383562797216e-06, "loss": 1.0273, "step": 1594 }, { "epoch": 0.04, "learning_rate": 1.9993806450566177e-06, "loss": 0.7676, "step": 1595 }, { "epoch": 0.04, "learning_rate": 1.999377720429279e-06, "loss": 0.8628, "step": 1596 }, { "epoch": 0.04, "learning_rate": 1.9993747889152215e-06, "loss": 1.1709, "step": 1597 }, { "epoch": 0.04, "learning_rate": 1.9993718505144645e-06, "loss": 0.9492, "step": 1598 }, { "epoch": 0.04, "learning_rate": 1.9993689052270286e-06, "loss": 1.0029, "step": 1599 }, { "epoch": 0.04, "learning_rate": 1.999365953052934e-06, "loss": 0.8291, "step": 1600 }, { "epoch": 0.04, "learning_rate": 1.999362993992201e-06, "loss": 1.042, "step": 1601 }, { "epoch": 0.04, "learning_rate": 1.99936002804485e-06, "loss": 1.0566, "step": 1602 }, { "epoch": 0.04, "learning_rate": 1.999357055210902e-06, "loss": 0.8452, "step": 1603 }, { "epoch": 0.04, "learning_rate": 1.9993540754903764e-06, "loss": 1.0996, "step": 1604 }, { "epoch": 0.04, "learning_rate": 1.9993510888832947e-06, "loss": 1.166, "step": 1605 }, { "epoch": 0.04, "learning_rate": 1.999348095389677e-06, "loss": 0.9253, "step": 1606 }, { "epoch": 0.04, "learning_rate": 1.999345095009544e-06, "loss": 0.8589, "step": 1607 }, { "epoch": 0.04, "learning_rate": 1.9993420877429165e-06, "loss": 1.2207, "step": 1608 }, { "epoch": 0.04, "learning_rate": 1.9993390735898147e-06, "loss": 0.8809, "step": 1609 }, { "epoch": 0.04, "learning_rate": 1.99933605255026e-06, "loss": 1.0078, "step": 1610 }, { "epoch": 0.04, "learning_rate": 1.999333024624273e-06, "loss": 0.9238, "step": 1611 }, { "epoch": 0.04, "learning_rate": 1.999329989811875e-06, "loss": 0.8311, "step": 1612 }, { "epoch": 0.04, "learning_rate": 1.999326948113086e-06, "loss": 0.9629, "step": 1613 }, { "epoch": 0.04, "learning_rate": 1.9993238995279277e-06, "loss": 1.1055, "step": 1614 }, { "epoch": 0.04, "learning_rate": 1.9993208440564207e-06, "loss": 0.8184, "step": 1615 }, { "epoch": 0.04, "learning_rate": 1.9993177816985863e-06, "loss": 1.0654, "step": 1616 }, { "epoch": 0.04, "learning_rate": 1.9993147124544455e-06, "loss": 0.8213, "step": 1617 }, { "epoch": 0.04, "learning_rate": 1.9993116363240193e-06, "loss": 0.9639, "step": 1618 }, { "epoch": 0.04, "learning_rate": 1.9993085533073295e-06, "loss": 0.9814, "step": 1619 }, { "epoch": 0.04, "learning_rate": 1.9993054634043965e-06, "loss": 1.0938, "step": 1620 }, { "epoch": 0.04, "learning_rate": 1.9993023666152424e-06, "loss": 0.8604, "step": 1621 }, { "epoch": 0.04, "learning_rate": 1.999299262939888e-06, "loss": 0.8472, "step": 1622 }, { "epoch": 0.04, "learning_rate": 1.9992961523783545e-06, "loss": 0.9385, "step": 1623 }, { "epoch": 0.04, "learning_rate": 1.999293034930664e-06, "loss": 0.9717, "step": 1624 }, { "epoch": 0.04, "learning_rate": 1.9992899105968373e-06, "loss": 0.7954, "step": 1625 }, { "epoch": 0.04, "learning_rate": 1.9992867793768963e-06, "loss": 0.9414, "step": 1626 }, { "epoch": 0.04, "learning_rate": 1.999283641270863e-06, "loss": 0.938, "step": 1627 }, { "epoch": 0.04, "learning_rate": 1.999280496278758e-06, "loss": 0.896, "step": 1628 }, { "epoch": 0.04, "learning_rate": 1.9992773444006043e-06, "loss": 1.1504, "step": 1629 }, { "epoch": 0.04, "learning_rate": 1.9992741856364224e-06, "loss": 1.0752, "step": 1630 }, { "epoch": 0.04, "learning_rate": 1.9992710199862344e-06, "loss": 1.1104, "step": 1631 }, { "epoch": 0.04, "learning_rate": 1.9992678474500625e-06, "loss": 1.1387, "step": 1632 }, { "epoch": 0.04, "learning_rate": 1.999264668027928e-06, "loss": 0.9512, "step": 1633 }, { "epoch": 0.04, "learning_rate": 1.999261481719854e-06, "loss": 0.9375, "step": 1634 }, { "epoch": 0.04, "learning_rate": 1.9992582885258605e-06, "loss": 1.1729, "step": 1635 }, { "epoch": 0.04, "learning_rate": 1.9992550884459715e-06, "loss": 0.9688, "step": 1636 }, { "epoch": 0.04, "learning_rate": 1.9992518814802074e-06, "loss": 0.8936, "step": 1637 }, { "epoch": 0.04, "learning_rate": 1.9992486676285915e-06, "loss": 1.1064, "step": 1638 }, { "epoch": 0.04, "learning_rate": 1.9992454468911453e-06, "loss": 0.9648, "step": 1639 }, { "epoch": 0.04, "learning_rate": 1.9992422192678913e-06, "loss": 1.1211, "step": 1640 }, { "epoch": 0.04, "learning_rate": 1.999238984758851e-06, "loss": 0.8062, "step": 1641 }, { "epoch": 0.04, "learning_rate": 1.9992357433640484e-06, "loss": 0.9414, "step": 1642 }, { "epoch": 0.04, "learning_rate": 1.999232495083504e-06, "loss": 1.1533, "step": 1643 }, { "epoch": 0.04, "learning_rate": 1.999229239917241e-06, "loss": 0.9775, "step": 1644 }, { "epoch": 0.04, "learning_rate": 1.9992259778652822e-06, "loss": 1.0303, "step": 1645 }, { "epoch": 0.04, "learning_rate": 1.999222708927649e-06, "loss": 1.043, "step": 1646 }, { "epoch": 0.04, "learning_rate": 1.999219433104365e-06, "loss": 1.0879, "step": 1647 }, { "epoch": 0.04, "learning_rate": 1.999216150395452e-06, "loss": 0.9023, "step": 1648 }, { "epoch": 0.04, "learning_rate": 1.9992128608009335e-06, "loss": 1.0557, "step": 1649 }, { "epoch": 0.04, "learning_rate": 1.999209564320831e-06, "loss": 1.1309, "step": 1650 }, { "epoch": 0.04, "learning_rate": 1.9992062609551682e-06, "loss": 0.8105, "step": 1651 }, { "epoch": 0.04, "learning_rate": 1.9992029507039676e-06, "loss": 1.1309, "step": 1652 }, { "epoch": 0.04, "learning_rate": 1.9991996335672517e-06, "loss": 0.8496, "step": 1653 }, { "epoch": 0.04, "learning_rate": 1.9991963095450436e-06, "loss": 0.9219, "step": 1654 }, { "epoch": 0.04, "learning_rate": 1.999192978637366e-06, "loss": 0.9717, "step": 1655 }, { "epoch": 0.04, "learning_rate": 1.9991896408442424e-06, "loss": 0.9385, "step": 1656 }, { "epoch": 0.04, "learning_rate": 1.9991862961656954e-06, "loss": 0.7324, "step": 1657 }, { "epoch": 0.04, "learning_rate": 1.999182944601748e-06, "loss": 1.084, "step": 1658 }, { "epoch": 0.04, "learning_rate": 1.9991795861524233e-06, "loss": 0.8599, "step": 1659 }, { "epoch": 0.04, "learning_rate": 1.9991762208177447e-06, "loss": 0.8389, "step": 1660 }, { "epoch": 0.04, "learning_rate": 1.9991728485977347e-06, "loss": 0.9453, "step": 1661 }, { "epoch": 0.04, "learning_rate": 1.999169469492418e-06, "loss": 0.9941, "step": 1662 }, { "epoch": 0.04, "learning_rate": 1.999166083501816e-06, "loss": 1.2207, "step": 1663 }, { "epoch": 0.04, "learning_rate": 1.9991626906259534e-06, "loss": 1.0576, "step": 1664 }, { "epoch": 0.04, "learning_rate": 1.999159290864853e-06, "loss": 0.958, "step": 1665 }, { "epoch": 0.04, "learning_rate": 1.9991558842185386e-06, "loss": 0.8574, "step": 1666 }, { "epoch": 0.04, "learning_rate": 1.999152470687033e-06, "loss": 1.2197, "step": 1667 }, { "epoch": 0.04, "learning_rate": 1.999149050270361e-06, "loss": 0.9854, "step": 1668 }, { "epoch": 0.04, "learning_rate": 1.9991456229685446e-06, "loss": 1.0791, "step": 1669 }, { "epoch": 0.04, "learning_rate": 1.9991421887816083e-06, "loss": 1.1025, "step": 1670 }, { "epoch": 0.04, "learning_rate": 1.999138747709576e-06, "loss": 1.0205, "step": 1671 }, { "epoch": 0.04, "learning_rate": 1.999135299752471e-06, "loss": 0.8145, "step": 1672 }, { "epoch": 0.04, "learning_rate": 1.999131844910317e-06, "loss": 1.0859, "step": 1673 }, { "epoch": 0.04, "learning_rate": 1.9991283831831376e-06, "loss": 1.1084, "step": 1674 }, { "epoch": 0.04, "learning_rate": 1.9991249145709574e-06, "loss": 0.9141, "step": 1675 }, { "epoch": 0.04, "learning_rate": 1.9991214390737994e-06, "loss": 0.6851, "step": 1676 }, { "epoch": 0.04, "learning_rate": 1.9991179566916883e-06, "loss": 1.0488, "step": 1677 }, { "epoch": 0.04, "learning_rate": 1.999114467424648e-06, "loss": 0.8306, "step": 1678 }, { "epoch": 0.04, "learning_rate": 1.999110971272702e-06, "loss": 1.0273, "step": 1679 }, { "epoch": 0.04, "learning_rate": 1.999107468235875e-06, "loss": 0.915, "step": 1680 }, { "epoch": 0.04, "learning_rate": 1.9991039583141906e-06, "loss": 0.8135, "step": 1681 }, { "epoch": 0.04, "learning_rate": 1.9991004415076733e-06, "loss": 0.8157, "step": 1682 }, { "epoch": 0.04, "learning_rate": 1.9990969178163477e-06, "loss": 0.9941, "step": 1683 }, { "epoch": 0.04, "learning_rate": 1.9990933872402375e-06, "loss": 0.8926, "step": 1684 }, { "epoch": 0.04, "learning_rate": 1.999089849779367e-06, "loss": 0.9482, "step": 1685 }, { "epoch": 0.04, "learning_rate": 1.999086305433761e-06, "loss": 0.8691, "step": 1686 }, { "epoch": 0.04, "learning_rate": 1.9990827542034437e-06, "loss": 1.2578, "step": 1687 }, { "epoch": 0.04, "learning_rate": 1.9990791960884395e-06, "loss": 0.9639, "step": 1688 }, { "epoch": 0.04, "learning_rate": 1.999075631088773e-06, "loss": 1.1738, "step": 1689 }, { "epoch": 0.04, "learning_rate": 1.999072059204469e-06, "loss": 0.8311, "step": 1690 }, { "epoch": 0.04, "learning_rate": 1.9990684804355516e-06, "loss": 1.0938, "step": 1691 }, { "epoch": 0.04, "learning_rate": 1.999064894782046e-06, "loss": 1.1533, "step": 1692 }, { "epoch": 0.04, "learning_rate": 1.9990613022439765e-06, "loss": 0.9297, "step": 1693 }, { "epoch": 0.04, "learning_rate": 1.9990577028213684e-06, "loss": 0.8062, "step": 1694 }, { "epoch": 0.04, "learning_rate": 1.9990540965142455e-06, "loss": 0.6846, "step": 1695 }, { "epoch": 0.04, "learning_rate": 1.9990504833226337e-06, "loss": 0.9062, "step": 1696 }, { "epoch": 0.04, "learning_rate": 1.9990468632465574e-06, "loss": 0.9473, "step": 1697 }, { "epoch": 0.04, "learning_rate": 1.9990432362860417e-06, "loss": 0.9629, "step": 1698 }, { "epoch": 0.04, "learning_rate": 1.999039602441111e-06, "loss": 1.1035, "step": 1699 }, { "epoch": 0.04, "learning_rate": 1.9990359617117916e-06, "loss": 1.0391, "step": 1700 }, { "epoch": 0.04, "learning_rate": 1.9990323140981075e-06, "loss": 1.0166, "step": 1701 }, { "epoch": 0.04, "learning_rate": 1.9990286596000844e-06, "loss": 1.0264, "step": 1702 }, { "epoch": 0.04, "learning_rate": 1.999024998217747e-06, "loss": 1.0117, "step": 1703 }, { "epoch": 0.04, "learning_rate": 1.9990213299511206e-06, "loss": 0.9824, "step": 1704 }, { "epoch": 0.04, "learning_rate": 1.999017654800231e-06, "loss": 0.687, "step": 1705 }, { "epoch": 0.04, "learning_rate": 1.9990139727651034e-06, "loss": 0.873, "step": 1706 }, { "epoch": 0.04, "learning_rate": 1.9990102838457624e-06, "loss": 1.0879, "step": 1707 }, { "epoch": 0.04, "learning_rate": 1.999006588042234e-06, "loss": 0.8877, "step": 1708 }, { "epoch": 0.04, "learning_rate": 1.9990028853545443e-06, "loss": 1.0547, "step": 1709 }, { "epoch": 0.04, "learning_rate": 1.9989991757827176e-06, "loss": 0.8799, "step": 1710 }, { "epoch": 0.04, "learning_rate": 1.9989954593267802e-06, "loss": 0.9863, "step": 1711 }, { "epoch": 0.04, "learning_rate": 1.9989917359867574e-06, "loss": 0.7686, "step": 1712 }, { "epoch": 0.04, "learning_rate": 1.9989880057626755e-06, "loss": 0.6729, "step": 1713 }, { "epoch": 0.04, "learning_rate": 1.998984268654559e-06, "loss": 0.8477, "step": 1714 }, { "epoch": 0.04, "learning_rate": 1.9989805246624347e-06, "loss": 0.8809, "step": 1715 }, { "epoch": 0.04, "learning_rate": 1.998976773786328e-06, "loss": 0.6428, "step": 1716 }, { "epoch": 0.04, "learning_rate": 1.998973016026265e-06, "loss": 0.9922, "step": 1717 }, { "epoch": 0.04, "learning_rate": 1.9989692513822713e-06, "loss": 1.0752, "step": 1718 }, { "epoch": 0.04, "learning_rate": 1.998965479854373e-06, "loss": 1.0547, "step": 1719 }, { "epoch": 0.04, "learning_rate": 1.998961701442596e-06, "loss": 0.8896, "step": 1720 }, { "epoch": 0.04, "learning_rate": 1.998957916146966e-06, "loss": 1.1797, "step": 1721 }, { "epoch": 0.04, "learning_rate": 1.99895412396751e-06, "loss": 0.9365, "step": 1722 }, { "epoch": 0.04, "learning_rate": 1.9989503249042535e-06, "loss": 1.0645, "step": 1723 }, { "epoch": 0.04, "learning_rate": 1.9989465189572226e-06, "loss": 1.0713, "step": 1724 }, { "epoch": 0.04, "learning_rate": 1.9989427061264435e-06, "loss": 1.0586, "step": 1725 }, { "epoch": 0.04, "learning_rate": 1.998938886411943e-06, "loss": 0.8027, "step": 1726 }, { "epoch": 0.04, "learning_rate": 1.998935059813747e-06, "loss": 1.1504, "step": 1727 }, { "epoch": 0.04, "learning_rate": 1.998931226331882e-06, "loss": 1.1152, "step": 1728 }, { "epoch": 0.04, "learning_rate": 1.998927385966374e-06, "loss": 1.1221, "step": 1729 }, { "epoch": 0.04, "learning_rate": 1.9989235387172502e-06, "loss": 0.9307, "step": 1730 }, { "epoch": 0.04, "learning_rate": 1.998919684584537e-06, "loss": 0.7588, "step": 1731 }, { "epoch": 0.04, "learning_rate": 1.9989158235682604e-06, "loss": 0.8721, "step": 1732 }, { "epoch": 0.04, "learning_rate": 1.998911955668447e-06, "loss": 0.79, "step": 1733 }, { "epoch": 0.04, "learning_rate": 1.998908080885124e-06, "loss": 0.8198, "step": 1734 }, { "epoch": 0.04, "learning_rate": 1.9989041992183182e-06, "loss": 1.0439, "step": 1735 }, { "epoch": 0.04, "learning_rate": 1.9989003106680554e-06, "loss": 1.0967, "step": 1736 }, { "epoch": 0.04, "learning_rate": 1.9988964152343637e-06, "loss": 0.9146, "step": 1737 }, { "epoch": 0.04, "learning_rate": 1.998892512917269e-06, "loss": 0.9922, "step": 1738 }, { "epoch": 0.04, "learning_rate": 1.998888603716798e-06, "loss": 0.9307, "step": 1739 }, { "epoch": 0.04, "learning_rate": 1.998884687632979e-06, "loss": 1.0156, "step": 1740 }, { "epoch": 0.04, "learning_rate": 1.9988807646658375e-06, "loss": 1.0254, "step": 1741 }, { "epoch": 0.04, "learning_rate": 1.998876834815401e-06, "loss": 0.9307, "step": 1742 }, { "epoch": 0.04, "learning_rate": 1.998872898081697e-06, "loss": 0.9395, "step": 1743 }, { "epoch": 0.04, "learning_rate": 1.998868954464752e-06, "loss": 0.9395, "step": 1744 }, { "epoch": 0.04, "learning_rate": 1.9988650039645937e-06, "loss": 1.0781, "step": 1745 }, { "epoch": 0.04, "learning_rate": 1.998861046581249e-06, "loss": 0.9092, "step": 1746 }, { "epoch": 0.04, "learning_rate": 1.998857082314745e-06, "loss": 0.9619, "step": 1747 }, { "epoch": 0.04, "learning_rate": 1.99885311116511e-06, "loss": 0.8418, "step": 1748 }, { "epoch": 0.04, "learning_rate": 1.99884913313237e-06, "loss": 1.0107, "step": 1749 }, { "epoch": 0.04, "learning_rate": 1.9988451482165534e-06, "loss": 1.0693, "step": 1750 }, { "epoch": 0.04, "learning_rate": 1.9988411564176877e-06, "loss": 0.585, "step": 1751 }, { "epoch": 0.04, "learning_rate": 1.9988371577357996e-06, "loss": 1.1025, "step": 1752 }, { "epoch": 0.04, "learning_rate": 1.998833152170917e-06, "loss": 1.0127, "step": 1753 }, { "epoch": 0.04, "learning_rate": 1.9988291397230677e-06, "loss": 1.0195, "step": 1754 }, { "epoch": 0.04, "learning_rate": 1.998825120392279e-06, "loss": 1.0059, "step": 1755 }, { "epoch": 0.05, "learning_rate": 1.9988210941785794e-06, "loss": 0.813, "step": 1756 }, { "epoch": 0.05, "learning_rate": 1.998817061081996e-06, "loss": 0.9575, "step": 1757 }, { "epoch": 0.05, "learning_rate": 1.9988130211025566e-06, "loss": 0.874, "step": 1758 }, { "epoch": 0.05, "learning_rate": 1.998808974240289e-06, "loss": 0.9082, "step": 1759 }, { "epoch": 0.05, "learning_rate": 1.9988049204952215e-06, "loss": 0.9834, "step": 1760 }, { "epoch": 0.05, "learning_rate": 1.9988008598673813e-06, "loss": 0.9121, "step": 1761 }, { "epoch": 0.05, "learning_rate": 1.998796792356797e-06, "loss": 0.9648, "step": 1762 }, { "epoch": 0.05, "learning_rate": 1.9987927179634966e-06, "loss": 0.916, "step": 1763 }, { "epoch": 0.05, "learning_rate": 1.998788636687508e-06, "loss": 1.0762, "step": 1764 }, { "epoch": 0.05, "learning_rate": 1.998784548528859e-06, "loss": 0.7773, "step": 1765 }, { "epoch": 0.05, "learning_rate": 1.998780453487579e-06, "loss": 0.8271, "step": 1766 }, { "epoch": 0.05, "learning_rate": 1.998776351563694e-06, "loss": 0.9336, "step": 1767 }, { "epoch": 0.05, "learning_rate": 1.998772242757235e-06, "loss": 1.0684, "step": 1768 }, { "epoch": 0.05, "learning_rate": 1.9987681270682284e-06, "loss": 0.8691, "step": 1769 }, { "epoch": 0.05, "learning_rate": 1.9987640044967028e-06, "loss": 1.0322, "step": 1770 }, { "epoch": 0.05, "learning_rate": 1.998759875042687e-06, "loss": 1.0107, "step": 1771 }, { "epoch": 0.05, "learning_rate": 1.99875573870621e-06, "loss": 0.9771, "step": 1772 }, { "epoch": 0.05, "learning_rate": 1.998751595487299e-06, "loss": 1.0117, "step": 1773 }, { "epoch": 0.05, "learning_rate": 1.9987474453859832e-06, "loss": 1.1914, "step": 1774 }, { "epoch": 0.05, "learning_rate": 1.9987432884022914e-06, "loss": 0.7246, "step": 1775 }, { "epoch": 0.05, "learning_rate": 1.998739124536252e-06, "loss": 0.8457, "step": 1776 }, { "epoch": 0.05, "learning_rate": 1.998734953787894e-06, "loss": 0.998, "step": 1777 }, { "epoch": 0.05, "learning_rate": 1.9987307761572456e-06, "loss": 0.9697, "step": 1778 }, { "epoch": 0.05, "learning_rate": 1.998726591644336e-06, "loss": 1.0547, "step": 1779 }, { "epoch": 0.05, "learning_rate": 1.9987224002491937e-06, "loss": 0.8652, "step": 1780 }, { "epoch": 0.05, "learning_rate": 1.998718201971848e-06, "loss": 0.9814, "step": 1781 }, { "epoch": 0.05, "learning_rate": 1.998713996812328e-06, "loss": 0.999, "step": 1782 }, { "epoch": 0.05, "learning_rate": 1.9987097847706614e-06, "loss": 0.9629, "step": 1783 }, { "epoch": 0.05, "learning_rate": 1.9987055658468786e-06, "loss": 1.1191, "step": 1784 }, { "epoch": 0.05, "learning_rate": 1.998701340041008e-06, "loss": 1.0957, "step": 1785 }, { "epoch": 0.05, "learning_rate": 1.9986971073530796e-06, "loss": 1.041, "step": 1786 }, { "epoch": 0.05, "learning_rate": 1.9986928677831214e-06, "loss": 0.9502, "step": 1787 }, { "epoch": 0.05, "learning_rate": 1.998688621331163e-06, "loss": 1.0273, "step": 1788 }, { "epoch": 0.05, "learning_rate": 1.9986843679972337e-06, "loss": 0.9521, "step": 1789 }, { "epoch": 0.05, "learning_rate": 1.9986801077813633e-06, "loss": 1.0566, "step": 1790 }, { "epoch": 0.05, "learning_rate": 1.9986758406835806e-06, "loss": 0.7463, "step": 1791 }, { "epoch": 0.05, "learning_rate": 1.998671566703915e-06, "loss": 0.9502, "step": 1792 }, { "epoch": 0.05, "learning_rate": 1.998667285842396e-06, "loss": 0.915, "step": 1793 }, { "epoch": 0.05, "learning_rate": 1.9986629980990536e-06, "loss": 1.0508, "step": 1794 }, { "epoch": 0.05, "learning_rate": 1.9986587034739165e-06, "loss": 1.0264, "step": 1795 }, { "epoch": 0.05, "learning_rate": 1.998654401967015e-06, "loss": 0.8252, "step": 1796 }, { "epoch": 0.05, "learning_rate": 1.9986500935783784e-06, "loss": 0.9834, "step": 1797 }, { "epoch": 0.05, "learning_rate": 1.9986457783080363e-06, "loss": 0.8604, "step": 1798 }, { "epoch": 0.05, "learning_rate": 1.9986414561560186e-06, "loss": 0.7881, "step": 1799 }, { "epoch": 0.05, "learning_rate": 1.998637127122355e-06, "loss": 1.0645, "step": 1800 }, { "epoch": 0.05, "learning_rate": 1.998632791207076e-06, "loss": 0.8447, "step": 1801 }, { "epoch": 0.05, "learning_rate": 1.99862844841021e-06, "loss": 1.1025, "step": 1802 }, { "epoch": 0.05, "learning_rate": 1.998624098731789e-06, "loss": 1.124, "step": 1803 }, { "epoch": 0.05, "learning_rate": 1.998619742171841e-06, "loss": 0.9131, "step": 1804 }, { "epoch": 0.05, "learning_rate": 1.998615378730397e-06, "loss": 1.0791, "step": 1805 }, { "epoch": 0.05, "learning_rate": 1.9986110084074867e-06, "loss": 0.9512, "step": 1806 }, { "epoch": 0.05, "learning_rate": 1.9986066312031403e-06, "loss": 0.9814, "step": 1807 }, { "epoch": 0.05, "learning_rate": 1.998602247117388e-06, "loss": 1.0273, "step": 1808 }, { "epoch": 0.05, "learning_rate": 1.9985978561502608e-06, "loss": 0.9604, "step": 1809 }, { "epoch": 0.05, "learning_rate": 1.9985934583017877e-06, "loss": 0.7681, "step": 1810 }, { "epoch": 0.05, "learning_rate": 1.9985890535719995e-06, "loss": 0.8281, "step": 1811 }, { "epoch": 0.05, "learning_rate": 1.9985846419609266e-06, "loss": 1.3066, "step": 1812 }, { "epoch": 0.05, "learning_rate": 1.9985802234685995e-06, "loss": 1.0215, "step": 1813 }, { "epoch": 0.05, "learning_rate": 1.9985757980950484e-06, "loss": 0.5566, "step": 1814 }, { "epoch": 0.05, "learning_rate": 1.998571365840304e-06, "loss": 1.0391, "step": 1815 }, { "epoch": 0.05, "learning_rate": 1.998566926704397e-06, "loss": 0.8662, "step": 1816 }, { "epoch": 0.05, "learning_rate": 1.9985624806873576e-06, "loss": 0.8203, "step": 1817 }, { "epoch": 0.05, "learning_rate": 1.9985580277892167e-06, "loss": 0.9795, "step": 1818 }, { "epoch": 0.05, "learning_rate": 1.998553568010005e-06, "loss": 1.1699, "step": 1819 }, { "epoch": 0.05, "learning_rate": 1.9985491013497527e-06, "loss": 1.043, "step": 1820 }, { "epoch": 0.05, "learning_rate": 1.998544627808491e-06, "loss": 1.208, "step": 1821 }, { "epoch": 0.05, "learning_rate": 1.998540147386251e-06, "loss": 0.9775, "step": 1822 }, { "epoch": 0.05, "learning_rate": 1.998535660083063e-06, "loss": 1.1777, "step": 1823 }, { "epoch": 0.05, "learning_rate": 1.998531165898959e-06, "loss": 0.8574, "step": 1824 }, { "epoch": 0.05, "learning_rate": 1.9985266648339685e-06, "loss": 0.8652, "step": 1825 }, { "epoch": 0.05, "learning_rate": 1.9985221568881233e-06, "loss": 1.126, "step": 1826 }, { "epoch": 0.05, "learning_rate": 1.9985176420614546e-06, "loss": 0.9805, "step": 1827 }, { "epoch": 0.05, "learning_rate": 1.998513120353993e-06, "loss": 0.7686, "step": 1828 }, { "epoch": 0.05, "learning_rate": 1.99850859176577e-06, "loss": 0.918, "step": 1829 }, { "epoch": 0.05, "learning_rate": 1.9985040562968168e-06, "loss": 0.8945, "step": 1830 }, { "epoch": 0.05, "learning_rate": 1.9984995139471644e-06, "loss": 1.0869, "step": 1831 }, { "epoch": 0.05, "learning_rate": 1.9984949647168448e-06, "loss": 0.8994, "step": 1832 }, { "epoch": 0.05, "learning_rate": 1.9984904086058885e-06, "loss": 1.0, "step": 1833 }, { "epoch": 0.05, "learning_rate": 1.9984858456143274e-06, "loss": 1.1719, "step": 1834 }, { "epoch": 0.05, "learning_rate": 1.9984812757421927e-06, "loss": 0.9268, "step": 1835 }, { "epoch": 0.05, "learning_rate": 1.998476698989516e-06, "loss": 0.8589, "step": 1836 }, { "epoch": 0.05, "learning_rate": 1.9984721153563287e-06, "loss": 1.1191, "step": 1837 }, { "epoch": 0.05, "learning_rate": 1.9984675248426626e-06, "loss": 0.9199, "step": 1838 }, { "epoch": 0.05, "learning_rate": 1.9984629274485496e-06, "loss": 1.0771, "step": 1839 }, { "epoch": 0.05, "learning_rate": 1.9984583231740205e-06, "loss": 0.8047, "step": 1840 }, { "epoch": 0.05, "learning_rate": 1.998453712019108e-06, "loss": 1.0674, "step": 1841 }, { "epoch": 0.05, "learning_rate": 1.998449093983843e-06, "loss": 0.9473, "step": 1842 }, { "epoch": 0.05, "learning_rate": 1.998444469068258e-06, "loss": 0.9941, "step": 1843 }, { "epoch": 0.05, "learning_rate": 1.9984398372723844e-06, "loss": 0.835, "step": 1844 }, { "epoch": 0.05, "learning_rate": 1.9984351985962546e-06, "loss": 1.0693, "step": 1845 }, { "epoch": 0.05, "learning_rate": 1.9984305530399003e-06, "loss": 0.874, "step": 1846 }, { "epoch": 0.05, "learning_rate": 1.9984259006033536e-06, "loss": 0.9849, "step": 1847 }, { "epoch": 0.05, "learning_rate": 1.998421241286646e-06, "loss": 1.0693, "step": 1848 }, { "epoch": 0.05, "learning_rate": 1.9984165750898104e-06, "loss": 1.1006, "step": 1849 }, { "epoch": 0.05, "learning_rate": 1.998411902012879e-06, "loss": 1.0557, "step": 1850 }, { "epoch": 0.05, "learning_rate": 1.9984072220558834e-06, "loss": 1.084, "step": 1851 }, { "epoch": 0.05, "learning_rate": 1.9984025352188557e-06, "loss": 1.0947, "step": 1852 }, { "epoch": 0.05, "learning_rate": 1.998397841501829e-06, "loss": 1.3066, "step": 1853 }, { "epoch": 0.05, "learning_rate": 1.998393140904835e-06, "loss": 1.2227, "step": 1854 }, { "epoch": 0.05, "learning_rate": 1.9983884334279063e-06, "loss": 1.0918, "step": 1855 }, { "epoch": 0.05, "learning_rate": 1.9983837190710755e-06, "loss": 0.9248, "step": 1856 }, { "epoch": 0.05, "learning_rate": 1.9983789978343746e-06, "loss": 1.0264, "step": 1857 }, { "epoch": 0.05, "learning_rate": 1.998374269717837e-06, "loss": 1.168, "step": 1858 }, { "epoch": 0.05, "learning_rate": 1.9983695347214946e-06, "loss": 0.8779, "step": 1859 }, { "epoch": 0.05, "learning_rate": 1.9983647928453804e-06, "loss": 0.9697, "step": 1860 }, { "epoch": 0.05, "learning_rate": 1.9983600440895264e-06, "loss": 1.0752, "step": 1861 }, { "epoch": 0.05, "learning_rate": 1.9983552884539663e-06, "loss": 0.7705, "step": 1862 }, { "epoch": 0.05, "learning_rate": 1.9983505259387317e-06, "loss": 1.3057, "step": 1863 }, { "epoch": 0.05, "learning_rate": 1.998345756543857e-06, "loss": 1.0225, "step": 1864 }, { "epoch": 0.05, "learning_rate": 1.9983409802693734e-06, "loss": 1.0498, "step": 1865 }, { "epoch": 0.05, "learning_rate": 1.998336197115315e-06, "loss": 0.9961, "step": 1866 }, { "epoch": 0.05, "learning_rate": 1.998331407081714e-06, "loss": 0.8359, "step": 1867 }, { "epoch": 0.05, "learning_rate": 1.9983266101686038e-06, "loss": 0.9185, "step": 1868 }, { "epoch": 0.05, "learning_rate": 1.9983218063760175e-06, "loss": 0.9854, "step": 1869 }, { "epoch": 0.05, "learning_rate": 1.998316995703988e-06, "loss": 0.9443, "step": 1870 }, { "epoch": 0.05, "learning_rate": 1.9983121781525484e-06, "loss": 1.0449, "step": 1871 }, { "epoch": 0.05, "learning_rate": 1.9983073537217325e-06, "loss": 1.1328, "step": 1872 }, { "epoch": 0.05, "learning_rate": 1.9983025224115725e-06, "loss": 1.0195, "step": 1873 }, { "epoch": 0.05, "learning_rate": 1.9982976842221027e-06, "loss": 0.7285, "step": 1874 }, { "epoch": 0.05, "learning_rate": 1.9982928391533557e-06, "loss": 0.8398, "step": 1875 }, { "epoch": 0.05, "learning_rate": 1.998287987205366e-06, "loss": 1.1318, "step": 1876 }, { "epoch": 0.05, "learning_rate": 1.9982831283781653e-06, "loss": 1.1074, "step": 1877 }, { "epoch": 0.05, "learning_rate": 1.9982782626717883e-06, "loss": 1.0146, "step": 1878 }, { "epoch": 0.05, "learning_rate": 1.9982733900862684e-06, "loss": 1.0439, "step": 1879 }, { "epoch": 0.05, "learning_rate": 1.9982685106216387e-06, "loss": 0.9531, "step": 1880 }, { "epoch": 0.05, "learning_rate": 1.9982636242779333e-06, "loss": 0.876, "step": 1881 }, { "epoch": 0.05, "learning_rate": 1.998258731055186e-06, "loss": 0.959, "step": 1882 }, { "epoch": 0.05, "learning_rate": 1.99825383095343e-06, "loss": 0.9707, "step": 1883 }, { "epoch": 0.05, "learning_rate": 1.9982489239726995e-06, "loss": 0.6416, "step": 1884 }, { "epoch": 0.05, "learning_rate": 1.9982440101130276e-06, "loss": 0.9312, "step": 1885 }, { "epoch": 0.05, "learning_rate": 1.9982390893744496e-06, "loss": 1.0459, "step": 1886 }, { "epoch": 0.05, "learning_rate": 1.998234161756998e-06, "loss": 0.8423, "step": 1887 }, { "epoch": 0.05, "learning_rate": 1.998229227260707e-06, "loss": 0.9473, "step": 1888 }, { "epoch": 0.05, "learning_rate": 1.998224285885611e-06, "loss": 0.8452, "step": 1889 }, { "epoch": 0.05, "learning_rate": 1.9982193376317438e-06, "loss": 0.96, "step": 1890 }, { "epoch": 0.05, "learning_rate": 1.99821438249914e-06, "loss": 0.9814, "step": 1891 }, { "epoch": 0.05, "learning_rate": 1.998209420487833e-06, "loss": 0.9297, "step": 1892 }, { "epoch": 0.05, "learning_rate": 1.9982044515978574e-06, "loss": 1.084, "step": 1893 }, { "epoch": 0.05, "learning_rate": 1.998199475829248e-06, "loss": 0.9932, "step": 1894 }, { "epoch": 0.05, "learning_rate": 1.9981944931820376e-06, "loss": 0.8604, "step": 1895 }, { "epoch": 0.05, "learning_rate": 1.998189503656262e-06, "loss": 0.8037, "step": 1896 }, { "epoch": 0.05, "learning_rate": 1.9981845072519546e-06, "loss": 0.8389, "step": 1897 }, { "epoch": 0.05, "learning_rate": 1.99817950396915e-06, "loss": 0.9941, "step": 1898 }, { "epoch": 0.05, "learning_rate": 1.9981744938078834e-06, "loss": 0.916, "step": 1899 }, { "epoch": 0.05, "learning_rate": 1.9981694767681886e-06, "loss": 0.9014, "step": 1900 }, { "epoch": 0.05, "learning_rate": 1.9981644528501005e-06, "loss": 1.002, "step": 1901 }, { "epoch": 0.05, "learning_rate": 1.9981594220536538e-06, "loss": 0.9463, "step": 1902 }, { "epoch": 0.05, "learning_rate": 1.998154384378883e-06, "loss": 0.9277, "step": 1903 }, { "epoch": 0.05, "learning_rate": 1.9981493398258223e-06, "loss": 0.9814, "step": 1904 }, { "epoch": 0.05, "learning_rate": 1.9981442883945074e-06, "loss": 0.8418, "step": 1905 }, { "epoch": 0.05, "learning_rate": 1.998139230084972e-06, "loss": 1.0977, "step": 1906 }, { "epoch": 0.05, "learning_rate": 1.9981341648972525e-06, "loss": 1.1152, "step": 1907 }, { "epoch": 0.05, "learning_rate": 1.9981290928313824e-06, "loss": 0.7014, "step": 1908 }, { "epoch": 0.05, "learning_rate": 1.998124013887397e-06, "loss": 0.8828, "step": 1909 }, { "epoch": 0.05, "learning_rate": 1.998118928065332e-06, "loss": 1.0664, "step": 1910 }, { "epoch": 0.05, "learning_rate": 1.998113835365222e-06, "loss": 0.9639, "step": 1911 }, { "epoch": 0.05, "learning_rate": 1.9981087357871016e-06, "loss": 1.0498, "step": 1912 }, { "epoch": 0.05, "learning_rate": 1.9981036293310064e-06, "loss": 1.082, "step": 1913 }, { "epoch": 0.05, "learning_rate": 1.998098515996972e-06, "loss": 0.7969, "step": 1914 }, { "epoch": 0.05, "learning_rate": 1.9980933957850325e-06, "loss": 1.0264, "step": 1915 }, { "epoch": 0.05, "learning_rate": 1.998088268695224e-06, "loss": 1.0986, "step": 1916 }, { "epoch": 0.05, "learning_rate": 1.9980831347275822e-06, "loss": 0.8838, "step": 1917 }, { "epoch": 0.05, "learning_rate": 1.9980779938821417e-06, "loss": 0.9014, "step": 1918 }, { "epoch": 0.05, "learning_rate": 1.9980728461589385e-06, "loss": 0.8623, "step": 1919 }, { "epoch": 0.05, "learning_rate": 1.9980676915580073e-06, "loss": 1.084, "step": 1920 }, { "epoch": 0.05, "learning_rate": 1.998062530079384e-06, "loss": 1.1387, "step": 1921 }, { "epoch": 0.05, "learning_rate": 1.998057361723105e-06, "loss": 1.0322, "step": 1922 }, { "epoch": 0.05, "learning_rate": 1.9980521864892047e-06, "loss": 1.1797, "step": 1923 }, { "epoch": 0.05, "learning_rate": 1.998047004377719e-06, "loss": 0.9424, "step": 1924 }, { "epoch": 0.05, "learning_rate": 1.9980418153886843e-06, "loss": 0.8262, "step": 1925 }, { "epoch": 0.05, "learning_rate": 1.998036619522136e-06, "loss": 1.0312, "step": 1926 }, { "epoch": 0.05, "learning_rate": 1.9980314167781092e-06, "loss": 1.0205, "step": 1927 }, { "epoch": 0.05, "learning_rate": 1.9980262071566406e-06, "loss": 0.8232, "step": 1928 }, { "epoch": 0.05, "learning_rate": 1.9980209906577663e-06, "loss": 0.9893, "step": 1929 }, { "epoch": 0.05, "learning_rate": 1.9980157672815214e-06, "loss": 1.0996, "step": 1930 }, { "epoch": 0.05, "learning_rate": 1.998010537027942e-06, "loss": 1.0566, "step": 1931 }, { "epoch": 0.05, "learning_rate": 1.9980052998970655e-06, "loss": 1.0439, "step": 1932 }, { "epoch": 0.05, "learning_rate": 1.998000055888926e-06, "loss": 1.0957, "step": 1933 }, { "epoch": 0.05, "learning_rate": 1.997994805003561e-06, "loss": 0.9131, "step": 1934 }, { "epoch": 0.05, "learning_rate": 1.997989547241006e-06, "loss": 1.0869, "step": 1935 }, { "epoch": 0.05, "learning_rate": 1.9979842826012974e-06, "loss": 0.9053, "step": 1936 }, { "epoch": 0.05, "learning_rate": 1.997979011084472e-06, "loss": 1.0254, "step": 1937 }, { "epoch": 0.05, "learning_rate": 1.9979737326905654e-06, "loss": 1.207, "step": 1938 }, { "epoch": 0.05, "learning_rate": 1.9979684474196144e-06, "loss": 0.9668, "step": 1939 }, { "epoch": 0.05, "learning_rate": 1.9979631552716554e-06, "loss": 0.8672, "step": 1940 }, { "epoch": 0.05, "learning_rate": 1.9979578562467244e-06, "loss": 1.041, "step": 1941 }, { "epoch": 0.05, "learning_rate": 1.9979525503448587e-06, "loss": 0.7715, "step": 1942 }, { "epoch": 0.05, "learning_rate": 1.9979472375660943e-06, "loss": 0.7002, "step": 1943 }, { "epoch": 0.05, "learning_rate": 1.9979419179104675e-06, "loss": 1.0566, "step": 1944 }, { "epoch": 0.05, "learning_rate": 1.997936591378016e-06, "loss": 1.0781, "step": 1945 }, { "epoch": 0.05, "learning_rate": 1.997931257968776e-06, "loss": 1.0645, "step": 1946 }, { "epoch": 0.05, "learning_rate": 1.997925917682784e-06, "loss": 1.0869, "step": 1947 }, { "epoch": 0.05, "learning_rate": 1.9979205705200764e-06, "loss": 0.9365, "step": 1948 }, { "epoch": 0.05, "learning_rate": 1.997915216480691e-06, "loss": 0.9248, "step": 1949 }, { "epoch": 0.05, "learning_rate": 1.997909855564664e-06, "loss": 0.7549, "step": 1950 }, { "epoch": 0.05, "learning_rate": 1.9979044877720335e-06, "loss": 1.0068, "step": 1951 }, { "epoch": 0.05, "learning_rate": 1.997899113102835e-06, "loss": 1.0469, "step": 1952 }, { "epoch": 0.05, "learning_rate": 1.9978937315571065e-06, "loss": 1.0752, "step": 1953 }, { "epoch": 0.05, "learning_rate": 1.997888343134884e-06, "loss": 0.9922, "step": 1954 }, { "epoch": 0.05, "learning_rate": 1.9978829478362062e-06, "loss": 1.0, "step": 1955 }, { "epoch": 0.05, "learning_rate": 1.9978775456611094e-06, "loss": 0.8057, "step": 1956 }, { "epoch": 0.05, "learning_rate": 1.9978721366096305e-06, "loss": 0.5181, "step": 1957 }, { "epoch": 0.05, "learning_rate": 1.9978667206818073e-06, "loss": 0.8486, "step": 1958 }, { "epoch": 0.05, "learning_rate": 1.997861297877677e-06, "loss": 0.9355, "step": 1959 }, { "epoch": 0.05, "learning_rate": 1.997855868197277e-06, "loss": 0.9873, "step": 1960 }, { "epoch": 0.05, "learning_rate": 1.9978504316406447e-06, "loss": 0.9863, "step": 1961 }, { "epoch": 0.05, "learning_rate": 1.9978449882078177e-06, "loss": 0.9854, "step": 1962 }, { "epoch": 0.05, "learning_rate": 1.997839537898833e-06, "loss": 0.957, "step": 1963 }, { "epoch": 0.05, "learning_rate": 1.9978340807137287e-06, "loss": 0.6782, "step": 1964 }, { "epoch": 0.05, "learning_rate": 1.9978286166525425e-06, "loss": 0.915, "step": 1965 }, { "epoch": 0.05, "learning_rate": 1.997823145715311e-06, "loss": 0.9185, "step": 1966 }, { "epoch": 0.05, "learning_rate": 1.9978176679020736e-06, "loss": 1.3047, "step": 1967 }, { "epoch": 0.05, "learning_rate": 1.997812183212866e-06, "loss": 1.0977, "step": 1968 }, { "epoch": 0.05, "learning_rate": 1.997806691647728e-06, "loss": 1.0107, "step": 1969 }, { "epoch": 0.05, "learning_rate": 1.9978011932066965e-06, "loss": 0.8652, "step": 1970 }, { "epoch": 0.05, "learning_rate": 1.997795687889809e-06, "loss": 0.9199, "step": 1971 }, { "epoch": 0.05, "learning_rate": 1.997790175697104e-06, "loss": 0.998, "step": 1972 }, { "epoch": 0.05, "learning_rate": 1.9977846566286196e-06, "loss": 0.8711, "step": 1973 }, { "epoch": 0.05, "learning_rate": 1.9977791306843938e-06, "loss": 1.1494, "step": 1974 }, { "epoch": 0.05, "learning_rate": 1.997773597864464e-06, "loss": 0.9609, "step": 1975 }, { "epoch": 0.05, "learning_rate": 1.997768058168869e-06, "loss": 1.125, "step": 1976 }, { "epoch": 0.05, "learning_rate": 1.9977625115976468e-06, "loss": 1.1738, "step": 1977 }, { "epoch": 0.05, "learning_rate": 1.9977569581508355e-06, "loss": 0.9297, "step": 1978 }, { "epoch": 0.05, "learning_rate": 1.997751397828473e-06, "loss": 1.1328, "step": 1979 }, { "epoch": 0.05, "learning_rate": 1.997745830630599e-06, "loss": 1.0459, "step": 1980 }, { "epoch": 0.05, "learning_rate": 1.99774025655725e-06, "loss": 1.0352, "step": 1981 }, { "epoch": 0.05, "learning_rate": 1.997734675608466e-06, "loss": 0.9395, "step": 1982 }, { "epoch": 0.05, "learning_rate": 1.997729087784285e-06, "loss": 0.834, "step": 1983 }, { "epoch": 0.05, "learning_rate": 1.9977234930847447e-06, "loss": 1.0449, "step": 1984 }, { "epoch": 0.05, "learning_rate": 1.9977178915098848e-06, "loss": 0.9941, "step": 1985 }, { "epoch": 0.05, "learning_rate": 1.997712283059743e-06, "loss": 0.6355, "step": 1986 }, { "epoch": 0.05, "learning_rate": 1.997706667734358e-06, "loss": 0.7588, "step": 1987 }, { "epoch": 0.05, "learning_rate": 1.99770104553377e-06, "loss": 1.0859, "step": 1988 }, { "epoch": 0.05, "learning_rate": 1.997695416458016e-06, "loss": 1.1895, "step": 1989 }, { "epoch": 0.05, "learning_rate": 1.997689780507135e-06, "loss": 0.9248, "step": 1990 }, { "epoch": 0.05, "learning_rate": 1.997684137681166e-06, "loss": 0.7959, "step": 1991 }, { "epoch": 0.05, "learning_rate": 1.9976784879801488e-06, "loss": 0.7959, "step": 1992 }, { "epoch": 0.05, "learning_rate": 1.9976728314041213e-06, "loss": 1.1064, "step": 1993 }, { "epoch": 0.05, "learning_rate": 1.997667167953122e-06, "loss": 0.8691, "step": 1994 }, { "epoch": 0.05, "learning_rate": 1.997661497627192e-06, "loss": 0.7659, "step": 1995 }, { "epoch": 0.05, "learning_rate": 1.9976558204263686e-06, "loss": 1.1172, "step": 1996 }, { "epoch": 0.05, "learning_rate": 1.997650136350691e-06, "loss": 0.8516, "step": 1997 }, { "epoch": 0.05, "learning_rate": 1.9976444454001993e-06, "loss": 0.9766, "step": 1998 }, { "epoch": 0.05, "learning_rate": 1.997638747574932e-06, "loss": 1.0088, "step": 1999 }, { "epoch": 0.05, "learning_rate": 1.9976330428749282e-06, "loss": 1.0693, "step": 2000 }, { "epoch": 0.05, "learning_rate": 1.997627331300228e-06, "loss": 1.0771, "step": 2001 }, { "epoch": 0.05, "learning_rate": 1.9976216128508706e-06, "loss": 0.9688, "step": 2002 }, { "epoch": 0.05, "learning_rate": 1.9976158875268946e-06, "loss": 0.9004, "step": 2003 }, { "epoch": 0.05, "learning_rate": 1.99761015532834e-06, "loss": 0.9932, "step": 2004 }, { "epoch": 0.05, "learning_rate": 1.9976044162552467e-06, "loss": 0.7998, "step": 2005 }, { "epoch": 0.05, "learning_rate": 1.997598670307653e-06, "loss": 0.9551, "step": 2006 }, { "epoch": 0.05, "learning_rate": 1.9975929174856004e-06, "loss": 0.9941, "step": 2007 }, { "epoch": 0.05, "learning_rate": 1.997587157789127e-06, "loss": 0.8818, "step": 2008 }, { "epoch": 0.05, "learning_rate": 1.9975813912182724e-06, "loss": 0.9062, "step": 2009 }, { "epoch": 0.05, "learning_rate": 1.9975756177730778e-06, "loss": 0.9902, "step": 2010 }, { "epoch": 0.05, "learning_rate": 1.9975698374535814e-06, "loss": 0.8374, "step": 2011 }, { "epoch": 0.05, "learning_rate": 1.997564050259824e-06, "loss": 0.96, "step": 2012 }, { "epoch": 0.05, "learning_rate": 1.9975582561918453e-06, "loss": 1.0664, "step": 2013 }, { "epoch": 0.05, "learning_rate": 1.997552455249685e-06, "loss": 0.7451, "step": 2014 }, { "epoch": 0.05, "learning_rate": 1.9975466474333834e-06, "loss": 0.8682, "step": 2015 }, { "epoch": 0.05, "learning_rate": 1.9975408327429803e-06, "loss": 0.9102, "step": 2016 }, { "epoch": 0.05, "learning_rate": 1.9975350111785156e-06, "loss": 0.8188, "step": 2017 }, { "epoch": 0.05, "learning_rate": 1.9975291827400295e-06, "loss": 0.9688, "step": 2018 }, { "epoch": 0.05, "learning_rate": 1.9975233474275624e-06, "loss": 0.9639, "step": 2019 }, { "epoch": 0.05, "learning_rate": 1.9975175052411543e-06, "loss": 0.9707, "step": 2020 }, { "epoch": 0.05, "learning_rate": 1.997511656180845e-06, "loss": 0.9756, "step": 2021 }, { "epoch": 0.05, "learning_rate": 1.9975058002466765e-06, "loss": 1.0352, "step": 2022 }, { "epoch": 0.05, "learning_rate": 1.9974999374386873e-06, "loss": 0.7651, "step": 2023 }, { "epoch": 0.05, "learning_rate": 1.997494067756919e-06, "loss": 0.9248, "step": 2024 }, { "epoch": 0.05, "learning_rate": 1.997488191201411e-06, "loss": 1.1104, "step": 2025 }, { "epoch": 0.05, "learning_rate": 1.997482307772204e-06, "loss": 1.0605, "step": 2026 }, { "epoch": 0.05, "learning_rate": 1.9974764174693395e-06, "loss": 1.0762, "step": 2027 }, { "epoch": 0.05, "learning_rate": 1.9974705202928576e-06, "loss": 0.9766, "step": 2028 }, { "epoch": 0.05, "learning_rate": 1.997464616242799e-06, "loss": 0.9561, "step": 2029 }, { "epoch": 0.05, "learning_rate": 1.9974587053192035e-06, "loss": 1.0439, "step": 2030 }, { "epoch": 0.05, "learning_rate": 1.9974527875221127e-06, "loss": 0.8906, "step": 2031 }, { "epoch": 0.05, "learning_rate": 1.9974468628515676e-06, "loss": 1.1406, "step": 2032 }, { "epoch": 0.05, "learning_rate": 1.997440931307608e-06, "loss": 1.1562, "step": 2033 }, { "epoch": 0.05, "learning_rate": 1.9974349928902757e-06, "loss": 1.0664, "step": 2034 }, { "epoch": 0.05, "learning_rate": 1.997429047599612e-06, "loss": 0.8252, "step": 2035 }, { "epoch": 0.05, "learning_rate": 1.9974230954356563e-06, "loss": 0.9199, "step": 2036 }, { "epoch": 0.05, "learning_rate": 1.9974171363984507e-06, "loss": 0.9434, "step": 2037 }, { "epoch": 0.05, "learning_rate": 1.997411170488036e-06, "loss": 0.9541, "step": 2038 }, { "epoch": 0.05, "learning_rate": 1.997405197704454e-06, "loss": 0.8125, "step": 2039 }, { "epoch": 0.05, "learning_rate": 1.9973992180477443e-06, "loss": 0.8369, "step": 2040 }, { "epoch": 0.05, "learning_rate": 1.99739323151795e-06, "loss": 0.9072, "step": 2041 }, { "epoch": 0.05, "learning_rate": 1.9973872381151107e-06, "loss": 1.2539, "step": 2042 }, { "epoch": 0.05, "learning_rate": 1.9973812378392688e-06, "loss": 0.9834, "step": 2043 }, { "epoch": 0.05, "learning_rate": 1.997375230690465e-06, "loss": 1.0635, "step": 2044 }, { "epoch": 0.05, "learning_rate": 1.997369216668741e-06, "loss": 1.2051, "step": 2045 }, { "epoch": 0.05, "learning_rate": 1.9973631957741383e-06, "loss": 1.2891, "step": 2046 }, { "epoch": 0.05, "learning_rate": 1.997357168006698e-06, "loss": 1.1719, "step": 2047 }, { "epoch": 0.05, "learning_rate": 1.9973511333664627e-06, "loss": 0.959, "step": 2048 }, { "epoch": 0.05, "learning_rate": 1.9973450918534726e-06, "loss": 0.897, "step": 2049 }, { "epoch": 0.05, "learning_rate": 1.99733904346777e-06, "loss": 0.8496, "step": 2050 }, { "epoch": 0.05, "learning_rate": 1.9973329882093964e-06, "loss": 0.8789, "step": 2051 }, { "epoch": 0.05, "learning_rate": 1.997326926078394e-06, "loss": 0.7881, "step": 2052 }, { "epoch": 0.05, "learning_rate": 1.997320857074804e-06, "loss": 0.9092, "step": 2053 }, { "epoch": 0.05, "learning_rate": 1.9973147811986683e-06, "loss": 1.0195, "step": 2054 }, { "epoch": 0.05, "learning_rate": 1.997308698450029e-06, "loss": 0.9492, "step": 2055 }, { "epoch": 0.05, "learning_rate": 1.997302608828928e-06, "loss": 0.958, "step": 2056 }, { "epoch": 0.05, "learning_rate": 1.9972965123354072e-06, "loss": 0.9248, "step": 2057 }, { "epoch": 0.05, "learning_rate": 1.9972904089695087e-06, "loss": 0.9355, "step": 2058 }, { "epoch": 0.05, "learning_rate": 1.9972842987312744e-06, "loss": 0.9629, "step": 2059 }, { "epoch": 0.05, "learning_rate": 1.9972781816207463e-06, "loss": 0.7534, "step": 2060 }, { "epoch": 0.05, "learning_rate": 1.997272057637967e-06, "loss": 0.9316, "step": 2061 }, { "epoch": 0.05, "learning_rate": 1.997265926782978e-06, "loss": 0.9932, "step": 2062 }, { "epoch": 0.05, "learning_rate": 1.997259789055822e-06, "loss": 1.1631, "step": 2063 }, { "epoch": 0.05, "learning_rate": 1.9972536444565413e-06, "loss": 0.9307, "step": 2064 }, { "epoch": 0.05, "learning_rate": 1.9972474929851785e-06, "loss": 1.1758, "step": 2065 }, { "epoch": 0.05, "learning_rate": 1.9972413346417756e-06, "loss": 0.8535, "step": 2066 }, { "epoch": 0.05, "learning_rate": 1.9972351694263753e-06, "loss": 0.8877, "step": 2067 }, { "epoch": 0.05, "learning_rate": 1.9972289973390196e-06, "loss": 0.9014, "step": 2068 }, { "epoch": 0.05, "learning_rate": 1.9972228183797516e-06, "loss": 0.9512, "step": 2069 }, { "epoch": 0.05, "learning_rate": 1.9972166325486134e-06, "loss": 1.0146, "step": 2070 }, { "epoch": 0.05, "learning_rate": 1.9972104398456476e-06, "loss": 1.0098, "step": 2071 }, { "epoch": 0.05, "learning_rate": 1.997204240270898e-06, "loss": 0.9961, "step": 2072 }, { "epoch": 0.05, "learning_rate": 1.997198033824406e-06, "loss": 1.0635, "step": 2073 }, { "epoch": 0.05, "learning_rate": 1.9971918205062145e-06, "loss": 0.6246, "step": 2074 }, { "epoch": 0.05, "learning_rate": 1.9971856003163668e-06, "loss": 0.9639, "step": 2075 }, { "epoch": 0.05, "learning_rate": 1.9971793732549054e-06, "loss": 0.9502, "step": 2076 }, { "epoch": 0.05, "learning_rate": 1.997173139321874e-06, "loss": 0.9287, "step": 2077 }, { "epoch": 0.05, "learning_rate": 1.997166898517314e-06, "loss": 1.1602, "step": 2078 }, { "epoch": 0.05, "learning_rate": 1.9971606508412705e-06, "loss": 0.6318, "step": 2079 }, { "epoch": 0.05, "learning_rate": 1.9971543962937848e-06, "loss": 0.9038, "step": 2080 }, { "epoch": 0.05, "learning_rate": 1.9971481348749006e-06, "loss": 1.1377, "step": 2081 }, { "epoch": 0.05, "learning_rate": 1.9971418665846615e-06, "loss": 0.8838, "step": 2082 }, { "epoch": 0.05, "learning_rate": 1.9971355914231094e-06, "loss": 1.0156, "step": 2083 }, { "epoch": 0.05, "learning_rate": 1.9971293093902893e-06, "loss": 1.1309, "step": 2084 }, { "epoch": 0.05, "learning_rate": 1.997123020486243e-06, "loss": 0.9854, "step": 2085 }, { "epoch": 0.05, "learning_rate": 1.997116724711015e-06, "loss": 1.0801, "step": 2086 }, { "epoch": 0.05, "learning_rate": 1.997110422064648e-06, "loss": 0.9336, "step": 2087 }, { "epoch": 0.05, "learning_rate": 1.997104112547185e-06, "loss": 0.6624, "step": 2088 }, { "epoch": 0.05, "learning_rate": 1.9970977961586704e-06, "loss": 1.0576, "step": 2089 }, { "epoch": 0.05, "learning_rate": 1.9970914728991474e-06, "loss": 0.9463, "step": 2090 }, { "epoch": 0.05, "learning_rate": 1.9970851427686595e-06, "loss": 0.9414, "step": 2091 }, { "epoch": 0.05, "learning_rate": 1.9970788057672505e-06, "loss": 0.79, "step": 2092 }, { "epoch": 0.05, "learning_rate": 1.997072461894964e-06, "loss": 0.7668, "step": 2093 }, { "epoch": 0.05, "learning_rate": 1.997066111151843e-06, "loss": 1.0605, "step": 2094 }, { "epoch": 0.05, "learning_rate": 1.997059753537932e-06, "loss": 1.0146, "step": 2095 }, { "epoch": 0.05, "learning_rate": 1.997053389053275e-06, "loss": 0.7148, "step": 2096 }, { "epoch": 0.05, "learning_rate": 1.9970470176979156e-06, "loss": 0.9971, "step": 2097 }, { "epoch": 0.05, "learning_rate": 1.9970406394718975e-06, "loss": 0.9053, "step": 2098 }, { "epoch": 0.05, "learning_rate": 1.9970342543752653e-06, "loss": 0.9482, "step": 2099 }, { "epoch": 0.05, "learning_rate": 1.997027862408062e-06, "loss": 1.0898, "step": 2100 }, { "epoch": 0.05, "learning_rate": 1.9970214635703324e-06, "loss": 0.9189, "step": 2101 }, { "epoch": 0.05, "learning_rate": 1.9970150578621203e-06, "loss": 1.1445, "step": 2102 }, { "epoch": 0.05, "learning_rate": 1.9970086452834698e-06, "loss": 0.9629, "step": 2103 }, { "epoch": 0.05, "learning_rate": 1.9970022258344253e-06, "loss": 0.8818, "step": 2104 }, { "epoch": 0.05, "learning_rate": 1.996995799515031e-06, "loss": 1.1348, "step": 2105 }, { "epoch": 0.05, "learning_rate": 1.996989366325331e-06, "loss": 0.958, "step": 2106 }, { "epoch": 0.05, "learning_rate": 1.9969829262653697e-06, "loss": 1.0303, "step": 2107 }, { "epoch": 0.05, "learning_rate": 1.9969764793351917e-06, "loss": 1.0791, "step": 2108 }, { "epoch": 0.05, "learning_rate": 1.996970025534841e-06, "loss": 0.9785, "step": 2109 }, { "epoch": 0.05, "learning_rate": 1.9969635648643625e-06, "loss": 0.8955, "step": 2110 }, { "epoch": 0.05, "learning_rate": 1.9969570973238006e-06, "loss": 1.1738, "step": 2111 }, { "epoch": 0.05, "learning_rate": 1.9969506229131997e-06, "loss": 1.1318, "step": 2112 }, { "epoch": 0.05, "learning_rate": 1.9969441416326047e-06, "loss": 0.9668, "step": 2113 }, { "epoch": 0.05, "learning_rate": 1.99693765348206e-06, "loss": 1.0234, "step": 2114 }, { "epoch": 0.05, "learning_rate": 1.99693115846161e-06, "loss": 0.9521, "step": 2115 }, { "epoch": 0.05, "learning_rate": 1.9969246565713004e-06, "loss": 1.1494, "step": 2116 }, { "epoch": 0.05, "learning_rate": 1.9969181478111753e-06, "loss": 0.6646, "step": 2117 }, { "epoch": 0.05, "learning_rate": 1.9969116321812796e-06, "loss": 1.0762, "step": 2118 }, { "epoch": 0.05, "learning_rate": 1.9969051096816583e-06, "loss": 0.7627, "step": 2119 }, { "epoch": 0.05, "learning_rate": 1.9968985803123568e-06, "loss": 1.0381, "step": 2120 }, { "epoch": 0.05, "learning_rate": 1.996892044073419e-06, "loss": 0.8838, "step": 2121 }, { "epoch": 0.05, "learning_rate": 1.996885500964891e-06, "loss": 1.2061, "step": 2122 }, { "epoch": 0.05, "learning_rate": 1.9968789509868175e-06, "loss": 0.9219, "step": 2123 }, { "epoch": 0.05, "learning_rate": 1.9968723941392432e-06, "loss": 1.1582, "step": 2124 }, { "epoch": 0.05, "learning_rate": 1.996865830422214e-06, "loss": 1.0596, "step": 2125 }, { "epoch": 0.05, "learning_rate": 1.9968592598357746e-06, "loss": 1.1299, "step": 2126 }, { "epoch": 0.05, "learning_rate": 1.996852682379971e-06, "loss": 0.8682, "step": 2127 }, { "epoch": 0.05, "learning_rate": 1.9968460980548477e-06, "loss": 1.1045, "step": 2128 }, { "epoch": 0.05, "learning_rate": 1.9968395068604504e-06, "loss": 0.957, "step": 2129 }, { "epoch": 0.05, "learning_rate": 1.9968329087968247e-06, "loss": 1.1406, "step": 2130 }, { "epoch": 0.05, "learning_rate": 1.996826303864016e-06, "loss": 1.0205, "step": 2131 }, { "epoch": 0.05, "learning_rate": 1.9968196920620693e-06, "loss": 0.707, "step": 2132 }, { "epoch": 0.05, "learning_rate": 1.996813073391031e-06, "loss": 0.7773, "step": 2133 }, { "epoch": 0.05, "learning_rate": 1.9968064478509457e-06, "loss": 0.9658, "step": 2134 }, { "epoch": 0.05, "learning_rate": 1.99679981544186e-06, "loss": 0.9121, "step": 2135 }, { "epoch": 0.05, "learning_rate": 1.9967931761638195e-06, "loss": 1.0078, "step": 2136 }, { "epoch": 0.05, "learning_rate": 1.9967865300168692e-06, "loss": 1.0527, "step": 2137 }, { "epoch": 0.05, "learning_rate": 1.9967798770010557e-06, "loss": 0.9834, "step": 2138 }, { "epoch": 0.05, "learning_rate": 1.9967732171164245e-06, "loss": 0.877, "step": 2139 }, { "epoch": 0.05, "learning_rate": 1.9967665503630215e-06, "loss": 1.1191, "step": 2140 }, { "epoch": 0.05, "learning_rate": 1.9967598767408928e-06, "loss": 1.21, "step": 2141 }, { "epoch": 0.05, "learning_rate": 1.996753196250084e-06, "loss": 1.082, "step": 2142 }, { "epoch": 0.05, "learning_rate": 1.9967465088906416e-06, "loss": 0.8076, "step": 2143 }, { "epoch": 0.05, "learning_rate": 1.9967398146626115e-06, "loss": 0.8706, "step": 2144 }, { "epoch": 0.05, "learning_rate": 1.9967331135660395e-06, "loss": 1.1289, "step": 2145 }, { "epoch": 0.06, "learning_rate": 1.9967264056009727e-06, "loss": 0.7769, "step": 2146 }, { "epoch": 0.06, "learning_rate": 1.996719690767456e-06, "loss": 0.9902, "step": 2147 }, { "epoch": 0.06, "learning_rate": 1.996712969065537e-06, "loss": 0.8926, "step": 2148 }, { "epoch": 0.06, "learning_rate": 1.9967062404952607e-06, "loss": 0.7456, "step": 2149 }, { "epoch": 0.06, "learning_rate": 1.9966995050566746e-06, "loss": 1.042, "step": 2150 }, { "epoch": 0.06, "learning_rate": 1.9966927627498246e-06, "loss": 0.8359, "step": 2151 }, { "epoch": 0.06, "learning_rate": 1.996686013574757e-06, "loss": 0.9746, "step": 2152 }, { "epoch": 0.06, "learning_rate": 1.996679257531519e-06, "loss": 0.8081, "step": 2153 }, { "epoch": 0.06, "learning_rate": 1.9966724946201567e-06, "loss": 1.1191, "step": 2154 }, { "epoch": 0.06, "learning_rate": 1.9966657248407163e-06, "loss": 0.8574, "step": 2155 }, { "epoch": 0.06, "learning_rate": 1.996658948193245e-06, "loss": 0.8428, "step": 2156 }, { "epoch": 0.06, "learning_rate": 1.99665216467779e-06, "loss": 0.9443, "step": 2157 }, { "epoch": 0.06, "learning_rate": 1.9966453742943966e-06, "loss": 0.6816, "step": 2158 }, { "epoch": 0.06, "learning_rate": 1.996638577043113e-06, "loss": 1.002, "step": 2159 }, { "epoch": 0.06, "learning_rate": 1.996631772923985e-06, "loss": 1.0254, "step": 2160 }, { "epoch": 0.06, "learning_rate": 1.9966249619370597e-06, "loss": 0.8799, "step": 2161 }, { "epoch": 0.06, "learning_rate": 1.996618144082385e-06, "loss": 0.7119, "step": 2162 }, { "epoch": 0.06, "learning_rate": 1.9966113193600065e-06, "loss": 0.9795, "step": 2163 }, { "epoch": 0.06, "learning_rate": 1.996604487769972e-06, "loss": 0.9365, "step": 2164 }, { "epoch": 0.06, "learning_rate": 1.9965976493123285e-06, "loss": 0.9502, "step": 2165 }, { "epoch": 0.06, "learning_rate": 1.996590803987123e-06, "loss": 0.8838, "step": 2166 }, { "epoch": 0.06, "learning_rate": 1.996583951794403e-06, "loss": 0.9932, "step": 2167 }, { "epoch": 0.06, "learning_rate": 1.9965770927342158e-06, "loss": 1.1201, "step": 2168 }, { "epoch": 0.06, "learning_rate": 1.9965702268066073e-06, "loss": 1.1016, "step": 2169 }, { "epoch": 0.06, "learning_rate": 1.9965633540116267e-06, "loss": 0.9053, "step": 2170 }, { "epoch": 0.06, "learning_rate": 1.99655647434932e-06, "loss": 1.0352, "step": 2171 }, { "epoch": 0.06, "learning_rate": 1.9965495878197355e-06, "loss": 1.1172, "step": 2172 }, { "epoch": 0.06, "learning_rate": 1.9965426944229197e-06, "loss": 1.1748, "step": 2173 }, { "epoch": 0.06, "learning_rate": 1.9965357941589215e-06, "loss": 0.729, "step": 2174 }, { "epoch": 0.06, "learning_rate": 1.9965288870277866e-06, "loss": 0.8936, "step": 2175 }, { "epoch": 0.06, "learning_rate": 1.9965219730295643e-06, "loss": 0.8086, "step": 2176 }, { "epoch": 0.06, "learning_rate": 1.9965150521643013e-06, "loss": 1.0576, "step": 2177 }, { "epoch": 0.06, "learning_rate": 1.9965081244320458e-06, "loss": 1.0488, "step": 2178 }, { "epoch": 0.06, "learning_rate": 1.9965011898328454e-06, "loss": 1.0312, "step": 2179 }, { "epoch": 0.06, "learning_rate": 1.9964942483667472e-06, "loss": 0.7231, "step": 2180 }, { "epoch": 0.06, "learning_rate": 1.9964873000338e-06, "loss": 0.8984, "step": 2181 }, { "epoch": 0.06, "learning_rate": 1.9964803448340515e-06, "loss": 0.8037, "step": 2182 }, { "epoch": 0.06, "learning_rate": 1.9964733827675487e-06, "loss": 1.1738, "step": 2183 }, { "epoch": 0.06, "learning_rate": 1.996466413834341e-06, "loss": 0.9873, "step": 2184 }, { "epoch": 0.06, "learning_rate": 1.9964594380344754e-06, "loss": 0.9072, "step": 2185 }, { "epoch": 0.06, "learning_rate": 1.996452455368e-06, "loss": 1.1377, "step": 2186 }, { "epoch": 0.06, "learning_rate": 1.9964454658349637e-06, "loss": 1.0645, "step": 2187 }, { "epoch": 0.06, "learning_rate": 1.996438469435414e-06, "loss": 0.7314, "step": 2188 }, { "epoch": 0.06, "learning_rate": 1.9964314661693995e-06, "loss": 0.9355, "step": 2189 }, { "epoch": 0.06, "learning_rate": 1.9964244560369677e-06, "loss": 0.9932, "step": 2190 }, { "epoch": 0.06, "learning_rate": 1.9964174390381676e-06, "loss": 1.0088, "step": 2191 }, { "epoch": 0.06, "learning_rate": 1.996410415173048e-06, "loss": 1.0576, "step": 2192 }, { "epoch": 0.06, "learning_rate": 1.996403384441656e-06, "loss": 0.9736, "step": 2193 }, { "epoch": 0.06, "learning_rate": 1.996396346844041e-06, "loss": 1.0098, "step": 2194 }, { "epoch": 0.06, "learning_rate": 1.9963893023802513e-06, "loss": 0.7744, "step": 2195 }, { "epoch": 0.06, "learning_rate": 1.996382251050335e-06, "loss": 0.8379, "step": 2196 }, { "epoch": 0.06, "learning_rate": 1.996375192854342e-06, "loss": 1.0088, "step": 2197 }, { "epoch": 0.06, "learning_rate": 1.996368127792319e-06, "loss": 0.7959, "step": 2198 }, { "epoch": 0.06, "learning_rate": 1.9963610558643166e-06, "loss": 0.8691, "step": 2199 }, { "epoch": 0.06, "learning_rate": 1.996353977070382e-06, "loss": 0.877, "step": 2200 }, { "epoch": 0.06, "learning_rate": 1.9963468914105647e-06, "loss": 0.7087, "step": 2201 }, { "epoch": 0.06, "learning_rate": 1.9963397988849135e-06, "loss": 0.999, "step": 2202 }, { "epoch": 0.06, "learning_rate": 1.996332699493477e-06, "loss": 0.9541, "step": 2203 }, { "epoch": 0.06, "learning_rate": 1.996325593236305e-06, "loss": 0.8262, "step": 2204 }, { "epoch": 0.06, "learning_rate": 1.996318480113445e-06, "loss": 1.1494, "step": 2205 }, { "epoch": 0.06, "learning_rate": 1.9963113601249475e-06, "loss": 1.0771, "step": 2206 }, { "epoch": 0.06, "learning_rate": 1.9963042332708607e-06, "loss": 0.9941, "step": 2207 }, { "epoch": 0.06, "learning_rate": 1.996297099551234e-06, "loss": 0.8926, "step": 2208 }, { "epoch": 0.06, "learning_rate": 1.996289958966116e-06, "loss": 0.9375, "step": 2209 }, { "epoch": 0.06, "learning_rate": 1.9962828115155566e-06, "loss": 0.8057, "step": 2210 }, { "epoch": 0.06, "learning_rate": 1.996275657199605e-06, "loss": 0.9219, "step": 2211 }, { "epoch": 0.06, "learning_rate": 1.9962684960183102e-06, "loss": 1.1777, "step": 2212 }, { "epoch": 0.06, "learning_rate": 1.9962613279717215e-06, "loss": 0.876, "step": 2213 }, { "epoch": 0.06, "learning_rate": 1.996254153059889e-06, "loss": 0.957, "step": 2214 }, { "epoch": 0.06, "learning_rate": 1.996246971282861e-06, "loss": 0.9863, "step": 2215 }, { "epoch": 0.06, "learning_rate": 1.9962397826406882e-06, "loss": 0.7559, "step": 2216 }, { "epoch": 0.06, "learning_rate": 1.9962325871334193e-06, "loss": 0.999, "step": 2217 }, { "epoch": 0.06, "learning_rate": 1.996225384761104e-06, "loss": 0.8477, "step": 2218 }, { "epoch": 0.06, "learning_rate": 1.9962181755237916e-06, "loss": 0.9551, "step": 2219 }, { "epoch": 0.06, "learning_rate": 1.996210959421533e-06, "loss": 0.79, "step": 2220 }, { "epoch": 0.06, "learning_rate": 1.9962037364543765e-06, "loss": 0.4814, "step": 2221 }, { "epoch": 0.06, "learning_rate": 1.996196506622373e-06, "loss": 1.0068, "step": 2222 }, { "epoch": 0.06, "learning_rate": 1.9961892699255715e-06, "loss": 0.9521, "step": 2223 }, { "epoch": 0.06, "learning_rate": 1.9961820263640224e-06, "loss": 1.0527, "step": 2224 }, { "epoch": 0.06, "learning_rate": 1.9961747759377757e-06, "loss": 0.9619, "step": 2225 }, { "epoch": 0.06, "learning_rate": 1.9961675186468805e-06, "loss": 1.0781, "step": 2226 }, { "epoch": 0.06, "learning_rate": 1.996160254491388e-06, "loss": 1.0156, "step": 2227 }, { "epoch": 0.06, "learning_rate": 1.9961529834713474e-06, "loss": 1.1602, "step": 2228 }, { "epoch": 0.06, "learning_rate": 1.996145705586809e-06, "loss": 0.9424, "step": 2229 }, { "epoch": 0.06, "learning_rate": 1.996138420837823e-06, "loss": 1.041, "step": 2230 }, { "epoch": 0.06, "learning_rate": 1.99613112922444e-06, "loss": 0.8896, "step": 2231 }, { "epoch": 0.06, "learning_rate": 1.9961238307467096e-06, "loss": 1.0098, "step": 2232 }, { "epoch": 0.06, "learning_rate": 1.9961165254046822e-06, "loss": 0.9756, "step": 2233 }, { "epoch": 0.06, "learning_rate": 1.9961092131984083e-06, "loss": 1.25, "step": 2234 }, { "epoch": 0.06, "learning_rate": 1.9961018941279385e-06, "loss": 0.8525, "step": 2235 }, { "epoch": 0.06, "learning_rate": 1.9960945681933226e-06, "loss": 0.6929, "step": 2236 }, { "epoch": 0.06, "learning_rate": 1.996087235394612e-06, "loss": 1.0459, "step": 2237 }, { "epoch": 0.06, "learning_rate": 1.9960798957318566e-06, "loss": 1.1016, "step": 2238 }, { "epoch": 0.06, "learning_rate": 1.996072549205107e-06, "loss": 0.9277, "step": 2239 }, { "epoch": 0.06, "learning_rate": 1.996065195814414e-06, "loss": 1.0322, "step": 2240 }, { "epoch": 0.06, "learning_rate": 1.9960578355598285e-06, "loss": 0.8436, "step": 2241 }, { "epoch": 0.06, "learning_rate": 1.9960504684414004e-06, "loss": 0.8682, "step": 2242 }, { "epoch": 0.06, "learning_rate": 1.9960430944591815e-06, "loss": 0.9482, "step": 2243 }, { "epoch": 0.06, "learning_rate": 1.9960357136132217e-06, "loss": 1.0342, "step": 2244 }, { "epoch": 0.06, "learning_rate": 1.9960283259035726e-06, "loss": 0.8721, "step": 2245 }, { "epoch": 0.06, "learning_rate": 1.9960209313302847e-06, "loss": 1.1348, "step": 2246 }, { "epoch": 0.06, "learning_rate": 1.9960135298934087e-06, "loss": 0.8447, "step": 2247 }, { "epoch": 0.06, "learning_rate": 1.9960061215929964e-06, "loss": 0.8643, "step": 2248 }, { "epoch": 0.06, "learning_rate": 1.995998706429098e-06, "loss": 0.9453, "step": 2249 }, { "epoch": 0.06, "learning_rate": 1.9959912844017653e-06, "loss": 1.2715, "step": 2250 }, { "epoch": 0.06, "learning_rate": 1.995983855511049e-06, "loss": 0.8945, "step": 2251 }, { "epoch": 0.06, "learning_rate": 1.9959764197570007e-06, "loss": 0.8193, "step": 2252 }, { "epoch": 0.06, "learning_rate": 1.9959689771396707e-06, "loss": 0.9775, "step": 2253 }, { "epoch": 0.06, "learning_rate": 1.995961527659112e-06, "loss": 0.9116, "step": 2254 }, { "epoch": 0.06, "learning_rate": 1.995954071315374e-06, "loss": 0.8623, "step": 2255 }, { "epoch": 0.06, "learning_rate": 1.995946608108509e-06, "loss": 0.9756, "step": 2256 }, { "epoch": 0.06, "learning_rate": 1.995939138038569e-06, "loss": 1.0811, "step": 2257 }, { "epoch": 0.06, "learning_rate": 1.9959316611056045e-06, "loss": 0.8818, "step": 2258 }, { "epoch": 0.06, "learning_rate": 1.9959241773096674e-06, "loss": 1.0742, "step": 2259 }, { "epoch": 0.06, "learning_rate": 1.9959166866508093e-06, "loss": 1.0498, "step": 2260 }, { "epoch": 0.06, "learning_rate": 1.9959091891290815e-06, "loss": 1.0469, "step": 2261 }, { "epoch": 0.06, "learning_rate": 1.9959016847445364e-06, "loss": 0.8135, "step": 2262 }, { "epoch": 0.06, "learning_rate": 1.995894173497225e-06, "loss": 0.8057, "step": 2263 }, { "epoch": 0.06, "learning_rate": 1.9958866553871997e-06, "loss": 1.0635, "step": 2264 }, { "epoch": 0.06, "learning_rate": 1.9958791304145114e-06, "loss": 1.0615, "step": 2265 }, { "epoch": 0.06, "learning_rate": 1.995871598579213e-06, "loss": 0.8926, "step": 2266 }, { "epoch": 0.06, "learning_rate": 1.9958640598813556e-06, "loss": 1.0391, "step": 2267 }, { "epoch": 0.06, "learning_rate": 1.9958565143209914e-06, "loss": 0.9883, "step": 2268 }, { "epoch": 0.06, "learning_rate": 1.9958489618981726e-06, "loss": 0.8838, "step": 2269 }, { "epoch": 0.06, "learning_rate": 1.995841402612951e-06, "loss": 0.9658, "step": 2270 }, { "epoch": 0.06, "learning_rate": 1.9958338364653785e-06, "loss": 1.1045, "step": 2271 }, { "epoch": 0.06, "learning_rate": 1.9958262634555077e-06, "loss": 0.8887, "step": 2272 }, { "epoch": 0.06, "learning_rate": 1.995818683583391e-06, "loss": 1.0703, "step": 2273 }, { "epoch": 0.06, "learning_rate": 1.99581109684908e-06, "loss": 0.8525, "step": 2274 }, { "epoch": 0.06, "learning_rate": 1.995803503252627e-06, "loss": 0.9668, "step": 2275 }, { "epoch": 0.06, "learning_rate": 1.9957959027940847e-06, "loss": 1.1445, "step": 2276 }, { "epoch": 0.06, "learning_rate": 1.9957882954735054e-06, "loss": 0.7466, "step": 2277 }, { "epoch": 0.06, "learning_rate": 1.995780681290941e-06, "loss": 1.0049, "step": 2278 }, { "epoch": 0.06, "learning_rate": 1.9957730602464448e-06, "loss": 0.9854, "step": 2279 }, { "epoch": 0.06, "learning_rate": 1.995765432340069e-06, "loss": 1.1113, "step": 2280 }, { "epoch": 0.06, "learning_rate": 1.9957577975718655e-06, "loss": 0.9307, "step": 2281 }, { "epoch": 0.06, "learning_rate": 1.995750155941888e-06, "loss": 0.8398, "step": 2282 }, { "epoch": 0.06, "learning_rate": 1.9957425074501886e-06, "loss": 0.9756, "step": 2283 }, { "epoch": 0.06, "learning_rate": 1.99573485209682e-06, "loss": 0.7549, "step": 2284 }, { "epoch": 0.06, "learning_rate": 1.995727189881835e-06, "loss": 0.8184, "step": 2285 }, { "epoch": 0.06, "learning_rate": 1.995719520805287e-06, "loss": 1.0244, "step": 2286 }, { "epoch": 0.06, "learning_rate": 1.995711844867227e-06, "loss": 1.0615, "step": 2287 }, { "epoch": 0.06, "learning_rate": 1.9957041620677104e-06, "loss": 0.7686, "step": 2288 }, { "epoch": 0.06, "learning_rate": 1.995696472406788e-06, "loss": 1.1123, "step": 2289 }, { "epoch": 0.06, "learning_rate": 1.9956887758845144e-06, "loss": 1.1699, "step": 2290 }, { "epoch": 0.06, "learning_rate": 1.9956810725009414e-06, "loss": 0.698, "step": 2291 }, { "epoch": 0.06, "learning_rate": 1.995673362256123e-06, "loss": 0.9854, "step": 2292 }, { "epoch": 0.06, "learning_rate": 1.995665645150111e-06, "loss": 1.0225, "step": 2293 }, { "epoch": 0.06, "learning_rate": 1.9956579211829603e-06, "loss": 0.9326, "step": 2294 }, { "epoch": 0.06, "learning_rate": 1.9956501903547236e-06, "loss": 0.9395, "step": 2295 }, { "epoch": 0.06, "learning_rate": 1.9956424526654535e-06, "loss": 1.002, "step": 2296 }, { "epoch": 0.06, "learning_rate": 1.995634708115204e-06, "loss": 0.9814, "step": 2297 }, { "epoch": 0.06, "learning_rate": 1.995626956704028e-06, "loss": 0.8896, "step": 2298 }, { "epoch": 0.06, "learning_rate": 1.995619198431979e-06, "loss": 0.9082, "step": 2299 }, { "epoch": 0.06, "learning_rate": 1.995611433299111e-06, "loss": 0.8267, "step": 2300 }, { "epoch": 0.06, "learning_rate": 1.9956036613054766e-06, "loss": 1.1543, "step": 2301 }, { "epoch": 0.06, "learning_rate": 1.9955958824511303e-06, "loss": 1.0537, "step": 2302 }, { "epoch": 0.06, "learning_rate": 1.995588096736125e-06, "loss": 1.0791, "step": 2303 }, { "epoch": 0.06, "learning_rate": 1.9955803041605146e-06, "loss": 0.9893, "step": 2304 }, { "epoch": 0.06, "learning_rate": 1.9955725047243527e-06, "loss": 0.9727, "step": 2305 }, { "epoch": 0.06, "learning_rate": 1.9955646984276933e-06, "loss": 1.0098, "step": 2306 }, { "epoch": 0.06, "learning_rate": 1.9955568852705904e-06, "loss": 0.8047, "step": 2307 }, { "epoch": 0.06, "learning_rate": 1.9955490652530966e-06, "loss": 0.8506, "step": 2308 }, { "epoch": 0.06, "learning_rate": 1.995541238375267e-06, "loss": 0.835, "step": 2309 }, { "epoch": 0.06, "learning_rate": 1.995533404637156e-06, "loss": 1.0127, "step": 2310 }, { "epoch": 0.06, "learning_rate": 1.995525564038816e-06, "loss": 1.0547, "step": 2311 }, { "epoch": 0.06, "learning_rate": 1.995517716580302e-06, "loss": 1.1191, "step": 2312 }, { "epoch": 0.06, "learning_rate": 1.995509862261668e-06, "loss": 1.001, "step": 2313 }, { "epoch": 0.06, "learning_rate": 1.995502001082968e-06, "loss": 0.9307, "step": 2314 }, { "epoch": 0.06, "learning_rate": 1.9954941330442558e-06, "loss": 1.0215, "step": 2315 }, { "epoch": 0.06, "learning_rate": 1.9954862581455864e-06, "loss": 0.9375, "step": 2316 }, { "epoch": 0.06, "learning_rate": 1.9954783763870137e-06, "loss": 0.9443, "step": 2317 }, { "epoch": 0.06, "learning_rate": 1.9954704877685917e-06, "loss": 0.6733, "step": 2318 }, { "epoch": 0.06, "learning_rate": 1.995462592290375e-06, "loss": 0.8398, "step": 2319 }, { "epoch": 0.06, "learning_rate": 1.9954546899524187e-06, "loss": 0.8809, "step": 2320 }, { "epoch": 0.06, "learning_rate": 1.995446780754776e-06, "loss": 0.8125, "step": 2321 }, { "epoch": 0.06, "learning_rate": 1.9954388646975023e-06, "loss": 0.9102, "step": 2322 }, { "epoch": 0.06, "learning_rate": 1.9954309417806517e-06, "loss": 1.0957, "step": 2323 }, { "epoch": 0.06, "learning_rate": 1.995423012004279e-06, "loss": 1.0527, "step": 2324 }, { "epoch": 0.06, "learning_rate": 1.9954150753684387e-06, "loss": 0.8975, "step": 2325 }, { "epoch": 0.06, "learning_rate": 1.995407131873186e-06, "loss": 0.9062, "step": 2326 }, { "epoch": 0.06, "learning_rate": 1.995399181518575e-06, "loss": 0.957, "step": 2327 }, { "epoch": 0.06, "learning_rate": 1.9953912243046607e-06, "loss": 1.1621, "step": 2328 }, { "epoch": 0.06, "learning_rate": 1.9953832602314977e-06, "loss": 0.9873, "step": 2329 }, { "epoch": 0.06, "learning_rate": 1.9953752892991416e-06, "loss": 0.8926, "step": 2330 }, { "epoch": 0.06, "learning_rate": 1.9953673115076464e-06, "loss": 1.1045, "step": 2331 }, { "epoch": 0.06, "learning_rate": 1.995359326857068e-06, "loss": 0.833, "step": 2332 }, { "epoch": 0.06, "learning_rate": 1.9953513353474607e-06, "loss": 1.248, "step": 2333 }, { "epoch": 0.06, "learning_rate": 1.99534333697888e-06, "loss": 0.9287, "step": 2334 }, { "epoch": 0.06, "learning_rate": 1.9953353317513806e-06, "loss": 0.9062, "step": 2335 }, { "epoch": 0.06, "learning_rate": 1.995327319665018e-06, "loss": 0.9199, "step": 2336 }, { "epoch": 0.06, "learning_rate": 1.9953193007198475e-06, "loss": 1.2217, "step": 2337 }, { "epoch": 0.06, "learning_rate": 1.9953112749159236e-06, "loss": 0.999, "step": 2338 }, { "epoch": 0.06, "learning_rate": 1.995303242253303e-06, "loss": 0.8936, "step": 2339 }, { "epoch": 0.06, "learning_rate": 1.9952952027320397e-06, "loss": 1.0186, "step": 2340 }, { "epoch": 0.06, "learning_rate": 1.9952871563521897e-06, "loss": 1.043, "step": 2341 }, { "epoch": 0.06, "learning_rate": 1.9952791031138085e-06, "loss": 0.8491, "step": 2342 }, { "epoch": 0.06, "learning_rate": 1.9952710430169515e-06, "loss": 1.1406, "step": 2343 }, { "epoch": 0.06, "learning_rate": 1.9952629760616743e-06, "loss": 1.1162, "step": 2344 }, { "epoch": 0.06, "learning_rate": 1.9952549022480323e-06, "loss": 0.917, "step": 2345 }, { "epoch": 0.06, "learning_rate": 1.995246821576081e-06, "loss": 1.0137, "step": 2346 }, { "epoch": 0.06, "learning_rate": 1.995238734045877e-06, "loss": 0.8096, "step": 2347 }, { "epoch": 0.06, "learning_rate": 1.995230639657475e-06, "loss": 0.7749, "step": 2348 }, { "epoch": 0.06, "learning_rate": 1.995222538410931e-06, "loss": 1.0176, "step": 2349 }, { "epoch": 0.06, "learning_rate": 1.995214430306301e-06, "loss": 0.8799, "step": 2350 }, { "epoch": 0.06, "learning_rate": 1.995206315343641e-06, "loss": 0.9961, "step": 2351 }, { "epoch": 0.06, "learning_rate": 1.9951981935230065e-06, "loss": 0.791, "step": 2352 }, { "epoch": 0.06, "learning_rate": 1.9951900648444537e-06, "loss": 1.0195, "step": 2353 }, { "epoch": 0.06, "learning_rate": 1.995181929308039e-06, "loss": 0.6948, "step": 2354 }, { "epoch": 0.06, "learning_rate": 1.995173786913818e-06, "loss": 1.0361, "step": 2355 }, { "epoch": 0.06, "learning_rate": 1.9951656376618467e-06, "loss": 0.8799, "step": 2356 }, { "epoch": 0.06, "learning_rate": 1.995157481552182e-06, "loss": 0.6646, "step": 2357 }, { "epoch": 0.06, "learning_rate": 1.995149318584879e-06, "loss": 0.9277, "step": 2358 }, { "epoch": 0.06, "learning_rate": 1.9951411487599947e-06, "loss": 0.96, "step": 2359 }, { "epoch": 0.06, "learning_rate": 1.995132972077585e-06, "loss": 0.9971, "step": 2360 }, { "epoch": 0.06, "learning_rate": 1.995124788537707e-06, "loss": 0.9961, "step": 2361 }, { "epoch": 0.06, "learning_rate": 1.9951165981404165e-06, "loss": 1.1084, "step": 2362 }, { "epoch": 0.06, "learning_rate": 1.9951084008857696e-06, "loss": 0.7422, "step": 2363 }, { "epoch": 0.06, "learning_rate": 1.9951001967738235e-06, "loss": 1.248, "step": 2364 }, { "epoch": 0.06, "learning_rate": 1.995091985804634e-06, "loss": 0.9854, "step": 2365 }, { "epoch": 0.06, "learning_rate": 1.995083767978259e-06, "loss": 1.085, "step": 2366 }, { "epoch": 0.06, "learning_rate": 1.9950755432947536e-06, "loss": 1.1084, "step": 2367 }, { "epoch": 0.06, "learning_rate": 1.995067311754175e-06, "loss": 0.9932, "step": 2368 }, { "epoch": 0.06, "learning_rate": 1.9950590733565804e-06, "loss": 1.1162, "step": 2369 }, { "epoch": 0.06, "learning_rate": 1.995050828102026e-06, "loss": 1.0127, "step": 2370 }, { "epoch": 0.06, "learning_rate": 1.995042575990569e-06, "loss": 0.7891, "step": 2371 }, { "epoch": 0.06, "learning_rate": 1.9950343170222658e-06, "loss": 0.9844, "step": 2372 }, { "epoch": 0.06, "learning_rate": 1.9950260511971737e-06, "loss": 1.1143, "step": 2373 }, { "epoch": 0.06, "learning_rate": 1.9950177785153495e-06, "loss": 1.0068, "step": 2374 }, { "epoch": 0.06, "learning_rate": 1.995009498976851e-06, "loss": 1.1152, "step": 2375 }, { "epoch": 0.06, "learning_rate": 1.995001212581734e-06, "loss": 0.9595, "step": 2376 }, { "epoch": 0.06, "learning_rate": 1.9949929193300555e-06, "loss": 0.9932, "step": 2377 }, { "epoch": 0.06, "learning_rate": 1.994984619221874e-06, "loss": 0.9434, "step": 2378 }, { "epoch": 0.06, "learning_rate": 1.994976312257246e-06, "loss": 1.0889, "step": 2379 }, { "epoch": 0.06, "learning_rate": 1.994967998436228e-06, "loss": 0.9785, "step": 2380 }, { "epoch": 0.06, "learning_rate": 1.994959677758879e-06, "loss": 1.1016, "step": 2381 }, { "epoch": 0.06, "learning_rate": 1.9949513502252547e-06, "loss": 0.9922, "step": 2382 }, { "epoch": 0.06, "learning_rate": 1.9949430158354134e-06, "loss": 0.8086, "step": 2383 }, { "epoch": 0.06, "learning_rate": 1.994934674589412e-06, "loss": 1.002, "step": 2384 }, { "epoch": 0.06, "learning_rate": 1.994926326487309e-06, "loss": 0.894, "step": 2385 }, { "epoch": 0.06, "learning_rate": 1.9949179715291604e-06, "loss": 0.8369, "step": 2386 }, { "epoch": 0.06, "learning_rate": 1.9949096097150243e-06, "loss": 1.0791, "step": 2387 }, { "epoch": 0.06, "learning_rate": 1.994901241044959e-06, "loss": 0.998, "step": 2388 }, { "epoch": 0.06, "learning_rate": 1.994892865519022e-06, "loss": 0.8984, "step": 2389 }, { "epoch": 0.06, "learning_rate": 1.9948844831372705e-06, "loss": 0.9697, "step": 2390 }, { "epoch": 0.06, "learning_rate": 1.994876093899762e-06, "loss": 0.9067, "step": 2391 }, { "epoch": 0.06, "learning_rate": 1.9948676978065556e-06, "loss": 1.0605, "step": 2392 }, { "epoch": 0.06, "learning_rate": 1.994859294857708e-06, "loss": 1.002, "step": 2393 }, { "epoch": 0.06, "learning_rate": 1.9948508850532777e-06, "loss": 1.1035, "step": 2394 }, { "epoch": 0.06, "learning_rate": 1.994842468393322e-06, "loss": 0.8354, "step": 2395 }, { "epoch": 0.06, "learning_rate": 1.9948340448779e-06, "loss": 0.9199, "step": 2396 }, { "epoch": 0.06, "learning_rate": 1.9948256145070685e-06, "loss": 0.9971, "step": 2397 }, { "epoch": 0.06, "learning_rate": 1.9948171772808866e-06, "loss": 1.1768, "step": 2398 }, { "epoch": 0.06, "learning_rate": 1.9948087331994116e-06, "loss": 1.1006, "step": 2399 }, { "epoch": 0.06, "learning_rate": 1.9948002822627025e-06, "loss": 1.0352, "step": 2400 }, { "epoch": 0.06, "learning_rate": 1.994791824470817e-06, "loss": 0.9961, "step": 2401 }, { "epoch": 0.06, "learning_rate": 1.9947833598238135e-06, "loss": 0.9492, "step": 2402 }, { "epoch": 0.06, "learning_rate": 1.99477488832175e-06, "loss": 0.6167, "step": 2403 }, { "epoch": 0.06, "learning_rate": 1.9947664099646858e-06, "loss": 0.9932, "step": 2404 }, { "epoch": 0.06, "learning_rate": 1.9947579247526783e-06, "loss": 0.9785, "step": 2405 }, { "epoch": 0.06, "learning_rate": 1.9947494326857866e-06, "loss": 1.0459, "step": 2406 }, { "epoch": 0.06, "learning_rate": 1.9947409337640693e-06, "loss": 0.9824, "step": 2407 }, { "epoch": 0.06, "learning_rate": 1.9947324279875842e-06, "loss": 0.957, "step": 2408 }, { "epoch": 0.06, "learning_rate": 1.994723915356391e-06, "loss": 0.9336, "step": 2409 }, { "epoch": 0.06, "learning_rate": 1.9947153958705476e-06, "loss": 1.2168, "step": 2410 }, { "epoch": 0.06, "learning_rate": 1.9947068695301126e-06, "loss": 1.0107, "step": 2411 }, { "epoch": 0.06, "learning_rate": 1.994698336335145e-06, "loss": 0.9209, "step": 2412 }, { "epoch": 0.06, "learning_rate": 1.994689796285704e-06, "loss": 1.1143, "step": 2413 }, { "epoch": 0.06, "learning_rate": 1.994681249381848e-06, "loss": 1.2363, "step": 2414 }, { "epoch": 0.06, "learning_rate": 1.9946726956236364e-06, "loss": 0.7778, "step": 2415 }, { "epoch": 0.06, "learning_rate": 1.9946641350111272e-06, "loss": 1.0508, "step": 2416 }, { "epoch": 0.06, "learning_rate": 1.99465556754438e-06, "loss": 0.9121, "step": 2417 }, { "epoch": 0.06, "learning_rate": 1.994646993223454e-06, "loss": 0.876, "step": 2418 }, { "epoch": 0.06, "learning_rate": 1.994638412048408e-06, "loss": 1.0195, "step": 2419 }, { "epoch": 0.06, "learning_rate": 1.994629824019301e-06, "loss": 1.0898, "step": 2420 }, { "epoch": 0.06, "learning_rate": 1.994621229136192e-06, "loss": 1.0039, "step": 2421 }, { "epoch": 0.06, "learning_rate": 1.9946126273991415e-06, "loss": 0.5532, "step": 2422 }, { "epoch": 0.06, "learning_rate": 1.994604018808207e-06, "loss": 1.0195, "step": 2423 }, { "epoch": 0.06, "learning_rate": 1.9945954033634494e-06, "loss": 0.9448, "step": 2424 }, { "epoch": 0.06, "learning_rate": 1.994586781064927e-06, "loss": 0.707, "step": 2425 }, { "epoch": 0.06, "learning_rate": 1.9945781519127e-06, "loss": 0.9785, "step": 2426 }, { "epoch": 0.06, "learning_rate": 1.9945695159068267e-06, "loss": 1.0322, "step": 2427 }, { "epoch": 0.06, "learning_rate": 1.994560873047368e-06, "loss": 0.9736, "step": 2428 }, { "epoch": 0.06, "learning_rate": 1.9945522233343827e-06, "loss": 1.0117, "step": 2429 }, { "epoch": 0.06, "learning_rate": 1.9945435667679302e-06, "loss": 0.9004, "step": 2430 }, { "epoch": 0.06, "learning_rate": 1.9945349033480706e-06, "loss": 1.043, "step": 2431 }, { "epoch": 0.06, "learning_rate": 1.994526233074863e-06, "loss": 0.9102, "step": 2432 }, { "epoch": 0.06, "learning_rate": 1.9945175559483685e-06, "loss": 0.9858, "step": 2433 }, { "epoch": 0.06, "learning_rate": 1.994508871968646e-06, "loss": 1.1143, "step": 2434 }, { "epoch": 0.06, "learning_rate": 1.9945001811357547e-06, "loss": 1.0098, "step": 2435 }, { "epoch": 0.06, "learning_rate": 1.9944914834497557e-06, "loss": 0.8867, "step": 2436 }, { "epoch": 0.06, "learning_rate": 1.994482778910708e-06, "loss": 1.0176, "step": 2437 }, { "epoch": 0.06, "learning_rate": 1.994474067518672e-06, "loss": 1.0547, "step": 2438 }, { "epoch": 0.06, "learning_rate": 1.9944653492737074e-06, "loss": 1.25, "step": 2439 }, { "epoch": 0.06, "learning_rate": 1.9944566241758753e-06, "loss": 0.915, "step": 2440 }, { "epoch": 0.06, "learning_rate": 1.9944478922252345e-06, "loss": 0.8887, "step": 2441 }, { "epoch": 0.06, "learning_rate": 1.994439153421846e-06, "loss": 1.0244, "step": 2442 }, { "epoch": 0.06, "learning_rate": 1.99443040776577e-06, "loss": 0.8955, "step": 2443 }, { "epoch": 0.06, "learning_rate": 1.9944216552570663e-06, "loss": 0.9277, "step": 2444 }, { "epoch": 0.06, "learning_rate": 1.994412895895795e-06, "loss": 0.874, "step": 2445 }, { "epoch": 0.06, "learning_rate": 1.9944041296820178e-06, "loss": 1.0215, "step": 2446 }, { "epoch": 0.06, "learning_rate": 1.994395356615794e-06, "loss": 1.0742, "step": 2447 }, { "epoch": 0.06, "learning_rate": 1.994386576697184e-06, "loss": 0.8887, "step": 2448 }, { "epoch": 0.06, "learning_rate": 1.9943777899262484e-06, "loss": 0.8193, "step": 2449 }, { "epoch": 0.06, "learning_rate": 1.994368996303048e-06, "loss": 0.9482, "step": 2450 }, { "epoch": 0.06, "learning_rate": 1.9943601958276436e-06, "loss": 0.7939, "step": 2451 }, { "epoch": 0.06, "learning_rate": 1.9943513885000956e-06, "loss": 0.9443, "step": 2452 }, { "epoch": 0.06, "learning_rate": 1.994342574320465e-06, "loss": 0.8525, "step": 2453 }, { "epoch": 0.06, "learning_rate": 1.9943337532888116e-06, "loss": 1.1572, "step": 2454 }, { "epoch": 0.06, "learning_rate": 1.994324925405197e-06, "loss": 1.085, "step": 2455 }, { "epoch": 0.06, "learning_rate": 1.994316090669682e-06, "loss": 0.8604, "step": 2456 }, { "epoch": 0.06, "learning_rate": 1.994307249082327e-06, "loss": 0.8896, "step": 2457 }, { "epoch": 0.06, "learning_rate": 1.9942984006431934e-06, "loss": 0.7378, "step": 2458 }, { "epoch": 0.06, "learning_rate": 1.994289545352342e-06, "loss": 1.0439, "step": 2459 }, { "epoch": 0.06, "learning_rate": 1.994280683209834e-06, "loss": 0.9248, "step": 2460 }, { "epoch": 0.06, "learning_rate": 1.99427181421573e-06, "loss": 0.8896, "step": 2461 }, { "epoch": 0.06, "learning_rate": 1.9942629383700917e-06, "loss": 1.2637, "step": 2462 }, { "epoch": 0.06, "learning_rate": 1.9942540556729795e-06, "loss": 1.0723, "step": 2463 }, { "epoch": 0.06, "learning_rate": 1.994245166124456e-06, "loss": 1.0732, "step": 2464 }, { "epoch": 0.06, "learning_rate": 1.9942362697245804e-06, "loss": 0.7988, "step": 2465 }, { "epoch": 0.06, "learning_rate": 1.994227366473416e-06, "loss": 0.9678, "step": 2466 }, { "epoch": 0.06, "learning_rate": 1.994218456371023e-06, "loss": 0.895, "step": 2467 }, { "epoch": 0.06, "learning_rate": 1.994209539417463e-06, "loss": 0.9727, "step": 2468 }, { "epoch": 0.06, "learning_rate": 1.9942006156127975e-06, "loss": 0.998, "step": 2469 }, { "epoch": 0.06, "learning_rate": 1.9941916849570886e-06, "loss": 1.1523, "step": 2470 }, { "epoch": 0.06, "learning_rate": 1.9941827474503967e-06, "loss": 0.9863, "step": 2471 }, { "epoch": 0.06, "learning_rate": 1.9941738030927843e-06, "loss": 1.0078, "step": 2472 }, { "epoch": 0.06, "learning_rate": 1.9941648518843125e-06, "loss": 1.1377, "step": 2473 }, { "epoch": 0.06, "learning_rate": 1.9941558938250434e-06, "loss": 1.0957, "step": 2474 }, { "epoch": 0.06, "learning_rate": 1.9941469289150383e-06, "loss": 1.0459, "step": 2475 }, { "epoch": 0.06, "learning_rate": 1.9941379571543595e-06, "loss": 0.9922, "step": 2476 }, { "epoch": 0.06, "learning_rate": 1.9941289785430684e-06, "loss": 1.0039, "step": 2477 }, { "epoch": 0.06, "learning_rate": 1.9941199930812267e-06, "loss": 0.9248, "step": 2478 }, { "epoch": 0.06, "learning_rate": 1.994111000768897e-06, "loss": 1.1348, "step": 2479 }, { "epoch": 0.06, "learning_rate": 1.994102001606141e-06, "loss": 0.9609, "step": 2480 }, { "epoch": 0.06, "learning_rate": 1.9940929955930203e-06, "loss": 0.8936, "step": 2481 }, { "epoch": 0.06, "learning_rate": 1.9940839827295976e-06, "loss": 0.8867, "step": 2482 }, { "epoch": 0.06, "learning_rate": 1.994074963015934e-06, "loss": 0.9521, "step": 2483 }, { "epoch": 0.06, "learning_rate": 1.994065936452093e-06, "loss": 1.0039, "step": 2484 }, { "epoch": 0.06, "learning_rate": 1.9940569030381357e-06, "loss": 0.8413, "step": 2485 }, { "epoch": 0.06, "learning_rate": 1.9940478627741247e-06, "loss": 0.8691, "step": 2486 }, { "epoch": 0.06, "learning_rate": 1.9940388156601226e-06, "loss": 0.9961, "step": 2487 }, { "epoch": 0.06, "learning_rate": 1.9940297616961918e-06, "loss": 0.9375, "step": 2488 }, { "epoch": 0.06, "learning_rate": 1.994020700882394e-06, "loss": 1.0498, "step": 2489 }, { "epoch": 0.06, "learning_rate": 1.994011633218792e-06, "loss": 1.123, "step": 2490 }, { "epoch": 0.06, "learning_rate": 1.9940025587054485e-06, "loss": 0.8787, "step": 2491 }, { "epoch": 0.06, "learning_rate": 1.993993477342426e-06, "loss": 0.6821, "step": 2492 }, { "epoch": 0.06, "learning_rate": 1.9939843891297865e-06, "loss": 0.8354, "step": 2493 }, { "epoch": 0.06, "learning_rate": 1.9939752940675935e-06, "loss": 0.918, "step": 2494 }, { "epoch": 0.06, "learning_rate": 1.993966192155909e-06, "loss": 0.9932, "step": 2495 }, { "epoch": 0.06, "learning_rate": 1.993957083394796e-06, "loss": 0.8574, "step": 2496 }, { "epoch": 0.06, "learning_rate": 1.9939479677843175e-06, "loss": 0.833, "step": 2497 }, { "epoch": 0.06, "learning_rate": 1.9939388453245355e-06, "loss": 0.9707, "step": 2498 }, { "epoch": 0.06, "learning_rate": 1.993929716015514e-06, "loss": 1.0742, "step": 2499 }, { "epoch": 0.06, "learning_rate": 1.993920579857315e-06, "loss": 0.854, "step": 2500 }, { "epoch": 0.06, "learning_rate": 1.9939114368500014e-06, "loss": 0.8633, "step": 2501 }, { "epoch": 0.06, "learning_rate": 1.993902286993637e-06, "loss": 1.1475, "step": 2502 }, { "epoch": 0.06, "learning_rate": 1.9938931302882846e-06, "loss": 0.9365, "step": 2503 }, { "epoch": 0.06, "learning_rate": 1.993883966734007e-06, "loss": 1.1084, "step": 2504 }, { "epoch": 0.06, "learning_rate": 1.9938747963308677e-06, "loss": 1.1514, "step": 2505 }, { "epoch": 0.06, "learning_rate": 1.993865619078929e-06, "loss": 0.8496, "step": 2506 }, { "epoch": 0.06, "learning_rate": 1.9938564349782555e-06, "loss": 0.9902, "step": 2507 }, { "epoch": 0.06, "learning_rate": 1.9938472440289094e-06, "loss": 1.0654, "step": 2508 }, { "epoch": 0.06, "learning_rate": 1.9938380462309546e-06, "loss": 0.9268, "step": 2509 }, { "epoch": 0.06, "learning_rate": 1.993828841584454e-06, "loss": 0.7979, "step": 2510 }, { "epoch": 0.06, "learning_rate": 1.993819630089472e-06, "loss": 0.9834, "step": 2511 }, { "epoch": 0.06, "learning_rate": 1.993810411746071e-06, "loss": 0.8584, "step": 2512 }, { "epoch": 0.06, "learning_rate": 1.993801186554315e-06, "loss": 0.917, "step": 2513 }, { "epoch": 0.06, "learning_rate": 1.9937919545142673e-06, "loss": 1.0713, "step": 2514 }, { "epoch": 0.06, "learning_rate": 1.993782715625992e-06, "loss": 0.9795, "step": 2515 }, { "epoch": 0.06, "learning_rate": 1.9937734698895524e-06, "loss": 1.0176, "step": 2516 }, { "epoch": 0.06, "learning_rate": 1.9937642173050123e-06, "loss": 1.0273, "step": 2517 }, { "epoch": 0.06, "learning_rate": 1.9937549578724357e-06, "loss": 0.8877, "step": 2518 }, { "epoch": 0.06, "learning_rate": 1.9937456915918858e-06, "loss": 0.9473, "step": 2519 }, { "epoch": 0.06, "learning_rate": 1.9937364184634272e-06, "loss": 0.79, "step": 2520 }, { "epoch": 0.06, "learning_rate": 1.993727138487123e-06, "loss": 1.0098, "step": 2521 }, { "epoch": 0.06, "learning_rate": 1.993717851663038e-06, "loss": 0.8105, "step": 2522 }, { "epoch": 0.06, "learning_rate": 1.9937085579912357e-06, "loss": 1.1084, "step": 2523 }, { "epoch": 0.06, "learning_rate": 1.99369925747178e-06, "loss": 1.0166, "step": 2524 }, { "epoch": 0.06, "learning_rate": 1.9936899501047354e-06, "loss": 0.9844, "step": 2525 }, { "epoch": 0.06, "learning_rate": 1.993680635890166e-06, "loss": 0.9639, "step": 2526 }, { "epoch": 0.06, "learning_rate": 1.9936713148281356e-06, "loss": 1.0537, "step": 2527 }, { "epoch": 0.06, "learning_rate": 1.9936619869187085e-06, "loss": 0.9824, "step": 2528 }, { "epoch": 0.06, "learning_rate": 1.993652652161949e-06, "loss": 0.9834, "step": 2529 }, { "epoch": 0.06, "learning_rate": 1.993643310557922e-06, "loss": 0.8809, "step": 2530 }, { "epoch": 0.06, "learning_rate": 1.9936339621066914e-06, "loss": 0.9199, "step": 2531 }, { "epoch": 0.06, "learning_rate": 1.993624606808322e-06, "loss": 0.9561, "step": 2532 }, { "epoch": 0.06, "learning_rate": 1.993615244662877e-06, "loss": 0.9805, "step": 2533 }, { "epoch": 0.06, "learning_rate": 1.9936058756704224e-06, "loss": 0.9199, "step": 2534 }, { "epoch": 0.06, "learning_rate": 1.9935964998310223e-06, "loss": 1.0049, "step": 2535 }, { "epoch": 0.06, "learning_rate": 1.993587117144741e-06, "loss": 0.6753, "step": 2536 }, { "epoch": 0.07, "learning_rate": 1.9935777276116434e-06, "loss": 1.0479, "step": 2537 }, { "epoch": 0.07, "learning_rate": 1.9935683312317942e-06, "loss": 1.125, "step": 2538 }, { "epoch": 0.07, "learning_rate": 1.9935589280052583e-06, "loss": 0.874, "step": 2539 }, { "epoch": 0.07, "learning_rate": 1.9935495179321e-06, "loss": 1.0654, "step": 2540 }, { "epoch": 0.07, "learning_rate": 1.993540101012385e-06, "loss": 0.874, "step": 2541 }, { "epoch": 0.07, "learning_rate": 1.9935306772461773e-06, "loss": 0.9121, "step": 2542 }, { "epoch": 0.07, "learning_rate": 1.993521246633542e-06, "loss": 0.8154, "step": 2543 }, { "epoch": 0.07, "learning_rate": 1.9935118091745443e-06, "loss": 0.9971, "step": 2544 }, { "epoch": 0.07, "learning_rate": 1.9935023648692495e-06, "loss": 0.7935, "step": 2545 }, { "epoch": 0.07, "learning_rate": 1.9934929137177224e-06, "loss": 1.001, "step": 2546 }, { "epoch": 0.07, "learning_rate": 1.9934834557200283e-06, "loss": 0.9414, "step": 2547 }, { "epoch": 0.07, "learning_rate": 1.993473990876232e-06, "loss": 0.959, "step": 2548 }, { "epoch": 0.07, "learning_rate": 1.9934645191863987e-06, "loss": 0.8457, "step": 2549 }, { "epoch": 0.07, "learning_rate": 1.9934550406505937e-06, "loss": 0.9072, "step": 2550 }, { "epoch": 0.07, "learning_rate": 1.993445555268883e-06, "loss": 1.0381, "step": 2551 }, { "epoch": 0.07, "learning_rate": 1.9934360630413313e-06, "loss": 0.9355, "step": 2552 }, { "epoch": 0.07, "learning_rate": 1.9934265639680042e-06, "loss": 1.0068, "step": 2553 }, { "epoch": 0.07, "learning_rate": 1.9934170580489675e-06, "loss": 1.0029, "step": 2554 }, { "epoch": 0.07, "learning_rate": 1.993407545284286e-06, "loss": 0.9121, "step": 2555 }, { "epoch": 0.07, "learning_rate": 1.9933980256740254e-06, "loss": 0.8259, "step": 2556 }, { "epoch": 0.07, "learning_rate": 1.9933884992182517e-06, "loss": 0.917, "step": 2557 }, { "epoch": 0.07, "learning_rate": 1.9933789659170306e-06, "loss": 1.0059, "step": 2558 }, { "epoch": 0.07, "learning_rate": 1.993369425770427e-06, "loss": 1.2354, "step": 2559 }, { "epoch": 0.07, "learning_rate": 1.9933598787785073e-06, "loss": 0.9912, "step": 2560 }, { "epoch": 0.07, "learning_rate": 1.993350324941338e-06, "loss": 0.8223, "step": 2561 }, { "epoch": 0.07, "learning_rate": 1.993340764258983e-06, "loss": 0.9639, "step": 2562 }, { "epoch": 0.07, "learning_rate": 1.9933311967315096e-06, "loss": 0.9717, "step": 2563 }, { "epoch": 0.07, "learning_rate": 1.993321622358984e-06, "loss": 0.9365, "step": 2564 }, { "epoch": 0.07, "learning_rate": 1.993312041141471e-06, "loss": 0.77, "step": 2565 }, { "epoch": 0.07, "learning_rate": 1.9933024530790374e-06, "loss": 1.1982, "step": 2566 }, { "epoch": 0.07, "learning_rate": 1.993292858171749e-06, "loss": 0.9932, "step": 2567 }, { "epoch": 0.07, "learning_rate": 1.993283256419672e-06, "loss": 0.998, "step": 2568 }, { "epoch": 0.07, "learning_rate": 1.993273647822873e-06, "loss": 1.0049, "step": 2569 }, { "epoch": 0.07, "learning_rate": 1.9932640323814173e-06, "loss": 1.1357, "step": 2570 }, { "epoch": 0.07, "learning_rate": 1.9932544100953717e-06, "loss": 1.0, "step": 2571 }, { "epoch": 0.07, "learning_rate": 1.9932447809648028e-06, "loss": 1.1094, "step": 2572 }, { "epoch": 0.07, "learning_rate": 1.9932351449897765e-06, "loss": 1.1562, "step": 2573 }, { "epoch": 0.07, "learning_rate": 1.993225502170359e-06, "loss": 0.6772, "step": 2574 }, { "epoch": 0.07, "learning_rate": 1.9932158525066173e-06, "loss": 1.085, "step": 2575 }, { "epoch": 0.07, "learning_rate": 1.9932061959986175e-06, "loss": 1.2236, "step": 2576 }, { "epoch": 0.07, "learning_rate": 1.9931965326464263e-06, "loss": 0.8228, "step": 2577 }, { "epoch": 0.07, "learning_rate": 1.9931868624501106e-06, "loss": 1.0332, "step": 2578 }, { "epoch": 0.07, "learning_rate": 1.9931771854097365e-06, "loss": 1.0264, "step": 2579 }, { "epoch": 0.07, "learning_rate": 1.993167501525371e-06, "loss": 0.9141, "step": 2580 }, { "epoch": 0.07, "learning_rate": 1.9931578107970808e-06, "loss": 1.0713, "step": 2581 }, { "epoch": 0.07, "learning_rate": 1.9931481132249325e-06, "loss": 0.999, "step": 2582 }, { "epoch": 0.07, "learning_rate": 1.9931384088089927e-06, "loss": 0.9131, "step": 2583 }, { "epoch": 0.07, "learning_rate": 1.9931286975493295e-06, "loss": 1.0488, "step": 2584 }, { "epoch": 0.07, "learning_rate": 1.993118979446008e-06, "loss": 1.0127, "step": 2585 }, { "epoch": 0.07, "learning_rate": 1.9931092544990967e-06, "loss": 0.9746, "step": 2586 }, { "epoch": 0.07, "learning_rate": 1.993099522708662e-06, "loss": 0.9346, "step": 2587 }, { "epoch": 0.07, "learning_rate": 1.993089784074771e-06, "loss": 1.0518, "step": 2588 }, { "epoch": 0.07, "learning_rate": 1.9930800385974905e-06, "loss": 0.9082, "step": 2589 }, { "epoch": 0.07, "learning_rate": 1.993070286276888e-06, "loss": 0.874, "step": 2590 }, { "epoch": 0.07, "learning_rate": 1.9930605271130307e-06, "loss": 0.791, "step": 2591 }, { "epoch": 0.07, "learning_rate": 1.993050761105986e-06, "loss": 0.8486, "step": 2592 }, { "epoch": 0.07, "learning_rate": 1.9930409882558207e-06, "loss": 1.2598, "step": 2593 }, { "epoch": 0.07, "learning_rate": 1.9930312085626026e-06, "loss": 0.9111, "step": 2594 }, { "epoch": 0.07, "learning_rate": 1.993021422026399e-06, "loss": 0.6909, "step": 2595 }, { "epoch": 0.07, "learning_rate": 1.9930116286472772e-06, "loss": 0.9863, "step": 2596 }, { "epoch": 0.07, "learning_rate": 1.9930018284253046e-06, "loss": 0.9404, "step": 2597 }, { "epoch": 0.07, "learning_rate": 1.9929920213605493e-06, "loss": 0.9746, "step": 2598 }, { "epoch": 0.07, "learning_rate": 1.992982207453078e-06, "loss": 1.0322, "step": 2599 }, { "epoch": 0.07, "learning_rate": 1.9929723867029592e-06, "loss": 1.0596, "step": 2600 }, { "epoch": 0.07, "learning_rate": 1.99296255911026e-06, "loss": 1.0146, "step": 2601 }, { "epoch": 0.07, "learning_rate": 1.9929527246750487e-06, "loss": 0.9619, "step": 2602 }, { "epoch": 0.07, "learning_rate": 1.992942883397392e-06, "loss": 1.0068, "step": 2603 }, { "epoch": 0.07, "learning_rate": 1.992933035277359e-06, "loss": 1.0747, "step": 2604 }, { "epoch": 0.07, "learning_rate": 1.992923180315017e-06, "loss": 1.0303, "step": 2605 }, { "epoch": 0.07, "learning_rate": 1.9929133185104333e-06, "loss": 0.8574, "step": 2606 }, { "epoch": 0.07, "learning_rate": 1.9929034498636764e-06, "loss": 1.0771, "step": 2607 }, { "epoch": 0.07, "learning_rate": 1.992893574374815e-06, "loss": 1.0488, "step": 2608 }, { "epoch": 0.07, "learning_rate": 1.992883692043916e-06, "loss": 0.8262, "step": 2609 }, { "epoch": 0.07, "learning_rate": 1.992873802871048e-06, "loss": 0.8408, "step": 2610 }, { "epoch": 0.07, "learning_rate": 1.9928639068562793e-06, "loss": 0.9258, "step": 2611 }, { "epoch": 0.07, "learning_rate": 1.9928540039996777e-06, "loss": 0.6797, "step": 2612 }, { "epoch": 0.07, "learning_rate": 1.992844094301312e-06, "loss": 0.7793, "step": 2613 }, { "epoch": 0.07, "learning_rate": 1.9928341777612497e-06, "loss": 1.0381, "step": 2614 }, { "epoch": 0.07, "learning_rate": 1.9928242543795596e-06, "loss": 1.0342, "step": 2615 }, { "epoch": 0.07, "learning_rate": 1.9928143241563103e-06, "loss": 1.0, "step": 2616 }, { "epoch": 0.07, "learning_rate": 1.99280438709157e-06, "loss": 0.9092, "step": 2617 }, { "epoch": 0.07, "learning_rate": 1.992794443185407e-06, "loss": 0.9019, "step": 2618 }, { "epoch": 0.07, "learning_rate": 1.99278449243789e-06, "loss": 0.8799, "step": 2619 }, { "epoch": 0.07, "learning_rate": 1.992774534849088e-06, "loss": 0.998, "step": 2620 }, { "epoch": 0.07, "learning_rate": 1.992764570419069e-06, "loss": 1.001, "step": 2621 }, { "epoch": 0.07, "learning_rate": 1.9927545991479016e-06, "loss": 0.9893, "step": 2622 }, { "epoch": 0.07, "learning_rate": 1.9927446210356546e-06, "loss": 1.0596, "step": 2623 }, { "epoch": 0.07, "learning_rate": 1.9927346360823975e-06, "loss": 0.9316, "step": 2624 }, { "epoch": 0.07, "learning_rate": 1.992724644288198e-06, "loss": 1.0391, "step": 2625 }, { "epoch": 0.07, "learning_rate": 1.9927146456531256e-06, "loss": 0.752, "step": 2626 }, { "epoch": 0.07, "learning_rate": 1.992704640177249e-06, "loss": 0.9053, "step": 2627 }, { "epoch": 0.07, "learning_rate": 1.9926946278606372e-06, "loss": 0.8521, "step": 2628 }, { "epoch": 0.07, "learning_rate": 1.9926846087033597e-06, "loss": 0.5986, "step": 2629 }, { "epoch": 0.07, "learning_rate": 1.9926745827054848e-06, "loss": 0.8047, "step": 2630 }, { "epoch": 0.07, "learning_rate": 1.992664549867082e-06, "loss": 0.5306, "step": 2631 }, { "epoch": 0.07, "learning_rate": 1.99265451018822e-06, "loss": 0.918, "step": 2632 }, { "epoch": 0.07, "learning_rate": 1.9926444636689682e-06, "loss": 0.9893, "step": 2633 }, { "epoch": 0.07, "learning_rate": 1.992634410309396e-06, "loss": 1.1016, "step": 2634 }, { "epoch": 0.07, "learning_rate": 1.992624350109573e-06, "loss": 0.8965, "step": 2635 }, { "epoch": 0.07, "learning_rate": 1.9926142830695677e-06, "loss": 1.0635, "step": 2636 }, { "epoch": 0.07, "learning_rate": 1.9926042091894496e-06, "loss": 0.9795, "step": 2637 }, { "epoch": 0.07, "learning_rate": 1.992594128469289e-06, "loss": 0.9688, "step": 2638 }, { "epoch": 0.07, "learning_rate": 1.9925840409091542e-06, "loss": 0.9688, "step": 2639 }, { "epoch": 0.07, "learning_rate": 1.9925739465091154e-06, "loss": 0.5957, "step": 2640 }, { "epoch": 0.07, "learning_rate": 1.9925638452692428e-06, "loss": 1.0, "step": 2641 }, { "epoch": 0.07, "learning_rate": 1.9925537371896045e-06, "loss": 1.0049, "step": 2642 }, { "epoch": 0.07, "learning_rate": 1.992543622270271e-06, "loss": 0.9336, "step": 2643 }, { "epoch": 0.07, "learning_rate": 1.992533500511312e-06, "loss": 1.0234, "step": 2644 }, { "epoch": 0.07, "learning_rate": 1.9925233719127967e-06, "loss": 1.1602, "step": 2645 }, { "epoch": 0.07, "learning_rate": 1.992513236474796e-06, "loss": 1.0117, "step": 2646 }, { "epoch": 0.07, "learning_rate": 1.992503094197379e-06, "loss": 0.8652, "step": 2647 }, { "epoch": 0.07, "learning_rate": 1.992492945080615e-06, "loss": 0.8965, "step": 2648 }, { "epoch": 0.07, "learning_rate": 1.992482789124576e-06, "loss": 1.082, "step": 2649 }, { "epoch": 0.07, "learning_rate": 1.9924726263293294e-06, "loss": 0.8281, "step": 2650 }, { "epoch": 0.07, "learning_rate": 1.9924624566949467e-06, "loss": 1.0605, "step": 2651 }, { "epoch": 0.07, "learning_rate": 1.992452280221498e-06, "loss": 1.0293, "step": 2652 }, { "epoch": 0.07, "learning_rate": 1.9924420969090527e-06, "loss": 0.8633, "step": 2653 }, { "epoch": 0.07, "learning_rate": 1.9924319067576817e-06, "loss": 0.7598, "step": 2654 }, { "epoch": 0.07, "learning_rate": 1.9924217097674547e-06, "loss": 0.7446, "step": 2655 }, { "epoch": 0.07, "learning_rate": 1.9924115059384425e-06, "loss": 1.1201, "step": 2656 }, { "epoch": 0.07, "learning_rate": 1.992401295270715e-06, "loss": 0.8218, "step": 2657 }, { "epoch": 0.07, "learning_rate": 1.9923910777643425e-06, "loss": 0.7305, "step": 2658 }, { "epoch": 0.07, "learning_rate": 1.9923808534193957e-06, "loss": 0.8691, "step": 2659 }, { "epoch": 0.07, "learning_rate": 1.992370622235945e-06, "loss": 0.7676, "step": 2660 }, { "epoch": 0.07, "learning_rate": 1.992360384214061e-06, "loss": 1.0156, "step": 2661 }, { "epoch": 0.07, "learning_rate": 1.992350139353814e-06, "loss": 0.8999, "step": 2662 }, { "epoch": 0.07, "learning_rate": 1.9923398876552748e-06, "loss": 0.8232, "step": 2663 }, { "epoch": 0.07, "learning_rate": 1.9923296291185132e-06, "loss": 0.9248, "step": 2664 }, { "epoch": 0.07, "learning_rate": 1.9923193637436013e-06, "loss": 0.6572, "step": 2665 }, { "epoch": 0.07, "learning_rate": 1.9923090915306094e-06, "loss": 1.1377, "step": 2666 }, { "epoch": 0.07, "learning_rate": 1.9922988124796077e-06, "loss": 1.0811, "step": 2667 }, { "epoch": 0.07, "learning_rate": 1.992288526590667e-06, "loss": 0.8804, "step": 2668 }, { "epoch": 0.07, "learning_rate": 1.9922782338638594e-06, "loss": 0.9697, "step": 2669 }, { "epoch": 0.07, "learning_rate": 1.9922679342992545e-06, "loss": 1.001, "step": 2670 }, { "epoch": 0.07, "learning_rate": 1.9922576278969237e-06, "loss": 0.9785, "step": 2671 }, { "epoch": 0.07, "learning_rate": 1.9922473146569385e-06, "loss": 0.9932, "step": 2672 }, { "epoch": 0.07, "learning_rate": 1.992236994579369e-06, "loss": 1.1768, "step": 2673 }, { "epoch": 0.07, "learning_rate": 1.9922266676642873e-06, "loss": 0.7588, "step": 2674 }, { "epoch": 0.07, "learning_rate": 1.992216333911764e-06, "loss": 1.083, "step": 2675 }, { "epoch": 0.07, "learning_rate": 1.9922059933218706e-06, "loss": 0.6689, "step": 2676 }, { "epoch": 0.07, "learning_rate": 1.992195645894678e-06, "loss": 0.8896, "step": 2677 }, { "epoch": 0.07, "learning_rate": 1.9921852916302576e-06, "loss": 1.1504, "step": 2678 }, { "epoch": 0.07, "learning_rate": 1.992174930528681e-06, "loss": 0.9834, "step": 2679 }, { "epoch": 0.07, "learning_rate": 1.9921645625900196e-06, "loss": 0.8516, "step": 2680 }, { "epoch": 0.07, "learning_rate": 1.9921541878143448e-06, "loss": 0.6638, "step": 2681 }, { "epoch": 0.07, "learning_rate": 1.992143806201728e-06, "loss": 0.8564, "step": 2682 }, { "epoch": 0.07, "learning_rate": 1.99213341775224e-06, "loss": 0.8521, "step": 2683 }, { "epoch": 0.07, "learning_rate": 1.992123022465954e-06, "loss": 1.1074, "step": 2684 }, { "epoch": 0.07, "learning_rate": 1.9921126203429403e-06, "loss": 1.1094, "step": 2685 }, { "epoch": 0.07, "learning_rate": 1.9921022113832714e-06, "loss": 0.8513, "step": 2686 }, { "epoch": 0.07, "learning_rate": 1.9920917955870183e-06, "loss": 1.1465, "step": 2687 }, { "epoch": 0.07, "learning_rate": 1.992081372954253e-06, "loss": 0.8242, "step": 2688 }, { "epoch": 0.07, "learning_rate": 1.9920709434850476e-06, "loss": 1.1416, "step": 2689 }, { "epoch": 0.07, "learning_rate": 1.9920605071794744e-06, "loss": 1.2217, "step": 2690 }, { "epoch": 0.07, "learning_rate": 1.992050064037604e-06, "loss": 0.9141, "step": 2691 }, { "epoch": 0.07, "learning_rate": 1.9920396140595096e-06, "loss": 0.9512, "step": 2692 }, { "epoch": 0.07, "learning_rate": 1.9920291572452626e-06, "loss": 0.9072, "step": 2693 }, { "epoch": 0.07, "learning_rate": 1.992018693594935e-06, "loss": 1.0381, "step": 2694 }, { "epoch": 0.07, "learning_rate": 1.9920082231085994e-06, "loss": 0.8955, "step": 2695 }, { "epoch": 0.07, "learning_rate": 1.9919977457863273e-06, "loss": 0.8379, "step": 2696 }, { "epoch": 0.07, "learning_rate": 1.9919872616281914e-06, "loss": 0.7734, "step": 2697 }, { "epoch": 0.07, "learning_rate": 1.9919767706342637e-06, "loss": 0.7817, "step": 2698 }, { "epoch": 0.07, "learning_rate": 1.9919662728046167e-06, "loss": 0.8916, "step": 2699 }, { "epoch": 0.07, "learning_rate": 1.9919557681393227e-06, "loss": 1.1318, "step": 2700 }, { "epoch": 0.07, "learning_rate": 1.991945256638454e-06, "loss": 0.9844, "step": 2701 }, { "epoch": 0.07, "learning_rate": 1.9919347383020824e-06, "loss": 0.7778, "step": 2702 }, { "epoch": 0.07, "learning_rate": 1.9919242131302817e-06, "loss": 1.0879, "step": 2703 }, { "epoch": 0.07, "learning_rate": 1.9919136811231238e-06, "loss": 0.78, "step": 2704 }, { "epoch": 0.07, "learning_rate": 1.991903142280681e-06, "loss": 1.041, "step": 2705 }, { "epoch": 0.07, "learning_rate": 1.9918925966030262e-06, "loss": 0.8848, "step": 2706 }, { "epoch": 0.07, "learning_rate": 1.9918820440902323e-06, "loss": 0.9443, "step": 2707 }, { "epoch": 0.07, "learning_rate": 1.9918714847423713e-06, "loss": 0.9316, "step": 2708 }, { "epoch": 0.07, "learning_rate": 1.9918609185595163e-06, "loss": 1.0205, "step": 2709 }, { "epoch": 0.07, "learning_rate": 1.991850345541741e-06, "loss": 0.9854, "step": 2710 }, { "epoch": 0.07, "learning_rate": 1.9918397656891166e-06, "loss": 0.9766, "step": 2711 }, { "epoch": 0.07, "learning_rate": 1.9918291790017176e-06, "loss": 0.8838, "step": 2712 }, { "epoch": 0.07, "learning_rate": 1.9918185854796156e-06, "loss": 1.0967, "step": 2713 }, { "epoch": 0.07, "learning_rate": 1.9918079851228848e-06, "loss": 1.0889, "step": 2714 }, { "epoch": 0.07, "learning_rate": 1.991797377931597e-06, "loss": 1.0898, "step": 2715 }, { "epoch": 0.07, "learning_rate": 1.9917867639058264e-06, "loss": 0.9473, "step": 2716 }, { "epoch": 0.07, "learning_rate": 1.991776143045646e-06, "loss": 0.9785, "step": 2717 }, { "epoch": 0.07, "learning_rate": 1.9917655153511283e-06, "loss": 0.7195, "step": 2718 }, { "epoch": 0.07, "learning_rate": 1.991754880822347e-06, "loss": 0.9473, "step": 2719 }, { "epoch": 0.07, "learning_rate": 1.9917442394593756e-06, "loss": 1.1348, "step": 2720 }, { "epoch": 0.07, "learning_rate": 1.9917335912622866e-06, "loss": 1.1631, "step": 2721 }, { "epoch": 0.07, "learning_rate": 1.9917229362311546e-06, "loss": 0.8623, "step": 2722 }, { "epoch": 0.07, "learning_rate": 1.991712274366052e-06, "loss": 0.7261, "step": 2723 }, { "epoch": 0.07, "learning_rate": 1.9917016056670526e-06, "loss": 0.959, "step": 2724 }, { "epoch": 0.07, "learning_rate": 1.9916909301342296e-06, "loss": 0.8516, "step": 2725 }, { "epoch": 0.07, "learning_rate": 1.9916802477676574e-06, "loss": 0.9932, "step": 2726 }, { "epoch": 0.07, "learning_rate": 1.991669558567409e-06, "loss": 1.0205, "step": 2727 }, { "epoch": 0.07, "learning_rate": 1.9916588625335583e-06, "loss": 1.0449, "step": 2728 }, { "epoch": 0.07, "learning_rate": 1.991648159666179e-06, "loss": 1.0859, "step": 2729 }, { "epoch": 0.07, "learning_rate": 1.9916374499653443e-06, "loss": 0.8633, "step": 2730 }, { "epoch": 0.07, "learning_rate": 1.9916267334311288e-06, "loss": 1.0225, "step": 2731 }, { "epoch": 0.07, "learning_rate": 1.991616010063606e-06, "loss": 0.9414, "step": 2732 }, { "epoch": 0.07, "learning_rate": 1.9916052798628495e-06, "loss": 0.9434, "step": 2733 }, { "epoch": 0.07, "learning_rate": 1.9915945428289336e-06, "loss": 0.8975, "step": 2734 }, { "epoch": 0.07, "learning_rate": 1.991583798961932e-06, "loss": 1.0264, "step": 2735 }, { "epoch": 0.07, "learning_rate": 1.9915730482619197e-06, "loss": 0.8662, "step": 2736 }, { "epoch": 0.07, "learning_rate": 1.991562290728969e-06, "loss": 0.9883, "step": 2737 }, { "epoch": 0.07, "learning_rate": 1.991551526363156e-06, "loss": 0.9414, "step": 2738 }, { "epoch": 0.07, "learning_rate": 1.9915407551645536e-06, "loss": 1.0029, "step": 2739 }, { "epoch": 0.07, "learning_rate": 1.9915299771332363e-06, "loss": 0.9795, "step": 2740 }, { "epoch": 0.07, "learning_rate": 1.9915191922692786e-06, "loss": 0.8477, "step": 2741 }, { "epoch": 0.07, "learning_rate": 1.9915084005727547e-06, "loss": 0.96, "step": 2742 }, { "epoch": 0.07, "learning_rate": 1.9914976020437386e-06, "loss": 0.7598, "step": 2743 }, { "epoch": 0.07, "learning_rate": 1.991486796682305e-06, "loss": 0.9414, "step": 2744 }, { "epoch": 0.07, "learning_rate": 1.991475984488529e-06, "loss": 0.915, "step": 2745 }, { "epoch": 0.07, "learning_rate": 1.991465165462484e-06, "loss": 0.8906, "step": 2746 }, { "epoch": 0.07, "learning_rate": 1.991454339604245e-06, "loss": 1.1064, "step": 2747 }, { "epoch": 0.07, "learning_rate": 1.9914435069138865e-06, "loss": 1.04, "step": 2748 }, { "epoch": 0.07, "learning_rate": 1.9914326673914835e-06, "loss": 0.5889, "step": 2749 }, { "epoch": 0.07, "learning_rate": 1.9914218210371106e-06, "loss": 0.9678, "step": 2750 }, { "epoch": 0.07, "learning_rate": 1.9914109678508427e-06, "loss": 0.9775, "step": 2751 }, { "epoch": 0.07, "learning_rate": 1.991400107832754e-06, "loss": 0.8169, "step": 2752 }, { "epoch": 0.07, "learning_rate": 1.9913892409829195e-06, "loss": 1.0615, "step": 2753 }, { "epoch": 0.07, "learning_rate": 1.9913783673014146e-06, "loss": 1.1777, "step": 2754 }, { "epoch": 0.07, "learning_rate": 1.9913674867883138e-06, "loss": 0.9404, "step": 2755 }, { "epoch": 0.07, "learning_rate": 1.991356599443692e-06, "loss": 1.2021, "step": 2756 }, { "epoch": 0.07, "learning_rate": 1.9913457052676247e-06, "loss": 0.9014, "step": 2757 }, { "epoch": 0.07, "learning_rate": 1.9913348042601864e-06, "loss": 1.0156, "step": 2758 }, { "epoch": 0.07, "learning_rate": 1.9913238964214524e-06, "loss": 0.6641, "step": 2759 }, { "epoch": 0.07, "learning_rate": 1.9913129817514985e-06, "loss": 0.8047, "step": 2760 }, { "epoch": 0.07, "learning_rate": 1.9913020602503988e-06, "loss": 0.896, "step": 2761 }, { "epoch": 0.07, "learning_rate": 1.9912911319182295e-06, "loss": 0.9785, "step": 2762 }, { "epoch": 0.07, "learning_rate": 1.991280196755065e-06, "loss": 0.6899, "step": 2763 }, { "epoch": 0.07, "learning_rate": 1.9912692547609816e-06, "loss": 0.9307, "step": 2764 }, { "epoch": 0.07, "learning_rate": 1.9912583059360537e-06, "loss": 0.9072, "step": 2765 }, { "epoch": 0.07, "learning_rate": 1.991247350280358e-06, "loss": 1.1201, "step": 2766 }, { "epoch": 0.07, "learning_rate": 1.991236387793969e-06, "loss": 1.0303, "step": 2767 }, { "epoch": 0.07, "learning_rate": 1.9912254184769627e-06, "loss": 0.7358, "step": 2768 }, { "epoch": 0.07, "learning_rate": 1.9912144423294147e-06, "loss": 0.8237, "step": 2769 }, { "epoch": 0.07, "learning_rate": 1.9912034593514e-06, "loss": 0.9199, "step": 2770 }, { "epoch": 0.07, "learning_rate": 1.9911924695429953e-06, "loss": 0.7891, "step": 2771 }, { "epoch": 0.07, "learning_rate": 1.9911814729042757e-06, "loss": 1.0371, "step": 2772 }, { "epoch": 0.07, "learning_rate": 1.9911704694353165e-06, "loss": 0.709, "step": 2773 }, { "epoch": 0.07, "learning_rate": 1.991159459136195e-06, "loss": 1.1152, "step": 2774 }, { "epoch": 0.07, "learning_rate": 1.9911484420069855e-06, "loss": 0.8335, "step": 2775 }, { "epoch": 0.07, "learning_rate": 1.991137418047765e-06, "loss": 0.8057, "step": 2776 }, { "epoch": 0.07, "learning_rate": 1.991126387258609e-06, "loss": 0.9956, "step": 2777 }, { "epoch": 0.07, "learning_rate": 1.9911153496395933e-06, "loss": 0.8457, "step": 2778 }, { "epoch": 0.07, "learning_rate": 1.9911043051907943e-06, "loss": 0.7085, "step": 2779 }, { "epoch": 0.07, "learning_rate": 1.9910932539122882e-06, "loss": 1.1826, "step": 2780 }, { "epoch": 0.07, "learning_rate": 1.9910821958041512e-06, "loss": 1.2158, "step": 2781 }, { "epoch": 0.07, "learning_rate": 1.9910711308664588e-06, "loss": 0.8164, "step": 2782 }, { "epoch": 0.07, "learning_rate": 1.9910600590992883e-06, "loss": 0.9238, "step": 2783 }, { "epoch": 0.07, "learning_rate": 1.991048980502715e-06, "loss": 0.4988, "step": 2784 }, { "epoch": 0.07, "learning_rate": 1.9910378950768157e-06, "loss": 0.6453, "step": 2785 }, { "epoch": 0.07, "learning_rate": 1.991026802821667e-06, "loss": 1.002, "step": 2786 }, { "epoch": 0.07, "learning_rate": 1.991015703737345e-06, "loss": 1.0254, "step": 2787 }, { "epoch": 0.07, "learning_rate": 1.9910045978239264e-06, "loss": 0.8467, "step": 2788 }, { "epoch": 0.07, "learning_rate": 1.9909934850814876e-06, "loss": 0.7847, "step": 2789 }, { "epoch": 0.07, "learning_rate": 1.9909823655101052e-06, "loss": 0.9619, "step": 2790 }, { "epoch": 0.07, "learning_rate": 1.990971239109856e-06, "loss": 1.1201, "step": 2791 }, { "epoch": 0.07, "learning_rate": 1.990960105880816e-06, "loss": 1.1172, "step": 2792 }, { "epoch": 0.07, "learning_rate": 1.990948965823063e-06, "loss": 0.9219, "step": 2793 }, { "epoch": 0.07, "learning_rate": 1.9909378189366728e-06, "loss": 1.1133, "step": 2794 }, { "epoch": 0.07, "learning_rate": 1.990926665221723e-06, "loss": 0.7793, "step": 2795 }, { "epoch": 0.07, "learning_rate": 1.9909155046782894e-06, "loss": 0.9932, "step": 2796 }, { "epoch": 0.07, "learning_rate": 1.9909043373064504e-06, "loss": 0.8877, "step": 2797 }, { "epoch": 0.07, "learning_rate": 1.9908931631062816e-06, "loss": 0.9014, "step": 2798 }, { "epoch": 0.07, "learning_rate": 1.9908819820778605e-06, "loss": 0.9912, "step": 2799 }, { "epoch": 0.07, "learning_rate": 1.9908707942212645e-06, "loss": 1.1729, "step": 2800 }, { "epoch": 0.07, "learning_rate": 1.99085959953657e-06, "loss": 0.854, "step": 2801 }, { "epoch": 0.07, "learning_rate": 1.9908483980238546e-06, "loss": 1.1289, "step": 2802 }, { "epoch": 0.07, "learning_rate": 1.9908371896831958e-06, "loss": 1.0498, "step": 2803 }, { "epoch": 0.07, "learning_rate": 1.99082597451467e-06, "loss": 0.9443, "step": 2804 }, { "epoch": 0.07, "learning_rate": 1.990814752518355e-06, "loss": 0.9658, "step": 2805 }, { "epoch": 0.07, "learning_rate": 1.990803523694328e-06, "loss": 1.1309, "step": 2806 }, { "epoch": 0.07, "learning_rate": 1.9907922880426668e-06, "loss": 1.0303, "step": 2807 }, { "epoch": 0.07, "learning_rate": 1.9907810455634482e-06, "loss": 0.9609, "step": 2808 }, { "epoch": 0.07, "learning_rate": 1.99076979625675e-06, "loss": 1.0527, "step": 2809 }, { "epoch": 0.07, "learning_rate": 1.9907585401226495e-06, "loss": 0.8833, "step": 2810 }, { "epoch": 0.07, "learning_rate": 1.9907472771612244e-06, "loss": 0.8955, "step": 2811 }, { "epoch": 0.07, "learning_rate": 1.9907360073725527e-06, "loss": 1.0625, "step": 2812 }, { "epoch": 0.07, "learning_rate": 1.9907247307567113e-06, "loss": 1.1543, "step": 2813 }, { "epoch": 0.07, "learning_rate": 1.9907134473137783e-06, "loss": 1.0146, "step": 2814 }, { "epoch": 0.07, "learning_rate": 1.9907021570438318e-06, "loss": 0.8799, "step": 2815 }, { "epoch": 0.07, "learning_rate": 1.9906908599469488e-06, "loss": 1.0352, "step": 2816 }, { "epoch": 0.07, "learning_rate": 1.990679556023208e-06, "loss": 0.9443, "step": 2817 }, { "epoch": 0.07, "learning_rate": 1.9906682452726868e-06, "loss": 1.0381, "step": 2818 }, { "epoch": 0.07, "learning_rate": 1.990656927695463e-06, "loss": 0.9854, "step": 2819 }, { "epoch": 0.07, "learning_rate": 1.9906456032916152e-06, "loss": 0.9873, "step": 2820 }, { "epoch": 0.07, "learning_rate": 1.9906342720612204e-06, "loss": 0.958, "step": 2821 }, { "epoch": 0.07, "learning_rate": 1.990622934004358e-06, "loss": 1.0127, "step": 2822 }, { "epoch": 0.07, "learning_rate": 1.9906115891211054e-06, "loss": 1.1191, "step": 2823 }, { "epoch": 0.07, "learning_rate": 1.9906002374115407e-06, "loss": 0.9043, "step": 2824 }, { "epoch": 0.07, "learning_rate": 1.9905888788757424e-06, "loss": 0.9941, "step": 2825 }, { "epoch": 0.07, "learning_rate": 1.9905775135137887e-06, "loss": 1.0859, "step": 2826 }, { "epoch": 0.07, "learning_rate": 1.9905661413257574e-06, "loss": 0.6499, "step": 2827 }, { "epoch": 0.07, "learning_rate": 1.9905547623117277e-06, "loss": 1.0049, "step": 2828 }, { "epoch": 0.07, "learning_rate": 1.990543376471778e-06, "loss": 1.1191, "step": 2829 }, { "epoch": 0.07, "learning_rate": 1.9905319838059856e-06, "loss": 1.0547, "step": 2830 }, { "epoch": 0.07, "learning_rate": 1.9905205843144304e-06, "loss": 1.2803, "step": 2831 }, { "epoch": 0.07, "learning_rate": 1.9905091779971903e-06, "loss": 0.9375, "step": 2832 }, { "epoch": 0.07, "learning_rate": 1.990497764854344e-06, "loss": 0.8008, "step": 2833 }, { "epoch": 0.07, "learning_rate": 1.99048634488597e-06, "loss": 1.1465, "step": 2834 }, { "epoch": 0.07, "learning_rate": 1.990474918092147e-06, "loss": 1.0498, "step": 2835 }, { "epoch": 0.07, "learning_rate": 1.9904634844729543e-06, "loss": 0.7744, "step": 2836 }, { "epoch": 0.07, "learning_rate": 1.99045204402847e-06, "loss": 0.8257, "step": 2837 }, { "epoch": 0.07, "learning_rate": 1.990440596758773e-06, "loss": 1.0859, "step": 2838 }, { "epoch": 0.07, "learning_rate": 1.990429142663942e-06, "loss": 0.895, "step": 2839 }, { "epoch": 0.07, "learning_rate": 1.990417681744057e-06, "loss": 0.9785, "step": 2840 }, { "epoch": 0.07, "learning_rate": 1.990406213999196e-06, "loss": 1.0342, "step": 2841 }, { "epoch": 0.07, "learning_rate": 1.9903947394294386e-06, "loss": 0.9424, "step": 2842 }, { "epoch": 0.07, "learning_rate": 1.990383258034863e-06, "loss": 0.917, "step": 2843 }, { "epoch": 0.07, "learning_rate": 1.9903717698155496e-06, "loss": 0.8408, "step": 2844 }, { "epoch": 0.07, "learning_rate": 1.9903602747715764e-06, "loss": 1.0234, "step": 2845 }, { "epoch": 0.07, "learning_rate": 1.9903487729030232e-06, "loss": 0.9824, "step": 2846 }, { "epoch": 0.07, "learning_rate": 1.9903372642099688e-06, "loss": 1.1123, "step": 2847 }, { "epoch": 0.07, "learning_rate": 1.990325748692493e-06, "loss": 0.8975, "step": 2848 }, { "epoch": 0.07, "learning_rate": 1.9903142263506754e-06, "loss": 0.9746, "step": 2849 }, { "epoch": 0.07, "learning_rate": 1.9903026971845945e-06, "loss": 0.7715, "step": 2850 }, { "epoch": 0.07, "learning_rate": 1.9902911611943304e-06, "loss": 1.1191, "step": 2851 }, { "epoch": 0.07, "learning_rate": 1.9902796183799622e-06, "loss": 0.6689, "step": 2852 }, { "epoch": 0.07, "learning_rate": 1.99026806874157e-06, "loss": 0.9463, "step": 2853 }, { "epoch": 0.07, "learning_rate": 1.9902565122792333e-06, "loss": 0.9277, "step": 2854 }, { "epoch": 0.07, "learning_rate": 1.990244948993031e-06, "loss": 0.9512, "step": 2855 }, { "epoch": 0.07, "learning_rate": 1.9902333788830435e-06, "loss": 1.0078, "step": 2856 }, { "epoch": 0.07, "learning_rate": 1.99022180194935e-06, "loss": 1.0889, "step": 2857 }, { "epoch": 0.07, "learning_rate": 1.990210218192031e-06, "loss": 0.9307, "step": 2858 }, { "epoch": 0.07, "learning_rate": 1.9901986276111654e-06, "loss": 1.0117, "step": 2859 }, { "epoch": 0.07, "learning_rate": 1.990187030206834e-06, "loss": 1.0576, "step": 2860 }, { "epoch": 0.07, "learning_rate": 1.9901754259791164e-06, "loss": 0.8926, "step": 2861 }, { "epoch": 0.07, "learning_rate": 1.990163814928092e-06, "loss": 1.0303, "step": 2862 }, { "epoch": 0.07, "learning_rate": 1.990152197053842e-06, "loss": 0.8892, "step": 2863 }, { "epoch": 0.07, "learning_rate": 1.990140572356445e-06, "loss": 0.9297, "step": 2864 }, { "epoch": 0.07, "learning_rate": 1.990128940835982e-06, "loss": 1.0732, "step": 2865 }, { "epoch": 0.07, "learning_rate": 1.9901173024925332e-06, "loss": 0.8799, "step": 2866 }, { "epoch": 0.07, "learning_rate": 1.9901056573261787e-06, "loss": 1.0234, "step": 2867 }, { "epoch": 0.07, "learning_rate": 1.990094005336998e-06, "loss": 1.0488, "step": 2868 }, { "epoch": 0.07, "learning_rate": 1.9900823465250727e-06, "loss": 0.9658, "step": 2869 }, { "epoch": 0.07, "learning_rate": 1.990070680890482e-06, "loss": 0.8081, "step": 2870 }, { "epoch": 0.07, "learning_rate": 1.990059008433307e-06, "loss": 0.8076, "step": 2871 }, { "epoch": 0.07, "learning_rate": 1.990047329153628e-06, "loss": 0.8071, "step": 2872 }, { "epoch": 0.07, "learning_rate": 1.9900356430515252e-06, "loss": 0.9336, "step": 2873 }, { "epoch": 0.07, "learning_rate": 1.9900239501270794e-06, "loss": 1.0605, "step": 2874 }, { "epoch": 0.07, "learning_rate": 1.9900122503803705e-06, "loss": 0.9482, "step": 2875 }, { "epoch": 0.07, "learning_rate": 1.9900005438114804e-06, "loss": 0.9102, "step": 2876 }, { "epoch": 0.07, "learning_rate": 1.989988830420489e-06, "loss": 0.8223, "step": 2877 }, { "epoch": 0.07, "learning_rate": 1.989977110207477e-06, "loss": 1.0254, "step": 2878 }, { "epoch": 0.07, "learning_rate": 1.9899653831725253e-06, "loss": 0.7896, "step": 2879 }, { "epoch": 0.07, "learning_rate": 1.9899536493157145e-06, "loss": 1.1357, "step": 2880 }, { "epoch": 0.07, "learning_rate": 1.9899419086371257e-06, "loss": 1.0254, "step": 2881 }, { "epoch": 0.07, "learning_rate": 1.98993016113684e-06, "loss": 1.0957, "step": 2882 }, { "epoch": 0.07, "learning_rate": 1.989918406814938e-06, "loss": 0.7412, "step": 2883 }, { "epoch": 0.07, "learning_rate": 1.9899066456715003e-06, "loss": 1.082, "step": 2884 }, { "epoch": 0.07, "learning_rate": 1.9898948777066086e-06, "loss": 0.8096, "step": 2885 }, { "epoch": 0.07, "learning_rate": 1.989883102920344e-06, "loss": 0.832, "step": 2886 }, { "epoch": 0.07, "learning_rate": 1.9898713213127875e-06, "loss": 0.9775, "step": 2887 }, { "epoch": 0.07, "learning_rate": 1.9898595328840203e-06, "loss": 1.0264, "step": 2888 }, { "epoch": 0.07, "learning_rate": 1.9898477376341234e-06, "loss": 0.9502, "step": 2889 }, { "epoch": 0.07, "learning_rate": 1.9898359355631782e-06, "loss": 0.9912, "step": 2890 }, { "epoch": 0.07, "learning_rate": 1.9898241266712665e-06, "loss": 1.0322, "step": 2891 }, { "epoch": 0.07, "learning_rate": 1.989812310958469e-06, "loss": 1.0068, "step": 2892 }, { "epoch": 0.07, "learning_rate": 1.989800488424867e-06, "loss": 0.875, "step": 2893 }, { "epoch": 0.07, "learning_rate": 1.9897886590705426e-06, "loss": 0.7861, "step": 2894 }, { "epoch": 0.07, "learning_rate": 1.9897768228955772e-06, "loss": 0.9414, "step": 2895 }, { "epoch": 0.07, "learning_rate": 1.9897649799000527e-06, "loss": 1.3027, "step": 2896 }, { "epoch": 0.07, "learning_rate": 1.9897531300840494e-06, "loss": 1.0273, "step": 2897 }, { "epoch": 0.07, "learning_rate": 1.9897412734476504e-06, "loss": 0.9131, "step": 2898 }, { "epoch": 0.07, "learning_rate": 1.9897294099909367e-06, "loss": 0.9678, "step": 2899 }, { "epoch": 0.07, "learning_rate": 1.98971753971399e-06, "loss": 1.0059, "step": 2900 }, { "epoch": 0.07, "learning_rate": 1.989705662616892e-06, "loss": 0.998, "step": 2901 }, { "epoch": 0.07, "learning_rate": 1.9896937786997253e-06, "loss": 0.9189, "step": 2902 }, { "epoch": 0.07, "learning_rate": 1.989681887962571e-06, "loss": 0.7532, "step": 2903 }, { "epoch": 0.07, "learning_rate": 1.9896699904055115e-06, "loss": 1.0059, "step": 2904 }, { "epoch": 0.07, "learning_rate": 1.989658086028629e-06, "loss": 0.9658, "step": 2905 }, { "epoch": 0.07, "learning_rate": 1.9896461748320044e-06, "loss": 0.71, "step": 2906 }, { "epoch": 0.07, "learning_rate": 1.989634256815721e-06, "loss": 0.9922, "step": 2907 }, { "epoch": 0.07, "learning_rate": 1.98962233197986e-06, "loss": 0.9512, "step": 2908 }, { "epoch": 0.07, "learning_rate": 1.9896104003245043e-06, "loss": 1.0264, "step": 2909 }, { "epoch": 0.07, "learning_rate": 1.989598461849736e-06, "loss": 1.1621, "step": 2910 }, { "epoch": 0.07, "learning_rate": 1.9895865165556373e-06, "loss": 1.0566, "step": 2911 }, { "epoch": 0.07, "learning_rate": 1.98957456444229e-06, "loss": 1.0469, "step": 2912 }, { "epoch": 0.07, "learning_rate": 1.989562605509777e-06, "loss": 0.875, "step": 2913 }, { "epoch": 0.07, "learning_rate": 1.989550639758181e-06, "loss": 0.96, "step": 2914 }, { "epoch": 0.07, "learning_rate": 1.989538667187584e-06, "loss": 0.9727, "step": 2915 }, { "epoch": 0.07, "learning_rate": 1.989526687798068e-06, "loss": 1.0088, "step": 2916 }, { "epoch": 0.07, "learning_rate": 1.989514701589717e-06, "loss": 0.8945, "step": 2917 }, { "epoch": 0.07, "learning_rate": 1.9895027085626123e-06, "loss": 1.0049, "step": 2918 }, { "epoch": 0.07, "learning_rate": 1.9894907087168367e-06, "loss": 1.0801, "step": 2919 }, { "epoch": 0.07, "learning_rate": 1.9894787020524735e-06, "loss": 1.1777, "step": 2920 }, { "epoch": 0.07, "learning_rate": 1.989466688569605e-06, "loss": 0.957, "step": 2921 }, { "epoch": 0.07, "learning_rate": 1.989454668268314e-06, "loss": 1.0713, "step": 2922 }, { "epoch": 0.07, "learning_rate": 1.9894426411486835e-06, "loss": 0.8789, "step": 2923 }, { "epoch": 0.07, "learning_rate": 1.989430607210796e-06, "loss": 1.0752, "step": 2924 }, { "epoch": 0.07, "learning_rate": 1.989418566454735e-06, "loss": 0.7412, "step": 2925 }, { "epoch": 0.07, "learning_rate": 1.989406518880583e-06, "loss": 1.0684, "step": 2926 }, { "epoch": 0.08, "learning_rate": 1.9893944644884235e-06, "loss": 0.9238, "step": 2927 }, { "epoch": 0.08, "learning_rate": 1.989382403278339e-06, "loss": 0.8013, "step": 2928 }, { "epoch": 0.08, "learning_rate": 1.989370335250413e-06, "loss": 0.9658, "step": 2929 }, { "epoch": 0.08, "learning_rate": 1.9893582604047286e-06, "loss": 0.8472, "step": 2930 }, { "epoch": 0.08, "learning_rate": 1.9893461787413687e-06, "loss": 0.7554, "step": 2931 }, { "epoch": 0.08, "learning_rate": 1.989334090260417e-06, "loss": 1.1611, "step": 2932 }, { "epoch": 0.08, "learning_rate": 1.989321994961957e-06, "loss": 0.8945, "step": 2933 }, { "epoch": 0.08, "learning_rate": 1.9893098928460708e-06, "loss": 1.0947, "step": 2934 }, { "epoch": 0.08, "learning_rate": 1.989297783912843e-06, "loss": 1.2236, "step": 2935 }, { "epoch": 0.08, "learning_rate": 1.989285668162357e-06, "loss": 0.9844, "step": 2936 }, { "epoch": 0.08, "learning_rate": 1.9892735455946957e-06, "loss": 1.002, "step": 2937 }, { "epoch": 0.08, "learning_rate": 1.989261416209943e-06, "loss": 0.8232, "step": 2938 }, { "epoch": 0.08, "learning_rate": 1.9892492800081823e-06, "loss": 0.9883, "step": 2939 }, { "epoch": 0.08, "learning_rate": 1.9892371369894975e-06, "loss": 1.0098, "step": 2940 }, { "epoch": 0.08, "learning_rate": 1.9892249871539724e-06, "loss": 0.8428, "step": 2941 }, { "epoch": 0.08, "learning_rate": 1.98921283050169e-06, "loss": 0.9111, "step": 2942 }, { "epoch": 0.08, "learning_rate": 1.989200667032735e-06, "loss": 0.9883, "step": 2943 }, { "epoch": 0.08, "learning_rate": 1.98918849674719e-06, "loss": 1.127, "step": 2944 }, { "epoch": 0.08, "learning_rate": 1.98917631964514e-06, "loss": 1.0273, "step": 2945 }, { "epoch": 0.08, "learning_rate": 1.9891641357266683e-06, "loss": 0.8584, "step": 2946 }, { "epoch": 0.08, "learning_rate": 1.9891519449918596e-06, "loss": 1.292, "step": 2947 }, { "epoch": 0.08, "learning_rate": 1.989139747440797e-06, "loss": 0.8364, "step": 2948 }, { "epoch": 0.08, "learning_rate": 1.9891275430735646e-06, "loss": 0.959, "step": 2949 }, { "epoch": 0.08, "learning_rate": 1.9891153318902473e-06, "loss": 1.0781, "step": 2950 }, { "epoch": 0.08, "learning_rate": 1.9891031138909286e-06, "loss": 1.0342, "step": 2951 }, { "epoch": 0.08, "learning_rate": 1.989090889075693e-06, "loss": 0.9619, "step": 2952 }, { "epoch": 0.08, "learning_rate": 1.9890786574446247e-06, "loss": 0.9316, "step": 2953 }, { "epoch": 0.08, "learning_rate": 1.9890664189978074e-06, "loss": 1.0361, "step": 2954 }, { "epoch": 0.08, "learning_rate": 1.9890541737353265e-06, "loss": 0.8838, "step": 2955 }, { "epoch": 0.08, "learning_rate": 1.9890419216572652e-06, "loss": 0.8984, "step": 2956 }, { "epoch": 0.08, "learning_rate": 1.9890296627637092e-06, "loss": 1.1406, "step": 2957 }, { "epoch": 0.08, "learning_rate": 1.989017397054742e-06, "loss": 0.8945, "step": 2958 }, { "epoch": 0.08, "learning_rate": 1.9890051245304488e-06, "loss": 0.7891, "step": 2959 }, { "epoch": 0.08, "learning_rate": 1.9889928451909133e-06, "loss": 0.9941, "step": 2960 }, { "epoch": 0.08, "learning_rate": 1.9889805590362206e-06, "loss": 0.9668, "step": 2961 }, { "epoch": 0.08, "learning_rate": 1.988968266066456e-06, "loss": 0.7515, "step": 2962 }, { "epoch": 0.08, "learning_rate": 1.988955966281703e-06, "loss": 0.9365, "step": 2963 }, { "epoch": 0.08, "learning_rate": 1.9889436596820472e-06, "loss": 0.8535, "step": 2964 }, { "epoch": 0.08, "learning_rate": 1.988931346267573e-06, "loss": 0.9922, "step": 2965 }, { "epoch": 0.08, "learning_rate": 1.988919026038366e-06, "loss": 0.96, "step": 2966 }, { "epoch": 0.08, "learning_rate": 1.98890669899451e-06, "loss": 0.7402, "step": 2967 }, { "epoch": 0.08, "learning_rate": 1.9888943651360906e-06, "loss": 0.8906, "step": 2968 }, { "epoch": 0.08, "learning_rate": 1.9888820244631925e-06, "loss": 0.8296, "step": 2969 }, { "epoch": 0.08, "learning_rate": 1.9888696769759012e-06, "loss": 0.6973, "step": 2970 }, { "epoch": 0.08, "learning_rate": 1.9888573226743014e-06, "loss": 1.0098, "step": 2971 }, { "epoch": 0.08, "learning_rate": 1.9888449615584783e-06, "loss": 0.7231, "step": 2972 }, { "epoch": 0.08, "learning_rate": 1.988832593628517e-06, "loss": 0.9717, "step": 2973 }, { "epoch": 0.08, "learning_rate": 1.988820218884503e-06, "loss": 0.875, "step": 2974 }, { "epoch": 0.08, "learning_rate": 1.9888078373265213e-06, "loss": 1.04, "step": 2975 }, { "epoch": 0.08, "learning_rate": 1.9887954489546573e-06, "loss": 0.9883, "step": 2976 }, { "epoch": 0.08, "learning_rate": 1.9887830537689964e-06, "loss": 0.8262, "step": 2977 }, { "epoch": 0.08, "learning_rate": 1.9887706517696237e-06, "loss": 0.9004, "step": 2978 }, { "epoch": 0.08, "learning_rate": 1.9887582429566257e-06, "loss": 0.9844, "step": 2979 }, { "epoch": 0.08, "learning_rate": 1.9887458273300866e-06, "loss": 0.8457, "step": 2980 }, { "epoch": 0.08, "learning_rate": 1.988733404890093e-06, "loss": 0.8315, "step": 2981 }, { "epoch": 0.08, "learning_rate": 1.9887209756367296e-06, "loss": 0.7615, "step": 2982 }, { "epoch": 0.08, "learning_rate": 1.9887085395700823e-06, "loss": 0.9316, "step": 2983 }, { "epoch": 0.08, "learning_rate": 1.9886960966902373e-06, "loss": 0.7651, "step": 2984 }, { "epoch": 0.08, "learning_rate": 1.98868364699728e-06, "loss": 0.75, "step": 2985 }, { "epoch": 0.08, "learning_rate": 1.9886711904912965e-06, "loss": 1.1426, "step": 2986 }, { "epoch": 0.08, "learning_rate": 1.988658727172372e-06, "loss": 0.9058, "step": 2987 }, { "epoch": 0.08, "learning_rate": 1.9886462570405927e-06, "loss": 1.042, "step": 2988 }, { "epoch": 0.08, "learning_rate": 1.9886337800960447e-06, "loss": 0.9932, "step": 2989 }, { "epoch": 0.08, "learning_rate": 1.988621296338814e-06, "loss": 1.1201, "step": 2990 }, { "epoch": 0.08, "learning_rate": 1.9886088057689865e-06, "loss": 0.9629, "step": 2991 }, { "epoch": 0.08, "learning_rate": 1.9885963083866477e-06, "loss": 0.9619, "step": 2992 }, { "epoch": 0.08, "learning_rate": 1.988583804191885e-06, "loss": 1.0273, "step": 2993 }, { "epoch": 0.08, "learning_rate": 1.988571293184784e-06, "loss": 1.0088, "step": 2994 }, { "epoch": 0.08, "learning_rate": 1.98855877536543e-06, "loss": 0.8584, "step": 2995 }, { "epoch": 0.08, "learning_rate": 1.98854625073391e-06, "loss": 1.0186, "step": 2996 }, { "epoch": 0.08, "learning_rate": 1.9885337192903105e-06, "loss": 0.9092, "step": 2997 }, { "epoch": 0.08, "learning_rate": 1.9885211810347184e-06, "loss": 0.9131, "step": 2998 }, { "epoch": 0.08, "learning_rate": 1.9885086359672182e-06, "loss": 0.9131, "step": 2999 }, { "epoch": 0.08, "learning_rate": 1.988496084087898e-06, "loss": 0.918, "step": 3000 }, { "epoch": 0.08, "learning_rate": 1.988483525396844e-06, "loss": 0.7183, "step": 3001 }, { "epoch": 0.08, "learning_rate": 1.9884709598941427e-06, "loss": 1.1016, "step": 3002 }, { "epoch": 0.08, "learning_rate": 1.98845838757988e-06, "loss": 0.9834, "step": 3003 }, { "epoch": 0.08, "learning_rate": 1.9884458084541435e-06, "loss": 1.0723, "step": 3004 }, { "epoch": 0.08, "learning_rate": 1.9884332225170195e-06, "loss": 0.832, "step": 3005 }, { "epoch": 0.08, "learning_rate": 1.988420629768595e-06, "loss": 1.1221, "step": 3006 }, { "epoch": 0.08, "learning_rate": 1.9884080302089554e-06, "loss": 1.0078, "step": 3007 }, { "epoch": 0.08, "learning_rate": 1.9883954238381894e-06, "loss": 1.084, "step": 3008 }, { "epoch": 0.08, "learning_rate": 1.9883828106563828e-06, "loss": 0.9556, "step": 3009 }, { "epoch": 0.08, "learning_rate": 1.988370190663623e-06, "loss": 1.2598, "step": 3010 }, { "epoch": 0.08, "learning_rate": 1.9883575638599966e-06, "loss": 0.8438, "step": 3011 }, { "epoch": 0.08, "learning_rate": 1.9883449302455907e-06, "loss": 1.0752, "step": 3012 }, { "epoch": 0.08, "learning_rate": 1.9883322898204927e-06, "loss": 1.0166, "step": 3013 }, { "epoch": 0.08, "learning_rate": 1.988319642584789e-06, "loss": 0.7588, "step": 3014 }, { "epoch": 0.08, "learning_rate": 1.9883069885385673e-06, "loss": 1.0791, "step": 3015 }, { "epoch": 0.08, "learning_rate": 1.9882943276819153e-06, "loss": 0.7661, "step": 3016 }, { "epoch": 0.08, "learning_rate": 1.988281660014919e-06, "loss": 1.168, "step": 3017 }, { "epoch": 0.08, "learning_rate": 1.988268985537666e-06, "loss": 0.9922, "step": 3018 }, { "epoch": 0.08, "learning_rate": 1.988256304250245e-06, "loss": 0.7769, "step": 3019 }, { "epoch": 0.08, "learning_rate": 1.9882436161527413e-06, "loss": 1.0811, "step": 3020 }, { "epoch": 0.08, "learning_rate": 1.9882309212452437e-06, "loss": 1.0225, "step": 3021 }, { "epoch": 0.08, "learning_rate": 1.9882182195278396e-06, "loss": 0.8896, "step": 3022 }, { "epoch": 0.08, "learning_rate": 1.9882055110006163e-06, "loss": 1.1553, "step": 3023 }, { "epoch": 0.08, "learning_rate": 1.988192795663661e-06, "loss": 0.8662, "step": 3024 }, { "epoch": 0.08, "learning_rate": 1.988180073517062e-06, "loss": 0.9863, "step": 3025 }, { "epoch": 0.08, "learning_rate": 1.9881673445609065e-06, "loss": 0.9277, "step": 3026 }, { "epoch": 0.08, "learning_rate": 1.988154608795282e-06, "loss": 0.9092, "step": 3027 }, { "epoch": 0.08, "learning_rate": 1.9881418662202774e-06, "loss": 0.9365, "step": 3028 }, { "epoch": 0.08, "learning_rate": 1.9881291168359794e-06, "loss": 1.1035, "step": 3029 }, { "epoch": 0.08, "learning_rate": 1.988116360642476e-06, "loss": 1.2432, "step": 3030 }, { "epoch": 0.08, "learning_rate": 1.9881035976398554e-06, "loss": 1.0527, "step": 3031 }, { "epoch": 0.08, "learning_rate": 1.9880908278282055e-06, "loss": 1.0098, "step": 3032 }, { "epoch": 0.08, "learning_rate": 1.9880780512076143e-06, "loss": 0.9434, "step": 3033 }, { "epoch": 0.08, "learning_rate": 1.9880652677781696e-06, "loss": 0.9805, "step": 3034 }, { "epoch": 0.08, "learning_rate": 1.9880524775399597e-06, "loss": 1.0381, "step": 3035 }, { "epoch": 0.08, "learning_rate": 1.988039680493073e-06, "loss": 1.0117, "step": 3036 }, { "epoch": 0.08, "learning_rate": 1.9880268766375972e-06, "loss": 1.0732, "step": 3037 }, { "epoch": 0.08, "learning_rate": 1.9880140659736207e-06, "loss": 0.9932, "step": 3038 }, { "epoch": 0.08, "learning_rate": 1.988001248501232e-06, "loss": 0.5859, "step": 3039 }, { "epoch": 0.08, "learning_rate": 1.987988424220519e-06, "loss": 0.9404, "step": 3040 }, { "epoch": 0.08, "learning_rate": 1.98797559313157e-06, "loss": 0.8506, "step": 3041 }, { "epoch": 0.08, "learning_rate": 1.9879627552344743e-06, "loss": 0.9756, "step": 3042 }, { "epoch": 0.08, "learning_rate": 1.9879499105293194e-06, "loss": 1.0381, "step": 3043 }, { "epoch": 0.08, "learning_rate": 1.9879370590161948e-06, "loss": 0.8311, "step": 3044 }, { "epoch": 0.08, "learning_rate": 1.987924200695188e-06, "loss": 0.958, "step": 3045 }, { "epoch": 0.08, "learning_rate": 1.987911335566388e-06, "loss": 0.7563, "step": 3046 }, { "epoch": 0.08, "learning_rate": 1.987898463629884e-06, "loss": 1.0742, "step": 3047 }, { "epoch": 0.08, "learning_rate": 1.987885584885764e-06, "loss": 0.7568, "step": 3048 }, { "epoch": 0.08, "learning_rate": 1.987872699334116e-06, "loss": 0.8818, "step": 3049 }, { "epoch": 0.08, "learning_rate": 1.987859806975031e-06, "loss": 0.917, "step": 3050 }, { "epoch": 0.08, "learning_rate": 1.987846907808596e-06, "loss": 0.8032, "step": 3051 }, { "epoch": 0.08, "learning_rate": 1.9878340018349007e-06, "loss": 1.2471, "step": 3052 }, { "epoch": 0.08, "learning_rate": 1.987821089054034e-06, "loss": 0.8525, "step": 3053 }, { "epoch": 0.08, "learning_rate": 1.9878081694660847e-06, "loss": 0.8027, "step": 3054 }, { "epoch": 0.08, "learning_rate": 1.9877952430711415e-06, "loss": 0.9883, "step": 3055 }, { "epoch": 0.08, "learning_rate": 1.987782309869294e-06, "loss": 0.873, "step": 3056 }, { "epoch": 0.08, "learning_rate": 1.9877693698606316e-06, "loss": 0.9307, "step": 3057 }, { "epoch": 0.08, "learning_rate": 1.9877564230452424e-06, "loss": 0.9541, "step": 3058 }, { "epoch": 0.08, "learning_rate": 1.9877434694232163e-06, "loss": 1.0898, "step": 3059 }, { "epoch": 0.08, "learning_rate": 1.9877305089946426e-06, "loss": 0.959, "step": 3060 }, { "epoch": 0.08, "learning_rate": 1.9877175417596103e-06, "loss": 1.0078, "step": 3061 }, { "epoch": 0.08, "learning_rate": 1.987704567718209e-06, "loss": 0.8857, "step": 3062 }, { "epoch": 0.08, "learning_rate": 1.9876915868705286e-06, "loss": 0.8984, "step": 3063 }, { "epoch": 0.08, "learning_rate": 1.9876785992166575e-06, "loss": 0.6851, "step": 3064 }, { "epoch": 0.08, "learning_rate": 1.9876656047566857e-06, "loss": 0.9609, "step": 3065 }, { "epoch": 0.08, "learning_rate": 1.987652603490703e-06, "loss": 1.0332, "step": 3066 }, { "epoch": 0.08, "learning_rate": 1.987639595418799e-06, "loss": 0.96, "step": 3067 }, { "epoch": 0.08, "learning_rate": 1.9876265805410623e-06, "loss": 1.0068, "step": 3068 }, { "epoch": 0.08, "learning_rate": 1.987613558857584e-06, "loss": 0.8779, "step": 3069 }, { "epoch": 0.08, "learning_rate": 1.9876005303684532e-06, "loss": 1.0859, "step": 3070 }, { "epoch": 0.08, "learning_rate": 1.987587495073759e-06, "loss": 0.8457, "step": 3071 }, { "epoch": 0.08, "learning_rate": 1.9875744529735927e-06, "loss": 1.1035, "step": 3072 }, { "epoch": 0.08, "learning_rate": 1.987561404068043e-06, "loss": 0.8066, "step": 3073 }, { "epoch": 0.08, "learning_rate": 1.9875483483572002e-06, "loss": 0.9883, "step": 3074 }, { "epoch": 0.08, "learning_rate": 1.9875352858411546e-06, "loss": 0.9014, "step": 3075 }, { "epoch": 0.08, "learning_rate": 1.987522216519996e-06, "loss": 0.9658, "step": 3076 }, { "epoch": 0.08, "learning_rate": 1.9875091403938137e-06, "loss": 1.0205, "step": 3077 }, { "epoch": 0.08, "learning_rate": 1.9874960574626985e-06, "loss": 0.7451, "step": 3078 }, { "epoch": 0.08, "learning_rate": 1.987482967726741e-06, "loss": 1.0986, "step": 3079 }, { "epoch": 0.08, "learning_rate": 1.9874698711860306e-06, "loss": 0.9277, "step": 3080 }, { "epoch": 0.08, "learning_rate": 1.9874567678406578e-06, "loss": 0.959, "step": 3081 }, { "epoch": 0.08, "learning_rate": 1.987443657690713e-06, "loss": 0.8799, "step": 3082 }, { "epoch": 0.08, "learning_rate": 1.987430540736287e-06, "loss": 0.8818, "step": 3083 }, { "epoch": 0.08, "learning_rate": 1.987417416977469e-06, "loss": 1.0889, "step": 3084 }, { "epoch": 0.08, "learning_rate": 1.9874042864143506e-06, "loss": 1.002, "step": 3085 }, { "epoch": 0.08, "learning_rate": 1.9873911490470215e-06, "loss": 0.812, "step": 3086 }, { "epoch": 0.08, "learning_rate": 1.9873780048755725e-06, "loss": 0.7695, "step": 3087 }, { "epoch": 0.08, "learning_rate": 1.9873648539000946e-06, "loss": 1.0557, "step": 3088 }, { "epoch": 0.08, "learning_rate": 1.9873516961206776e-06, "loss": 0.772, "step": 3089 }, { "epoch": 0.08, "learning_rate": 1.987338531537413e-06, "loss": 0.8403, "step": 3090 }, { "epoch": 0.08, "learning_rate": 1.9873253601503904e-06, "loss": 0.8594, "step": 3091 }, { "epoch": 0.08, "learning_rate": 1.987312181959702e-06, "loss": 0.7607, "step": 3092 }, { "epoch": 0.08, "learning_rate": 1.9872989969654377e-06, "loss": 1.0889, "step": 3093 }, { "epoch": 0.08, "learning_rate": 1.9872858051676885e-06, "loss": 0.9922, "step": 3094 }, { "epoch": 0.08, "learning_rate": 1.987272606566545e-06, "loss": 1.0107, "step": 3095 }, { "epoch": 0.08, "learning_rate": 1.9872594011620993e-06, "loss": 0.8613, "step": 3096 }, { "epoch": 0.08, "learning_rate": 1.987246188954441e-06, "loss": 1.0117, "step": 3097 }, { "epoch": 0.08, "learning_rate": 1.987232969943662e-06, "loss": 0.9609, "step": 3098 }, { "epoch": 0.08, "learning_rate": 1.9872197441298534e-06, "loss": 0.9365, "step": 3099 }, { "epoch": 0.08, "learning_rate": 1.9872065115131057e-06, "loss": 0.8657, "step": 3100 }, { "epoch": 0.08, "learning_rate": 1.9871932720935103e-06, "loss": 0.9648, "step": 3101 }, { "epoch": 0.08, "learning_rate": 1.9871800258711586e-06, "loss": 0.8789, "step": 3102 }, { "epoch": 0.08, "learning_rate": 1.9871667728461427e-06, "loss": 0.8555, "step": 3103 }, { "epoch": 0.08, "learning_rate": 1.987153513018552e-06, "loss": 0.9023, "step": 3104 }, { "epoch": 0.08, "learning_rate": 1.98714024638848e-06, "loss": 1.0361, "step": 3105 }, { "epoch": 0.08, "learning_rate": 1.9871269729560164e-06, "loss": 0.6875, "step": 3106 }, { "epoch": 0.08, "learning_rate": 1.9871136927212538e-06, "loss": 0.9385, "step": 3107 }, { "epoch": 0.08, "learning_rate": 1.9871004056842833e-06, "loss": 0.9941, "step": 3108 }, { "epoch": 0.08, "learning_rate": 1.987087111845196e-06, "loss": 0.604, "step": 3109 }, { "epoch": 0.08, "learning_rate": 1.9870738112040845e-06, "loss": 1.0596, "step": 3110 }, { "epoch": 0.08, "learning_rate": 1.9870605037610396e-06, "loss": 0.8696, "step": 3111 }, { "epoch": 0.08, "learning_rate": 1.9870471895161533e-06, "loss": 0.9336, "step": 3112 }, { "epoch": 0.08, "learning_rate": 1.9870338684695174e-06, "loss": 0.9424, "step": 3113 }, { "epoch": 0.08, "learning_rate": 1.9870205406212235e-06, "loss": 1.085, "step": 3114 }, { "epoch": 0.08, "learning_rate": 1.987007205971364e-06, "loss": 0.9434, "step": 3115 }, { "epoch": 0.08, "learning_rate": 1.98699386452003e-06, "loss": 1.0039, "step": 3116 }, { "epoch": 0.08, "learning_rate": 1.9869805162673137e-06, "loss": 0.8975, "step": 3117 }, { "epoch": 0.08, "learning_rate": 1.9869671612133074e-06, "loss": 0.9746, "step": 3118 }, { "epoch": 0.08, "learning_rate": 1.9869537993581035e-06, "loss": 1.0059, "step": 3119 }, { "epoch": 0.08, "learning_rate": 1.9869404307017925e-06, "loss": 1.1191, "step": 3120 }, { "epoch": 0.08, "learning_rate": 1.9869270552444685e-06, "loss": 1.0371, "step": 3121 }, { "epoch": 0.08, "learning_rate": 1.986913672986222e-06, "loss": 1.1426, "step": 3122 }, { "epoch": 0.08, "learning_rate": 1.9869002839271464e-06, "loss": 1.0234, "step": 3123 }, { "epoch": 0.08, "learning_rate": 1.986886888067333e-06, "loss": 0.9551, "step": 3124 }, { "epoch": 0.08, "learning_rate": 1.986873485406875e-06, "loss": 1.0537, "step": 3125 }, { "epoch": 0.08, "learning_rate": 1.9868600759458644e-06, "loss": 0.8486, "step": 3126 }, { "epoch": 0.08, "learning_rate": 1.986846659684393e-06, "loss": 0.8633, "step": 3127 }, { "epoch": 0.08, "learning_rate": 1.9868332366225544e-06, "loss": 0.8975, "step": 3128 }, { "epoch": 0.08, "learning_rate": 1.98681980676044e-06, "loss": 0.8994, "step": 3129 }, { "epoch": 0.08, "learning_rate": 1.986806370098144e-06, "loss": 0.7173, "step": 3130 }, { "epoch": 0.08, "learning_rate": 1.9867929266357564e-06, "loss": 0.9727, "step": 3131 }, { "epoch": 0.08, "learning_rate": 1.986779476373372e-06, "loss": 1.0381, "step": 3132 }, { "epoch": 0.08, "learning_rate": 1.986766019311083e-06, "loss": 1.0117, "step": 3133 }, { "epoch": 0.08, "learning_rate": 1.9867525554489814e-06, "loss": 0.8042, "step": 3134 }, { "epoch": 0.08, "learning_rate": 1.9867390847871607e-06, "loss": 0.957, "step": 3135 }, { "epoch": 0.08, "learning_rate": 1.9867256073257136e-06, "loss": 0.875, "step": 3136 }, { "epoch": 0.08, "learning_rate": 1.986712123064733e-06, "loss": 1.0723, "step": 3137 }, { "epoch": 0.08, "learning_rate": 1.986698632004311e-06, "loss": 1.0518, "step": 3138 }, { "epoch": 0.08, "learning_rate": 1.986685134144542e-06, "loss": 1.0625, "step": 3139 }, { "epoch": 0.08, "learning_rate": 1.986671629485518e-06, "loss": 0.6519, "step": 3140 }, { "epoch": 0.08, "learning_rate": 1.9866581180273324e-06, "loss": 0.7412, "step": 3141 }, { "epoch": 0.08, "learning_rate": 1.986644599770078e-06, "loss": 0.8452, "step": 3142 }, { "epoch": 0.08, "learning_rate": 1.986631074713849e-06, "loss": 0.8408, "step": 3143 }, { "epoch": 0.08, "learning_rate": 1.986617542858737e-06, "loss": 1.1816, "step": 3144 }, { "epoch": 0.08, "learning_rate": 1.986604004204836e-06, "loss": 1.04, "step": 3145 }, { "epoch": 0.08, "learning_rate": 1.98659045875224e-06, "loss": 0.9365, "step": 3146 }, { "epoch": 0.08, "learning_rate": 1.986576906501041e-06, "loss": 0.917, "step": 3147 }, { "epoch": 0.08, "learning_rate": 1.9865633474513338e-06, "loss": 1.0195, "step": 3148 }, { "epoch": 0.08, "learning_rate": 1.9865497816032107e-06, "loss": 1.0205, "step": 3149 }, { "epoch": 0.08, "learning_rate": 1.9865362089567657e-06, "loss": 0.9844, "step": 3150 }, { "epoch": 0.08, "learning_rate": 1.9865226295120926e-06, "loss": 0.8721, "step": 3151 }, { "epoch": 0.08, "learning_rate": 1.986509043269284e-06, "loss": 0.958, "step": 3152 }, { "epoch": 0.08, "learning_rate": 1.9864954502284344e-06, "loss": 1.1016, "step": 3153 }, { "epoch": 0.08, "learning_rate": 1.9864818503896372e-06, "loss": 0.9072, "step": 3154 }, { "epoch": 0.08, "learning_rate": 1.986468243752986e-06, "loss": 1.0371, "step": 3155 }, { "epoch": 0.08, "learning_rate": 1.986454630318575e-06, "loss": 0.9043, "step": 3156 }, { "epoch": 0.08, "learning_rate": 1.9864410100864974e-06, "loss": 1.0107, "step": 3157 }, { "epoch": 0.08, "learning_rate": 1.9864273830568474e-06, "loss": 0.9404, "step": 3158 }, { "epoch": 0.08, "learning_rate": 1.9864137492297187e-06, "loss": 0.7251, "step": 3159 }, { "epoch": 0.08, "learning_rate": 1.986400108605205e-06, "loss": 1.1445, "step": 3160 }, { "epoch": 0.08, "learning_rate": 1.9863864611834018e-06, "loss": 0.9609, "step": 3161 }, { "epoch": 0.08, "learning_rate": 1.9863728069644016e-06, "loss": 0.7861, "step": 3162 }, { "epoch": 0.08, "learning_rate": 1.9863591459482988e-06, "loss": 0.8867, "step": 3163 }, { "epoch": 0.08, "learning_rate": 1.9863454781351877e-06, "loss": 1.2627, "step": 3164 }, { "epoch": 0.08, "learning_rate": 1.9863318035251623e-06, "loss": 0.8125, "step": 3165 }, { "epoch": 0.08, "learning_rate": 1.986318122118317e-06, "loss": 0.9907, "step": 3166 }, { "epoch": 0.08, "learning_rate": 1.9863044339147463e-06, "loss": 1.0605, "step": 3167 }, { "epoch": 0.08, "learning_rate": 1.9862907389145444e-06, "loss": 0.8779, "step": 3168 }, { "epoch": 0.08, "learning_rate": 1.9862770371178053e-06, "loss": 0.8242, "step": 3169 }, { "epoch": 0.08, "learning_rate": 1.986263328524624e-06, "loss": 0.835, "step": 3170 }, { "epoch": 0.08, "learning_rate": 1.986249613135094e-06, "loss": 1.1562, "step": 3171 }, { "epoch": 0.08, "learning_rate": 1.986235890949311e-06, "loss": 0.8447, "step": 3172 }, { "epoch": 0.08, "learning_rate": 1.9862221619673688e-06, "loss": 0.8057, "step": 3173 }, { "epoch": 0.08, "learning_rate": 1.9862084261893627e-06, "loss": 0.8965, "step": 3174 }, { "epoch": 0.08, "learning_rate": 1.9861946836153864e-06, "loss": 1.126, "step": 3175 }, { "epoch": 0.08, "learning_rate": 1.986180934245535e-06, "loss": 1.1123, "step": 3176 }, { "epoch": 0.08, "learning_rate": 1.986167178079904e-06, "loss": 0.9248, "step": 3177 }, { "epoch": 0.08, "learning_rate": 1.986153415118587e-06, "loss": 0.9414, "step": 3178 }, { "epoch": 0.08, "learning_rate": 1.9861396453616793e-06, "loss": 1.0205, "step": 3179 }, { "epoch": 0.08, "learning_rate": 1.986125868809276e-06, "loss": 0.9067, "step": 3180 }, { "epoch": 0.08, "learning_rate": 1.986112085461472e-06, "loss": 0.9961, "step": 3181 }, { "epoch": 0.08, "learning_rate": 1.986098295318362e-06, "loss": 0.7607, "step": 3182 }, { "epoch": 0.08, "learning_rate": 1.9860844983800415e-06, "loss": 1.1641, "step": 3183 }, { "epoch": 0.08, "learning_rate": 1.9860706946466048e-06, "loss": 0.9355, "step": 3184 }, { "epoch": 0.08, "learning_rate": 1.9860568841181478e-06, "loss": 0.8818, "step": 3185 }, { "epoch": 0.08, "learning_rate": 1.9860430667947654e-06, "loss": 0.7275, "step": 3186 }, { "epoch": 0.08, "learning_rate": 1.9860292426765524e-06, "loss": 1.0098, "step": 3187 }, { "epoch": 0.08, "learning_rate": 1.986015411763605e-06, "loss": 0.8857, "step": 3188 }, { "epoch": 0.08, "learning_rate": 1.986001574056018e-06, "loss": 0.7896, "step": 3189 }, { "epoch": 0.08, "learning_rate": 1.985987729553886e-06, "loss": 0.7422, "step": 3190 }, { "epoch": 0.08, "learning_rate": 1.9859738782573053e-06, "loss": 0.9219, "step": 3191 }, { "epoch": 0.08, "learning_rate": 1.9859600201663716e-06, "loss": 0.9688, "step": 3192 }, { "epoch": 0.08, "learning_rate": 1.9859461552811795e-06, "loss": 0.666, "step": 3193 }, { "epoch": 0.08, "learning_rate": 1.985932283601825e-06, "loss": 0.8091, "step": 3194 }, { "epoch": 0.08, "learning_rate": 1.985918405128404e-06, "loss": 0.8887, "step": 3195 }, { "epoch": 0.08, "learning_rate": 1.9859045198610114e-06, "loss": 0.9834, "step": 3196 }, { "epoch": 0.08, "learning_rate": 1.985890627799744e-06, "loss": 1.0039, "step": 3197 }, { "epoch": 0.08, "learning_rate": 1.9858767289446965e-06, "loss": 0.9893, "step": 3198 }, { "epoch": 0.08, "learning_rate": 1.9858628232959646e-06, "loss": 0.9639, "step": 3199 }, { "epoch": 0.08, "learning_rate": 1.985848910853645e-06, "loss": 0.9043, "step": 3200 }, { "epoch": 0.08, "learning_rate": 1.985834991617833e-06, "loss": 0.7871, "step": 3201 }, { "epoch": 0.08, "learning_rate": 1.9858210655886246e-06, "loss": 0.7026, "step": 3202 }, { "epoch": 0.08, "learning_rate": 1.985807132766116e-06, "loss": 1.1328, "step": 3203 }, { "epoch": 0.08, "learning_rate": 1.985793193150403e-06, "loss": 0.8682, "step": 3204 }, { "epoch": 0.08, "learning_rate": 1.985779246741581e-06, "loss": 0.916, "step": 3205 }, { "epoch": 0.08, "learning_rate": 1.9857652935397475e-06, "loss": 0.6958, "step": 3206 }, { "epoch": 0.08, "learning_rate": 1.9857513335449976e-06, "loss": 0.7896, "step": 3207 }, { "epoch": 0.08, "learning_rate": 1.9857373667574276e-06, "loss": 1.0303, "step": 3208 }, { "epoch": 0.08, "learning_rate": 1.9857233931771344e-06, "loss": 0.9863, "step": 3209 }, { "epoch": 0.08, "learning_rate": 1.985709412804214e-06, "loss": 0.7676, "step": 3210 }, { "epoch": 0.08, "learning_rate": 1.985695425638762e-06, "loss": 0.8838, "step": 3211 }, { "epoch": 0.08, "learning_rate": 1.9856814316808756e-06, "loss": 1.0674, "step": 3212 }, { "epoch": 0.08, "learning_rate": 1.985667430930651e-06, "loss": 0.8101, "step": 3213 }, { "epoch": 0.08, "learning_rate": 1.9856534233881846e-06, "loss": 0.6655, "step": 3214 }, { "epoch": 0.08, "learning_rate": 1.9856394090535734e-06, "loss": 0.9443, "step": 3215 }, { "epoch": 0.08, "learning_rate": 1.985625387926913e-06, "loss": 0.8696, "step": 3216 }, { "epoch": 0.08, "learning_rate": 1.985611360008301e-06, "loss": 0.9023, "step": 3217 }, { "epoch": 0.08, "learning_rate": 1.9855973252978338e-06, "loss": 0.9639, "step": 3218 }, { "epoch": 0.08, "learning_rate": 1.985583283795608e-06, "loss": 0.8926, "step": 3219 }, { "epoch": 0.08, "learning_rate": 1.98556923550172e-06, "loss": 0.7139, "step": 3220 }, { "epoch": 0.08, "learning_rate": 1.985555180416267e-06, "loss": 0.8086, "step": 3221 }, { "epoch": 0.08, "learning_rate": 1.985541118539346e-06, "loss": 0.7598, "step": 3222 }, { "epoch": 0.08, "learning_rate": 1.9855270498710536e-06, "loss": 0.9248, "step": 3223 }, { "epoch": 0.08, "learning_rate": 1.985512974411487e-06, "loss": 0.6973, "step": 3224 }, { "epoch": 0.08, "learning_rate": 1.985498892160743e-06, "loss": 0.7969, "step": 3225 }, { "epoch": 0.08, "learning_rate": 1.9854848031189183e-06, "loss": 0.8638, "step": 3226 }, { "epoch": 0.08, "learning_rate": 1.985470707286111e-06, "loss": 1.0127, "step": 3227 }, { "epoch": 0.08, "learning_rate": 1.985456604662417e-06, "loss": 1.1738, "step": 3228 }, { "epoch": 0.08, "learning_rate": 1.9854424952479343e-06, "loss": 0.8657, "step": 3229 }, { "epoch": 0.08, "learning_rate": 1.98542837904276e-06, "loss": 0.7275, "step": 3230 }, { "epoch": 0.08, "learning_rate": 1.9854142560469914e-06, "loss": 0.8442, "step": 3231 }, { "epoch": 0.08, "learning_rate": 1.9854001262607255e-06, "loss": 0.9961, "step": 3232 }, { "epoch": 0.08, "learning_rate": 1.98538598968406e-06, "loss": 1.125, "step": 3233 }, { "epoch": 0.08, "learning_rate": 1.9853718463170925e-06, "loss": 1.0234, "step": 3234 }, { "epoch": 0.08, "learning_rate": 1.9853576961599198e-06, "loss": 1.0391, "step": 3235 }, { "epoch": 0.08, "learning_rate": 1.9853435392126395e-06, "loss": 1.0684, "step": 3236 }, { "epoch": 0.08, "learning_rate": 1.98532937547535e-06, "loss": 0.8672, "step": 3237 }, { "epoch": 0.08, "learning_rate": 1.985315204948148e-06, "loss": 1.0742, "step": 3238 }, { "epoch": 0.08, "learning_rate": 1.9853010276311318e-06, "loss": 0.9111, "step": 3239 }, { "epoch": 0.08, "learning_rate": 1.9852868435243986e-06, "loss": 0.8818, "step": 3240 }, { "epoch": 0.08, "learning_rate": 1.9852726526280463e-06, "loss": 1.0518, "step": 3241 }, { "epoch": 0.08, "learning_rate": 1.9852584549421727e-06, "loss": 0.8701, "step": 3242 }, { "epoch": 0.08, "learning_rate": 1.9852442504668755e-06, "loss": 0.9092, "step": 3243 }, { "epoch": 0.08, "learning_rate": 1.985230039202253e-06, "loss": 0.9404, "step": 3244 }, { "epoch": 0.08, "learning_rate": 1.985215821148403e-06, "loss": 0.8145, "step": 3245 }, { "epoch": 0.08, "learning_rate": 1.9852015963054226e-06, "loss": 0.8525, "step": 3246 }, { "epoch": 0.08, "learning_rate": 1.985187364673411e-06, "loss": 0.8701, "step": 3247 }, { "epoch": 0.08, "learning_rate": 1.985173126252466e-06, "loss": 0.9111, "step": 3248 }, { "epoch": 0.08, "learning_rate": 1.9851588810426853e-06, "loss": 1.0, "step": 3249 }, { "epoch": 0.08, "learning_rate": 1.9851446290441675e-06, "loss": 1.0293, "step": 3250 }, { "epoch": 0.08, "learning_rate": 1.9851303702570102e-06, "loss": 0.8877, "step": 3251 }, { "epoch": 0.08, "learning_rate": 1.9851161046813125e-06, "loss": 0.9023, "step": 3252 }, { "epoch": 0.08, "learning_rate": 1.985101832317172e-06, "loss": 0.8955, "step": 3253 }, { "epoch": 0.08, "learning_rate": 1.9850875531646877e-06, "loss": 0.6221, "step": 3254 }, { "epoch": 0.08, "learning_rate": 1.9850732672239576e-06, "loss": 0.8716, "step": 3255 }, { "epoch": 0.08, "learning_rate": 1.98505897449508e-06, "loss": 0.9668, "step": 3256 }, { "epoch": 0.08, "learning_rate": 1.9850446749781533e-06, "loss": 0.8262, "step": 3257 }, { "epoch": 0.08, "learning_rate": 1.985030368673277e-06, "loss": 0.8501, "step": 3258 }, { "epoch": 0.08, "learning_rate": 1.9850160555805483e-06, "loss": 0.9023, "step": 3259 }, { "epoch": 0.08, "learning_rate": 1.985001735700067e-06, "loss": 1.0498, "step": 3260 }, { "epoch": 0.08, "learning_rate": 1.9849874090319306e-06, "loss": 0.9395, "step": 3261 }, { "epoch": 0.08, "learning_rate": 1.9849730755762394e-06, "loss": 1.0752, "step": 3262 }, { "epoch": 0.08, "learning_rate": 1.9849587353330906e-06, "loss": 0.8926, "step": 3263 }, { "epoch": 0.08, "learning_rate": 1.9849443883025842e-06, "loss": 1.0176, "step": 3264 }, { "epoch": 0.08, "learning_rate": 1.9849300344848185e-06, "loss": 0.9248, "step": 3265 }, { "epoch": 0.08, "learning_rate": 1.984915673879892e-06, "loss": 0.7703, "step": 3266 }, { "epoch": 0.08, "learning_rate": 1.9849013064879047e-06, "loss": 0.9951, "step": 3267 }, { "epoch": 0.08, "learning_rate": 1.984886932308955e-06, "loss": 1.0205, "step": 3268 }, { "epoch": 0.08, "learning_rate": 1.984872551343142e-06, "loss": 1.1758, "step": 3269 }, { "epoch": 0.08, "learning_rate": 1.9848581635905647e-06, "loss": 1.0186, "step": 3270 }, { "epoch": 0.08, "learning_rate": 1.984843769051322e-06, "loss": 0.7812, "step": 3271 }, { "epoch": 0.08, "learning_rate": 1.984829367725514e-06, "loss": 0.8828, "step": 3272 }, { "epoch": 0.08, "learning_rate": 1.9848149596132393e-06, "loss": 0.8276, "step": 3273 }, { "epoch": 0.08, "learning_rate": 1.984800544714597e-06, "loss": 0.8643, "step": 3274 }, { "epoch": 0.08, "learning_rate": 1.984786123029687e-06, "loss": 1.0312, "step": 3275 }, { "epoch": 0.08, "learning_rate": 1.9847716945586085e-06, "loss": 0.998, "step": 3276 }, { "epoch": 0.08, "learning_rate": 1.9847572593014604e-06, "loss": 0.9189, "step": 3277 }, { "epoch": 0.08, "learning_rate": 1.984742817258343e-06, "loss": 1.2344, "step": 3278 }, { "epoch": 0.08, "learning_rate": 1.984728368429355e-06, "loss": 1.0449, "step": 3279 }, { "epoch": 0.08, "learning_rate": 1.9847139128145966e-06, "loss": 0.8521, "step": 3280 }, { "epoch": 0.08, "learning_rate": 1.984699450414167e-06, "loss": 1.0049, "step": 3281 }, { "epoch": 0.08, "learning_rate": 1.9846849812281664e-06, "loss": 0.8672, "step": 3282 }, { "epoch": 0.08, "learning_rate": 1.984670505256694e-06, "loss": 0.8438, "step": 3283 }, { "epoch": 0.08, "learning_rate": 1.9846560224998496e-06, "loss": 1.0605, "step": 3284 }, { "epoch": 0.08, "learning_rate": 1.984641532957733e-06, "loss": 1.0947, "step": 3285 }, { "epoch": 0.08, "learning_rate": 1.9846270366304443e-06, "loss": 0.5449, "step": 3286 }, { "epoch": 0.08, "learning_rate": 1.9846125335180835e-06, "loss": 1.2373, "step": 3287 }, { "epoch": 0.08, "learning_rate": 1.98459802362075e-06, "loss": 1.0996, "step": 3288 }, { "epoch": 0.08, "learning_rate": 1.984583506938544e-06, "loss": 0.9277, "step": 3289 }, { "epoch": 0.08, "learning_rate": 1.984568983471566e-06, "loss": 0.917, "step": 3290 }, { "epoch": 0.08, "learning_rate": 1.9845544532199155e-06, "loss": 0.9365, "step": 3291 }, { "epoch": 0.08, "learning_rate": 1.984539916183693e-06, "loss": 1.1699, "step": 3292 }, { "epoch": 0.08, "learning_rate": 1.984525372362998e-06, "loss": 0.8091, "step": 3293 }, { "epoch": 0.08, "learning_rate": 1.9845108217579314e-06, "loss": 0.8423, "step": 3294 }, { "epoch": 0.08, "learning_rate": 1.984496264368594e-06, "loss": 0.7661, "step": 3295 }, { "epoch": 0.08, "learning_rate": 1.9844817001950843e-06, "loss": 0.8066, "step": 3296 }, { "epoch": 0.08, "learning_rate": 1.984467129237504e-06, "loss": 0.8682, "step": 3297 }, { "epoch": 0.08, "learning_rate": 1.9844525514959536e-06, "loss": 0.8389, "step": 3298 }, { "epoch": 0.08, "learning_rate": 1.9844379669705336e-06, "loss": 0.8477, "step": 3299 }, { "epoch": 0.08, "learning_rate": 1.9844233756613436e-06, "loss": 1.127, "step": 3300 }, { "epoch": 0.08, "learning_rate": 1.984408777568485e-06, "loss": 0.9746, "step": 3301 }, { "epoch": 0.08, "learning_rate": 1.9843941726920577e-06, "loss": 1.208, "step": 3302 }, { "epoch": 0.08, "learning_rate": 1.984379561032163e-06, "loss": 1.166, "step": 3303 }, { "epoch": 0.08, "learning_rate": 1.984364942588901e-06, "loss": 0.8877, "step": 3304 }, { "epoch": 0.08, "learning_rate": 1.984350317362373e-06, "loss": 1.1562, "step": 3305 }, { "epoch": 0.08, "learning_rate": 1.9843356853526795e-06, "loss": 0.9668, "step": 3306 }, { "epoch": 0.08, "learning_rate": 1.9843210465599215e-06, "loss": 0.8662, "step": 3307 }, { "epoch": 0.08, "learning_rate": 1.9843064009841995e-06, "loss": 0.9365, "step": 3308 }, { "epoch": 0.08, "learning_rate": 1.9842917486256146e-06, "loss": 0.9268, "step": 3309 }, { "epoch": 0.08, "learning_rate": 1.984277089484268e-06, "loss": 0.9473, "step": 3310 }, { "epoch": 0.08, "learning_rate": 1.9842624235602606e-06, "loss": 0.8711, "step": 3311 }, { "epoch": 0.08, "learning_rate": 1.9842477508536934e-06, "loss": 1.1396, "step": 3312 }, { "epoch": 0.08, "learning_rate": 1.984233071364667e-06, "loss": 0.9805, "step": 3313 }, { "epoch": 0.08, "learning_rate": 1.984218385093284e-06, "loss": 0.8716, "step": 3314 }, { "epoch": 0.08, "learning_rate": 1.984203692039644e-06, "loss": 0.8896, "step": 3315 }, { "epoch": 0.08, "learning_rate": 1.984188992203849e-06, "loss": 0.8955, "step": 3316 }, { "epoch": 0.09, "learning_rate": 1.984174285586e-06, "loss": 0.9785, "step": 3317 }, { "epoch": 0.09, "learning_rate": 1.9841595721861993e-06, "loss": 0.8145, "step": 3318 }, { "epoch": 0.09, "learning_rate": 1.984144852004547e-06, "loss": 0.8926, "step": 3319 }, { "epoch": 0.09, "learning_rate": 1.984130125041145e-06, "loss": 0.9863, "step": 3320 }, { "epoch": 0.09, "learning_rate": 1.984115391296095e-06, "loss": 0.9766, "step": 3321 }, { "epoch": 0.09, "learning_rate": 1.9841006507694987e-06, "loss": 0.9287, "step": 3322 }, { "epoch": 0.09, "learning_rate": 1.984085903461457e-06, "loss": 1.1035, "step": 3323 }, { "epoch": 0.09, "learning_rate": 1.984071149372072e-06, "loss": 1.0615, "step": 3324 }, { "epoch": 0.09, "learning_rate": 1.9840563885014456e-06, "loss": 0.9932, "step": 3325 }, { "epoch": 0.09, "learning_rate": 1.984041620849679e-06, "loss": 0.8818, "step": 3326 }, { "epoch": 0.09, "learning_rate": 1.9840268464168738e-06, "loss": 0.9248, "step": 3327 }, { "epoch": 0.09, "learning_rate": 1.9840120652031325e-06, "loss": 0.9883, "step": 3328 }, { "epoch": 0.09, "learning_rate": 1.9839972772085566e-06, "loss": 0.9463, "step": 3329 }, { "epoch": 0.09, "learning_rate": 1.983982482433248e-06, "loss": 1.0312, "step": 3330 }, { "epoch": 0.09, "learning_rate": 1.983967680877309e-06, "loss": 0.8433, "step": 3331 }, { "epoch": 0.09, "learning_rate": 1.983952872540841e-06, "loss": 0.8613, "step": 3332 }, { "epoch": 0.09, "learning_rate": 1.983938057423946e-06, "loss": 1.041, "step": 3333 }, { "epoch": 0.09, "learning_rate": 1.983923235526727e-06, "loss": 0.874, "step": 3334 }, { "epoch": 0.09, "learning_rate": 1.983908406849285e-06, "loss": 0.8486, "step": 3335 }, { "epoch": 0.09, "learning_rate": 1.9838935713917234e-06, "loss": 0.7642, "step": 3336 }, { "epoch": 0.09, "learning_rate": 1.983878729154143e-06, "loss": 0.9082, "step": 3337 }, { "epoch": 0.09, "learning_rate": 1.9838638801366476e-06, "loss": 0.8296, "step": 3338 }, { "epoch": 0.09, "learning_rate": 1.9838490243393383e-06, "loss": 1.1025, "step": 3339 }, { "epoch": 0.09, "learning_rate": 1.983834161762318e-06, "loss": 0.9434, "step": 3340 }, { "epoch": 0.09, "learning_rate": 1.983819292405689e-06, "loss": 0.9658, "step": 3341 }, { "epoch": 0.09, "learning_rate": 1.983804416269554e-06, "loss": 0.7695, "step": 3342 }, { "epoch": 0.09, "learning_rate": 1.9837895333540153e-06, "loss": 0.8457, "step": 3343 }, { "epoch": 0.09, "learning_rate": 1.983774643659175e-06, "loss": 0.9414, "step": 3344 }, { "epoch": 0.09, "learning_rate": 1.983759747185137e-06, "loss": 1.1035, "step": 3345 }, { "epoch": 0.09, "learning_rate": 1.9837448439320025e-06, "loss": 1.0527, "step": 3346 }, { "epoch": 0.09, "learning_rate": 1.9837299338998753e-06, "loss": 0.9824, "step": 3347 }, { "epoch": 0.09, "learning_rate": 1.9837150170888575e-06, "loss": 0.9062, "step": 3348 }, { "epoch": 0.09, "learning_rate": 1.9837000934990523e-06, "loss": 0.9463, "step": 3349 }, { "epoch": 0.09, "learning_rate": 1.983685163130562e-06, "loss": 0.9443, "step": 3350 }, { "epoch": 0.09, "learning_rate": 1.98367022598349e-06, "loss": 1.0566, "step": 3351 }, { "epoch": 0.09, "learning_rate": 1.9836552820579387e-06, "loss": 0.8633, "step": 3352 }, { "epoch": 0.09, "learning_rate": 1.983640331354012e-06, "loss": 1.0088, "step": 3353 }, { "epoch": 0.09, "learning_rate": 1.983625373871812e-06, "loss": 1.1172, "step": 3354 }, { "epoch": 0.09, "learning_rate": 1.983610409611442e-06, "loss": 0.9316, "step": 3355 }, { "epoch": 0.09, "learning_rate": 1.9835954385730056e-06, "loss": 0.8877, "step": 3356 }, { "epoch": 0.09, "learning_rate": 1.9835804607566056e-06, "loss": 0.8691, "step": 3357 }, { "epoch": 0.09, "learning_rate": 1.983565476162345e-06, "loss": 0.9854, "step": 3358 }, { "epoch": 0.09, "learning_rate": 1.9835504847903274e-06, "loss": 0.8721, "step": 3359 }, { "epoch": 0.09, "learning_rate": 1.983535486640656e-06, "loss": 0.8423, "step": 3360 }, { "epoch": 0.09, "learning_rate": 1.983520481713434e-06, "loss": 1.0791, "step": 3361 }, { "epoch": 0.09, "learning_rate": 1.983505470008765e-06, "loss": 0.8301, "step": 3362 }, { "epoch": 0.09, "learning_rate": 1.983490451526752e-06, "loss": 1.0576, "step": 3363 }, { "epoch": 0.09, "learning_rate": 1.9834754262674995e-06, "loss": 1.0068, "step": 3364 }, { "epoch": 0.09, "learning_rate": 1.98346039423111e-06, "loss": 0.9512, "step": 3365 }, { "epoch": 0.09, "learning_rate": 1.9834453554176874e-06, "loss": 0.998, "step": 3366 }, { "epoch": 0.09, "learning_rate": 1.9834303098273357e-06, "loss": 0.9092, "step": 3367 }, { "epoch": 0.09, "learning_rate": 1.9834152574601584e-06, "loss": 0.8926, "step": 3368 }, { "epoch": 0.09, "learning_rate": 1.983400198316259e-06, "loss": 0.9404, "step": 3369 }, { "epoch": 0.09, "learning_rate": 1.983385132395741e-06, "loss": 0.8965, "step": 3370 }, { "epoch": 0.09, "learning_rate": 1.9833700596987093e-06, "loss": 0.9102, "step": 3371 }, { "epoch": 0.09, "learning_rate": 1.983354980225267e-06, "loss": 1.0439, "step": 3372 }, { "epoch": 0.09, "learning_rate": 1.9833398939755176e-06, "loss": 0.9551, "step": 3373 }, { "epoch": 0.09, "learning_rate": 1.9833248009495658e-06, "loss": 0.9688, "step": 3374 }, { "epoch": 0.09, "learning_rate": 1.9833097011475155e-06, "loss": 0.7656, "step": 3375 }, { "epoch": 0.09, "learning_rate": 1.98329459456947e-06, "loss": 0.8447, "step": 3376 }, { "epoch": 0.09, "learning_rate": 1.9832794812155353e-06, "loss": 1.0879, "step": 3377 }, { "epoch": 0.09, "learning_rate": 1.9832643610858133e-06, "loss": 1.123, "step": 3378 }, { "epoch": 0.09, "learning_rate": 1.9832492341804095e-06, "loss": 0.9346, "step": 3379 }, { "epoch": 0.09, "learning_rate": 1.983234100499428e-06, "loss": 0.9829, "step": 3380 }, { "epoch": 0.09, "learning_rate": 1.983218960042972e-06, "loss": 0.8594, "step": 3381 }, { "epoch": 0.09, "learning_rate": 1.9832038128111473e-06, "loss": 0.8994, "step": 3382 }, { "epoch": 0.09, "learning_rate": 1.983188658804058e-06, "loss": 1.0859, "step": 3383 }, { "epoch": 0.09, "learning_rate": 1.983173498021808e-06, "loss": 1.0703, "step": 3384 }, { "epoch": 0.09, "learning_rate": 1.983158330464502e-06, "loss": 1.0625, "step": 3385 }, { "epoch": 0.09, "learning_rate": 1.983143156132244e-06, "loss": 1.0137, "step": 3386 }, { "epoch": 0.09, "learning_rate": 1.9831279750251396e-06, "loss": 0.9873, "step": 3387 }, { "epoch": 0.09, "learning_rate": 1.983112787143293e-06, "loss": 0.9355, "step": 3388 }, { "epoch": 0.09, "learning_rate": 1.9830975924868083e-06, "loss": 0.7539, "step": 3389 }, { "epoch": 0.09, "learning_rate": 1.9830823910557914e-06, "loss": 0.8418, "step": 3390 }, { "epoch": 0.09, "learning_rate": 1.9830671828503456e-06, "loss": 0.7686, "step": 3391 }, { "epoch": 0.09, "learning_rate": 1.9830519678705767e-06, "loss": 0.9814, "step": 3392 }, { "epoch": 0.09, "learning_rate": 1.983036746116589e-06, "loss": 0.8325, "step": 3393 }, { "epoch": 0.09, "learning_rate": 1.983021517588488e-06, "loss": 0.7979, "step": 3394 }, { "epoch": 0.09, "learning_rate": 1.983006282286378e-06, "loss": 1.0898, "step": 3395 }, { "epoch": 0.09, "learning_rate": 1.982991040210365e-06, "loss": 0.9238, "step": 3396 }, { "epoch": 0.09, "learning_rate": 1.9829757913605526e-06, "loss": 0.9756, "step": 3397 }, { "epoch": 0.09, "learning_rate": 1.9829605357370466e-06, "loss": 0.9873, "step": 3398 }, { "epoch": 0.09, "learning_rate": 1.9829452733399523e-06, "loss": 0.6626, "step": 3399 }, { "epoch": 0.09, "learning_rate": 1.982930004169375e-06, "loss": 0.9766, "step": 3400 }, { "epoch": 0.09, "learning_rate": 1.982914728225419e-06, "loss": 0.6255, "step": 3401 }, { "epoch": 0.09, "learning_rate": 1.9828994455081907e-06, "loss": 0.9238, "step": 3402 }, { "epoch": 0.09, "learning_rate": 1.9828841560177947e-06, "loss": 1.0459, "step": 3403 }, { "epoch": 0.09, "learning_rate": 1.9828688597543365e-06, "loss": 1.1904, "step": 3404 }, { "epoch": 0.09, "learning_rate": 1.9828535567179216e-06, "loss": 0.897, "step": 3405 }, { "epoch": 0.09, "learning_rate": 1.9828382469086554e-06, "loss": 1.0635, "step": 3406 }, { "epoch": 0.09, "learning_rate": 1.9828229303266437e-06, "loss": 0.9521, "step": 3407 }, { "epoch": 0.09, "learning_rate": 1.9828076069719916e-06, "loss": 0.9014, "step": 3408 }, { "epoch": 0.09, "learning_rate": 1.9827922768448046e-06, "loss": 0.9609, "step": 3409 }, { "epoch": 0.09, "learning_rate": 1.9827769399451886e-06, "loss": 0.9697, "step": 3410 }, { "epoch": 0.09, "learning_rate": 1.9827615962732498e-06, "loss": 0.8291, "step": 3411 }, { "epoch": 0.09, "learning_rate": 1.982746245829093e-06, "loss": 0.8745, "step": 3412 }, { "epoch": 0.09, "learning_rate": 1.9827308886128244e-06, "loss": 1.0225, "step": 3413 }, { "epoch": 0.09, "learning_rate": 1.9827155246245497e-06, "loss": 0.7676, "step": 3414 }, { "epoch": 0.09, "learning_rate": 1.9827001538643752e-06, "loss": 0.9854, "step": 3415 }, { "epoch": 0.09, "learning_rate": 1.9826847763324066e-06, "loss": 1.0684, "step": 3416 }, { "epoch": 0.09, "learning_rate": 1.9826693920287496e-06, "loss": 0.8672, "step": 3417 }, { "epoch": 0.09, "learning_rate": 1.98265400095351e-06, "loss": 0.9668, "step": 3418 }, { "epoch": 0.09, "learning_rate": 1.9826386031067946e-06, "loss": 0.8311, "step": 3419 }, { "epoch": 0.09, "learning_rate": 1.9826231984887096e-06, "loss": 1.0596, "step": 3420 }, { "epoch": 0.09, "learning_rate": 1.98260778709936e-06, "loss": 0.8618, "step": 3421 }, { "epoch": 0.09, "learning_rate": 1.982592368938853e-06, "loss": 0.8994, "step": 3422 }, { "epoch": 0.09, "learning_rate": 1.9825769440072947e-06, "loss": 0.998, "step": 3423 }, { "epoch": 0.09, "learning_rate": 1.9825615123047913e-06, "loss": 0.8701, "step": 3424 }, { "epoch": 0.09, "learning_rate": 1.9825460738314486e-06, "loss": 1.0703, "step": 3425 }, { "epoch": 0.09, "learning_rate": 1.9825306285873744e-06, "loss": 0.9551, "step": 3426 }, { "epoch": 0.09, "learning_rate": 1.982515176572673e-06, "loss": 1.0049, "step": 3427 }, { "epoch": 0.09, "learning_rate": 1.9824997177874533e-06, "loss": 0.9814, "step": 3428 }, { "epoch": 0.09, "learning_rate": 1.9824842522318195e-06, "loss": 0.9756, "step": 3429 }, { "epoch": 0.09, "learning_rate": 1.98246877990588e-06, "loss": 0.9854, "step": 3430 }, { "epoch": 0.09, "learning_rate": 1.9824533008097407e-06, "loss": 0.8311, "step": 3431 }, { "epoch": 0.09, "learning_rate": 1.9824378149435083e-06, "loss": 0.7773, "step": 3432 }, { "epoch": 0.09, "learning_rate": 1.9824223223072893e-06, "loss": 1.0459, "step": 3433 }, { "epoch": 0.09, "learning_rate": 1.982406822901191e-06, "loss": 1.1885, "step": 3434 }, { "epoch": 0.09, "learning_rate": 1.9823913167253195e-06, "loss": 0.8291, "step": 3435 }, { "epoch": 0.09, "learning_rate": 1.9823758037797818e-06, "loss": 0.7935, "step": 3436 }, { "epoch": 0.09, "learning_rate": 1.9823602840646856e-06, "loss": 0.668, "step": 3437 }, { "epoch": 0.09, "learning_rate": 1.9823447575801368e-06, "loss": 0.8765, "step": 3438 }, { "epoch": 0.09, "learning_rate": 1.982329224326243e-06, "loss": 1.0137, "step": 3439 }, { "epoch": 0.09, "learning_rate": 1.982313684303111e-06, "loss": 1.083, "step": 3440 }, { "epoch": 0.09, "learning_rate": 1.982298137510848e-06, "loss": 0.9062, "step": 3441 }, { "epoch": 0.09, "learning_rate": 1.9822825839495613e-06, "loss": 0.9541, "step": 3442 }, { "epoch": 0.09, "learning_rate": 1.982267023619358e-06, "loss": 0.9253, "step": 3443 }, { "epoch": 0.09, "learning_rate": 1.9822514565203448e-06, "loss": 0.9795, "step": 3444 }, { "epoch": 0.09, "learning_rate": 1.9822358826526298e-06, "loss": 1.0156, "step": 3445 }, { "epoch": 0.09, "learning_rate": 1.98222030201632e-06, "loss": 0.8994, "step": 3446 }, { "epoch": 0.09, "learning_rate": 1.982204714611522e-06, "loss": 0.854, "step": 3447 }, { "epoch": 0.09, "learning_rate": 1.9821891204383444e-06, "loss": 1.0479, "step": 3448 }, { "epoch": 0.09, "learning_rate": 1.982173519496894e-06, "loss": 1.0957, "step": 3449 }, { "epoch": 0.09, "learning_rate": 1.9821579117872787e-06, "loss": 1.2402, "step": 3450 }, { "epoch": 0.09, "learning_rate": 1.9821422973096054e-06, "loss": 0.9775, "step": 3451 }, { "epoch": 0.09, "learning_rate": 1.9821266760639826e-06, "loss": 0.9121, "step": 3452 }, { "epoch": 0.09, "learning_rate": 1.982111048050517e-06, "loss": 1.1973, "step": 3453 }, { "epoch": 0.09, "learning_rate": 1.982095413269317e-06, "loss": 0.9146, "step": 3454 }, { "epoch": 0.09, "learning_rate": 1.98207977172049e-06, "loss": 0.7881, "step": 3455 }, { "epoch": 0.09, "learning_rate": 1.982064123404144e-06, "loss": 0.8799, "step": 3456 }, { "epoch": 0.09, "learning_rate": 1.9820484683203867e-06, "loss": 0.9336, "step": 3457 }, { "epoch": 0.09, "learning_rate": 1.9820328064693257e-06, "loss": 0.8975, "step": 3458 }, { "epoch": 0.09, "learning_rate": 1.9820171378510695e-06, "loss": 0.8398, "step": 3459 }, { "epoch": 0.09, "learning_rate": 1.9820014624657257e-06, "loss": 0.8477, "step": 3460 }, { "epoch": 0.09, "learning_rate": 1.9819857803134025e-06, "loss": 0.9717, "step": 3461 }, { "epoch": 0.09, "learning_rate": 1.9819700913942077e-06, "loss": 1.125, "step": 3462 }, { "epoch": 0.09, "learning_rate": 1.9819543957082497e-06, "loss": 0.9927, "step": 3463 }, { "epoch": 0.09, "learning_rate": 1.9819386932556363e-06, "loss": 0.9736, "step": 3464 }, { "epoch": 0.09, "learning_rate": 1.981922984036476e-06, "loss": 0.8535, "step": 3465 }, { "epoch": 0.09, "learning_rate": 1.9819072680508776e-06, "loss": 0.8262, "step": 3466 }, { "epoch": 0.09, "learning_rate": 1.981891545298948e-06, "loss": 1.2754, "step": 3467 }, { "epoch": 0.09, "learning_rate": 1.9818758157807967e-06, "loss": 0.6885, "step": 3468 }, { "epoch": 0.09, "learning_rate": 1.9818600794965317e-06, "loss": 0.8311, "step": 3469 }, { "epoch": 0.09, "learning_rate": 1.9818443364462616e-06, "loss": 0.7017, "step": 3470 }, { "epoch": 0.09, "learning_rate": 1.9818285866300946e-06, "loss": 1.0674, "step": 3471 }, { "epoch": 0.09, "learning_rate": 1.9818128300481394e-06, "loss": 1.0508, "step": 3472 }, { "epoch": 0.09, "learning_rate": 1.9817970667005047e-06, "loss": 1.0576, "step": 3473 }, { "epoch": 0.09, "learning_rate": 1.981781296587299e-06, "loss": 0.8584, "step": 3474 }, { "epoch": 0.09, "learning_rate": 1.981765519708631e-06, "loss": 1.0112, "step": 3475 }, { "epoch": 0.09, "learning_rate": 1.9817497360646087e-06, "loss": 0.9346, "step": 3476 }, { "epoch": 0.09, "learning_rate": 1.9817339456553424e-06, "loss": 0.9209, "step": 3477 }, { "epoch": 0.09, "learning_rate": 1.9817181484809396e-06, "loss": 0.8174, "step": 3478 }, { "epoch": 0.09, "learning_rate": 1.9817023445415103e-06, "loss": 0.9424, "step": 3479 }, { "epoch": 0.09, "learning_rate": 1.9816865338371622e-06, "loss": 0.9639, "step": 3480 }, { "epoch": 0.09, "learning_rate": 1.9816707163680046e-06, "loss": 0.9839, "step": 3481 }, { "epoch": 0.09, "learning_rate": 1.981654892134147e-06, "loss": 1.0654, "step": 3482 }, { "epoch": 0.09, "learning_rate": 1.981639061135698e-06, "loss": 0.9609, "step": 3483 }, { "epoch": 0.09, "learning_rate": 1.9816232233727668e-06, "loss": 0.9932, "step": 3484 }, { "epoch": 0.09, "learning_rate": 1.9816073788454626e-06, "loss": 0.853, "step": 3485 }, { "epoch": 0.09, "learning_rate": 1.9815915275538944e-06, "loss": 0.8066, "step": 3486 }, { "epoch": 0.09, "learning_rate": 1.9815756694981718e-06, "loss": 1.3145, "step": 3487 }, { "epoch": 0.09, "learning_rate": 1.9815598046784036e-06, "loss": 0.8789, "step": 3488 }, { "epoch": 0.09, "learning_rate": 1.9815439330946996e-06, "loss": 0.9424, "step": 3489 }, { "epoch": 0.09, "learning_rate": 1.981528054747169e-06, "loss": 1.0273, "step": 3490 }, { "epoch": 0.09, "learning_rate": 1.981512169635921e-06, "loss": 1.2324, "step": 3491 }, { "epoch": 0.09, "learning_rate": 1.981496277761065e-06, "loss": 0.9609, "step": 3492 }, { "epoch": 0.09, "learning_rate": 1.9814803791227114e-06, "loss": 0.8066, "step": 3493 }, { "epoch": 0.09, "learning_rate": 1.9814644737209684e-06, "loss": 0.9458, "step": 3494 }, { "epoch": 0.09, "learning_rate": 1.9814485615559468e-06, "loss": 1.0811, "step": 3495 }, { "epoch": 0.09, "learning_rate": 1.9814326426277554e-06, "loss": 0.9805, "step": 3496 }, { "epoch": 0.09, "learning_rate": 1.981416716936504e-06, "loss": 1.1035, "step": 3497 }, { "epoch": 0.09, "learning_rate": 1.981400784482303e-06, "loss": 0.9629, "step": 3498 }, { "epoch": 0.09, "learning_rate": 1.981384845265262e-06, "loss": 0.7427, "step": 3499 }, { "epoch": 0.09, "learning_rate": 1.98136889928549e-06, "loss": 1.1133, "step": 3500 }, { "epoch": 0.09, "learning_rate": 1.9813529465430985e-06, "loss": 1.1309, "step": 3501 }, { "epoch": 0.09, "learning_rate": 1.9813369870381957e-06, "loss": 0.9766, "step": 3502 }, { "epoch": 0.09, "learning_rate": 1.9813210207708923e-06, "loss": 1.0459, "step": 3503 }, { "epoch": 0.09, "learning_rate": 1.9813050477412984e-06, "loss": 0.9219, "step": 3504 }, { "epoch": 0.09, "learning_rate": 1.981289067949524e-06, "loss": 0.8691, "step": 3505 }, { "epoch": 0.09, "learning_rate": 1.9812730813956792e-06, "loss": 0.9092, "step": 3506 }, { "epoch": 0.09, "learning_rate": 1.981257088079874e-06, "loss": 1.0566, "step": 3507 }, { "epoch": 0.09, "learning_rate": 1.9812410880022194e-06, "loss": 0.9473, "step": 3508 }, { "epoch": 0.09, "learning_rate": 1.9812250811628247e-06, "loss": 0.7129, "step": 3509 }, { "epoch": 0.09, "learning_rate": 1.9812090675618003e-06, "loss": 0.7993, "step": 3510 }, { "epoch": 0.09, "learning_rate": 1.981193047199257e-06, "loss": 1.1602, "step": 3511 }, { "epoch": 0.09, "learning_rate": 1.981177020075305e-06, "loss": 1.0273, "step": 3512 }, { "epoch": 0.09, "learning_rate": 1.981160986190055e-06, "loss": 0.9531, "step": 3513 }, { "epoch": 0.09, "learning_rate": 1.9811449455436167e-06, "loss": 0.8975, "step": 3514 }, { "epoch": 0.09, "learning_rate": 1.9811288981361017e-06, "loss": 1.0117, "step": 3515 }, { "epoch": 0.09, "learning_rate": 1.9811128439676196e-06, "loss": 0.5906, "step": 3516 }, { "epoch": 0.09, "learning_rate": 1.981096783038282e-06, "loss": 1.0488, "step": 3517 }, { "epoch": 0.09, "learning_rate": 1.9810807153481987e-06, "loss": 0.6719, "step": 3518 }, { "epoch": 0.09, "learning_rate": 1.9810646408974806e-06, "loss": 0.9736, "step": 3519 }, { "epoch": 0.09, "learning_rate": 1.981048559686239e-06, "loss": 0.9824, "step": 3520 }, { "epoch": 0.09, "learning_rate": 1.9810324717145844e-06, "loss": 1.1797, "step": 3521 }, { "epoch": 0.09, "learning_rate": 1.9810163769826275e-06, "loss": 1.0225, "step": 3522 }, { "epoch": 0.09, "learning_rate": 1.9810002754904795e-06, "loss": 0.9707, "step": 3523 }, { "epoch": 0.09, "learning_rate": 1.980984167238251e-06, "loss": 1.0215, "step": 3524 }, { "epoch": 0.09, "learning_rate": 1.980968052226053e-06, "loss": 0.7119, "step": 3525 }, { "epoch": 0.09, "learning_rate": 1.980951930453997e-06, "loss": 0.8613, "step": 3526 }, { "epoch": 0.09, "learning_rate": 1.9809358019221937e-06, "loss": 0.6729, "step": 3527 }, { "epoch": 0.09, "learning_rate": 1.9809196666307545e-06, "loss": 0.9814, "step": 3528 }, { "epoch": 0.09, "learning_rate": 1.9809035245797903e-06, "loss": 0.8408, "step": 3529 }, { "epoch": 0.09, "learning_rate": 1.980887375769413e-06, "loss": 0.9688, "step": 3530 }, { "epoch": 0.09, "learning_rate": 1.9808712201997327e-06, "loss": 1.0371, "step": 3531 }, { "epoch": 0.09, "learning_rate": 1.980855057870862e-06, "loss": 0.8848, "step": 3532 }, { "epoch": 0.09, "learning_rate": 1.9808388887829115e-06, "loss": 0.9922, "step": 3533 }, { "epoch": 0.09, "learning_rate": 1.9808227129359925e-06, "loss": 1.127, "step": 3534 }, { "epoch": 0.09, "learning_rate": 1.980806530330217e-06, "loss": 0.8213, "step": 3535 }, { "epoch": 0.09, "learning_rate": 1.980790340965696e-06, "loss": 0.8018, "step": 3536 }, { "epoch": 0.09, "learning_rate": 1.980774144842542e-06, "loss": 0.9824, "step": 3537 }, { "epoch": 0.09, "learning_rate": 1.9807579419608657e-06, "loss": 0.8525, "step": 3538 }, { "epoch": 0.09, "learning_rate": 1.9807417323207787e-06, "loss": 0.6411, "step": 3539 }, { "epoch": 0.09, "learning_rate": 1.9807255159223933e-06, "loss": 0.8428, "step": 3540 }, { "epoch": 0.09, "learning_rate": 1.980709292765821e-06, "loss": 0.9795, "step": 3541 }, { "epoch": 0.09, "learning_rate": 1.9806930628511732e-06, "loss": 0.957, "step": 3542 }, { "epoch": 0.09, "learning_rate": 1.9806768261785625e-06, "loss": 0.8936, "step": 3543 }, { "epoch": 0.09, "learning_rate": 1.9806605827481002e-06, "loss": 1.041, "step": 3544 }, { "epoch": 0.09, "learning_rate": 1.9806443325598985e-06, "loss": 1.0479, "step": 3545 }, { "epoch": 0.09, "learning_rate": 1.980628075614069e-06, "loss": 1.0342, "step": 3546 }, { "epoch": 0.09, "learning_rate": 1.9806118119107246e-06, "loss": 1.1104, "step": 3547 }, { "epoch": 0.09, "learning_rate": 1.980595541449976e-06, "loss": 0.9688, "step": 3548 }, { "epoch": 0.09, "learning_rate": 1.9805792642319366e-06, "loss": 0.9521, "step": 3549 }, { "epoch": 0.09, "learning_rate": 1.9805629802567184e-06, "loss": 0.9111, "step": 3550 }, { "epoch": 0.09, "learning_rate": 1.980546689524433e-06, "loss": 0.8965, "step": 3551 }, { "epoch": 0.09, "learning_rate": 1.9805303920351926e-06, "loss": 0.9395, "step": 3552 }, { "epoch": 0.09, "learning_rate": 1.9805140877891106e-06, "loss": 1.0391, "step": 3553 }, { "epoch": 0.09, "learning_rate": 1.980497776786298e-06, "loss": 0.8467, "step": 3554 }, { "epoch": 0.09, "learning_rate": 1.980481459026868e-06, "loss": 0.9619, "step": 3555 }, { "epoch": 0.09, "learning_rate": 1.9804651345109327e-06, "loss": 1.1328, "step": 3556 }, { "epoch": 0.09, "learning_rate": 1.9804488032386048e-06, "loss": 0.8101, "step": 3557 }, { "epoch": 0.09, "learning_rate": 1.980432465209997e-06, "loss": 1.0, "step": 3558 }, { "epoch": 0.09, "learning_rate": 1.9804161204252217e-06, "loss": 0.8623, "step": 3559 }, { "epoch": 0.09, "learning_rate": 1.9803997688843915e-06, "loss": 0.8398, "step": 3560 }, { "epoch": 0.09, "learning_rate": 1.980383410587619e-06, "loss": 1.0117, "step": 3561 }, { "epoch": 0.09, "learning_rate": 1.980367045535017e-06, "loss": 0.7671, "step": 3562 }, { "epoch": 0.09, "learning_rate": 1.9803506737266978e-06, "loss": 0.9961, "step": 3563 }, { "epoch": 0.09, "learning_rate": 1.9803342951627755e-06, "loss": 1.1045, "step": 3564 }, { "epoch": 0.09, "learning_rate": 1.980317909843362e-06, "loss": 1.0381, "step": 3565 }, { "epoch": 0.09, "learning_rate": 1.98030151776857e-06, "loss": 0.9795, "step": 3566 }, { "epoch": 0.09, "learning_rate": 1.980285118938513e-06, "loss": 0.9883, "step": 3567 }, { "epoch": 0.09, "learning_rate": 1.980268713353304e-06, "loss": 0.998, "step": 3568 }, { "epoch": 0.09, "learning_rate": 1.9802523010130557e-06, "loss": 0.832, "step": 3569 }, { "epoch": 0.09, "learning_rate": 1.9802358819178815e-06, "loss": 1.1631, "step": 3570 }, { "epoch": 0.09, "learning_rate": 1.9802194560678943e-06, "loss": 0.8584, "step": 3571 }, { "epoch": 0.09, "learning_rate": 1.9802030234632078e-06, "loss": 1.1465, "step": 3572 }, { "epoch": 0.09, "learning_rate": 1.980186584103934e-06, "loss": 1.0527, "step": 3573 }, { "epoch": 0.09, "learning_rate": 1.980170137990188e-06, "loss": 1.1035, "step": 3574 }, { "epoch": 0.09, "learning_rate": 1.9801536851220817e-06, "loss": 0.7163, "step": 3575 }, { "epoch": 0.09, "learning_rate": 1.9801372254997293e-06, "loss": 0.9834, "step": 3576 }, { "epoch": 0.09, "learning_rate": 1.9801207591232436e-06, "loss": 0.9434, "step": 3577 }, { "epoch": 0.09, "learning_rate": 1.980104285992738e-06, "loss": 0.9004, "step": 3578 }, { "epoch": 0.09, "learning_rate": 1.980087806108327e-06, "loss": 0.9707, "step": 3579 }, { "epoch": 0.09, "learning_rate": 1.9800713194701233e-06, "loss": 0.916, "step": 3580 }, { "epoch": 0.09, "learning_rate": 1.9800548260782406e-06, "loss": 0.9883, "step": 3581 }, { "epoch": 0.09, "learning_rate": 1.980038325932793e-06, "loss": 1.0332, "step": 3582 }, { "epoch": 0.09, "learning_rate": 1.9800218190338933e-06, "loss": 0.8501, "step": 3583 }, { "epoch": 0.09, "learning_rate": 1.9800053053816567e-06, "loss": 0.769, "step": 3584 }, { "epoch": 0.09, "learning_rate": 1.9799887849761954e-06, "loss": 0.9287, "step": 3585 }, { "epoch": 0.09, "learning_rate": 1.979972257817624e-06, "loss": 1.1221, "step": 3586 }, { "epoch": 0.09, "learning_rate": 1.979955723906057e-06, "loss": 0.9307, "step": 3587 }, { "epoch": 0.09, "learning_rate": 1.979939183241607e-06, "loss": 0.9766, "step": 3588 }, { "epoch": 0.09, "learning_rate": 1.979922635824389e-06, "loss": 0.7964, "step": 3589 }, { "epoch": 0.09, "learning_rate": 1.979906081654517e-06, "loss": 0.9414, "step": 3590 }, { "epoch": 0.09, "learning_rate": 1.9798895207321045e-06, "loss": 0.7886, "step": 3591 }, { "epoch": 0.09, "learning_rate": 1.9798729530572657e-06, "loss": 0.8467, "step": 3592 }, { "epoch": 0.09, "learning_rate": 1.9798563786301153e-06, "loss": 0.9126, "step": 3593 }, { "epoch": 0.09, "learning_rate": 1.979839797450767e-06, "loss": 0.8506, "step": 3594 }, { "epoch": 0.09, "learning_rate": 1.9798232095193353e-06, "loss": 0.9785, "step": 3595 }, { "epoch": 0.09, "learning_rate": 1.9798066148359344e-06, "loss": 1.0801, "step": 3596 }, { "epoch": 0.09, "learning_rate": 1.979790013400679e-06, "loss": 1.1357, "step": 3597 }, { "epoch": 0.09, "learning_rate": 1.979773405213683e-06, "loss": 0.9746, "step": 3598 }, { "epoch": 0.09, "learning_rate": 1.979756790275061e-06, "loss": 1.0059, "step": 3599 }, { "epoch": 0.09, "learning_rate": 1.979740168584928e-06, "loss": 0.7754, "step": 3600 }, { "epoch": 0.09, "learning_rate": 1.9797235401433973e-06, "loss": 0.8628, "step": 3601 }, { "epoch": 0.09, "learning_rate": 1.979706904950585e-06, "loss": 0.9824, "step": 3602 }, { "epoch": 0.09, "learning_rate": 1.9796902630066045e-06, "loss": 0.8779, "step": 3603 }, { "epoch": 0.09, "learning_rate": 1.9796736143115714e-06, "loss": 0.9307, "step": 3604 }, { "epoch": 0.09, "learning_rate": 1.9796569588656e-06, "loss": 0.8379, "step": 3605 }, { "epoch": 0.09, "learning_rate": 1.9796402966688046e-06, "loss": 0.8311, "step": 3606 }, { "epoch": 0.09, "learning_rate": 1.9796236277213014e-06, "loss": 0.7515, "step": 3607 }, { "epoch": 0.09, "learning_rate": 1.979606952023204e-06, "loss": 0.9229, "step": 3608 }, { "epoch": 0.09, "learning_rate": 1.9795902695746274e-06, "loss": 0.6699, "step": 3609 }, { "epoch": 0.09, "learning_rate": 1.9795735803756866e-06, "loss": 1.2305, "step": 3610 }, { "epoch": 0.09, "learning_rate": 1.9795568844264976e-06, "loss": 0.8516, "step": 3611 }, { "epoch": 0.09, "learning_rate": 1.979540181727174e-06, "loss": 0.9365, "step": 3612 }, { "epoch": 0.09, "learning_rate": 1.979523472277832e-06, "loss": 0.9209, "step": 3613 }, { "epoch": 0.09, "learning_rate": 1.9795067560785867e-06, "loss": 1.0586, "step": 3614 }, { "epoch": 0.09, "learning_rate": 1.9794900331295524e-06, "loss": 1.0186, "step": 3615 }, { "epoch": 0.09, "learning_rate": 1.979473303430845e-06, "loss": 1.168, "step": 3616 }, { "epoch": 0.09, "learning_rate": 1.97945656698258e-06, "loss": 1.0156, "step": 3617 }, { "epoch": 0.09, "learning_rate": 1.979439823784872e-06, "loss": 1.0459, "step": 3618 }, { "epoch": 0.09, "learning_rate": 1.979423073837837e-06, "loss": 0.9873, "step": 3619 }, { "epoch": 0.09, "learning_rate": 1.97940631714159e-06, "loss": 1.1172, "step": 3620 }, { "epoch": 0.09, "learning_rate": 1.979389553696247e-06, "loss": 1.1152, "step": 3621 }, { "epoch": 0.09, "learning_rate": 1.979372783501923e-06, "loss": 1.1348, "step": 3622 }, { "epoch": 0.09, "learning_rate": 1.9793560065587338e-06, "loss": 1.0254, "step": 3623 }, { "epoch": 0.09, "learning_rate": 1.9793392228667947e-06, "loss": 0.9062, "step": 3624 }, { "epoch": 0.09, "learning_rate": 1.979322432426222e-06, "loss": 0.8447, "step": 3625 }, { "epoch": 0.09, "learning_rate": 1.9793056352371303e-06, "loss": 0.6501, "step": 3626 }, { "epoch": 0.09, "learning_rate": 1.9792888312996367e-06, "loss": 0.7432, "step": 3627 }, { "epoch": 0.09, "learning_rate": 1.979272020613856e-06, "loss": 0.8154, "step": 3628 }, { "epoch": 0.09, "learning_rate": 1.979255203179905e-06, "loss": 0.8408, "step": 3629 }, { "epoch": 0.09, "learning_rate": 1.979238378997899e-06, "loss": 1.1689, "step": 3630 }, { "epoch": 0.09, "learning_rate": 1.979221548067953e-06, "loss": 1.0488, "step": 3631 }, { "epoch": 0.09, "learning_rate": 1.979204710390185e-06, "loss": 1.3066, "step": 3632 }, { "epoch": 0.09, "learning_rate": 1.979187865964709e-06, "loss": 0.8789, "step": 3633 }, { "epoch": 0.09, "learning_rate": 1.9791710147916426e-06, "loss": 0.8496, "step": 3634 }, { "epoch": 0.09, "learning_rate": 1.979154156871101e-06, "loss": 0.9893, "step": 3635 }, { "epoch": 0.09, "learning_rate": 1.979137292203201e-06, "loss": 1.083, "step": 3636 }, { "epoch": 0.09, "learning_rate": 1.9791204207880585e-06, "loss": 0.7617, "step": 3637 }, { "epoch": 0.09, "learning_rate": 1.97910354262579e-06, "loss": 1.0557, "step": 3638 }, { "epoch": 0.09, "learning_rate": 1.979086657716511e-06, "loss": 1.0049, "step": 3639 }, { "epoch": 0.09, "learning_rate": 1.979069766060339e-06, "loss": 1.1094, "step": 3640 }, { "epoch": 0.09, "learning_rate": 1.9790528676573895e-06, "loss": 0.8398, "step": 3641 }, { "epoch": 0.09, "learning_rate": 1.979035962507779e-06, "loss": 0.8857, "step": 3642 }, { "epoch": 0.09, "learning_rate": 1.979019050611625e-06, "loss": 0.7837, "step": 3643 }, { "epoch": 0.09, "learning_rate": 1.979002131969043e-06, "loss": 0.7483, "step": 3644 }, { "epoch": 0.09, "learning_rate": 1.97898520658015e-06, "loss": 0.9727, "step": 3645 }, { "epoch": 0.09, "learning_rate": 1.978968274445063e-06, "loss": 1.0391, "step": 3646 }, { "epoch": 0.09, "learning_rate": 1.9789513355638976e-06, "loss": 0.8623, "step": 3647 }, { "epoch": 0.09, "learning_rate": 1.978934389936771e-06, "loss": 1.0908, "step": 3648 }, { "epoch": 0.09, "learning_rate": 1.9789174375638002e-06, "loss": 0.8848, "step": 3649 }, { "epoch": 0.09, "learning_rate": 1.9789004784451023e-06, "loss": 0.9619, "step": 3650 }, { "epoch": 0.09, "learning_rate": 1.9788835125807933e-06, "loss": 0.9473, "step": 3651 }, { "epoch": 0.09, "learning_rate": 1.9788665399709912e-06, "loss": 0.9629, "step": 3652 }, { "epoch": 0.09, "learning_rate": 1.9788495606158122e-06, "loss": 0.9316, "step": 3653 }, { "epoch": 0.09, "learning_rate": 1.978832574515373e-06, "loss": 0.9873, "step": 3654 }, { "epoch": 0.09, "learning_rate": 1.978815581669792e-06, "loss": 0.8789, "step": 3655 }, { "epoch": 0.09, "learning_rate": 1.9787985820791846e-06, "loss": 0.9248, "step": 3656 }, { "epoch": 0.09, "learning_rate": 1.9787815757436693e-06, "loss": 1.127, "step": 3657 }, { "epoch": 0.09, "learning_rate": 1.9787645626633627e-06, "loss": 0.8652, "step": 3658 }, { "epoch": 0.09, "learning_rate": 1.978747542838382e-06, "loss": 0.998, "step": 3659 }, { "epoch": 0.09, "learning_rate": 1.9787305162688444e-06, "loss": 0.96, "step": 3660 }, { "epoch": 0.09, "learning_rate": 1.978713482954868e-06, "loss": 1.165, "step": 3661 }, { "epoch": 0.09, "learning_rate": 1.978696442896569e-06, "loss": 0.9854, "step": 3662 }, { "epoch": 0.09, "learning_rate": 1.9786793960940656e-06, "loss": 1.0596, "step": 3663 }, { "epoch": 0.09, "learning_rate": 1.9786623425474753e-06, "loss": 1.0039, "step": 3664 }, { "epoch": 0.09, "learning_rate": 1.9786452822569154e-06, "loss": 0.9346, "step": 3665 }, { "epoch": 0.09, "learning_rate": 1.9786282152225032e-06, "loss": 0.9014, "step": 3666 }, { "epoch": 0.09, "learning_rate": 1.9786111414443565e-06, "loss": 1.0381, "step": 3667 }, { "epoch": 0.09, "learning_rate": 1.9785940609225934e-06, "loss": 0.957, "step": 3668 }, { "epoch": 0.09, "learning_rate": 1.978576973657331e-06, "loss": 0.9443, "step": 3669 }, { "epoch": 0.09, "learning_rate": 1.9785598796486873e-06, "loss": 0.9033, "step": 3670 }, { "epoch": 0.09, "learning_rate": 1.97854277889678e-06, "loss": 0.9331, "step": 3671 }, { "epoch": 0.09, "learning_rate": 1.9785256714017272e-06, "loss": 0.8008, "step": 3672 }, { "epoch": 0.09, "learning_rate": 1.9785085571636466e-06, "loss": 1.0693, "step": 3673 }, { "epoch": 0.09, "learning_rate": 1.978491436182656e-06, "loss": 0.7695, "step": 3674 }, { "epoch": 0.09, "learning_rate": 1.978474308458874e-06, "loss": 0.8545, "step": 3675 }, { "epoch": 0.09, "learning_rate": 1.9784571739924174e-06, "loss": 1.1025, "step": 3676 }, { "epoch": 0.09, "learning_rate": 1.9784400327834055e-06, "loss": 0.7803, "step": 3677 }, { "epoch": 0.09, "learning_rate": 1.9784228848319557e-06, "loss": 1.0234, "step": 3678 }, { "epoch": 0.09, "learning_rate": 1.978405730138187e-06, "loss": 0.9766, "step": 3679 }, { "epoch": 0.09, "learning_rate": 1.978388568702216e-06, "loss": 0.7783, "step": 3680 }, { "epoch": 0.09, "learning_rate": 1.9783714005241626e-06, "loss": 0.9697, "step": 3681 }, { "epoch": 0.09, "learning_rate": 1.9783542256041444e-06, "loss": 1.0332, "step": 3682 }, { "epoch": 0.09, "learning_rate": 1.9783370439422797e-06, "loss": 0.9961, "step": 3683 }, { "epoch": 0.09, "learning_rate": 1.9783198555386874e-06, "loss": 0.9785, "step": 3684 }, { "epoch": 0.09, "learning_rate": 1.9783026603934854e-06, "loss": 0.7075, "step": 3685 }, { "epoch": 0.09, "learning_rate": 1.9782854585067923e-06, "loss": 1.1289, "step": 3686 }, { "epoch": 0.09, "learning_rate": 1.978268249878727e-06, "loss": 0.6968, "step": 3687 }, { "epoch": 0.09, "learning_rate": 1.9782510345094075e-06, "loss": 1.0898, "step": 3688 }, { "epoch": 0.09, "learning_rate": 1.9782338123989527e-06, "loss": 1.0859, "step": 3689 }, { "epoch": 0.09, "learning_rate": 1.9782165835474815e-06, "loss": 0.79, "step": 3690 }, { "epoch": 0.09, "learning_rate": 1.978199347955112e-06, "loss": 0.915, "step": 3691 }, { "epoch": 0.09, "learning_rate": 1.9781821056219638e-06, "loss": 0.7925, "step": 3692 }, { "epoch": 0.09, "learning_rate": 1.9781648565481556e-06, "loss": 0.8066, "step": 3693 }, { "epoch": 0.09, "learning_rate": 1.9781476007338054e-06, "loss": 1.0156, "step": 3694 }, { "epoch": 0.09, "learning_rate": 1.978130338179033e-06, "loss": 1.124, "step": 3695 }, { "epoch": 0.09, "learning_rate": 1.978113068883957e-06, "loss": 0.9717, "step": 3696 }, { "epoch": 0.09, "learning_rate": 1.9780957928486967e-06, "loss": 1.168, "step": 3697 }, { "epoch": 0.09, "learning_rate": 1.9780785100733708e-06, "loss": 0.6641, "step": 3698 }, { "epoch": 0.09, "learning_rate": 1.9780612205580983e-06, "loss": 0.9961, "step": 3699 }, { "epoch": 0.09, "learning_rate": 1.9780439243029986e-06, "loss": 0.7305, "step": 3700 }, { "epoch": 0.09, "learning_rate": 1.9780266213081907e-06, "loss": 0.8867, "step": 3701 }, { "epoch": 0.09, "learning_rate": 1.978009311573794e-06, "loss": 0.8936, "step": 3702 }, { "epoch": 0.09, "learning_rate": 1.977991995099928e-06, "loss": 0.7646, "step": 3703 }, { "epoch": 0.09, "learning_rate": 1.9779746718867114e-06, "loss": 0.856, "step": 3704 }, { "epoch": 0.09, "learning_rate": 1.9779573419342643e-06, "loss": 0.792, "step": 3705 }, { "epoch": 0.09, "learning_rate": 1.9779400052427053e-06, "loss": 0.8894, "step": 3706 }, { "epoch": 0.1, "learning_rate": 1.9779226618121548e-06, "loss": 0.8242, "step": 3707 }, { "epoch": 0.1, "learning_rate": 1.9779053116427316e-06, "loss": 0.8091, "step": 3708 }, { "epoch": 0.1, "learning_rate": 1.9778879547345557e-06, "loss": 0.9805, "step": 3709 }, { "epoch": 0.1, "learning_rate": 1.9778705910877466e-06, "loss": 0.7881, "step": 3710 }, { "epoch": 0.1, "learning_rate": 1.977853220702424e-06, "loss": 0.8789, "step": 3711 }, { "epoch": 0.1, "learning_rate": 1.977835843578707e-06, "loss": 0.9951, "step": 3712 }, { "epoch": 0.1, "learning_rate": 1.9778184597167157e-06, "loss": 0.8535, "step": 3713 }, { "epoch": 0.1, "learning_rate": 1.9778010691165707e-06, "loss": 1.0898, "step": 3714 }, { "epoch": 0.1, "learning_rate": 1.9777836717783908e-06, "loss": 0.9424, "step": 3715 }, { "epoch": 0.1, "learning_rate": 1.9777662677022963e-06, "loss": 0.793, "step": 3716 }, { "epoch": 0.1, "learning_rate": 1.9777488568884066e-06, "loss": 0.832, "step": 3717 }, { "epoch": 0.1, "learning_rate": 1.9777314393368425e-06, "loss": 1.0088, "step": 3718 }, { "epoch": 0.1, "learning_rate": 1.977714015047724e-06, "loss": 1.0449, "step": 3719 }, { "epoch": 0.1, "learning_rate": 1.9776965840211703e-06, "loss": 0.9414, "step": 3720 }, { "epoch": 0.1, "learning_rate": 1.977679146257302e-06, "loss": 0.6611, "step": 3721 }, { "epoch": 0.1, "learning_rate": 1.9776617017562395e-06, "loss": 0.7129, "step": 3722 }, { "epoch": 0.1, "learning_rate": 1.977644250518103e-06, "loss": 1.1094, "step": 3723 }, { "epoch": 0.1, "learning_rate": 1.9776267925430126e-06, "loss": 0.9404, "step": 3724 }, { "epoch": 0.1, "learning_rate": 1.9776093278310884e-06, "loss": 1.0654, "step": 3725 }, { "epoch": 0.1, "learning_rate": 1.977591856382451e-06, "loss": 1.0811, "step": 3726 }, { "epoch": 0.1, "learning_rate": 1.9775743781972205e-06, "loss": 0.7852, "step": 3727 }, { "epoch": 0.1, "learning_rate": 1.9775568932755184e-06, "loss": 0.8833, "step": 3728 }, { "epoch": 0.1, "learning_rate": 1.9775394016174635e-06, "loss": 0.8271, "step": 3729 }, { "epoch": 0.1, "learning_rate": 1.977521903223177e-06, "loss": 0.9199, "step": 3730 }, { "epoch": 0.1, "learning_rate": 1.9775043980927804e-06, "loss": 1.0264, "step": 3731 }, { "epoch": 0.1, "learning_rate": 1.9774868862263935e-06, "loss": 1.0127, "step": 3732 }, { "epoch": 0.1, "learning_rate": 1.977469367624137e-06, "loss": 1.0791, "step": 3733 }, { "epoch": 0.1, "learning_rate": 1.9774518422861317e-06, "loss": 0.9199, "step": 3734 }, { "epoch": 0.1, "learning_rate": 1.9774343102124986e-06, "loss": 0.9575, "step": 3735 }, { "epoch": 0.1, "learning_rate": 1.977416771403358e-06, "loss": 0.7998, "step": 3736 }, { "epoch": 0.1, "learning_rate": 1.977399225858831e-06, "loss": 0.9448, "step": 3737 }, { "epoch": 0.1, "learning_rate": 1.9773816735790383e-06, "loss": 0.8604, "step": 3738 }, { "epoch": 0.1, "learning_rate": 1.9773641145641015e-06, "loss": 1.0996, "step": 3739 }, { "epoch": 0.1, "learning_rate": 1.977346548814141e-06, "loss": 0.9238, "step": 3740 }, { "epoch": 0.1, "learning_rate": 1.9773289763292783e-06, "loss": 1.0986, "step": 3741 }, { "epoch": 0.1, "learning_rate": 1.977311397109634e-06, "loss": 1.0186, "step": 3742 }, { "epoch": 0.1, "learning_rate": 1.9772938111553295e-06, "loss": 0.9746, "step": 3743 }, { "epoch": 0.1, "learning_rate": 1.977276218466486e-06, "loss": 1.0029, "step": 3744 }, { "epoch": 0.1, "learning_rate": 1.977258619043225e-06, "loss": 0.9932, "step": 3745 }, { "epoch": 0.1, "learning_rate": 1.977241012885667e-06, "loss": 0.6455, "step": 3746 }, { "epoch": 0.1, "learning_rate": 1.9772233999939345e-06, "loss": 0.8579, "step": 3747 }, { "epoch": 0.1, "learning_rate": 1.9772057803681473e-06, "loss": 0.9912, "step": 3748 }, { "epoch": 0.1, "learning_rate": 1.977188154008428e-06, "loss": 0.999, "step": 3749 }, { "epoch": 0.1, "learning_rate": 1.9771705209148978e-06, "loss": 0.8613, "step": 3750 }, { "epoch": 0.1, "learning_rate": 1.9771528810876785e-06, "loss": 1.0586, "step": 3751 }, { "epoch": 0.1, "learning_rate": 1.9771352345268907e-06, "loss": 0.8877, "step": 3752 }, { "epoch": 0.1, "learning_rate": 1.977117581232657e-06, "loss": 0.7451, "step": 3753 }, { "epoch": 0.1, "learning_rate": 1.9770999212050986e-06, "loss": 0.9238, "step": 3754 }, { "epoch": 0.1, "learning_rate": 1.9770822544443373e-06, "loss": 0.9521, "step": 3755 }, { "epoch": 0.1, "learning_rate": 1.9770645809504946e-06, "loss": 0.822, "step": 3756 }, { "epoch": 0.1, "learning_rate": 1.977046900723693e-06, "loss": 0.8496, "step": 3757 }, { "epoch": 0.1, "learning_rate": 1.9770292137640532e-06, "loss": 1.1211, "step": 3758 }, { "epoch": 0.1, "learning_rate": 1.977011520071698e-06, "loss": 0.9736, "step": 3759 }, { "epoch": 0.1, "learning_rate": 1.9769938196467486e-06, "loss": 0.6973, "step": 3760 }, { "epoch": 0.1, "learning_rate": 1.976976112489328e-06, "loss": 1.0176, "step": 3761 }, { "epoch": 0.1, "learning_rate": 1.9769583985995574e-06, "loss": 1.0283, "step": 3762 }, { "epoch": 0.1, "learning_rate": 1.976940677977559e-06, "loss": 0.5742, "step": 3763 }, { "epoch": 0.1, "learning_rate": 1.9769229506234553e-06, "loss": 0.9648, "step": 3764 }, { "epoch": 0.1, "learning_rate": 1.9769052165373682e-06, "loss": 0.9326, "step": 3765 }, { "epoch": 0.1, "learning_rate": 1.97688747571942e-06, "loss": 0.8574, "step": 3766 }, { "epoch": 0.1, "learning_rate": 1.9768697281697322e-06, "loss": 0.8145, "step": 3767 }, { "epoch": 0.1, "learning_rate": 1.976851973888428e-06, "loss": 1.1182, "step": 3768 }, { "epoch": 0.1, "learning_rate": 1.9768342128756295e-06, "loss": 1.0312, "step": 3769 }, { "epoch": 0.1, "learning_rate": 1.976816445131459e-06, "loss": 1.002, "step": 3770 }, { "epoch": 0.1, "learning_rate": 1.976798670656039e-06, "loss": 1.0244, "step": 3771 }, { "epoch": 0.1, "learning_rate": 1.9767808894494923e-06, "loss": 0.9922, "step": 3772 }, { "epoch": 0.1, "learning_rate": 1.9767631015119405e-06, "loss": 1.0879, "step": 3773 }, { "epoch": 0.1, "learning_rate": 1.9767453068435075e-06, "loss": 0.9453, "step": 3774 }, { "epoch": 0.1, "learning_rate": 1.9767275054443147e-06, "loss": 1.0098, "step": 3775 }, { "epoch": 0.1, "learning_rate": 1.9767096973144855e-06, "loss": 0.77, "step": 3776 }, { "epoch": 0.1, "learning_rate": 1.9766918824541423e-06, "loss": 1.0498, "step": 3777 }, { "epoch": 0.1, "learning_rate": 1.976674060863408e-06, "loss": 1.0684, "step": 3778 }, { "epoch": 0.1, "learning_rate": 1.9766562325424053e-06, "loss": 0.9658, "step": 3779 }, { "epoch": 0.1, "learning_rate": 1.976638397491257e-06, "loss": 1.0195, "step": 3780 }, { "epoch": 0.1, "learning_rate": 1.9766205557100868e-06, "loss": 1.0234, "step": 3781 }, { "epoch": 0.1, "learning_rate": 1.9766027071990164e-06, "loss": 0.9033, "step": 3782 }, { "epoch": 0.1, "learning_rate": 1.9765848519581692e-06, "loss": 1.0156, "step": 3783 }, { "epoch": 0.1, "learning_rate": 1.9765669899876686e-06, "loss": 1.0908, "step": 3784 }, { "epoch": 0.1, "learning_rate": 1.976549121287638e-06, "loss": 0.7427, "step": 3785 }, { "epoch": 0.1, "learning_rate": 1.976531245858199e-06, "loss": 0.6909, "step": 3786 }, { "epoch": 0.1, "learning_rate": 1.9765133636994768e-06, "loss": 0.8516, "step": 3787 }, { "epoch": 0.1, "learning_rate": 1.976495474811593e-06, "loss": 0.9834, "step": 3788 }, { "epoch": 0.1, "learning_rate": 1.976477579194672e-06, "loss": 0.8945, "step": 3789 }, { "epoch": 0.1, "learning_rate": 1.976459676848836e-06, "loss": 0.9639, "step": 3790 }, { "epoch": 0.1, "learning_rate": 1.9764417677742095e-06, "loss": 0.7886, "step": 3791 }, { "epoch": 0.1, "learning_rate": 1.9764238519709154e-06, "loss": 0.5181, "step": 3792 }, { "epoch": 0.1, "learning_rate": 1.976405929439077e-06, "loss": 1.1582, "step": 3793 }, { "epoch": 0.1, "learning_rate": 1.976388000178818e-06, "loss": 0.9111, "step": 3794 }, { "epoch": 0.1, "learning_rate": 1.976370064190262e-06, "loss": 1.0, "step": 3795 }, { "epoch": 0.1, "learning_rate": 1.976352121473532e-06, "loss": 0.855, "step": 3796 }, { "epoch": 0.1, "learning_rate": 1.976334172028753e-06, "loss": 0.9062, "step": 3797 }, { "epoch": 0.1, "learning_rate": 1.976316215856047e-06, "loss": 0.7915, "step": 3798 }, { "epoch": 0.1, "learning_rate": 1.976298252955539e-06, "loss": 1.0098, "step": 3799 }, { "epoch": 0.1, "learning_rate": 1.9762802833273526e-06, "loss": 0.8057, "step": 3800 }, { "epoch": 0.1, "learning_rate": 1.976262306971611e-06, "loss": 1.0459, "step": 3801 }, { "epoch": 0.1, "learning_rate": 1.9762443238884386e-06, "loss": 0.9053, "step": 3802 }, { "epoch": 0.1, "learning_rate": 1.9762263340779595e-06, "loss": 1.0508, "step": 3803 }, { "epoch": 0.1, "learning_rate": 1.976208337540297e-06, "loss": 0.9121, "step": 3804 }, { "epoch": 0.1, "learning_rate": 1.9761903342755755e-06, "loss": 0.8271, "step": 3805 }, { "epoch": 0.1, "learning_rate": 1.976172324283919e-06, "loss": 0.7041, "step": 3806 }, { "epoch": 0.1, "learning_rate": 1.976154307565452e-06, "loss": 1.0488, "step": 3807 }, { "epoch": 0.1, "learning_rate": 1.9761362841202977e-06, "loss": 0.9189, "step": 3808 }, { "epoch": 0.1, "learning_rate": 1.9761182539485812e-06, "loss": 0.8799, "step": 3809 }, { "epoch": 0.1, "learning_rate": 1.9761002170504263e-06, "loss": 1.0928, "step": 3810 }, { "epoch": 0.1, "learning_rate": 1.9760821734259577e-06, "loss": 1.0576, "step": 3811 }, { "epoch": 0.1, "learning_rate": 1.976064123075299e-06, "loss": 1.0557, "step": 3812 }, { "epoch": 0.1, "learning_rate": 1.9760460659985755e-06, "loss": 0.9053, "step": 3813 }, { "epoch": 0.1, "learning_rate": 1.9760280021959115e-06, "loss": 0.918, "step": 3814 }, { "epoch": 0.1, "learning_rate": 1.9760099316674306e-06, "loss": 0.9824, "step": 3815 }, { "epoch": 0.1, "learning_rate": 1.9759918544132577e-06, "loss": 0.9766, "step": 3816 }, { "epoch": 0.1, "learning_rate": 1.975973770433518e-06, "loss": 1.0664, "step": 3817 }, { "epoch": 0.1, "learning_rate": 1.9759556797283357e-06, "loss": 1.0635, "step": 3818 }, { "epoch": 0.1, "learning_rate": 1.975937582297835e-06, "loss": 0.8203, "step": 3819 }, { "epoch": 0.1, "learning_rate": 1.9759194781421416e-06, "loss": 0.8423, "step": 3820 }, { "epoch": 0.1, "learning_rate": 1.9759013672613795e-06, "loss": 0.8413, "step": 3821 }, { "epoch": 0.1, "learning_rate": 1.9758832496556735e-06, "loss": 0.7852, "step": 3822 }, { "epoch": 0.1, "learning_rate": 1.975865125325149e-06, "loss": 0.686, "step": 3823 }, { "epoch": 0.1, "learning_rate": 1.97584699426993e-06, "loss": 1.1602, "step": 3824 }, { "epoch": 0.1, "learning_rate": 1.9758288564901427e-06, "loss": 0.8428, "step": 3825 }, { "epoch": 0.1, "learning_rate": 1.975810711985911e-06, "loss": 0.9307, "step": 3826 }, { "epoch": 0.1, "learning_rate": 1.9757925607573604e-06, "loss": 1.0664, "step": 3827 }, { "epoch": 0.1, "learning_rate": 1.9757744028046155e-06, "loss": 1.0195, "step": 3828 }, { "epoch": 0.1, "learning_rate": 1.9757562381278025e-06, "loss": 1.1914, "step": 3829 }, { "epoch": 0.1, "learning_rate": 1.9757380667270454e-06, "loss": 0.8672, "step": 3830 }, { "epoch": 0.1, "learning_rate": 1.97571988860247e-06, "loss": 0.9707, "step": 3831 }, { "epoch": 0.1, "learning_rate": 1.9757017037542014e-06, "loss": 0.7891, "step": 3832 }, { "epoch": 0.1, "learning_rate": 1.9756835121823652e-06, "loss": 0.9746, "step": 3833 }, { "epoch": 0.1, "learning_rate": 1.975665313887087e-06, "loss": 1.124, "step": 3834 }, { "epoch": 0.1, "learning_rate": 1.975647108868491e-06, "loss": 1.0225, "step": 3835 }, { "epoch": 0.1, "learning_rate": 1.9756288971267033e-06, "loss": 1.0117, "step": 3836 }, { "epoch": 0.1, "learning_rate": 1.9756106786618497e-06, "loss": 0.8232, "step": 3837 }, { "epoch": 0.1, "learning_rate": 1.9755924534740558e-06, "loss": 1.0967, "step": 3838 }, { "epoch": 0.1, "learning_rate": 1.975574221563447e-06, "loss": 0.9443, "step": 3839 }, { "epoch": 0.1, "learning_rate": 1.975555982930149e-06, "loss": 0.8965, "step": 3840 }, { "epoch": 0.1, "learning_rate": 1.9755377375742866e-06, "loss": 0.8413, "step": 3841 }, { "epoch": 0.1, "learning_rate": 1.9755194854959867e-06, "loss": 0.8203, "step": 3842 }, { "epoch": 0.1, "learning_rate": 1.9755012266953746e-06, "loss": 1.0498, "step": 3843 }, { "epoch": 0.1, "learning_rate": 1.975482961172576e-06, "loss": 1.0635, "step": 3844 }, { "epoch": 0.1, "learning_rate": 1.9754646889277177e-06, "loss": 1.124, "step": 3845 }, { "epoch": 0.1, "learning_rate": 1.975446409960924e-06, "loss": 1.1738, "step": 3846 }, { "epoch": 0.1, "learning_rate": 1.975428124272322e-06, "loss": 1.1123, "step": 3847 }, { "epoch": 0.1, "learning_rate": 1.9754098318620377e-06, "loss": 0.8955, "step": 3848 }, { "epoch": 0.1, "learning_rate": 1.9753915327301966e-06, "loss": 1.0967, "step": 3849 }, { "epoch": 0.1, "learning_rate": 1.975373226876925e-06, "loss": 0.8691, "step": 3850 }, { "epoch": 0.1, "learning_rate": 1.9753549143023496e-06, "loss": 0.9639, "step": 3851 }, { "epoch": 0.1, "learning_rate": 1.9753365950065957e-06, "loss": 1.1211, "step": 3852 }, { "epoch": 0.1, "learning_rate": 1.97531826898979e-06, "loss": 1.0068, "step": 3853 }, { "epoch": 0.1, "learning_rate": 1.975299936252059e-06, "loss": 1.0361, "step": 3854 }, { "epoch": 0.1, "learning_rate": 1.9752815967935285e-06, "loss": 0.9033, "step": 3855 }, { "epoch": 0.1, "learning_rate": 1.9752632506143253e-06, "loss": 1.1719, "step": 3856 }, { "epoch": 0.1, "learning_rate": 1.9752448977145755e-06, "loss": 0.6787, "step": 3857 }, { "epoch": 0.1, "learning_rate": 1.9752265380944057e-06, "loss": 0.9475, "step": 3858 }, { "epoch": 0.1, "learning_rate": 1.9752081717539426e-06, "loss": 0.8574, "step": 3859 }, { "epoch": 0.1, "learning_rate": 1.9751897986933128e-06, "loss": 0.9268, "step": 3860 }, { "epoch": 0.1, "learning_rate": 1.9751714189126425e-06, "loss": 0.8833, "step": 3861 }, { "epoch": 0.1, "learning_rate": 1.9751530324120583e-06, "loss": 0.8853, "step": 3862 }, { "epoch": 0.1, "learning_rate": 1.9751346391916877e-06, "loss": 0.8984, "step": 3863 }, { "epoch": 0.1, "learning_rate": 1.9751162392516565e-06, "loss": 0.9351, "step": 3864 }, { "epoch": 0.1, "learning_rate": 1.9750978325920923e-06, "loss": 0.7559, "step": 3865 }, { "epoch": 0.1, "learning_rate": 1.9750794192131215e-06, "loss": 1.1113, "step": 3866 }, { "epoch": 0.1, "learning_rate": 1.975060999114871e-06, "loss": 0.7617, "step": 3867 }, { "epoch": 0.1, "learning_rate": 1.975042572297468e-06, "loss": 0.8345, "step": 3868 }, { "epoch": 0.1, "learning_rate": 1.975024138761039e-06, "loss": 0.6475, "step": 3869 }, { "epoch": 0.1, "learning_rate": 1.975005698505711e-06, "loss": 1.0059, "step": 3870 }, { "epoch": 0.1, "learning_rate": 1.974987251531612e-06, "loss": 1.041, "step": 3871 }, { "epoch": 0.1, "learning_rate": 1.9749687978388683e-06, "loss": 0.6875, "step": 3872 }, { "epoch": 0.1, "learning_rate": 1.9749503374276067e-06, "loss": 0.7793, "step": 3873 }, { "epoch": 0.1, "learning_rate": 1.9749318702979554e-06, "loss": 0.8242, "step": 3874 }, { "epoch": 0.1, "learning_rate": 1.9749133964500416e-06, "loss": 0.918, "step": 3875 }, { "epoch": 0.1, "learning_rate": 1.9748949158839918e-06, "loss": 1.001, "step": 3876 }, { "epoch": 0.1, "learning_rate": 1.974876428599934e-06, "loss": 1.085, "step": 3877 }, { "epoch": 0.1, "learning_rate": 1.974857934597995e-06, "loss": 0.8164, "step": 3878 }, { "epoch": 0.1, "learning_rate": 1.9748394338783028e-06, "loss": 0.7246, "step": 3879 }, { "epoch": 0.1, "learning_rate": 1.974820926440985e-06, "loss": 1.04, "step": 3880 }, { "epoch": 0.1, "learning_rate": 1.9748024122861684e-06, "loss": 0.8857, "step": 3881 }, { "epoch": 0.1, "learning_rate": 1.974783891413981e-06, "loss": 0.9473, "step": 3882 }, { "epoch": 0.1, "learning_rate": 1.9747653638245505e-06, "loss": 0.9448, "step": 3883 }, { "epoch": 0.1, "learning_rate": 1.9747468295180045e-06, "loss": 0.9111, "step": 3884 }, { "epoch": 0.1, "learning_rate": 1.9747282884944708e-06, "loss": 0.9209, "step": 3885 }, { "epoch": 0.1, "learning_rate": 1.9747097407540775e-06, "loss": 1.1074, "step": 3886 }, { "epoch": 0.1, "learning_rate": 1.9746911862969515e-06, "loss": 0.8193, "step": 3887 }, { "epoch": 0.1, "learning_rate": 1.9746726251232213e-06, "loss": 0.8555, "step": 3888 }, { "epoch": 0.1, "learning_rate": 1.974654057233015e-06, "loss": 0.9639, "step": 3889 }, { "epoch": 0.1, "learning_rate": 1.97463548262646e-06, "loss": 0.9346, "step": 3890 }, { "epoch": 0.1, "learning_rate": 1.974616901303684e-06, "loss": 0.8291, "step": 3891 }, { "epoch": 0.1, "learning_rate": 1.974598313264816e-06, "loss": 0.8179, "step": 3892 }, { "epoch": 0.1, "learning_rate": 1.9745797185099837e-06, "loss": 1.0742, "step": 3893 }, { "epoch": 0.1, "learning_rate": 1.9745611170393155e-06, "loss": 1.0947, "step": 3894 }, { "epoch": 0.1, "learning_rate": 1.974542508852939e-06, "loss": 0.7578, "step": 3895 }, { "epoch": 0.1, "learning_rate": 1.9745238939509826e-06, "loss": 0.6943, "step": 3896 }, { "epoch": 0.1, "learning_rate": 1.9745052723335742e-06, "loss": 0.5601, "step": 3897 }, { "epoch": 0.1, "learning_rate": 1.9744866440008434e-06, "loss": 0.8633, "step": 3898 }, { "epoch": 0.1, "learning_rate": 1.974468008952918e-06, "loss": 1.1123, "step": 3899 }, { "epoch": 0.1, "learning_rate": 1.9744493671899253e-06, "loss": 0.8223, "step": 3900 }, { "epoch": 0.1, "learning_rate": 1.974430718711995e-06, "loss": 0.8613, "step": 3901 }, { "epoch": 0.1, "learning_rate": 1.9744120635192557e-06, "loss": 0.585, "step": 3902 }, { "epoch": 0.1, "learning_rate": 1.974393401611835e-06, "loss": 0.7217, "step": 3903 }, { "epoch": 0.1, "learning_rate": 1.974374732989862e-06, "loss": 0.9531, "step": 3904 }, { "epoch": 0.1, "learning_rate": 1.974356057653466e-06, "loss": 0.8887, "step": 3905 }, { "epoch": 0.1, "learning_rate": 1.974337375602774e-06, "loss": 1.1221, "step": 3906 }, { "epoch": 0.1, "learning_rate": 1.9743186868379164e-06, "loss": 1.1699, "step": 3907 }, { "epoch": 0.1, "learning_rate": 1.9742999913590212e-06, "loss": 0.8867, "step": 3908 }, { "epoch": 0.1, "learning_rate": 1.9742812891662176e-06, "loss": 0.7773, "step": 3909 }, { "epoch": 0.1, "learning_rate": 1.9742625802596343e-06, "loss": 1.0039, "step": 3910 }, { "epoch": 0.1, "learning_rate": 1.9742438646394e-06, "loss": 1.0684, "step": 3911 }, { "epoch": 0.1, "learning_rate": 1.974225142305644e-06, "loss": 0.729, "step": 3912 }, { "epoch": 0.1, "learning_rate": 1.974206413258495e-06, "loss": 0.5249, "step": 3913 }, { "epoch": 0.1, "learning_rate": 1.9741876774980827e-06, "loss": 1.0332, "step": 3914 }, { "epoch": 0.1, "learning_rate": 1.9741689350245353e-06, "loss": 0.9268, "step": 3915 }, { "epoch": 0.1, "learning_rate": 1.9741501858379825e-06, "loss": 0.7861, "step": 3916 }, { "epoch": 0.1, "learning_rate": 1.9741314299385534e-06, "loss": 0.9463, "step": 3917 }, { "epoch": 0.1, "learning_rate": 1.9741126673263776e-06, "loss": 0.9219, "step": 3918 }, { "epoch": 0.1, "learning_rate": 1.9740938980015835e-06, "loss": 0.9414, "step": 3919 }, { "epoch": 0.1, "learning_rate": 1.9740751219643014e-06, "loss": 0.8174, "step": 3920 }, { "epoch": 0.1, "learning_rate": 1.97405633921466e-06, "loss": 0.8809, "step": 3921 }, { "epoch": 0.1, "learning_rate": 1.9740375497527893e-06, "loss": 0.7959, "step": 3922 }, { "epoch": 0.1, "learning_rate": 1.9740187535788185e-06, "loss": 1.0479, "step": 3923 }, { "epoch": 0.1, "learning_rate": 1.973999950692877e-06, "loss": 0.9932, "step": 3924 }, { "epoch": 0.1, "learning_rate": 1.973981141095094e-06, "loss": 0.8838, "step": 3925 }, { "epoch": 0.1, "learning_rate": 1.9739623247856e-06, "loss": 0.8867, "step": 3926 }, { "epoch": 0.1, "learning_rate": 1.9739435017645243e-06, "loss": 0.9346, "step": 3927 }, { "epoch": 0.1, "learning_rate": 1.9739246720319967e-06, "loss": 1.1387, "step": 3928 }, { "epoch": 0.1, "learning_rate": 1.973905835588147e-06, "loss": 1.126, "step": 3929 }, { "epoch": 0.1, "learning_rate": 1.973886992433104e-06, "loss": 1.0039, "step": 3930 }, { "epoch": 0.1, "learning_rate": 1.973868142566999e-06, "loss": 0.8716, "step": 3931 }, { "epoch": 0.1, "learning_rate": 1.9738492859899613e-06, "loss": 1.0859, "step": 3932 }, { "epoch": 0.1, "learning_rate": 1.973830422702121e-06, "loss": 0.8306, "step": 3933 }, { "epoch": 0.1, "learning_rate": 1.973811552703607e-06, "loss": 1.1133, "step": 3934 }, { "epoch": 0.1, "learning_rate": 1.9737926759945508e-06, "loss": 0.6754, "step": 3935 }, { "epoch": 0.1, "learning_rate": 1.9737737925750823e-06, "loss": 0.9805, "step": 3936 }, { "epoch": 0.1, "learning_rate": 1.9737549024453307e-06, "loss": 0.8906, "step": 3937 }, { "epoch": 0.1, "learning_rate": 1.973736005605427e-06, "loss": 0.791, "step": 3938 }, { "epoch": 0.1, "learning_rate": 1.973717102055501e-06, "loss": 0.8301, "step": 3939 }, { "epoch": 0.1, "learning_rate": 1.973698191795683e-06, "loss": 0.8838, "step": 3940 }, { "epoch": 0.1, "learning_rate": 1.973679274826104e-06, "loss": 0.8711, "step": 3941 }, { "epoch": 0.1, "learning_rate": 1.973660351146893e-06, "loss": 0.8984, "step": 3942 }, { "epoch": 0.1, "learning_rate": 1.9736414207581813e-06, "loss": 1.0605, "step": 3943 }, { "epoch": 0.1, "learning_rate": 1.973622483660099e-06, "loss": 0.9648, "step": 3944 }, { "epoch": 0.1, "learning_rate": 1.9736035398527774e-06, "loss": 0.9365, "step": 3945 }, { "epoch": 0.1, "learning_rate": 1.973584589336346e-06, "loss": 0.8994, "step": 3946 }, { "epoch": 0.1, "learning_rate": 1.9735656321109362e-06, "loss": 1.0713, "step": 3947 }, { "epoch": 0.1, "learning_rate": 1.9735466681766785e-06, "loss": 1.0352, "step": 3948 }, { "epoch": 0.1, "learning_rate": 1.973527697533703e-06, "loss": 0.7363, "step": 3949 }, { "epoch": 0.1, "learning_rate": 1.9735087201821406e-06, "loss": 0.875, "step": 3950 }, { "epoch": 0.1, "learning_rate": 1.9734897361221225e-06, "loss": 0.9492, "step": 3951 }, { "epoch": 0.1, "learning_rate": 1.9734707453537793e-06, "loss": 0.959, "step": 3952 }, { "epoch": 0.1, "learning_rate": 1.9734517478772418e-06, "loss": 0.9004, "step": 3953 }, { "epoch": 0.1, "learning_rate": 1.9734327436926408e-06, "loss": 0.7739, "step": 3954 }, { "epoch": 0.1, "learning_rate": 1.9734137328001076e-06, "loss": 1.2988, "step": 3955 }, { "epoch": 0.1, "learning_rate": 1.9733947151997723e-06, "loss": 0.8765, "step": 3956 }, { "epoch": 0.1, "learning_rate": 1.9733756908917674e-06, "loss": 0.8779, "step": 3957 }, { "epoch": 0.1, "learning_rate": 1.9733566598762234e-06, "loss": 0.9619, "step": 3958 }, { "epoch": 0.1, "learning_rate": 1.9733376221532707e-06, "loss": 1.0342, "step": 3959 }, { "epoch": 0.1, "learning_rate": 1.9733185777230415e-06, "loss": 1.0391, "step": 3960 }, { "epoch": 0.1, "learning_rate": 1.973299526585667e-06, "loss": 0.6128, "step": 3961 }, { "epoch": 0.1, "learning_rate": 1.9732804687412776e-06, "loss": 0.8564, "step": 3962 }, { "epoch": 0.1, "learning_rate": 1.973261404190005e-06, "loss": 1.1143, "step": 3963 }, { "epoch": 0.1, "learning_rate": 1.973242332931981e-06, "loss": 0.9326, "step": 3964 }, { "epoch": 0.1, "learning_rate": 1.9732232549673365e-06, "loss": 1.0537, "step": 3965 }, { "epoch": 0.1, "learning_rate": 1.9732041702962037e-06, "loss": 0.8398, "step": 3966 }, { "epoch": 0.1, "learning_rate": 1.9731850789187134e-06, "loss": 0.9482, "step": 3967 }, { "epoch": 0.1, "learning_rate": 1.973165980834997e-06, "loss": 0.8462, "step": 3968 }, { "epoch": 0.1, "learning_rate": 1.9731468760451867e-06, "loss": 0.6079, "step": 3969 }, { "epoch": 0.1, "learning_rate": 1.9731277645494137e-06, "loss": 0.6143, "step": 3970 }, { "epoch": 0.1, "learning_rate": 1.9731086463478104e-06, "loss": 0.9658, "step": 3971 }, { "epoch": 0.1, "learning_rate": 1.9730895214405077e-06, "loss": 0.915, "step": 3972 }, { "epoch": 0.1, "learning_rate": 1.973070389827638e-06, "loss": 0.9629, "step": 3973 }, { "epoch": 0.1, "learning_rate": 1.973051251509333e-06, "loss": 0.8066, "step": 3974 }, { "epoch": 0.1, "learning_rate": 1.973032106485724e-06, "loss": 0.9629, "step": 3975 }, { "epoch": 0.1, "learning_rate": 1.973012954756944e-06, "loss": 1.0137, "step": 3976 }, { "epoch": 0.1, "learning_rate": 1.972993796323124e-06, "loss": 0.8545, "step": 3977 }, { "epoch": 0.1, "learning_rate": 1.972974631184396e-06, "loss": 0.8154, "step": 3978 }, { "epoch": 0.1, "learning_rate": 1.972955459340893e-06, "loss": 1.0625, "step": 3979 }, { "epoch": 0.1, "learning_rate": 1.9729362807927467e-06, "loss": 0.9111, "step": 3980 }, { "epoch": 0.1, "learning_rate": 1.972917095540089e-06, "loss": 1.0439, "step": 3981 }, { "epoch": 0.1, "learning_rate": 1.972897903583052e-06, "loss": 0.8623, "step": 3982 }, { "epoch": 0.1, "learning_rate": 1.9728787049217684e-06, "loss": 0.876, "step": 3983 }, { "epoch": 0.1, "learning_rate": 1.97285949955637e-06, "loss": 0.96, "step": 3984 }, { "epoch": 0.1, "learning_rate": 1.97284028748699e-06, "loss": 0.7756, "step": 3985 }, { "epoch": 0.1, "learning_rate": 1.9728210687137597e-06, "loss": 0.9248, "step": 3986 }, { "epoch": 0.1, "learning_rate": 1.972801843236812e-06, "loss": 0.8652, "step": 3987 }, { "epoch": 0.1, "learning_rate": 1.9727826110562804e-06, "loss": 1.0176, "step": 3988 }, { "epoch": 0.1, "learning_rate": 1.9727633721722955e-06, "loss": 1.0732, "step": 3989 }, { "epoch": 0.1, "learning_rate": 1.9727441265849914e-06, "loss": 0.9336, "step": 3990 }, { "epoch": 0.1, "learning_rate": 1.9727248742945e-06, "loss": 0.9473, "step": 3991 }, { "epoch": 0.1, "learning_rate": 1.972705615300954e-06, "loss": 1.0498, "step": 3992 }, { "epoch": 0.1, "learning_rate": 1.9726863496044864e-06, "loss": 0.8486, "step": 3993 }, { "epoch": 0.1, "learning_rate": 1.97266707720523e-06, "loss": 1.0439, "step": 3994 }, { "epoch": 0.1, "learning_rate": 1.9726477981033168e-06, "loss": 1.0156, "step": 3995 }, { "epoch": 0.1, "learning_rate": 1.9726285122988807e-06, "loss": 0.9375, "step": 3996 }, { "epoch": 0.1, "learning_rate": 1.9726092197920542e-06, "loss": 0.9775, "step": 3997 }, { "epoch": 0.1, "learning_rate": 1.9725899205829703e-06, "loss": 0.9082, "step": 3998 }, { "epoch": 0.1, "learning_rate": 1.9725706146717614e-06, "loss": 0.9697, "step": 3999 }, { "epoch": 0.1, "learning_rate": 1.972551302058562e-06, "loss": 0.9521, "step": 4000 }, { "epoch": 0.1, "learning_rate": 1.9725319827435034e-06, "loss": 1.0049, "step": 4001 }, { "epoch": 0.1, "learning_rate": 1.9725126567267195e-06, "loss": 0.999, "step": 4002 }, { "epoch": 0.1, "learning_rate": 1.9724933240083442e-06, "loss": 0.8613, "step": 4003 }, { "epoch": 0.1, "learning_rate": 1.97247398458851e-06, "loss": 1.0322, "step": 4004 }, { "epoch": 0.1, "learning_rate": 1.9724546384673493e-06, "loss": 0.8623, "step": 4005 }, { "epoch": 0.1, "learning_rate": 1.9724352856449973e-06, "loss": 1.0869, "step": 4006 }, { "epoch": 0.1, "learning_rate": 1.972415926121586e-06, "loss": 1.0791, "step": 4007 }, { "epoch": 0.1, "learning_rate": 1.972396559897249e-06, "loss": 0.8252, "step": 4008 }, { "epoch": 0.1, "learning_rate": 1.9723771869721206e-06, "loss": 0.9951, "step": 4009 }, { "epoch": 0.1, "learning_rate": 1.972357807346333e-06, "loss": 0.9033, "step": 4010 }, { "epoch": 0.1, "learning_rate": 1.972338421020021e-06, "loss": 0.9199, "step": 4011 }, { "epoch": 0.1, "learning_rate": 1.972319027993317e-06, "loss": 0.8018, "step": 4012 }, { "epoch": 0.1, "learning_rate": 1.972299628266356e-06, "loss": 1.0283, "step": 4013 }, { "epoch": 0.1, "learning_rate": 1.97228022183927e-06, "loss": 0.8584, "step": 4014 }, { "epoch": 0.1, "learning_rate": 1.9722608087121945e-06, "loss": 0.8135, "step": 4015 }, { "epoch": 0.1, "learning_rate": 1.972241388885262e-06, "loss": 1.1162, "step": 4016 }, { "epoch": 0.1, "learning_rate": 1.972221962358607e-06, "loss": 0.7607, "step": 4017 }, { "epoch": 0.1, "learning_rate": 1.9722025291323626e-06, "loss": 1.0449, "step": 4018 }, { "epoch": 0.1, "learning_rate": 1.9721830892066637e-06, "loss": 0.7881, "step": 4019 }, { "epoch": 0.1, "learning_rate": 1.972163642581643e-06, "loss": 0.7793, "step": 4020 }, { "epoch": 0.1, "learning_rate": 1.972144189257436e-06, "loss": 0.8369, "step": 4021 }, { "epoch": 0.1, "learning_rate": 1.972124729234176e-06, "loss": 0.915, "step": 4022 }, { "epoch": 0.1, "learning_rate": 1.9721052625119975e-06, "loss": 0.9043, "step": 4023 }, { "epoch": 0.1, "learning_rate": 1.9720857890910338e-06, "loss": 0.9961, "step": 4024 }, { "epoch": 0.1, "learning_rate": 1.972066308971419e-06, "loss": 0.9932, "step": 4025 }, { "epoch": 0.1, "learning_rate": 1.972046822153289e-06, "loss": 0.8838, "step": 4026 }, { "epoch": 0.1, "learning_rate": 1.9720273286367765e-06, "loss": 0.6909, "step": 4027 }, { "epoch": 0.1, "learning_rate": 1.9720078284220167e-06, "loss": 1.1221, "step": 4028 }, { "epoch": 0.1, "learning_rate": 1.9719883215091433e-06, "loss": 0.9902, "step": 4029 }, { "epoch": 0.1, "learning_rate": 1.971968807898291e-06, "loss": 0.7812, "step": 4030 }, { "epoch": 0.1, "learning_rate": 1.971949287589594e-06, "loss": 1.0889, "step": 4031 }, { "epoch": 0.1, "learning_rate": 1.9719297605831878e-06, "loss": 0.8228, "step": 4032 }, { "epoch": 0.1, "learning_rate": 1.971910226879206e-06, "loss": 0.9961, "step": 4033 }, { "epoch": 0.1, "learning_rate": 1.9718906864777838e-06, "loss": 1.0088, "step": 4034 }, { "epoch": 0.1, "learning_rate": 1.971871139379055e-06, "loss": 0.8945, "step": 4035 }, { "epoch": 0.1, "learning_rate": 1.971851585583155e-06, "loss": 0.8877, "step": 4036 }, { "epoch": 0.1, "learning_rate": 1.9718320250902183e-06, "loss": 0.9531, "step": 4037 }, { "epoch": 0.1, "learning_rate": 1.97181245790038e-06, "loss": 0.873, "step": 4038 }, { "epoch": 0.1, "learning_rate": 1.9717928840137744e-06, "loss": 0.8281, "step": 4039 }, { "epoch": 0.1, "learning_rate": 1.971773303430537e-06, "loss": 0.6963, "step": 4040 }, { "epoch": 0.1, "learning_rate": 1.971753716150802e-06, "loss": 1.0762, "step": 4041 }, { "epoch": 0.1, "learning_rate": 1.9717341221747056e-06, "loss": 1.0059, "step": 4042 }, { "epoch": 0.1, "learning_rate": 1.9717145215023818e-06, "loss": 0.8906, "step": 4043 }, { "epoch": 0.1, "learning_rate": 1.971694914133965e-06, "loss": 1.123, "step": 4044 }, { "epoch": 0.1, "learning_rate": 1.971675300069592e-06, "loss": 1.1104, "step": 4045 }, { "epoch": 0.1, "learning_rate": 1.9716556793093974e-06, "loss": 1.0596, "step": 4046 }, { "epoch": 0.1, "learning_rate": 1.9716360518535156e-06, "loss": 0.833, "step": 4047 }, { "epoch": 0.1, "learning_rate": 1.9716164177020828e-06, "loss": 1.042, "step": 4048 }, { "epoch": 0.1, "learning_rate": 1.9715967768552336e-06, "loss": 0.915, "step": 4049 }, { "epoch": 0.1, "learning_rate": 1.9715771293131034e-06, "loss": 0.9639, "step": 4050 }, { "epoch": 0.1, "learning_rate": 1.9715574750758284e-06, "loss": 0.9453, "step": 4051 }, { "epoch": 0.1, "learning_rate": 1.9715378141435435e-06, "loss": 0.9893, "step": 4052 }, { "epoch": 0.1, "learning_rate": 1.971518146516384e-06, "loss": 0.9365, "step": 4053 }, { "epoch": 0.1, "learning_rate": 1.9714984721944856e-06, "loss": 0.9258, "step": 4054 }, { "epoch": 0.1, "learning_rate": 1.9714787911779844e-06, "loss": 1.1602, "step": 4055 }, { "epoch": 0.1, "learning_rate": 1.9714591034670147e-06, "loss": 1.1182, "step": 4056 }, { "epoch": 0.1, "learning_rate": 1.9714394090617136e-06, "loss": 0.8574, "step": 4057 }, { "epoch": 0.1, "learning_rate": 1.9714197079622158e-06, "loss": 0.9287, "step": 4058 }, { "epoch": 0.1, "learning_rate": 1.9714000001686577e-06, "loss": 0.9258, "step": 4059 }, { "epoch": 0.1, "learning_rate": 1.9713802856811744e-06, "loss": 0.9521, "step": 4060 }, { "epoch": 0.1, "learning_rate": 1.971360564499903e-06, "loss": 0.874, "step": 4061 }, { "epoch": 0.1, "learning_rate": 1.971340836624978e-06, "loss": 0.793, "step": 4062 }, { "epoch": 0.1, "learning_rate": 1.9713211020565362e-06, "loss": 1.1494, "step": 4063 }, { "epoch": 0.1, "learning_rate": 1.971301360794713e-06, "loss": 0.79, "step": 4064 }, { "epoch": 0.1, "learning_rate": 1.9712816128396454e-06, "loss": 0.8965, "step": 4065 }, { "epoch": 0.1, "learning_rate": 1.9712618581914684e-06, "loss": 1.0332, "step": 4066 }, { "epoch": 0.1, "learning_rate": 1.971242096850319e-06, "loss": 0.8359, "step": 4067 }, { "epoch": 0.1, "learning_rate": 1.9712223288163326e-06, "loss": 0.8838, "step": 4068 }, { "epoch": 0.1, "learning_rate": 1.971202554089646e-06, "loss": 0.9189, "step": 4069 }, { "epoch": 0.1, "learning_rate": 1.971182772670395e-06, "loss": 0.7852, "step": 4070 }, { "epoch": 0.1, "learning_rate": 1.9711629845587163e-06, "loss": 0.8828, "step": 4071 }, { "epoch": 0.1, "learning_rate": 1.971143189754746e-06, "loss": 0.8164, "step": 4072 }, { "epoch": 0.1, "learning_rate": 1.971123388258621e-06, "loss": 0.8032, "step": 4073 }, { "epoch": 0.1, "learning_rate": 1.9711035800704773e-06, "loss": 0.8345, "step": 4074 }, { "epoch": 0.1, "learning_rate": 1.9710837651904515e-06, "loss": 0.9355, "step": 4075 }, { "epoch": 0.1, "learning_rate": 1.97106394361868e-06, "loss": 1.042, "step": 4076 }, { "epoch": 0.1, "learning_rate": 1.9710441153552993e-06, "loss": 1.0791, "step": 4077 }, { "epoch": 0.1, "learning_rate": 1.971024280400447e-06, "loss": 0.7861, "step": 4078 }, { "epoch": 0.1, "learning_rate": 1.9710044387542583e-06, "loss": 0.8501, "step": 4079 }, { "epoch": 0.1, "learning_rate": 1.970984590416871e-06, "loss": 0.5171, "step": 4080 }, { "epoch": 0.1, "learning_rate": 1.9709647353884217e-06, "loss": 0.9697, "step": 4081 }, { "epoch": 0.1, "learning_rate": 1.970944873669047e-06, "loss": 0.7319, "step": 4082 }, { "epoch": 0.1, "learning_rate": 1.9709250052588838e-06, "loss": 0.7734, "step": 4083 }, { "epoch": 0.1, "learning_rate": 1.970905130158069e-06, "loss": 0.8809, "step": 4084 }, { "epoch": 0.1, "learning_rate": 1.9708852483667393e-06, "loss": 0.8789, "step": 4085 }, { "epoch": 0.1, "learning_rate": 1.970865359885033e-06, "loss": 0.9688, "step": 4086 }, { "epoch": 0.1, "learning_rate": 1.970845464713085e-06, "loss": 0.7573, "step": 4087 }, { "epoch": 0.1, "learning_rate": 1.9708255628510344e-06, "loss": 1.1367, "step": 4088 }, { "epoch": 0.1, "learning_rate": 1.970805654299017e-06, "loss": 1.0801, "step": 4089 }, { "epoch": 0.1, "learning_rate": 1.970785739057171e-06, "loss": 1.0654, "step": 4090 }, { "epoch": 0.1, "learning_rate": 1.9707658171256326e-06, "loss": 0.8672, "step": 4091 }, { "epoch": 0.1, "learning_rate": 1.9707458885045395e-06, "loss": 1.0713, "step": 4092 }, { "epoch": 0.1, "learning_rate": 1.9707259531940295e-06, "loss": 0.9482, "step": 4093 }, { "epoch": 0.1, "learning_rate": 1.97070601119424e-06, "loss": 0.8809, "step": 4094 }, { "epoch": 0.1, "learning_rate": 1.9706860625053078e-06, "loss": 1.1396, "step": 4095 }, { "epoch": 0.1, "learning_rate": 1.97066610712737e-06, "loss": 0.9102, "step": 4096 }, { "epoch": 0.11, "learning_rate": 1.970646145060565e-06, "loss": 0.8091, "step": 4097 }, { "epoch": 0.11, "learning_rate": 1.970626176305031e-06, "loss": 0.8896, "step": 4098 }, { "epoch": 0.11, "learning_rate": 1.970606200860904e-06, "loss": 0.8682, "step": 4099 }, { "epoch": 0.11, "learning_rate": 1.970586218728322e-06, "loss": 0.7229, "step": 4100 }, { "epoch": 0.11, "learning_rate": 1.9705662299074235e-06, "loss": 0.9893, "step": 4101 }, { "epoch": 0.11, "learning_rate": 1.9705462343983454e-06, "loss": 1.0615, "step": 4102 }, { "epoch": 0.11, "learning_rate": 1.970526232201226e-06, "loss": 1.0566, "step": 4103 }, { "epoch": 0.11, "learning_rate": 1.970506223316203e-06, "loss": 0.8394, "step": 4104 }, { "epoch": 0.11, "learning_rate": 1.9704862077434146e-06, "loss": 0.8198, "step": 4105 }, { "epoch": 0.11, "learning_rate": 1.970466185482998e-06, "loss": 0.7607, "step": 4106 }, { "epoch": 0.11, "learning_rate": 1.9704461565350923e-06, "loss": 0.7827, "step": 4107 }, { "epoch": 0.11, "learning_rate": 1.9704261208998337e-06, "loss": 0.874, "step": 4108 }, { "epoch": 0.11, "learning_rate": 1.9704060785773623e-06, "loss": 0.9248, "step": 4109 }, { "epoch": 0.11, "learning_rate": 1.9703860295678147e-06, "loss": 1.0449, "step": 4110 }, { "epoch": 0.11, "learning_rate": 1.97036597387133e-06, "loss": 1.0264, "step": 4111 }, { "epoch": 0.11, "learning_rate": 1.9703459114880458e-06, "loss": 0.8535, "step": 4112 }, { "epoch": 0.11, "learning_rate": 1.970325842418101e-06, "loss": 0.9912, "step": 4113 }, { "epoch": 0.11, "learning_rate": 1.970305766661633e-06, "loss": 0.917, "step": 4114 }, { "epoch": 0.11, "learning_rate": 1.9702856842187807e-06, "loss": 0.8306, "step": 4115 }, { "epoch": 0.11, "learning_rate": 1.970265595089683e-06, "loss": 0.9561, "step": 4116 }, { "epoch": 0.11, "learning_rate": 1.970245499274477e-06, "loss": 1.0127, "step": 4117 }, { "epoch": 0.11, "learning_rate": 1.970225396773302e-06, "loss": 0.9302, "step": 4118 }, { "epoch": 0.11, "learning_rate": 1.9702052875862967e-06, "loss": 0.6108, "step": 4119 }, { "epoch": 0.11, "learning_rate": 1.9701851717135997e-06, "loss": 1.166, "step": 4120 }, { "epoch": 0.11, "learning_rate": 1.970165049155349e-06, "loss": 0.8994, "step": 4121 }, { "epoch": 0.11, "learning_rate": 1.970144919911684e-06, "loss": 0.9668, "step": 4122 }, { "epoch": 0.11, "learning_rate": 1.9701247839827427e-06, "loss": 0.875, "step": 4123 }, { "epoch": 0.11, "learning_rate": 1.970104641368664e-06, "loss": 0.5879, "step": 4124 }, { "epoch": 0.11, "learning_rate": 1.970084492069587e-06, "loss": 1.083, "step": 4125 }, { "epoch": 0.11, "learning_rate": 1.970064336085651e-06, "loss": 0.9561, "step": 4126 }, { "epoch": 0.11, "learning_rate": 1.9700441734169937e-06, "loss": 0.8184, "step": 4127 }, { "epoch": 0.11, "learning_rate": 1.970024004063755e-06, "loss": 0.8857, "step": 4128 }, { "epoch": 0.11, "learning_rate": 1.970003828026073e-06, "loss": 0.8442, "step": 4129 }, { "epoch": 0.11, "learning_rate": 1.969983645304088e-06, "loss": 0.8438, "step": 4130 }, { "epoch": 0.11, "learning_rate": 1.969963455897938e-06, "loss": 0.9004, "step": 4131 }, { "epoch": 0.11, "learning_rate": 1.9699432598077627e-06, "loss": 0.9053, "step": 4132 }, { "epoch": 0.11, "learning_rate": 1.969923057033701e-06, "loss": 1.0908, "step": 4133 }, { "epoch": 0.11, "learning_rate": 1.969902847575892e-06, "loss": 0.8467, "step": 4134 }, { "epoch": 0.11, "learning_rate": 1.9698826314344756e-06, "loss": 1.0869, "step": 4135 }, { "epoch": 0.11, "learning_rate": 1.96986240860959e-06, "loss": 1.0703, "step": 4136 }, { "epoch": 0.11, "learning_rate": 1.969842179101376e-06, "loss": 1.1797, "step": 4137 }, { "epoch": 0.11, "learning_rate": 1.9698219429099713e-06, "loss": 0.8652, "step": 4138 }, { "epoch": 0.11, "learning_rate": 1.969801700035517e-06, "loss": 0.7227, "step": 4139 }, { "epoch": 0.11, "learning_rate": 1.9697814504781514e-06, "loss": 0.8379, "step": 4140 }, { "epoch": 0.11, "learning_rate": 1.969761194238015e-06, "loss": 0.8564, "step": 4141 }, { "epoch": 0.11, "learning_rate": 1.9697409313152465e-06, "loss": 0.9795, "step": 4142 }, { "epoch": 0.11, "learning_rate": 1.969720661709986e-06, "loss": 0.8955, "step": 4143 }, { "epoch": 0.11, "learning_rate": 1.969700385422373e-06, "loss": 1.0068, "step": 4144 }, { "epoch": 0.11, "learning_rate": 1.9696801024525472e-06, "loss": 1.0479, "step": 4145 }, { "epoch": 0.11, "learning_rate": 1.969659812800649e-06, "loss": 1.0615, "step": 4146 }, { "epoch": 0.11, "learning_rate": 1.969639516466817e-06, "loss": 0.9736, "step": 4147 }, { "epoch": 0.11, "learning_rate": 1.9696192134511923e-06, "loss": 0.8096, "step": 4148 }, { "epoch": 0.11, "learning_rate": 1.969598903753914e-06, "loss": 0.9844, "step": 4149 }, { "epoch": 0.11, "learning_rate": 1.969578587375123e-06, "loss": 0.9385, "step": 4150 }, { "epoch": 0.11, "learning_rate": 1.969558264314958e-06, "loss": 1.0068, "step": 4151 }, { "epoch": 0.11, "learning_rate": 1.9695379345735596e-06, "loss": 0.8867, "step": 4152 }, { "epoch": 0.11, "learning_rate": 1.9695175981510684e-06, "loss": 0.9043, "step": 4153 }, { "epoch": 0.11, "learning_rate": 1.969497255047624e-06, "loss": 0.8574, "step": 4154 }, { "epoch": 0.11, "learning_rate": 1.9694769052633666e-06, "loss": 1.0039, "step": 4155 }, { "epoch": 0.11, "learning_rate": 1.9694565487984364e-06, "loss": 0.9297, "step": 4156 }, { "epoch": 0.11, "learning_rate": 1.969436185652974e-06, "loss": 0.9844, "step": 4157 }, { "epoch": 0.11, "learning_rate": 1.9694158158271192e-06, "loss": 0.96, "step": 4158 }, { "epoch": 0.11, "learning_rate": 1.969395439321013e-06, "loss": 1.0469, "step": 4159 }, { "epoch": 0.11, "learning_rate": 1.9693750561347954e-06, "loss": 0.9756, "step": 4160 }, { "epoch": 0.11, "learning_rate": 1.969354666268607e-06, "loss": 1.0986, "step": 4161 }, { "epoch": 0.11, "learning_rate": 1.969334269722588e-06, "loss": 0.7256, "step": 4162 }, { "epoch": 0.11, "learning_rate": 1.9693138664968797e-06, "loss": 0.9614, "step": 4163 }, { "epoch": 0.11, "learning_rate": 1.9692934565916215e-06, "loss": 0.9912, "step": 4164 }, { "epoch": 0.11, "learning_rate": 1.969273040006956e-06, "loss": 1.1162, "step": 4165 }, { "epoch": 0.11, "learning_rate": 1.9692526167430215e-06, "loss": 0.8979, "step": 4166 }, { "epoch": 0.11, "learning_rate": 1.96923218679996e-06, "loss": 0.877, "step": 4167 }, { "epoch": 0.11, "learning_rate": 1.9692117501779127e-06, "loss": 0.9385, "step": 4168 }, { "epoch": 0.11, "learning_rate": 1.9691913068770198e-06, "loss": 0.731, "step": 4169 }, { "epoch": 0.11, "learning_rate": 1.9691708568974224e-06, "loss": 1.1953, "step": 4170 }, { "epoch": 0.11, "learning_rate": 1.9691504002392608e-06, "loss": 1.0586, "step": 4171 }, { "epoch": 0.11, "learning_rate": 1.9691299369026767e-06, "loss": 0.9844, "step": 4172 }, { "epoch": 0.11, "learning_rate": 1.969109466887811e-06, "loss": 0.9229, "step": 4173 }, { "epoch": 0.11, "learning_rate": 1.969088990194805e-06, "loss": 1.0283, "step": 4174 }, { "epoch": 0.11, "learning_rate": 1.9690685068237986e-06, "loss": 0.8535, "step": 4175 }, { "epoch": 0.11, "learning_rate": 1.9690480167749346e-06, "loss": 0.875, "step": 4176 }, { "epoch": 0.11, "learning_rate": 1.969027520048353e-06, "loss": 0.9121, "step": 4177 }, { "epoch": 0.11, "learning_rate": 1.9690070166441954e-06, "loss": 0.9619, "step": 4178 }, { "epoch": 0.11, "learning_rate": 1.968986506562603e-06, "loss": 0.9756, "step": 4179 }, { "epoch": 0.11, "learning_rate": 1.9689659898037173e-06, "loss": 0.9092, "step": 4180 }, { "epoch": 0.11, "learning_rate": 1.96894546636768e-06, "loss": 0.7373, "step": 4181 }, { "epoch": 0.11, "learning_rate": 1.968924936254632e-06, "loss": 0.9287, "step": 4182 }, { "epoch": 0.11, "learning_rate": 1.9689043994647148e-06, "loss": 0.9824, "step": 4183 }, { "epoch": 0.11, "learning_rate": 1.9688838559980702e-06, "loss": 0.9951, "step": 4184 }, { "epoch": 0.11, "learning_rate": 1.9688633058548397e-06, "loss": 0.9268, "step": 4185 }, { "epoch": 0.11, "learning_rate": 1.968842749035165e-06, "loss": 0.9668, "step": 4186 }, { "epoch": 0.11, "learning_rate": 1.9688221855391873e-06, "loss": 0.8438, "step": 4187 }, { "epoch": 0.11, "learning_rate": 1.9688016153670483e-06, "loss": 0.7729, "step": 4188 }, { "epoch": 0.11, "learning_rate": 1.9687810385188904e-06, "loss": 0.7739, "step": 4189 }, { "epoch": 0.11, "learning_rate": 1.968760454994855e-06, "loss": 0.8457, "step": 4190 }, { "epoch": 0.11, "learning_rate": 1.968739864795084e-06, "loss": 0.6318, "step": 4191 }, { "epoch": 0.11, "learning_rate": 1.9687192679197194e-06, "loss": 0.7949, "step": 4192 }, { "epoch": 0.11, "learning_rate": 1.9686986643689033e-06, "loss": 0.9941, "step": 4193 }, { "epoch": 0.11, "learning_rate": 1.968678054142777e-06, "loss": 0.7578, "step": 4194 }, { "epoch": 0.11, "learning_rate": 1.9686574372414827e-06, "loss": 0.7505, "step": 4195 }, { "epoch": 0.11, "learning_rate": 1.968636813665163e-06, "loss": 1.0195, "step": 4196 }, { "epoch": 0.11, "learning_rate": 1.9686161834139594e-06, "loss": 0.9824, "step": 4197 }, { "epoch": 0.11, "learning_rate": 1.9685955464880145e-06, "loss": 1.0107, "step": 4198 }, { "epoch": 0.11, "learning_rate": 1.9685749028874706e-06, "loss": 0.9053, "step": 4199 }, { "epoch": 0.11, "learning_rate": 1.9685542526124698e-06, "loss": 0.7881, "step": 4200 }, { "epoch": 0.11, "learning_rate": 1.968533595663154e-06, "loss": 0.7734, "step": 4201 }, { "epoch": 0.11, "learning_rate": 1.968512932039666e-06, "loss": 1.0234, "step": 4202 }, { "epoch": 0.11, "learning_rate": 1.968492261742148e-06, "loss": 0.9424, "step": 4203 }, { "epoch": 0.11, "learning_rate": 1.9684715847707425e-06, "loss": 0.9141, "step": 4204 }, { "epoch": 0.11, "learning_rate": 1.968450901125592e-06, "loss": 1.0635, "step": 4205 }, { "epoch": 0.11, "learning_rate": 1.9684302108068393e-06, "loss": 1.0596, "step": 4206 }, { "epoch": 0.11, "learning_rate": 1.968409513814626e-06, "loss": 0.8389, "step": 4207 }, { "epoch": 0.11, "learning_rate": 1.9683888101490964e-06, "loss": 1.0693, "step": 4208 }, { "epoch": 0.11, "learning_rate": 1.9683680998103912e-06, "loss": 0.8076, "step": 4209 }, { "epoch": 0.11, "learning_rate": 1.9683473827986547e-06, "loss": 0.9678, "step": 4210 }, { "epoch": 0.11, "learning_rate": 1.968326659114029e-06, "loss": 1.0166, "step": 4211 }, { "epoch": 0.11, "learning_rate": 1.968305928756657e-06, "loss": 0.877, "step": 4212 }, { "epoch": 0.11, "learning_rate": 1.9682851917266815e-06, "loss": 0.9639, "step": 4213 }, { "epoch": 0.11, "learning_rate": 1.968264448024245e-06, "loss": 0.9414, "step": 4214 }, { "epoch": 0.11, "learning_rate": 1.968243697649492e-06, "loss": 0.9199, "step": 4215 }, { "epoch": 0.11, "learning_rate": 1.9682229406025634e-06, "loss": 0.8164, "step": 4216 }, { "epoch": 0.11, "learning_rate": 1.968202176883603e-06, "loss": 0.9258, "step": 4217 }, { "epoch": 0.11, "learning_rate": 1.968181406492755e-06, "loss": 0.8662, "step": 4218 }, { "epoch": 0.11, "learning_rate": 1.968160629430161e-06, "loss": 0.894, "step": 4219 }, { "epoch": 0.11, "learning_rate": 1.968139845695965e-06, "loss": 1.1016, "step": 4220 }, { "epoch": 0.11, "learning_rate": 1.9681190552903096e-06, "loss": 0.8984, "step": 4221 }, { "epoch": 0.11, "learning_rate": 1.968098258213339e-06, "loss": 1.0225, "step": 4222 }, { "epoch": 0.11, "learning_rate": 1.9680774544651956e-06, "loss": 0.7485, "step": 4223 }, { "epoch": 0.11, "learning_rate": 1.9680566440460237e-06, "loss": 0.7822, "step": 4224 }, { "epoch": 0.11, "learning_rate": 1.968035826955966e-06, "loss": 0.8774, "step": 4225 }, { "epoch": 0.11, "learning_rate": 1.9680150031951657e-06, "loss": 1.0625, "step": 4226 }, { "epoch": 0.11, "learning_rate": 1.9679941727637667e-06, "loss": 1.0195, "step": 4227 }, { "epoch": 0.11, "learning_rate": 1.967973335661913e-06, "loss": 0.8022, "step": 4228 }, { "epoch": 0.11, "learning_rate": 1.9679524918897473e-06, "loss": 0.606, "step": 4229 }, { "epoch": 0.11, "learning_rate": 1.967931641447414e-06, "loss": 1.0977, "step": 4230 }, { "epoch": 0.11, "learning_rate": 1.967910784335056e-06, "loss": 0.9805, "step": 4231 }, { "epoch": 0.11, "learning_rate": 1.967889920552818e-06, "loss": 0.9307, "step": 4232 }, { "epoch": 0.11, "learning_rate": 1.967869050100843e-06, "loss": 0.9131, "step": 4233 }, { "epoch": 0.11, "learning_rate": 1.967848172979275e-06, "loss": 0.999, "step": 4234 }, { "epoch": 0.11, "learning_rate": 1.967827289188258e-06, "loss": 0.9873, "step": 4235 }, { "epoch": 0.11, "learning_rate": 1.967806398727936e-06, "loss": 0.8105, "step": 4236 }, { "epoch": 0.11, "learning_rate": 1.9677855015984528e-06, "loss": 0.9258, "step": 4237 }, { "epoch": 0.11, "learning_rate": 1.967764597799952e-06, "loss": 0.8042, "step": 4238 }, { "epoch": 0.11, "learning_rate": 1.967743687332578e-06, "loss": 0.959, "step": 4239 }, { "epoch": 0.11, "learning_rate": 1.9677227701964757e-06, "loss": 0.9199, "step": 4240 }, { "epoch": 0.11, "learning_rate": 1.967701846391788e-06, "loss": 0.8174, "step": 4241 }, { "epoch": 0.11, "learning_rate": 1.9676809159186595e-06, "loss": 1.0625, "step": 4242 }, { "epoch": 0.11, "learning_rate": 1.9676599787772346e-06, "loss": 0.9053, "step": 4243 }, { "epoch": 0.11, "learning_rate": 1.9676390349676576e-06, "loss": 1.0273, "step": 4244 }, { "epoch": 0.11, "learning_rate": 1.9676180844900725e-06, "loss": 0.8516, "step": 4245 }, { "epoch": 0.11, "learning_rate": 1.9675971273446237e-06, "loss": 0.8772, "step": 4246 }, { "epoch": 0.11, "learning_rate": 1.967576163531456e-06, "loss": 1.1572, "step": 4247 }, { "epoch": 0.11, "learning_rate": 1.967555193050714e-06, "loss": 0.917, "step": 4248 }, { "epoch": 0.11, "learning_rate": 1.967534215902541e-06, "loss": 1.0107, "step": 4249 }, { "epoch": 0.11, "learning_rate": 1.967513232087083e-06, "loss": 1.0303, "step": 4250 }, { "epoch": 0.11, "learning_rate": 1.967492241604484e-06, "loss": 0.9229, "step": 4251 }, { "epoch": 0.11, "learning_rate": 1.967471244454889e-06, "loss": 1.0859, "step": 4252 }, { "epoch": 0.11, "learning_rate": 1.9674502406384415e-06, "loss": 1.0605, "step": 4253 }, { "epoch": 0.11, "learning_rate": 1.9674292301552878e-06, "loss": 0.9468, "step": 4254 }, { "epoch": 0.11, "learning_rate": 1.9674082130055714e-06, "loss": 1.291, "step": 4255 }, { "epoch": 0.11, "learning_rate": 1.967387189189438e-06, "loss": 1.082, "step": 4256 }, { "epoch": 0.11, "learning_rate": 1.9673661587070326e-06, "loss": 1.0449, "step": 4257 }, { "epoch": 0.11, "learning_rate": 1.967345121558499e-06, "loss": 0.9941, "step": 4258 }, { "epoch": 0.11, "learning_rate": 1.967324077743983e-06, "loss": 1.1279, "step": 4259 }, { "epoch": 0.11, "learning_rate": 1.9673030272636295e-06, "loss": 0.7354, "step": 4260 }, { "epoch": 0.11, "learning_rate": 1.9672819701175837e-06, "loss": 0.9336, "step": 4261 }, { "epoch": 0.11, "learning_rate": 1.9672609063059907e-06, "loss": 0.9531, "step": 4262 }, { "epoch": 0.11, "learning_rate": 1.967239835828995e-06, "loss": 0.7742, "step": 4263 }, { "epoch": 0.11, "learning_rate": 1.9672187586867426e-06, "loss": 0.752, "step": 4264 }, { "epoch": 0.11, "learning_rate": 1.9671976748793784e-06, "loss": 0.8975, "step": 4265 }, { "epoch": 0.11, "learning_rate": 1.9671765844070478e-06, "loss": 0.9912, "step": 4266 }, { "epoch": 0.11, "learning_rate": 1.967155487269896e-06, "loss": 0.7002, "step": 4267 }, { "epoch": 0.11, "learning_rate": 1.967134383468068e-06, "loss": 0.9795, "step": 4268 }, { "epoch": 0.11, "learning_rate": 1.96711327300171e-06, "loss": 1.043, "step": 4269 }, { "epoch": 0.11, "learning_rate": 1.9670921558709673e-06, "loss": 0.7002, "step": 4270 }, { "epoch": 0.11, "learning_rate": 1.967071032075985e-06, "loss": 1.1182, "step": 4271 }, { "epoch": 0.11, "learning_rate": 1.967049901616909e-06, "loss": 0.9805, "step": 4272 }, { "epoch": 0.11, "learning_rate": 1.967028764493885e-06, "loss": 1.2305, "step": 4273 }, { "epoch": 0.11, "learning_rate": 1.9670076207070583e-06, "loss": 0.8701, "step": 4274 }, { "epoch": 0.11, "learning_rate": 1.9669864702565746e-06, "loss": 1.0898, "step": 4275 }, { "epoch": 0.11, "learning_rate": 1.96696531314258e-06, "loss": 0.7871, "step": 4276 }, { "epoch": 0.11, "learning_rate": 1.9669441493652204e-06, "loss": 0.9797, "step": 4277 }, { "epoch": 0.11, "learning_rate": 1.966922978924641e-06, "loss": 0.9766, "step": 4278 }, { "epoch": 0.11, "learning_rate": 1.966901801820988e-06, "loss": 0.8799, "step": 4279 }, { "epoch": 0.11, "learning_rate": 1.9668806180544074e-06, "loss": 1.0547, "step": 4280 }, { "epoch": 0.11, "learning_rate": 1.9668594276250456e-06, "loss": 0.7957, "step": 4281 }, { "epoch": 0.11, "learning_rate": 1.966838230533048e-06, "loss": 0.9912, "step": 4282 }, { "epoch": 0.11, "learning_rate": 1.9668170267785606e-06, "loss": 1.0234, "step": 4283 }, { "epoch": 0.11, "learning_rate": 1.9667958163617297e-06, "loss": 0.9336, "step": 4284 }, { "epoch": 0.11, "learning_rate": 1.9667745992827017e-06, "loss": 0.918, "step": 4285 }, { "epoch": 0.11, "learning_rate": 1.9667533755416224e-06, "loss": 0.7212, "step": 4286 }, { "epoch": 0.11, "learning_rate": 1.9667321451386387e-06, "loss": 0.5596, "step": 4287 }, { "epoch": 0.11, "learning_rate": 1.9667109080738963e-06, "loss": 0.9756, "step": 4288 }, { "epoch": 0.11, "learning_rate": 1.966689664347542e-06, "loss": 0.8882, "step": 4289 }, { "epoch": 0.11, "learning_rate": 1.966668413959721e-06, "loss": 1.0371, "step": 4290 }, { "epoch": 0.11, "learning_rate": 1.966647156910582e-06, "loss": 0.8398, "step": 4291 }, { "epoch": 0.11, "learning_rate": 1.9666258932002692e-06, "loss": 0.9688, "step": 4292 }, { "epoch": 0.11, "learning_rate": 1.9666046228289306e-06, "loss": 0.9736, "step": 4293 }, { "epoch": 0.11, "learning_rate": 1.9665833457967115e-06, "loss": 1.0684, "step": 4294 }, { "epoch": 0.11, "learning_rate": 1.96656206210376e-06, "loss": 0.7754, "step": 4295 }, { "epoch": 0.11, "learning_rate": 1.9665407717502217e-06, "loss": 0.8623, "step": 4296 }, { "epoch": 0.11, "learning_rate": 1.966519474736244e-06, "loss": 1.0107, "step": 4297 }, { "epoch": 0.11, "learning_rate": 1.9664981710619727e-06, "loss": 1.0234, "step": 4298 }, { "epoch": 0.11, "learning_rate": 1.9664768607275556e-06, "loss": 1.043, "step": 4299 }, { "epoch": 0.11, "learning_rate": 1.966455543733139e-06, "loss": 0.8408, "step": 4300 }, { "epoch": 0.11, "learning_rate": 1.9664342200788697e-06, "loss": 0.9243, "step": 4301 }, { "epoch": 0.11, "learning_rate": 1.9664128897648953e-06, "loss": 0.9922, "step": 4302 }, { "epoch": 0.11, "learning_rate": 1.9663915527913623e-06, "loss": 0.9316, "step": 4303 }, { "epoch": 0.11, "learning_rate": 1.966370209158418e-06, "loss": 1.0244, "step": 4304 }, { "epoch": 0.11, "learning_rate": 1.966348858866209e-06, "loss": 0.9316, "step": 4305 }, { "epoch": 0.11, "learning_rate": 1.9663275019148827e-06, "loss": 1.0107, "step": 4306 }, { "epoch": 0.11, "learning_rate": 1.9663061383045864e-06, "loss": 1.0469, "step": 4307 }, { "epoch": 0.11, "learning_rate": 1.966284768035467e-06, "loss": 0.7871, "step": 4308 }, { "epoch": 0.11, "learning_rate": 1.9662633911076723e-06, "loss": 0.9307, "step": 4309 }, { "epoch": 0.11, "learning_rate": 1.966242007521349e-06, "loss": 1.0068, "step": 4310 }, { "epoch": 0.11, "learning_rate": 1.966220617276645e-06, "loss": 0.9229, "step": 4311 }, { "epoch": 0.11, "learning_rate": 1.966199220373707e-06, "loss": 0.7954, "step": 4312 }, { "epoch": 0.11, "learning_rate": 1.966177816812683e-06, "loss": 1.0498, "step": 4313 }, { "epoch": 0.11, "learning_rate": 1.9661564065937205e-06, "loss": 0.8594, "step": 4314 }, { "epoch": 0.11, "learning_rate": 1.966134989716967e-06, "loss": 0.832, "step": 4315 }, { "epoch": 0.11, "learning_rate": 1.96611356618257e-06, "loss": 1.0068, "step": 4316 }, { "epoch": 0.11, "learning_rate": 1.966092135990677e-06, "loss": 0.981, "step": 4317 }, { "epoch": 0.11, "learning_rate": 1.966070699141436e-06, "loss": 0.915, "step": 4318 }, { "epoch": 0.11, "learning_rate": 1.9660492556349943e-06, "loss": 0.7178, "step": 4319 }, { "epoch": 0.11, "learning_rate": 1.9660278054714995e-06, "loss": 0.9521, "step": 4320 }, { "epoch": 0.11, "learning_rate": 1.9660063486511003e-06, "loss": 0.8682, "step": 4321 }, { "epoch": 0.11, "learning_rate": 1.965984885173944e-06, "loss": 0.7876, "step": 4322 }, { "epoch": 0.11, "learning_rate": 1.9659634150401784e-06, "loss": 1.0752, "step": 4323 }, { "epoch": 0.11, "learning_rate": 1.9659419382499518e-06, "loss": 0.873, "step": 4324 }, { "epoch": 0.11, "learning_rate": 1.965920454803412e-06, "loss": 0.9727, "step": 4325 }, { "epoch": 0.11, "learning_rate": 1.965898964700707e-06, "loss": 1.0068, "step": 4326 }, { "epoch": 0.11, "learning_rate": 1.965877467941985e-06, "loss": 0.8013, "step": 4327 }, { "epoch": 0.11, "learning_rate": 1.9658559645273937e-06, "loss": 0.7939, "step": 4328 }, { "epoch": 0.11, "learning_rate": 1.965834454457082e-06, "loss": 0.8613, "step": 4329 }, { "epoch": 0.11, "learning_rate": 1.9658129377311975e-06, "loss": 0.8359, "step": 4330 }, { "epoch": 0.11, "learning_rate": 1.9657914143498893e-06, "loss": 0.75, "step": 4331 }, { "epoch": 0.11, "learning_rate": 1.9657698843133047e-06, "loss": 0.833, "step": 4332 }, { "epoch": 0.11, "learning_rate": 1.965748347621593e-06, "loss": 0.7847, "step": 4333 }, { "epoch": 0.11, "learning_rate": 1.9657268042749015e-06, "loss": 0.9785, "step": 4334 }, { "epoch": 0.11, "learning_rate": 1.9657052542733793e-06, "loss": 0.9102, "step": 4335 }, { "epoch": 0.11, "learning_rate": 1.9656836976171754e-06, "loss": 1.335, "step": 4336 }, { "epoch": 0.11, "learning_rate": 1.9656621343064376e-06, "loss": 0.9014, "step": 4337 }, { "epoch": 0.11, "learning_rate": 1.965640564341315e-06, "loss": 0.9253, "step": 4338 }, { "epoch": 0.11, "learning_rate": 1.9656189877219556e-06, "loss": 0.9023, "step": 4339 }, { "epoch": 0.11, "learning_rate": 1.965597404448509e-06, "loss": 0.8857, "step": 4340 }, { "epoch": 0.11, "learning_rate": 1.9655758145211226e-06, "loss": 0.7158, "step": 4341 }, { "epoch": 0.11, "learning_rate": 1.9655542179399467e-06, "loss": 1.0186, "step": 4342 }, { "epoch": 0.11, "learning_rate": 1.9655326147051287e-06, "loss": 1.1797, "step": 4343 }, { "epoch": 0.11, "learning_rate": 1.9655110048168186e-06, "loss": 0.8462, "step": 4344 }, { "epoch": 0.11, "learning_rate": 1.9654893882751647e-06, "loss": 1.0371, "step": 4345 }, { "epoch": 0.11, "learning_rate": 1.965467765080316e-06, "loss": 0.749, "step": 4346 }, { "epoch": 0.11, "learning_rate": 1.965446135232422e-06, "loss": 0.8506, "step": 4347 }, { "epoch": 0.11, "learning_rate": 1.9654244987316315e-06, "loss": 1.0898, "step": 4348 }, { "epoch": 0.11, "learning_rate": 1.9654028555780934e-06, "loss": 0.7068, "step": 4349 }, { "epoch": 0.11, "learning_rate": 1.9653812057719564e-06, "loss": 0.9102, "step": 4350 }, { "epoch": 0.11, "learning_rate": 1.965359549313371e-06, "loss": 0.9521, "step": 4351 }, { "epoch": 0.11, "learning_rate": 1.965337886202485e-06, "loss": 0.9463, "step": 4352 }, { "epoch": 0.11, "learning_rate": 1.9653162164394487e-06, "loss": 0.7939, "step": 4353 }, { "epoch": 0.11, "learning_rate": 1.965294540024411e-06, "loss": 0.915, "step": 4354 }, { "epoch": 0.11, "learning_rate": 1.965272856957521e-06, "loss": 0.9463, "step": 4355 }, { "epoch": 0.11, "learning_rate": 1.9652511672389286e-06, "loss": 1.0742, "step": 4356 }, { "epoch": 0.11, "learning_rate": 1.9652294708687833e-06, "loss": 0.8271, "step": 4357 }, { "epoch": 0.11, "learning_rate": 1.9652077678472347e-06, "loss": 1.1113, "step": 4358 }, { "epoch": 0.11, "learning_rate": 1.9651860581744315e-06, "loss": 1.0225, "step": 4359 }, { "epoch": 0.11, "learning_rate": 1.965164341850524e-06, "loss": 0.8398, "step": 4360 }, { "epoch": 0.11, "learning_rate": 1.965142618875662e-06, "loss": 0.8193, "step": 4361 }, { "epoch": 0.11, "learning_rate": 1.9651208892499945e-06, "loss": 1.0479, "step": 4362 }, { "epoch": 0.11, "learning_rate": 1.9650991529736723e-06, "loss": 0.8623, "step": 4363 }, { "epoch": 0.11, "learning_rate": 1.965077410046844e-06, "loss": 0.8809, "step": 4364 }, { "epoch": 0.11, "learning_rate": 1.96505566046966e-06, "loss": 0.7996, "step": 4365 }, { "epoch": 0.11, "learning_rate": 1.9650339042422705e-06, "loss": 0.9121, "step": 4366 }, { "epoch": 0.11, "learning_rate": 1.965012141364825e-06, "loss": 0.6411, "step": 4367 }, { "epoch": 0.11, "learning_rate": 1.9649903718374735e-06, "loss": 0.8315, "step": 4368 }, { "epoch": 0.11, "learning_rate": 1.964968595660366e-06, "loss": 1.0449, "step": 4369 }, { "epoch": 0.11, "learning_rate": 1.964946812833653e-06, "loss": 0.9277, "step": 4370 }, { "epoch": 0.11, "learning_rate": 1.9649250233574833e-06, "loss": 1.0576, "step": 4371 }, { "epoch": 0.11, "learning_rate": 1.9649032272320087e-06, "loss": 1.083, "step": 4372 }, { "epoch": 0.11, "learning_rate": 1.9648814244573783e-06, "loss": 1.0371, "step": 4373 }, { "epoch": 0.11, "learning_rate": 1.964859615033743e-06, "loss": 0.9893, "step": 4374 }, { "epoch": 0.11, "learning_rate": 1.9648377989612527e-06, "loss": 0.9736, "step": 4375 }, { "epoch": 0.11, "learning_rate": 1.9648159762400578e-06, "loss": 0.9004, "step": 4376 }, { "epoch": 0.11, "learning_rate": 1.9647941468703085e-06, "loss": 1.0762, "step": 4377 }, { "epoch": 0.11, "learning_rate": 1.9647723108521557e-06, "loss": 1.0322, "step": 4378 }, { "epoch": 0.11, "learning_rate": 1.96475046818575e-06, "loss": 0.9692, "step": 4379 }, { "epoch": 0.11, "learning_rate": 1.964728618871241e-06, "loss": 0.8643, "step": 4380 }, { "epoch": 0.11, "learning_rate": 1.96470676290878e-06, "loss": 1.0488, "step": 4381 }, { "epoch": 0.11, "learning_rate": 1.964684900298517e-06, "loss": 1.001, "step": 4382 }, { "epoch": 0.11, "learning_rate": 1.9646630310406036e-06, "loss": 0.9492, "step": 4383 }, { "epoch": 0.11, "learning_rate": 1.96464115513519e-06, "loss": 0.6587, "step": 4384 }, { "epoch": 0.11, "learning_rate": 1.9646192725824265e-06, "loss": 0.958, "step": 4385 }, { "epoch": 0.11, "learning_rate": 1.9645973833824647e-06, "loss": 0.9258, "step": 4386 }, { "epoch": 0.11, "learning_rate": 1.964575487535455e-06, "loss": 0.6914, "step": 4387 }, { "epoch": 0.11, "learning_rate": 1.964553585041548e-06, "loss": 1.1113, "step": 4388 }, { "epoch": 0.11, "learning_rate": 1.964531675900895e-06, "loss": 1.0508, "step": 4389 }, { "epoch": 0.11, "learning_rate": 1.9645097601136475e-06, "loss": 0.998, "step": 4390 }, { "epoch": 0.11, "learning_rate": 1.9644878376799555e-06, "loss": 1.001, "step": 4391 }, { "epoch": 0.11, "learning_rate": 1.9644659085999704e-06, "loss": 1.04, "step": 4392 }, { "epoch": 0.11, "learning_rate": 1.9644439728738437e-06, "loss": 1.0615, "step": 4393 }, { "epoch": 0.11, "learning_rate": 1.9644220305017263e-06, "loss": 0.9648, "step": 4394 }, { "epoch": 0.11, "learning_rate": 1.9644000814837693e-06, "loss": 1.0234, "step": 4395 }, { "epoch": 0.11, "learning_rate": 1.964378125820124e-06, "loss": 1.0264, "step": 4396 }, { "epoch": 0.11, "learning_rate": 1.9643561635109414e-06, "loss": 0.8701, "step": 4397 }, { "epoch": 0.11, "learning_rate": 1.964334194556374e-06, "loss": 0.8916, "step": 4398 }, { "epoch": 0.11, "learning_rate": 1.964312218956572e-06, "loss": 1.0205, "step": 4399 }, { "epoch": 0.11, "learning_rate": 1.964290236711687e-06, "loss": 0.7769, "step": 4400 }, { "epoch": 0.11, "learning_rate": 1.964268247821871e-06, "loss": 0.6143, "step": 4401 }, { "epoch": 0.11, "learning_rate": 1.9642462522872753e-06, "loss": 1.0361, "step": 4402 }, { "epoch": 0.11, "learning_rate": 1.964224250108051e-06, "loss": 0.9717, "step": 4403 }, { "epoch": 0.11, "learning_rate": 1.9642022412843504e-06, "loss": 0.9336, "step": 4404 }, { "epoch": 0.11, "learning_rate": 1.9641802258163245e-06, "loss": 1.0068, "step": 4405 }, { "epoch": 0.11, "learning_rate": 1.9641582037041257e-06, "loss": 1.0283, "step": 4406 }, { "epoch": 0.11, "learning_rate": 1.9641361749479054e-06, "loss": 1.0059, "step": 4407 }, { "epoch": 0.11, "learning_rate": 1.9641141395478157e-06, "loss": 0.8994, "step": 4408 }, { "epoch": 0.11, "learning_rate": 1.964092097504008e-06, "loss": 1.207, "step": 4409 }, { "epoch": 0.11, "learning_rate": 1.9640700488166344e-06, "loss": 0.9023, "step": 4410 }, { "epoch": 0.11, "learning_rate": 1.9640479934858463e-06, "loss": 1.0703, "step": 4411 }, { "epoch": 0.11, "learning_rate": 1.9640259315117967e-06, "loss": 0.9844, "step": 4412 }, { "epoch": 0.11, "learning_rate": 1.964003862894637e-06, "loss": 1.0625, "step": 4413 }, { "epoch": 0.11, "learning_rate": 1.9639817876345194e-06, "loss": 0.9414, "step": 4414 }, { "epoch": 0.11, "learning_rate": 1.9639597057315963e-06, "loss": 1.0703, "step": 4415 }, { "epoch": 0.11, "learning_rate": 1.963937617186019e-06, "loss": 0.8267, "step": 4416 }, { "epoch": 0.11, "learning_rate": 1.963915521997941e-06, "loss": 0.6824, "step": 4417 }, { "epoch": 0.11, "learning_rate": 1.9638934201675133e-06, "loss": 1.0137, "step": 4418 }, { "epoch": 0.11, "learning_rate": 1.9638713116948886e-06, "loss": 1.0693, "step": 4419 }, { "epoch": 0.11, "learning_rate": 1.96384919658022e-06, "loss": 1.04, "step": 4420 }, { "epoch": 0.11, "learning_rate": 1.963827074823659e-06, "loss": 0.833, "step": 4421 }, { "epoch": 0.11, "learning_rate": 1.9638049464253584e-06, "loss": 1.0342, "step": 4422 }, { "epoch": 0.11, "learning_rate": 1.963782811385471e-06, "loss": 1.1064, "step": 4423 }, { "epoch": 0.11, "learning_rate": 1.9637606697041483e-06, "loss": 0.8237, "step": 4424 }, { "epoch": 0.11, "learning_rate": 1.9637385213815437e-06, "loss": 0.7256, "step": 4425 }, { "epoch": 0.11, "learning_rate": 1.96371636641781e-06, "loss": 1.0205, "step": 4426 }, { "epoch": 0.11, "learning_rate": 1.963694204813099e-06, "loss": 0.876, "step": 4427 }, { "epoch": 0.11, "learning_rate": 1.9636720365675647e-06, "loss": 0.9658, "step": 4428 }, { "epoch": 0.11, "learning_rate": 1.963649861681359e-06, "loss": 0.6602, "step": 4429 }, { "epoch": 0.11, "learning_rate": 1.963627680154634e-06, "loss": 0.7637, "step": 4430 }, { "epoch": 0.11, "learning_rate": 1.963605491987544e-06, "loss": 1.0029, "step": 4431 }, { "epoch": 0.11, "learning_rate": 1.9635832971802414e-06, "loss": 1.0508, "step": 4432 }, { "epoch": 0.11, "learning_rate": 1.963561095732879e-06, "loss": 0.9639, "step": 4433 }, { "epoch": 0.11, "learning_rate": 1.9635388876456094e-06, "loss": 0.6597, "step": 4434 }, { "epoch": 0.11, "learning_rate": 1.9635166729185863e-06, "loss": 0.9248, "step": 4435 }, { "epoch": 0.11, "learning_rate": 1.9634944515519625e-06, "loss": 0.707, "step": 4436 }, { "epoch": 0.11, "learning_rate": 1.963472223545891e-06, "loss": 1.0088, "step": 4437 }, { "epoch": 0.11, "learning_rate": 1.963449988900526e-06, "loss": 0.8848, "step": 4438 }, { "epoch": 0.11, "learning_rate": 1.9634277476160188e-06, "loss": 1.0073, "step": 4439 }, { "epoch": 0.11, "learning_rate": 1.963405499692524e-06, "loss": 1.0625, "step": 4440 }, { "epoch": 0.11, "learning_rate": 1.9633832451301947e-06, "loss": 0.8135, "step": 4441 }, { "epoch": 0.11, "learning_rate": 1.963360983929184e-06, "loss": 0.7588, "step": 4442 }, { "epoch": 0.11, "learning_rate": 1.9633387160896455e-06, "loss": 0.9355, "step": 4443 }, { "epoch": 0.11, "learning_rate": 1.963316441611733e-06, "loss": 0.6941, "step": 4444 }, { "epoch": 0.11, "learning_rate": 1.9632941604955993e-06, "loss": 0.9043, "step": 4445 }, { "epoch": 0.11, "learning_rate": 1.9632718727413986e-06, "loss": 1.0498, "step": 4446 }, { "epoch": 0.11, "learning_rate": 1.9632495783492835e-06, "loss": 0.9453, "step": 4447 }, { "epoch": 0.11, "learning_rate": 1.9632272773194088e-06, "loss": 0.957, "step": 4448 }, { "epoch": 0.11, "learning_rate": 1.9632049696519276e-06, "loss": 0.9434, "step": 4449 }, { "epoch": 0.11, "learning_rate": 1.963182655346994e-06, "loss": 0.7002, "step": 4450 }, { "epoch": 0.11, "learning_rate": 1.9631603344047606e-06, "loss": 0.9961, "step": 4451 }, { "epoch": 0.11, "learning_rate": 1.9631380068253827e-06, "loss": 0.9492, "step": 4452 }, { "epoch": 0.11, "learning_rate": 1.9631156726090133e-06, "loss": 0.793, "step": 4453 }, { "epoch": 0.11, "learning_rate": 1.9630933317558066e-06, "loss": 0.9873, "step": 4454 }, { "epoch": 0.11, "learning_rate": 1.9630709842659163e-06, "loss": 0.9268, "step": 4455 }, { "epoch": 0.11, "learning_rate": 1.9630486301394967e-06, "loss": 1.0215, "step": 4456 }, { "epoch": 0.11, "learning_rate": 1.963026269376702e-06, "loss": 1.002, "step": 4457 }, { "epoch": 0.11, "learning_rate": 1.963003901977686e-06, "loss": 0.9766, "step": 4458 }, { "epoch": 0.11, "learning_rate": 1.962981527942602e-06, "loss": 0.8613, "step": 4459 }, { "epoch": 0.11, "learning_rate": 1.962959147271606e-06, "loss": 0.6514, "step": 4460 }, { "epoch": 0.11, "learning_rate": 1.9629367599648505e-06, "loss": 0.7637, "step": 4461 }, { "epoch": 0.11, "learning_rate": 1.962914366022491e-06, "loss": 1.084, "step": 4462 }, { "epoch": 0.11, "learning_rate": 1.962891965444681e-06, "loss": 0.8633, "step": 4463 }, { "epoch": 0.11, "learning_rate": 1.9628695582315756e-06, "loss": 1.0732, "step": 4464 }, { "epoch": 0.11, "learning_rate": 1.962847144383328e-06, "loss": 0.9131, "step": 4465 }, { "epoch": 0.11, "learning_rate": 1.962824723900094e-06, "loss": 0.9961, "step": 4466 }, { "epoch": 0.11, "learning_rate": 1.962802296782028e-06, "loss": 0.6755, "step": 4467 }, { "epoch": 0.11, "learning_rate": 1.9627798630292836e-06, "loss": 0.8174, "step": 4468 }, { "epoch": 0.11, "learning_rate": 1.9627574226420162e-06, "loss": 0.8286, "step": 4469 }, { "epoch": 0.11, "learning_rate": 1.96273497562038e-06, "loss": 0.9111, "step": 4470 }, { "epoch": 0.11, "learning_rate": 1.9627125219645294e-06, "loss": 0.9121, "step": 4471 }, { "epoch": 0.11, "learning_rate": 1.96269006167462e-06, "loss": 1.0605, "step": 4472 }, { "epoch": 0.11, "learning_rate": 1.962667594750806e-06, "loss": 0.7646, "step": 4473 }, { "epoch": 0.11, "learning_rate": 1.9626451211932423e-06, "loss": 0.998, "step": 4474 }, { "epoch": 0.11, "learning_rate": 1.962622641002084e-06, "loss": 0.9463, "step": 4475 }, { "epoch": 0.11, "learning_rate": 1.9626001541774856e-06, "loss": 0.8877, "step": 4476 }, { "epoch": 0.11, "learning_rate": 1.9625776607196023e-06, "loss": 0.9512, "step": 4477 }, { "epoch": 0.11, "learning_rate": 1.9625551606285887e-06, "loss": 0.877, "step": 4478 }, { "epoch": 0.11, "learning_rate": 1.9625326539046007e-06, "loss": 0.9922, "step": 4479 }, { "epoch": 0.11, "learning_rate": 1.9625101405477925e-06, "loss": 1.1797, "step": 4480 }, { "epoch": 0.11, "learning_rate": 1.96248762055832e-06, "loss": 0.9199, "step": 4481 }, { "epoch": 0.11, "learning_rate": 1.962465093936338e-06, "loss": 0.8574, "step": 4482 }, { "epoch": 0.11, "learning_rate": 1.962442560682002e-06, "loss": 0.8701, "step": 4483 }, { "epoch": 0.11, "learning_rate": 1.9624200207954663e-06, "loss": 1.0703, "step": 4484 }, { "epoch": 0.11, "learning_rate": 1.9623974742768874e-06, "loss": 0.8379, "step": 4485 }, { "epoch": 0.11, "learning_rate": 1.9623749211264205e-06, "loss": 0.957, "step": 4486 }, { "epoch": 0.12, "learning_rate": 1.9623523613442206e-06, "loss": 0.835, "step": 4487 }, { "epoch": 0.12, "learning_rate": 1.962329794930443e-06, "loss": 0.8184, "step": 4488 }, { "epoch": 0.12, "learning_rate": 1.962307221885244e-06, "loss": 0.8652, "step": 4489 }, { "epoch": 0.12, "learning_rate": 1.962284642208778e-06, "loss": 0.9028, "step": 4490 }, { "epoch": 0.12, "learning_rate": 1.962262055901202e-06, "loss": 0.9019, "step": 4491 }, { "epoch": 0.12, "learning_rate": 1.9622394629626706e-06, "loss": 0.9492, "step": 4492 }, { "epoch": 0.12, "learning_rate": 1.9622168633933396e-06, "loss": 0.918, "step": 4493 }, { "epoch": 0.12, "learning_rate": 1.9621942571933648e-06, "loss": 0.8682, "step": 4494 }, { "epoch": 0.12, "learning_rate": 1.9621716443629025e-06, "loss": 0.8271, "step": 4495 }, { "epoch": 0.12, "learning_rate": 1.962149024902108e-06, "loss": 1.0273, "step": 4496 }, { "epoch": 0.12, "learning_rate": 1.9621263988111375e-06, "loss": 1.0195, "step": 4497 }, { "epoch": 0.12, "learning_rate": 1.962103766090147e-06, "loss": 0.9287, "step": 4498 }, { "epoch": 0.12, "learning_rate": 1.9620811267392914e-06, "loss": 0.8516, "step": 4499 }, { "epoch": 0.12, "learning_rate": 1.9620584807587276e-06, "loss": 1.0, "step": 4500 }, { "epoch": 0.12, "learning_rate": 1.962035828148612e-06, "loss": 0.9326, "step": 4501 }, { "epoch": 0.12, "learning_rate": 1.9620131689090996e-06, "loss": 0.7256, "step": 4502 }, { "epoch": 0.12, "learning_rate": 1.961990503040348e-06, "loss": 0.9453, "step": 4503 }, { "epoch": 0.12, "learning_rate": 1.961967830542512e-06, "loss": 1.0264, "step": 4504 }, { "epoch": 0.12, "learning_rate": 1.9619451514157485e-06, "loss": 0.6426, "step": 4505 }, { "epoch": 0.12, "learning_rate": 1.9619224656602138e-06, "loss": 0.9912, "step": 4506 }, { "epoch": 0.12, "learning_rate": 1.961899773276064e-06, "loss": 0.9922, "step": 4507 }, { "epoch": 0.12, "learning_rate": 1.9618770742634555e-06, "loss": 0.7822, "step": 4508 }, { "epoch": 0.12, "learning_rate": 1.9618543686225454e-06, "loss": 0.7827, "step": 4509 }, { "epoch": 0.12, "learning_rate": 1.961831656353489e-06, "loss": 0.958, "step": 4510 }, { "epoch": 0.12, "learning_rate": 1.9618089374564433e-06, "loss": 0.8789, "step": 4511 }, { "epoch": 0.12, "learning_rate": 1.9617862119315656e-06, "loss": 0.999, "step": 4512 }, { "epoch": 0.12, "learning_rate": 1.9617634797790113e-06, "loss": 1.0166, "step": 4513 }, { "epoch": 0.12, "learning_rate": 1.961740740998938e-06, "loss": 0.9014, "step": 4514 }, { "epoch": 0.12, "learning_rate": 1.9617179955915017e-06, "loss": 1.0967, "step": 4515 }, { "epoch": 0.12, "learning_rate": 1.9616952435568594e-06, "loss": 1.0166, "step": 4516 }, { "epoch": 0.12, "learning_rate": 1.961672484895168e-06, "loss": 0.8887, "step": 4517 }, { "epoch": 0.12, "learning_rate": 1.961649719606584e-06, "loss": 1.0703, "step": 4518 }, { "epoch": 0.12, "learning_rate": 1.961626947691265e-06, "loss": 0.9277, "step": 4519 }, { "epoch": 0.12, "learning_rate": 1.961604169149367e-06, "loss": 1.0, "step": 4520 }, { "epoch": 0.12, "learning_rate": 1.9615813839810474e-06, "loss": 1.0, "step": 4521 }, { "epoch": 0.12, "learning_rate": 1.9615585921864634e-06, "loss": 1.0752, "step": 4522 }, { "epoch": 0.12, "learning_rate": 1.9615357937657723e-06, "loss": 0.7461, "step": 4523 }, { "epoch": 0.12, "learning_rate": 1.96151298871913e-06, "loss": 0.7222, "step": 4524 }, { "epoch": 0.12, "learning_rate": 1.961490177046695e-06, "loss": 1.0684, "step": 4525 }, { "epoch": 0.12, "learning_rate": 1.9614673587486235e-06, "loss": 0.9727, "step": 4526 }, { "epoch": 0.12, "learning_rate": 1.9614445338250737e-06, "loss": 0.9453, "step": 4527 }, { "epoch": 0.12, "learning_rate": 1.961421702276202e-06, "loss": 0.8232, "step": 4528 }, { "epoch": 0.12, "learning_rate": 1.9613988641021662e-06, "loss": 1.0752, "step": 4529 }, { "epoch": 0.12, "learning_rate": 1.9613760193031234e-06, "loss": 1.0098, "step": 4530 }, { "epoch": 0.12, "learning_rate": 1.9613531678792312e-06, "loss": 0.8506, "step": 4531 }, { "epoch": 0.12, "learning_rate": 1.961330309830647e-06, "loss": 1.0498, "step": 4532 }, { "epoch": 0.12, "learning_rate": 1.9613074451575286e-06, "loss": 0.8496, "step": 4533 }, { "epoch": 0.12, "learning_rate": 1.9612845738600332e-06, "loss": 0.9551, "step": 4534 }, { "epoch": 0.12, "learning_rate": 1.9612616959383188e-06, "loss": 0.7803, "step": 4535 }, { "epoch": 0.12, "learning_rate": 1.961238811392543e-06, "loss": 0.7969, "step": 4536 }, { "epoch": 0.12, "learning_rate": 1.9612159202228625e-06, "loss": 0.9014, "step": 4537 }, { "epoch": 0.12, "learning_rate": 1.9611930224294362e-06, "loss": 1.0986, "step": 4538 }, { "epoch": 0.12, "learning_rate": 1.9611701180124215e-06, "loss": 1.0234, "step": 4539 }, { "epoch": 0.12, "learning_rate": 1.9611472069719763e-06, "loss": 1.0361, "step": 4540 }, { "epoch": 0.12, "learning_rate": 1.9611242893082587e-06, "loss": 0.9512, "step": 4541 }, { "epoch": 0.12, "learning_rate": 1.9611013650214256e-06, "loss": 0.9189, "step": 4542 }, { "epoch": 0.12, "learning_rate": 1.9610784341116365e-06, "loss": 0.9688, "step": 4543 }, { "epoch": 0.12, "learning_rate": 1.9610554965790483e-06, "loss": 0.9199, "step": 4544 }, { "epoch": 0.12, "learning_rate": 1.9610325524238196e-06, "loss": 0.8848, "step": 4545 }, { "epoch": 0.12, "learning_rate": 1.961009601646108e-06, "loss": 0.998, "step": 4546 }, { "epoch": 0.12, "learning_rate": 1.960986644246072e-06, "loss": 0.4448, "step": 4547 }, { "epoch": 0.12, "learning_rate": 1.96096368022387e-06, "loss": 1.0, "step": 4548 }, { "epoch": 0.12, "learning_rate": 1.96094070957966e-06, "loss": 0.834, "step": 4549 }, { "epoch": 0.12, "learning_rate": 1.9609177323136005e-06, "loss": 1.167, "step": 4550 }, { "epoch": 0.12, "learning_rate": 1.9608947484258494e-06, "loss": 0.918, "step": 4551 }, { "epoch": 0.12, "learning_rate": 1.9608717579165655e-06, "loss": 1.0176, "step": 4552 }, { "epoch": 0.12, "learning_rate": 1.9608487607859066e-06, "loss": 0.8828, "step": 4553 }, { "epoch": 0.12, "learning_rate": 1.960825757034032e-06, "loss": 1.0127, "step": 4554 }, { "epoch": 0.12, "learning_rate": 1.9608027466611e-06, "loss": 0.9287, "step": 4555 }, { "epoch": 0.12, "learning_rate": 1.960779729667269e-06, "loss": 0.9219, "step": 4556 }, { "epoch": 0.12, "learning_rate": 1.960756706052697e-06, "loss": 0.9053, "step": 4557 }, { "epoch": 0.12, "learning_rate": 1.960733675817544e-06, "loss": 0.9766, "step": 4558 }, { "epoch": 0.12, "learning_rate": 1.9607106389619672e-06, "loss": 1.0508, "step": 4559 }, { "epoch": 0.12, "learning_rate": 1.960687595486127e-06, "loss": 0.7871, "step": 4560 }, { "epoch": 0.12, "learning_rate": 1.960664545390181e-06, "loss": 0.8428, "step": 4561 }, { "epoch": 0.12, "learning_rate": 1.9606414886742883e-06, "loss": 1.0293, "step": 4562 }, { "epoch": 0.12, "learning_rate": 1.960618425338608e-06, "loss": 0.9014, "step": 4563 }, { "epoch": 0.12, "learning_rate": 1.9605953553832986e-06, "loss": 0.9375, "step": 4564 }, { "epoch": 0.12, "learning_rate": 1.9605722788085196e-06, "loss": 0.6968, "step": 4565 }, { "epoch": 0.12, "learning_rate": 1.9605491956144296e-06, "loss": 1.0156, "step": 4566 }, { "epoch": 0.12, "learning_rate": 1.960526105801188e-06, "loss": 0.8848, "step": 4567 }, { "epoch": 0.12, "learning_rate": 1.9605030093689535e-06, "loss": 0.8506, "step": 4568 }, { "epoch": 0.12, "learning_rate": 1.960479906317886e-06, "loss": 1.0742, "step": 4569 }, { "epoch": 0.12, "learning_rate": 1.9604567966481434e-06, "loss": 0.8174, "step": 4570 }, { "epoch": 0.12, "learning_rate": 1.960433680359886e-06, "loss": 0.9629, "step": 4571 }, { "epoch": 0.12, "learning_rate": 1.9604105574532736e-06, "loss": 0.9609, "step": 4572 }, { "epoch": 0.12, "learning_rate": 1.960387427928464e-06, "loss": 1.0059, "step": 4573 }, { "epoch": 0.12, "learning_rate": 1.9603642917856176e-06, "loss": 0.9287, "step": 4574 }, { "epoch": 0.12, "learning_rate": 1.9603411490248936e-06, "loss": 1.2695, "step": 4575 }, { "epoch": 0.12, "learning_rate": 1.9603179996464516e-06, "loss": 0.7305, "step": 4576 }, { "epoch": 0.12, "learning_rate": 1.960294843650451e-06, "loss": 0.8643, "step": 4577 }, { "epoch": 0.12, "learning_rate": 1.9602716810370515e-06, "loss": 1.0205, "step": 4578 }, { "epoch": 0.12, "learning_rate": 1.9602485118064124e-06, "loss": 0.96, "step": 4579 }, { "epoch": 0.12, "learning_rate": 1.9602253359586935e-06, "loss": 1.0107, "step": 4580 }, { "epoch": 0.12, "learning_rate": 1.9602021534940544e-06, "loss": 0.9839, "step": 4581 }, { "epoch": 0.12, "learning_rate": 1.960178964412655e-06, "loss": 0.8647, "step": 4582 }, { "epoch": 0.12, "learning_rate": 1.9601557687146556e-06, "loss": 0.8672, "step": 4583 }, { "epoch": 0.12, "learning_rate": 1.9601325664002157e-06, "loss": 1.1592, "step": 4584 }, { "epoch": 0.12, "learning_rate": 1.9601093574694943e-06, "loss": 1.0381, "step": 4585 }, { "epoch": 0.12, "learning_rate": 1.9600861419226528e-06, "loss": 1.2871, "step": 4586 }, { "epoch": 0.12, "learning_rate": 1.96006291975985e-06, "loss": 0.917, "step": 4587 }, { "epoch": 0.12, "learning_rate": 1.960039690981246e-06, "loss": 0.9746, "step": 4588 }, { "epoch": 0.12, "learning_rate": 1.960016455587002e-06, "loss": 0.9868, "step": 4589 }, { "epoch": 0.12, "learning_rate": 1.959993213577277e-06, "loss": 0.8584, "step": 4590 }, { "epoch": 0.12, "learning_rate": 1.9599699649522312e-06, "loss": 1.0684, "step": 4591 }, { "epoch": 0.12, "learning_rate": 1.9599467097120256e-06, "loss": 0.9443, "step": 4592 }, { "epoch": 0.12, "learning_rate": 1.9599234478568197e-06, "loss": 0.7471, "step": 4593 }, { "epoch": 0.12, "learning_rate": 1.9599001793867743e-06, "loss": 0.9893, "step": 4594 }, { "epoch": 0.12, "learning_rate": 1.959876904302049e-06, "loss": 0.7896, "step": 4595 }, { "epoch": 0.12, "learning_rate": 1.959853622602805e-06, "loss": 0.835, "step": 4596 }, { "epoch": 0.12, "learning_rate": 1.959830334289203e-06, "loss": 0.8828, "step": 4597 }, { "epoch": 0.12, "learning_rate": 1.959807039361402e-06, "loss": 0.9775, "step": 4598 }, { "epoch": 0.12, "learning_rate": 1.959783737819564e-06, "loss": 0.8535, "step": 4599 }, { "epoch": 0.12, "learning_rate": 1.959760429663849e-06, "loss": 0.9766, "step": 4600 }, { "epoch": 0.12, "learning_rate": 1.9597371148944175e-06, "loss": 0.8906, "step": 4601 }, { "epoch": 0.12, "learning_rate": 1.9597137935114305e-06, "loss": 0.9326, "step": 4602 }, { "epoch": 0.12, "learning_rate": 1.9596904655150482e-06, "loss": 0.9297, "step": 4603 }, { "epoch": 0.12, "learning_rate": 1.9596671309054317e-06, "loss": 0.9971, "step": 4604 }, { "epoch": 0.12, "learning_rate": 1.9596437896827418e-06, "loss": 1.1973, "step": 4605 }, { "epoch": 0.12, "learning_rate": 1.9596204418471394e-06, "loss": 0.959, "step": 4606 }, { "epoch": 0.12, "learning_rate": 1.959597087398785e-06, "loss": 1.2051, "step": 4607 }, { "epoch": 0.12, "learning_rate": 1.9595737263378404e-06, "loss": 1.1426, "step": 4608 }, { "epoch": 0.12, "learning_rate": 1.959550358664465e-06, "loss": 0.8188, "step": 4609 }, { "epoch": 0.12, "learning_rate": 1.9595269843788216e-06, "loss": 1.0508, "step": 4610 }, { "epoch": 0.12, "learning_rate": 1.9595036034810708e-06, "loss": 1.0742, "step": 4611 }, { "epoch": 0.12, "learning_rate": 1.9594802159713727e-06, "loss": 1.0391, "step": 4612 }, { "epoch": 0.12, "learning_rate": 1.959456821849889e-06, "loss": 0.9619, "step": 4613 }, { "epoch": 0.12, "learning_rate": 1.959433421116782e-06, "loss": 1.001, "step": 4614 }, { "epoch": 0.12, "learning_rate": 1.959410013772211e-06, "loss": 0.8486, "step": 4615 }, { "epoch": 0.12, "learning_rate": 1.9593865998163395e-06, "loss": 0.9424, "step": 4616 }, { "epoch": 0.12, "learning_rate": 1.959363179249327e-06, "loss": 0.9287, "step": 4617 }, { "epoch": 0.12, "learning_rate": 1.9593397520713357e-06, "loss": 0.8184, "step": 4618 }, { "epoch": 0.12, "learning_rate": 1.959316318282527e-06, "loss": 0.9648, "step": 4619 }, { "epoch": 0.12, "learning_rate": 1.9592928778830623e-06, "loss": 0.998, "step": 4620 }, { "epoch": 0.12, "learning_rate": 1.9592694308731032e-06, "loss": 0.6064, "step": 4621 }, { "epoch": 0.12, "learning_rate": 1.959245977252811e-06, "loss": 0.9189, "step": 4622 }, { "epoch": 0.12, "learning_rate": 1.9592225170223473e-06, "loss": 0.6179, "step": 4623 }, { "epoch": 0.12, "learning_rate": 1.9591990501818745e-06, "loss": 0.8438, "step": 4624 }, { "epoch": 0.12, "learning_rate": 1.9591755767315537e-06, "loss": 1.1123, "step": 4625 }, { "epoch": 0.12, "learning_rate": 1.959152096671547e-06, "loss": 0.9131, "step": 4626 }, { "epoch": 0.12, "learning_rate": 1.9591286100020153e-06, "loss": 0.8779, "step": 4627 }, { "epoch": 0.12, "learning_rate": 1.9591051167231213e-06, "loss": 0.9531, "step": 4628 }, { "epoch": 0.12, "learning_rate": 1.959081616835027e-06, "loss": 0.8369, "step": 4629 }, { "epoch": 0.12, "learning_rate": 1.9590581103378936e-06, "loss": 0.8218, "step": 4630 }, { "epoch": 0.12, "learning_rate": 1.959034597231884e-06, "loss": 0.7534, "step": 4631 }, { "epoch": 0.12, "learning_rate": 1.9590110775171594e-06, "loss": 0.9355, "step": 4632 }, { "epoch": 0.12, "learning_rate": 1.958987551193882e-06, "loss": 0.9912, "step": 4633 }, { "epoch": 0.12, "learning_rate": 1.9589640182622146e-06, "loss": 0.9355, "step": 4634 }, { "epoch": 0.12, "learning_rate": 1.958940478722319e-06, "loss": 1.002, "step": 4635 }, { "epoch": 0.12, "learning_rate": 1.958916932574357e-06, "loss": 0.9697, "step": 4636 }, { "epoch": 0.12, "learning_rate": 1.958893379818491e-06, "loss": 0.9014, "step": 4637 }, { "epoch": 0.12, "learning_rate": 1.958869820454884e-06, "loss": 1.0049, "step": 4638 }, { "epoch": 0.12, "learning_rate": 1.9588462544836974e-06, "loss": 1.082, "step": 4639 }, { "epoch": 0.12, "learning_rate": 1.9588226819050943e-06, "loss": 1.0547, "step": 4640 }, { "epoch": 0.12, "learning_rate": 1.9587991027192365e-06, "loss": 0.6802, "step": 4641 }, { "epoch": 0.12, "learning_rate": 1.958775516926287e-06, "loss": 0.8682, "step": 4642 }, { "epoch": 0.12, "learning_rate": 1.9587519245264084e-06, "loss": 1.0996, "step": 4643 }, { "epoch": 0.12, "learning_rate": 1.958728325519763e-06, "loss": 0.8994, "step": 4644 }, { "epoch": 0.12, "learning_rate": 1.9587047199065136e-06, "loss": 0.9009, "step": 4645 }, { "epoch": 0.12, "learning_rate": 1.9586811076868223e-06, "loss": 0.7886, "step": 4646 }, { "epoch": 0.12, "learning_rate": 1.9586574888608522e-06, "loss": 1.1826, "step": 4647 }, { "epoch": 0.12, "learning_rate": 1.9586338634287663e-06, "loss": 0.999, "step": 4648 }, { "epoch": 0.12, "learning_rate": 1.9586102313907275e-06, "loss": 0.8564, "step": 4649 }, { "epoch": 0.12, "learning_rate": 1.9585865927468982e-06, "loss": 1.0635, "step": 4650 }, { "epoch": 0.12, "learning_rate": 1.9585629474974414e-06, "loss": 0.7344, "step": 4651 }, { "epoch": 0.12, "learning_rate": 1.9585392956425197e-06, "loss": 0.9814, "step": 4652 }, { "epoch": 0.12, "learning_rate": 1.958515637182297e-06, "loss": 0.8462, "step": 4653 }, { "epoch": 0.12, "learning_rate": 1.9584919721169355e-06, "loss": 0.8906, "step": 4654 }, { "epoch": 0.12, "learning_rate": 1.9584683004465987e-06, "loss": 1.1426, "step": 4655 }, { "epoch": 0.12, "learning_rate": 1.9584446221714497e-06, "loss": 1.0361, "step": 4656 }, { "epoch": 0.12, "learning_rate": 1.9584209372916514e-06, "loss": 0.8989, "step": 4657 }, { "epoch": 0.12, "learning_rate": 1.958397245807367e-06, "loss": 1.0293, "step": 4658 }, { "epoch": 0.12, "learning_rate": 1.9583735477187604e-06, "loss": 0.6797, "step": 4659 }, { "epoch": 0.12, "learning_rate": 1.958349843025994e-06, "loss": 0.9639, "step": 4660 }, { "epoch": 0.12, "learning_rate": 1.958326131729232e-06, "loss": 0.8169, "step": 4661 }, { "epoch": 0.12, "learning_rate": 1.9583024138286372e-06, "loss": 0.9238, "step": 4662 }, { "epoch": 0.12, "learning_rate": 1.9582786893243734e-06, "loss": 0.8262, "step": 4663 }, { "epoch": 0.12, "learning_rate": 1.9582549582166035e-06, "loss": 1.0879, "step": 4664 }, { "epoch": 0.12, "learning_rate": 1.958231220505492e-06, "loss": 1.0332, "step": 4665 }, { "epoch": 0.12, "learning_rate": 1.9582074761912013e-06, "loss": 0.875, "step": 4666 }, { "epoch": 0.12, "learning_rate": 1.958183725273896e-06, "loss": 0.583, "step": 4667 }, { "epoch": 0.12, "learning_rate": 1.9581599677537394e-06, "loss": 1.0625, "step": 4668 }, { "epoch": 0.12, "learning_rate": 1.958136203630895e-06, "loss": 1.1504, "step": 4669 }, { "epoch": 0.12, "learning_rate": 1.958112432905527e-06, "loss": 0.9893, "step": 4670 }, { "epoch": 0.12, "learning_rate": 1.9580886555777993e-06, "loss": 0.9219, "step": 4671 }, { "epoch": 0.12, "learning_rate": 1.958064871647875e-06, "loss": 1.0254, "step": 4672 }, { "epoch": 0.12, "learning_rate": 1.9580410811159186e-06, "loss": 0.7803, "step": 4673 }, { "epoch": 0.12, "learning_rate": 1.9580172839820935e-06, "loss": 0.9102, "step": 4674 }, { "epoch": 0.12, "learning_rate": 1.9579934802465647e-06, "loss": 0.9814, "step": 4675 }, { "epoch": 0.12, "learning_rate": 1.9579696699094954e-06, "loss": 0.8037, "step": 4676 }, { "epoch": 0.12, "learning_rate": 1.9579458529710494e-06, "loss": 0.7871, "step": 4677 }, { "epoch": 0.12, "learning_rate": 1.9579220294313914e-06, "loss": 0.8799, "step": 4678 }, { "epoch": 0.12, "learning_rate": 1.957898199290686e-06, "loss": 0.7114, "step": 4679 }, { "epoch": 0.12, "learning_rate": 1.957874362549096e-06, "loss": 0.915, "step": 4680 }, { "epoch": 0.12, "learning_rate": 1.9578505192067875e-06, "loss": 0.8535, "step": 4681 }, { "epoch": 0.12, "learning_rate": 1.9578266692639234e-06, "loss": 1.1543, "step": 4682 }, { "epoch": 0.12, "learning_rate": 1.9578028127206685e-06, "loss": 0.8857, "step": 4683 }, { "epoch": 0.12, "learning_rate": 1.957778949577187e-06, "loss": 0.7671, "step": 4684 }, { "epoch": 0.12, "learning_rate": 1.957755079833644e-06, "loss": 0.9873, "step": 4685 }, { "epoch": 0.12, "learning_rate": 1.957731203490203e-06, "loss": 1.0654, "step": 4686 }, { "epoch": 0.12, "learning_rate": 1.9577073205470293e-06, "loss": 0.9287, "step": 4687 }, { "epoch": 0.12, "learning_rate": 1.9576834310042873e-06, "loss": 0.8613, "step": 4688 }, { "epoch": 0.12, "learning_rate": 1.9576595348621413e-06, "loss": 1.1543, "step": 4689 }, { "epoch": 0.12, "learning_rate": 1.957635632120756e-06, "loss": 0.8032, "step": 4690 }, { "epoch": 0.12, "learning_rate": 1.957611722780297e-06, "loss": 1.1348, "step": 4691 }, { "epoch": 0.12, "learning_rate": 1.957587806840928e-06, "loss": 1.1133, "step": 4692 }, { "epoch": 0.12, "learning_rate": 1.9575638843028142e-06, "loss": 0.7556, "step": 4693 }, { "epoch": 0.12, "learning_rate": 1.9575399551661206e-06, "loss": 1.0049, "step": 4694 }, { "epoch": 0.12, "learning_rate": 1.9575160194310115e-06, "loss": 0.7139, "step": 4695 }, { "epoch": 0.12, "learning_rate": 1.957492077097653e-06, "loss": 0.7769, "step": 4696 }, { "epoch": 0.12, "learning_rate": 1.9574681281662085e-06, "loss": 1.1074, "step": 4697 }, { "epoch": 0.12, "learning_rate": 1.9574441726368445e-06, "loss": 0.9717, "step": 4698 }, { "epoch": 0.12, "learning_rate": 1.9574202105097253e-06, "loss": 0.9502, "step": 4699 }, { "epoch": 0.12, "learning_rate": 1.957396241785016e-06, "loss": 0.918, "step": 4700 }, { "epoch": 0.12, "learning_rate": 1.9573722664628824e-06, "loss": 0.8145, "step": 4701 }, { "epoch": 0.12, "learning_rate": 1.957348284543489e-06, "loss": 1.0107, "step": 4702 }, { "epoch": 0.12, "learning_rate": 1.9573242960270012e-06, "loss": 0.8828, "step": 4703 }, { "epoch": 0.12, "learning_rate": 1.957300300913585e-06, "loss": 1.0674, "step": 4704 }, { "epoch": 0.12, "learning_rate": 1.9572762992034048e-06, "loss": 0.6616, "step": 4705 }, { "epoch": 0.12, "learning_rate": 1.957252290896626e-06, "loss": 1.1553, "step": 4706 }, { "epoch": 0.12, "learning_rate": 1.9572282759934153e-06, "loss": 0.9678, "step": 4707 }, { "epoch": 0.12, "learning_rate": 1.9572042544939367e-06, "loss": 0.9834, "step": 4708 }, { "epoch": 0.12, "learning_rate": 1.9571802263983568e-06, "loss": 0.9922, "step": 4709 }, { "epoch": 0.12, "learning_rate": 1.9571561917068406e-06, "loss": 1.0732, "step": 4710 }, { "epoch": 0.12, "learning_rate": 1.9571321504195534e-06, "loss": 0.9922, "step": 4711 }, { "epoch": 0.12, "learning_rate": 1.9571081025366617e-06, "loss": 0.9248, "step": 4712 }, { "epoch": 0.12, "learning_rate": 1.9570840480583305e-06, "loss": 1.0625, "step": 4713 }, { "epoch": 0.12, "learning_rate": 1.9570599869847264e-06, "loss": 0.6919, "step": 4714 }, { "epoch": 0.12, "learning_rate": 1.9570359193160145e-06, "loss": 0.8511, "step": 4715 }, { "epoch": 0.12, "learning_rate": 1.9570118450523608e-06, "loss": 1.1348, "step": 4716 }, { "epoch": 0.12, "learning_rate": 1.9569877641939313e-06, "loss": 0.959, "step": 4717 }, { "epoch": 0.12, "learning_rate": 1.9569636767408917e-06, "loss": 0.9609, "step": 4718 }, { "epoch": 0.12, "learning_rate": 1.9569395826934083e-06, "loss": 0.917, "step": 4719 }, { "epoch": 0.12, "learning_rate": 1.956915482051647e-06, "loss": 1.1621, "step": 4720 }, { "epoch": 0.12, "learning_rate": 1.956891374815774e-06, "loss": 0.9238, "step": 4721 }, { "epoch": 0.12, "learning_rate": 1.9568672609859553e-06, "loss": 0.9062, "step": 4722 }, { "epoch": 0.12, "learning_rate": 1.956843140562357e-06, "loss": 1.0615, "step": 4723 }, { "epoch": 0.12, "learning_rate": 1.956819013545145e-06, "loss": 0.8062, "step": 4724 }, { "epoch": 0.12, "learning_rate": 1.9567948799344868e-06, "loss": 0.8086, "step": 4725 }, { "epoch": 0.12, "learning_rate": 1.956770739730547e-06, "loss": 0.7227, "step": 4726 }, { "epoch": 0.12, "learning_rate": 1.9567465929334933e-06, "loss": 0.8799, "step": 4727 }, { "epoch": 0.12, "learning_rate": 1.9567224395434915e-06, "loss": 1.0381, "step": 4728 }, { "epoch": 0.12, "learning_rate": 1.956698279560708e-06, "loss": 1.0557, "step": 4729 }, { "epoch": 0.12, "learning_rate": 1.9566741129853098e-06, "loss": 1.0244, "step": 4730 }, { "epoch": 0.12, "learning_rate": 1.956649939817463e-06, "loss": 1.0986, "step": 4731 }, { "epoch": 0.12, "learning_rate": 1.956625760057334e-06, "loss": 0.6719, "step": 4732 }, { "epoch": 0.12, "learning_rate": 1.9566015737050894e-06, "loss": 0.8057, "step": 4733 }, { "epoch": 0.12, "learning_rate": 1.9565773807608966e-06, "loss": 0.8848, "step": 4734 }, { "epoch": 0.12, "learning_rate": 1.9565531812249215e-06, "loss": 1.1465, "step": 4735 }, { "epoch": 0.12, "learning_rate": 1.9565289750973317e-06, "loss": 0.9331, "step": 4736 }, { "epoch": 0.12, "learning_rate": 1.956504762378293e-06, "loss": 0.8955, "step": 4737 }, { "epoch": 0.12, "learning_rate": 1.956480543067973e-06, "loss": 0.9248, "step": 4738 }, { "epoch": 0.12, "learning_rate": 1.9564563171665386e-06, "loss": 0.7402, "step": 4739 }, { "epoch": 0.12, "learning_rate": 1.956432084674156e-06, "loss": 0.9512, "step": 4740 }, { "epoch": 0.12, "learning_rate": 1.956407845590993e-06, "loss": 1.0938, "step": 4741 }, { "epoch": 0.12, "learning_rate": 1.9563835999172163e-06, "loss": 1.0098, "step": 4742 }, { "epoch": 0.12, "learning_rate": 1.956359347652993e-06, "loss": 1.0762, "step": 4743 }, { "epoch": 0.12, "learning_rate": 1.95633508879849e-06, "loss": 1.0986, "step": 4744 }, { "epoch": 0.12, "learning_rate": 1.9563108233538745e-06, "loss": 1.0938, "step": 4745 }, { "epoch": 0.12, "learning_rate": 1.9562865513193143e-06, "loss": 0.917, "step": 4746 }, { "epoch": 0.12, "learning_rate": 1.956262272694976e-06, "loss": 1.0586, "step": 4747 }, { "epoch": 0.12, "learning_rate": 1.9562379874810273e-06, "loss": 0.9238, "step": 4748 }, { "epoch": 0.12, "learning_rate": 1.9562136956776355e-06, "loss": 0.9365, "step": 4749 }, { "epoch": 0.12, "learning_rate": 1.9561893972849677e-06, "loss": 0.9438, "step": 4750 }, { "epoch": 0.12, "learning_rate": 1.9561650923031916e-06, "loss": 0.9053, "step": 4751 }, { "epoch": 0.12, "learning_rate": 1.9561407807324746e-06, "loss": 0.9023, "step": 4752 }, { "epoch": 0.12, "learning_rate": 1.9561164625729843e-06, "loss": 0.7988, "step": 4753 }, { "epoch": 0.12, "learning_rate": 1.9560921378248885e-06, "loss": 0.9229, "step": 4754 }, { "epoch": 0.12, "learning_rate": 1.9560678064883544e-06, "loss": 0.8467, "step": 4755 }, { "epoch": 0.12, "learning_rate": 1.9560434685635494e-06, "loss": 0.9932, "step": 4756 }, { "epoch": 0.12, "learning_rate": 1.956019124050642e-06, "loss": 1.1113, "step": 4757 }, { "epoch": 0.12, "learning_rate": 1.9559947729497997e-06, "loss": 0.8516, "step": 4758 }, { "epoch": 0.12, "learning_rate": 1.95597041526119e-06, "loss": 1.0107, "step": 4759 }, { "epoch": 0.12, "learning_rate": 1.955946050984981e-06, "loss": 0.7876, "step": 4760 }, { "epoch": 0.12, "learning_rate": 1.9559216801213405e-06, "loss": 1.0537, "step": 4761 }, { "epoch": 0.12, "learning_rate": 1.9558973026704367e-06, "loss": 0.9014, "step": 4762 }, { "epoch": 0.12, "learning_rate": 1.955872918632437e-06, "loss": 0.7114, "step": 4763 }, { "epoch": 0.12, "learning_rate": 1.95584852800751e-06, "loss": 0.9658, "step": 4764 }, { "epoch": 0.12, "learning_rate": 1.9558241307958235e-06, "loss": 0.7617, "step": 4765 }, { "epoch": 0.12, "learning_rate": 1.955799726997546e-06, "loss": 1.0488, "step": 4766 }, { "epoch": 0.12, "learning_rate": 1.955775316612845e-06, "loss": 1.0801, "step": 4767 }, { "epoch": 0.12, "learning_rate": 1.955750899641889e-06, "loss": 1.0605, "step": 4768 }, { "epoch": 0.12, "learning_rate": 1.9557264760848465e-06, "loss": 1.332, "step": 4769 }, { "epoch": 0.12, "learning_rate": 1.9557020459418857e-06, "loss": 0.915, "step": 4770 }, { "epoch": 0.12, "learning_rate": 1.955677609213175e-06, "loss": 0.9707, "step": 4771 }, { "epoch": 0.12, "learning_rate": 1.9556531658988824e-06, "loss": 0.7236, "step": 4772 }, { "epoch": 0.12, "learning_rate": 1.9556287159991766e-06, "loss": 0.6362, "step": 4773 }, { "epoch": 0.12, "learning_rate": 1.9556042595142263e-06, "loss": 0.9648, "step": 4774 }, { "epoch": 0.12, "learning_rate": 1.9555797964442e-06, "loss": 0.9248, "step": 4775 }, { "epoch": 0.12, "learning_rate": 1.9555553267892656e-06, "loss": 0.876, "step": 4776 }, { "epoch": 0.12, "learning_rate": 1.9555308505495923e-06, "loss": 0.9043, "step": 4777 }, { "epoch": 0.12, "learning_rate": 1.955506367725349e-06, "loss": 1.083, "step": 4778 }, { "epoch": 0.12, "learning_rate": 1.9554818783167038e-06, "loss": 1.0527, "step": 4779 }, { "epoch": 0.12, "learning_rate": 1.955457382323826e-06, "loss": 1.0234, "step": 4780 }, { "epoch": 0.12, "learning_rate": 1.9554328797468843e-06, "loss": 0.9131, "step": 4781 }, { "epoch": 0.12, "learning_rate": 1.9554083705860473e-06, "loss": 0.8047, "step": 4782 }, { "epoch": 0.12, "learning_rate": 1.9553838548414836e-06, "loss": 0.9053, "step": 4783 }, { "epoch": 0.12, "learning_rate": 1.955359332513363e-06, "loss": 1.124, "step": 4784 }, { "epoch": 0.12, "learning_rate": 1.955334803601854e-06, "loss": 0.8135, "step": 4785 }, { "epoch": 0.12, "learning_rate": 1.9553102681071257e-06, "loss": 0.9951, "step": 4786 }, { "epoch": 0.12, "learning_rate": 1.9552857260293466e-06, "loss": 0.8604, "step": 4787 }, { "epoch": 0.12, "learning_rate": 1.955261177368687e-06, "loss": 1.042, "step": 4788 }, { "epoch": 0.12, "learning_rate": 1.9552366221253147e-06, "loss": 1.0703, "step": 4789 }, { "epoch": 0.12, "learning_rate": 1.9552120602994004e-06, "loss": 0.8887, "step": 4790 }, { "epoch": 0.12, "learning_rate": 1.955187491891112e-06, "loss": 0.9756, "step": 4791 }, { "epoch": 0.12, "learning_rate": 1.9551629169006197e-06, "loss": 0.9824, "step": 4792 }, { "epoch": 0.12, "learning_rate": 1.9551383353280922e-06, "loss": 1.0107, "step": 4793 }, { "epoch": 0.12, "learning_rate": 1.9551137471736995e-06, "loss": 1.0557, "step": 4794 }, { "epoch": 0.12, "learning_rate": 1.955089152437611e-06, "loss": 0.7991, "step": 4795 }, { "epoch": 0.12, "learning_rate": 1.9550645511199953e-06, "loss": 1.1338, "step": 4796 }, { "epoch": 0.12, "learning_rate": 1.9550399432210227e-06, "loss": 0.9893, "step": 4797 }, { "epoch": 0.12, "learning_rate": 1.955015328740863e-06, "loss": 0.8052, "step": 4798 }, { "epoch": 0.12, "learning_rate": 1.9549907076796853e-06, "loss": 0.7949, "step": 4799 }, { "epoch": 0.12, "learning_rate": 1.954966080037659e-06, "loss": 0.9951, "step": 4800 }, { "epoch": 0.12, "learning_rate": 1.954941445814955e-06, "loss": 0.9209, "step": 4801 }, { "epoch": 0.12, "learning_rate": 1.954916805011742e-06, "loss": 1.0576, "step": 4802 }, { "epoch": 0.12, "learning_rate": 1.9548921576281896e-06, "loss": 0.6929, "step": 4803 }, { "epoch": 0.12, "learning_rate": 1.954867503664469e-06, "loss": 1.0703, "step": 4804 }, { "epoch": 0.12, "learning_rate": 1.9548428431207483e-06, "loss": 0.8975, "step": 4805 }, { "epoch": 0.12, "learning_rate": 1.954818175997199e-06, "loss": 0.8262, "step": 4806 }, { "epoch": 0.12, "learning_rate": 1.95479350229399e-06, "loss": 0.8262, "step": 4807 }, { "epoch": 0.12, "learning_rate": 1.9547688220112923e-06, "loss": 1.0352, "step": 4808 }, { "epoch": 0.12, "learning_rate": 1.954744135149275e-06, "loss": 0.9238, "step": 4809 }, { "epoch": 0.12, "learning_rate": 1.9547194417081088e-06, "loss": 0.7949, "step": 4810 }, { "epoch": 0.12, "learning_rate": 1.9546947416879635e-06, "loss": 0.9805, "step": 4811 }, { "epoch": 0.12, "learning_rate": 1.9546700350890095e-06, "loss": 1.0635, "step": 4812 }, { "epoch": 0.12, "learning_rate": 1.9546453219114175e-06, "loss": 1.0527, "step": 4813 }, { "epoch": 0.12, "learning_rate": 1.954620602155357e-06, "loss": 1.0352, "step": 4814 }, { "epoch": 0.12, "learning_rate": 1.9545958758209992e-06, "loss": 0.8496, "step": 4815 }, { "epoch": 0.12, "learning_rate": 1.9545711429085136e-06, "loss": 0.6333, "step": 4816 }, { "epoch": 0.12, "learning_rate": 1.954546403418071e-06, "loss": 0.9424, "step": 4817 }, { "epoch": 0.12, "learning_rate": 1.954521657349842e-06, "loss": 0.8101, "step": 4818 }, { "epoch": 0.12, "learning_rate": 1.9544969047039973e-06, "loss": 1.1484, "step": 4819 }, { "epoch": 0.12, "learning_rate": 1.954472145480707e-06, "loss": 1.0176, "step": 4820 }, { "epoch": 0.12, "learning_rate": 1.954447379680142e-06, "loss": 1.0684, "step": 4821 }, { "epoch": 0.12, "learning_rate": 1.9544226073024727e-06, "loss": 0.9951, "step": 4822 }, { "epoch": 0.12, "learning_rate": 1.9543978283478705e-06, "loss": 0.8633, "step": 4823 }, { "epoch": 0.12, "learning_rate": 1.954373042816505e-06, "loss": 0.916, "step": 4824 }, { "epoch": 0.12, "learning_rate": 1.954348250708548e-06, "loss": 0.9805, "step": 4825 }, { "epoch": 0.12, "learning_rate": 1.95432345202417e-06, "loss": 1.0361, "step": 4826 }, { "epoch": 0.12, "learning_rate": 1.954298646763542e-06, "loss": 1.0293, "step": 4827 }, { "epoch": 0.12, "learning_rate": 1.9542738349268343e-06, "loss": 1.0889, "step": 4828 }, { "epoch": 0.12, "learning_rate": 1.954249016514219e-06, "loss": 0.9961, "step": 4829 }, { "epoch": 0.12, "learning_rate": 1.954224191525866e-06, "loss": 0.8555, "step": 4830 }, { "epoch": 0.12, "learning_rate": 1.954199359961947e-06, "loss": 1.0273, "step": 4831 }, { "epoch": 0.12, "learning_rate": 1.9541745218226334e-06, "loss": 0.873, "step": 4832 }, { "epoch": 0.12, "learning_rate": 1.954149677108096e-06, "loss": 0.8945, "step": 4833 }, { "epoch": 0.12, "learning_rate": 1.9541248258185055e-06, "loss": 0.8555, "step": 4834 }, { "epoch": 0.12, "learning_rate": 1.954099967954034e-06, "loss": 1.0723, "step": 4835 }, { "epoch": 0.12, "learning_rate": 1.954075103514852e-06, "loss": 0.9971, "step": 4836 }, { "epoch": 0.12, "learning_rate": 1.9540502325011317e-06, "loss": 0.8037, "step": 4837 }, { "epoch": 0.12, "learning_rate": 1.9540253549130436e-06, "loss": 0.8809, "step": 4838 }, { "epoch": 0.12, "learning_rate": 1.9540004707507597e-06, "loss": 0.9277, "step": 4839 }, { "epoch": 0.12, "learning_rate": 1.953975580014452e-06, "loss": 0.8271, "step": 4840 }, { "epoch": 0.12, "learning_rate": 1.9539506827042904e-06, "loss": 0.6279, "step": 4841 }, { "epoch": 0.12, "learning_rate": 1.953925778820448e-06, "loss": 0.9736, "step": 4842 }, { "epoch": 0.12, "learning_rate": 1.9539008683630957e-06, "loss": 1.0596, "step": 4843 }, { "epoch": 0.12, "learning_rate": 1.953875951332405e-06, "loss": 1.0557, "step": 4844 }, { "epoch": 0.12, "learning_rate": 1.9538510277285487e-06, "loss": 0.9365, "step": 4845 }, { "epoch": 0.12, "learning_rate": 1.953826097551697e-06, "loss": 0.7783, "step": 4846 }, { "epoch": 0.12, "learning_rate": 1.9538011608020227e-06, "loss": 1.1475, "step": 4847 }, { "epoch": 0.12, "learning_rate": 1.9537762174796975e-06, "loss": 0.7998, "step": 4848 }, { "epoch": 0.12, "learning_rate": 1.953751267584893e-06, "loss": 0.8745, "step": 4849 }, { "epoch": 0.12, "learning_rate": 1.9537263111177815e-06, "loss": 1.0049, "step": 4850 }, { "epoch": 0.12, "learning_rate": 1.9537013480785346e-06, "loss": 0.7881, "step": 4851 }, { "epoch": 0.12, "learning_rate": 1.9536763784673247e-06, "loss": 0.6265, "step": 4852 }, { "epoch": 0.12, "learning_rate": 1.9536514022843237e-06, "loss": 0.9121, "step": 4853 }, { "epoch": 0.12, "learning_rate": 1.9536264195297035e-06, "loss": 0.916, "step": 4854 }, { "epoch": 0.12, "learning_rate": 1.9536014302036366e-06, "loss": 0.832, "step": 4855 }, { "epoch": 0.12, "learning_rate": 1.953576434306295e-06, "loss": 1.0371, "step": 4856 }, { "epoch": 0.12, "learning_rate": 1.9535514318378506e-06, "loss": 0.7466, "step": 4857 }, { "epoch": 0.12, "learning_rate": 1.9535264227984767e-06, "loss": 0.9502, "step": 4858 }, { "epoch": 0.12, "learning_rate": 1.9535014071883447e-06, "loss": 0.8115, "step": 4859 }, { "epoch": 0.12, "learning_rate": 1.9534763850076273e-06, "loss": 0.9243, "step": 4860 }, { "epoch": 0.12, "learning_rate": 1.953451356256497e-06, "loss": 0.9844, "step": 4861 }, { "epoch": 0.12, "learning_rate": 1.9534263209351265e-06, "loss": 0.9971, "step": 4862 }, { "epoch": 0.12, "learning_rate": 1.9534012790436877e-06, "loss": 0.9541, "step": 4863 }, { "epoch": 0.12, "learning_rate": 1.953376230582353e-06, "loss": 0.7859, "step": 4864 }, { "epoch": 0.12, "learning_rate": 1.9533511755512963e-06, "loss": 1.0, "step": 4865 }, { "epoch": 0.12, "learning_rate": 1.9533261139506888e-06, "loss": 1.1523, "step": 4866 }, { "epoch": 0.12, "learning_rate": 1.9533010457807046e-06, "loss": 1.0869, "step": 4867 }, { "epoch": 0.12, "learning_rate": 1.9532759710415154e-06, "loss": 1.0195, "step": 4868 }, { "epoch": 0.12, "learning_rate": 1.953250889733294e-06, "loss": 0.8398, "step": 4869 }, { "epoch": 0.12, "learning_rate": 1.9532258018562136e-06, "loss": 0.812, "step": 4870 }, { "epoch": 0.12, "learning_rate": 1.9532007074104467e-06, "loss": 0.9531, "step": 4871 }, { "epoch": 0.12, "learning_rate": 1.953175606396167e-06, "loss": 0.8853, "step": 4872 }, { "epoch": 0.12, "learning_rate": 1.953150498813547e-06, "loss": 0.9746, "step": 4873 }, { "epoch": 0.12, "learning_rate": 1.9531253846627594e-06, "loss": 1.0469, "step": 4874 }, { "epoch": 0.12, "learning_rate": 1.953100263943978e-06, "loss": 0.7832, "step": 4875 }, { "epoch": 0.12, "learning_rate": 1.953075136657375e-06, "loss": 0.7559, "step": 4876 }, { "epoch": 0.12, "learning_rate": 1.9530500028031245e-06, "loss": 1.0391, "step": 4877 }, { "epoch": 0.13, "learning_rate": 1.953024862381399e-06, "loss": 1.0439, "step": 4878 }, { "epoch": 0.13, "learning_rate": 1.952999715392372e-06, "loss": 0.8232, "step": 4879 }, { "epoch": 0.13, "learning_rate": 1.952974561836217e-06, "loss": 0.8379, "step": 4880 }, { "epoch": 0.13, "learning_rate": 1.9529494017131064e-06, "loss": 0.8291, "step": 4881 }, { "epoch": 0.13, "learning_rate": 1.952924235023215e-06, "loss": 1.0752, "step": 4882 }, { "epoch": 0.13, "learning_rate": 1.952899061766715e-06, "loss": 1.1074, "step": 4883 }, { "epoch": 0.13, "learning_rate": 1.952873881943781e-06, "loss": 0.9385, "step": 4884 }, { "epoch": 0.13, "learning_rate": 1.9528486955545854e-06, "loss": 0.6804, "step": 4885 }, { "epoch": 0.13, "learning_rate": 1.952823502599302e-06, "loss": 0.9824, "step": 4886 }, { "epoch": 0.13, "learning_rate": 1.9527983030781054e-06, "loss": 0.8164, "step": 4887 }, { "epoch": 0.13, "learning_rate": 1.952773096991168e-06, "loss": 0.8877, "step": 4888 }, { "epoch": 0.13, "learning_rate": 1.9527478843386637e-06, "loss": 1.0732, "step": 4889 }, { "epoch": 0.13, "learning_rate": 1.952722665120767e-06, "loss": 0.8857, "step": 4890 }, { "epoch": 0.13, "learning_rate": 1.952697439337651e-06, "loss": 0.79, "step": 4891 }, { "epoch": 0.13, "learning_rate": 1.95267220698949e-06, "loss": 0.8584, "step": 4892 }, { "epoch": 0.13, "learning_rate": 1.9526469680764573e-06, "loss": 0.917, "step": 4893 }, { "epoch": 0.13, "learning_rate": 1.9526217225987273e-06, "loss": 1.0332, "step": 4894 }, { "epoch": 0.13, "learning_rate": 1.952596470556474e-06, "loss": 0.9053, "step": 4895 }, { "epoch": 0.13, "learning_rate": 1.952571211949871e-06, "loss": 0.8145, "step": 4896 }, { "epoch": 0.13, "learning_rate": 1.9525459467790924e-06, "loss": 0.9531, "step": 4897 }, { "epoch": 0.13, "learning_rate": 1.952520675044313e-06, "loss": 1.0576, "step": 4898 }, { "epoch": 0.13, "learning_rate": 1.952495396745706e-06, "loss": 0.999, "step": 4899 }, { "epoch": 0.13, "learning_rate": 1.9524701118834465e-06, "loss": 1.0303, "step": 4900 }, { "epoch": 0.13, "learning_rate": 1.952444820457708e-06, "loss": 0.9131, "step": 4901 }, { "epoch": 0.13, "learning_rate": 1.9524195224686646e-06, "loss": 0.9795, "step": 4902 }, { "epoch": 0.13, "learning_rate": 1.9523942179164916e-06, "loss": 1.0859, "step": 4903 }, { "epoch": 0.13, "learning_rate": 1.952368906801363e-06, "loss": 0.9082, "step": 4904 }, { "epoch": 0.13, "learning_rate": 1.9523435891234525e-06, "loss": 0.8135, "step": 4905 }, { "epoch": 0.13, "learning_rate": 1.9523182648829354e-06, "loss": 0.9873, "step": 4906 }, { "epoch": 0.13, "learning_rate": 1.952292934079986e-06, "loss": 0.873, "step": 4907 }, { "epoch": 0.13, "learning_rate": 1.9522675967147786e-06, "loss": 0.804, "step": 4908 }, { "epoch": 0.13, "learning_rate": 1.9522422527874883e-06, "loss": 0.8818, "step": 4909 }, { "epoch": 0.13, "learning_rate": 1.9522169022982892e-06, "loss": 0.6587, "step": 4910 }, { "epoch": 0.13, "learning_rate": 1.9521915452473563e-06, "loss": 1.0029, "step": 4911 }, { "epoch": 0.13, "learning_rate": 1.9521661816348645e-06, "loss": 1.2744, "step": 4912 }, { "epoch": 0.13, "learning_rate": 1.952140811460988e-06, "loss": 0.8184, "step": 4913 }, { "epoch": 0.13, "learning_rate": 1.952115434725902e-06, "loss": 1.0098, "step": 4914 }, { "epoch": 0.13, "learning_rate": 1.952090051429782e-06, "loss": 0.9834, "step": 4915 }, { "epoch": 0.13, "learning_rate": 1.9520646615728013e-06, "loss": 0.9058, "step": 4916 }, { "epoch": 0.13, "learning_rate": 1.9520392651551363e-06, "loss": 0.9385, "step": 4917 }, { "epoch": 0.13, "learning_rate": 1.9520138621769615e-06, "loss": 0.999, "step": 4918 }, { "epoch": 0.13, "learning_rate": 1.951988452638452e-06, "loss": 0.8896, "step": 4919 }, { "epoch": 0.13, "learning_rate": 1.9519630365397826e-06, "loss": 0.8584, "step": 4920 }, { "epoch": 0.13, "learning_rate": 1.9519376138811293e-06, "loss": 0.9258, "step": 4921 }, { "epoch": 0.13, "learning_rate": 1.9519121846626665e-06, "loss": 0.8184, "step": 4922 }, { "epoch": 0.13, "learning_rate": 1.9518867488845693e-06, "loss": 0.9492, "step": 4923 }, { "epoch": 0.13, "learning_rate": 1.9518613065470134e-06, "loss": 1.1582, "step": 4924 }, { "epoch": 0.13, "learning_rate": 1.9518358576501745e-06, "loss": 0.9111, "step": 4925 }, { "epoch": 0.13, "learning_rate": 1.951810402194227e-06, "loss": 1.166, "step": 4926 }, { "epoch": 0.13, "learning_rate": 1.951784940179347e-06, "loss": 1.0293, "step": 4927 }, { "epoch": 0.13, "learning_rate": 1.95175947160571e-06, "loss": 0.958, "step": 4928 }, { "epoch": 0.13, "learning_rate": 1.951733996473491e-06, "loss": 1.1025, "step": 4929 }, { "epoch": 0.13, "learning_rate": 1.9517085147828665e-06, "loss": 0.856, "step": 4930 }, { "epoch": 0.13, "learning_rate": 1.9516830265340106e-06, "loss": 0.8232, "step": 4931 }, { "epoch": 0.13, "learning_rate": 1.9516575317271e-06, "loss": 0.918, "step": 4932 }, { "epoch": 0.13, "learning_rate": 1.9516320303623103e-06, "loss": 0.7419, "step": 4933 }, { "epoch": 0.13, "learning_rate": 1.951606522439817e-06, "loss": 0.8706, "step": 4934 }, { "epoch": 0.13, "learning_rate": 1.9515810079597962e-06, "loss": 1.04, "step": 4935 }, { "epoch": 0.13, "learning_rate": 1.9515554869224233e-06, "loss": 0.6313, "step": 4936 }, { "epoch": 0.13, "learning_rate": 1.9515299593278744e-06, "loss": 0.9355, "step": 4937 }, { "epoch": 0.13, "learning_rate": 1.951504425176325e-06, "loss": 1.0703, "step": 4938 }, { "epoch": 0.13, "learning_rate": 1.9514788844679517e-06, "loss": 0.9072, "step": 4939 }, { "epoch": 0.13, "learning_rate": 1.9514533372029304e-06, "loss": 1.0391, "step": 4940 }, { "epoch": 0.13, "learning_rate": 1.951427783381437e-06, "loss": 0.9121, "step": 4941 }, { "epoch": 0.13, "learning_rate": 1.9514022230036475e-06, "loss": 1.0957, "step": 4942 }, { "epoch": 0.13, "learning_rate": 1.9513766560697376e-06, "loss": 0.9062, "step": 4943 }, { "epoch": 0.13, "learning_rate": 1.9513510825798845e-06, "loss": 0.9355, "step": 4944 }, { "epoch": 0.13, "learning_rate": 1.9513255025342637e-06, "loss": 0.9243, "step": 4945 }, { "epoch": 0.13, "learning_rate": 1.9512999159330518e-06, "loss": 1.0723, "step": 4946 }, { "epoch": 0.13, "learning_rate": 1.951274322776425e-06, "loss": 1.0498, "step": 4947 }, { "epoch": 0.13, "learning_rate": 1.9512487230645595e-06, "loss": 0.9453, "step": 4948 }, { "epoch": 0.13, "learning_rate": 1.9512231167976315e-06, "loss": 0.916, "step": 4949 }, { "epoch": 0.13, "learning_rate": 1.9511975039758184e-06, "loss": 0.8035, "step": 4950 }, { "epoch": 0.13, "learning_rate": 1.951171884599296e-06, "loss": 0.8203, "step": 4951 }, { "epoch": 0.13, "learning_rate": 1.951146258668241e-06, "loss": 0.9717, "step": 4952 }, { "epoch": 0.13, "learning_rate": 1.95112062618283e-06, "loss": 1.0596, "step": 4953 }, { "epoch": 0.13, "learning_rate": 1.9510949871432396e-06, "loss": 1.0479, "step": 4954 }, { "epoch": 0.13, "learning_rate": 1.951069341549646e-06, "loss": 0.9463, "step": 4955 }, { "epoch": 0.13, "learning_rate": 1.9510436894022267e-06, "loss": 0.9912, "step": 4956 }, { "epoch": 0.13, "learning_rate": 1.951018030701158e-06, "loss": 1.0049, "step": 4957 }, { "epoch": 0.13, "learning_rate": 1.9509923654466174e-06, "loss": 0.9619, "step": 4958 }, { "epoch": 0.13, "learning_rate": 1.9509666936387804e-06, "loss": 1.0312, "step": 4959 }, { "epoch": 0.13, "learning_rate": 1.9509410152778256e-06, "loss": 0.748, "step": 4960 }, { "epoch": 0.13, "learning_rate": 1.9509153303639283e-06, "loss": 0.8862, "step": 4961 }, { "epoch": 0.13, "learning_rate": 1.950889638897267e-06, "loss": 0.8525, "step": 4962 }, { "epoch": 0.13, "learning_rate": 1.9508639408780173e-06, "loss": 0.7832, "step": 4963 }, { "epoch": 0.13, "learning_rate": 1.9508382363063572e-06, "loss": 1.0703, "step": 4964 }, { "epoch": 0.13, "learning_rate": 1.950812525182464e-06, "loss": 1.0908, "step": 4965 }, { "epoch": 0.13, "learning_rate": 1.950786807506514e-06, "loss": 0.9717, "step": 4966 }, { "epoch": 0.13, "learning_rate": 1.9507610832786853e-06, "loss": 0.9424, "step": 4967 }, { "epoch": 0.13, "learning_rate": 1.9507353524991545e-06, "loss": 1.0547, "step": 4968 }, { "epoch": 0.13, "learning_rate": 1.9507096151680997e-06, "loss": 0.8984, "step": 4969 }, { "epoch": 0.13, "learning_rate": 1.9506838712856973e-06, "loss": 0.9072, "step": 4970 }, { "epoch": 0.13, "learning_rate": 1.9506581208521252e-06, "loss": 1.0518, "step": 4971 }, { "epoch": 0.13, "learning_rate": 1.950632363867561e-06, "loss": 0.6567, "step": 4972 }, { "epoch": 0.13, "learning_rate": 1.950606600332182e-06, "loss": 0.7812, "step": 4973 }, { "epoch": 0.13, "learning_rate": 1.9505808302461653e-06, "loss": 1.04, "step": 4974 }, { "epoch": 0.13, "learning_rate": 1.9505550536096896e-06, "loss": 0.7524, "step": 4975 }, { "epoch": 0.13, "learning_rate": 1.9505292704229315e-06, "loss": 0.9727, "step": 4976 }, { "epoch": 0.13, "learning_rate": 1.950503480686069e-06, "loss": 1.0908, "step": 4977 }, { "epoch": 0.13, "learning_rate": 1.95047768439928e-06, "loss": 1.0566, "step": 4978 }, { "epoch": 0.13, "learning_rate": 1.950451881562742e-06, "loss": 0.9873, "step": 4979 }, { "epoch": 0.13, "learning_rate": 1.9504260721766328e-06, "loss": 0.9414, "step": 4980 }, { "epoch": 0.13, "learning_rate": 1.9504002562411305e-06, "loss": 1.1328, "step": 4981 }, { "epoch": 0.13, "learning_rate": 1.9503744337564126e-06, "loss": 1.1367, "step": 4982 }, { "epoch": 0.13, "learning_rate": 1.9503486047226575e-06, "loss": 0.9619, "step": 4983 }, { "epoch": 0.13, "learning_rate": 1.950322769140043e-06, "loss": 1.0234, "step": 4984 }, { "epoch": 0.13, "learning_rate": 1.950296927008747e-06, "loss": 0.7251, "step": 4985 }, { "epoch": 0.13, "learning_rate": 1.950271078328948e-06, "loss": 0.9648, "step": 4986 }, { "epoch": 0.13, "learning_rate": 1.9502452231008234e-06, "loss": 1.0918, "step": 4987 }, { "epoch": 0.13, "learning_rate": 1.950219361324552e-06, "loss": 0.9961, "step": 4988 }, { "epoch": 0.13, "learning_rate": 1.950193493000312e-06, "loss": 0.9492, "step": 4989 }, { "epoch": 0.13, "learning_rate": 1.9501676181282815e-06, "loss": 1.042, "step": 4990 }, { "epoch": 0.13, "learning_rate": 1.9501417367086383e-06, "loss": 0.8633, "step": 4991 }, { "epoch": 0.13, "learning_rate": 1.9501158487415613e-06, "loss": 0.8525, "step": 4992 }, { "epoch": 0.13, "learning_rate": 1.9500899542272292e-06, "loss": 1.0811, "step": 4993 }, { "epoch": 0.13, "learning_rate": 1.9500640531658195e-06, "loss": 0.7583, "step": 4994 }, { "epoch": 0.13, "learning_rate": 1.9500381455575117e-06, "loss": 0.9961, "step": 4995 }, { "epoch": 0.13, "learning_rate": 1.9500122314024838e-06, "loss": 1.0859, "step": 4996 }, { "epoch": 0.13, "learning_rate": 1.9499863107009143e-06, "loss": 0.7959, "step": 4997 }, { "epoch": 0.13, "learning_rate": 1.949960383452982e-06, "loss": 0.792, "step": 4998 }, { "epoch": 0.13, "learning_rate": 1.9499344496588655e-06, "loss": 0.9727, "step": 4999 }, { "epoch": 0.13, "learning_rate": 1.9499085093187436e-06, "loss": 0.5552, "step": 5000 } ], "logging_steps": 1.0, "max_steps": 39016, "num_train_epochs": 1, "save_steps": 5000, "total_flos": 129762904227840.0, "trial_name": null, "trial_params": null }