{ "best_metric": null, "best_model_checkpoint": null, "epoch": 1.536, "eval_steps": 500, "global_step": 48000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 1.2800000000000001e-09, "loss": 2.0804, "step": 1 }, { "epoch": 0.0, "learning_rate": 6.400000000000001e-09, "loss": 2.0692, "step": 5 }, { "epoch": 0.0, "learning_rate": 1.2800000000000002e-08, "loss": 2.1047, "step": 10 }, { "epoch": 0.0, "learning_rate": 1.9200000000000003e-08, "loss": 2.0927, "step": 15 }, { "epoch": 0.0, "learning_rate": 2.5600000000000004e-08, "loss": 2.0802, "step": 20 }, { "epoch": 0.0, "learning_rate": 3.2e-08, "loss": 2.0879, "step": 25 }, { "epoch": 0.0, "learning_rate": 3.8400000000000006e-08, "loss": 2.0852, "step": 30 }, { "epoch": 0.0, "learning_rate": 4.48e-08, "loss": 2.0654, "step": 35 }, { "epoch": 0.0, "learning_rate": 5.120000000000001e-08, "loss": 2.1006, "step": 40 }, { "epoch": 0.0, "learning_rate": 5.7600000000000006e-08, "loss": 2.0717, "step": 45 }, { "epoch": 0.0, "learning_rate": 6.4e-08, "loss": 2.0658, "step": 50 }, { "epoch": 0.0, "learning_rate": 7.040000000000001e-08, "loss": 2.036, "step": 55 }, { "epoch": 0.0, "learning_rate": 7.680000000000001e-08, "loss": 2.0428, "step": 60 }, { "epoch": 0.0, "learning_rate": 8.32e-08, "loss": 2.0419, "step": 65 }, { "epoch": 0.0, "learning_rate": 8.96e-08, "loss": 2.0317, "step": 70 }, { "epoch": 0.0, "learning_rate": 9.6e-08, "loss": 2.0456, "step": 75 }, { "epoch": 0.0, "learning_rate": 1.0240000000000002e-07, "loss": 2.0136, "step": 80 }, { "epoch": 0.0, "learning_rate": 1.0880000000000002e-07, "loss": 2.0241, "step": 85 }, { "epoch": 0.0, "learning_rate": 1.1520000000000001e-07, "loss": 2.0083, "step": 90 }, { "epoch": 0.0, "learning_rate": 1.216e-07, "loss": 2.0187, "step": 95 }, { "epoch": 0.0, "learning_rate": 1.28e-07, "loss": 2.0067, "step": 100 }, { "epoch": 0.0, "learning_rate": 1.344e-07, "loss": 2.0019, "step": 105 }, { "epoch": 0.0, "learning_rate": 1.4080000000000002e-07, "loss": 1.9899, "step": 110 }, { "epoch": 0.0, "learning_rate": 1.4720000000000002e-07, "loss": 1.9648, "step": 115 }, { "epoch": 0.0, "learning_rate": 1.5360000000000003e-07, "loss": 1.9652, "step": 120 }, { "epoch": 0.0, "learning_rate": 1.6e-07, "loss": 1.9284, "step": 125 }, { "epoch": 0.0, "learning_rate": 1.664e-07, "loss": 1.9491, "step": 130 }, { "epoch": 0.0, "learning_rate": 1.728e-07, "loss": 1.9442, "step": 135 }, { "epoch": 0.0, "learning_rate": 1.792e-07, "loss": 1.9239, "step": 140 }, { "epoch": 0.0, "learning_rate": 1.8560000000000002e-07, "loss": 1.9454, "step": 145 }, { "epoch": 0.0, "learning_rate": 1.92e-07, "loss": 1.914, "step": 150 }, { "epoch": 0.0, "learning_rate": 1.984e-07, "loss": 1.8963, "step": 155 }, { "epoch": 0.01, "learning_rate": 2.0480000000000003e-07, "loss": 1.8846, "step": 160 }, { "epoch": 0.01, "learning_rate": 2.112e-07, "loss": 1.8761, "step": 165 }, { "epoch": 0.01, "learning_rate": 2.1760000000000004e-07, "loss": 1.8882, "step": 170 }, { "epoch": 0.01, "learning_rate": 2.2400000000000002e-07, "loss": 1.8794, "step": 175 }, { "epoch": 0.01, "learning_rate": 2.3040000000000002e-07, "loss": 1.8585, "step": 180 }, { "epoch": 0.01, "learning_rate": 2.368e-07, "loss": 1.8616, "step": 185 }, { "epoch": 0.01, "learning_rate": 2.432e-07, "loss": 1.8567, "step": 190 }, { "epoch": 0.01, "learning_rate": 2.496e-07, "loss": 1.8642, "step": 195 }, { "epoch": 0.01, "learning_rate": 2.56e-07, "loss": 1.8508, "step": 200 }, { "epoch": 0.01, "learning_rate": 2.624e-07, "loss": 1.8372, "step": 205 }, { "epoch": 0.01, "learning_rate": 2.688e-07, "loss": 1.8225, "step": 210 }, { "epoch": 0.01, "learning_rate": 2.7520000000000003e-07, "loss": 1.8232, "step": 215 }, { "epoch": 0.01, "learning_rate": 2.8160000000000003e-07, "loss": 1.8183, "step": 220 }, { "epoch": 0.01, "learning_rate": 2.8800000000000004e-07, "loss": 1.8174, "step": 225 }, { "epoch": 0.01, "learning_rate": 2.9440000000000004e-07, "loss": 1.8196, "step": 230 }, { "epoch": 0.01, "learning_rate": 3.008e-07, "loss": 1.8158, "step": 235 }, { "epoch": 0.01, "learning_rate": 3.0720000000000005e-07, "loss": 1.7998, "step": 240 }, { "epoch": 0.01, "learning_rate": 3.136e-07, "loss": 1.7931, "step": 245 }, { "epoch": 0.01, "learning_rate": 3.2e-07, "loss": 1.8028, "step": 250 }, { "epoch": 0.01, "learning_rate": 3.2640000000000006e-07, "loss": 1.7743, "step": 255 }, { "epoch": 0.01, "learning_rate": 3.328e-07, "loss": 1.8076, "step": 260 }, { "epoch": 0.01, "learning_rate": 3.392e-07, "loss": 1.7776, "step": 265 }, { "epoch": 0.01, "learning_rate": 3.456e-07, "loss": 1.788, "step": 270 }, { "epoch": 0.01, "learning_rate": 3.5200000000000003e-07, "loss": 1.7723, "step": 275 }, { "epoch": 0.01, "learning_rate": 3.584e-07, "loss": 1.7644, "step": 280 }, { "epoch": 0.01, "learning_rate": 3.6480000000000004e-07, "loss": 1.7607, "step": 285 }, { "epoch": 0.01, "learning_rate": 3.7120000000000004e-07, "loss": 1.7548, "step": 290 }, { "epoch": 0.01, "learning_rate": 3.7760000000000005e-07, "loss": 1.7537, "step": 295 }, { "epoch": 0.01, "learning_rate": 3.84e-07, "loss": 1.7551, "step": 300 }, { "epoch": 0.01, "learning_rate": 3.904e-07, "loss": 1.742, "step": 305 }, { "epoch": 0.01, "learning_rate": 3.968e-07, "loss": 1.7261, "step": 310 }, { "epoch": 0.01, "learning_rate": 4.0320000000000006e-07, "loss": 1.7364, "step": 315 }, { "epoch": 0.01, "learning_rate": 4.0960000000000007e-07, "loss": 1.7286, "step": 320 }, { "epoch": 0.01, "learning_rate": 4.16e-07, "loss": 1.7373, "step": 325 }, { "epoch": 0.01, "learning_rate": 4.224e-07, "loss": 1.7206, "step": 330 }, { "epoch": 0.01, "learning_rate": 4.2880000000000003e-07, "loss": 1.6963, "step": 335 }, { "epoch": 0.01, "learning_rate": 4.352000000000001e-07, "loss": 1.7102, "step": 340 }, { "epoch": 0.01, "learning_rate": 4.4160000000000004e-07, "loss": 1.7082, "step": 345 }, { "epoch": 0.01, "learning_rate": 4.4800000000000004e-07, "loss": 1.6996, "step": 350 }, { "epoch": 0.01, "learning_rate": 4.5440000000000005e-07, "loss": 1.7064, "step": 355 }, { "epoch": 0.01, "learning_rate": 4.6080000000000005e-07, "loss": 1.6969, "step": 360 }, { "epoch": 0.01, "learning_rate": 4.672e-07, "loss": 1.703, "step": 365 }, { "epoch": 0.01, "learning_rate": 4.736e-07, "loss": 1.6827, "step": 370 }, { "epoch": 0.01, "learning_rate": 4.800000000000001e-07, "loss": 1.692, "step": 375 }, { "epoch": 0.01, "learning_rate": 4.864e-07, "loss": 1.6673, "step": 380 }, { "epoch": 0.01, "learning_rate": 4.928e-07, "loss": 1.6776, "step": 385 }, { "epoch": 0.01, "learning_rate": 4.992e-07, "loss": 1.6732, "step": 390 }, { "epoch": 0.01, "learning_rate": 5.056000000000001e-07, "loss": 1.6806, "step": 395 }, { "epoch": 0.01, "learning_rate": 5.12e-07, "loss": 1.6687, "step": 400 }, { "epoch": 0.01, "learning_rate": 5.184e-07, "loss": 1.664, "step": 405 }, { "epoch": 0.01, "learning_rate": 5.248e-07, "loss": 1.6637, "step": 410 }, { "epoch": 0.01, "learning_rate": 5.312000000000001e-07, "loss": 1.6457, "step": 415 }, { "epoch": 0.01, "learning_rate": 5.376e-07, "loss": 1.6616, "step": 420 }, { "epoch": 0.01, "learning_rate": 5.44e-07, "loss": 1.6566, "step": 425 }, { "epoch": 0.01, "learning_rate": 5.504000000000001e-07, "loss": 1.6495, "step": 430 }, { "epoch": 0.01, "learning_rate": 5.568e-07, "loss": 1.6377, "step": 435 }, { "epoch": 0.01, "learning_rate": 5.632000000000001e-07, "loss": 1.66, "step": 440 }, { "epoch": 0.01, "learning_rate": 5.696e-07, "loss": 1.6432, "step": 445 }, { "epoch": 0.01, "learning_rate": 5.760000000000001e-07, "loss": 1.6198, "step": 450 }, { "epoch": 0.01, "learning_rate": 5.824e-07, "loss": 1.6216, "step": 455 }, { "epoch": 0.01, "learning_rate": 5.888000000000001e-07, "loss": 1.6218, "step": 460 }, { "epoch": 0.01, "learning_rate": 5.952e-07, "loss": 1.6223, "step": 465 }, { "epoch": 0.02, "learning_rate": 6.016e-07, "loss": 1.6177, "step": 470 }, { "epoch": 0.02, "learning_rate": 6.08e-07, "loss": 1.6115, "step": 475 }, { "epoch": 0.02, "learning_rate": 6.144000000000001e-07, "loss": 1.6242, "step": 480 }, { "epoch": 0.02, "learning_rate": 6.208000000000001e-07, "loss": 1.6061, "step": 485 }, { "epoch": 0.02, "learning_rate": 6.272e-07, "loss": 1.625, "step": 490 }, { "epoch": 0.02, "learning_rate": 6.336000000000001e-07, "loss": 1.6041, "step": 495 }, { "epoch": 0.02, "learning_rate": 6.4e-07, "loss": 1.5859, "step": 500 }, { "epoch": 0.02, "learning_rate": 6.464000000000001e-07, "loss": 1.6088, "step": 505 }, { "epoch": 0.02, "learning_rate": 6.528000000000001e-07, "loss": 1.5875, "step": 510 }, { "epoch": 0.02, "learning_rate": 6.592000000000001e-07, "loss": 1.597, "step": 515 }, { "epoch": 0.02, "learning_rate": 6.656e-07, "loss": 1.5934, "step": 520 }, { "epoch": 0.02, "learning_rate": 6.72e-07, "loss": 1.5865, "step": 525 }, { "epoch": 0.02, "learning_rate": 6.784e-07, "loss": 1.5897, "step": 530 }, { "epoch": 0.02, "learning_rate": 6.848000000000001e-07, "loss": 1.5934, "step": 535 }, { "epoch": 0.02, "learning_rate": 6.912e-07, "loss": 1.5699, "step": 540 }, { "epoch": 0.02, "learning_rate": 6.976000000000001e-07, "loss": 1.5822, "step": 545 }, { "epoch": 0.02, "learning_rate": 7.040000000000001e-07, "loss": 1.5747, "step": 550 }, { "epoch": 0.02, "learning_rate": 7.104000000000001e-07, "loss": 1.564, "step": 555 }, { "epoch": 0.02, "learning_rate": 7.168e-07, "loss": 1.5655, "step": 560 }, { "epoch": 0.02, "learning_rate": 7.232e-07, "loss": 1.5757, "step": 565 }, { "epoch": 0.02, "learning_rate": 7.296000000000001e-07, "loss": 1.5593, "step": 570 }, { "epoch": 0.02, "learning_rate": 7.36e-07, "loss": 1.5645, "step": 575 }, { "epoch": 0.02, "learning_rate": 7.424000000000001e-07, "loss": 1.5617, "step": 580 }, { "epoch": 0.02, "learning_rate": 7.488e-07, "loss": 1.5675, "step": 585 }, { "epoch": 0.02, "learning_rate": 7.552000000000001e-07, "loss": 1.5632, "step": 590 }, { "epoch": 0.02, "learning_rate": 7.616000000000001e-07, "loss": 1.5554, "step": 595 }, { "epoch": 0.02, "learning_rate": 7.68e-07, "loss": 1.5714, "step": 600 }, { "epoch": 0.02, "learning_rate": 7.744e-07, "loss": 1.5601, "step": 605 }, { "epoch": 0.02, "learning_rate": 7.808e-07, "loss": 1.5641, "step": 610 }, { "epoch": 0.02, "learning_rate": 7.872000000000001e-07, "loss": 1.5384, "step": 615 }, { "epoch": 0.02, "learning_rate": 7.936e-07, "loss": 1.5356, "step": 620 }, { "epoch": 0.02, "learning_rate": 8.000000000000001e-07, "loss": 1.5413, "step": 625 }, { "epoch": 0.02, "learning_rate": 8.064000000000001e-07, "loss": 1.5428, "step": 630 }, { "epoch": 0.02, "learning_rate": 8.128000000000001e-07, "loss": 1.5215, "step": 635 }, { "epoch": 0.02, "learning_rate": 8.192000000000001e-07, "loss": 1.5349, "step": 640 }, { "epoch": 0.02, "learning_rate": 8.256e-07, "loss": 1.531, "step": 645 }, { "epoch": 0.02, "learning_rate": 8.32e-07, "loss": 1.5235, "step": 650 }, { "epoch": 0.02, "learning_rate": 8.384000000000001e-07, "loss": 1.5263, "step": 655 }, { "epoch": 0.02, "learning_rate": 8.448e-07, "loss": 1.5258, "step": 660 }, { "epoch": 0.02, "learning_rate": 8.512000000000001e-07, "loss": 1.5198, "step": 665 }, { "epoch": 0.02, "learning_rate": 8.576000000000001e-07, "loss": 1.509, "step": 670 }, { "epoch": 0.02, "learning_rate": 8.640000000000001e-07, "loss": 1.5356, "step": 675 }, { "epoch": 0.02, "learning_rate": 8.704000000000002e-07, "loss": 1.5134, "step": 680 }, { "epoch": 0.02, "learning_rate": 8.768e-07, "loss": 1.5173, "step": 685 }, { "epoch": 0.02, "learning_rate": 8.832000000000001e-07, "loss": 1.5056, "step": 690 }, { "epoch": 0.02, "learning_rate": 8.896e-07, "loss": 1.5093, "step": 695 }, { "epoch": 0.02, "learning_rate": 8.960000000000001e-07, "loss": 1.5077, "step": 700 }, { "epoch": 0.02, "learning_rate": 9.024e-07, "loss": 1.5128, "step": 705 }, { "epoch": 0.02, "learning_rate": 9.088000000000001e-07, "loss": 1.5049, "step": 710 }, { "epoch": 0.02, "learning_rate": 9.152000000000001e-07, "loss": 1.4956, "step": 715 }, { "epoch": 0.02, "learning_rate": 9.216000000000001e-07, "loss": 1.5162, "step": 720 }, { "epoch": 0.02, "learning_rate": 9.28e-07, "loss": 1.496, "step": 725 }, { "epoch": 0.02, "learning_rate": 9.344e-07, "loss": 1.4865, "step": 730 }, { "epoch": 0.02, "learning_rate": 9.408000000000001e-07, "loss": 1.4901, "step": 735 }, { "epoch": 0.02, "learning_rate": 9.472e-07, "loss": 1.5181, "step": 740 }, { "epoch": 0.02, "learning_rate": 9.536000000000001e-07, "loss": 1.4874, "step": 745 }, { "epoch": 0.02, "learning_rate": 9.600000000000001e-07, "loss": 1.4866, "step": 750 }, { "epoch": 0.02, "learning_rate": 9.664000000000002e-07, "loss": 1.4838, "step": 755 }, { "epoch": 0.02, "learning_rate": 9.728e-07, "loss": 1.48, "step": 760 }, { "epoch": 0.02, "learning_rate": 9.792e-07, "loss": 1.4878, "step": 765 }, { "epoch": 0.02, "learning_rate": 9.856e-07, "loss": 1.4835, "step": 770 }, { "epoch": 0.02, "learning_rate": 9.92e-07, "loss": 1.4858, "step": 775 }, { "epoch": 0.02, "learning_rate": 9.984e-07, "loss": 1.4906, "step": 780 }, { "epoch": 0.03, "learning_rate": 1.0048e-06, "loss": 1.4854, "step": 785 }, { "epoch": 0.03, "learning_rate": 1.0112000000000002e-06, "loss": 1.4715, "step": 790 }, { "epoch": 0.03, "learning_rate": 1.0176000000000002e-06, "loss": 1.4845, "step": 795 }, { "epoch": 0.03, "learning_rate": 1.024e-06, "loss": 1.4707, "step": 800 }, { "epoch": 0.03, "learning_rate": 1.0304000000000001e-06, "loss": 1.4713, "step": 805 }, { "epoch": 0.03, "learning_rate": 1.0368e-06, "loss": 1.4625, "step": 810 }, { "epoch": 0.03, "learning_rate": 1.0432e-06, "loss": 1.4681, "step": 815 }, { "epoch": 0.03, "learning_rate": 1.0496e-06, "loss": 1.4508, "step": 820 }, { "epoch": 0.03, "learning_rate": 1.0560000000000001e-06, "loss": 1.4705, "step": 825 }, { "epoch": 0.03, "learning_rate": 1.0624000000000002e-06, "loss": 1.4628, "step": 830 }, { "epoch": 0.03, "learning_rate": 1.0688e-06, "loss": 1.4703, "step": 835 }, { "epoch": 0.03, "learning_rate": 1.0752e-06, "loss": 1.4615, "step": 840 }, { "epoch": 0.03, "learning_rate": 1.0816000000000002e-06, "loss": 1.4573, "step": 845 }, { "epoch": 0.03, "learning_rate": 1.088e-06, "loss": 1.477, "step": 850 }, { "epoch": 0.03, "learning_rate": 1.0944e-06, "loss": 1.4623, "step": 855 }, { "epoch": 0.03, "learning_rate": 1.1008000000000001e-06, "loss": 1.4557, "step": 860 }, { "epoch": 0.03, "learning_rate": 1.1072000000000002e-06, "loss": 1.453, "step": 865 }, { "epoch": 0.03, "learning_rate": 1.1136e-06, "loss": 1.4659, "step": 870 }, { "epoch": 0.03, "learning_rate": 1.12e-06, "loss": 1.452, "step": 875 }, { "epoch": 0.03, "learning_rate": 1.1264000000000001e-06, "loss": 1.4496, "step": 880 }, { "epoch": 0.03, "learning_rate": 1.1328000000000002e-06, "loss": 1.4559, "step": 885 }, { "epoch": 0.03, "learning_rate": 1.1392e-06, "loss": 1.4529, "step": 890 }, { "epoch": 0.03, "learning_rate": 1.1456e-06, "loss": 1.4408, "step": 895 }, { "epoch": 0.03, "learning_rate": 1.1520000000000002e-06, "loss": 1.4372, "step": 900 }, { "epoch": 0.03, "learning_rate": 1.1584e-06, "loss": 1.4433, "step": 905 }, { "epoch": 0.03, "learning_rate": 1.1648e-06, "loss": 1.4471, "step": 910 }, { "epoch": 0.03, "learning_rate": 1.1712000000000001e-06, "loss": 1.4568, "step": 915 }, { "epoch": 0.03, "learning_rate": 1.1776000000000002e-06, "loss": 1.4407, "step": 920 }, { "epoch": 0.03, "learning_rate": 1.1840000000000002e-06, "loss": 1.4464, "step": 925 }, { "epoch": 0.03, "learning_rate": 1.1904e-06, "loss": 1.4253, "step": 930 }, { "epoch": 0.03, "learning_rate": 1.1968000000000001e-06, "loss": 1.4401, "step": 935 }, { "epoch": 0.03, "learning_rate": 1.2032e-06, "loss": 1.43, "step": 940 }, { "epoch": 0.03, "learning_rate": 1.2096e-06, "loss": 1.4409, "step": 945 }, { "epoch": 0.03, "learning_rate": 1.216e-06, "loss": 1.429, "step": 950 }, { "epoch": 0.03, "learning_rate": 1.2224000000000001e-06, "loss": 1.4276, "step": 955 }, { "epoch": 0.03, "learning_rate": 1.2288000000000002e-06, "loss": 1.4344, "step": 960 }, { "epoch": 0.03, "learning_rate": 1.2352e-06, "loss": 1.4406, "step": 965 }, { "epoch": 0.03, "learning_rate": 1.2416000000000001e-06, "loss": 1.4254, "step": 970 }, { "epoch": 0.03, "learning_rate": 1.248e-06, "loss": 1.4122, "step": 975 }, { "epoch": 0.03, "learning_rate": 1.2544e-06, "loss": 1.425, "step": 980 }, { "epoch": 0.03, "learning_rate": 1.2608e-06, "loss": 1.4237, "step": 985 }, { "epoch": 0.03, "learning_rate": 1.2672000000000001e-06, "loss": 1.4224, "step": 990 }, { "epoch": 0.03, "learning_rate": 1.2736000000000002e-06, "loss": 1.4227, "step": 995 }, { "epoch": 0.03, "learning_rate": 1.28e-06, "loss": 1.4325, "step": 1000 }, { "epoch": 0.03, "learning_rate": 1.2864e-06, "loss": 1.4278, "step": 1005 }, { "epoch": 0.03, "learning_rate": 1.2928000000000001e-06, "loss": 1.4035, "step": 1010 }, { "epoch": 0.03, "learning_rate": 1.2992000000000002e-06, "loss": 1.4231, "step": 1015 }, { "epoch": 0.03, "learning_rate": 1.3056000000000003e-06, "loss": 1.4169, "step": 1020 }, { "epoch": 0.03, "learning_rate": 1.3120000000000003e-06, "loss": 1.4035, "step": 1025 }, { "epoch": 0.03, "learning_rate": 1.3184000000000002e-06, "loss": 1.4094, "step": 1030 }, { "epoch": 0.03, "learning_rate": 1.3248e-06, "loss": 1.4097, "step": 1035 }, { "epoch": 0.03, "learning_rate": 1.3312e-06, "loss": 1.4261, "step": 1040 }, { "epoch": 0.03, "learning_rate": 1.3376e-06, "loss": 1.4113, "step": 1045 }, { "epoch": 0.03, "learning_rate": 1.344e-06, "loss": 1.4034, "step": 1050 }, { "epoch": 0.03, "learning_rate": 1.3504e-06, "loss": 1.4096, "step": 1055 }, { "epoch": 0.03, "learning_rate": 1.3568e-06, "loss": 1.4106, "step": 1060 }, { "epoch": 0.03, "learning_rate": 1.3632000000000001e-06, "loss": 1.4023, "step": 1065 }, { "epoch": 0.03, "learning_rate": 1.3696000000000002e-06, "loss": 1.4035, "step": 1070 }, { "epoch": 0.03, "learning_rate": 1.376e-06, "loss": 1.4146, "step": 1075 }, { "epoch": 0.03, "learning_rate": 1.3824e-06, "loss": 1.4054, "step": 1080 }, { "epoch": 0.03, "learning_rate": 1.3888000000000002e-06, "loss": 1.3996, "step": 1085 }, { "epoch": 0.03, "learning_rate": 1.3952000000000002e-06, "loss": 1.4073, "step": 1090 }, { "epoch": 0.04, "learning_rate": 1.4016000000000003e-06, "loss": 1.4119, "step": 1095 }, { "epoch": 0.04, "learning_rate": 1.4080000000000001e-06, "loss": 1.394, "step": 1100 }, { "epoch": 0.04, "learning_rate": 1.4144000000000002e-06, "loss": 1.3976, "step": 1105 }, { "epoch": 0.04, "learning_rate": 1.4208000000000002e-06, "loss": 1.4036, "step": 1110 }, { "epoch": 0.04, "learning_rate": 1.4272000000000003e-06, "loss": 1.3786, "step": 1115 }, { "epoch": 0.04, "learning_rate": 1.4336e-06, "loss": 1.4106, "step": 1120 }, { "epoch": 0.04, "learning_rate": 1.44e-06, "loss": 1.3807, "step": 1125 }, { "epoch": 0.04, "learning_rate": 1.4464e-06, "loss": 1.3796, "step": 1130 }, { "epoch": 0.04, "learning_rate": 1.4528e-06, "loss": 1.3996, "step": 1135 }, { "epoch": 0.04, "learning_rate": 1.4592000000000001e-06, "loss": 1.3989, "step": 1140 }, { "epoch": 0.04, "learning_rate": 1.4656e-06, "loss": 1.4022, "step": 1145 }, { "epoch": 0.04, "learning_rate": 1.472e-06, "loss": 1.3845, "step": 1150 }, { "epoch": 0.04, "learning_rate": 1.4784000000000001e-06, "loss": 1.3965, "step": 1155 }, { "epoch": 0.04, "learning_rate": 1.4848000000000002e-06, "loss": 1.3828, "step": 1160 }, { "epoch": 0.04, "learning_rate": 1.4912000000000002e-06, "loss": 1.3883, "step": 1165 }, { "epoch": 0.04, "learning_rate": 1.4976e-06, "loss": 1.3855, "step": 1170 }, { "epoch": 0.04, "learning_rate": 1.5040000000000001e-06, "loss": 1.3835, "step": 1175 }, { "epoch": 0.04, "learning_rate": 1.5104000000000002e-06, "loss": 1.3739, "step": 1180 }, { "epoch": 0.04, "learning_rate": 1.5168000000000002e-06, "loss": 1.3903, "step": 1185 }, { "epoch": 0.04, "learning_rate": 1.5232000000000003e-06, "loss": 1.3775, "step": 1190 }, { "epoch": 0.04, "learning_rate": 1.5296000000000004e-06, "loss": 1.3816, "step": 1195 }, { "epoch": 0.04, "learning_rate": 1.536e-06, "loss": 1.3702, "step": 1200 }, { "epoch": 0.04, "learning_rate": 1.5424e-06, "loss": 1.3846, "step": 1205 }, { "epoch": 0.04, "learning_rate": 1.5488e-06, "loss": 1.3755, "step": 1210 }, { "epoch": 0.04, "learning_rate": 1.5552e-06, "loss": 1.382, "step": 1215 }, { "epoch": 0.04, "learning_rate": 1.5616e-06, "loss": 1.3678, "step": 1220 }, { "epoch": 0.04, "learning_rate": 1.568e-06, "loss": 1.3717, "step": 1225 }, { "epoch": 0.04, "learning_rate": 1.5744000000000001e-06, "loss": 1.3731, "step": 1230 }, { "epoch": 0.04, "learning_rate": 1.5808000000000002e-06, "loss": 1.3582, "step": 1235 }, { "epoch": 0.04, "learning_rate": 1.5872e-06, "loss": 1.3716, "step": 1240 }, { "epoch": 0.04, "learning_rate": 1.5936e-06, "loss": 1.3805, "step": 1245 }, { "epoch": 0.04, "learning_rate": 1.6000000000000001e-06, "loss": 1.3684, "step": 1250 }, { "epoch": 0.04, "learning_rate": 1.6064000000000002e-06, "loss": 1.35, "step": 1255 }, { "epoch": 0.04, "learning_rate": 1.6128000000000003e-06, "loss": 1.3612, "step": 1260 }, { "epoch": 0.04, "learning_rate": 1.6192000000000003e-06, "loss": 1.351, "step": 1265 }, { "epoch": 0.04, "learning_rate": 1.6256000000000002e-06, "loss": 1.3513, "step": 1270 }, { "epoch": 0.04, "learning_rate": 1.6320000000000002e-06, "loss": 1.3741, "step": 1275 }, { "epoch": 0.04, "learning_rate": 1.6384000000000003e-06, "loss": 1.3708, "step": 1280 }, { "epoch": 0.04, "learning_rate": 1.6448e-06, "loss": 1.3671, "step": 1285 }, { "epoch": 0.04, "learning_rate": 1.6512e-06, "loss": 1.3587, "step": 1290 }, { "epoch": 0.04, "learning_rate": 1.6576e-06, "loss": 1.3568, "step": 1295 }, { "epoch": 0.04, "learning_rate": 1.664e-06, "loss": 1.347, "step": 1300 }, { "epoch": 0.04, "learning_rate": 1.6704000000000001e-06, "loss": 1.3528, "step": 1305 }, { "epoch": 0.04, "learning_rate": 1.6768000000000002e-06, "loss": 1.351, "step": 1310 }, { "epoch": 0.04, "learning_rate": 1.6832e-06, "loss": 1.3543, "step": 1315 }, { "epoch": 0.04, "learning_rate": 1.6896e-06, "loss": 1.3554, "step": 1320 }, { "epoch": 0.04, "learning_rate": 1.6960000000000002e-06, "loss": 1.3562, "step": 1325 }, { "epoch": 0.04, "learning_rate": 1.7024000000000002e-06, "loss": 1.3566, "step": 1330 }, { "epoch": 0.04, "learning_rate": 1.7088000000000003e-06, "loss": 1.3526, "step": 1335 }, { "epoch": 0.04, "learning_rate": 1.7152000000000001e-06, "loss": 1.3561, "step": 1340 }, { "epoch": 0.04, "learning_rate": 1.7216000000000002e-06, "loss": 1.3588, "step": 1345 }, { "epoch": 0.04, "learning_rate": 1.7280000000000002e-06, "loss": 1.3519, "step": 1350 }, { "epoch": 0.04, "learning_rate": 1.7344000000000003e-06, "loss": 1.3386, "step": 1355 }, { "epoch": 0.04, "learning_rate": 1.7408000000000003e-06, "loss": 1.3567, "step": 1360 }, { "epoch": 0.04, "learning_rate": 1.7472e-06, "loss": 1.3535, "step": 1365 }, { "epoch": 0.04, "learning_rate": 1.7536e-06, "loss": 1.3189, "step": 1370 }, { "epoch": 0.04, "learning_rate": 1.76e-06, "loss": 1.3458, "step": 1375 }, { "epoch": 0.04, "learning_rate": 1.7664000000000001e-06, "loss": 1.3399, "step": 1380 }, { "epoch": 0.04, "learning_rate": 1.7728e-06, "loss": 1.3406, "step": 1385 }, { "epoch": 0.04, "learning_rate": 1.7792e-06, "loss": 1.3407, "step": 1390 }, { "epoch": 0.04, "learning_rate": 1.7856000000000001e-06, "loss": 1.3516, "step": 1395 }, { "epoch": 0.04, "learning_rate": 1.7920000000000002e-06, "loss": 1.3394, "step": 1400 }, { "epoch": 0.04, "learning_rate": 1.7984000000000002e-06, "loss": 1.3431, "step": 1405 }, { "epoch": 0.05, "learning_rate": 1.8048e-06, "loss": 1.3346, "step": 1410 }, { "epoch": 0.05, "learning_rate": 1.8112000000000001e-06, "loss": 1.3364, "step": 1415 }, { "epoch": 0.05, "learning_rate": 1.8176000000000002e-06, "loss": 1.3337, "step": 1420 }, { "epoch": 0.05, "learning_rate": 1.8240000000000002e-06, "loss": 1.3255, "step": 1425 }, { "epoch": 0.05, "learning_rate": 1.8304000000000003e-06, "loss": 1.3376, "step": 1430 }, { "epoch": 0.05, "learning_rate": 1.8368000000000004e-06, "loss": 1.3674, "step": 1435 }, { "epoch": 0.05, "learning_rate": 1.8432000000000002e-06, "loss": 1.3323, "step": 1440 }, { "epoch": 0.05, "learning_rate": 1.8496000000000003e-06, "loss": 1.3244, "step": 1445 }, { "epoch": 0.05, "learning_rate": 1.856e-06, "loss": 1.3328, "step": 1450 }, { "epoch": 0.05, "learning_rate": 1.8624e-06, "loss": 1.3299, "step": 1455 }, { "epoch": 0.05, "learning_rate": 1.8688e-06, "loss": 1.3258, "step": 1460 }, { "epoch": 0.05, "learning_rate": 1.8752e-06, "loss": 1.3274, "step": 1465 }, { "epoch": 0.05, "learning_rate": 1.8816000000000001e-06, "loss": 1.3327, "step": 1470 }, { "epoch": 0.05, "learning_rate": 1.8880000000000002e-06, "loss": 1.3311, "step": 1475 }, { "epoch": 0.05, "learning_rate": 1.8944e-06, "loss": 1.3206, "step": 1480 }, { "epoch": 0.05, "learning_rate": 1.9008e-06, "loss": 1.3196, "step": 1485 }, { "epoch": 0.05, "learning_rate": 1.9072000000000001e-06, "loss": 1.3148, "step": 1490 }, { "epoch": 0.05, "learning_rate": 1.9136e-06, "loss": 1.3196, "step": 1495 }, { "epoch": 0.05, "learning_rate": 1.9200000000000003e-06, "loss": 1.3246, "step": 1500 }, { "epoch": 0.05, "learning_rate": 1.9264000000000003e-06, "loss": 1.3435, "step": 1505 }, { "epoch": 0.05, "learning_rate": 1.9328000000000004e-06, "loss": 1.3225, "step": 1510 }, { "epoch": 0.05, "learning_rate": 1.9392000000000004e-06, "loss": 1.306, "step": 1515 }, { "epoch": 0.05, "learning_rate": 1.9456e-06, "loss": 1.3141, "step": 1520 }, { "epoch": 0.05, "learning_rate": 1.952e-06, "loss": 1.3152, "step": 1525 }, { "epoch": 0.05, "learning_rate": 1.9584e-06, "loss": 1.324, "step": 1530 }, { "epoch": 0.05, "learning_rate": 1.9648000000000002e-06, "loss": 1.3314, "step": 1535 }, { "epoch": 0.05, "learning_rate": 1.9712e-06, "loss": 1.3185, "step": 1540 }, { "epoch": 0.05, "learning_rate": 1.9776e-06, "loss": 1.313, "step": 1545 }, { "epoch": 0.05, "learning_rate": 1.984e-06, "loss": 1.3079, "step": 1550 }, { "epoch": 0.05, "learning_rate": 1.9904e-06, "loss": 1.3119, "step": 1555 }, { "epoch": 0.05, "learning_rate": 1.9968e-06, "loss": 1.3131, "step": 1560 }, { "epoch": 0.05, "learning_rate": 2.0032e-06, "loss": 1.3072, "step": 1565 }, { "epoch": 0.05, "learning_rate": 2.0096e-06, "loss": 1.3082, "step": 1570 }, { "epoch": 0.05, "learning_rate": 2.0160000000000003e-06, "loss": 1.3033, "step": 1575 }, { "epoch": 0.05, "learning_rate": 2.0224000000000003e-06, "loss": 1.3144, "step": 1580 }, { "epoch": 0.05, "learning_rate": 2.0288000000000004e-06, "loss": 1.321, "step": 1585 }, { "epoch": 0.05, "learning_rate": 2.0352000000000004e-06, "loss": 1.3186, "step": 1590 }, { "epoch": 0.05, "learning_rate": 2.0416e-06, "loss": 1.3114, "step": 1595 }, { "epoch": 0.05, "learning_rate": 2.048e-06, "loss": 1.3239, "step": 1600 }, { "epoch": 0.05, "learning_rate": 2.0544e-06, "loss": 1.3137, "step": 1605 }, { "epoch": 0.05, "learning_rate": 2.0608000000000002e-06, "loss": 1.3011, "step": 1610 }, { "epoch": 0.05, "learning_rate": 2.0672e-06, "loss": 1.3122, "step": 1615 }, { "epoch": 0.05, "learning_rate": 2.0736e-06, "loss": 1.32, "step": 1620 }, { "epoch": 0.05, "learning_rate": 2.08e-06, "loss": 1.3039, "step": 1625 }, { "epoch": 0.05, "learning_rate": 2.0864e-06, "loss": 1.3066, "step": 1630 }, { "epoch": 0.05, "learning_rate": 2.0928e-06, "loss": 1.2993, "step": 1635 }, { "epoch": 0.05, "learning_rate": 2.0992e-06, "loss": 1.3151, "step": 1640 }, { "epoch": 0.05, "learning_rate": 2.1056000000000002e-06, "loss": 1.3069, "step": 1645 }, { "epoch": 0.05, "learning_rate": 2.1120000000000003e-06, "loss": 1.287, "step": 1650 }, { "epoch": 0.05, "learning_rate": 2.1184000000000003e-06, "loss": 1.2889, "step": 1655 }, { "epoch": 0.05, "learning_rate": 2.1248000000000004e-06, "loss": 1.3052, "step": 1660 }, { "epoch": 0.05, "learning_rate": 2.1312e-06, "loss": 1.289, "step": 1665 }, { "epoch": 0.05, "learning_rate": 2.1376e-06, "loss": 1.2908, "step": 1670 }, { "epoch": 0.05, "learning_rate": 2.144e-06, "loss": 1.2901, "step": 1675 }, { "epoch": 0.05, "learning_rate": 2.1504e-06, "loss": 1.3023, "step": 1680 }, { "epoch": 0.05, "learning_rate": 2.1568000000000003e-06, "loss": 1.2964, "step": 1685 }, { "epoch": 0.05, "learning_rate": 2.1632000000000003e-06, "loss": 1.3049, "step": 1690 }, { "epoch": 0.05, "learning_rate": 2.1696e-06, "loss": 1.2972, "step": 1695 }, { "epoch": 0.05, "learning_rate": 2.176e-06, "loss": 1.2864, "step": 1700 }, { "epoch": 0.05, "learning_rate": 2.1824e-06, "loss": 1.2845, "step": 1705 }, { "epoch": 0.05, "learning_rate": 2.1888e-06, "loss": 1.2807, "step": 1710 }, { "epoch": 0.05, "learning_rate": 2.1952e-06, "loss": 1.2886, "step": 1715 }, { "epoch": 0.06, "learning_rate": 2.2016000000000002e-06, "loss": 1.2848, "step": 1720 }, { "epoch": 0.06, "learning_rate": 2.2080000000000003e-06, "loss": 1.2882, "step": 1725 }, { "epoch": 0.06, "learning_rate": 2.2144000000000003e-06, "loss": 1.3015, "step": 1730 }, { "epoch": 0.06, "learning_rate": 2.2208e-06, "loss": 1.2901, "step": 1735 }, { "epoch": 0.06, "learning_rate": 2.2272e-06, "loss": 1.3016, "step": 1740 }, { "epoch": 0.06, "learning_rate": 2.2336e-06, "loss": 1.2893, "step": 1745 }, { "epoch": 0.06, "learning_rate": 2.24e-06, "loss": 1.2905, "step": 1750 }, { "epoch": 0.06, "learning_rate": 2.2464e-06, "loss": 1.2711, "step": 1755 }, { "epoch": 0.06, "learning_rate": 2.2528000000000003e-06, "loss": 1.2921, "step": 1760 }, { "epoch": 0.06, "learning_rate": 2.2592000000000003e-06, "loss": 1.2906, "step": 1765 }, { "epoch": 0.06, "learning_rate": 2.2656000000000004e-06, "loss": 1.2853, "step": 1770 }, { "epoch": 0.06, "learning_rate": 2.2720000000000004e-06, "loss": 1.2856, "step": 1775 }, { "epoch": 0.06, "learning_rate": 2.2784e-06, "loss": 1.2741, "step": 1780 }, { "epoch": 0.06, "learning_rate": 2.2848e-06, "loss": 1.2789, "step": 1785 }, { "epoch": 0.06, "learning_rate": 2.2912e-06, "loss": 1.2881, "step": 1790 }, { "epoch": 0.06, "learning_rate": 2.2976000000000002e-06, "loss": 1.2792, "step": 1795 }, { "epoch": 0.06, "learning_rate": 2.3040000000000003e-06, "loss": 1.2765, "step": 1800 }, { "epoch": 0.06, "learning_rate": 2.3104e-06, "loss": 1.2863, "step": 1805 }, { "epoch": 0.06, "learning_rate": 2.3168e-06, "loss": 1.2816, "step": 1810 }, { "epoch": 0.06, "learning_rate": 2.3232e-06, "loss": 1.2886, "step": 1815 }, { "epoch": 0.06, "learning_rate": 2.3296e-06, "loss": 1.2794, "step": 1820 }, { "epoch": 0.06, "learning_rate": 2.336e-06, "loss": 1.2899, "step": 1825 }, { "epoch": 0.06, "learning_rate": 2.3424000000000002e-06, "loss": 1.2895, "step": 1830 }, { "epoch": 0.06, "learning_rate": 2.3488000000000003e-06, "loss": 1.2769, "step": 1835 }, { "epoch": 0.06, "learning_rate": 2.3552000000000003e-06, "loss": 1.2717, "step": 1840 }, { "epoch": 0.06, "learning_rate": 2.3616000000000004e-06, "loss": 1.286, "step": 1845 }, { "epoch": 0.06, "learning_rate": 2.3680000000000005e-06, "loss": 1.2731, "step": 1850 }, { "epoch": 0.06, "learning_rate": 2.3744000000000005e-06, "loss": 1.2753, "step": 1855 }, { "epoch": 0.06, "learning_rate": 2.3808e-06, "loss": 1.2707, "step": 1860 }, { "epoch": 0.06, "learning_rate": 2.3872e-06, "loss": 1.2686, "step": 1865 }, { "epoch": 0.06, "learning_rate": 2.3936000000000003e-06, "loss": 1.2591, "step": 1870 }, { "epoch": 0.06, "learning_rate": 2.4000000000000003e-06, "loss": 1.2777, "step": 1875 }, { "epoch": 0.06, "learning_rate": 2.4064e-06, "loss": 1.2734, "step": 1880 }, { "epoch": 0.06, "learning_rate": 2.4128e-06, "loss": 1.2722, "step": 1885 }, { "epoch": 0.06, "learning_rate": 2.4192e-06, "loss": 1.2717, "step": 1890 }, { "epoch": 0.06, "learning_rate": 2.4256e-06, "loss": 1.2663, "step": 1895 }, { "epoch": 0.06, "learning_rate": 2.432e-06, "loss": 1.2559, "step": 1900 }, { "epoch": 0.06, "learning_rate": 2.4384000000000002e-06, "loss": 1.2556, "step": 1905 }, { "epoch": 0.06, "learning_rate": 2.4448000000000003e-06, "loss": 1.2613, "step": 1910 }, { "epoch": 0.06, "learning_rate": 2.4512000000000003e-06, "loss": 1.2756, "step": 1915 }, { "epoch": 0.06, "learning_rate": 2.4576000000000004e-06, "loss": 1.2729, "step": 1920 }, { "epoch": 0.06, "learning_rate": 2.4640000000000005e-06, "loss": 1.2669, "step": 1925 }, { "epoch": 0.06, "learning_rate": 2.4704e-06, "loss": 1.2571, "step": 1930 }, { "epoch": 0.06, "learning_rate": 2.4768e-06, "loss": 1.2653, "step": 1935 }, { "epoch": 0.06, "learning_rate": 2.4832000000000002e-06, "loss": 1.2534, "step": 1940 }, { "epoch": 0.06, "learning_rate": 2.4896000000000003e-06, "loss": 1.2628, "step": 1945 }, { "epoch": 0.06, "learning_rate": 2.496e-06, "loss": 1.2646, "step": 1950 }, { "epoch": 0.06, "learning_rate": 2.5024000000000004e-06, "loss": 1.2566, "step": 1955 }, { "epoch": 0.06, "learning_rate": 2.5088e-06, "loss": 1.2438, "step": 1960 }, { "epoch": 0.06, "learning_rate": 2.5152000000000005e-06, "loss": 1.2411, "step": 1965 }, { "epoch": 0.06, "learning_rate": 2.5216e-06, "loss": 1.2643, "step": 1970 }, { "epoch": 0.06, "learning_rate": 2.5280000000000006e-06, "loss": 1.2745, "step": 1975 }, { "epoch": 0.06, "learning_rate": 2.5344000000000002e-06, "loss": 1.2538, "step": 1980 }, { "epoch": 0.06, "learning_rate": 2.5408e-06, "loss": 1.2471, "step": 1985 }, { "epoch": 0.06, "learning_rate": 2.5472000000000004e-06, "loss": 1.2642, "step": 1990 }, { "epoch": 0.06, "learning_rate": 2.5536e-06, "loss": 1.2732, "step": 1995 }, { "epoch": 0.06, "learning_rate": 2.56e-06, "loss": 1.2555, "step": 2000 }, { "epoch": 0.06, "learning_rate": 2.5664e-06, "loss": 1.2584, "step": 2005 }, { "epoch": 0.06, "learning_rate": 2.5728e-06, "loss": 1.2624, "step": 2010 }, { "epoch": 0.06, "learning_rate": 2.5792000000000002e-06, "loss": 1.2666, "step": 2015 }, { "epoch": 0.06, "learning_rate": 2.5856000000000003e-06, "loss": 1.2667, "step": 2020 }, { "epoch": 0.06, "learning_rate": 2.592e-06, "loss": 1.2524, "step": 2025 }, { "epoch": 0.06, "learning_rate": 2.5984000000000004e-06, "loss": 1.2653, "step": 2030 }, { "epoch": 0.07, "learning_rate": 2.6048e-06, "loss": 1.2391, "step": 2035 }, { "epoch": 0.07, "learning_rate": 2.6112000000000005e-06, "loss": 1.2605, "step": 2040 }, { "epoch": 0.07, "learning_rate": 2.6176e-06, "loss": 1.2638, "step": 2045 }, { "epoch": 0.07, "learning_rate": 2.6240000000000006e-06, "loss": 1.24, "step": 2050 }, { "epoch": 0.07, "learning_rate": 2.6304000000000003e-06, "loss": 1.2586, "step": 2055 }, { "epoch": 0.07, "learning_rate": 2.6368000000000003e-06, "loss": 1.2442, "step": 2060 }, { "epoch": 0.07, "learning_rate": 2.6432000000000004e-06, "loss": 1.2321, "step": 2065 }, { "epoch": 0.07, "learning_rate": 2.6496e-06, "loss": 1.2437, "step": 2070 }, { "epoch": 0.07, "learning_rate": 2.656e-06, "loss": 1.23, "step": 2075 }, { "epoch": 0.07, "learning_rate": 2.6624e-06, "loss": 1.2537, "step": 2080 }, { "epoch": 0.07, "learning_rate": 2.6688e-06, "loss": 1.2525, "step": 2085 }, { "epoch": 0.07, "learning_rate": 2.6752e-06, "loss": 1.2437, "step": 2090 }, { "epoch": 0.07, "learning_rate": 2.6816000000000003e-06, "loss": 1.2541, "step": 2095 }, { "epoch": 0.07, "learning_rate": 2.688e-06, "loss": 1.2265, "step": 2100 }, { "epoch": 0.07, "learning_rate": 2.6944000000000004e-06, "loss": 1.2541, "step": 2105 }, { "epoch": 0.07, "learning_rate": 2.7008e-06, "loss": 1.2571, "step": 2110 }, { "epoch": 0.07, "learning_rate": 2.7072000000000005e-06, "loss": 1.2479, "step": 2115 }, { "epoch": 0.07, "learning_rate": 2.7136e-06, "loss": 1.2528, "step": 2120 }, { "epoch": 0.07, "learning_rate": 2.7200000000000002e-06, "loss": 1.2432, "step": 2125 }, { "epoch": 0.07, "learning_rate": 2.7264000000000003e-06, "loss": 1.237, "step": 2130 }, { "epoch": 0.07, "learning_rate": 2.7328000000000003e-06, "loss": 1.2459, "step": 2135 }, { "epoch": 0.07, "learning_rate": 2.7392000000000004e-06, "loss": 1.2423, "step": 2140 }, { "epoch": 0.07, "learning_rate": 2.7456000000000004e-06, "loss": 1.2416, "step": 2145 }, { "epoch": 0.07, "learning_rate": 2.752e-06, "loss": 1.2512, "step": 2150 }, { "epoch": 0.07, "learning_rate": 2.7584e-06, "loss": 1.2458, "step": 2155 }, { "epoch": 0.07, "learning_rate": 2.7648e-06, "loss": 1.2427, "step": 2160 }, { "epoch": 0.07, "learning_rate": 2.7712e-06, "loss": 1.2336, "step": 2165 }, { "epoch": 0.07, "learning_rate": 2.7776000000000003e-06, "loss": 1.2215, "step": 2170 }, { "epoch": 0.07, "learning_rate": 2.784e-06, "loss": 1.2381, "step": 2175 }, { "epoch": 0.07, "learning_rate": 2.7904000000000004e-06, "loss": 1.2487, "step": 2180 }, { "epoch": 0.07, "learning_rate": 2.7968e-06, "loss": 1.224, "step": 2185 }, { "epoch": 0.07, "learning_rate": 2.8032000000000005e-06, "loss": 1.2525, "step": 2190 }, { "epoch": 0.07, "learning_rate": 2.8096e-06, "loss": 1.2341, "step": 2195 }, { "epoch": 0.07, "learning_rate": 2.8160000000000002e-06, "loss": 1.239, "step": 2200 }, { "epoch": 0.07, "learning_rate": 2.8224000000000003e-06, "loss": 1.2339, "step": 2205 }, { "epoch": 0.07, "learning_rate": 2.8288000000000003e-06, "loss": 1.2117, "step": 2210 }, { "epoch": 0.07, "learning_rate": 2.8352e-06, "loss": 1.2403, "step": 2215 }, { "epoch": 0.07, "learning_rate": 2.8416000000000005e-06, "loss": 1.2507, "step": 2220 }, { "epoch": 0.07, "learning_rate": 2.848e-06, "loss": 1.2251, "step": 2225 }, { "epoch": 0.07, "learning_rate": 2.8544000000000006e-06, "loss": 1.2322, "step": 2230 }, { "epoch": 0.07, "learning_rate": 2.8608e-06, "loss": 1.2348, "step": 2235 }, { "epoch": 0.07, "learning_rate": 2.8672e-06, "loss": 1.2391, "step": 2240 }, { "epoch": 0.07, "learning_rate": 2.8736000000000003e-06, "loss": 1.2185, "step": 2245 }, { "epoch": 0.07, "learning_rate": 2.88e-06, "loss": 1.2274, "step": 2250 }, { "epoch": 0.07, "learning_rate": 2.8864000000000004e-06, "loss": 1.2261, "step": 2255 }, { "epoch": 0.07, "learning_rate": 2.8928e-06, "loss": 1.2378, "step": 2260 }, { "epoch": 0.07, "learning_rate": 2.8992000000000005e-06, "loss": 1.2204, "step": 2265 }, { "epoch": 0.07, "learning_rate": 2.9056e-06, "loss": 1.2223, "step": 2270 }, { "epoch": 0.07, "learning_rate": 2.9120000000000002e-06, "loss": 1.2175, "step": 2275 }, { "epoch": 0.07, "learning_rate": 2.9184000000000003e-06, "loss": 1.2354, "step": 2280 }, { "epoch": 0.07, "learning_rate": 2.9248000000000004e-06, "loss": 1.2295, "step": 2285 }, { "epoch": 0.07, "learning_rate": 2.9312e-06, "loss": 1.2229, "step": 2290 }, { "epoch": 0.07, "learning_rate": 2.9376000000000005e-06, "loss": 1.233, "step": 2295 }, { "epoch": 0.07, "learning_rate": 2.944e-06, "loss": 1.2283, "step": 2300 }, { "epoch": 0.07, "learning_rate": 2.9504000000000006e-06, "loss": 1.2305, "step": 2305 }, { "epoch": 0.07, "learning_rate": 2.9568000000000002e-06, "loss": 1.2257, "step": 2310 }, { "epoch": 0.07, "learning_rate": 2.9632e-06, "loss": 1.2202, "step": 2315 }, { "epoch": 0.07, "learning_rate": 2.9696000000000003e-06, "loss": 1.2102, "step": 2320 }, { "epoch": 0.07, "learning_rate": 2.976e-06, "loss": 1.2338, "step": 2325 }, { "epoch": 0.07, "learning_rate": 2.9824000000000004e-06, "loss": 1.2201, "step": 2330 }, { "epoch": 0.07, "learning_rate": 2.9888e-06, "loss": 1.211, "step": 2335 }, { "epoch": 0.07, "learning_rate": 2.9952e-06, "loss": 1.2137, "step": 2340 }, { "epoch": 0.08, "learning_rate": 3.0016e-06, "loss": 1.2248, "step": 2345 }, { "epoch": 0.08, "learning_rate": 3.0080000000000003e-06, "loss": 1.2224, "step": 2350 }, { "epoch": 0.08, "learning_rate": 3.0144000000000003e-06, "loss": 1.2241, "step": 2355 }, { "epoch": 0.08, "learning_rate": 3.0208000000000004e-06, "loss": 1.2072, "step": 2360 }, { "epoch": 0.08, "learning_rate": 3.0272e-06, "loss": 1.2214, "step": 2365 }, { "epoch": 0.08, "learning_rate": 3.0336000000000005e-06, "loss": 1.1977, "step": 2370 }, { "epoch": 0.08, "learning_rate": 3.04e-06, "loss": 1.2086, "step": 2375 }, { "epoch": 0.08, "learning_rate": 3.0464000000000006e-06, "loss": 1.2131, "step": 2380 }, { "epoch": 0.08, "learning_rate": 3.0528000000000002e-06, "loss": 1.2349, "step": 2385 }, { "epoch": 0.08, "learning_rate": 3.0592000000000007e-06, "loss": 1.2279, "step": 2390 }, { "epoch": 0.08, "learning_rate": 3.0656000000000003e-06, "loss": 1.2228, "step": 2395 }, { "epoch": 0.08, "learning_rate": 3.072e-06, "loss": 1.2292, "step": 2400 }, { "epoch": 0.08, "learning_rate": 3.0784000000000005e-06, "loss": 1.2195, "step": 2405 }, { "epoch": 0.08, "learning_rate": 3.0848e-06, "loss": 1.2181, "step": 2410 }, { "epoch": 0.08, "learning_rate": 3.0912e-06, "loss": 1.2208, "step": 2415 }, { "epoch": 0.08, "learning_rate": 3.0976e-06, "loss": 1.2104, "step": 2420 }, { "epoch": 0.08, "learning_rate": 3.1040000000000003e-06, "loss": 1.2094, "step": 2425 }, { "epoch": 0.08, "learning_rate": 3.1104e-06, "loss": 1.2127, "step": 2430 }, { "epoch": 0.08, "learning_rate": 3.1168000000000004e-06, "loss": 1.2238, "step": 2435 }, { "epoch": 0.08, "learning_rate": 3.1232e-06, "loss": 1.2172, "step": 2440 }, { "epoch": 0.08, "learning_rate": 3.1296000000000005e-06, "loss": 1.2101, "step": 2445 }, { "epoch": 0.08, "learning_rate": 3.136e-06, "loss": 1.2164, "step": 2450 }, { "epoch": 0.08, "learning_rate": 3.1424000000000006e-06, "loss": 1.2118, "step": 2455 }, { "epoch": 0.08, "learning_rate": 3.1488000000000002e-06, "loss": 1.2142, "step": 2460 }, { "epoch": 0.08, "learning_rate": 3.1552000000000003e-06, "loss": 1.2087, "step": 2465 }, { "epoch": 0.08, "learning_rate": 3.1616000000000004e-06, "loss": 1.2323, "step": 2470 }, { "epoch": 0.08, "learning_rate": 3.1680000000000004e-06, "loss": 1.2207, "step": 2475 }, { "epoch": 0.08, "learning_rate": 3.1744e-06, "loss": 1.2257, "step": 2480 }, { "epoch": 0.08, "learning_rate": 3.1808e-06, "loss": 1.1972, "step": 2485 }, { "epoch": 0.08, "learning_rate": 3.1872e-06, "loss": 1.2023, "step": 2490 }, { "epoch": 0.08, "learning_rate": 3.1936000000000002e-06, "loss": 1.2067, "step": 2495 }, { "epoch": 0.08, "learning_rate": 3.2000000000000003e-06, "loss": 1.2064, "step": 2500 }, { "epoch": 0.08, "learning_rate": 3.2064e-06, "loss": 1.2167, "step": 2505 }, { "epoch": 0.08, "learning_rate": 3.2128000000000004e-06, "loss": 1.2108, "step": 2510 }, { "epoch": 0.08, "learning_rate": 3.2192e-06, "loss": 1.2102, "step": 2515 }, { "epoch": 0.08, "learning_rate": 3.2256000000000005e-06, "loss": 1.2149, "step": 2520 }, { "epoch": 0.08, "learning_rate": 3.232e-06, "loss": 1.2085, "step": 2525 }, { "epoch": 0.08, "learning_rate": 3.2384000000000006e-06, "loss": 1.2, "step": 2530 }, { "epoch": 0.08, "learning_rate": 3.2448000000000003e-06, "loss": 1.2016, "step": 2535 }, { "epoch": 0.08, "learning_rate": 3.2512000000000003e-06, "loss": 1.2142, "step": 2540 }, { "epoch": 0.08, "learning_rate": 3.2576000000000004e-06, "loss": 1.2163, "step": 2545 }, { "epoch": 0.08, "learning_rate": 3.2640000000000004e-06, "loss": 1.2028, "step": 2550 }, { "epoch": 0.08, "learning_rate": 3.2704e-06, "loss": 1.1994, "step": 2555 }, { "epoch": 0.08, "learning_rate": 3.2768000000000005e-06, "loss": 1.1973, "step": 2560 }, { "epoch": 0.08, "learning_rate": 3.2832e-06, "loss": 1.2048, "step": 2565 }, { "epoch": 0.08, "learning_rate": 3.2896e-06, "loss": 1.1863, "step": 2570 }, { "epoch": 0.08, "learning_rate": 3.2960000000000003e-06, "loss": 1.2074, "step": 2575 }, { "epoch": 0.08, "learning_rate": 3.3024e-06, "loss": 1.2108, "step": 2580 }, { "epoch": 0.08, "learning_rate": 3.3088000000000004e-06, "loss": 1.2082, "step": 2585 }, { "epoch": 0.08, "learning_rate": 3.3152e-06, "loss": 1.1918, "step": 2590 }, { "epoch": 0.08, "learning_rate": 3.3216000000000005e-06, "loss": 1.2178, "step": 2595 }, { "epoch": 0.08, "learning_rate": 3.328e-06, "loss": 1.1889, "step": 2600 }, { "epoch": 0.08, "learning_rate": 3.3344e-06, "loss": 1.2029, "step": 2605 }, { "epoch": 0.08, "learning_rate": 3.3408000000000003e-06, "loss": 1.2069, "step": 2610 }, { "epoch": 0.08, "learning_rate": 3.3472000000000003e-06, "loss": 1.2117, "step": 2615 }, { "epoch": 0.08, "learning_rate": 3.3536000000000004e-06, "loss": 1.2043, "step": 2620 }, { "epoch": 0.08, "learning_rate": 3.3600000000000004e-06, "loss": 1.1912, "step": 2625 }, { "epoch": 0.08, "learning_rate": 3.3664e-06, "loss": 1.1852, "step": 2630 }, { "epoch": 0.08, "learning_rate": 3.3728000000000006e-06, "loss": 1.2023, "step": 2635 }, { "epoch": 0.08, "learning_rate": 3.3792e-06, "loss": 1.1801, "step": 2640 }, { "epoch": 0.08, "learning_rate": 3.3856000000000007e-06, "loss": 1.204, "step": 2645 }, { "epoch": 0.08, "learning_rate": 3.3920000000000003e-06, "loss": 1.2159, "step": 2650 }, { "epoch": 0.08, "learning_rate": 3.3984e-06, "loss": 1.1923, "step": 2655 }, { "epoch": 0.09, "learning_rate": 3.4048000000000004e-06, "loss": 1.1966, "step": 2660 }, { "epoch": 0.09, "learning_rate": 3.4112e-06, "loss": 1.1846, "step": 2665 }, { "epoch": 0.09, "learning_rate": 3.4176000000000005e-06, "loss": 1.1846, "step": 2670 }, { "epoch": 0.09, "learning_rate": 3.424e-06, "loss": 1.1758, "step": 2675 }, { "epoch": 0.09, "learning_rate": 3.4304000000000002e-06, "loss": 1.1757, "step": 2680 }, { "epoch": 0.09, "learning_rate": 3.4368000000000003e-06, "loss": 1.1903, "step": 2685 }, { "epoch": 0.09, "learning_rate": 3.4432000000000003e-06, "loss": 1.1876, "step": 2690 }, { "epoch": 0.09, "learning_rate": 3.4496e-06, "loss": 1.1803, "step": 2695 }, { "epoch": 0.09, "learning_rate": 3.4560000000000005e-06, "loss": 1.1645, "step": 2700 }, { "epoch": 0.09, "learning_rate": 3.4624e-06, "loss": 1.1897, "step": 2705 }, { "epoch": 0.09, "learning_rate": 3.4688000000000006e-06, "loss": 1.1921, "step": 2710 }, { "epoch": 0.09, "learning_rate": 3.4752e-06, "loss": 1.1884, "step": 2715 }, { "epoch": 0.09, "learning_rate": 3.4816000000000007e-06, "loss": 1.1819, "step": 2720 }, { "epoch": 0.09, "learning_rate": 3.4880000000000003e-06, "loss": 1.1808, "step": 2725 }, { "epoch": 0.09, "learning_rate": 3.4944e-06, "loss": 1.1762, "step": 2730 }, { "epoch": 0.09, "learning_rate": 3.5008000000000004e-06, "loss": 1.1973, "step": 2735 }, { "epoch": 0.09, "learning_rate": 3.5072e-06, "loss": 1.174, "step": 2740 }, { "epoch": 0.09, "learning_rate": 3.5136000000000005e-06, "loss": 1.2014, "step": 2745 }, { "epoch": 0.09, "learning_rate": 3.52e-06, "loss": 1.1842, "step": 2750 }, { "epoch": 0.09, "learning_rate": 3.5264000000000002e-06, "loss": 1.1756, "step": 2755 }, { "epoch": 0.09, "learning_rate": 3.5328000000000003e-06, "loss": 1.1707, "step": 2760 }, { "epoch": 0.09, "learning_rate": 3.5392000000000004e-06, "loss": 1.1843, "step": 2765 }, { "epoch": 0.09, "learning_rate": 3.5456e-06, "loss": 1.1768, "step": 2770 }, { "epoch": 0.09, "learning_rate": 3.5520000000000005e-06, "loss": 1.1657, "step": 2775 }, { "epoch": 0.09, "learning_rate": 3.5584e-06, "loss": 1.187, "step": 2780 }, { "epoch": 0.09, "learning_rate": 3.5648000000000006e-06, "loss": 1.1849, "step": 2785 }, { "epoch": 0.09, "learning_rate": 3.5712000000000002e-06, "loss": 1.1726, "step": 2790 }, { "epoch": 0.09, "learning_rate": 3.5776000000000007e-06, "loss": 1.1715, "step": 2795 }, { "epoch": 0.09, "learning_rate": 3.5840000000000003e-06, "loss": 1.1893, "step": 2800 }, { "epoch": 0.09, "learning_rate": 3.5904000000000004e-06, "loss": 1.1647, "step": 2805 }, { "epoch": 0.09, "learning_rate": 3.5968000000000004e-06, "loss": 1.1998, "step": 2810 }, { "epoch": 0.09, "learning_rate": 3.6032e-06, "loss": 1.1876, "step": 2815 }, { "epoch": 0.09, "learning_rate": 3.6096e-06, "loss": 1.1954, "step": 2820 }, { "epoch": 0.09, "learning_rate": 3.616e-06, "loss": 1.1815, "step": 2825 }, { "epoch": 0.09, "learning_rate": 3.6224000000000002e-06, "loss": 1.1883, "step": 2830 }, { "epoch": 0.09, "learning_rate": 3.6288000000000003e-06, "loss": 1.1937, "step": 2835 }, { "epoch": 0.09, "learning_rate": 3.6352000000000004e-06, "loss": 1.1706, "step": 2840 }, { "epoch": 0.09, "learning_rate": 3.6416e-06, "loss": 1.1839, "step": 2845 }, { "epoch": 0.09, "learning_rate": 3.6480000000000005e-06, "loss": 1.1614, "step": 2850 }, { "epoch": 0.09, "learning_rate": 3.6544e-06, "loss": 1.1787, "step": 2855 }, { "epoch": 0.09, "learning_rate": 3.6608000000000006e-06, "loss": 1.182, "step": 2860 }, { "epoch": 0.09, "learning_rate": 3.6672000000000002e-06, "loss": 1.1826, "step": 2865 }, { "epoch": 0.09, "learning_rate": 3.6736000000000007e-06, "loss": 1.1771, "step": 2870 }, { "epoch": 0.09, "learning_rate": 3.6800000000000003e-06, "loss": 1.1878, "step": 2875 }, { "epoch": 0.09, "learning_rate": 3.6864000000000004e-06, "loss": 1.1823, "step": 2880 }, { "epoch": 0.09, "learning_rate": 3.6928000000000005e-06, "loss": 1.1782, "step": 2885 }, { "epoch": 0.09, "learning_rate": 3.6992000000000005e-06, "loss": 1.1768, "step": 2890 }, { "epoch": 0.09, "learning_rate": 3.7056e-06, "loss": 1.1898, "step": 2895 }, { "epoch": 0.09, "learning_rate": 3.712e-06, "loss": 1.1775, "step": 2900 }, { "epoch": 0.09, "learning_rate": 3.7184000000000003e-06, "loss": 1.1724, "step": 2905 }, { "epoch": 0.09, "learning_rate": 3.7248e-06, "loss": 1.1498, "step": 2910 }, { "epoch": 0.09, "learning_rate": 3.7312000000000004e-06, "loss": 1.1684, "step": 2915 }, { "epoch": 0.09, "learning_rate": 3.7376e-06, "loss": 1.1571, "step": 2920 }, { "epoch": 0.09, "learning_rate": 3.7440000000000005e-06, "loss": 1.1717, "step": 2925 }, { "epoch": 0.09, "learning_rate": 3.7504e-06, "loss": 1.1754, "step": 2930 }, { "epoch": 0.09, "learning_rate": 3.7568000000000006e-06, "loss": 1.155, "step": 2935 }, { "epoch": 0.09, "learning_rate": 3.7632000000000002e-06, "loss": 1.1626, "step": 2940 }, { "epoch": 0.09, "learning_rate": 3.7696000000000003e-06, "loss": 1.1724, "step": 2945 }, { "epoch": 0.09, "learning_rate": 3.7760000000000004e-06, "loss": 1.1635, "step": 2950 }, { "epoch": 0.09, "learning_rate": 3.7824000000000004e-06, "loss": 1.1543, "step": 2955 }, { "epoch": 0.09, "learning_rate": 3.7888e-06, "loss": 1.1759, "step": 2960 }, { "epoch": 0.09, "learning_rate": 3.7952000000000005e-06, "loss": 1.1561, "step": 2965 }, { "epoch": 0.1, "learning_rate": 3.8016e-06, "loss": 1.1785, "step": 2970 }, { "epoch": 0.1, "learning_rate": 3.8080000000000006e-06, "loss": 1.1688, "step": 2975 }, { "epoch": 0.1, "learning_rate": 3.8144000000000003e-06, "loss": 1.1759, "step": 2980 }, { "epoch": 0.1, "learning_rate": 3.8208e-06, "loss": 1.1705, "step": 2985 }, { "epoch": 0.1, "learning_rate": 3.8272e-06, "loss": 1.1588, "step": 2990 }, { "epoch": 0.1, "learning_rate": 3.8336e-06, "loss": 1.1631, "step": 2995 }, { "epoch": 0.1, "learning_rate": 3.8400000000000005e-06, "loss": 1.1649, "step": 3000 }, { "epoch": 0.1, "learning_rate": 3.8464e-06, "loss": 1.1778, "step": 3005 }, { "epoch": 0.1, "learning_rate": 3.852800000000001e-06, "loss": 1.1691, "step": 3010 }, { "epoch": 0.1, "learning_rate": 3.8592e-06, "loss": 1.1603, "step": 3015 }, { "epoch": 0.1, "learning_rate": 3.865600000000001e-06, "loss": 1.1672, "step": 3020 }, { "epoch": 0.1, "learning_rate": 3.872e-06, "loss": 1.1635, "step": 3025 }, { "epoch": 0.1, "learning_rate": 3.878400000000001e-06, "loss": 1.1661, "step": 3030 }, { "epoch": 0.1, "learning_rate": 3.8848000000000005e-06, "loss": 1.1561, "step": 3035 }, { "epoch": 0.1, "learning_rate": 3.8912e-06, "loss": 1.1639, "step": 3040 }, { "epoch": 0.1, "learning_rate": 3.897600000000001e-06, "loss": 1.17, "step": 3045 }, { "epoch": 0.1, "learning_rate": 3.904e-06, "loss": 1.1514, "step": 3050 }, { "epoch": 0.1, "learning_rate": 3.910400000000001e-06, "loss": 1.1704, "step": 3055 }, { "epoch": 0.1, "learning_rate": 3.9168e-06, "loss": 1.1664, "step": 3060 }, { "epoch": 0.1, "learning_rate": 3.9232e-06, "loss": 1.1543, "step": 3065 }, { "epoch": 0.1, "learning_rate": 3.9296000000000005e-06, "loss": 1.1462, "step": 3070 }, { "epoch": 0.1, "learning_rate": 3.936e-06, "loss": 1.1662, "step": 3075 }, { "epoch": 0.1, "learning_rate": 3.9424e-06, "loss": 1.1567, "step": 3080 }, { "epoch": 0.1, "learning_rate": 3.9488e-06, "loss": 1.1523, "step": 3085 }, { "epoch": 0.1, "learning_rate": 3.9552e-06, "loss": 1.1354, "step": 3090 }, { "epoch": 0.1, "learning_rate": 3.9616e-06, "loss": 1.1616, "step": 3095 }, { "epoch": 0.1, "learning_rate": 3.968e-06, "loss": 1.1584, "step": 3100 }, { "epoch": 0.1, "learning_rate": 3.9744000000000004e-06, "loss": 1.1478, "step": 3105 }, { "epoch": 0.1, "learning_rate": 3.9808e-06, "loss": 1.1562, "step": 3110 }, { "epoch": 0.1, "learning_rate": 3.9872000000000006e-06, "loss": 1.157, "step": 3115 }, { "epoch": 0.1, "learning_rate": 3.9936e-06, "loss": 1.1639, "step": 3120 }, { "epoch": 0.1, "learning_rate": 4.000000000000001e-06, "loss": 1.1421, "step": 3125 }, { "epoch": 0.1, "learning_rate": 4.0064e-06, "loss": 1.1459, "step": 3130 }, { "epoch": 0.1, "learning_rate": 4.012800000000001e-06, "loss": 1.159, "step": 3135 }, { "epoch": 0.1, "learning_rate": 4.0192e-06, "loss": 1.1462, "step": 3140 }, { "epoch": 0.1, "learning_rate": 4.0256e-06, "loss": 1.1504, "step": 3145 }, { "epoch": 0.1, "learning_rate": 4.0320000000000005e-06, "loss": 1.1537, "step": 3150 }, { "epoch": 0.1, "learning_rate": 4.0384e-06, "loss": 1.1426, "step": 3155 }, { "epoch": 0.1, "learning_rate": 4.044800000000001e-06, "loss": 1.1658, "step": 3160 }, { "epoch": 0.1, "learning_rate": 4.0512e-06, "loss": 1.1394, "step": 3165 }, { "epoch": 0.1, "learning_rate": 4.057600000000001e-06, "loss": 1.1534, "step": 3170 }, { "epoch": 0.1, "learning_rate": 4.064e-06, "loss": 1.1461, "step": 3175 }, { "epoch": 0.1, "learning_rate": 4.070400000000001e-06, "loss": 1.1534, "step": 3180 }, { "epoch": 0.1, "learning_rate": 4.0768000000000005e-06, "loss": 1.1479, "step": 3185 }, { "epoch": 0.1, "learning_rate": 4.0832e-06, "loss": 1.1521, "step": 3190 }, { "epoch": 0.1, "learning_rate": 4.089600000000001e-06, "loss": 1.1643, "step": 3195 }, { "epoch": 0.1, "learning_rate": 4.096e-06, "loss": 1.1591, "step": 3200 }, { "epoch": 0.1, "learning_rate": 4.1024e-06, "loss": 1.1489, "step": 3205 }, { "epoch": 0.1, "learning_rate": 4.1088e-06, "loss": 1.1445, "step": 3210 }, { "epoch": 0.1, "learning_rate": 4.1152e-06, "loss": 1.1613, "step": 3215 }, { "epoch": 0.1, "learning_rate": 4.1216000000000005e-06, "loss": 1.1436, "step": 3220 }, { "epoch": 0.1, "learning_rate": 4.128e-06, "loss": 1.1523, "step": 3225 }, { "epoch": 0.1, "learning_rate": 4.1344e-06, "loss": 1.1571, "step": 3230 }, { "epoch": 0.1, "learning_rate": 4.1408e-06, "loss": 1.1565, "step": 3235 }, { "epoch": 0.1, "learning_rate": 4.1472e-06, "loss": 1.1406, "step": 3240 }, { "epoch": 0.1, "learning_rate": 4.1536e-06, "loss": 1.1499, "step": 3245 }, { "epoch": 0.1, "learning_rate": 4.16e-06, "loss": 1.1654, "step": 3250 }, { "epoch": 0.1, "learning_rate": 4.1664000000000005e-06, "loss": 1.156, "step": 3255 }, { "epoch": 0.1, "learning_rate": 4.1728e-06, "loss": 1.1513, "step": 3260 }, { "epoch": 0.1, "learning_rate": 4.179200000000001e-06, "loss": 1.1289, "step": 3265 }, { "epoch": 0.1, "learning_rate": 4.1856e-06, "loss": 1.1543, "step": 3270 }, { "epoch": 0.1, "learning_rate": 4.192000000000001e-06, "loss": 1.1429, "step": 3275 }, { "epoch": 0.1, "learning_rate": 4.1984e-06, "loss": 1.1467, "step": 3280 }, { "epoch": 0.11, "learning_rate": 4.204800000000001e-06, "loss": 1.1308, "step": 3285 }, { "epoch": 0.11, "learning_rate": 4.2112000000000004e-06, "loss": 1.141, "step": 3290 }, { "epoch": 0.11, "learning_rate": 4.217600000000001e-06, "loss": 1.1566, "step": 3295 }, { "epoch": 0.11, "learning_rate": 4.2240000000000006e-06, "loss": 1.1493, "step": 3300 }, { "epoch": 0.11, "learning_rate": 4.230400000000001e-06, "loss": 1.1438, "step": 3305 }, { "epoch": 0.11, "learning_rate": 4.236800000000001e-06, "loss": 1.1448, "step": 3310 }, { "epoch": 0.11, "learning_rate": 4.2432e-06, "loss": 1.1433, "step": 3315 }, { "epoch": 0.11, "learning_rate": 4.249600000000001e-06, "loss": 1.1533, "step": 3320 }, { "epoch": 0.11, "learning_rate": 4.256e-06, "loss": 1.1174, "step": 3325 }, { "epoch": 0.11, "learning_rate": 4.2624e-06, "loss": 1.1375, "step": 3330 }, { "epoch": 0.11, "learning_rate": 4.2688000000000005e-06, "loss": 1.1547, "step": 3335 }, { "epoch": 0.11, "learning_rate": 4.2752e-06, "loss": 1.1384, "step": 3340 }, { "epoch": 0.11, "learning_rate": 4.2816e-06, "loss": 1.1429, "step": 3345 }, { "epoch": 0.11, "learning_rate": 4.288e-06, "loss": 1.1531, "step": 3350 }, { "epoch": 0.11, "learning_rate": 4.2944e-06, "loss": 1.1459, "step": 3355 }, { "epoch": 0.11, "learning_rate": 4.3008e-06, "loss": 1.1463, "step": 3360 }, { "epoch": 0.11, "learning_rate": 4.3072e-06, "loss": 1.1342, "step": 3365 }, { "epoch": 0.11, "learning_rate": 4.3136000000000005e-06, "loss": 1.1486, "step": 3370 }, { "epoch": 0.11, "learning_rate": 4.32e-06, "loss": 1.1343, "step": 3375 }, { "epoch": 0.11, "learning_rate": 4.326400000000001e-06, "loss": 1.1653, "step": 3380 }, { "epoch": 0.11, "learning_rate": 4.3328e-06, "loss": 1.1446, "step": 3385 }, { "epoch": 0.11, "learning_rate": 4.3392e-06, "loss": 1.1291, "step": 3390 }, { "epoch": 0.11, "learning_rate": 4.3456e-06, "loss": 1.1394, "step": 3395 }, { "epoch": 0.11, "learning_rate": 4.352e-06, "loss": 1.1315, "step": 3400 }, { "epoch": 0.11, "learning_rate": 4.3584000000000005e-06, "loss": 1.1552, "step": 3405 }, { "epoch": 0.11, "learning_rate": 4.3648e-06, "loss": 1.1299, "step": 3410 }, { "epoch": 0.11, "learning_rate": 4.371200000000001e-06, "loss": 1.1531, "step": 3415 }, { "epoch": 0.11, "learning_rate": 4.3776e-06, "loss": 1.1364, "step": 3420 }, { "epoch": 0.11, "learning_rate": 4.384000000000001e-06, "loss": 1.1519, "step": 3425 }, { "epoch": 0.11, "learning_rate": 4.3904e-06, "loss": 1.1627, "step": 3430 }, { "epoch": 0.11, "learning_rate": 4.396800000000001e-06, "loss": 1.1275, "step": 3435 }, { "epoch": 0.11, "learning_rate": 4.4032000000000005e-06, "loss": 1.1364, "step": 3440 }, { "epoch": 0.11, "learning_rate": 4.409600000000001e-06, "loss": 1.1411, "step": 3445 }, { "epoch": 0.11, "learning_rate": 4.416000000000001e-06, "loss": 1.1468, "step": 3450 }, { "epoch": 0.11, "learning_rate": 4.4224e-06, "loss": 1.1503, "step": 3455 }, { "epoch": 0.11, "learning_rate": 4.428800000000001e-06, "loss": 1.1438, "step": 3460 }, { "epoch": 0.11, "learning_rate": 4.4352e-06, "loss": 1.1409, "step": 3465 }, { "epoch": 0.11, "learning_rate": 4.4416e-06, "loss": 1.137, "step": 3470 }, { "epoch": 0.11, "learning_rate": 4.4480000000000004e-06, "loss": 1.1411, "step": 3475 }, { "epoch": 0.11, "learning_rate": 4.4544e-06, "loss": 1.1438, "step": 3480 }, { "epoch": 0.11, "learning_rate": 4.4608e-06, "loss": 1.1329, "step": 3485 }, { "epoch": 0.11, "learning_rate": 4.4672e-06, "loss": 1.1356, "step": 3490 }, { "epoch": 0.11, "learning_rate": 4.4736e-06, "loss": 1.1393, "step": 3495 }, { "epoch": 0.11, "learning_rate": 4.48e-06, "loss": 1.1279, "step": 3500 }, { "epoch": 0.11, "learning_rate": 4.4864e-06, "loss": 1.1393, "step": 3505 }, { "epoch": 0.11, "learning_rate": 4.4928e-06, "loss": 1.1309, "step": 3510 }, { "epoch": 0.11, "learning_rate": 4.4992e-06, "loss": 1.1427, "step": 3515 }, { "epoch": 0.11, "learning_rate": 4.5056000000000005e-06, "loss": 1.1188, "step": 3520 }, { "epoch": 0.11, "learning_rate": 4.512e-06, "loss": 1.1333, "step": 3525 }, { "epoch": 0.11, "learning_rate": 4.518400000000001e-06, "loss": 1.1416, "step": 3530 }, { "epoch": 0.11, "learning_rate": 4.5248e-06, "loss": 1.1093, "step": 3535 }, { "epoch": 0.11, "learning_rate": 4.531200000000001e-06, "loss": 1.1195, "step": 3540 }, { "epoch": 0.11, "learning_rate": 4.5376e-06, "loss": 1.1359, "step": 3545 }, { "epoch": 0.11, "learning_rate": 4.544000000000001e-06, "loss": 1.144, "step": 3550 }, { "epoch": 0.11, "learning_rate": 4.5504000000000005e-06, "loss": 1.1411, "step": 3555 }, { "epoch": 0.11, "learning_rate": 4.5568e-06, "loss": 1.1247, "step": 3560 }, { "epoch": 0.11, "learning_rate": 4.563200000000001e-06, "loss": 1.1356, "step": 3565 }, { "epoch": 0.11, "learning_rate": 4.5696e-06, "loss": 1.1362, "step": 3570 }, { "epoch": 0.11, "learning_rate": 4.576000000000001e-06, "loss": 1.1328, "step": 3575 }, { "epoch": 0.11, "learning_rate": 4.5824e-06, "loss": 1.1421, "step": 3580 }, { "epoch": 0.11, "learning_rate": 4.588800000000001e-06, "loss": 1.1389, "step": 3585 }, { "epoch": 0.11, "learning_rate": 4.5952000000000005e-06, "loss": 1.1264, "step": 3590 }, { "epoch": 0.12, "learning_rate": 4.6016e-06, "loss": 1.1168, "step": 3595 }, { "epoch": 0.12, "learning_rate": 4.608000000000001e-06, "loss": 1.1224, "step": 3600 }, { "epoch": 0.12, "learning_rate": 4.6144e-06, "loss": 1.1276, "step": 3605 }, { "epoch": 0.12, "learning_rate": 4.6208e-06, "loss": 1.1343, "step": 3610 }, { "epoch": 0.12, "learning_rate": 4.6272e-06, "loss": 1.1517, "step": 3615 }, { "epoch": 0.12, "learning_rate": 4.6336e-06, "loss": 1.1194, "step": 3620 }, { "epoch": 0.12, "learning_rate": 4.6400000000000005e-06, "loss": 1.1175, "step": 3625 }, { "epoch": 0.12, "learning_rate": 4.6464e-06, "loss": 1.1301, "step": 3630 }, { "epoch": 0.12, "learning_rate": 4.652800000000001e-06, "loss": 1.1385, "step": 3635 }, { "epoch": 0.12, "learning_rate": 4.6592e-06, "loss": 1.1304, "step": 3640 }, { "epoch": 0.12, "learning_rate": 4.6656e-06, "loss": 1.13, "step": 3645 }, { "epoch": 0.12, "learning_rate": 4.672e-06, "loss": 1.136, "step": 3650 }, { "epoch": 0.12, "learning_rate": 4.6784e-06, "loss": 1.13, "step": 3655 }, { "epoch": 0.12, "learning_rate": 4.6848000000000004e-06, "loss": 1.1171, "step": 3660 }, { "epoch": 0.12, "learning_rate": 4.6912e-06, "loss": 1.117, "step": 3665 }, { "epoch": 0.12, "learning_rate": 4.6976000000000006e-06, "loss": 1.1348, "step": 3670 }, { "epoch": 0.12, "learning_rate": 4.704e-06, "loss": 1.1202, "step": 3675 }, { "epoch": 0.12, "learning_rate": 4.710400000000001e-06, "loss": 1.1244, "step": 3680 }, { "epoch": 0.12, "learning_rate": 4.7168e-06, "loss": 1.129, "step": 3685 }, { "epoch": 0.12, "learning_rate": 4.723200000000001e-06, "loss": 1.1281, "step": 3690 }, { "epoch": 0.12, "learning_rate": 4.7296e-06, "loss": 1.1292, "step": 3695 }, { "epoch": 0.12, "learning_rate": 4.736000000000001e-06, "loss": 1.1214, "step": 3700 }, { "epoch": 0.12, "learning_rate": 4.7424000000000005e-06, "loss": 1.1147, "step": 3705 }, { "epoch": 0.12, "learning_rate": 4.748800000000001e-06, "loss": 1.1221, "step": 3710 }, { "epoch": 0.12, "learning_rate": 4.755200000000001e-06, "loss": 1.1251, "step": 3715 }, { "epoch": 0.12, "learning_rate": 4.7616e-06, "loss": 1.1192, "step": 3720 }, { "epoch": 0.12, "learning_rate": 4.768000000000001e-06, "loss": 1.1113, "step": 3725 }, { "epoch": 0.12, "learning_rate": 4.7744e-06, "loss": 1.1303, "step": 3730 }, { "epoch": 0.12, "learning_rate": 4.7808e-06, "loss": 1.1382, "step": 3735 }, { "epoch": 0.12, "learning_rate": 4.7872000000000005e-06, "loss": 1.1132, "step": 3740 }, { "epoch": 0.12, "learning_rate": 4.7936e-06, "loss": 1.12, "step": 3745 }, { "epoch": 0.12, "learning_rate": 4.800000000000001e-06, "loss": 1.1229, "step": 3750 }, { "epoch": 0.12, "learning_rate": 4.8064e-06, "loss": 1.1215, "step": 3755 }, { "epoch": 0.12, "learning_rate": 4.8128e-06, "loss": 1.1218, "step": 3760 }, { "epoch": 0.12, "learning_rate": 4.8192e-06, "loss": 1.117, "step": 3765 }, { "epoch": 0.12, "learning_rate": 4.8256e-06, "loss": 1.1133, "step": 3770 }, { "epoch": 0.12, "learning_rate": 4.8320000000000005e-06, "loss": 1.1067, "step": 3775 }, { "epoch": 0.12, "learning_rate": 4.8384e-06, "loss": 1.1147, "step": 3780 }, { "epoch": 0.12, "learning_rate": 4.844800000000001e-06, "loss": 1.1081, "step": 3785 }, { "epoch": 0.12, "learning_rate": 4.8512e-06, "loss": 1.1059, "step": 3790 }, { "epoch": 0.12, "learning_rate": 4.857600000000001e-06, "loss": 1.1188, "step": 3795 }, { "epoch": 0.12, "learning_rate": 4.864e-06, "loss": 1.1219, "step": 3800 }, { "epoch": 0.12, "learning_rate": 4.8704e-06, "loss": 1.1125, "step": 3805 }, { "epoch": 0.12, "learning_rate": 4.8768000000000005e-06, "loss": 1.1102, "step": 3810 }, { "epoch": 0.12, "learning_rate": 4.8832e-06, "loss": 1.1176, "step": 3815 }, { "epoch": 0.12, "learning_rate": 4.889600000000001e-06, "loss": 1.117, "step": 3820 }, { "epoch": 0.12, "learning_rate": 4.896e-06, "loss": 1.1167, "step": 3825 }, { "epoch": 0.12, "learning_rate": 4.902400000000001e-06, "loss": 1.1284, "step": 3830 }, { "epoch": 0.12, "learning_rate": 4.9088e-06, "loss": 1.1064, "step": 3835 }, { "epoch": 0.12, "learning_rate": 4.915200000000001e-06, "loss": 1.1134, "step": 3840 }, { "epoch": 0.12, "learning_rate": 4.9216000000000004e-06, "loss": 1.1087, "step": 3845 }, { "epoch": 0.12, "learning_rate": 4.928000000000001e-06, "loss": 1.1161, "step": 3850 }, { "epoch": 0.12, "learning_rate": 4.9344000000000006e-06, "loss": 1.1061, "step": 3855 }, { "epoch": 0.12, "learning_rate": 4.9408e-06, "loss": 1.1224, "step": 3860 }, { "epoch": 0.12, "learning_rate": 4.947200000000001e-06, "loss": 1.1233, "step": 3865 }, { "epoch": 0.12, "learning_rate": 4.9536e-06, "loss": 1.1126, "step": 3870 }, { "epoch": 0.12, "learning_rate": 4.960000000000001e-06, "loss": 1.1029, "step": 3875 }, { "epoch": 0.12, "learning_rate": 4.9664000000000004e-06, "loss": 1.1088, "step": 3880 }, { "epoch": 0.12, "learning_rate": 4.9728e-06, "loss": 1.122, "step": 3885 }, { "epoch": 0.12, "learning_rate": 4.9792000000000005e-06, "loss": 1.109, "step": 3890 }, { "epoch": 0.12, "learning_rate": 4.9856e-06, "loss": 1.1128, "step": 3895 }, { "epoch": 0.12, "learning_rate": 4.992e-06, "loss": 1.1019, "step": 3900 }, { "epoch": 0.12, "learning_rate": 4.9984e-06, "loss": 1.1092, "step": 3905 }, { "epoch": 0.13, "learning_rate": 5.004800000000001e-06, "loss": 1.1368, "step": 3910 }, { "epoch": 0.13, "learning_rate": 5.0112e-06, "loss": 1.1141, "step": 3915 }, { "epoch": 0.13, "learning_rate": 5.0176e-06, "loss": 1.1032, "step": 3920 }, { "epoch": 0.13, "learning_rate": 5.024e-06, "loss": 1.1166, "step": 3925 }, { "epoch": 0.13, "learning_rate": 5.030400000000001e-06, "loss": 1.1135, "step": 3930 }, { "epoch": 0.13, "learning_rate": 5.036800000000001e-06, "loss": 1.1105, "step": 3935 }, { "epoch": 0.13, "learning_rate": 5.0432e-06, "loss": 1.1097, "step": 3940 }, { "epoch": 0.13, "learning_rate": 5.0496e-06, "loss": 1.1196, "step": 3945 }, { "epoch": 0.13, "learning_rate": 5.056000000000001e-06, "loss": 1.1085, "step": 3950 }, { "epoch": 0.13, "learning_rate": 5.062400000000001e-06, "loss": 1.1197, "step": 3955 }, { "epoch": 0.13, "learning_rate": 5.0688000000000005e-06, "loss": 1.1153, "step": 3960 }, { "epoch": 0.13, "learning_rate": 5.0752e-06, "loss": 1.1081, "step": 3965 }, { "epoch": 0.13, "learning_rate": 5.0816e-06, "loss": 1.108, "step": 3970 }, { "epoch": 0.13, "learning_rate": 5.088000000000001e-06, "loss": 1.1096, "step": 3975 }, { "epoch": 0.13, "learning_rate": 5.094400000000001e-06, "loss": 1.098, "step": 3980 }, { "epoch": 0.13, "learning_rate": 5.1008e-06, "loss": 1.1007, "step": 3985 }, { "epoch": 0.13, "learning_rate": 5.1072e-06, "loss": 1.1012, "step": 3990 }, { "epoch": 0.13, "learning_rate": 5.1136000000000005e-06, "loss": 1.1062, "step": 3995 }, { "epoch": 0.13, "learning_rate": 5.12e-06, "loss": 1.1051, "step": 4000 }, { "epoch": 0.13, "learning_rate": 5.126400000000001e-06, "loss": 1.1022, "step": 4005 }, { "epoch": 0.13, "learning_rate": 5.1328e-06, "loss": 1.1045, "step": 4010 }, { "epoch": 0.13, "learning_rate": 5.139200000000001e-06, "loss": 1.0868, "step": 4015 }, { "epoch": 0.13, "learning_rate": 5.1456e-06, "loss": 1.1038, "step": 4020 }, { "epoch": 0.13, "learning_rate": 5.152e-06, "loss": 1.1027, "step": 4025 }, { "epoch": 0.13, "learning_rate": 5.1584000000000005e-06, "loss": 1.0988, "step": 4030 }, { "epoch": 0.13, "learning_rate": 5.164800000000001e-06, "loss": 1.0951, "step": 4035 }, { "epoch": 0.13, "learning_rate": 5.1712000000000006e-06, "loss": 1.1101, "step": 4040 }, { "epoch": 0.13, "learning_rate": 5.1776e-06, "loss": 1.113, "step": 4045 }, { "epoch": 0.13, "learning_rate": 5.184e-06, "loss": 1.1006, "step": 4050 }, { "epoch": 0.13, "learning_rate": 5.1903999999999995e-06, "loss": 1.0965, "step": 4055 }, { "epoch": 0.13, "learning_rate": 5.196800000000001e-06, "loss": 1.094, "step": 4060 }, { "epoch": 0.13, "learning_rate": 5.2032000000000004e-06, "loss": 1.1024, "step": 4065 }, { "epoch": 0.13, "learning_rate": 5.2096e-06, "loss": 1.0949, "step": 4070 }, { "epoch": 0.13, "learning_rate": 5.216e-06, "loss": 1.104, "step": 4075 }, { "epoch": 0.13, "learning_rate": 5.222400000000001e-06, "loss": 1.0972, "step": 4080 }, { "epoch": 0.13, "learning_rate": 5.228800000000001e-06, "loss": 1.1053, "step": 4085 }, { "epoch": 0.13, "learning_rate": 5.2352e-06, "loss": 1.0882, "step": 4090 }, { "epoch": 0.13, "learning_rate": 5.2416e-06, "loss": 1.0947, "step": 4095 }, { "epoch": 0.13, "learning_rate": 5.248000000000001e-06, "loss": 1.0961, "step": 4100 }, { "epoch": 0.13, "learning_rate": 5.254400000000001e-06, "loss": 1.105, "step": 4105 }, { "epoch": 0.13, "learning_rate": 5.2608000000000005e-06, "loss": 1.1045, "step": 4110 }, { "epoch": 0.13, "learning_rate": 5.2672e-06, "loss": 1.0944, "step": 4115 }, { "epoch": 0.13, "learning_rate": 5.273600000000001e-06, "loss": 1.1194, "step": 4120 }, { "epoch": 0.13, "learning_rate": 5.28e-06, "loss": 1.0988, "step": 4125 }, { "epoch": 0.13, "learning_rate": 5.286400000000001e-06, "loss": 1.0964, "step": 4130 }, { "epoch": 0.13, "learning_rate": 5.2928e-06, "loss": 1.0974, "step": 4135 }, { "epoch": 0.13, "learning_rate": 5.2992e-06, "loss": 1.0932, "step": 4140 }, { "epoch": 0.13, "learning_rate": 5.3056000000000005e-06, "loss": 1.0935, "step": 4145 }, { "epoch": 0.13, "learning_rate": 5.312e-06, "loss": 1.1063, "step": 4150 }, { "epoch": 0.13, "learning_rate": 5.318400000000001e-06, "loss": 1.1039, "step": 4155 }, { "epoch": 0.13, "learning_rate": 5.3248e-06, "loss": 1.0976, "step": 4160 }, { "epoch": 0.13, "learning_rate": 5.331200000000001e-06, "loss": 1.1055, "step": 4165 }, { "epoch": 0.13, "learning_rate": 5.3376e-06, "loss": 1.1024, "step": 4170 }, { "epoch": 0.13, "learning_rate": 5.344e-06, "loss": 1.0948, "step": 4175 }, { "epoch": 0.13, "learning_rate": 5.3504e-06, "loss": 1.0916, "step": 4180 }, { "epoch": 0.13, "learning_rate": 5.356800000000001e-06, "loss": 1.1027, "step": 4185 }, { "epoch": 0.13, "learning_rate": 5.363200000000001e-06, "loss": 1.0911, "step": 4190 }, { "epoch": 0.13, "learning_rate": 5.3696e-06, "loss": 1.0785, "step": 4195 }, { "epoch": 0.13, "learning_rate": 5.376e-06, "loss": 1.0963, "step": 4200 }, { "epoch": 0.13, "learning_rate": 5.382400000000001e-06, "loss": 1.1146, "step": 4205 }, { "epoch": 0.13, "learning_rate": 5.388800000000001e-06, "loss": 1.1052, "step": 4210 }, { "epoch": 0.13, "learning_rate": 5.3952000000000005e-06, "loss": 1.0896, "step": 4215 }, { "epoch": 0.14, "learning_rate": 5.4016e-06, "loss": 1.0978, "step": 4220 }, { "epoch": 0.14, "learning_rate": 5.408e-06, "loss": 1.0934, "step": 4225 }, { "epoch": 0.14, "learning_rate": 5.414400000000001e-06, "loss": 1.0947, "step": 4230 }, { "epoch": 0.14, "learning_rate": 5.420800000000001e-06, "loss": 1.0942, "step": 4235 }, { "epoch": 0.14, "learning_rate": 5.4272e-06, "loss": 1.0831, "step": 4240 }, { "epoch": 0.14, "learning_rate": 5.4336e-06, "loss": 1.1008, "step": 4245 }, { "epoch": 0.14, "learning_rate": 5.4400000000000004e-06, "loss": 1.096, "step": 4250 }, { "epoch": 0.14, "learning_rate": 5.446400000000001e-06, "loss": 1.0949, "step": 4255 }, { "epoch": 0.14, "learning_rate": 5.4528000000000005e-06, "loss": 1.0885, "step": 4260 }, { "epoch": 0.14, "learning_rate": 5.4592e-06, "loss": 1.0937, "step": 4265 }, { "epoch": 0.14, "learning_rate": 5.465600000000001e-06, "loss": 1.0931, "step": 4270 }, { "epoch": 0.14, "learning_rate": 5.472e-06, "loss": 1.0996, "step": 4275 }, { "epoch": 0.14, "learning_rate": 5.478400000000001e-06, "loss": 1.0817, "step": 4280 }, { "epoch": 0.14, "learning_rate": 5.4848e-06, "loss": 1.0868, "step": 4285 }, { "epoch": 0.14, "learning_rate": 5.491200000000001e-06, "loss": 1.0908, "step": 4290 }, { "epoch": 0.14, "learning_rate": 5.4976000000000005e-06, "loss": 1.1053, "step": 4295 }, { "epoch": 0.14, "learning_rate": 5.504e-06, "loss": 1.0902, "step": 4300 }, { "epoch": 0.14, "learning_rate": 5.5104e-06, "loss": 1.0843, "step": 4305 }, { "epoch": 0.14, "learning_rate": 5.5168e-06, "loss": 1.0987, "step": 4310 }, { "epoch": 0.14, "learning_rate": 5.523200000000001e-06, "loss": 1.1047, "step": 4315 }, { "epoch": 0.14, "learning_rate": 5.5296e-06, "loss": 1.1021, "step": 4320 }, { "epoch": 0.14, "learning_rate": 5.536e-06, "loss": 1.091, "step": 4325 }, { "epoch": 0.14, "learning_rate": 5.5424e-06, "loss": 1.0851, "step": 4330 }, { "epoch": 0.14, "learning_rate": 5.548800000000001e-06, "loss": 1.0738, "step": 4335 }, { "epoch": 0.14, "learning_rate": 5.555200000000001e-06, "loss": 1.0986, "step": 4340 }, { "epoch": 0.14, "learning_rate": 5.5616e-06, "loss": 1.1086, "step": 4345 }, { "epoch": 0.14, "learning_rate": 5.568e-06, "loss": 1.0828, "step": 4350 }, { "epoch": 0.14, "learning_rate": 5.574400000000001e-06, "loss": 1.0802, "step": 4355 }, { "epoch": 0.14, "learning_rate": 5.580800000000001e-06, "loss": 1.0756, "step": 4360 }, { "epoch": 0.14, "learning_rate": 5.5872000000000005e-06, "loss": 1.0716, "step": 4365 }, { "epoch": 0.14, "learning_rate": 5.5936e-06, "loss": 1.0891, "step": 4370 }, { "epoch": 0.14, "learning_rate": 5.600000000000001e-06, "loss": 1.0753, "step": 4375 }, { "epoch": 0.14, "learning_rate": 5.606400000000001e-06, "loss": 1.0756, "step": 4380 }, { "epoch": 0.14, "learning_rate": 5.612800000000001e-06, "loss": 1.0906, "step": 4385 }, { "epoch": 0.14, "learning_rate": 5.6192e-06, "loss": 1.0901, "step": 4390 }, { "epoch": 0.14, "learning_rate": 5.6256e-06, "loss": 1.0683, "step": 4395 }, { "epoch": 0.14, "learning_rate": 5.6320000000000005e-06, "loss": 1.0814, "step": 4400 }, { "epoch": 0.14, "learning_rate": 5.638400000000001e-06, "loss": 1.084, "step": 4405 }, { "epoch": 0.14, "learning_rate": 5.6448000000000006e-06, "loss": 1.0843, "step": 4410 }, { "epoch": 0.14, "learning_rate": 5.6512e-06, "loss": 1.0862, "step": 4415 }, { "epoch": 0.14, "learning_rate": 5.657600000000001e-06, "loss": 1.073, "step": 4420 }, { "epoch": 0.14, "learning_rate": 5.664e-06, "loss": 1.0885, "step": 4425 }, { "epoch": 0.14, "learning_rate": 5.6704e-06, "loss": 1.0968, "step": 4430 }, { "epoch": 0.14, "learning_rate": 5.6768000000000004e-06, "loss": 1.0841, "step": 4435 }, { "epoch": 0.14, "learning_rate": 5.683200000000001e-06, "loss": 1.0782, "step": 4440 }, { "epoch": 0.14, "learning_rate": 5.6896000000000005e-06, "loss": 1.0972, "step": 4445 }, { "epoch": 0.14, "learning_rate": 5.696e-06, "loss": 1.0786, "step": 4450 }, { "epoch": 0.14, "learning_rate": 5.7024e-06, "loss": 1.0806, "step": 4455 }, { "epoch": 0.14, "learning_rate": 5.708800000000001e-06, "loss": 1.0873, "step": 4460 }, { "epoch": 0.14, "learning_rate": 5.715200000000001e-06, "loss": 1.0864, "step": 4465 }, { "epoch": 0.14, "learning_rate": 5.7216e-06, "loss": 1.0776, "step": 4470 }, { "epoch": 0.14, "learning_rate": 5.728e-06, "loss": 1.084, "step": 4475 }, { "epoch": 0.14, "learning_rate": 5.7344e-06, "loss": 1.0791, "step": 4480 }, { "epoch": 0.14, "learning_rate": 5.740800000000001e-06, "loss": 1.083, "step": 4485 }, { "epoch": 0.14, "learning_rate": 5.747200000000001e-06, "loss": 1.0859, "step": 4490 }, { "epoch": 0.14, "learning_rate": 5.7536e-06, "loss": 1.0917, "step": 4495 }, { "epoch": 0.14, "learning_rate": 5.76e-06, "loss": 1.0824, "step": 4500 }, { "epoch": 0.14, "learning_rate": 5.766400000000001e-06, "loss": 1.0849, "step": 4505 }, { "epoch": 0.14, "learning_rate": 5.772800000000001e-06, "loss": 1.0772, "step": 4510 }, { "epoch": 0.14, "learning_rate": 5.7792000000000005e-06, "loss": 1.0824, "step": 4515 }, { "epoch": 0.14, "learning_rate": 5.7856e-06, "loss": 1.0661, "step": 4520 }, { "epoch": 0.14, "learning_rate": 5.792000000000001e-06, "loss": 1.0654, "step": 4525 }, { "epoch": 0.14, "learning_rate": 5.798400000000001e-06, "loss": 1.0809, "step": 4530 }, { "epoch": 0.15, "learning_rate": 5.804800000000001e-06, "loss": 1.0822, "step": 4535 }, { "epoch": 0.15, "learning_rate": 5.8112e-06, "loss": 1.0759, "step": 4540 }, { "epoch": 0.15, "learning_rate": 5.817600000000001e-06, "loss": 1.0764, "step": 4545 }, { "epoch": 0.15, "learning_rate": 5.8240000000000005e-06, "loss": 1.084, "step": 4550 }, { "epoch": 0.15, "learning_rate": 5.8304e-06, "loss": 1.0857, "step": 4555 }, { "epoch": 0.15, "learning_rate": 5.836800000000001e-06, "loss": 1.0769, "step": 4560 }, { "epoch": 0.15, "learning_rate": 5.8432e-06, "loss": 1.0812, "step": 4565 }, { "epoch": 0.15, "learning_rate": 5.849600000000001e-06, "loss": 1.0736, "step": 4570 }, { "epoch": 0.15, "learning_rate": 5.856e-06, "loss": 1.0708, "step": 4575 }, { "epoch": 0.15, "learning_rate": 5.8624e-06, "loss": 1.0782, "step": 4580 }, { "epoch": 0.15, "learning_rate": 5.8688000000000005e-06, "loss": 1.0681, "step": 4585 }, { "epoch": 0.15, "learning_rate": 5.875200000000001e-06, "loss": 1.0737, "step": 4590 }, { "epoch": 0.15, "learning_rate": 5.8816000000000006e-06, "loss": 1.0563, "step": 4595 }, { "epoch": 0.15, "learning_rate": 5.888e-06, "loss": 1.0874, "step": 4600 }, { "epoch": 0.15, "learning_rate": 5.8944e-06, "loss": 1.0702, "step": 4605 }, { "epoch": 0.15, "learning_rate": 5.900800000000001e-06, "loss": 1.0759, "step": 4610 }, { "epoch": 0.15, "learning_rate": 5.907200000000001e-06, "loss": 1.069, "step": 4615 }, { "epoch": 0.15, "learning_rate": 5.9136000000000004e-06, "loss": 1.0854, "step": 4620 }, { "epoch": 0.15, "learning_rate": 5.92e-06, "loss": 1.0817, "step": 4625 }, { "epoch": 0.15, "learning_rate": 5.9264e-06, "loss": 1.0715, "step": 4630 }, { "epoch": 0.15, "learning_rate": 5.932800000000001e-06, "loss": 1.0658, "step": 4635 }, { "epoch": 0.15, "learning_rate": 5.939200000000001e-06, "loss": 1.0956, "step": 4640 }, { "epoch": 0.15, "learning_rate": 5.9456e-06, "loss": 1.0769, "step": 4645 }, { "epoch": 0.15, "learning_rate": 5.952e-06, "loss": 1.0765, "step": 4650 }, { "epoch": 0.15, "learning_rate": 5.958400000000001e-06, "loss": 1.0685, "step": 4655 }, { "epoch": 0.15, "learning_rate": 5.964800000000001e-06, "loss": 1.0838, "step": 4660 }, { "epoch": 0.15, "learning_rate": 5.9712000000000005e-06, "loss": 1.0689, "step": 4665 }, { "epoch": 0.15, "learning_rate": 5.9776e-06, "loss": 1.0739, "step": 4670 }, { "epoch": 0.15, "learning_rate": 5.984000000000001e-06, "loss": 1.0598, "step": 4675 }, { "epoch": 0.15, "learning_rate": 5.9904e-06, "loss": 1.0591, "step": 4680 }, { "epoch": 0.15, "learning_rate": 5.996800000000001e-06, "loss": 1.0691, "step": 4685 }, { "epoch": 0.15, "learning_rate": 6.0032e-06, "loss": 1.0649, "step": 4690 }, { "epoch": 0.15, "learning_rate": 6.009600000000001e-06, "loss": 1.0686, "step": 4695 }, { "epoch": 0.15, "learning_rate": 6.0160000000000005e-06, "loss": 1.0903, "step": 4700 }, { "epoch": 0.15, "learning_rate": 6.0224e-06, "loss": 1.0572, "step": 4705 }, { "epoch": 0.15, "learning_rate": 6.028800000000001e-06, "loss": 1.0776, "step": 4710 }, { "epoch": 0.15, "learning_rate": 6.0352e-06, "loss": 1.0562, "step": 4715 }, { "epoch": 0.15, "learning_rate": 6.041600000000001e-06, "loss": 1.0634, "step": 4720 }, { "epoch": 0.15, "learning_rate": 6.048e-06, "loss": 1.0607, "step": 4725 }, { "epoch": 0.15, "learning_rate": 6.0544e-06, "loss": 1.065, "step": 4730 }, { "epoch": 0.15, "learning_rate": 6.0608e-06, "loss": 1.0768, "step": 4735 }, { "epoch": 0.15, "learning_rate": 6.067200000000001e-06, "loss": 1.0714, "step": 4740 }, { "epoch": 0.15, "learning_rate": 6.073600000000001e-06, "loss": 1.064, "step": 4745 }, { "epoch": 0.15, "learning_rate": 6.08e-06, "loss": 1.0538, "step": 4750 }, { "epoch": 0.15, "learning_rate": 6.0864e-06, "loss": 1.0824, "step": 4755 }, { "epoch": 0.15, "learning_rate": 6.092800000000001e-06, "loss": 1.0694, "step": 4760 }, { "epoch": 0.15, "learning_rate": 6.099200000000001e-06, "loss": 1.0748, "step": 4765 }, { "epoch": 0.15, "learning_rate": 6.1056000000000005e-06, "loss": 1.0536, "step": 4770 }, { "epoch": 0.15, "learning_rate": 6.112e-06, "loss": 1.0521, "step": 4775 }, { "epoch": 0.15, "learning_rate": 6.1184000000000014e-06, "loss": 1.0677, "step": 4780 }, { "epoch": 0.15, "learning_rate": 6.124800000000001e-06, "loss": 1.0648, "step": 4785 }, { "epoch": 0.15, "learning_rate": 6.131200000000001e-06, "loss": 1.0741, "step": 4790 }, { "epoch": 0.15, "learning_rate": 6.1376e-06, "loss": 1.0583, "step": 4795 }, { "epoch": 0.15, "learning_rate": 6.144e-06, "loss": 1.0671, "step": 4800 }, { "epoch": 0.15, "learning_rate": 6.1504000000000004e-06, "loss": 1.062, "step": 4805 }, { "epoch": 0.15, "learning_rate": 6.156800000000001e-06, "loss": 1.0676, "step": 4810 }, { "epoch": 0.15, "learning_rate": 6.1632000000000006e-06, "loss": 1.068, "step": 4815 }, { "epoch": 0.15, "learning_rate": 6.1696e-06, "loss": 1.0704, "step": 4820 }, { "epoch": 0.15, "learning_rate": 6.176000000000001e-06, "loss": 1.06, "step": 4825 }, { "epoch": 0.15, "learning_rate": 6.1824e-06, "loss": 1.0835, "step": 4830 }, { "epoch": 0.15, "learning_rate": 6.188800000000001e-06, "loss": 1.0541, "step": 4835 }, { "epoch": 0.15, "learning_rate": 6.1952e-06, "loss": 1.0636, "step": 4840 }, { "epoch": 0.16, "learning_rate": 6.201600000000001e-06, "loss": 1.0613, "step": 4845 }, { "epoch": 0.16, "learning_rate": 6.2080000000000005e-06, "loss": 1.0516, "step": 4850 }, { "epoch": 0.16, "learning_rate": 6.2144e-06, "loss": 1.0537, "step": 4855 }, { "epoch": 0.16, "learning_rate": 6.2208e-06, "loss": 1.0563, "step": 4860 }, { "epoch": 0.16, "learning_rate": 6.227200000000001e-06, "loss": 1.0686, "step": 4865 }, { "epoch": 0.16, "learning_rate": 6.233600000000001e-06, "loss": 1.0635, "step": 4870 }, { "epoch": 0.16, "learning_rate": 6.24e-06, "loss": 1.0724, "step": 4875 }, { "epoch": 0.16, "learning_rate": 6.2464e-06, "loss": 1.0648, "step": 4880 }, { "epoch": 0.16, "learning_rate": 6.2528e-06, "loss": 1.0773, "step": 4885 }, { "epoch": 0.16, "learning_rate": 6.259200000000001e-06, "loss": 1.0591, "step": 4890 }, { "epoch": 0.16, "learning_rate": 6.265600000000001e-06, "loss": 1.0571, "step": 4895 }, { "epoch": 0.16, "learning_rate": 6.272e-06, "loss": 1.0419, "step": 4900 }, { "epoch": 0.16, "learning_rate": 6.2784e-06, "loss": 1.0715, "step": 4905 }, { "epoch": 0.16, "learning_rate": 6.284800000000001e-06, "loss": 1.0617, "step": 4910 }, { "epoch": 0.16, "learning_rate": 6.291200000000001e-06, "loss": 1.072, "step": 4915 }, { "epoch": 0.16, "learning_rate": 6.2976000000000005e-06, "loss": 1.0733, "step": 4920 }, { "epoch": 0.16, "learning_rate": 6.304e-06, "loss": 1.0468, "step": 4925 }, { "epoch": 0.16, "learning_rate": 6.310400000000001e-06, "loss": 1.0618, "step": 4930 }, { "epoch": 0.16, "learning_rate": 6.316800000000001e-06, "loss": 1.0567, "step": 4935 }, { "epoch": 0.16, "learning_rate": 6.323200000000001e-06, "loss": 1.076, "step": 4940 }, { "epoch": 0.16, "learning_rate": 6.3296e-06, "loss": 1.0676, "step": 4945 }, { "epoch": 0.16, "learning_rate": 6.336000000000001e-06, "loss": 1.0654, "step": 4950 }, { "epoch": 0.16, "learning_rate": 6.3424000000000005e-06, "loss": 1.056, "step": 4955 }, { "epoch": 0.16, "learning_rate": 6.3488e-06, "loss": 1.0741, "step": 4960 }, { "epoch": 0.16, "learning_rate": 6.355200000000001e-06, "loss": 1.0556, "step": 4965 }, { "epoch": 0.16, "learning_rate": 6.3616e-06, "loss": 1.0664, "step": 4970 }, { "epoch": 0.16, "learning_rate": 6.368000000000001e-06, "loss": 1.0494, "step": 4975 }, { "epoch": 0.16, "learning_rate": 6.3744e-06, "loss": 1.0628, "step": 4980 }, { "epoch": 0.16, "learning_rate": 6.3808e-06, "loss": 1.0528, "step": 4985 }, { "epoch": 0.16, "learning_rate": 6.3872000000000004e-06, "loss": 1.0606, "step": 4990 }, { "epoch": 0.16, "learning_rate": 6.393600000000001e-06, "loss": 1.0548, "step": 4995 }, { "epoch": 0.16, "learning_rate": 6.4000000000000006e-06, "loss": 1.0434, "step": 5000 }, { "epoch": 0.16, "learning_rate": 6.4064e-06, "loss": 1.0298, "step": 5005 }, { "epoch": 0.16, "learning_rate": 6.4128e-06, "loss": 1.0451, "step": 5010 }, { "epoch": 0.16, "learning_rate": 6.419200000000001e-06, "loss": 1.0565, "step": 5015 }, { "epoch": 0.16, "learning_rate": 6.425600000000001e-06, "loss": 1.0611, "step": 5020 }, { "epoch": 0.16, "learning_rate": 6.432e-06, "loss": 1.0505, "step": 5025 }, { "epoch": 0.16, "learning_rate": 6.4384e-06, "loss": 1.0563, "step": 5030 }, { "epoch": 0.16, "learning_rate": 6.444800000000001e-06, "loss": 1.0625, "step": 5035 }, { "epoch": 0.16, "learning_rate": 6.451200000000001e-06, "loss": 1.0601, "step": 5040 }, { "epoch": 0.16, "learning_rate": 6.457600000000001e-06, "loss": 1.0514, "step": 5045 }, { "epoch": 0.16, "learning_rate": 6.464e-06, "loss": 1.0434, "step": 5050 }, { "epoch": 0.16, "learning_rate": 6.4704e-06, "loss": 1.037, "step": 5055 }, { "epoch": 0.16, "learning_rate": 6.476800000000001e-06, "loss": 1.0531, "step": 5060 }, { "epoch": 0.16, "learning_rate": 6.483200000000001e-06, "loss": 1.047, "step": 5065 }, { "epoch": 0.16, "learning_rate": 6.4896000000000005e-06, "loss": 1.0408, "step": 5070 }, { "epoch": 0.16, "learning_rate": 6.496e-06, "loss": 1.0489, "step": 5075 }, { "epoch": 0.16, "learning_rate": 6.502400000000001e-06, "loss": 1.0545, "step": 5080 }, { "epoch": 0.16, "learning_rate": 6.5088e-06, "loss": 1.0555, "step": 5085 }, { "epoch": 0.16, "learning_rate": 6.515200000000001e-06, "loss": 1.0603, "step": 5090 }, { "epoch": 0.16, "learning_rate": 6.5216e-06, "loss": 1.0415, "step": 5095 }, { "epoch": 0.16, "learning_rate": 6.528000000000001e-06, "loss": 1.0547, "step": 5100 }, { "epoch": 0.16, "learning_rate": 6.5344000000000005e-06, "loss": 1.0452, "step": 5105 }, { "epoch": 0.16, "learning_rate": 6.5408e-06, "loss": 1.0611, "step": 5110 }, { "epoch": 0.16, "learning_rate": 6.547200000000001e-06, "loss": 1.0604, "step": 5115 }, { "epoch": 0.16, "learning_rate": 6.553600000000001e-06, "loss": 1.0455, "step": 5120 }, { "epoch": 0.16, "learning_rate": 6.560000000000001e-06, "loss": 1.0583, "step": 5125 }, { "epoch": 0.16, "learning_rate": 6.5664e-06, "loss": 1.0493, "step": 5130 }, { "epoch": 0.16, "learning_rate": 6.5728e-06, "loss": 1.0521, "step": 5135 }, { "epoch": 0.16, "learning_rate": 6.5792e-06, "loss": 1.0707, "step": 5140 }, { "epoch": 0.16, "learning_rate": 6.585600000000001e-06, "loss": 1.0615, "step": 5145 }, { "epoch": 0.16, "learning_rate": 6.592000000000001e-06, "loss": 1.0697, "step": 5150 }, { "epoch": 0.16, "learning_rate": 6.5984e-06, "loss": 1.0473, "step": 5155 }, { "epoch": 0.17, "learning_rate": 6.6048e-06, "loss": 1.0533, "step": 5160 }, { "epoch": 0.17, "learning_rate": 6.611200000000001e-06, "loss": 1.0601, "step": 5165 }, { "epoch": 0.17, "learning_rate": 6.617600000000001e-06, "loss": 1.0316, "step": 5170 }, { "epoch": 0.17, "learning_rate": 6.6240000000000004e-06, "loss": 1.054, "step": 5175 }, { "epoch": 0.17, "learning_rate": 6.6304e-06, "loss": 1.052, "step": 5180 }, { "epoch": 0.17, "learning_rate": 6.636800000000001e-06, "loss": 1.0508, "step": 5185 }, { "epoch": 0.17, "learning_rate": 6.643200000000001e-06, "loss": 1.0503, "step": 5190 }, { "epoch": 0.17, "learning_rate": 6.649600000000001e-06, "loss": 1.044, "step": 5195 }, { "epoch": 0.17, "learning_rate": 6.656e-06, "loss": 1.0572, "step": 5200 }, { "epoch": 0.17, "learning_rate": 6.662400000000001e-06, "loss": 1.0439, "step": 5205 }, { "epoch": 0.17, "learning_rate": 6.6688e-06, "loss": 1.0596, "step": 5210 }, { "epoch": 0.17, "learning_rate": 6.675200000000001e-06, "loss": 1.0474, "step": 5215 }, { "epoch": 0.17, "learning_rate": 6.6816000000000005e-06, "loss": 1.0536, "step": 5220 }, { "epoch": 0.17, "learning_rate": 6.688e-06, "loss": 1.0393, "step": 5225 }, { "epoch": 0.17, "learning_rate": 6.694400000000001e-06, "loss": 1.0396, "step": 5230 }, { "epoch": 0.17, "learning_rate": 6.7008e-06, "loss": 1.0473, "step": 5235 }, { "epoch": 0.17, "learning_rate": 6.707200000000001e-06, "loss": 1.0459, "step": 5240 }, { "epoch": 0.17, "learning_rate": 6.7136e-06, "loss": 1.0405, "step": 5245 }, { "epoch": 0.17, "learning_rate": 6.720000000000001e-06, "loss": 1.0418, "step": 5250 }, { "epoch": 0.17, "learning_rate": 6.7264000000000005e-06, "loss": 1.0621, "step": 5255 }, { "epoch": 0.17, "learning_rate": 6.7328e-06, "loss": 1.049, "step": 5260 }, { "epoch": 0.17, "learning_rate": 6.7392e-06, "loss": 1.0462, "step": 5265 }, { "epoch": 0.17, "learning_rate": 6.745600000000001e-06, "loss": 1.0452, "step": 5270 }, { "epoch": 0.17, "learning_rate": 6.752000000000001e-06, "loss": 1.0403, "step": 5275 }, { "epoch": 0.17, "learning_rate": 6.7584e-06, "loss": 1.052, "step": 5280 }, { "epoch": 0.17, "learning_rate": 6.7648e-06, "loss": 1.0382, "step": 5285 }, { "epoch": 0.17, "learning_rate": 6.771200000000001e-06, "loss": 1.0353, "step": 5290 }, { "epoch": 0.17, "learning_rate": 6.777600000000001e-06, "loss": 1.0386, "step": 5295 }, { "epoch": 0.17, "learning_rate": 6.784000000000001e-06, "loss": 1.0429, "step": 5300 }, { "epoch": 0.17, "learning_rate": 6.7904e-06, "loss": 1.0452, "step": 5305 }, { "epoch": 0.17, "learning_rate": 6.7968e-06, "loss": 1.0397, "step": 5310 }, { "epoch": 0.17, "learning_rate": 6.803200000000001e-06, "loss": 1.0434, "step": 5315 }, { "epoch": 0.17, "learning_rate": 6.809600000000001e-06, "loss": 1.0482, "step": 5320 }, { "epoch": 0.17, "learning_rate": 6.8160000000000005e-06, "loss": 1.0361, "step": 5325 }, { "epoch": 0.17, "learning_rate": 6.8224e-06, "loss": 1.0356, "step": 5330 }, { "epoch": 0.17, "learning_rate": 6.828800000000001e-06, "loss": 1.0478, "step": 5335 }, { "epoch": 0.17, "learning_rate": 6.835200000000001e-06, "loss": 1.048, "step": 5340 }, { "epoch": 0.17, "learning_rate": 6.841600000000001e-06, "loss": 1.0155, "step": 5345 }, { "epoch": 0.17, "learning_rate": 6.848e-06, "loss": 1.0397, "step": 5350 }, { "epoch": 0.17, "learning_rate": 6.854400000000001e-06, "loss": 1.0385, "step": 5355 }, { "epoch": 0.17, "learning_rate": 6.8608000000000004e-06, "loss": 1.0347, "step": 5360 }, { "epoch": 0.17, "learning_rate": 6.867200000000001e-06, "loss": 1.0326, "step": 5365 }, { "epoch": 0.17, "learning_rate": 6.8736000000000006e-06, "loss": 1.0423, "step": 5370 }, { "epoch": 0.17, "learning_rate": 6.88e-06, "loss": 1.0348, "step": 5375 }, { "epoch": 0.17, "learning_rate": 6.886400000000001e-06, "loss": 1.0581, "step": 5380 }, { "epoch": 0.17, "learning_rate": 6.8928e-06, "loss": 1.0366, "step": 5385 }, { "epoch": 0.17, "learning_rate": 6.8992e-06, "loss": 1.0362, "step": 5390 }, { "epoch": 0.17, "learning_rate": 6.9056000000000004e-06, "loss": 1.0369, "step": 5395 }, { "epoch": 0.17, "learning_rate": 6.912000000000001e-06, "loss": 1.031, "step": 5400 }, { "epoch": 0.17, "learning_rate": 6.9184000000000005e-06, "loss": 1.0433, "step": 5405 }, { "epoch": 0.17, "learning_rate": 6.9248e-06, "loss": 1.0308, "step": 5410 }, { "epoch": 0.17, "learning_rate": 6.9312e-06, "loss": 1.0312, "step": 5415 }, { "epoch": 0.17, "learning_rate": 6.937600000000001e-06, "loss": 1.0466, "step": 5420 }, { "epoch": 0.17, "learning_rate": 6.944000000000001e-06, "loss": 1.0449, "step": 5425 }, { "epoch": 0.17, "learning_rate": 6.9504e-06, "loss": 1.0314, "step": 5430 }, { "epoch": 0.17, "learning_rate": 6.9568e-06, "loss": 1.0337, "step": 5435 }, { "epoch": 0.17, "learning_rate": 6.963200000000001e-06, "loss": 1.0287, "step": 5440 }, { "epoch": 0.17, "learning_rate": 6.969600000000001e-06, "loss": 1.0525, "step": 5445 }, { "epoch": 0.17, "learning_rate": 6.976000000000001e-06, "loss": 1.0354, "step": 5450 }, { "epoch": 0.17, "learning_rate": 6.9824e-06, "loss": 1.0241, "step": 5455 }, { "epoch": 0.17, "learning_rate": 6.9888e-06, "loss": 1.0315, "step": 5460 }, { "epoch": 0.17, "learning_rate": 6.995200000000001e-06, "loss": 1.029, "step": 5465 }, { "epoch": 0.18, "learning_rate": 7.001600000000001e-06, "loss": 1.0309, "step": 5470 }, { "epoch": 0.18, "learning_rate": 7.0080000000000005e-06, "loss": 1.0362, "step": 5475 }, { "epoch": 0.18, "learning_rate": 7.0144e-06, "loss": 1.0282, "step": 5480 }, { "epoch": 0.18, "learning_rate": 7.020800000000001e-06, "loss": 1.0276, "step": 5485 }, { "epoch": 0.18, "learning_rate": 7.027200000000001e-06, "loss": 1.0375, "step": 5490 }, { "epoch": 0.18, "learning_rate": 7.033600000000001e-06, "loss": 1.0265, "step": 5495 }, { "epoch": 0.18, "learning_rate": 7.04e-06, "loss": 1.0319, "step": 5500 }, { "epoch": 0.18, "learning_rate": 7.046400000000001e-06, "loss": 1.0477, "step": 5505 }, { "epoch": 0.18, "learning_rate": 7.0528000000000005e-06, "loss": 1.0397, "step": 5510 }, { "epoch": 0.18, "learning_rate": 7.0592e-06, "loss": 1.0229, "step": 5515 }, { "epoch": 0.18, "learning_rate": 7.065600000000001e-06, "loss": 1.0467, "step": 5520 }, { "epoch": 0.18, "learning_rate": 7.072000000000001e-06, "loss": 1.0455, "step": 5525 }, { "epoch": 0.18, "learning_rate": 7.078400000000001e-06, "loss": 1.0294, "step": 5530 }, { "epoch": 0.18, "learning_rate": 7.0848e-06, "loss": 1.0293, "step": 5535 }, { "epoch": 0.18, "learning_rate": 7.0912e-06, "loss": 1.0459, "step": 5540 }, { "epoch": 0.18, "learning_rate": 7.0976000000000005e-06, "loss": 1.0413, "step": 5545 }, { "epoch": 0.18, "learning_rate": 7.104000000000001e-06, "loss": 1.029, "step": 5550 }, { "epoch": 0.18, "learning_rate": 7.1104000000000006e-06, "loss": 1.0304, "step": 5555 }, { "epoch": 0.18, "learning_rate": 7.1168e-06, "loss": 1.0362, "step": 5560 }, { "epoch": 0.18, "learning_rate": 7.1232e-06, "loss": 1.0438, "step": 5565 }, { "epoch": 0.18, "learning_rate": 7.129600000000001e-06, "loss": 1.0199, "step": 5570 }, { "epoch": 0.18, "learning_rate": 7.136000000000001e-06, "loss": 1.0331, "step": 5575 }, { "epoch": 0.18, "learning_rate": 7.1424000000000004e-06, "loss": 1.0426, "step": 5580 }, { "epoch": 0.18, "learning_rate": 7.1488e-06, "loss": 1.0272, "step": 5585 }, { "epoch": 0.18, "learning_rate": 7.155200000000001e-06, "loss": 1.0324, "step": 5590 }, { "epoch": 0.18, "learning_rate": 7.161600000000001e-06, "loss": 1.0401, "step": 5595 }, { "epoch": 0.18, "learning_rate": 7.168000000000001e-06, "loss": 1.031, "step": 5600 }, { "epoch": 0.18, "learning_rate": 7.1744e-06, "loss": 1.0176, "step": 5605 }, { "epoch": 0.18, "learning_rate": 7.180800000000001e-06, "loss": 1.026, "step": 5610 }, { "epoch": 0.18, "learning_rate": 7.187200000000001e-06, "loss": 1.0294, "step": 5615 }, { "epoch": 0.18, "learning_rate": 7.193600000000001e-06, "loss": 1.0272, "step": 5620 }, { "epoch": 0.18, "learning_rate": 7.2000000000000005e-06, "loss": 1.0409, "step": 5625 }, { "epoch": 0.18, "learning_rate": 7.2064e-06, "loss": 1.0474, "step": 5630 }, { "epoch": 0.18, "learning_rate": 7.212800000000001e-06, "loss": 1.025, "step": 5635 }, { "epoch": 0.18, "learning_rate": 7.2192e-06, "loss": 1.0218, "step": 5640 }, { "epoch": 0.18, "learning_rate": 7.225600000000001e-06, "loss": 1.0405, "step": 5645 }, { "epoch": 0.18, "learning_rate": 7.232e-06, "loss": 1.017, "step": 5650 }, { "epoch": 0.18, "learning_rate": 7.238400000000001e-06, "loss": 1.0334, "step": 5655 }, { "epoch": 0.18, "learning_rate": 7.2448000000000005e-06, "loss": 1.0364, "step": 5660 }, { "epoch": 0.18, "learning_rate": 7.2512e-06, "loss": 1.0327, "step": 5665 }, { "epoch": 0.18, "learning_rate": 7.257600000000001e-06, "loss": 1.0442, "step": 5670 }, { "epoch": 0.18, "learning_rate": 7.264000000000001e-06, "loss": 1.0396, "step": 5675 }, { "epoch": 0.18, "learning_rate": 7.270400000000001e-06, "loss": 1.024, "step": 5680 }, { "epoch": 0.18, "learning_rate": 7.2768e-06, "loss": 1.0282, "step": 5685 }, { "epoch": 0.18, "learning_rate": 7.2832e-06, "loss": 1.0197, "step": 5690 }, { "epoch": 0.18, "learning_rate": 7.289600000000001e-06, "loss": 1.0294, "step": 5695 }, { "epoch": 0.18, "learning_rate": 7.296000000000001e-06, "loss": 1.0107, "step": 5700 }, { "epoch": 0.18, "learning_rate": 7.302400000000001e-06, "loss": 1.0292, "step": 5705 }, { "epoch": 0.18, "learning_rate": 7.3088e-06, "loss": 1.0261, "step": 5710 }, { "epoch": 0.18, "learning_rate": 7.3152e-06, "loss": 1.0266, "step": 5715 }, { "epoch": 0.18, "learning_rate": 7.321600000000001e-06, "loss": 1.0254, "step": 5720 }, { "epoch": 0.18, "learning_rate": 7.328000000000001e-06, "loss": 1.0267, "step": 5725 }, { "epoch": 0.18, "learning_rate": 7.3344000000000005e-06, "loss": 1.013, "step": 5730 }, { "epoch": 0.18, "learning_rate": 7.3408e-06, "loss": 1.0352, "step": 5735 }, { "epoch": 0.18, "learning_rate": 7.347200000000001e-06, "loss": 1.025, "step": 5740 }, { "epoch": 0.18, "learning_rate": 7.353600000000001e-06, "loss": 1.034, "step": 5745 }, { "epoch": 0.18, "learning_rate": 7.360000000000001e-06, "loss": 1.0261, "step": 5750 }, { "epoch": 0.18, "learning_rate": 7.3664e-06, "loss": 1.029, "step": 5755 }, { "epoch": 0.18, "learning_rate": 7.372800000000001e-06, "loss": 1.0113, "step": 5760 }, { "epoch": 0.18, "learning_rate": 7.3792000000000004e-06, "loss": 1.0248, "step": 5765 }, { "epoch": 0.18, "learning_rate": 7.385600000000001e-06, "loss": 1.0338, "step": 5770 }, { "epoch": 0.18, "learning_rate": 7.3920000000000005e-06, "loss": 1.0273, "step": 5775 }, { "epoch": 0.18, "learning_rate": 7.398400000000001e-06, "loss": 1.0215, "step": 5780 }, { "epoch": 0.19, "learning_rate": 7.404800000000001e-06, "loss": 1.0135, "step": 5785 }, { "epoch": 0.19, "learning_rate": 7.4112e-06, "loss": 1.0169, "step": 5790 }, { "epoch": 0.19, "learning_rate": 7.417600000000001e-06, "loss": 1.0262, "step": 5795 }, { "epoch": 0.19, "learning_rate": 7.424e-06, "loss": 1.0164, "step": 5800 }, { "epoch": 0.19, "learning_rate": 7.430400000000001e-06, "loss": 1.0261, "step": 5805 }, { "epoch": 0.19, "learning_rate": 7.4368000000000005e-06, "loss": 1.0103, "step": 5810 }, { "epoch": 0.19, "learning_rate": 7.4432e-06, "loss": 1.0129, "step": 5815 }, { "epoch": 0.19, "learning_rate": 7.4496e-06, "loss": 1.0269, "step": 5820 }, { "epoch": 0.19, "learning_rate": 7.456000000000001e-06, "loss": 1.0242, "step": 5825 }, { "epoch": 0.19, "learning_rate": 7.462400000000001e-06, "loss": 1.0315, "step": 5830 }, { "epoch": 0.19, "learning_rate": 7.4688e-06, "loss": 1.0285, "step": 5835 }, { "epoch": 0.19, "learning_rate": 7.4752e-06, "loss": 1.0257, "step": 5840 }, { "epoch": 0.19, "learning_rate": 7.481600000000001e-06, "loss": 1.0245, "step": 5845 }, { "epoch": 0.19, "learning_rate": 7.488000000000001e-06, "loss": 1.0216, "step": 5850 }, { "epoch": 0.19, "learning_rate": 7.494400000000001e-06, "loss": 1.0197, "step": 5855 }, { "epoch": 0.19, "learning_rate": 7.5008e-06, "loss": 1.0173, "step": 5860 }, { "epoch": 0.19, "learning_rate": 7.507200000000001e-06, "loss": 1.0199, "step": 5865 }, { "epoch": 0.19, "learning_rate": 7.513600000000001e-06, "loss": 1.0172, "step": 5870 }, { "epoch": 0.19, "learning_rate": 7.520000000000001e-06, "loss": 1.0036, "step": 5875 }, { "epoch": 0.19, "learning_rate": 7.5264000000000005e-06, "loss": 1.0237, "step": 5880 }, { "epoch": 0.19, "learning_rate": 7.5328e-06, "loss": 1.0295, "step": 5885 }, { "epoch": 0.19, "learning_rate": 7.539200000000001e-06, "loss": 1.0135, "step": 5890 }, { "epoch": 0.19, "learning_rate": 7.545600000000001e-06, "loss": 1.0369, "step": 5895 }, { "epoch": 0.19, "learning_rate": 7.552000000000001e-06, "loss": 1.0127, "step": 5900 }, { "epoch": 0.19, "learning_rate": 7.5584e-06, "loss": 1.0194, "step": 5905 }, { "epoch": 0.19, "learning_rate": 7.564800000000001e-06, "loss": 1.0172, "step": 5910 }, { "epoch": 0.19, "learning_rate": 7.5712000000000005e-06, "loss": 1.0165, "step": 5915 }, { "epoch": 0.19, "learning_rate": 7.5776e-06, "loss": 1.0187, "step": 5920 }, { "epoch": 0.19, "learning_rate": 7.5840000000000006e-06, "loss": 1.0038, "step": 5925 }, { "epoch": 0.19, "learning_rate": 7.590400000000001e-06, "loss": 1.014, "step": 5930 }, { "epoch": 0.19, "learning_rate": 7.596800000000001e-06, "loss": 1.0166, "step": 5935 }, { "epoch": 0.19, "learning_rate": 7.6032e-06, "loss": 1.0013, "step": 5940 }, { "epoch": 0.19, "learning_rate": 7.6096e-06, "loss": 1.0189, "step": 5945 }, { "epoch": 0.19, "learning_rate": 7.616000000000001e-06, "loss": 1.0127, "step": 5950 }, { "epoch": 0.19, "learning_rate": 7.622400000000001e-06, "loss": 1.014, "step": 5955 }, { "epoch": 0.19, "learning_rate": 7.6288000000000005e-06, "loss": 1.0311, "step": 5960 }, { "epoch": 0.19, "learning_rate": 7.635200000000001e-06, "loss": 1.0022, "step": 5965 }, { "epoch": 0.19, "learning_rate": 7.6416e-06, "loss": 1.003, "step": 5970 }, { "epoch": 0.19, "learning_rate": 7.648e-06, "loss": 1.0197, "step": 5975 }, { "epoch": 0.19, "learning_rate": 7.6544e-06, "loss": 1.0194, "step": 5980 }, { "epoch": 0.19, "learning_rate": 7.660800000000001e-06, "loss": 1.0099, "step": 5985 }, { "epoch": 0.19, "learning_rate": 7.6672e-06, "loss": 1.0115, "step": 5990 }, { "epoch": 0.19, "learning_rate": 7.6736e-06, "loss": 1.0061, "step": 5995 }, { "epoch": 0.19, "learning_rate": 7.680000000000001e-06, "loss": 1.0131, "step": 6000 }, { "epoch": 0.19, "learning_rate": 7.6864e-06, "loss": 1.02, "step": 6005 }, { "epoch": 0.19, "learning_rate": 7.6928e-06, "loss": 1.0006, "step": 6010 }, { "epoch": 0.19, "learning_rate": 7.6992e-06, "loss": 1.0154, "step": 6015 }, { "epoch": 0.19, "learning_rate": 7.705600000000001e-06, "loss": 1.0283, "step": 6020 }, { "epoch": 0.19, "learning_rate": 7.712e-06, "loss": 1.0086, "step": 6025 }, { "epoch": 0.19, "learning_rate": 7.7184e-06, "loss": 0.9959, "step": 6030 }, { "epoch": 0.19, "learning_rate": 7.724800000000001e-06, "loss": 1.0283, "step": 6035 }, { "epoch": 0.19, "learning_rate": 7.731200000000001e-06, "loss": 1.0063, "step": 6040 }, { "epoch": 0.19, "learning_rate": 7.7376e-06, "loss": 1.0115, "step": 6045 }, { "epoch": 0.19, "learning_rate": 7.744e-06, "loss": 1.0161, "step": 6050 }, { "epoch": 0.19, "learning_rate": 7.7504e-06, "loss": 0.9981, "step": 6055 }, { "epoch": 0.19, "learning_rate": 7.756800000000002e-06, "loss": 1.0175, "step": 6060 }, { "epoch": 0.19, "learning_rate": 7.7632e-06, "loss": 1.0056, "step": 6065 }, { "epoch": 0.19, "learning_rate": 7.769600000000001e-06, "loss": 1.0104, "step": 6070 }, { "epoch": 0.19, "learning_rate": 7.776e-06, "loss": 1.0034, "step": 6075 }, { "epoch": 0.19, "learning_rate": 7.7824e-06, "loss": 1.0135, "step": 6080 }, { "epoch": 0.19, "learning_rate": 7.7888e-06, "loss": 1.0196, "step": 6085 }, { "epoch": 0.19, "learning_rate": 7.795200000000001e-06, "loss": 1.0129, "step": 6090 }, { "epoch": 0.2, "learning_rate": 7.8016e-06, "loss": 0.9997, "step": 6095 }, { "epoch": 0.2, "learning_rate": 7.808e-06, "loss": 1.014, "step": 6100 }, { "epoch": 0.2, "learning_rate": 7.814400000000001e-06, "loss": 1.0185, "step": 6105 }, { "epoch": 0.2, "learning_rate": 7.820800000000001e-06, "loss": 1.0121, "step": 6110 }, { "epoch": 0.2, "learning_rate": 7.8272e-06, "loss": 1.0132, "step": 6115 }, { "epoch": 0.2, "learning_rate": 7.8336e-06, "loss": 1.0053, "step": 6120 }, { "epoch": 0.2, "learning_rate": 7.840000000000001e-06, "loss": 1.0149, "step": 6125 }, { "epoch": 0.2, "learning_rate": 7.8464e-06, "loss": 0.9911, "step": 6130 }, { "epoch": 0.2, "learning_rate": 7.8528e-06, "loss": 1.0041, "step": 6135 }, { "epoch": 0.2, "learning_rate": 7.859200000000001e-06, "loss": 1.0129, "step": 6140 }, { "epoch": 0.2, "learning_rate": 7.865600000000001e-06, "loss": 1.0186, "step": 6145 }, { "epoch": 0.2, "learning_rate": 7.872e-06, "loss": 1.0348, "step": 6150 }, { "epoch": 0.2, "learning_rate": 7.8784e-06, "loss": 0.9939, "step": 6155 }, { "epoch": 0.2, "learning_rate": 7.8848e-06, "loss": 1.0114, "step": 6160 }, { "epoch": 0.2, "learning_rate": 7.891200000000002e-06, "loss": 1.0001, "step": 6165 }, { "epoch": 0.2, "learning_rate": 7.8976e-06, "loss": 0.9871, "step": 6170 }, { "epoch": 0.2, "learning_rate": 7.904000000000001e-06, "loss": 1.0123, "step": 6175 }, { "epoch": 0.2, "learning_rate": 7.9104e-06, "loss": 1.0083, "step": 6180 }, { "epoch": 0.2, "learning_rate": 7.916800000000002e-06, "loss": 0.9998, "step": 6185 }, { "epoch": 0.2, "learning_rate": 7.9232e-06, "loss": 1.0081, "step": 6190 }, { "epoch": 0.2, "learning_rate": 7.929600000000001e-06, "loss": 1.0202, "step": 6195 }, { "epoch": 0.2, "learning_rate": 7.936e-06, "loss": 1.0073, "step": 6200 }, { "epoch": 0.2, "learning_rate": 7.9424e-06, "loss": 0.9925, "step": 6205 }, { "epoch": 0.2, "learning_rate": 7.948800000000001e-06, "loss": 1.0175, "step": 6210 }, { "epoch": 0.2, "learning_rate": 7.955200000000001e-06, "loss": 1.0017, "step": 6215 }, { "epoch": 0.2, "learning_rate": 7.9616e-06, "loss": 1.0201, "step": 6220 }, { "epoch": 0.2, "learning_rate": 7.968e-06, "loss": 1.0017, "step": 6225 }, { "epoch": 0.2, "learning_rate": 7.974400000000001e-06, "loss": 1.0038, "step": 6230 }, { "epoch": 0.2, "learning_rate": 7.980800000000002e-06, "loss": 1.0057, "step": 6235 }, { "epoch": 0.2, "learning_rate": 7.9872e-06, "loss": 0.9943, "step": 6240 }, { "epoch": 0.2, "learning_rate": 7.993600000000001e-06, "loss": 0.9988, "step": 6245 }, { "epoch": 0.2, "learning_rate": 8.000000000000001e-06, "loss": 1.0061, "step": 6250 }, { "epoch": 0.2, "learning_rate": 8.0064e-06, "loss": 1.0027, "step": 6255 }, { "epoch": 0.2, "learning_rate": 8.0128e-06, "loss": 1.0096, "step": 6260 }, { "epoch": 0.2, "learning_rate": 8.019200000000001e-06, "loss": 1.0024, "step": 6265 }, { "epoch": 0.2, "learning_rate": 8.025600000000002e-06, "loss": 1.0018, "step": 6270 }, { "epoch": 0.2, "learning_rate": 8.032e-06, "loss": 1.0145, "step": 6275 }, { "epoch": 0.2, "learning_rate": 8.0384e-06, "loss": 1.0073, "step": 6280 }, { "epoch": 0.2, "learning_rate": 8.0448e-06, "loss": 1.0182, "step": 6285 }, { "epoch": 0.2, "learning_rate": 8.0512e-06, "loss": 1.0026, "step": 6290 }, { "epoch": 0.2, "learning_rate": 8.0576e-06, "loss": 1.0011, "step": 6295 }, { "epoch": 0.2, "learning_rate": 8.064000000000001e-06, "loss": 1.0114, "step": 6300 }, { "epoch": 0.2, "learning_rate": 8.0704e-06, "loss": 0.9968, "step": 6305 }, { "epoch": 0.2, "learning_rate": 8.0768e-06, "loss": 0.9973, "step": 6310 }, { "epoch": 0.2, "learning_rate": 8.0832e-06, "loss": 0.9983, "step": 6315 }, { "epoch": 0.2, "learning_rate": 8.089600000000001e-06, "loss": 1.0231, "step": 6320 }, { "epoch": 0.2, "learning_rate": 8.096e-06, "loss": 1.0109, "step": 6325 }, { "epoch": 0.2, "learning_rate": 8.1024e-06, "loss": 1.0037, "step": 6330 }, { "epoch": 0.2, "learning_rate": 8.108800000000001e-06, "loss": 0.9971, "step": 6335 }, { "epoch": 0.2, "learning_rate": 8.115200000000002e-06, "loss": 0.996, "step": 6340 }, { "epoch": 0.2, "learning_rate": 8.1216e-06, "loss": 1.0111, "step": 6345 }, { "epoch": 0.2, "learning_rate": 8.128e-06, "loss": 0.9987, "step": 6350 }, { "epoch": 0.2, "learning_rate": 8.134400000000001e-06, "loss": 1.0042, "step": 6355 }, { "epoch": 0.2, "learning_rate": 8.140800000000002e-06, "loss": 1.0009, "step": 6360 }, { "epoch": 0.2, "learning_rate": 8.1472e-06, "loss": 0.9924, "step": 6365 }, { "epoch": 0.2, "learning_rate": 8.153600000000001e-06, "loss": 1.0061, "step": 6370 }, { "epoch": 0.2, "learning_rate": 8.16e-06, "loss": 0.9997, "step": 6375 }, { "epoch": 0.2, "learning_rate": 8.1664e-06, "loss": 0.9925, "step": 6380 }, { "epoch": 0.2, "learning_rate": 8.1728e-06, "loss": 1.0199, "step": 6385 }, { "epoch": 0.2, "learning_rate": 8.179200000000001e-06, "loss": 0.9964, "step": 6390 }, { "epoch": 0.2, "learning_rate": 8.1856e-06, "loss": 1.0075, "step": 6395 }, { "epoch": 0.2, "learning_rate": 8.192e-06, "loss": 1.0074, "step": 6400 }, { "epoch": 0.2, "learning_rate": 8.198400000000001e-06, "loss": 0.9893, "step": 6405 }, { "epoch": 0.21, "learning_rate": 8.2048e-06, "loss": 0.9958, "step": 6410 }, { "epoch": 0.21, "learning_rate": 8.2112e-06, "loss": 0.9877, "step": 6415 }, { "epoch": 0.21, "learning_rate": 8.2176e-06, "loss": 0.985, "step": 6420 }, { "epoch": 0.21, "learning_rate": 8.224000000000001e-06, "loss": 0.9946, "step": 6425 }, { "epoch": 0.21, "learning_rate": 8.2304e-06, "loss": 1.0027, "step": 6430 }, { "epoch": 0.21, "learning_rate": 8.2368e-06, "loss": 0.9975, "step": 6435 }, { "epoch": 0.21, "learning_rate": 8.243200000000001e-06, "loss": 0.9843, "step": 6440 }, { "epoch": 0.21, "learning_rate": 8.249600000000001e-06, "loss": 1.0027, "step": 6445 }, { "epoch": 0.21, "learning_rate": 8.256e-06, "loss": 0.9821, "step": 6450 }, { "epoch": 0.21, "learning_rate": 8.2624e-06, "loss": 0.994, "step": 6455 }, { "epoch": 0.21, "learning_rate": 8.2688e-06, "loss": 1.0038, "step": 6460 }, { "epoch": 0.21, "learning_rate": 8.275200000000002e-06, "loss": 0.9958, "step": 6465 }, { "epoch": 0.21, "learning_rate": 8.2816e-06, "loss": 1.0042, "step": 6470 }, { "epoch": 0.21, "learning_rate": 8.288000000000001e-06, "loss": 1.0105, "step": 6475 }, { "epoch": 0.21, "learning_rate": 8.2944e-06, "loss": 0.9932, "step": 6480 }, { "epoch": 0.21, "learning_rate": 8.300800000000002e-06, "loss": 1.0046, "step": 6485 }, { "epoch": 0.21, "learning_rate": 8.3072e-06, "loss": 0.9986, "step": 6490 }, { "epoch": 0.21, "learning_rate": 8.313600000000001e-06, "loss": 1.0022, "step": 6495 }, { "epoch": 0.21, "learning_rate": 8.32e-06, "loss": 0.9939, "step": 6500 }, { "epoch": 0.21, "learning_rate": 8.3264e-06, "loss": 1.0096, "step": 6505 }, { "epoch": 0.21, "learning_rate": 8.332800000000001e-06, "loss": 1.0108, "step": 6510 }, { "epoch": 0.21, "learning_rate": 8.339200000000001e-06, "loss": 0.9836, "step": 6515 }, { "epoch": 0.21, "learning_rate": 8.3456e-06, "loss": 0.9977, "step": 6520 }, { "epoch": 0.21, "learning_rate": 8.352e-06, "loss": 0.9927, "step": 6525 }, { "epoch": 0.21, "learning_rate": 8.358400000000001e-06, "loss": 0.9983, "step": 6530 }, { "epoch": 0.21, "learning_rate": 8.3648e-06, "loss": 1.0027, "step": 6535 }, { "epoch": 0.21, "learning_rate": 8.3712e-06, "loss": 1.0072, "step": 6540 }, { "epoch": 0.21, "learning_rate": 8.377600000000001e-06, "loss": 1.0042, "step": 6545 }, { "epoch": 0.21, "learning_rate": 8.384000000000001e-06, "loss": 1.0007, "step": 6550 }, { "epoch": 0.21, "learning_rate": 8.3904e-06, "loss": 0.9776, "step": 6555 }, { "epoch": 0.21, "learning_rate": 8.3968e-06, "loss": 0.9978, "step": 6560 }, { "epoch": 0.21, "learning_rate": 8.4032e-06, "loss": 0.9871, "step": 6565 }, { "epoch": 0.21, "learning_rate": 8.409600000000002e-06, "loss": 0.9843, "step": 6570 }, { "epoch": 0.21, "learning_rate": 8.416e-06, "loss": 0.9816, "step": 6575 }, { "epoch": 0.21, "learning_rate": 8.422400000000001e-06, "loss": 0.9946, "step": 6580 }, { "epoch": 0.21, "learning_rate": 8.4288e-06, "loss": 0.9942, "step": 6585 }, { "epoch": 0.21, "learning_rate": 8.435200000000002e-06, "loss": 0.9847, "step": 6590 }, { "epoch": 0.21, "learning_rate": 8.4416e-06, "loss": 0.9925, "step": 6595 }, { "epoch": 0.21, "learning_rate": 8.448000000000001e-06, "loss": 0.9974, "step": 6600 }, { "epoch": 0.21, "learning_rate": 8.4544e-06, "loss": 0.9997, "step": 6605 }, { "epoch": 0.21, "learning_rate": 8.460800000000002e-06, "loss": 0.9877, "step": 6610 }, { "epoch": 0.21, "learning_rate": 8.467200000000001e-06, "loss": 0.989, "step": 6615 }, { "epoch": 0.21, "learning_rate": 8.473600000000001e-06, "loss": 0.9954, "step": 6620 }, { "epoch": 0.21, "learning_rate": 8.48e-06, "loss": 0.9919, "step": 6625 }, { "epoch": 0.21, "learning_rate": 8.4864e-06, "loss": 0.9787, "step": 6630 }, { "epoch": 0.21, "learning_rate": 8.492800000000001e-06, "loss": 0.9987, "step": 6635 }, { "epoch": 0.21, "learning_rate": 8.499200000000002e-06, "loss": 1.008, "step": 6640 }, { "epoch": 0.21, "learning_rate": 8.5056e-06, "loss": 0.984, "step": 6645 }, { "epoch": 0.21, "learning_rate": 8.512e-06, "loss": 1.0007, "step": 6650 }, { "epoch": 0.21, "learning_rate": 8.518400000000001e-06, "loss": 0.9918, "step": 6655 }, { "epoch": 0.21, "learning_rate": 8.5248e-06, "loss": 0.9753, "step": 6660 }, { "epoch": 0.21, "learning_rate": 8.5312e-06, "loss": 0.9789, "step": 6665 }, { "epoch": 0.21, "learning_rate": 8.537600000000001e-06, "loss": 0.9953, "step": 6670 }, { "epoch": 0.21, "learning_rate": 8.544000000000002e-06, "loss": 1.0014, "step": 6675 }, { "epoch": 0.21, "learning_rate": 8.5504e-06, "loss": 0.9956, "step": 6680 }, { "epoch": 0.21, "learning_rate": 8.5568e-06, "loss": 0.9911, "step": 6685 }, { "epoch": 0.21, "learning_rate": 8.5632e-06, "loss": 0.986, "step": 6690 }, { "epoch": 0.21, "learning_rate": 8.569600000000002e-06, "loss": 0.9825, "step": 6695 }, { "epoch": 0.21, "learning_rate": 8.576e-06, "loss": 1.0011, "step": 6700 }, { "epoch": 0.21, "learning_rate": 8.582400000000001e-06, "loss": 0.9717, "step": 6705 }, { "epoch": 0.21, "learning_rate": 8.5888e-06, "loss": 0.9864, "step": 6710 }, { "epoch": 0.21, "learning_rate": 8.5952e-06, "loss": 0.9962, "step": 6715 }, { "epoch": 0.22, "learning_rate": 8.6016e-06, "loss": 1.0024, "step": 6720 }, { "epoch": 0.22, "learning_rate": 8.608000000000001e-06, "loss": 0.9769, "step": 6725 }, { "epoch": 0.22, "learning_rate": 8.6144e-06, "loss": 0.9892, "step": 6730 }, { "epoch": 0.22, "learning_rate": 8.6208e-06, "loss": 0.9928, "step": 6735 }, { "epoch": 0.22, "learning_rate": 8.627200000000001e-06, "loss": 0.9906, "step": 6740 }, { "epoch": 0.22, "learning_rate": 8.633600000000001e-06, "loss": 0.9843, "step": 6745 }, { "epoch": 0.22, "learning_rate": 8.64e-06, "loss": 0.9921, "step": 6750 }, { "epoch": 0.22, "learning_rate": 8.6464e-06, "loss": 0.9954, "step": 6755 }, { "epoch": 0.22, "learning_rate": 8.652800000000001e-06, "loss": 0.993, "step": 6760 }, { "epoch": 0.22, "learning_rate": 8.659200000000002e-06, "loss": 0.9825, "step": 6765 }, { "epoch": 0.22, "learning_rate": 8.6656e-06, "loss": 1.0045, "step": 6770 }, { "epoch": 0.22, "learning_rate": 8.672000000000001e-06, "loss": 1.0073, "step": 6775 }, { "epoch": 0.22, "learning_rate": 8.6784e-06, "loss": 1.0027, "step": 6780 }, { "epoch": 0.22, "learning_rate": 8.6848e-06, "loss": 0.9958, "step": 6785 }, { "epoch": 0.22, "learning_rate": 8.6912e-06, "loss": 0.9869, "step": 6790 }, { "epoch": 0.22, "learning_rate": 8.697600000000001e-06, "loss": 0.9893, "step": 6795 }, { "epoch": 0.22, "learning_rate": 8.704e-06, "loss": 0.9952, "step": 6800 }, { "epoch": 0.22, "learning_rate": 8.7104e-06, "loss": 0.9811, "step": 6805 }, { "epoch": 0.22, "learning_rate": 8.716800000000001e-06, "loss": 0.9807, "step": 6810 }, { "epoch": 0.22, "learning_rate": 8.7232e-06, "loss": 0.9734, "step": 6815 }, { "epoch": 0.22, "learning_rate": 8.7296e-06, "loss": 0.9782, "step": 6820 }, { "epoch": 0.22, "learning_rate": 8.736e-06, "loss": 0.9795, "step": 6825 }, { "epoch": 0.22, "learning_rate": 8.742400000000001e-06, "loss": 0.9945, "step": 6830 }, { "epoch": 0.22, "learning_rate": 8.7488e-06, "loss": 0.9985, "step": 6835 }, { "epoch": 0.22, "learning_rate": 8.7552e-06, "loss": 0.9905, "step": 6840 }, { "epoch": 0.22, "learning_rate": 8.761600000000001e-06, "loss": 0.9881, "step": 6845 }, { "epoch": 0.22, "learning_rate": 8.768000000000001e-06, "loss": 0.9986, "step": 6850 }, { "epoch": 0.22, "learning_rate": 8.7744e-06, "loss": 0.9943, "step": 6855 }, { "epoch": 0.22, "learning_rate": 8.7808e-06, "loss": 0.9836, "step": 6860 }, { "epoch": 0.22, "learning_rate": 8.7872e-06, "loss": 0.9885, "step": 6865 }, { "epoch": 0.22, "learning_rate": 8.793600000000002e-06, "loss": 0.9719, "step": 6870 }, { "epoch": 0.22, "learning_rate": 8.8e-06, "loss": 0.978, "step": 6875 }, { "epoch": 0.22, "learning_rate": 8.806400000000001e-06, "loss": 0.9883, "step": 6880 }, { "epoch": 0.22, "learning_rate": 8.8128e-06, "loss": 0.9868, "step": 6885 }, { "epoch": 0.22, "learning_rate": 8.819200000000002e-06, "loss": 0.9955, "step": 6890 }, { "epoch": 0.22, "learning_rate": 8.8256e-06, "loss": 0.98, "step": 6895 }, { "epoch": 0.22, "learning_rate": 8.832000000000001e-06, "loss": 0.9979, "step": 6900 }, { "epoch": 0.22, "learning_rate": 8.8384e-06, "loss": 0.9776, "step": 6905 }, { "epoch": 0.22, "learning_rate": 8.8448e-06, "loss": 0.9883, "step": 6910 }, { "epoch": 0.22, "learning_rate": 8.851200000000001e-06, "loss": 0.9757, "step": 6915 }, { "epoch": 0.22, "learning_rate": 8.857600000000001e-06, "loss": 0.9742, "step": 6920 }, { "epoch": 0.22, "learning_rate": 8.864e-06, "loss": 0.9842, "step": 6925 }, { "epoch": 0.22, "learning_rate": 8.8704e-06, "loss": 0.9828, "step": 6930 }, { "epoch": 0.22, "learning_rate": 8.876800000000001e-06, "loss": 0.9903, "step": 6935 }, { "epoch": 0.22, "learning_rate": 8.8832e-06, "loss": 0.986, "step": 6940 }, { "epoch": 0.22, "learning_rate": 8.8896e-06, "loss": 0.9862, "step": 6945 }, { "epoch": 0.22, "learning_rate": 8.896000000000001e-06, "loss": 0.9805, "step": 6950 }, { "epoch": 0.22, "learning_rate": 8.902400000000001e-06, "loss": 0.9862, "step": 6955 }, { "epoch": 0.22, "learning_rate": 8.9088e-06, "loss": 0.9696, "step": 6960 }, { "epoch": 0.22, "learning_rate": 8.9152e-06, "loss": 0.9806, "step": 6965 }, { "epoch": 0.22, "learning_rate": 8.9216e-06, "loss": 0.9681, "step": 6970 }, { "epoch": 0.22, "learning_rate": 8.928000000000002e-06, "loss": 0.9698, "step": 6975 }, { "epoch": 0.22, "learning_rate": 8.9344e-06, "loss": 0.9781, "step": 6980 }, { "epoch": 0.22, "learning_rate": 8.940800000000001e-06, "loss": 0.983, "step": 6985 }, { "epoch": 0.22, "learning_rate": 8.9472e-06, "loss": 0.9878, "step": 6990 }, { "epoch": 0.22, "learning_rate": 8.953600000000002e-06, "loss": 0.9852, "step": 6995 }, { "epoch": 0.22, "learning_rate": 8.96e-06, "loss": 0.9707, "step": 7000 }, { "epoch": 0.22, "learning_rate": 8.966400000000001e-06, "loss": 0.9822, "step": 7005 }, { "epoch": 0.22, "learning_rate": 8.9728e-06, "loss": 0.9905, "step": 7010 }, { "epoch": 0.22, "learning_rate": 8.979200000000002e-06, "loss": 0.9615, "step": 7015 }, { "epoch": 0.22, "learning_rate": 8.9856e-06, "loss": 0.9782, "step": 7020 }, { "epoch": 0.22, "learning_rate": 8.992000000000001e-06, "loss": 0.9761, "step": 7025 }, { "epoch": 0.22, "learning_rate": 8.9984e-06, "loss": 0.9848, "step": 7030 }, { "epoch": 0.23, "learning_rate": 9.0048e-06, "loss": 0.986, "step": 7035 }, { "epoch": 0.23, "learning_rate": 9.011200000000001e-06, "loss": 0.9895, "step": 7040 }, { "epoch": 0.23, "learning_rate": 9.017600000000002e-06, "loss": 0.9893, "step": 7045 }, { "epoch": 0.23, "learning_rate": 9.024e-06, "loss": 0.9722, "step": 7050 }, { "epoch": 0.23, "learning_rate": 9.0304e-06, "loss": 0.981, "step": 7055 }, { "epoch": 0.23, "learning_rate": 9.036800000000001e-06, "loss": 0.9785, "step": 7060 }, { "epoch": 0.23, "learning_rate": 9.0432e-06, "loss": 0.9644, "step": 7065 }, { "epoch": 0.23, "learning_rate": 9.0496e-06, "loss": 0.9773, "step": 7070 }, { "epoch": 0.23, "learning_rate": 9.056000000000001e-06, "loss": 0.9854, "step": 7075 }, { "epoch": 0.23, "learning_rate": 9.062400000000002e-06, "loss": 0.9844, "step": 7080 }, { "epoch": 0.23, "learning_rate": 9.0688e-06, "loss": 0.9946, "step": 7085 }, { "epoch": 0.23, "learning_rate": 9.0752e-06, "loss": 0.9801, "step": 7090 }, { "epoch": 0.23, "learning_rate": 9.0816e-06, "loss": 1.0026, "step": 7095 }, { "epoch": 0.23, "learning_rate": 9.088000000000002e-06, "loss": 0.9759, "step": 7100 }, { "epoch": 0.23, "learning_rate": 9.0944e-06, "loss": 0.9847, "step": 7105 }, { "epoch": 0.23, "learning_rate": 9.100800000000001e-06, "loss": 0.9812, "step": 7110 }, { "epoch": 0.23, "learning_rate": 9.1072e-06, "loss": 0.9645, "step": 7115 }, { "epoch": 0.23, "learning_rate": 9.1136e-06, "loss": 0.9731, "step": 7120 }, { "epoch": 0.23, "learning_rate": 9.12e-06, "loss": 0.9727, "step": 7125 }, { "epoch": 0.23, "learning_rate": 9.126400000000001e-06, "loss": 0.9815, "step": 7130 }, { "epoch": 0.23, "learning_rate": 9.1328e-06, "loss": 0.9722, "step": 7135 }, { "epoch": 0.23, "learning_rate": 9.1392e-06, "loss": 0.976, "step": 7140 }, { "epoch": 0.23, "learning_rate": 9.145600000000001e-06, "loss": 0.9782, "step": 7145 }, { "epoch": 0.23, "learning_rate": 9.152000000000001e-06, "loss": 0.9693, "step": 7150 }, { "epoch": 0.23, "learning_rate": 9.1584e-06, "loss": 0.9755, "step": 7155 }, { "epoch": 0.23, "learning_rate": 9.1648e-06, "loss": 0.9765, "step": 7160 }, { "epoch": 0.23, "learning_rate": 9.171200000000001e-06, "loss": 0.9757, "step": 7165 }, { "epoch": 0.23, "learning_rate": 9.177600000000002e-06, "loss": 0.9711, "step": 7170 }, { "epoch": 0.23, "learning_rate": 9.184e-06, "loss": 0.9735, "step": 7175 }, { "epoch": 0.23, "learning_rate": 9.190400000000001e-06, "loss": 0.9923, "step": 7180 }, { "epoch": 0.23, "learning_rate": 9.196800000000001e-06, "loss": 0.9738, "step": 7185 }, { "epoch": 0.23, "learning_rate": 9.2032e-06, "loss": 0.9627, "step": 7190 }, { "epoch": 0.23, "learning_rate": 9.2096e-06, "loss": 0.9715, "step": 7195 }, { "epoch": 0.23, "learning_rate": 9.216000000000001e-06, "loss": 0.9722, "step": 7200 }, { "epoch": 0.23, "learning_rate": 9.2224e-06, "loss": 0.9798, "step": 7205 }, { "epoch": 0.23, "learning_rate": 9.2288e-06, "loss": 0.982, "step": 7210 }, { "epoch": 0.23, "learning_rate": 9.235200000000001e-06, "loss": 0.9637, "step": 7215 }, { "epoch": 0.23, "learning_rate": 9.2416e-06, "loss": 0.9772, "step": 7220 }, { "epoch": 0.23, "learning_rate": 9.248e-06, "loss": 0.9614, "step": 7225 }, { "epoch": 0.23, "learning_rate": 9.2544e-06, "loss": 0.9879, "step": 7230 }, { "epoch": 0.23, "learning_rate": 9.260800000000001e-06, "loss": 0.9632, "step": 7235 }, { "epoch": 0.23, "learning_rate": 9.2672e-06, "loss": 0.9738, "step": 7240 }, { "epoch": 0.23, "learning_rate": 9.2736e-06, "loss": 0.9791, "step": 7245 }, { "epoch": 0.23, "learning_rate": 9.280000000000001e-06, "loss": 0.9843, "step": 7250 }, { "epoch": 0.23, "learning_rate": 9.286400000000001e-06, "loss": 0.9616, "step": 7255 }, { "epoch": 0.23, "learning_rate": 9.2928e-06, "loss": 0.9788, "step": 7260 }, { "epoch": 0.23, "learning_rate": 9.2992e-06, "loss": 0.9705, "step": 7265 }, { "epoch": 0.23, "learning_rate": 9.305600000000001e-06, "loss": 0.9778, "step": 7270 }, { "epoch": 0.23, "learning_rate": 9.312000000000002e-06, "loss": 0.9529, "step": 7275 }, { "epoch": 0.23, "learning_rate": 9.3184e-06, "loss": 0.971, "step": 7280 }, { "epoch": 0.23, "learning_rate": 9.324800000000001e-06, "loss": 0.9659, "step": 7285 }, { "epoch": 0.23, "learning_rate": 9.3312e-06, "loss": 0.9653, "step": 7290 }, { "epoch": 0.23, "learning_rate": 9.337600000000002e-06, "loss": 0.9605, "step": 7295 }, { "epoch": 0.23, "learning_rate": 9.344e-06, "loss": 0.9651, "step": 7300 }, { "epoch": 0.23, "learning_rate": 9.350400000000001e-06, "loss": 0.9772, "step": 7305 }, { "epoch": 0.23, "learning_rate": 9.3568e-06, "loss": 0.9741, "step": 7310 }, { "epoch": 0.23, "learning_rate": 9.3632e-06, "loss": 0.9713, "step": 7315 }, { "epoch": 0.23, "learning_rate": 9.369600000000001e-06, "loss": 0.9743, "step": 7320 }, { "epoch": 0.23, "learning_rate": 9.376000000000001e-06, "loss": 0.9732, "step": 7325 }, { "epoch": 0.23, "learning_rate": 9.3824e-06, "loss": 0.9696, "step": 7330 }, { "epoch": 0.23, "learning_rate": 9.3888e-06, "loss": 0.9776, "step": 7335 }, { "epoch": 0.23, "learning_rate": 9.395200000000001e-06, "loss": 0.9802, "step": 7340 }, { "epoch": 0.24, "learning_rate": 9.4016e-06, "loss": 0.9635, "step": 7345 }, { "epoch": 0.24, "learning_rate": 9.408e-06, "loss": 0.9762, "step": 7350 }, { "epoch": 0.24, "learning_rate": 9.414400000000001e-06, "loss": 0.9474, "step": 7355 }, { "epoch": 0.24, "learning_rate": 9.420800000000001e-06, "loss": 0.9805, "step": 7360 }, { "epoch": 0.24, "learning_rate": 9.4272e-06, "loss": 0.9696, "step": 7365 }, { "epoch": 0.24, "learning_rate": 9.4336e-06, "loss": 0.9584, "step": 7370 }, { "epoch": 0.24, "learning_rate": 9.440000000000001e-06, "loss": 0.9665, "step": 7375 }, { "epoch": 0.24, "learning_rate": 9.446400000000002e-06, "loss": 0.9616, "step": 7380 }, { "epoch": 0.24, "learning_rate": 9.4528e-06, "loss": 0.9598, "step": 7385 }, { "epoch": 0.24, "learning_rate": 9.4592e-06, "loss": 0.9786, "step": 7390 }, { "epoch": 0.24, "learning_rate": 9.4656e-06, "loss": 0.9625, "step": 7395 }, { "epoch": 0.24, "learning_rate": 9.472000000000002e-06, "loss": 0.9626, "step": 7400 }, { "epoch": 0.24, "learning_rate": 9.4784e-06, "loss": 0.9677, "step": 7405 }, { "epoch": 0.24, "learning_rate": 9.484800000000001e-06, "loss": 0.9677, "step": 7410 }, { "epoch": 0.24, "learning_rate": 9.4912e-06, "loss": 0.983, "step": 7415 }, { "epoch": 0.24, "learning_rate": 9.497600000000002e-06, "loss": 0.9876, "step": 7420 }, { "epoch": 0.24, "learning_rate": 9.504e-06, "loss": 0.9888, "step": 7425 }, { "epoch": 0.24, "learning_rate": 9.510400000000001e-06, "loss": 0.9588, "step": 7430 }, { "epoch": 0.24, "learning_rate": 9.5168e-06, "loss": 0.9681, "step": 7435 }, { "epoch": 0.24, "learning_rate": 9.5232e-06, "loss": 0.9686, "step": 7440 }, { "epoch": 0.24, "learning_rate": 9.529600000000001e-06, "loss": 0.9601, "step": 7445 }, { "epoch": 0.24, "learning_rate": 9.536000000000002e-06, "loss": 0.9679, "step": 7450 }, { "epoch": 0.24, "learning_rate": 9.5424e-06, "loss": 0.9599, "step": 7455 }, { "epoch": 0.24, "learning_rate": 9.5488e-06, "loss": 0.9674, "step": 7460 }, { "epoch": 0.24, "learning_rate": 9.555200000000001e-06, "loss": 0.967, "step": 7465 }, { "epoch": 0.24, "learning_rate": 9.5616e-06, "loss": 0.9651, "step": 7470 }, { "epoch": 0.24, "learning_rate": 9.568e-06, "loss": 0.9649, "step": 7475 }, { "epoch": 0.24, "learning_rate": 9.574400000000001e-06, "loss": 0.9748, "step": 7480 }, { "epoch": 0.24, "learning_rate": 9.580800000000002e-06, "loss": 0.9587, "step": 7485 }, { "epoch": 0.24, "learning_rate": 9.5872e-06, "loss": 0.9587, "step": 7490 }, { "epoch": 0.24, "learning_rate": 9.5936e-06, "loss": 0.9587, "step": 7495 }, { "epoch": 0.24, "learning_rate": 9.600000000000001e-06, "loss": 0.9726, "step": 7500 }, { "epoch": 0.24, "learning_rate": 9.606400000000002e-06, "loss": 0.9519, "step": 7505 }, { "epoch": 0.24, "learning_rate": 9.6128e-06, "loss": 0.9618, "step": 7510 }, { "epoch": 0.24, "learning_rate": 9.619200000000001e-06, "loss": 0.9678, "step": 7515 }, { "epoch": 0.24, "learning_rate": 9.6256e-06, "loss": 0.9728, "step": 7520 }, { "epoch": 0.24, "learning_rate": 9.632e-06, "loss": 0.9613, "step": 7525 }, { "epoch": 0.24, "learning_rate": 9.6384e-06, "loss": 0.9567, "step": 7530 }, { "epoch": 0.24, "learning_rate": 9.644800000000001e-06, "loss": 0.9592, "step": 7535 }, { "epoch": 0.24, "learning_rate": 9.6512e-06, "loss": 0.9705, "step": 7540 }, { "epoch": 0.24, "learning_rate": 9.6576e-06, "loss": 0.9721, "step": 7545 }, { "epoch": 0.24, "learning_rate": 9.664000000000001e-06, "loss": 0.9618, "step": 7550 }, { "epoch": 0.24, "learning_rate": 9.670400000000001e-06, "loss": 0.9668, "step": 7555 }, { "epoch": 0.24, "learning_rate": 9.6768e-06, "loss": 0.9686, "step": 7560 }, { "epoch": 0.24, "learning_rate": 9.6832e-06, "loss": 0.9758, "step": 7565 }, { "epoch": 0.24, "learning_rate": 9.689600000000001e-06, "loss": 0.9709, "step": 7570 }, { "epoch": 0.24, "learning_rate": 9.696000000000002e-06, "loss": 0.9422, "step": 7575 }, { "epoch": 0.24, "learning_rate": 9.7024e-06, "loss": 0.9618, "step": 7580 }, { "epoch": 0.24, "learning_rate": 9.708800000000001e-06, "loss": 0.9605, "step": 7585 }, { "epoch": 0.24, "learning_rate": 9.715200000000001e-06, "loss": 0.9707, "step": 7590 }, { "epoch": 0.24, "learning_rate": 9.7216e-06, "loss": 0.9623, "step": 7595 }, { "epoch": 0.24, "learning_rate": 9.728e-06, "loss": 0.981, "step": 7600 }, { "epoch": 0.24, "learning_rate": 9.734400000000001e-06, "loss": 0.9803, "step": 7605 }, { "epoch": 0.24, "learning_rate": 9.7408e-06, "loss": 0.9603, "step": 7610 }, { "epoch": 0.24, "learning_rate": 9.7472e-06, "loss": 0.9603, "step": 7615 }, { "epoch": 0.24, "learning_rate": 9.753600000000001e-06, "loss": 0.9659, "step": 7620 }, { "epoch": 0.24, "learning_rate": 9.760000000000001e-06, "loss": 0.9534, "step": 7625 }, { "epoch": 0.24, "learning_rate": 9.7664e-06, "loss": 0.9542, "step": 7630 }, { "epoch": 0.24, "learning_rate": 9.7728e-06, "loss": 0.9696, "step": 7635 }, { "epoch": 0.24, "learning_rate": 9.779200000000001e-06, "loss": 0.9621, "step": 7640 }, { "epoch": 0.24, "learning_rate": 9.7856e-06, "loss": 0.9605, "step": 7645 }, { "epoch": 0.24, "learning_rate": 9.792e-06, "loss": 0.9636, "step": 7650 }, { "epoch": 0.24, "learning_rate": 9.798400000000001e-06, "loss": 0.9728, "step": 7655 }, { "epoch": 0.25, "learning_rate": 9.804800000000001e-06, "loss": 0.963, "step": 7660 }, { "epoch": 0.25, "learning_rate": 9.8112e-06, "loss": 0.9634, "step": 7665 }, { "epoch": 0.25, "learning_rate": 9.8176e-06, "loss": 0.9702, "step": 7670 }, { "epoch": 0.25, "learning_rate": 9.824000000000001e-06, "loss": 0.9435, "step": 7675 }, { "epoch": 0.25, "learning_rate": 9.830400000000002e-06, "loss": 0.9528, "step": 7680 }, { "epoch": 0.25, "learning_rate": 9.8368e-06, "loss": 0.957, "step": 7685 }, { "epoch": 0.25, "learning_rate": 9.843200000000001e-06, "loss": 0.9733, "step": 7690 }, { "epoch": 0.25, "learning_rate": 9.8496e-06, "loss": 0.9593, "step": 7695 }, { "epoch": 0.25, "learning_rate": 9.856000000000002e-06, "loss": 0.9534, "step": 7700 }, { "epoch": 0.25, "learning_rate": 9.8624e-06, "loss": 0.9466, "step": 7705 }, { "epoch": 0.25, "learning_rate": 9.868800000000001e-06, "loss": 0.969, "step": 7710 }, { "epoch": 0.25, "learning_rate": 9.8752e-06, "loss": 0.9587, "step": 7715 }, { "epoch": 0.25, "learning_rate": 9.8816e-06, "loss": 0.9704, "step": 7720 }, { "epoch": 0.25, "learning_rate": 9.888000000000001e-06, "loss": 0.9499, "step": 7725 }, { "epoch": 0.25, "learning_rate": 9.894400000000001e-06, "loss": 0.9482, "step": 7730 }, { "epoch": 0.25, "learning_rate": 9.9008e-06, "loss": 0.9545, "step": 7735 }, { "epoch": 0.25, "learning_rate": 9.9072e-06, "loss": 0.9682, "step": 7740 }, { "epoch": 0.25, "learning_rate": 9.913600000000001e-06, "loss": 0.9582, "step": 7745 }, { "epoch": 0.25, "learning_rate": 9.920000000000002e-06, "loss": 0.9719, "step": 7750 }, { "epoch": 0.25, "learning_rate": 9.9264e-06, "loss": 0.9541, "step": 7755 }, { "epoch": 0.25, "learning_rate": 9.932800000000001e-06, "loss": 0.9784, "step": 7760 }, { "epoch": 0.25, "learning_rate": 9.939200000000001e-06, "loss": 0.9601, "step": 7765 }, { "epoch": 0.25, "learning_rate": 9.9456e-06, "loss": 0.9605, "step": 7770 }, { "epoch": 0.25, "learning_rate": 9.952e-06, "loss": 0.9573, "step": 7775 }, { "epoch": 0.25, "learning_rate": 9.958400000000001e-06, "loss": 0.9599, "step": 7780 }, { "epoch": 0.25, "learning_rate": 9.964800000000002e-06, "loss": 0.9672, "step": 7785 }, { "epoch": 0.25, "learning_rate": 9.9712e-06, "loss": 0.9496, "step": 7790 }, { "epoch": 0.25, "learning_rate": 9.9776e-06, "loss": 0.95, "step": 7795 }, { "epoch": 0.25, "learning_rate": 9.984e-06, "loss": 0.9563, "step": 7800 }, { "epoch": 0.25, "learning_rate": 9.990400000000002e-06, "loss": 0.9676, "step": 7805 }, { "epoch": 0.25, "learning_rate": 9.9968e-06, "loss": 0.9635, "step": 7810 }, { "epoch": 0.25, "learning_rate": 1.0003200000000001e-05, "loss": 0.9633, "step": 7815 }, { "epoch": 0.25, "learning_rate": 1.0009600000000002e-05, "loss": 0.9481, "step": 7820 }, { "epoch": 0.25, "learning_rate": 1.0016000000000002e-05, "loss": 0.9518, "step": 7825 }, { "epoch": 0.25, "learning_rate": 1.00224e-05, "loss": 0.9683, "step": 7830 }, { "epoch": 0.25, "learning_rate": 1.0028800000000001e-05, "loss": 0.9573, "step": 7835 }, { "epoch": 0.25, "learning_rate": 1.00352e-05, "loss": 0.9724, "step": 7840 }, { "epoch": 0.25, "learning_rate": 1.00416e-05, "loss": 0.9588, "step": 7845 }, { "epoch": 0.25, "learning_rate": 1.0048e-05, "loss": 0.9449, "step": 7850 }, { "epoch": 0.25, "learning_rate": 1.00544e-05, "loss": 0.9617, "step": 7855 }, { "epoch": 0.25, "learning_rate": 1.0060800000000002e-05, "loss": 0.9597, "step": 7860 }, { "epoch": 0.25, "learning_rate": 1.00672e-05, "loss": 0.9517, "step": 7865 }, { "epoch": 0.25, "learning_rate": 1.0073600000000001e-05, "loss": 0.946, "step": 7870 }, { "epoch": 0.25, "learning_rate": 1.008e-05, "loss": 0.9783, "step": 7875 }, { "epoch": 0.25, "learning_rate": 1.00864e-05, "loss": 0.9491, "step": 7880 }, { "epoch": 0.25, "learning_rate": 1.0092800000000001e-05, "loss": 0.9552, "step": 7885 }, { "epoch": 0.25, "learning_rate": 1.00992e-05, "loss": 0.9549, "step": 7890 }, { "epoch": 0.25, "learning_rate": 1.01056e-05, "loss": 0.9529, "step": 7895 }, { "epoch": 0.25, "learning_rate": 1.0112000000000002e-05, "loss": 0.9556, "step": 7900 }, { "epoch": 0.25, "learning_rate": 1.0118400000000001e-05, "loss": 0.9455, "step": 7905 }, { "epoch": 0.25, "learning_rate": 1.0124800000000002e-05, "loss": 0.9593, "step": 7910 }, { "epoch": 0.25, "learning_rate": 1.01312e-05, "loss": 0.9527, "step": 7915 }, { "epoch": 0.25, "learning_rate": 1.0137600000000001e-05, "loss": 0.9659, "step": 7920 }, { "epoch": 0.25, "learning_rate": 1.0144e-05, "loss": 0.958, "step": 7925 }, { "epoch": 0.25, "learning_rate": 1.01504e-05, "loss": 0.9371, "step": 7930 }, { "epoch": 0.25, "learning_rate": 1.01568e-05, "loss": 0.9482, "step": 7935 }, { "epoch": 0.25, "learning_rate": 1.01632e-05, "loss": 0.9508, "step": 7940 }, { "epoch": 0.25, "learning_rate": 1.0169600000000002e-05, "loss": 0.9343, "step": 7945 }, { "epoch": 0.25, "learning_rate": 1.0176000000000002e-05, "loss": 0.9557, "step": 7950 }, { "epoch": 0.25, "learning_rate": 1.0182400000000001e-05, "loss": 0.9717, "step": 7955 }, { "epoch": 0.25, "learning_rate": 1.0188800000000001e-05, "loss": 0.9672, "step": 7960 }, { "epoch": 0.25, "learning_rate": 1.01952e-05, "loss": 0.9703, "step": 7965 }, { "epoch": 0.26, "learning_rate": 1.02016e-05, "loss": 0.9607, "step": 7970 }, { "epoch": 0.26, "learning_rate": 1.0208e-05, "loss": 0.9587, "step": 7975 }, { "epoch": 0.26, "learning_rate": 1.02144e-05, "loss": 0.9574, "step": 7980 }, { "epoch": 0.26, "learning_rate": 1.0220800000000002e-05, "loss": 0.9557, "step": 7985 }, { "epoch": 0.26, "learning_rate": 1.0227200000000001e-05, "loss": 0.9593, "step": 7990 }, { "epoch": 0.26, "learning_rate": 1.0233600000000001e-05, "loss": 0.9451, "step": 7995 }, { "epoch": 0.26, "learning_rate": 1.024e-05, "loss": 0.9518, "step": 8000 }, { "epoch": 0.26, "learning_rate": 1.02464e-05, "loss": 0.9555, "step": 8005 }, { "epoch": 0.26, "learning_rate": 1.0252800000000001e-05, "loss": 0.9423, "step": 8010 }, { "epoch": 0.26, "learning_rate": 1.02592e-05, "loss": 0.945, "step": 8015 }, { "epoch": 0.26, "learning_rate": 1.02656e-05, "loss": 0.9433, "step": 8020 }, { "epoch": 0.26, "learning_rate": 1.0272e-05, "loss": 0.966, "step": 8025 }, { "epoch": 0.26, "learning_rate": 1.0278400000000001e-05, "loss": 0.9671, "step": 8030 }, { "epoch": 0.26, "learning_rate": 1.0284800000000002e-05, "loss": 0.953, "step": 8035 }, { "epoch": 0.26, "learning_rate": 1.02912e-05, "loss": 0.9661, "step": 8040 }, { "epoch": 0.26, "learning_rate": 1.0297600000000001e-05, "loss": 0.9642, "step": 8045 }, { "epoch": 0.26, "learning_rate": 1.0304e-05, "loss": 0.9437, "step": 8050 }, { "epoch": 0.26, "learning_rate": 1.03104e-05, "loss": 0.964, "step": 8055 }, { "epoch": 0.26, "learning_rate": 1.0316800000000001e-05, "loss": 0.9514, "step": 8060 }, { "epoch": 0.26, "learning_rate": 1.03232e-05, "loss": 0.9459, "step": 8065 }, { "epoch": 0.26, "learning_rate": 1.0329600000000002e-05, "loss": 0.9568, "step": 8070 }, { "epoch": 0.26, "learning_rate": 1.0336000000000002e-05, "loss": 0.9602, "step": 8075 }, { "epoch": 0.26, "learning_rate": 1.0342400000000001e-05, "loss": 0.9486, "step": 8080 }, { "epoch": 0.26, "learning_rate": 1.0348800000000002e-05, "loss": 0.958, "step": 8085 }, { "epoch": 0.26, "learning_rate": 1.03552e-05, "loss": 0.955, "step": 8090 }, { "epoch": 0.26, "learning_rate": 1.0361600000000001e-05, "loss": 0.9596, "step": 8095 }, { "epoch": 0.26, "learning_rate": 1.0368e-05, "loss": 0.949, "step": 8100 }, { "epoch": 0.26, "learning_rate": 1.03744e-05, "loss": 0.9473, "step": 8105 }, { "epoch": 0.26, "learning_rate": 1.0380799999999999e-05, "loss": 0.9491, "step": 8110 }, { "epoch": 0.26, "learning_rate": 1.0387200000000001e-05, "loss": 0.9548, "step": 8115 }, { "epoch": 0.26, "learning_rate": 1.0393600000000002e-05, "loss": 0.9595, "step": 8120 }, { "epoch": 0.26, "learning_rate": 1.04e-05, "loss": 0.9522, "step": 8125 }, { "epoch": 0.26, "learning_rate": 1.0406400000000001e-05, "loss": 0.9483, "step": 8130 }, { "epoch": 0.26, "learning_rate": 1.0412800000000001e-05, "loss": 0.9468, "step": 8135 }, { "epoch": 0.26, "learning_rate": 1.04192e-05, "loss": 0.9621, "step": 8140 }, { "epoch": 0.26, "learning_rate": 1.04256e-05, "loss": 0.9509, "step": 8145 }, { "epoch": 0.26, "learning_rate": 1.0432e-05, "loss": 0.9377, "step": 8150 }, { "epoch": 0.26, "learning_rate": 1.0438400000000002e-05, "loss": 0.9569, "step": 8155 }, { "epoch": 0.26, "learning_rate": 1.0444800000000002e-05, "loss": 0.9541, "step": 8160 }, { "epoch": 0.26, "learning_rate": 1.04512e-05, "loss": 0.9495, "step": 8165 }, { "epoch": 0.26, "learning_rate": 1.0457600000000001e-05, "loss": 0.9559, "step": 8170 }, { "epoch": 0.26, "learning_rate": 1.0464e-05, "loss": 0.9416, "step": 8175 }, { "epoch": 0.26, "learning_rate": 1.04704e-05, "loss": 0.9424, "step": 8180 }, { "epoch": 0.26, "learning_rate": 1.0476800000000001e-05, "loss": 0.9488, "step": 8185 }, { "epoch": 0.26, "learning_rate": 1.04832e-05, "loss": 0.9415, "step": 8190 }, { "epoch": 0.26, "learning_rate": 1.04896e-05, "loss": 0.947, "step": 8195 }, { "epoch": 0.26, "learning_rate": 1.0496000000000003e-05, "loss": 0.9595, "step": 8200 }, { "epoch": 0.26, "learning_rate": 1.0502400000000001e-05, "loss": 0.9499, "step": 8205 }, { "epoch": 0.26, "learning_rate": 1.0508800000000002e-05, "loss": 0.9377, "step": 8210 }, { "epoch": 0.26, "learning_rate": 1.05152e-05, "loss": 0.9596, "step": 8215 }, { "epoch": 0.26, "learning_rate": 1.0521600000000001e-05, "loss": 0.9478, "step": 8220 }, { "epoch": 0.26, "learning_rate": 1.0528e-05, "loss": 0.9482, "step": 8225 }, { "epoch": 0.26, "learning_rate": 1.05344e-05, "loss": 0.9545, "step": 8230 }, { "epoch": 0.26, "learning_rate": 1.0540799999999999e-05, "loss": 0.9423, "step": 8235 }, { "epoch": 0.26, "learning_rate": 1.0547200000000001e-05, "loss": 0.9519, "step": 8240 }, { "epoch": 0.26, "learning_rate": 1.0553600000000002e-05, "loss": 0.9448, "step": 8245 }, { "epoch": 0.26, "learning_rate": 1.056e-05, "loss": 0.956, "step": 8250 }, { "epoch": 0.26, "learning_rate": 1.0566400000000001e-05, "loss": 0.9515, "step": 8255 }, { "epoch": 0.26, "learning_rate": 1.0572800000000002e-05, "loss": 0.9441, "step": 8260 }, { "epoch": 0.26, "learning_rate": 1.05792e-05, "loss": 0.9494, "step": 8265 }, { "epoch": 0.26, "learning_rate": 1.05856e-05, "loss": 0.947, "step": 8270 }, { "epoch": 0.26, "learning_rate": 1.0592e-05, "loss": 0.9463, "step": 8275 }, { "epoch": 0.26, "learning_rate": 1.05984e-05, "loss": 0.9385, "step": 8280 }, { "epoch": 0.27, "learning_rate": 1.0604800000000002e-05, "loss": 0.9471, "step": 8285 }, { "epoch": 0.27, "learning_rate": 1.0611200000000001e-05, "loss": 0.944, "step": 8290 }, { "epoch": 0.27, "learning_rate": 1.0617600000000001e-05, "loss": 0.9499, "step": 8295 }, { "epoch": 0.27, "learning_rate": 1.0624e-05, "loss": 0.9449, "step": 8300 }, { "epoch": 0.27, "learning_rate": 1.06304e-05, "loss": 0.9607, "step": 8305 }, { "epoch": 0.27, "learning_rate": 1.0636800000000001e-05, "loss": 0.9392, "step": 8310 }, { "epoch": 0.27, "learning_rate": 1.06432e-05, "loss": 0.9392, "step": 8315 }, { "epoch": 0.27, "learning_rate": 1.06496e-05, "loss": 0.9497, "step": 8320 }, { "epoch": 0.27, "learning_rate": 1.0656000000000003e-05, "loss": 0.9449, "step": 8325 }, { "epoch": 0.27, "learning_rate": 1.0662400000000001e-05, "loss": 0.9511, "step": 8330 }, { "epoch": 0.27, "learning_rate": 1.0668800000000002e-05, "loss": 0.9424, "step": 8335 }, { "epoch": 0.27, "learning_rate": 1.06752e-05, "loss": 0.9571, "step": 8340 }, { "epoch": 0.27, "learning_rate": 1.0681600000000001e-05, "loss": 0.9311, "step": 8345 }, { "epoch": 0.27, "learning_rate": 1.0688e-05, "loss": 0.9432, "step": 8350 }, { "epoch": 0.27, "learning_rate": 1.06944e-05, "loss": 0.9471, "step": 8355 }, { "epoch": 0.27, "learning_rate": 1.07008e-05, "loss": 0.9483, "step": 8360 }, { "epoch": 0.27, "learning_rate": 1.07072e-05, "loss": 0.9364, "step": 8365 }, { "epoch": 0.27, "learning_rate": 1.0713600000000002e-05, "loss": 0.9446, "step": 8370 }, { "epoch": 0.27, "learning_rate": 1.072e-05, "loss": 0.9337, "step": 8375 }, { "epoch": 0.27, "learning_rate": 1.0726400000000001e-05, "loss": 0.9391, "step": 8380 }, { "epoch": 0.27, "learning_rate": 1.0732800000000002e-05, "loss": 0.9379, "step": 8385 }, { "epoch": 0.27, "learning_rate": 1.07392e-05, "loss": 0.9314, "step": 8390 }, { "epoch": 0.27, "learning_rate": 1.0745600000000001e-05, "loss": 0.9467, "step": 8395 }, { "epoch": 0.27, "learning_rate": 1.0752e-05, "loss": 0.9382, "step": 8400 }, { "epoch": 0.27, "learning_rate": 1.07584e-05, "loss": 0.9311, "step": 8405 }, { "epoch": 0.27, "learning_rate": 1.0764800000000002e-05, "loss": 0.939, "step": 8410 }, { "epoch": 0.27, "learning_rate": 1.0771200000000001e-05, "loss": 0.9482, "step": 8415 }, { "epoch": 0.27, "learning_rate": 1.0777600000000002e-05, "loss": 0.9318, "step": 8420 }, { "epoch": 0.27, "learning_rate": 1.0784e-05, "loss": 0.9358, "step": 8425 }, { "epoch": 0.27, "learning_rate": 1.0790400000000001e-05, "loss": 0.9295, "step": 8430 }, { "epoch": 0.27, "learning_rate": 1.0796800000000001e-05, "loss": 0.9486, "step": 8435 }, { "epoch": 0.27, "learning_rate": 1.08032e-05, "loss": 0.9309, "step": 8440 }, { "epoch": 0.27, "learning_rate": 1.08096e-05, "loss": 0.9345, "step": 8445 }, { "epoch": 0.27, "learning_rate": 1.0816e-05, "loss": 0.9322, "step": 8450 }, { "epoch": 0.27, "learning_rate": 1.0822400000000002e-05, "loss": 0.9492, "step": 8455 }, { "epoch": 0.27, "learning_rate": 1.0828800000000002e-05, "loss": 0.9378, "step": 8460 }, { "epoch": 0.27, "learning_rate": 1.0835200000000001e-05, "loss": 0.9413, "step": 8465 }, { "epoch": 0.27, "learning_rate": 1.0841600000000001e-05, "loss": 0.9536, "step": 8470 }, { "epoch": 0.27, "learning_rate": 1.0848e-05, "loss": 0.9433, "step": 8475 }, { "epoch": 0.27, "learning_rate": 1.08544e-05, "loss": 0.9465, "step": 8480 }, { "epoch": 0.27, "learning_rate": 1.08608e-05, "loss": 0.9496, "step": 8485 }, { "epoch": 0.27, "learning_rate": 1.08672e-05, "loss": 0.942, "step": 8490 }, { "epoch": 0.27, "learning_rate": 1.0873600000000002e-05, "loss": 0.956, "step": 8495 }, { "epoch": 0.27, "learning_rate": 1.0880000000000001e-05, "loss": 0.9357, "step": 8500 }, { "epoch": 0.27, "learning_rate": 1.0886400000000001e-05, "loss": 0.9308, "step": 8505 }, { "epoch": 0.27, "learning_rate": 1.0892800000000002e-05, "loss": 0.9402, "step": 8510 }, { "epoch": 0.27, "learning_rate": 1.08992e-05, "loss": 0.95, "step": 8515 }, { "epoch": 0.27, "learning_rate": 1.0905600000000001e-05, "loss": 0.9567, "step": 8520 }, { "epoch": 0.27, "learning_rate": 1.0912e-05, "loss": 0.9411, "step": 8525 }, { "epoch": 0.27, "learning_rate": 1.09184e-05, "loss": 0.9344, "step": 8530 }, { "epoch": 0.27, "learning_rate": 1.0924799999999999e-05, "loss": 0.9275, "step": 8535 }, { "epoch": 0.27, "learning_rate": 1.0931200000000001e-05, "loss": 0.9222, "step": 8540 }, { "epoch": 0.27, "learning_rate": 1.0937600000000002e-05, "loss": 0.9308, "step": 8545 }, { "epoch": 0.27, "learning_rate": 1.0944e-05, "loss": 0.9452, "step": 8550 }, { "epoch": 0.27, "learning_rate": 1.0950400000000001e-05, "loss": 0.9308, "step": 8555 }, { "epoch": 0.27, "learning_rate": 1.0956800000000002e-05, "loss": 0.9473, "step": 8560 }, { "epoch": 0.27, "learning_rate": 1.09632e-05, "loss": 0.9347, "step": 8565 }, { "epoch": 0.27, "learning_rate": 1.09696e-05, "loss": 0.9397, "step": 8570 }, { "epoch": 0.27, "learning_rate": 1.0976e-05, "loss": 0.9494, "step": 8575 }, { "epoch": 0.27, "learning_rate": 1.0982400000000002e-05, "loss": 0.9255, "step": 8580 }, { "epoch": 0.27, "learning_rate": 1.0988800000000002e-05, "loss": 0.9379, "step": 8585 }, { "epoch": 0.27, "learning_rate": 1.0995200000000001e-05, "loss": 0.9376, "step": 8590 }, { "epoch": 0.28, "learning_rate": 1.1001600000000002e-05, "loss": 0.9406, "step": 8595 }, { "epoch": 0.28, "learning_rate": 1.1008e-05, "loss": 0.9508, "step": 8600 }, { "epoch": 0.28, "learning_rate": 1.10144e-05, "loss": 0.934, "step": 8605 }, { "epoch": 0.28, "learning_rate": 1.10208e-05, "loss": 0.935, "step": 8610 }, { "epoch": 0.28, "learning_rate": 1.10272e-05, "loss": 0.9394, "step": 8615 }, { "epoch": 0.28, "learning_rate": 1.10336e-05, "loss": 0.9355, "step": 8620 }, { "epoch": 0.28, "learning_rate": 1.1040000000000001e-05, "loss": 0.9221, "step": 8625 }, { "epoch": 0.28, "learning_rate": 1.1046400000000002e-05, "loss": 0.9369, "step": 8630 }, { "epoch": 0.28, "learning_rate": 1.1052800000000002e-05, "loss": 0.9249, "step": 8635 }, { "epoch": 0.28, "learning_rate": 1.10592e-05, "loss": 0.9441, "step": 8640 }, { "epoch": 0.28, "learning_rate": 1.1065600000000001e-05, "loss": 0.9273, "step": 8645 }, { "epoch": 0.28, "learning_rate": 1.1072e-05, "loss": 0.9354, "step": 8650 }, { "epoch": 0.28, "learning_rate": 1.10784e-05, "loss": 0.9372, "step": 8655 }, { "epoch": 0.28, "learning_rate": 1.10848e-05, "loss": 0.9388, "step": 8660 }, { "epoch": 0.28, "learning_rate": 1.1091200000000001e-05, "loss": 0.9393, "step": 8665 }, { "epoch": 0.28, "learning_rate": 1.1097600000000002e-05, "loss": 0.9377, "step": 8670 }, { "epoch": 0.28, "learning_rate": 1.1104e-05, "loss": 0.9401, "step": 8675 }, { "epoch": 0.28, "learning_rate": 1.1110400000000001e-05, "loss": 0.9285, "step": 8680 }, { "epoch": 0.28, "learning_rate": 1.1116800000000002e-05, "loss": 0.9381, "step": 8685 }, { "epoch": 0.28, "learning_rate": 1.11232e-05, "loss": 0.9389, "step": 8690 }, { "epoch": 0.28, "learning_rate": 1.1129600000000001e-05, "loss": 0.9154, "step": 8695 }, { "epoch": 0.28, "learning_rate": 1.1136e-05, "loss": 0.9378, "step": 8700 }, { "epoch": 0.28, "learning_rate": 1.11424e-05, "loss": 0.9411, "step": 8705 }, { "epoch": 0.28, "learning_rate": 1.1148800000000002e-05, "loss": 0.9287, "step": 8710 }, { "epoch": 0.28, "learning_rate": 1.1155200000000001e-05, "loss": 0.9373, "step": 8715 }, { "epoch": 0.28, "learning_rate": 1.1161600000000002e-05, "loss": 0.9324, "step": 8720 }, { "epoch": 0.28, "learning_rate": 1.1168e-05, "loss": 0.9263, "step": 8725 }, { "epoch": 0.28, "learning_rate": 1.1174400000000001e-05, "loss": 0.9363, "step": 8730 }, { "epoch": 0.28, "learning_rate": 1.11808e-05, "loss": 0.9297, "step": 8735 }, { "epoch": 0.28, "learning_rate": 1.11872e-05, "loss": 0.9327, "step": 8740 }, { "epoch": 0.28, "learning_rate": 1.11936e-05, "loss": 0.9277, "step": 8745 }, { "epoch": 0.28, "learning_rate": 1.1200000000000001e-05, "loss": 0.9308, "step": 8750 }, { "epoch": 0.28, "learning_rate": 1.1206400000000002e-05, "loss": 0.9352, "step": 8755 }, { "epoch": 0.28, "learning_rate": 1.1212800000000002e-05, "loss": 0.9405, "step": 8760 }, { "epoch": 0.28, "learning_rate": 1.1219200000000001e-05, "loss": 0.9167, "step": 8765 }, { "epoch": 0.28, "learning_rate": 1.1225600000000001e-05, "loss": 0.9364, "step": 8770 }, { "epoch": 0.28, "learning_rate": 1.1232e-05, "loss": 0.9389, "step": 8775 }, { "epoch": 0.28, "learning_rate": 1.12384e-05, "loss": 0.9274, "step": 8780 }, { "epoch": 0.28, "learning_rate": 1.12448e-05, "loss": 0.935, "step": 8785 }, { "epoch": 0.28, "learning_rate": 1.12512e-05, "loss": 0.9218, "step": 8790 }, { "epoch": 0.28, "learning_rate": 1.1257600000000002e-05, "loss": 0.9417, "step": 8795 }, { "epoch": 0.28, "learning_rate": 1.1264000000000001e-05, "loss": 0.9173, "step": 8800 }, { "epoch": 0.28, "learning_rate": 1.1270400000000001e-05, "loss": 0.9304, "step": 8805 }, { "epoch": 0.28, "learning_rate": 1.1276800000000002e-05, "loss": 0.9273, "step": 8810 }, { "epoch": 0.28, "learning_rate": 1.12832e-05, "loss": 0.931, "step": 8815 }, { "epoch": 0.28, "learning_rate": 1.1289600000000001e-05, "loss": 0.9311, "step": 8820 }, { "epoch": 0.28, "learning_rate": 1.1296e-05, "loss": 0.9355, "step": 8825 }, { "epoch": 0.28, "learning_rate": 1.13024e-05, "loss": 0.9451, "step": 8830 }, { "epoch": 0.28, "learning_rate": 1.1308800000000003e-05, "loss": 0.9275, "step": 8835 }, { "epoch": 0.28, "learning_rate": 1.1315200000000001e-05, "loss": 0.9271, "step": 8840 }, { "epoch": 0.28, "learning_rate": 1.1321600000000002e-05, "loss": 0.9398, "step": 8845 }, { "epoch": 0.28, "learning_rate": 1.1328e-05, "loss": 0.935, "step": 8850 }, { "epoch": 0.28, "learning_rate": 1.1334400000000001e-05, "loss": 0.9322, "step": 8855 }, { "epoch": 0.28, "learning_rate": 1.13408e-05, "loss": 0.9445, "step": 8860 }, { "epoch": 0.28, "learning_rate": 1.13472e-05, "loss": 0.9463, "step": 8865 }, { "epoch": 0.28, "learning_rate": 1.1353600000000001e-05, "loss": 0.9276, "step": 8870 }, { "epoch": 0.28, "learning_rate": 1.136e-05, "loss": 0.9246, "step": 8875 }, { "epoch": 0.28, "learning_rate": 1.1366400000000002e-05, "loss": 0.9211, "step": 8880 }, { "epoch": 0.28, "learning_rate": 1.1372800000000002e-05, "loss": 0.9354, "step": 8885 }, { "epoch": 0.28, "learning_rate": 1.1379200000000001e-05, "loss": 0.9196, "step": 8890 }, { "epoch": 0.28, "learning_rate": 1.1385600000000002e-05, "loss": 0.9265, "step": 8895 }, { "epoch": 0.28, "learning_rate": 1.1392e-05, "loss": 0.9225, "step": 8900 }, { "epoch": 0.28, "learning_rate": 1.13984e-05, "loss": 0.9132, "step": 8905 }, { "epoch": 0.29, "learning_rate": 1.14048e-05, "loss": 0.9381, "step": 8910 }, { "epoch": 0.29, "learning_rate": 1.14112e-05, "loss": 0.9352, "step": 8915 }, { "epoch": 0.29, "learning_rate": 1.1417600000000002e-05, "loss": 0.9213, "step": 8920 }, { "epoch": 0.29, "learning_rate": 1.1424000000000001e-05, "loss": 0.9346, "step": 8925 }, { "epoch": 0.29, "learning_rate": 1.1430400000000002e-05, "loss": 0.9241, "step": 8930 }, { "epoch": 0.29, "learning_rate": 1.1436800000000002e-05, "loss": 0.9441, "step": 8935 }, { "epoch": 0.29, "learning_rate": 1.14432e-05, "loss": 0.9261, "step": 8940 }, { "epoch": 0.29, "learning_rate": 1.1449600000000001e-05, "loss": 0.948, "step": 8945 }, { "epoch": 0.29, "learning_rate": 1.1456e-05, "loss": 0.9225, "step": 8950 }, { "epoch": 0.29, "learning_rate": 1.14624e-05, "loss": 0.9266, "step": 8955 }, { "epoch": 0.29, "learning_rate": 1.14688e-05, "loss": 0.9222, "step": 8960 }, { "epoch": 0.29, "learning_rate": 1.1475200000000002e-05, "loss": 0.9162, "step": 8965 }, { "epoch": 0.29, "learning_rate": 1.1481600000000002e-05, "loss": 0.9375, "step": 8970 }, { "epoch": 0.29, "learning_rate": 1.1488e-05, "loss": 0.9293, "step": 8975 }, { "epoch": 0.29, "learning_rate": 1.1494400000000001e-05, "loss": 0.9237, "step": 8980 }, { "epoch": 0.29, "learning_rate": 1.15008e-05, "loss": 0.9372, "step": 8985 }, { "epoch": 0.29, "learning_rate": 1.15072e-05, "loss": 0.931, "step": 8990 }, { "epoch": 0.29, "learning_rate": 1.1513600000000001e-05, "loss": 0.9332, "step": 8995 }, { "epoch": 0.29, "learning_rate": 1.152e-05, "loss": 0.941, "step": 9000 }, { "epoch": 0.29, "learning_rate": 1.1526400000000002e-05, "loss": 0.9396, "step": 9005 }, { "epoch": 0.29, "learning_rate": 1.1532800000000002e-05, "loss": 0.9224, "step": 9010 }, { "epoch": 0.29, "learning_rate": 1.1539200000000001e-05, "loss": 0.9137, "step": 9015 }, { "epoch": 0.29, "learning_rate": 1.1545600000000002e-05, "loss": 0.926, "step": 9020 }, { "epoch": 0.29, "learning_rate": 1.1552e-05, "loss": 0.9151, "step": 9025 }, { "epoch": 0.29, "learning_rate": 1.1558400000000001e-05, "loss": 0.9464, "step": 9030 }, { "epoch": 0.29, "learning_rate": 1.15648e-05, "loss": 0.9108, "step": 9035 }, { "epoch": 0.29, "learning_rate": 1.15712e-05, "loss": 0.9154, "step": 9040 }, { "epoch": 0.29, "learning_rate": 1.15776e-05, "loss": 0.9171, "step": 9045 }, { "epoch": 0.29, "learning_rate": 1.1584000000000001e-05, "loss": 0.9357, "step": 9050 }, { "epoch": 0.29, "learning_rate": 1.1590400000000002e-05, "loss": 0.937, "step": 9055 }, { "epoch": 0.29, "learning_rate": 1.1596800000000002e-05, "loss": 0.9269, "step": 9060 }, { "epoch": 0.29, "learning_rate": 1.1603200000000001e-05, "loss": 0.9198, "step": 9065 }, { "epoch": 0.29, "learning_rate": 1.1609600000000001e-05, "loss": 0.9186, "step": 9070 }, { "epoch": 0.29, "learning_rate": 1.1616e-05, "loss": 0.9168, "step": 9075 }, { "epoch": 0.29, "learning_rate": 1.16224e-05, "loss": 0.9208, "step": 9080 }, { "epoch": 0.29, "learning_rate": 1.16288e-05, "loss": 0.9182, "step": 9085 }, { "epoch": 0.29, "learning_rate": 1.1635200000000002e-05, "loss": 0.8972, "step": 9090 }, { "epoch": 0.29, "learning_rate": 1.1641600000000002e-05, "loss": 0.9152, "step": 9095 }, { "epoch": 0.29, "learning_rate": 1.1648000000000001e-05, "loss": 0.9268, "step": 9100 }, { "epoch": 0.29, "learning_rate": 1.1654400000000001e-05, "loss": 0.9175, "step": 9105 }, { "epoch": 0.29, "learning_rate": 1.16608e-05, "loss": 0.929, "step": 9110 }, { "epoch": 0.29, "learning_rate": 1.16672e-05, "loss": 0.9327, "step": 9115 }, { "epoch": 0.29, "learning_rate": 1.1673600000000001e-05, "loss": 0.9225, "step": 9120 }, { "epoch": 0.29, "learning_rate": 1.168e-05, "loss": 0.9307, "step": 9125 }, { "epoch": 0.29, "learning_rate": 1.16864e-05, "loss": 0.9197, "step": 9130 }, { "epoch": 0.29, "learning_rate": 1.1692800000000003e-05, "loss": 0.912, "step": 9135 }, { "epoch": 0.29, "learning_rate": 1.1699200000000001e-05, "loss": 0.9253, "step": 9140 }, { "epoch": 0.29, "learning_rate": 1.1705600000000002e-05, "loss": 0.9102, "step": 9145 }, { "epoch": 0.29, "learning_rate": 1.1712e-05, "loss": 0.9178, "step": 9150 }, { "epoch": 0.29, "learning_rate": 1.1718400000000001e-05, "loss": 0.9193, "step": 9155 }, { "epoch": 0.29, "learning_rate": 1.17248e-05, "loss": 0.923, "step": 9160 }, { "epoch": 0.29, "learning_rate": 1.17312e-05, "loss": 0.9238, "step": 9165 }, { "epoch": 0.29, "learning_rate": 1.1737600000000001e-05, "loss": 0.9092, "step": 9170 }, { "epoch": 0.29, "learning_rate": 1.1744000000000001e-05, "loss": 0.9113, "step": 9175 }, { "epoch": 0.29, "learning_rate": 1.1750400000000002e-05, "loss": 0.9125, "step": 9180 }, { "epoch": 0.29, "learning_rate": 1.1756800000000002e-05, "loss": 0.9262, "step": 9185 }, { "epoch": 0.29, "learning_rate": 1.1763200000000001e-05, "loss": 0.9306, "step": 9190 }, { "epoch": 0.29, "learning_rate": 1.1769600000000002e-05, "loss": 0.9174, "step": 9195 }, { "epoch": 0.29, "learning_rate": 1.1776e-05, "loss": 0.9411, "step": 9200 }, { "epoch": 0.29, "learning_rate": 1.1782400000000001e-05, "loss": 0.917, "step": 9205 }, { "epoch": 0.29, "learning_rate": 1.17888e-05, "loss": 0.9258, "step": 9210 }, { "epoch": 0.29, "learning_rate": 1.17952e-05, "loss": 0.9398, "step": 9215 }, { "epoch": 0.3, "learning_rate": 1.1801600000000002e-05, "loss": 0.9216, "step": 9220 }, { "epoch": 0.3, "learning_rate": 1.1808000000000001e-05, "loss": 0.9212, "step": 9225 }, { "epoch": 0.3, "learning_rate": 1.1814400000000002e-05, "loss": 0.9243, "step": 9230 }, { "epoch": 0.3, "learning_rate": 1.18208e-05, "loss": 0.9274, "step": 9235 }, { "epoch": 0.3, "learning_rate": 1.1827200000000001e-05, "loss": 0.9141, "step": 9240 }, { "epoch": 0.3, "learning_rate": 1.1833600000000001e-05, "loss": 0.9285, "step": 9245 }, { "epoch": 0.3, "learning_rate": 1.184e-05, "loss": 0.9148, "step": 9250 }, { "epoch": 0.3, "learning_rate": 1.18464e-05, "loss": 0.9232, "step": 9255 }, { "epoch": 0.3, "learning_rate": 1.18528e-05, "loss": 0.9245, "step": 9260 }, { "epoch": 0.3, "learning_rate": 1.1859200000000002e-05, "loss": 0.9254, "step": 9265 }, { "epoch": 0.3, "learning_rate": 1.1865600000000002e-05, "loss": 0.9029, "step": 9270 }, { "epoch": 0.3, "learning_rate": 1.1872000000000001e-05, "loss": 0.9173, "step": 9275 }, { "epoch": 0.3, "learning_rate": 1.1878400000000001e-05, "loss": 0.9191, "step": 9280 }, { "epoch": 0.3, "learning_rate": 1.18848e-05, "loss": 0.9216, "step": 9285 }, { "epoch": 0.3, "learning_rate": 1.18912e-05, "loss": 0.9317, "step": 9290 }, { "epoch": 0.3, "learning_rate": 1.1897600000000001e-05, "loss": 0.9226, "step": 9295 }, { "epoch": 0.3, "learning_rate": 1.1904e-05, "loss": 0.9029, "step": 9300 }, { "epoch": 0.3, "learning_rate": 1.1910400000000002e-05, "loss": 0.9145, "step": 9305 }, { "epoch": 0.3, "learning_rate": 1.1916800000000003e-05, "loss": 0.9303, "step": 9310 }, { "epoch": 0.3, "learning_rate": 1.1923200000000001e-05, "loss": 0.9234, "step": 9315 }, { "epoch": 0.3, "learning_rate": 1.1929600000000002e-05, "loss": 0.9294, "step": 9320 }, { "epoch": 0.3, "learning_rate": 1.1936e-05, "loss": 0.9136, "step": 9325 }, { "epoch": 0.3, "learning_rate": 1.1942400000000001e-05, "loss": 0.9274, "step": 9330 }, { "epoch": 0.3, "learning_rate": 1.19488e-05, "loss": 0.9115, "step": 9335 }, { "epoch": 0.3, "learning_rate": 1.19552e-05, "loss": 0.9221, "step": 9340 }, { "epoch": 0.3, "learning_rate": 1.1961599999999999e-05, "loss": 0.9223, "step": 9345 }, { "epoch": 0.3, "learning_rate": 1.1968000000000001e-05, "loss": 0.9185, "step": 9350 }, { "epoch": 0.3, "learning_rate": 1.1974400000000002e-05, "loss": 0.9242, "step": 9355 }, { "epoch": 0.3, "learning_rate": 1.19808e-05, "loss": 0.9235, "step": 9360 }, { "epoch": 0.3, "learning_rate": 1.1987200000000001e-05, "loss": 0.928, "step": 9365 }, { "epoch": 0.3, "learning_rate": 1.1993600000000002e-05, "loss": 0.9298, "step": 9370 }, { "epoch": 0.3, "learning_rate": 1.2e-05, "loss": 0.917, "step": 9375 }, { "epoch": 0.3, "learning_rate": 1.20064e-05, "loss": 0.9229, "step": 9380 }, { "epoch": 0.3, "learning_rate": 1.20128e-05, "loss": 0.9261, "step": 9385 }, { "epoch": 0.3, "learning_rate": 1.2019200000000002e-05, "loss": 0.928, "step": 9390 }, { "epoch": 0.3, "learning_rate": 1.2025600000000002e-05, "loss": 0.9266, "step": 9395 }, { "epoch": 0.3, "learning_rate": 1.2032000000000001e-05, "loss": 0.9187, "step": 9400 }, { "epoch": 0.3, "learning_rate": 1.2038400000000001e-05, "loss": 0.9241, "step": 9405 }, { "epoch": 0.3, "learning_rate": 1.20448e-05, "loss": 0.898, "step": 9410 }, { "epoch": 0.3, "learning_rate": 1.20512e-05, "loss": 0.9211, "step": 9415 }, { "epoch": 0.3, "learning_rate": 1.2057600000000001e-05, "loss": 0.9024, "step": 9420 }, { "epoch": 0.3, "learning_rate": 1.2064e-05, "loss": 0.8996, "step": 9425 }, { "epoch": 0.3, "learning_rate": 1.20704e-05, "loss": 0.9287, "step": 9430 }, { "epoch": 0.3, "learning_rate": 1.2076800000000003e-05, "loss": 0.9059, "step": 9435 }, { "epoch": 0.3, "learning_rate": 1.2083200000000001e-05, "loss": 0.9273, "step": 9440 }, { "epoch": 0.3, "learning_rate": 1.2089600000000002e-05, "loss": 0.9205, "step": 9445 }, { "epoch": 0.3, "learning_rate": 1.2096e-05, "loss": 0.9062, "step": 9450 }, { "epoch": 0.3, "learning_rate": 1.2102400000000001e-05, "loss": 0.9211, "step": 9455 }, { "epoch": 0.3, "learning_rate": 1.21088e-05, "loss": 0.9095, "step": 9460 }, { "epoch": 0.3, "learning_rate": 1.21152e-05, "loss": 0.9167, "step": 9465 }, { "epoch": 0.3, "learning_rate": 1.21216e-05, "loss": 0.9106, "step": 9470 }, { "epoch": 0.3, "learning_rate": 1.2128000000000001e-05, "loss": 0.9264, "step": 9475 }, { "epoch": 0.3, "learning_rate": 1.2134400000000002e-05, "loss": 0.9231, "step": 9480 }, { "epoch": 0.3, "learning_rate": 1.21408e-05, "loss": 0.916, "step": 9485 }, { "epoch": 0.3, "learning_rate": 1.2147200000000001e-05, "loss": 0.9295, "step": 9490 }, { "epoch": 0.3, "learning_rate": 1.2153600000000002e-05, "loss": 0.9193, "step": 9495 }, { "epoch": 0.3, "learning_rate": 1.216e-05, "loss": 0.9068, "step": 9500 }, { "epoch": 0.3, "learning_rate": 1.2166400000000001e-05, "loss": 0.9131, "step": 9505 }, { "epoch": 0.3, "learning_rate": 1.21728e-05, "loss": 0.9205, "step": 9510 }, { "epoch": 0.3, "learning_rate": 1.21792e-05, "loss": 0.9184, "step": 9515 }, { "epoch": 0.3, "learning_rate": 1.2185600000000002e-05, "loss": 0.9186, "step": 9520 }, { "epoch": 0.3, "learning_rate": 1.2192000000000001e-05, "loss": 0.9118, "step": 9525 }, { "epoch": 0.3, "learning_rate": 1.2198400000000002e-05, "loss": 0.9275, "step": 9530 }, { "epoch": 0.31, "learning_rate": 1.22048e-05, "loss": 0.9175, "step": 9535 }, { "epoch": 0.31, "learning_rate": 1.2211200000000001e-05, "loss": 0.9116, "step": 9540 }, { "epoch": 0.31, "learning_rate": 1.2217600000000001e-05, "loss": 0.9236, "step": 9545 }, { "epoch": 0.31, "learning_rate": 1.2224e-05, "loss": 0.9215, "step": 9550 }, { "epoch": 0.31, "learning_rate": 1.22304e-05, "loss": 0.9102, "step": 9555 }, { "epoch": 0.31, "learning_rate": 1.2236800000000003e-05, "loss": 0.9051, "step": 9560 }, { "epoch": 0.31, "learning_rate": 1.2243200000000002e-05, "loss": 0.9134, "step": 9565 }, { "epoch": 0.31, "learning_rate": 1.2249600000000002e-05, "loss": 0.9131, "step": 9570 }, { "epoch": 0.31, "learning_rate": 1.2256000000000001e-05, "loss": 0.9237, "step": 9575 }, { "epoch": 0.31, "learning_rate": 1.2262400000000001e-05, "loss": 0.9128, "step": 9580 }, { "epoch": 0.31, "learning_rate": 1.22688e-05, "loss": 0.9137, "step": 9585 }, { "epoch": 0.31, "learning_rate": 1.22752e-05, "loss": 0.9218, "step": 9590 }, { "epoch": 0.31, "learning_rate": 1.22816e-05, "loss": 0.9023, "step": 9595 }, { "epoch": 0.31, "learning_rate": 1.2288e-05, "loss": 0.927, "step": 9600 }, { "epoch": 0.31, "learning_rate": 1.2294400000000002e-05, "loss": 0.932, "step": 9605 }, { "epoch": 0.31, "learning_rate": 1.2300800000000001e-05, "loss": 0.9262, "step": 9610 }, { "epoch": 0.31, "learning_rate": 1.2307200000000001e-05, "loss": 0.9077, "step": 9615 }, { "epoch": 0.31, "learning_rate": 1.2313600000000002e-05, "loss": 0.9221, "step": 9620 }, { "epoch": 0.31, "learning_rate": 1.232e-05, "loss": 0.9222, "step": 9625 }, { "epoch": 0.31, "learning_rate": 1.2326400000000001e-05, "loss": 0.9179, "step": 9630 }, { "epoch": 0.31, "learning_rate": 1.23328e-05, "loss": 0.9082, "step": 9635 }, { "epoch": 0.31, "learning_rate": 1.23392e-05, "loss": 0.9231, "step": 9640 }, { "epoch": 0.31, "learning_rate": 1.2345600000000003e-05, "loss": 0.9272, "step": 9645 }, { "epoch": 0.31, "learning_rate": 1.2352000000000001e-05, "loss": 0.9067, "step": 9650 }, { "epoch": 0.31, "learning_rate": 1.2358400000000002e-05, "loss": 0.8991, "step": 9655 }, { "epoch": 0.31, "learning_rate": 1.23648e-05, "loss": 0.9077, "step": 9660 }, { "epoch": 0.31, "learning_rate": 1.2371200000000001e-05, "loss": 0.8967, "step": 9665 }, { "epoch": 0.31, "learning_rate": 1.2377600000000002e-05, "loss": 0.9157, "step": 9670 }, { "epoch": 0.31, "learning_rate": 1.2384e-05, "loss": 0.9213, "step": 9675 }, { "epoch": 0.31, "learning_rate": 1.23904e-05, "loss": 0.9032, "step": 9680 }, { "epoch": 0.31, "learning_rate": 1.23968e-05, "loss": 0.9013, "step": 9685 }, { "epoch": 0.31, "learning_rate": 1.2403200000000002e-05, "loss": 0.9094, "step": 9690 }, { "epoch": 0.31, "learning_rate": 1.2409600000000002e-05, "loss": 0.9064, "step": 9695 }, { "epoch": 0.31, "learning_rate": 1.2416000000000001e-05, "loss": 0.9015, "step": 9700 }, { "epoch": 0.31, "learning_rate": 1.2422400000000002e-05, "loss": 0.9107, "step": 9705 }, { "epoch": 0.31, "learning_rate": 1.24288e-05, "loss": 0.9085, "step": 9710 }, { "epoch": 0.31, "learning_rate": 1.24352e-05, "loss": 0.9192, "step": 9715 }, { "epoch": 0.31, "learning_rate": 1.24416e-05, "loss": 0.9013, "step": 9720 }, { "epoch": 0.31, "learning_rate": 1.2448e-05, "loss": 0.9125, "step": 9725 }, { "epoch": 0.31, "learning_rate": 1.2454400000000002e-05, "loss": 0.9074, "step": 9730 }, { "epoch": 0.31, "learning_rate": 1.2460800000000001e-05, "loss": 0.9249, "step": 9735 }, { "epoch": 0.31, "learning_rate": 1.2467200000000002e-05, "loss": 0.9085, "step": 9740 }, { "epoch": 0.31, "learning_rate": 1.2473600000000002e-05, "loss": 0.921, "step": 9745 }, { "epoch": 0.31, "learning_rate": 1.248e-05, "loss": 0.9129, "step": 9750 }, { "epoch": 0.31, "learning_rate": 1.2486400000000001e-05, "loss": 0.9149, "step": 9755 }, { "epoch": 0.31, "learning_rate": 1.24928e-05, "loss": 0.9057, "step": 9760 }, { "epoch": 0.31, "learning_rate": 1.24992e-05, "loss": 0.8884, "step": 9765 }, { "epoch": 0.31, "learning_rate": 1.25056e-05, "loss": 0.915, "step": 9770 }, { "epoch": 0.31, "learning_rate": 1.2512000000000002e-05, "loss": 0.9077, "step": 9775 }, { "epoch": 0.31, "learning_rate": 1.2518400000000002e-05, "loss": 0.905, "step": 9780 }, { "epoch": 0.31, "learning_rate": 1.25248e-05, "loss": 0.9086, "step": 9785 }, { "epoch": 0.31, "learning_rate": 1.2531200000000001e-05, "loss": 0.9147, "step": 9790 }, { "epoch": 0.31, "learning_rate": 1.25376e-05, "loss": 0.906, "step": 9795 }, { "epoch": 0.31, "learning_rate": 1.2544e-05, "loss": 0.9018, "step": 9800 }, { "epoch": 0.31, "learning_rate": 1.2550400000000001e-05, "loss": 0.8873, "step": 9805 }, { "epoch": 0.31, "learning_rate": 1.25568e-05, "loss": 0.9107, "step": 9810 }, { "epoch": 0.31, "learning_rate": 1.2563200000000002e-05, "loss": 0.9026, "step": 9815 }, { "epoch": 0.31, "learning_rate": 1.2569600000000002e-05, "loss": 0.9167, "step": 9820 }, { "epoch": 0.31, "learning_rate": 1.2576000000000001e-05, "loss": 0.9083, "step": 9825 }, { "epoch": 0.31, "learning_rate": 1.2582400000000002e-05, "loss": 0.8961, "step": 9830 }, { "epoch": 0.31, "learning_rate": 1.25888e-05, "loss": 0.8995, "step": 9835 }, { "epoch": 0.31, "learning_rate": 1.2595200000000001e-05, "loss": 0.9042, "step": 9840 }, { "epoch": 0.32, "learning_rate": 1.26016e-05, "loss": 0.9055, "step": 9845 }, { "epoch": 0.32, "learning_rate": 1.2608e-05, "loss": 0.9124, "step": 9850 }, { "epoch": 0.32, "learning_rate": 1.26144e-05, "loss": 0.9263, "step": 9855 }, { "epoch": 0.32, "learning_rate": 1.2620800000000001e-05, "loss": 0.9172, "step": 9860 }, { "epoch": 0.32, "learning_rate": 1.2627200000000002e-05, "loss": 0.8868, "step": 9865 }, { "epoch": 0.32, "learning_rate": 1.2633600000000002e-05, "loss": 0.9049, "step": 9870 }, { "epoch": 0.32, "learning_rate": 1.2640000000000001e-05, "loss": 0.8953, "step": 9875 }, { "epoch": 0.32, "learning_rate": 1.2646400000000001e-05, "loss": 0.9065, "step": 9880 }, { "epoch": 0.32, "learning_rate": 1.26528e-05, "loss": 0.9143, "step": 9885 }, { "epoch": 0.32, "learning_rate": 1.26592e-05, "loss": 0.8907, "step": 9890 }, { "epoch": 0.32, "learning_rate": 1.26656e-05, "loss": 0.8969, "step": 9895 }, { "epoch": 0.32, "learning_rate": 1.2672000000000002e-05, "loss": 0.8968, "step": 9900 }, { "epoch": 0.32, "learning_rate": 1.2678400000000002e-05, "loss": 0.9009, "step": 9905 }, { "epoch": 0.32, "learning_rate": 1.2684800000000001e-05, "loss": 0.9027, "step": 9910 }, { "epoch": 0.32, "learning_rate": 1.2691200000000001e-05, "loss": 0.9068, "step": 9915 }, { "epoch": 0.32, "learning_rate": 1.26976e-05, "loss": 0.8971, "step": 9920 }, { "epoch": 0.32, "learning_rate": 1.2704e-05, "loss": 0.9023, "step": 9925 }, { "epoch": 0.32, "learning_rate": 1.2710400000000001e-05, "loss": 0.9051, "step": 9930 }, { "epoch": 0.32, "learning_rate": 1.27168e-05, "loss": 0.9101, "step": 9935 }, { "epoch": 0.32, "learning_rate": 1.27232e-05, "loss": 0.905, "step": 9940 }, { "epoch": 0.32, "learning_rate": 1.2729600000000003e-05, "loss": 0.8991, "step": 9945 }, { "epoch": 0.32, "learning_rate": 1.2736000000000001e-05, "loss": 0.8991, "step": 9950 }, { "epoch": 0.32, "learning_rate": 1.2742400000000002e-05, "loss": 0.9173, "step": 9955 }, { "epoch": 0.32, "learning_rate": 1.27488e-05, "loss": 0.9042, "step": 9960 }, { "epoch": 0.32, "learning_rate": 1.2755200000000001e-05, "loss": 0.9377, "step": 9965 }, { "epoch": 0.32, "learning_rate": 1.27616e-05, "loss": 0.8843, "step": 9970 }, { "epoch": 0.32, "learning_rate": 1.2768e-05, "loss": 0.9002, "step": 9975 }, { "epoch": 0.32, "learning_rate": 1.2774400000000001e-05, "loss": 0.9132, "step": 9980 }, { "epoch": 0.32, "learning_rate": 1.2780800000000001e-05, "loss": 0.8997, "step": 9985 }, { "epoch": 0.32, "learning_rate": 1.2787200000000002e-05, "loss": 0.9071, "step": 9990 }, { "epoch": 0.32, "learning_rate": 1.2793600000000002e-05, "loss": 0.9108, "step": 9995 }, { "epoch": 0.32, "learning_rate": 1.2800000000000001e-05, "loss": 0.8915, "step": 10000 }, { "epoch": 0.32, "learning_rate": 1.2806400000000002e-05, "loss": 0.9139, "step": 10005 }, { "epoch": 0.32, "learning_rate": 1.28128e-05, "loss": 0.8944, "step": 10010 }, { "epoch": 0.32, "learning_rate": 1.2819200000000001e-05, "loss": 0.8891, "step": 10015 }, { "epoch": 0.32, "learning_rate": 1.28256e-05, "loss": 0.8982, "step": 10020 }, { "epoch": 0.32, "learning_rate": 1.2832e-05, "loss": 0.9087, "step": 10025 }, { "epoch": 0.32, "learning_rate": 1.2838400000000002e-05, "loss": 0.9203, "step": 10030 }, { "epoch": 0.32, "learning_rate": 1.2844800000000001e-05, "loss": 0.8993, "step": 10035 }, { "epoch": 0.32, "learning_rate": 1.2851200000000002e-05, "loss": 0.8844, "step": 10040 }, { "epoch": 0.32, "learning_rate": 1.28576e-05, "loss": 0.8984, "step": 10045 }, { "epoch": 0.32, "learning_rate": 1.2864e-05, "loss": 0.8979, "step": 10050 }, { "epoch": 0.32, "learning_rate": 1.2870400000000001e-05, "loss": 0.8995, "step": 10055 }, { "epoch": 0.32, "learning_rate": 1.28768e-05, "loss": 0.9099, "step": 10060 }, { "epoch": 0.32, "learning_rate": 1.28832e-05, "loss": 0.9072, "step": 10065 }, { "epoch": 0.32, "learning_rate": 1.2889600000000003e-05, "loss": 0.8984, "step": 10070 }, { "epoch": 0.32, "learning_rate": 1.2896000000000002e-05, "loss": 0.9012, "step": 10075 }, { "epoch": 0.32, "learning_rate": 1.2902400000000002e-05, "loss": 0.8996, "step": 10080 }, { "epoch": 0.32, "learning_rate": 1.29088e-05, "loss": 0.9115, "step": 10085 }, { "epoch": 0.32, "learning_rate": 1.2915200000000001e-05, "loss": 0.892, "step": 10090 }, { "epoch": 0.32, "learning_rate": 1.29216e-05, "loss": 0.9036, "step": 10095 }, { "epoch": 0.32, "learning_rate": 1.2928e-05, "loss": 0.8999, "step": 10100 }, { "epoch": 0.32, "learning_rate": 1.2934400000000001e-05, "loss": 0.9015, "step": 10105 }, { "epoch": 0.32, "learning_rate": 1.29408e-05, "loss": 0.9041, "step": 10110 }, { "epoch": 0.32, "learning_rate": 1.2947200000000002e-05, "loss": 0.8987, "step": 10115 }, { "epoch": 0.32, "learning_rate": 1.2953600000000002e-05, "loss": 0.9014, "step": 10120 }, { "epoch": 0.32, "learning_rate": 1.2960000000000001e-05, "loss": 0.8922, "step": 10125 }, { "epoch": 0.32, "learning_rate": 1.2966400000000002e-05, "loss": 0.8928, "step": 10130 }, { "epoch": 0.32, "learning_rate": 1.29728e-05, "loss": 0.8986, "step": 10135 }, { "epoch": 0.32, "learning_rate": 1.2979200000000001e-05, "loss": 0.8968, "step": 10140 }, { "epoch": 0.32, "learning_rate": 1.29856e-05, "loss": 0.8996, "step": 10145 }, { "epoch": 0.32, "learning_rate": 1.2992e-05, "loss": 0.8947, "step": 10150 }, { "epoch": 0.32, "learning_rate": 1.2998400000000002e-05, "loss": 0.902, "step": 10155 }, { "epoch": 0.33, "learning_rate": 1.3004800000000001e-05, "loss": 0.8956, "step": 10160 }, { "epoch": 0.33, "learning_rate": 1.3011200000000002e-05, "loss": 0.906, "step": 10165 }, { "epoch": 0.33, "learning_rate": 1.30176e-05, "loss": 0.8974, "step": 10170 }, { "epoch": 0.33, "learning_rate": 1.3024000000000001e-05, "loss": 0.8932, "step": 10175 }, { "epoch": 0.33, "learning_rate": 1.3030400000000001e-05, "loss": 0.8941, "step": 10180 }, { "epoch": 0.33, "learning_rate": 1.30368e-05, "loss": 0.8992, "step": 10185 }, { "epoch": 0.33, "learning_rate": 1.30432e-05, "loss": 0.9014, "step": 10190 }, { "epoch": 0.33, "learning_rate": 1.30496e-05, "loss": 0.8956, "step": 10195 }, { "epoch": 0.33, "learning_rate": 1.3056000000000002e-05, "loss": 0.9015, "step": 10200 }, { "epoch": 0.33, "learning_rate": 1.3062400000000002e-05, "loss": 0.9172, "step": 10205 }, { "epoch": 0.33, "learning_rate": 1.3068800000000001e-05, "loss": 0.8982, "step": 10210 }, { "epoch": 0.33, "learning_rate": 1.3075200000000001e-05, "loss": 0.887, "step": 10215 }, { "epoch": 0.33, "learning_rate": 1.30816e-05, "loss": 0.8936, "step": 10220 }, { "epoch": 0.33, "learning_rate": 1.3088e-05, "loss": 0.8933, "step": 10225 }, { "epoch": 0.33, "learning_rate": 1.3094400000000001e-05, "loss": 0.8932, "step": 10230 }, { "epoch": 0.33, "learning_rate": 1.31008e-05, "loss": 0.9066, "step": 10235 }, { "epoch": 0.33, "learning_rate": 1.3107200000000002e-05, "loss": 0.9054, "step": 10240 }, { "epoch": 0.33, "learning_rate": 1.3113600000000003e-05, "loss": 0.9054, "step": 10245 }, { "epoch": 0.33, "learning_rate": 1.3120000000000001e-05, "loss": 0.8841, "step": 10250 }, { "epoch": 0.33, "learning_rate": 1.3126400000000002e-05, "loss": 0.893, "step": 10255 }, { "epoch": 0.33, "learning_rate": 1.31328e-05, "loss": 0.9032, "step": 10260 }, { "epoch": 0.33, "learning_rate": 1.3139200000000001e-05, "loss": 0.8861, "step": 10265 }, { "epoch": 0.33, "learning_rate": 1.31456e-05, "loss": 0.8973, "step": 10270 }, { "epoch": 0.33, "learning_rate": 1.3152e-05, "loss": 0.8916, "step": 10275 }, { "epoch": 0.33, "learning_rate": 1.31584e-05, "loss": 0.8998, "step": 10280 }, { "epoch": 0.33, "learning_rate": 1.3164800000000001e-05, "loss": 0.9097, "step": 10285 }, { "epoch": 0.33, "learning_rate": 1.3171200000000002e-05, "loss": 0.8925, "step": 10290 }, { "epoch": 0.33, "learning_rate": 1.31776e-05, "loss": 0.9011, "step": 10295 }, { "epoch": 0.33, "learning_rate": 1.3184000000000001e-05, "loss": 0.9051, "step": 10300 }, { "epoch": 0.33, "learning_rate": 1.3190400000000002e-05, "loss": 0.8907, "step": 10305 }, { "epoch": 0.33, "learning_rate": 1.31968e-05, "loss": 0.9045, "step": 10310 }, { "epoch": 0.33, "learning_rate": 1.3203200000000001e-05, "loss": 0.8973, "step": 10315 }, { "epoch": 0.33, "learning_rate": 1.32096e-05, "loss": 0.9093, "step": 10320 }, { "epoch": 0.33, "learning_rate": 1.3216000000000002e-05, "loss": 0.9144, "step": 10325 }, { "epoch": 0.33, "learning_rate": 1.3222400000000002e-05, "loss": 0.8914, "step": 10330 }, { "epoch": 0.33, "learning_rate": 1.3228800000000001e-05, "loss": 0.8904, "step": 10335 }, { "epoch": 0.33, "learning_rate": 1.3235200000000002e-05, "loss": 0.9105, "step": 10340 }, { "epoch": 0.33, "learning_rate": 1.32416e-05, "loss": 0.9057, "step": 10345 }, { "epoch": 0.33, "learning_rate": 1.3248000000000001e-05, "loss": 0.9008, "step": 10350 }, { "epoch": 0.33, "learning_rate": 1.3254400000000001e-05, "loss": 0.8903, "step": 10355 }, { "epoch": 0.33, "learning_rate": 1.32608e-05, "loss": 0.9035, "step": 10360 }, { "epoch": 0.33, "learning_rate": 1.32672e-05, "loss": 0.8682, "step": 10365 }, { "epoch": 0.33, "learning_rate": 1.3273600000000003e-05, "loss": 0.8956, "step": 10370 }, { "epoch": 0.33, "learning_rate": 1.3280000000000002e-05, "loss": 0.8888, "step": 10375 }, { "epoch": 0.33, "learning_rate": 1.3286400000000002e-05, "loss": 0.8963, "step": 10380 }, { "epoch": 0.33, "learning_rate": 1.3292800000000001e-05, "loss": 0.8928, "step": 10385 }, { "epoch": 0.33, "learning_rate": 1.3299200000000001e-05, "loss": 0.8888, "step": 10390 }, { "epoch": 0.33, "learning_rate": 1.33056e-05, "loss": 0.8873, "step": 10395 }, { "epoch": 0.33, "learning_rate": 1.3312e-05, "loss": 0.9129, "step": 10400 }, { "epoch": 0.33, "learning_rate": 1.33184e-05, "loss": 0.895, "step": 10405 }, { "epoch": 0.33, "learning_rate": 1.3324800000000002e-05, "loss": 0.8897, "step": 10410 }, { "epoch": 0.33, "learning_rate": 1.3331200000000002e-05, "loss": 0.8886, "step": 10415 }, { "epoch": 0.33, "learning_rate": 1.33376e-05, "loss": 0.8916, "step": 10420 }, { "epoch": 0.33, "learning_rate": 1.3344000000000001e-05, "loss": 0.9042, "step": 10425 }, { "epoch": 0.33, "learning_rate": 1.3350400000000002e-05, "loss": 0.9021, "step": 10430 }, { "epoch": 0.33, "learning_rate": 1.33568e-05, "loss": 0.8909, "step": 10435 }, { "epoch": 0.33, "learning_rate": 1.3363200000000001e-05, "loss": 0.9035, "step": 10440 }, { "epoch": 0.33, "learning_rate": 1.33696e-05, "loss": 0.8906, "step": 10445 }, { "epoch": 0.33, "learning_rate": 1.3376e-05, "loss": 0.8947, "step": 10450 }, { "epoch": 0.33, "learning_rate": 1.3382400000000003e-05, "loss": 0.9037, "step": 10455 }, { "epoch": 0.33, "learning_rate": 1.3388800000000001e-05, "loss": 0.8924, "step": 10460 }, { "epoch": 0.33, "learning_rate": 1.3395200000000002e-05, "loss": 0.9094, "step": 10465 }, { "epoch": 0.34, "learning_rate": 1.34016e-05, "loss": 0.875, "step": 10470 }, { "epoch": 0.34, "learning_rate": 1.3408000000000001e-05, "loss": 0.8961, "step": 10475 }, { "epoch": 0.34, "learning_rate": 1.3414400000000002e-05, "loss": 0.8841, "step": 10480 }, { "epoch": 0.34, "learning_rate": 1.34208e-05, "loss": 0.8884, "step": 10485 }, { "epoch": 0.34, "learning_rate": 1.34272e-05, "loss": 0.8942, "step": 10490 }, { "epoch": 0.34, "learning_rate": 1.3433600000000003e-05, "loss": 0.893, "step": 10495 }, { "epoch": 0.34, "learning_rate": 1.3440000000000002e-05, "loss": 0.8864, "step": 10500 }, { "epoch": 0.34, "learning_rate": 1.3446400000000002e-05, "loss": 0.8647, "step": 10505 }, { "epoch": 0.34, "learning_rate": 1.3452800000000001e-05, "loss": 0.8883, "step": 10510 }, { "epoch": 0.34, "learning_rate": 1.3459200000000002e-05, "loss": 0.8849, "step": 10515 }, { "epoch": 0.34, "learning_rate": 1.34656e-05, "loss": 0.9009, "step": 10520 }, { "epoch": 0.34, "learning_rate": 1.3472e-05, "loss": 0.8747, "step": 10525 }, { "epoch": 0.34, "learning_rate": 1.34784e-05, "loss": 0.887, "step": 10530 }, { "epoch": 0.34, "learning_rate": 1.34848e-05, "loss": 0.888, "step": 10535 }, { "epoch": 0.34, "learning_rate": 1.3491200000000002e-05, "loss": 0.8838, "step": 10540 }, { "epoch": 0.34, "learning_rate": 1.3497600000000001e-05, "loss": 0.8978, "step": 10545 }, { "epoch": 0.34, "learning_rate": 1.3504000000000001e-05, "loss": 0.8814, "step": 10550 }, { "epoch": 0.34, "learning_rate": 1.3510400000000002e-05, "loss": 0.8932, "step": 10555 }, { "epoch": 0.34, "learning_rate": 1.35168e-05, "loss": 0.8947, "step": 10560 }, { "epoch": 0.34, "learning_rate": 1.3523200000000001e-05, "loss": 0.8925, "step": 10565 }, { "epoch": 0.34, "learning_rate": 1.35296e-05, "loss": 0.8764, "step": 10570 }, { "epoch": 0.34, "learning_rate": 1.3536e-05, "loss": 0.8913, "step": 10575 }, { "epoch": 0.34, "learning_rate": 1.3542400000000003e-05, "loss": 0.8893, "step": 10580 }, { "epoch": 0.34, "learning_rate": 1.3548800000000001e-05, "loss": 0.9028, "step": 10585 }, { "epoch": 0.34, "learning_rate": 1.3555200000000002e-05, "loss": 0.8939, "step": 10590 }, { "epoch": 0.34, "learning_rate": 1.35616e-05, "loss": 0.8937, "step": 10595 }, { "epoch": 0.34, "learning_rate": 1.3568000000000001e-05, "loss": 0.89, "step": 10600 }, { "epoch": 0.34, "learning_rate": 1.3574400000000002e-05, "loss": 0.8855, "step": 10605 }, { "epoch": 0.34, "learning_rate": 1.35808e-05, "loss": 0.8795, "step": 10610 }, { "epoch": 0.34, "learning_rate": 1.3587200000000001e-05, "loss": 0.8955, "step": 10615 }, { "epoch": 0.34, "learning_rate": 1.35936e-05, "loss": 0.8859, "step": 10620 }, { "epoch": 0.34, "learning_rate": 1.3600000000000002e-05, "loss": 0.8937, "step": 10625 }, { "epoch": 0.34, "learning_rate": 1.3606400000000002e-05, "loss": 0.8842, "step": 10630 }, { "epoch": 0.34, "learning_rate": 1.3612800000000001e-05, "loss": 0.9083, "step": 10635 }, { "epoch": 0.34, "learning_rate": 1.3619200000000002e-05, "loss": 0.8776, "step": 10640 }, { "epoch": 0.34, "learning_rate": 1.36256e-05, "loss": 0.8911, "step": 10645 }, { "epoch": 0.34, "learning_rate": 1.3632000000000001e-05, "loss": 0.9006, "step": 10650 }, { "epoch": 0.34, "learning_rate": 1.36384e-05, "loss": 0.8794, "step": 10655 }, { "epoch": 0.34, "learning_rate": 1.36448e-05, "loss": 0.895, "step": 10660 }, { "epoch": 0.34, "learning_rate": 1.36512e-05, "loss": 0.8938, "step": 10665 }, { "epoch": 0.34, "learning_rate": 1.3657600000000001e-05, "loss": 0.8885, "step": 10670 }, { "epoch": 0.34, "learning_rate": 1.3664000000000002e-05, "loss": 0.8899, "step": 10675 }, { "epoch": 0.34, "learning_rate": 1.3670400000000002e-05, "loss": 0.8974, "step": 10680 }, { "epoch": 0.34, "learning_rate": 1.3676800000000001e-05, "loss": 0.8844, "step": 10685 }, { "epoch": 0.34, "learning_rate": 1.3683200000000001e-05, "loss": 0.9052, "step": 10690 }, { "epoch": 0.34, "learning_rate": 1.36896e-05, "loss": 0.8925, "step": 10695 }, { "epoch": 0.34, "learning_rate": 1.3696e-05, "loss": 0.8584, "step": 10700 }, { "epoch": 0.34, "learning_rate": 1.37024e-05, "loss": 0.8801, "step": 10705 }, { "epoch": 0.34, "learning_rate": 1.3708800000000002e-05, "loss": 0.8746, "step": 10710 }, { "epoch": 0.34, "learning_rate": 1.3715200000000002e-05, "loss": 0.8947, "step": 10715 }, { "epoch": 0.34, "learning_rate": 1.3721600000000001e-05, "loss": 0.8897, "step": 10720 }, { "epoch": 0.34, "learning_rate": 1.3728000000000001e-05, "loss": 0.8944, "step": 10725 }, { "epoch": 0.34, "learning_rate": 1.3734400000000002e-05, "loss": 0.8913, "step": 10730 }, { "epoch": 0.34, "learning_rate": 1.37408e-05, "loss": 0.8884, "step": 10735 }, { "epoch": 0.34, "learning_rate": 1.3747200000000001e-05, "loss": 0.8765, "step": 10740 }, { "epoch": 0.34, "learning_rate": 1.37536e-05, "loss": 0.8909, "step": 10745 }, { "epoch": 0.34, "learning_rate": 1.376e-05, "loss": 0.8928, "step": 10750 }, { "epoch": 0.34, "learning_rate": 1.3766400000000003e-05, "loss": 0.8694, "step": 10755 }, { "epoch": 0.34, "learning_rate": 1.3772800000000001e-05, "loss": 0.8824, "step": 10760 }, { "epoch": 0.34, "learning_rate": 1.3779200000000002e-05, "loss": 0.8904, "step": 10765 }, { "epoch": 0.34, "learning_rate": 1.37856e-05, "loss": 0.8989, "step": 10770 }, { "epoch": 0.34, "learning_rate": 1.3792000000000001e-05, "loss": 0.8722, "step": 10775 }, { "epoch": 0.34, "learning_rate": 1.37984e-05, "loss": 0.8918, "step": 10780 }, { "epoch": 0.35, "learning_rate": 1.38048e-05, "loss": 0.8864, "step": 10785 }, { "epoch": 0.35, "learning_rate": 1.3811200000000001e-05, "loss": 0.8812, "step": 10790 }, { "epoch": 0.35, "learning_rate": 1.3817600000000001e-05, "loss": 0.8763, "step": 10795 }, { "epoch": 0.35, "learning_rate": 1.3824000000000002e-05, "loss": 0.8849, "step": 10800 }, { "epoch": 0.35, "learning_rate": 1.3830400000000002e-05, "loss": 0.8876, "step": 10805 }, { "epoch": 0.35, "learning_rate": 1.3836800000000001e-05, "loss": 0.8805, "step": 10810 }, { "epoch": 0.35, "learning_rate": 1.3843200000000002e-05, "loss": 0.8907, "step": 10815 }, { "epoch": 0.35, "learning_rate": 1.38496e-05, "loss": 0.8727, "step": 10820 }, { "epoch": 0.35, "learning_rate": 1.3856e-05, "loss": 0.873, "step": 10825 }, { "epoch": 0.35, "learning_rate": 1.38624e-05, "loss": 0.8913, "step": 10830 }, { "epoch": 0.35, "learning_rate": 1.38688e-05, "loss": 0.8873, "step": 10835 }, { "epoch": 0.35, "learning_rate": 1.3875200000000002e-05, "loss": 0.8699, "step": 10840 }, { "epoch": 0.35, "learning_rate": 1.3881600000000001e-05, "loss": 0.8777, "step": 10845 }, { "epoch": 0.35, "learning_rate": 1.3888000000000002e-05, "loss": 0.8758, "step": 10850 }, { "epoch": 0.35, "learning_rate": 1.3894400000000002e-05, "loss": 0.8966, "step": 10855 }, { "epoch": 0.35, "learning_rate": 1.39008e-05, "loss": 0.8867, "step": 10860 }, { "epoch": 0.35, "learning_rate": 1.3907200000000001e-05, "loss": 0.8881, "step": 10865 }, { "epoch": 0.35, "learning_rate": 1.39136e-05, "loss": 0.887, "step": 10870 }, { "epoch": 0.35, "learning_rate": 1.392e-05, "loss": 0.8844, "step": 10875 }, { "epoch": 0.35, "learning_rate": 1.3926400000000003e-05, "loss": 0.8985, "step": 10880 }, { "epoch": 0.35, "learning_rate": 1.3932800000000002e-05, "loss": 0.8694, "step": 10885 }, { "epoch": 0.35, "learning_rate": 1.3939200000000002e-05, "loss": 0.8871, "step": 10890 }, { "epoch": 0.35, "learning_rate": 1.39456e-05, "loss": 0.8858, "step": 10895 }, { "epoch": 0.35, "learning_rate": 1.3952000000000001e-05, "loss": 0.8774, "step": 10900 }, { "epoch": 0.35, "learning_rate": 1.39584e-05, "loss": 0.8787, "step": 10905 }, { "epoch": 0.35, "learning_rate": 1.39648e-05, "loss": 0.8843, "step": 10910 }, { "epoch": 0.35, "learning_rate": 1.3971200000000001e-05, "loss": 0.8954, "step": 10915 }, { "epoch": 0.35, "learning_rate": 1.39776e-05, "loss": 0.8858, "step": 10920 }, { "epoch": 0.35, "learning_rate": 1.3984000000000002e-05, "loss": 0.8776, "step": 10925 }, { "epoch": 0.35, "learning_rate": 1.3990400000000002e-05, "loss": 0.8876, "step": 10930 }, { "epoch": 0.35, "learning_rate": 1.3996800000000001e-05, "loss": 0.8831, "step": 10935 }, { "epoch": 0.35, "learning_rate": 1.4003200000000002e-05, "loss": 0.8885, "step": 10940 }, { "epoch": 0.35, "learning_rate": 1.40096e-05, "loss": 0.8852, "step": 10945 }, { "epoch": 0.35, "learning_rate": 1.4016000000000001e-05, "loss": 0.8904, "step": 10950 }, { "epoch": 0.35, "learning_rate": 1.40224e-05, "loss": 0.8809, "step": 10955 }, { "epoch": 0.35, "learning_rate": 1.40288e-05, "loss": 0.889, "step": 10960 }, { "epoch": 0.35, "learning_rate": 1.4035200000000002e-05, "loss": 0.8751, "step": 10965 }, { "epoch": 0.35, "learning_rate": 1.4041600000000001e-05, "loss": 0.8711, "step": 10970 }, { "epoch": 0.35, "learning_rate": 1.4048000000000002e-05, "loss": 0.8929, "step": 10975 }, { "epoch": 0.35, "learning_rate": 1.4054400000000002e-05, "loss": 0.8937, "step": 10980 }, { "epoch": 0.35, "learning_rate": 1.4060800000000001e-05, "loss": 0.881, "step": 10985 }, { "epoch": 0.35, "learning_rate": 1.4067200000000001e-05, "loss": 0.8847, "step": 10990 }, { "epoch": 0.35, "learning_rate": 1.40736e-05, "loss": 0.885, "step": 10995 }, { "epoch": 0.35, "learning_rate": 1.408e-05, "loss": 0.8764, "step": 11000 }, { "epoch": 0.35, "learning_rate": 1.40864e-05, "loss": 0.8761, "step": 11005 }, { "epoch": 0.35, "learning_rate": 1.4092800000000002e-05, "loss": 0.8655, "step": 11010 }, { "epoch": 0.35, "learning_rate": 1.4099200000000002e-05, "loss": 0.8817, "step": 11015 }, { "epoch": 0.35, "learning_rate": 1.4105600000000001e-05, "loss": 0.8809, "step": 11020 }, { "epoch": 0.35, "learning_rate": 1.4112000000000001e-05, "loss": 0.8836, "step": 11025 }, { "epoch": 0.35, "learning_rate": 1.41184e-05, "loss": 0.881, "step": 11030 }, { "epoch": 0.35, "learning_rate": 1.41248e-05, "loss": 0.8952, "step": 11035 }, { "epoch": 0.35, "learning_rate": 1.4131200000000001e-05, "loss": 0.8836, "step": 11040 }, { "epoch": 0.35, "learning_rate": 1.41376e-05, "loss": 0.8929, "step": 11045 }, { "epoch": 0.35, "learning_rate": 1.4144000000000002e-05, "loss": 0.8994, "step": 11050 }, { "epoch": 0.35, "learning_rate": 1.4150400000000003e-05, "loss": 0.8899, "step": 11055 }, { "epoch": 0.35, "learning_rate": 1.4156800000000001e-05, "loss": 0.8771, "step": 11060 }, { "epoch": 0.35, "learning_rate": 1.4163200000000002e-05, "loss": 0.8796, "step": 11065 }, { "epoch": 0.35, "learning_rate": 1.41696e-05, "loss": 0.8878, "step": 11070 }, { "epoch": 0.35, "learning_rate": 1.4176000000000001e-05, "loss": 0.8794, "step": 11075 }, { "epoch": 0.35, "learning_rate": 1.41824e-05, "loss": 0.883, "step": 11080 }, { "epoch": 0.35, "learning_rate": 1.41888e-05, "loss": 0.8757, "step": 11085 }, { "epoch": 0.35, "learning_rate": 1.4195200000000001e-05, "loss": 0.878, "step": 11090 }, { "epoch": 0.36, "learning_rate": 1.4201600000000001e-05, "loss": 0.8723, "step": 11095 }, { "epoch": 0.36, "learning_rate": 1.4208000000000002e-05, "loss": 0.8807, "step": 11100 }, { "epoch": 0.36, "learning_rate": 1.4214400000000002e-05, "loss": 0.8707, "step": 11105 }, { "epoch": 0.36, "learning_rate": 1.4220800000000001e-05, "loss": 0.8782, "step": 11110 }, { "epoch": 0.36, "learning_rate": 1.4227200000000002e-05, "loss": 0.8701, "step": 11115 }, { "epoch": 0.36, "learning_rate": 1.42336e-05, "loss": 0.8817, "step": 11120 }, { "epoch": 0.36, "learning_rate": 1.4240000000000001e-05, "loss": 0.8782, "step": 11125 }, { "epoch": 0.36, "learning_rate": 1.42464e-05, "loss": 0.8796, "step": 11130 }, { "epoch": 0.36, "learning_rate": 1.4252800000000002e-05, "loss": 0.8741, "step": 11135 }, { "epoch": 0.36, "learning_rate": 1.4259200000000002e-05, "loss": 0.88, "step": 11140 }, { "epoch": 0.36, "learning_rate": 1.4265600000000001e-05, "loss": 0.8824, "step": 11145 }, { "epoch": 0.36, "learning_rate": 1.4272000000000002e-05, "loss": 0.8909, "step": 11150 }, { "epoch": 0.36, "learning_rate": 1.42784e-05, "loss": 0.8851, "step": 11155 }, { "epoch": 0.36, "learning_rate": 1.4284800000000001e-05, "loss": 0.8687, "step": 11160 }, { "epoch": 0.36, "learning_rate": 1.4291200000000001e-05, "loss": 0.8837, "step": 11165 }, { "epoch": 0.36, "learning_rate": 1.42976e-05, "loss": 0.8847, "step": 11170 }, { "epoch": 0.36, "learning_rate": 1.4304e-05, "loss": 0.8693, "step": 11175 }, { "epoch": 0.36, "learning_rate": 1.4310400000000003e-05, "loss": 0.8849, "step": 11180 }, { "epoch": 0.36, "learning_rate": 1.4316800000000002e-05, "loss": 0.8762, "step": 11185 }, { "epoch": 0.36, "learning_rate": 1.4323200000000002e-05, "loss": 0.8892, "step": 11190 }, { "epoch": 0.36, "learning_rate": 1.43296e-05, "loss": 0.8773, "step": 11195 }, { "epoch": 0.36, "learning_rate": 1.4336000000000001e-05, "loss": 0.8719, "step": 11200 }, { "epoch": 0.36, "learning_rate": 1.43424e-05, "loss": 0.8862, "step": 11205 }, { "epoch": 0.36, "learning_rate": 1.43488e-05, "loss": 0.8792, "step": 11210 }, { "epoch": 0.36, "learning_rate": 1.4355200000000001e-05, "loss": 0.8937, "step": 11215 }, { "epoch": 0.36, "learning_rate": 1.4361600000000002e-05, "loss": 0.8678, "step": 11220 }, { "epoch": 0.36, "learning_rate": 1.4368000000000002e-05, "loss": 0.8753, "step": 11225 }, { "epoch": 0.36, "learning_rate": 1.4374400000000003e-05, "loss": 0.8645, "step": 11230 }, { "epoch": 0.36, "learning_rate": 1.4380800000000001e-05, "loss": 0.8675, "step": 11235 }, { "epoch": 0.36, "learning_rate": 1.4387200000000002e-05, "loss": 0.8674, "step": 11240 }, { "epoch": 0.36, "learning_rate": 1.43936e-05, "loss": 0.8764, "step": 11245 }, { "epoch": 0.36, "learning_rate": 1.4400000000000001e-05, "loss": 0.8618, "step": 11250 }, { "epoch": 0.36, "learning_rate": 1.44064e-05, "loss": 0.8752, "step": 11255 }, { "epoch": 0.36, "learning_rate": 1.44128e-05, "loss": 0.8736, "step": 11260 }, { "epoch": 0.36, "learning_rate": 1.4419200000000002e-05, "loss": 0.8728, "step": 11265 }, { "epoch": 0.36, "learning_rate": 1.4425600000000001e-05, "loss": 0.8732, "step": 11270 }, { "epoch": 0.36, "learning_rate": 1.4432000000000002e-05, "loss": 0.875, "step": 11275 }, { "epoch": 0.36, "learning_rate": 1.44384e-05, "loss": 0.8535, "step": 11280 }, { "epoch": 0.36, "learning_rate": 1.4444800000000001e-05, "loss": 0.8847, "step": 11285 }, { "epoch": 0.36, "learning_rate": 1.4451200000000002e-05, "loss": 0.8757, "step": 11290 }, { "epoch": 0.36, "learning_rate": 1.44576e-05, "loss": 0.8608, "step": 11295 }, { "epoch": 0.36, "learning_rate": 1.4464e-05, "loss": 0.8687, "step": 11300 }, { "epoch": 0.36, "learning_rate": 1.4470400000000003e-05, "loss": 0.8982, "step": 11305 }, { "epoch": 0.36, "learning_rate": 1.4476800000000002e-05, "loss": 0.8786, "step": 11310 }, { "epoch": 0.36, "learning_rate": 1.4483200000000002e-05, "loss": 0.8846, "step": 11315 }, { "epoch": 0.36, "learning_rate": 1.4489600000000001e-05, "loss": 0.8762, "step": 11320 }, { "epoch": 0.36, "learning_rate": 1.4496000000000001e-05, "loss": 0.8704, "step": 11325 }, { "epoch": 0.36, "learning_rate": 1.45024e-05, "loss": 0.8655, "step": 11330 }, { "epoch": 0.36, "learning_rate": 1.45088e-05, "loss": 0.8827, "step": 11335 }, { "epoch": 0.36, "learning_rate": 1.4515200000000001e-05, "loss": 0.8808, "step": 11340 }, { "epoch": 0.36, "learning_rate": 1.45216e-05, "loss": 0.8686, "step": 11345 }, { "epoch": 0.36, "learning_rate": 1.4528000000000002e-05, "loss": 0.871, "step": 11350 }, { "epoch": 0.36, "learning_rate": 1.4534400000000003e-05, "loss": 0.883, "step": 11355 }, { "epoch": 0.36, "learning_rate": 1.4540800000000001e-05, "loss": 0.8749, "step": 11360 }, { "epoch": 0.36, "learning_rate": 1.4547200000000002e-05, "loss": 0.8802, "step": 11365 }, { "epoch": 0.36, "learning_rate": 1.45536e-05, "loss": 0.8818, "step": 11370 }, { "epoch": 0.36, "learning_rate": 1.4560000000000001e-05, "loss": 0.8716, "step": 11375 }, { "epoch": 0.36, "learning_rate": 1.45664e-05, "loss": 0.8789, "step": 11380 }, { "epoch": 0.36, "learning_rate": 1.45728e-05, "loss": 0.8783, "step": 11385 }, { "epoch": 0.36, "learning_rate": 1.4579200000000003e-05, "loss": 0.8681, "step": 11390 }, { "epoch": 0.36, "learning_rate": 1.4585600000000001e-05, "loss": 0.8707, "step": 11395 }, { "epoch": 0.36, "learning_rate": 1.4592000000000002e-05, "loss": 0.8665, "step": 11400 }, { "epoch": 0.36, "learning_rate": 1.45984e-05, "loss": 0.8926, "step": 11405 }, { "epoch": 0.37, "learning_rate": 1.4604800000000001e-05, "loss": 0.8729, "step": 11410 }, { "epoch": 0.37, "learning_rate": 1.4611200000000002e-05, "loss": 0.8811, "step": 11415 }, { "epoch": 0.37, "learning_rate": 1.46176e-05, "loss": 0.8823, "step": 11420 }, { "epoch": 0.37, "learning_rate": 1.4624000000000001e-05, "loss": 0.8832, "step": 11425 }, { "epoch": 0.37, "learning_rate": 1.46304e-05, "loss": 0.8746, "step": 11430 }, { "epoch": 0.37, "learning_rate": 1.4636800000000002e-05, "loss": 0.8845, "step": 11435 }, { "epoch": 0.37, "learning_rate": 1.4643200000000002e-05, "loss": 0.8639, "step": 11440 }, { "epoch": 0.37, "learning_rate": 1.4649600000000001e-05, "loss": 0.8679, "step": 11445 }, { "epoch": 0.37, "learning_rate": 1.4656000000000002e-05, "loss": 0.8749, "step": 11450 }, { "epoch": 0.37, "learning_rate": 1.46624e-05, "loss": 0.8602, "step": 11455 }, { "epoch": 0.37, "learning_rate": 1.4668800000000001e-05, "loss": 0.864, "step": 11460 }, { "epoch": 0.37, "learning_rate": 1.4675200000000001e-05, "loss": 0.8632, "step": 11465 }, { "epoch": 0.37, "learning_rate": 1.46816e-05, "loss": 0.8753, "step": 11470 }, { "epoch": 0.37, "learning_rate": 1.4688000000000002e-05, "loss": 0.8707, "step": 11475 }, { "epoch": 0.37, "learning_rate": 1.4694400000000003e-05, "loss": 0.8685, "step": 11480 }, { "epoch": 0.37, "learning_rate": 1.4700800000000002e-05, "loss": 0.8751, "step": 11485 }, { "epoch": 0.37, "learning_rate": 1.4707200000000002e-05, "loss": 0.866, "step": 11490 }, { "epoch": 0.37, "learning_rate": 1.4713600000000001e-05, "loss": 0.8794, "step": 11495 }, { "epoch": 0.37, "learning_rate": 1.4720000000000001e-05, "loss": 0.8592, "step": 11500 }, { "epoch": 0.37, "learning_rate": 1.47264e-05, "loss": 0.8665, "step": 11505 }, { "epoch": 0.37, "learning_rate": 1.47328e-05, "loss": 0.8701, "step": 11510 }, { "epoch": 0.37, "learning_rate": 1.47392e-05, "loss": 0.8772, "step": 11515 }, { "epoch": 0.37, "learning_rate": 1.4745600000000002e-05, "loss": 0.8805, "step": 11520 }, { "epoch": 0.37, "learning_rate": 1.4752000000000002e-05, "loss": 0.8699, "step": 11525 }, { "epoch": 0.37, "learning_rate": 1.4758400000000001e-05, "loss": 0.8747, "step": 11530 }, { "epoch": 0.37, "learning_rate": 1.4764800000000001e-05, "loss": 0.8655, "step": 11535 }, { "epoch": 0.37, "learning_rate": 1.4771200000000002e-05, "loss": 0.8636, "step": 11540 }, { "epoch": 0.37, "learning_rate": 1.47776e-05, "loss": 0.8666, "step": 11545 }, { "epoch": 0.37, "learning_rate": 1.4784000000000001e-05, "loss": 0.8676, "step": 11550 }, { "epoch": 0.37, "learning_rate": 1.47904e-05, "loss": 0.8739, "step": 11555 }, { "epoch": 0.37, "learning_rate": 1.4796800000000002e-05, "loss": 0.8625, "step": 11560 }, { "epoch": 0.37, "learning_rate": 1.4803200000000003e-05, "loss": 0.8808, "step": 11565 }, { "epoch": 0.37, "learning_rate": 1.4809600000000001e-05, "loss": 0.8587, "step": 11570 }, { "epoch": 0.37, "learning_rate": 1.4816000000000002e-05, "loss": 0.8636, "step": 11575 }, { "epoch": 0.37, "learning_rate": 1.48224e-05, "loss": 0.8629, "step": 11580 }, { "epoch": 0.37, "learning_rate": 1.4828800000000001e-05, "loss": 0.8564, "step": 11585 }, { "epoch": 0.37, "learning_rate": 1.4835200000000002e-05, "loss": 0.8913, "step": 11590 }, { "epoch": 0.37, "learning_rate": 1.48416e-05, "loss": 0.8724, "step": 11595 }, { "epoch": 0.37, "learning_rate": 1.4848e-05, "loss": 0.8739, "step": 11600 }, { "epoch": 0.37, "learning_rate": 1.4854400000000003e-05, "loss": 0.8689, "step": 11605 }, { "epoch": 0.37, "learning_rate": 1.4860800000000002e-05, "loss": 0.8602, "step": 11610 }, { "epoch": 0.37, "learning_rate": 1.4867200000000002e-05, "loss": 0.8689, "step": 11615 }, { "epoch": 0.37, "learning_rate": 1.4873600000000001e-05, "loss": 0.8757, "step": 11620 }, { "epoch": 0.37, "learning_rate": 1.4880000000000002e-05, "loss": 0.8693, "step": 11625 }, { "epoch": 0.37, "learning_rate": 1.48864e-05, "loss": 0.8738, "step": 11630 }, { "epoch": 0.37, "learning_rate": 1.48928e-05, "loss": 0.8735, "step": 11635 }, { "epoch": 0.37, "learning_rate": 1.48992e-05, "loss": 0.8587, "step": 11640 }, { "epoch": 0.37, "learning_rate": 1.4905600000000002e-05, "loss": 0.8732, "step": 11645 }, { "epoch": 0.37, "learning_rate": 1.4912000000000002e-05, "loss": 0.8544, "step": 11650 }, { "epoch": 0.37, "learning_rate": 1.4918400000000001e-05, "loss": 0.8576, "step": 11655 }, { "epoch": 0.37, "learning_rate": 1.4924800000000002e-05, "loss": 0.8788, "step": 11660 }, { "epoch": 0.37, "learning_rate": 1.4931200000000002e-05, "loss": 0.8654, "step": 11665 }, { "epoch": 0.37, "learning_rate": 1.49376e-05, "loss": 0.8721, "step": 11670 }, { "epoch": 0.37, "learning_rate": 1.4944000000000001e-05, "loss": 0.8674, "step": 11675 }, { "epoch": 0.37, "learning_rate": 1.49504e-05, "loss": 0.8778, "step": 11680 }, { "epoch": 0.37, "learning_rate": 1.49568e-05, "loss": 0.8673, "step": 11685 }, { "epoch": 0.37, "learning_rate": 1.4963200000000003e-05, "loss": 0.8684, "step": 11690 }, { "epoch": 0.37, "learning_rate": 1.4969600000000001e-05, "loss": 0.8632, "step": 11695 }, { "epoch": 0.37, "learning_rate": 1.4976000000000002e-05, "loss": 0.8746, "step": 11700 }, { "epoch": 0.37, "learning_rate": 1.49824e-05, "loss": 0.8715, "step": 11705 }, { "epoch": 0.37, "learning_rate": 1.4988800000000001e-05, "loss": 0.8731, "step": 11710 }, { "epoch": 0.37, "learning_rate": 1.4995200000000002e-05, "loss": 0.8759, "step": 11715 }, { "epoch": 0.38, "learning_rate": 1.50016e-05, "loss": 0.8707, "step": 11720 }, { "epoch": 0.38, "learning_rate": 1.5008000000000001e-05, "loss": 0.8678, "step": 11725 }, { "epoch": 0.38, "learning_rate": 1.5014400000000001e-05, "loss": 0.8699, "step": 11730 }, { "epoch": 0.38, "learning_rate": 1.5020800000000002e-05, "loss": 0.8649, "step": 11735 }, { "epoch": 0.38, "learning_rate": 1.5027200000000002e-05, "loss": 0.8721, "step": 11740 }, { "epoch": 0.38, "learning_rate": 1.5033600000000001e-05, "loss": 0.8694, "step": 11745 }, { "epoch": 0.38, "learning_rate": 1.5040000000000002e-05, "loss": 0.8584, "step": 11750 }, { "epoch": 0.38, "learning_rate": 1.50464e-05, "loss": 0.8805, "step": 11755 }, { "epoch": 0.38, "learning_rate": 1.5052800000000001e-05, "loss": 0.8687, "step": 11760 }, { "epoch": 0.38, "learning_rate": 1.50592e-05, "loss": 0.8668, "step": 11765 }, { "epoch": 0.38, "learning_rate": 1.50656e-05, "loss": 0.846, "step": 11770 }, { "epoch": 0.38, "learning_rate": 1.5072000000000002e-05, "loss": 0.8664, "step": 11775 }, { "epoch": 0.38, "learning_rate": 1.5078400000000001e-05, "loss": 0.868, "step": 11780 }, { "epoch": 0.38, "learning_rate": 1.5084800000000002e-05, "loss": 0.8618, "step": 11785 }, { "epoch": 0.38, "learning_rate": 1.5091200000000002e-05, "loss": 0.8687, "step": 11790 }, { "epoch": 0.38, "learning_rate": 1.5097600000000001e-05, "loss": 0.8734, "step": 11795 }, { "epoch": 0.38, "learning_rate": 1.5104000000000001e-05, "loss": 0.8628, "step": 11800 }, { "epoch": 0.38, "learning_rate": 1.51104e-05, "loss": 0.8628, "step": 11805 }, { "epoch": 0.38, "learning_rate": 1.51168e-05, "loss": 0.8706, "step": 11810 }, { "epoch": 0.38, "learning_rate": 1.5123200000000003e-05, "loss": 0.8714, "step": 11815 }, { "epoch": 0.38, "learning_rate": 1.5129600000000002e-05, "loss": 0.8713, "step": 11820 }, { "epoch": 0.38, "learning_rate": 1.5136000000000002e-05, "loss": 0.8615, "step": 11825 }, { "epoch": 0.38, "learning_rate": 1.5142400000000001e-05, "loss": 0.8592, "step": 11830 }, { "epoch": 0.38, "learning_rate": 1.5148800000000001e-05, "loss": 0.8593, "step": 11835 }, { "epoch": 0.38, "learning_rate": 1.51552e-05, "loss": 0.8467, "step": 11840 }, { "epoch": 0.38, "learning_rate": 1.51616e-05, "loss": 0.8556, "step": 11845 }, { "epoch": 0.38, "learning_rate": 1.5168000000000001e-05, "loss": 0.8636, "step": 11850 }, { "epoch": 0.38, "learning_rate": 1.51744e-05, "loss": 0.8526, "step": 11855 }, { "epoch": 0.38, "learning_rate": 1.5180800000000002e-05, "loss": 0.8652, "step": 11860 }, { "epoch": 0.38, "learning_rate": 1.5187200000000003e-05, "loss": 0.8567, "step": 11865 }, { "epoch": 0.38, "learning_rate": 1.5193600000000001e-05, "loss": 0.8545, "step": 11870 }, { "epoch": 0.38, "learning_rate": 1.5200000000000002e-05, "loss": 0.8876, "step": 11875 }, { "epoch": 0.38, "learning_rate": 1.52064e-05, "loss": 0.873, "step": 11880 }, { "epoch": 0.38, "learning_rate": 1.5212800000000001e-05, "loss": 0.856, "step": 11885 }, { "epoch": 0.38, "learning_rate": 1.52192e-05, "loss": 0.8618, "step": 11890 }, { "epoch": 0.38, "learning_rate": 1.52256e-05, "loss": 0.8571, "step": 11895 }, { "epoch": 0.38, "learning_rate": 1.5232000000000003e-05, "loss": 0.8542, "step": 11900 }, { "epoch": 0.38, "learning_rate": 1.5238400000000001e-05, "loss": 0.857, "step": 11905 }, { "epoch": 0.38, "learning_rate": 1.5244800000000002e-05, "loss": 0.8711, "step": 11910 }, { "epoch": 0.38, "learning_rate": 1.5251200000000002e-05, "loss": 0.8653, "step": 11915 }, { "epoch": 0.38, "learning_rate": 1.5257600000000001e-05, "loss": 0.8591, "step": 11920 }, { "epoch": 0.38, "learning_rate": 1.5264e-05, "loss": 0.8574, "step": 11925 }, { "epoch": 0.38, "learning_rate": 1.5270400000000002e-05, "loss": 0.8592, "step": 11930 }, { "epoch": 0.38, "learning_rate": 1.52768e-05, "loss": 0.8653, "step": 11935 }, { "epoch": 0.38, "learning_rate": 1.52832e-05, "loss": 0.8716, "step": 11940 }, { "epoch": 0.38, "learning_rate": 1.5289600000000004e-05, "loss": 0.8832, "step": 11945 }, { "epoch": 0.38, "learning_rate": 1.5296e-05, "loss": 0.8701, "step": 11950 }, { "epoch": 0.38, "learning_rate": 1.53024e-05, "loss": 0.8643, "step": 11955 }, { "epoch": 0.38, "learning_rate": 1.53088e-05, "loss": 0.8659, "step": 11960 }, { "epoch": 0.38, "learning_rate": 1.5315200000000002e-05, "loss": 0.8872, "step": 11965 }, { "epoch": 0.38, "learning_rate": 1.5321600000000003e-05, "loss": 0.8671, "step": 11970 }, { "epoch": 0.38, "learning_rate": 1.5328e-05, "loss": 0.8699, "step": 11975 }, { "epoch": 0.38, "learning_rate": 1.53344e-05, "loss": 0.865, "step": 11980 }, { "epoch": 0.38, "learning_rate": 1.5340800000000004e-05, "loss": 0.8639, "step": 11985 }, { "epoch": 0.38, "learning_rate": 1.53472e-05, "loss": 0.8504, "step": 11990 }, { "epoch": 0.38, "learning_rate": 1.53536e-05, "loss": 0.8714, "step": 11995 }, { "epoch": 0.38, "learning_rate": 1.5360000000000002e-05, "loss": 0.8624, "step": 12000 }, { "epoch": 0.38, "learning_rate": 1.5366400000000002e-05, "loss": 0.8706, "step": 12005 }, { "epoch": 0.38, "learning_rate": 1.53728e-05, "loss": 0.863, "step": 12010 }, { "epoch": 0.38, "learning_rate": 1.53792e-05, "loss": 0.8778, "step": 12015 }, { "epoch": 0.38, "learning_rate": 1.53856e-05, "loss": 0.8794, "step": 12020 }, { "epoch": 0.38, "learning_rate": 1.5392e-05, "loss": 0.863, "step": 12025 }, { "epoch": 0.38, "learning_rate": 1.53984e-05, "loss": 0.8576, "step": 12030 }, { "epoch": 0.39, "learning_rate": 1.5404800000000002e-05, "loss": 0.8626, "step": 12035 }, { "epoch": 0.39, "learning_rate": 1.5411200000000002e-05, "loss": 0.8556, "step": 12040 }, { "epoch": 0.39, "learning_rate": 1.5417600000000003e-05, "loss": 0.8436, "step": 12045 }, { "epoch": 0.39, "learning_rate": 1.5424e-05, "loss": 0.8655, "step": 12050 }, { "epoch": 0.39, "learning_rate": 1.54304e-05, "loss": 0.8631, "step": 12055 }, { "epoch": 0.39, "learning_rate": 1.54368e-05, "loss": 0.868, "step": 12060 }, { "epoch": 0.39, "learning_rate": 1.54432e-05, "loss": 0.8657, "step": 12065 }, { "epoch": 0.39, "learning_rate": 1.5449600000000002e-05, "loss": 0.858, "step": 12070 }, { "epoch": 0.39, "learning_rate": 1.5456000000000002e-05, "loss": 0.8656, "step": 12075 }, { "epoch": 0.39, "learning_rate": 1.5462400000000003e-05, "loss": 0.8584, "step": 12080 }, { "epoch": 0.39, "learning_rate": 1.54688e-05, "loss": 0.8471, "step": 12085 }, { "epoch": 0.39, "learning_rate": 1.54752e-05, "loss": 0.8571, "step": 12090 }, { "epoch": 0.39, "learning_rate": 1.54816e-05, "loss": 0.8547, "step": 12095 }, { "epoch": 0.39, "learning_rate": 1.5488e-05, "loss": 0.8729, "step": 12100 }, { "epoch": 0.39, "learning_rate": 1.5494400000000002e-05, "loss": 0.8682, "step": 12105 }, { "epoch": 0.39, "learning_rate": 1.55008e-05, "loss": 0.8559, "step": 12110 }, { "epoch": 0.39, "learning_rate": 1.5507200000000003e-05, "loss": 0.8639, "step": 12115 }, { "epoch": 0.39, "learning_rate": 1.5513600000000003e-05, "loss": 0.8555, "step": 12120 }, { "epoch": 0.39, "learning_rate": 1.552e-05, "loss": 0.8574, "step": 12125 }, { "epoch": 0.39, "learning_rate": 1.55264e-05, "loss": 0.8623, "step": 12130 }, { "epoch": 0.39, "learning_rate": 1.55328e-05, "loss": 0.8655, "step": 12135 }, { "epoch": 0.39, "learning_rate": 1.5539200000000002e-05, "loss": 0.8604, "step": 12140 }, { "epoch": 0.39, "learning_rate": 1.55456e-05, "loss": 0.8628, "step": 12145 }, { "epoch": 0.39, "learning_rate": 1.5552e-05, "loss": 0.8471, "step": 12150 }, { "epoch": 0.39, "learning_rate": 1.55584e-05, "loss": 0.8698, "step": 12155 }, { "epoch": 0.39, "learning_rate": 1.55648e-05, "loss": 0.8561, "step": 12160 }, { "epoch": 0.39, "learning_rate": 1.55712e-05, "loss": 0.8602, "step": 12165 }, { "epoch": 0.39, "learning_rate": 1.55776e-05, "loss": 0.8536, "step": 12170 }, { "epoch": 0.39, "learning_rate": 1.5584000000000002e-05, "loss": 0.8674, "step": 12175 }, { "epoch": 0.39, "learning_rate": 1.5590400000000002e-05, "loss": 0.8667, "step": 12180 }, { "epoch": 0.39, "learning_rate": 1.55968e-05, "loss": 0.852, "step": 12185 }, { "epoch": 0.39, "learning_rate": 1.56032e-05, "loss": 0.8586, "step": 12190 }, { "epoch": 0.39, "learning_rate": 1.56096e-05, "loss": 0.8561, "step": 12195 }, { "epoch": 0.39, "learning_rate": 1.5616e-05, "loss": 0.8529, "step": 12200 }, { "epoch": 0.39, "learning_rate": 1.56224e-05, "loss": 0.8586, "step": 12205 }, { "epoch": 0.39, "learning_rate": 1.5628800000000002e-05, "loss": 0.8549, "step": 12210 }, { "epoch": 0.39, "learning_rate": 1.5635200000000002e-05, "loss": 0.8509, "step": 12215 }, { "epoch": 0.39, "learning_rate": 1.5641600000000003e-05, "loss": 0.8707, "step": 12220 }, { "epoch": 0.39, "learning_rate": 1.5648e-05, "loss": 0.8684, "step": 12225 }, { "epoch": 0.39, "learning_rate": 1.56544e-05, "loss": 0.865, "step": 12230 }, { "epoch": 0.39, "learning_rate": 1.56608e-05, "loss": 0.8534, "step": 12235 }, { "epoch": 0.39, "learning_rate": 1.56672e-05, "loss": 0.8701, "step": 12240 }, { "epoch": 0.39, "learning_rate": 1.5673600000000002e-05, "loss": 0.8476, "step": 12245 }, { "epoch": 0.39, "learning_rate": 1.5680000000000002e-05, "loss": 0.8584, "step": 12250 }, { "epoch": 0.39, "learning_rate": 1.5686400000000003e-05, "loss": 0.853, "step": 12255 }, { "epoch": 0.39, "learning_rate": 1.56928e-05, "loss": 0.8693, "step": 12260 }, { "epoch": 0.39, "learning_rate": 1.56992e-05, "loss": 0.8523, "step": 12265 }, { "epoch": 0.39, "learning_rate": 1.57056e-05, "loss": 0.8683, "step": 12270 }, { "epoch": 0.39, "learning_rate": 1.5712e-05, "loss": 0.8569, "step": 12275 }, { "epoch": 0.39, "learning_rate": 1.5718400000000002e-05, "loss": 0.8496, "step": 12280 }, { "epoch": 0.39, "learning_rate": 1.5724800000000002e-05, "loss": 0.8606, "step": 12285 }, { "epoch": 0.39, "learning_rate": 1.5731200000000003e-05, "loss": 0.8777, "step": 12290 }, { "epoch": 0.39, "learning_rate": 1.5737600000000003e-05, "loss": 0.8419, "step": 12295 }, { "epoch": 0.39, "learning_rate": 1.5744e-05, "loss": 0.8528, "step": 12300 }, { "epoch": 0.39, "learning_rate": 1.57504e-05, "loss": 0.8637, "step": 12305 }, { "epoch": 0.39, "learning_rate": 1.57568e-05, "loss": 0.8646, "step": 12310 }, { "epoch": 0.39, "learning_rate": 1.5763200000000002e-05, "loss": 0.869, "step": 12315 }, { "epoch": 0.39, "learning_rate": 1.57696e-05, "loss": 0.8551, "step": 12320 }, { "epoch": 0.39, "learning_rate": 1.5776e-05, "loss": 0.8652, "step": 12325 }, { "epoch": 0.39, "learning_rate": 1.5782400000000003e-05, "loss": 0.8645, "step": 12330 }, { "epoch": 0.39, "learning_rate": 1.57888e-05, "loss": 0.8595, "step": 12335 }, { "epoch": 0.39, "learning_rate": 1.57952e-05, "loss": 0.8501, "step": 12340 }, { "epoch": 0.4, "learning_rate": 1.58016e-05, "loss": 0.8583, "step": 12345 }, { "epoch": 0.4, "learning_rate": 1.5808000000000002e-05, "loss": 0.8744, "step": 12350 }, { "epoch": 0.4, "learning_rate": 1.5814400000000002e-05, "loss": 0.8608, "step": 12355 }, { "epoch": 0.4, "learning_rate": 1.58208e-05, "loss": 0.8556, "step": 12360 }, { "epoch": 0.4, "learning_rate": 1.58272e-05, "loss": 0.8554, "step": 12365 }, { "epoch": 0.4, "learning_rate": 1.5833600000000004e-05, "loss": 0.8425, "step": 12370 }, { "epoch": 0.4, "learning_rate": 1.584e-05, "loss": 0.8558, "step": 12375 }, { "epoch": 0.4, "learning_rate": 1.58464e-05, "loss": 0.8594, "step": 12380 }, { "epoch": 0.4, "learning_rate": 1.5852800000000002e-05, "loss": 0.8439, "step": 12385 }, { "epoch": 0.4, "learning_rate": 1.5859200000000002e-05, "loss": 0.8461, "step": 12390 }, { "epoch": 0.4, "learning_rate": 1.58656e-05, "loss": 0.8661, "step": 12395 }, { "epoch": 0.4, "learning_rate": 1.5872e-05, "loss": 0.8695, "step": 12400 }, { "epoch": 0.4, "learning_rate": 1.58784e-05, "loss": 0.8494, "step": 12405 }, { "epoch": 0.4, "learning_rate": 1.58848e-05, "loss": 0.8566, "step": 12410 }, { "epoch": 0.4, "learning_rate": 1.58912e-05, "loss": 0.8615, "step": 12415 }, { "epoch": 0.4, "learning_rate": 1.5897600000000002e-05, "loss": 0.8553, "step": 12420 }, { "epoch": 0.4, "learning_rate": 1.5904000000000002e-05, "loss": 0.8465, "step": 12425 }, { "epoch": 0.4, "learning_rate": 1.5910400000000003e-05, "loss": 0.8532, "step": 12430 }, { "epoch": 0.4, "learning_rate": 1.59168e-05, "loss": 0.849, "step": 12435 }, { "epoch": 0.4, "learning_rate": 1.59232e-05, "loss": 0.8599, "step": 12440 }, { "epoch": 0.4, "learning_rate": 1.59296e-05, "loss": 0.8631, "step": 12445 }, { "epoch": 0.4, "learning_rate": 1.5936e-05, "loss": 0.8571, "step": 12450 }, { "epoch": 0.4, "learning_rate": 1.5942400000000002e-05, "loss": 0.8572, "step": 12455 }, { "epoch": 0.4, "learning_rate": 1.5948800000000002e-05, "loss": 0.8501, "step": 12460 }, { "epoch": 0.4, "learning_rate": 1.5955200000000003e-05, "loss": 0.8467, "step": 12465 }, { "epoch": 0.4, "learning_rate": 1.5961600000000003e-05, "loss": 0.8675, "step": 12470 }, { "epoch": 0.4, "learning_rate": 1.5968e-05, "loss": 0.8548, "step": 12475 }, { "epoch": 0.4, "learning_rate": 1.59744e-05, "loss": 0.8594, "step": 12480 }, { "epoch": 0.4, "learning_rate": 1.59808e-05, "loss": 0.8452, "step": 12485 }, { "epoch": 0.4, "learning_rate": 1.5987200000000002e-05, "loss": 0.8532, "step": 12490 }, { "epoch": 0.4, "learning_rate": 1.59936e-05, "loss": 0.8555, "step": 12495 }, { "epoch": 0.4, "learning_rate": 1.6000000000000003e-05, "loss": 0.8615, "step": 12500 }, { "epoch": 0.4, "learning_rate": 1.6006400000000003e-05, "loss": 0.8471, "step": 12505 }, { "epoch": 0.4, "learning_rate": 1.60128e-05, "loss": 0.8555, "step": 12510 }, { "epoch": 0.4, "learning_rate": 1.60192e-05, "loss": 0.8453, "step": 12515 }, { "epoch": 0.4, "learning_rate": 1.60256e-05, "loss": 0.8502, "step": 12520 }, { "epoch": 0.4, "learning_rate": 1.6032e-05, "loss": 0.8445, "step": 12525 }, { "epoch": 0.4, "learning_rate": 1.6038400000000002e-05, "loss": 0.8469, "step": 12530 }, { "epoch": 0.4, "learning_rate": 1.60448e-05, "loss": 0.8498, "step": 12535 }, { "epoch": 0.4, "learning_rate": 1.6051200000000003e-05, "loss": 0.8576, "step": 12540 }, { "epoch": 0.4, "learning_rate": 1.6057600000000004e-05, "loss": 0.8501, "step": 12545 }, { "epoch": 0.4, "learning_rate": 1.6064e-05, "loss": 0.8534, "step": 12550 }, { "epoch": 0.4, "learning_rate": 1.60704e-05, "loss": 0.861, "step": 12555 }, { "epoch": 0.4, "learning_rate": 1.60768e-05, "loss": 0.8544, "step": 12560 }, { "epoch": 0.4, "learning_rate": 1.6083200000000002e-05, "loss": 0.8338, "step": 12565 }, { "epoch": 0.4, "learning_rate": 1.60896e-05, "loss": 0.8596, "step": 12570 }, { "epoch": 0.4, "learning_rate": 1.6096e-05, "loss": 0.8688, "step": 12575 }, { "epoch": 0.4, "learning_rate": 1.61024e-05, "loss": 0.8517, "step": 12580 }, { "epoch": 0.4, "learning_rate": 1.61088e-05, "loss": 0.8502, "step": 12585 }, { "epoch": 0.4, "learning_rate": 1.61152e-05, "loss": 0.851, "step": 12590 }, { "epoch": 0.4, "learning_rate": 1.61216e-05, "loss": 0.862, "step": 12595 }, { "epoch": 0.4, "learning_rate": 1.6128000000000002e-05, "loss": 0.8616, "step": 12600 }, { "epoch": 0.4, "learning_rate": 1.6134400000000003e-05, "loss": 0.848, "step": 12605 }, { "epoch": 0.4, "learning_rate": 1.61408e-05, "loss": 0.8418, "step": 12610 }, { "epoch": 0.4, "learning_rate": 1.61472e-05, "loss": 0.8567, "step": 12615 }, { "epoch": 0.4, "learning_rate": 1.61536e-05, "loss": 0.8545, "step": 12620 }, { "epoch": 0.4, "learning_rate": 1.616e-05, "loss": 0.8522, "step": 12625 }, { "epoch": 0.4, "learning_rate": 1.61664e-05, "loss": 0.8513, "step": 12630 }, { "epoch": 0.4, "learning_rate": 1.6172800000000002e-05, "loss": 0.8665, "step": 12635 }, { "epoch": 0.4, "learning_rate": 1.6179200000000003e-05, "loss": 0.8537, "step": 12640 }, { "epoch": 0.4, "learning_rate": 1.61856e-05, "loss": 0.8581, "step": 12645 }, { "epoch": 0.4, "learning_rate": 1.6192e-05, "loss": 0.8471, "step": 12650 }, { "epoch": 0.4, "learning_rate": 1.61984e-05, "loss": 0.8557, "step": 12655 }, { "epoch": 0.41, "learning_rate": 1.62048e-05, "loss": 0.8577, "step": 12660 }, { "epoch": 0.41, "learning_rate": 1.62112e-05, "loss": 0.8494, "step": 12665 }, { "epoch": 0.41, "learning_rate": 1.6217600000000002e-05, "loss": 0.8476, "step": 12670 }, { "epoch": 0.41, "learning_rate": 1.6224000000000003e-05, "loss": 0.8333, "step": 12675 }, { "epoch": 0.41, "learning_rate": 1.6230400000000003e-05, "loss": 0.8592, "step": 12680 }, { "epoch": 0.41, "learning_rate": 1.62368e-05, "loss": 0.8592, "step": 12685 }, { "epoch": 0.41, "learning_rate": 1.62432e-05, "loss": 0.8462, "step": 12690 }, { "epoch": 0.41, "learning_rate": 1.62496e-05, "loss": 0.8662, "step": 12695 }, { "epoch": 0.41, "learning_rate": 1.6256e-05, "loss": 0.8598, "step": 12700 }, { "epoch": 0.41, "learning_rate": 1.6262400000000002e-05, "loss": 0.8409, "step": 12705 }, { "epoch": 0.41, "learning_rate": 1.6268800000000003e-05, "loss": 0.8552, "step": 12710 }, { "epoch": 0.41, "learning_rate": 1.6275200000000003e-05, "loss": 0.8476, "step": 12715 }, { "epoch": 0.41, "learning_rate": 1.6281600000000003e-05, "loss": 0.8488, "step": 12720 }, { "epoch": 0.41, "learning_rate": 1.6288e-05, "loss": 0.8546, "step": 12725 }, { "epoch": 0.41, "learning_rate": 1.62944e-05, "loss": 0.8441, "step": 12730 }, { "epoch": 0.41, "learning_rate": 1.63008e-05, "loss": 0.8534, "step": 12735 }, { "epoch": 0.41, "learning_rate": 1.6307200000000002e-05, "loss": 0.8496, "step": 12740 }, { "epoch": 0.41, "learning_rate": 1.63136e-05, "loss": 0.844, "step": 12745 }, { "epoch": 0.41, "learning_rate": 1.632e-05, "loss": 0.8457, "step": 12750 }, { "epoch": 0.41, "learning_rate": 1.6326400000000003e-05, "loss": 0.8594, "step": 12755 }, { "epoch": 0.41, "learning_rate": 1.63328e-05, "loss": 0.8597, "step": 12760 }, { "epoch": 0.41, "learning_rate": 1.63392e-05, "loss": 0.841, "step": 12765 }, { "epoch": 0.41, "learning_rate": 1.63456e-05, "loss": 0.8607, "step": 12770 }, { "epoch": 0.41, "learning_rate": 1.6352000000000002e-05, "loss": 0.8301, "step": 12775 }, { "epoch": 0.41, "learning_rate": 1.6358400000000002e-05, "loss": 0.8445, "step": 12780 }, { "epoch": 0.41, "learning_rate": 1.63648e-05, "loss": 0.8404, "step": 12785 }, { "epoch": 0.41, "learning_rate": 1.63712e-05, "loss": 0.8545, "step": 12790 }, { "epoch": 0.41, "learning_rate": 1.6377600000000004e-05, "loss": 0.8532, "step": 12795 }, { "epoch": 0.41, "learning_rate": 1.6384e-05, "loss": 0.8558, "step": 12800 }, { "epoch": 0.41, "learning_rate": 1.63904e-05, "loss": 0.8465, "step": 12805 }, { "epoch": 0.41, "learning_rate": 1.6396800000000002e-05, "loss": 0.8459, "step": 12810 }, { "epoch": 0.41, "learning_rate": 1.6403200000000002e-05, "loss": 0.8424, "step": 12815 }, { "epoch": 0.41, "learning_rate": 1.64096e-05, "loss": 0.8409, "step": 12820 }, { "epoch": 0.41, "learning_rate": 1.6416e-05, "loss": 0.8441, "step": 12825 }, { "epoch": 0.41, "learning_rate": 1.64224e-05, "loss": 0.8437, "step": 12830 }, { "epoch": 0.41, "learning_rate": 1.64288e-05, "loss": 0.8489, "step": 12835 }, { "epoch": 0.41, "learning_rate": 1.64352e-05, "loss": 0.8468, "step": 12840 }, { "epoch": 0.41, "learning_rate": 1.6441600000000002e-05, "loss": 0.8446, "step": 12845 }, { "epoch": 0.41, "learning_rate": 1.6448000000000002e-05, "loss": 0.8517, "step": 12850 }, { "epoch": 0.41, "learning_rate": 1.6454400000000003e-05, "loss": 0.8513, "step": 12855 }, { "epoch": 0.41, "learning_rate": 1.64608e-05, "loss": 0.8444, "step": 12860 }, { "epoch": 0.41, "learning_rate": 1.64672e-05, "loss": 0.8428, "step": 12865 }, { "epoch": 0.41, "learning_rate": 1.64736e-05, "loss": 0.8445, "step": 12870 }, { "epoch": 0.41, "learning_rate": 1.648e-05, "loss": 0.8584, "step": 12875 }, { "epoch": 0.41, "learning_rate": 1.6486400000000002e-05, "loss": 0.8393, "step": 12880 }, { "epoch": 0.41, "learning_rate": 1.6492800000000002e-05, "loss": 0.8401, "step": 12885 }, { "epoch": 0.41, "learning_rate": 1.6499200000000003e-05, "loss": 0.8489, "step": 12890 }, { "epoch": 0.41, "learning_rate": 1.65056e-05, "loss": 0.8663, "step": 12895 }, { "epoch": 0.41, "learning_rate": 1.6512e-05, "loss": 0.8541, "step": 12900 }, { "epoch": 0.41, "learning_rate": 1.65184e-05, "loss": 0.8419, "step": 12905 }, { "epoch": 0.41, "learning_rate": 1.65248e-05, "loss": 0.8382, "step": 12910 }, { "epoch": 0.41, "learning_rate": 1.6531200000000002e-05, "loss": 0.8482, "step": 12915 }, { "epoch": 0.41, "learning_rate": 1.65376e-05, "loss": 0.8531, "step": 12920 }, { "epoch": 0.41, "learning_rate": 1.6544000000000003e-05, "loss": 0.8519, "step": 12925 }, { "epoch": 0.41, "learning_rate": 1.6550400000000003e-05, "loss": 0.8506, "step": 12930 }, { "epoch": 0.41, "learning_rate": 1.65568e-05, "loss": 0.8425, "step": 12935 }, { "epoch": 0.41, "learning_rate": 1.65632e-05, "loss": 0.8519, "step": 12940 }, { "epoch": 0.41, "learning_rate": 1.65696e-05, "loss": 0.8315, "step": 12945 }, { "epoch": 0.41, "learning_rate": 1.6576000000000002e-05, "loss": 0.852, "step": 12950 }, { "epoch": 0.41, "learning_rate": 1.6582400000000002e-05, "loss": 0.865, "step": 12955 }, { "epoch": 0.41, "learning_rate": 1.65888e-05, "loss": 0.8403, "step": 12960 }, { "epoch": 0.41, "learning_rate": 1.6595200000000003e-05, "loss": 0.8565, "step": 12965 }, { "epoch": 0.42, "learning_rate": 1.6601600000000004e-05, "loss": 0.8518, "step": 12970 }, { "epoch": 0.42, "learning_rate": 1.6608e-05, "loss": 0.8308, "step": 12975 }, { "epoch": 0.42, "learning_rate": 1.66144e-05, "loss": 0.8519, "step": 12980 }, { "epoch": 0.42, "learning_rate": 1.6620800000000002e-05, "loss": 0.8368, "step": 12985 }, { "epoch": 0.42, "learning_rate": 1.6627200000000002e-05, "loss": 0.8295, "step": 12990 }, { "epoch": 0.42, "learning_rate": 1.66336e-05, "loss": 0.8455, "step": 12995 }, { "epoch": 0.42, "learning_rate": 1.664e-05, "loss": 0.8491, "step": 13000 }, { "epoch": 0.42, "learning_rate": 1.66464e-05, "loss": 0.8466, "step": 13005 }, { "epoch": 0.42, "learning_rate": 1.66528e-05, "loss": 0.8259, "step": 13010 }, { "epoch": 0.42, "learning_rate": 1.66592e-05, "loss": 0.8609, "step": 13015 }, { "epoch": 0.42, "learning_rate": 1.6665600000000002e-05, "loss": 0.8392, "step": 13020 }, { "epoch": 0.42, "learning_rate": 1.6672000000000002e-05, "loss": 0.8337, "step": 13025 }, { "epoch": 0.42, "learning_rate": 1.6678400000000003e-05, "loss": 0.8452, "step": 13030 }, { "epoch": 0.42, "learning_rate": 1.66848e-05, "loss": 0.8362, "step": 13035 }, { "epoch": 0.42, "learning_rate": 1.66912e-05, "loss": 0.832, "step": 13040 }, { "epoch": 0.42, "learning_rate": 1.66976e-05, "loss": 0.8538, "step": 13045 }, { "epoch": 0.42, "learning_rate": 1.6704e-05, "loss": 0.8519, "step": 13050 }, { "epoch": 0.42, "learning_rate": 1.6710400000000002e-05, "loss": 0.8486, "step": 13055 }, { "epoch": 0.42, "learning_rate": 1.6716800000000002e-05, "loss": 0.8375, "step": 13060 }, { "epoch": 0.42, "learning_rate": 1.6723200000000003e-05, "loss": 0.8443, "step": 13065 }, { "epoch": 0.42, "learning_rate": 1.67296e-05, "loss": 0.847, "step": 13070 }, { "epoch": 0.42, "learning_rate": 1.6736e-05, "loss": 0.8426, "step": 13075 }, { "epoch": 0.42, "learning_rate": 1.67424e-05, "loss": 0.8566, "step": 13080 }, { "epoch": 0.42, "learning_rate": 1.67488e-05, "loss": 0.8459, "step": 13085 }, { "epoch": 0.42, "learning_rate": 1.6755200000000002e-05, "loss": 0.8294, "step": 13090 }, { "epoch": 0.42, "learning_rate": 1.6761600000000002e-05, "loss": 0.8421, "step": 13095 }, { "epoch": 0.42, "learning_rate": 1.6768000000000003e-05, "loss": 0.8391, "step": 13100 }, { "epoch": 0.42, "learning_rate": 1.6774400000000003e-05, "loss": 0.8439, "step": 13105 }, { "epoch": 0.42, "learning_rate": 1.67808e-05, "loss": 0.8449, "step": 13110 }, { "epoch": 0.42, "learning_rate": 1.67872e-05, "loss": 0.8493, "step": 13115 }, { "epoch": 0.42, "learning_rate": 1.67936e-05, "loss": 0.8456, "step": 13120 }, { "epoch": 0.42, "learning_rate": 1.6800000000000002e-05, "loss": 0.8449, "step": 13125 }, { "epoch": 0.42, "learning_rate": 1.68064e-05, "loss": 0.8359, "step": 13130 }, { "epoch": 0.42, "learning_rate": 1.6812800000000003e-05, "loss": 0.8436, "step": 13135 }, { "epoch": 0.42, "learning_rate": 1.6819200000000003e-05, "loss": 0.84, "step": 13140 }, { "epoch": 0.42, "learning_rate": 1.68256e-05, "loss": 0.8582, "step": 13145 }, { "epoch": 0.42, "learning_rate": 1.6832e-05, "loss": 0.837, "step": 13150 }, { "epoch": 0.42, "learning_rate": 1.68384e-05, "loss": 0.84, "step": 13155 }, { "epoch": 0.42, "learning_rate": 1.6844800000000002e-05, "loss": 0.8384, "step": 13160 }, { "epoch": 0.42, "learning_rate": 1.6851200000000002e-05, "loss": 0.8378, "step": 13165 }, { "epoch": 0.42, "learning_rate": 1.68576e-05, "loss": 0.8475, "step": 13170 }, { "epoch": 0.42, "learning_rate": 1.6864e-05, "loss": 0.8378, "step": 13175 }, { "epoch": 0.42, "learning_rate": 1.6870400000000004e-05, "loss": 0.8571, "step": 13180 }, { "epoch": 0.42, "learning_rate": 1.68768e-05, "loss": 0.8323, "step": 13185 }, { "epoch": 0.42, "learning_rate": 1.68832e-05, "loss": 0.845, "step": 13190 }, { "epoch": 0.42, "learning_rate": 1.6889600000000002e-05, "loss": 0.831, "step": 13195 }, { "epoch": 0.42, "learning_rate": 1.6896000000000002e-05, "loss": 0.8358, "step": 13200 }, { "epoch": 0.42, "learning_rate": 1.6902400000000003e-05, "loss": 0.8402, "step": 13205 }, { "epoch": 0.42, "learning_rate": 1.69088e-05, "loss": 0.8409, "step": 13210 }, { "epoch": 0.42, "learning_rate": 1.69152e-05, "loss": 0.8434, "step": 13215 }, { "epoch": 0.42, "learning_rate": 1.6921600000000004e-05, "loss": 0.8425, "step": 13220 }, { "epoch": 0.42, "learning_rate": 1.6928e-05, "loss": 0.8511, "step": 13225 }, { "epoch": 0.42, "learning_rate": 1.6934400000000002e-05, "loss": 0.829, "step": 13230 }, { "epoch": 0.42, "learning_rate": 1.6940800000000002e-05, "loss": 0.8404, "step": 13235 }, { "epoch": 0.42, "learning_rate": 1.6947200000000003e-05, "loss": 0.8536, "step": 13240 }, { "epoch": 0.42, "learning_rate": 1.69536e-05, "loss": 0.8322, "step": 13245 }, { "epoch": 0.42, "learning_rate": 1.696e-05, "loss": 0.8599, "step": 13250 }, { "epoch": 0.42, "learning_rate": 1.69664e-05, "loss": 0.8611, "step": 13255 }, { "epoch": 0.42, "learning_rate": 1.69728e-05, "loss": 0.852, "step": 13260 }, { "epoch": 0.42, "learning_rate": 1.69792e-05, "loss": 0.8429, "step": 13265 }, { "epoch": 0.42, "learning_rate": 1.6985600000000002e-05, "loss": 0.8358, "step": 13270 }, { "epoch": 0.42, "learning_rate": 1.6992000000000003e-05, "loss": 0.8437, "step": 13275 }, { "epoch": 0.42, "learning_rate": 1.6998400000000003e-05, "loss": 0.8438, "step": 13280 }, { "epoch": 0.43, "learning_rate": 1.70048e-05, "loss": 0.8245, "step": 13285 }, { "epoch": 0.43, "learning_rate": 1.70112e-05, "loss": 0.842, "step": 13290 }, { "epoch": 0.43, "learning_rate": 1.70176e-05, "loss": 0.8406, "step": 13295 }, { "epoch": 0.43, "learning_rate": 1.7024e-05, "loss": 0.8451, "step": 13300 }, { "epoch": 0.43, "learning_rate": 1.7030400000000002e-05, "loss": 0.839, "step": 13305 }, { "epoch": 0.43, "learning_rate": 1.7036800000000003e-05, "loss": 0.8245, "step": 13310 }, { "epoch": 0.43, "learning_rate": 1.7043200000000003e-05, "loss": 0.8367, "step": 13315 }, { "epoch": 0.43, "learning_rate": 1.70496e-05, "loss": 0.8473, "step": 13320 }, { "epoch": 0.43, "learning_rate": 1.7056e-05, "loss": 0.8377, "step": 13325 }, { "epoch": 0.43, "learning_rate": 1.70624e-05, "loss": 0.8472, "step": 13330 }, { "epoch": 0.43, "learning_rate": 1.70688e-05, "loss": 0.8496, "step": 13335 }, { "epoch": 0.43, "learning_rate": 1.7075200000000002e-05, "loss": 0.8464, "step": 13340 }, { "epoch": 0.43, "learning_rate": 1.70816e-05, "loss": 0.8389, "step": 13345 }, { "epoch": 0.43, "learning_rate": 1.7088000000000003e-05, "loss": 0.8449, "step": 13350 }, { "epoch": 0.43, "learning_rate": 1.7094400000000004e-05, "loss": 0.8227, "step": 13355 }, { "epoch": 0.43, "learning_rate": 1.71008e-05, "loss": 0.8428, "step": 13360 }, { "epoch": 0.43, "learning_rate": 1.71072e-05, "loss": 0.8433, "step": 13365 }, { "epoch": 0.43, "learning_rate": 1.71136e-05, "loss": 0.8234, "step": 13370 }, { "epoch": 0.43, "learning_rate": 1.7120000000000002e-05, "loss": 0.8491, "step": 13375 }, { "epoch": 0.43, "learning_rate": 1.71264e-05, "loss": 0.8404, "step": 13380 }, { "epoch": 0.43, "learning_rate": 1.71328e-05, "loss": 0.8367, "step": 13385 }, { "epoch": 0.43, "learning_rate": 1.7139200000000004e-05, "loss": 0.8479, "step": 13390 }, { "epoch": 0.43, "learning_rate": 1.71456e-05, "loss": 0.8498, "step": 13395 }, { "epoch": 0.43, "learning_rate": 1.7152e-05, "loss": 0.8428, "step": 13400 }, { "epoch": 0.43, "learning_rate": 1.71584e-05, "loss": 0.8454, "step": 13405 }, { "epoch": 0.43, "learning_rate": 1.7164800000000002e-05, "loss": 0.8406, "step": 13410 }, { "epoch": 0.43, "learning_rate": 1.7171200000000003e-05, "loss": 0.8114, "step": 13415 }, { "epoch": 0.43, "learning_rate": 1.71776e-05, "loss": 0.8524, "step": 13420 }, { "epoch": 0.43, "learning_rate": 1.7184e-05, "loss": 0.8417, "step": 13425 }, { "epoch": 0.43, "learning_rate": 1.71904e-05, "loss": 0.841, "step": 13430 }, { "epoch": 0.43, "learning_rate": 1.71968e-05, "loss": 0.8215, "step": 13435 }, { "epoch": 0.43, "learning_rate": 1.72032e-05, "loss": 0.8316, "step": 13440 }, { "epoch": 0.43, "learning_rate": 1.7209600000000002e-05, "loss": 0.8345, "step": 13445 }, { "epoch": 0.43, "learning_rate": 1.7216000000000003e-05, "loss": 0.8411, "step": 13450 }, { "epoch": 0.43, "learning_rate": 1.7222400000000003e-05, "loss": 0.8375, "step": 13455 }, { "epoch": 0.43, "learning_rate": 1.72288e-05, "loss": 0.8322, "step": 13460 }, { "epoch": 0.43, "learning_rate": 1.72352e-05, "loss": 0.8426, "step": 13465 }, { "epoch": 0.43, "learning_rate": 1.72416e-05, "loss": 0.8496, "step": 13470 }, { "epoch": 0.43, "learning_rate": 1.7248e-05, "loss": 0.8344, "step": 13475 }, { "epoch": 0.43, "learning_rate": 1.7254400000000002e-05, "loss": 0.8341, "step": 13480 }, { "epoch": 0.43, "learning_rate": 1.7260800000000003e-05, "loss": 0.84, "step": 13485 }, { "epoch": 0.43, "learning_rate": 1.7267200000000003e-05, "loss": 0.8412, "step": 13490 }, { "epoch": 0.43, "learning_rate": 1.72736e-05, "loss": 0.8325, "step": 13495 }, { "epoch": 0.43, "learning_rate": 1.728e-05, "loss": 0.823, "step": 13500 }, { "epoch": 0.43, "learning_rate": 1.72864e-05, "loss": 0.8372, "step": 13505 }, { "epoch": 0.43, "learning_rate": 1.72928e-05, "loss": 0.8447, "step": 13510 }, { "epoch": 0.43, "learning_rate": 1.7299200000000002e-05, "loss": 0.8273, "step": 13515 }, { "epoch": 0.43, "learning_rate": 1.7305600000000002e-05, "loss": 0.8418, "step": 13520 }, { "epoch": 0.43, "learning_rate": 1.7312000000000003e-05, "loss": 0.8366, "step": 13525 }, { "epoch": 0.43, "learning_rate": 1.7318400000000003e-05, "loss": 0.823, "step": 13530 }, { "epoch": 0.43, "learning_rate": 1.73248e-05, "loss": 0.8209, "step": 13535 }, { "epoch": 0.43, "learning_rate": 1.73312e-05, "loss": 0.8375, "step": 13540 }, { "epoch": 0.43, "learning_rate": 1.73376e-05, "loss": 0.8351, "step": 13545 }, { "epoch": 0.43, "learning_rate": 1.7344000000000002e-05, "loss": 0.8305, "step": 13550 }, { "epoch": 0.43, "learning_rate": 1.73504e-05, "loss": 0.8408, "step": 13555 }, { "epoch": 0.43, "learning_rate": 1.73568e-05, "loss": 0.833, "step": 13560 }, { "epoch": 0.43, "learning_rate": 1.7363200000000003e-05, "loss": 0.8321, "step": 13565 }, { "epoch": 0.43, "learning_rate": 1.73696e-05, "loss": 0.8381, "step": 13570 }, { "epoch": 0.43, "learning_rate": 1.7376e-05, "loss": 0.8467, "step": 13575 }, { "epoch": 0.43, "learning_rate": 1.73824e-05, "loss": 0.8482, "step": 13580 }, { "epoch": 0.43, "learning_rate": 1.7388800000000002e-05, "loss": 0.8389, "step": 13585 }, { "epoch": 0.43, "learning_rate": 1.7395200000000002e-05, "loss": 0.8333, "step": 13590 }, { "epoch": 0.44, "learning_rate": 1.74016e-05, "loss": 0.8334, "step": 13595 }, { "epoch": 0.44, "learning_rate": 1.7408e-05, "loss": 0.8202, "step": 13600 }, { "epoch": 0.44, "learning_rate": 1.7414400000000004e-05, "loss": 0.8289, "step": 13605 }, { "epoch": 0.44, "learning_rate": 1.74208e-05, "loss": 0.8391, "step": 13610 }, { "epoch": 0.44, "learning_rate": 1.74272e-05, "loss": 0.8322, "step": 13615 }, { "epoch": 0.44, "learning_rate": 1.7433600000000002e-05, "loss": 0.8326, "step": 13620 }, { "epoch": 0.44, "learning_rate": 1.7440000000000002e-05, "loss": 0.8305, "step": 13625 }, { "epoch": 0.44, "learning_rate": 1.74464e-05, "loss": 0.8288, "step": 13630 }, { "epoch": 0.44, "learning_rate": 1.74528e-05, "loss": 0.8473, "step": 13635 }, { "epoch": 0.44, "learning_rate": 1.74592e-05, "loss": 0.8329, "step": 13640 }, { "epoch": 0.44, "learning_rate": 1.74656e-05, "loss": 0.8264, "step": 13645 }, { "epoch": 0.44, "learning_rate": 1.7472e-05, "loss": 0.8282, "step": 13650 }, { "epoch": 0.44, "learning_rate": 1.7478400000000002e-05, "loss": 0.8288, "step": 13655 }, { "epoch": 0.44, "learning_rate": 1.7484800000000002e-05, "loss": 0.8347, "step": 13660 }, { "epoch": 0.44, "learning_rate": 1.7491200000000003e-05, "loss": 0.8384, "step": 13665 }, { "epoch": 0.44, "learning_rate": 1.74976e-05, "loss": 0.84, "step": 13670 }, { "epoch": 0.44, "learning_rate": 1.7504e-05, "loss": 0.8378, "step": 13675 }, { "epoch": 0.44, "learning_rate": 1.75104e-05, "loss": 0.8314, "step": 13680 }, { "epoch": 0.44, "learning_rate": 1.75168e-05, "loss": 0.8138, "step": 13685 }, { "epoch": 0.44, "learning_rate": 1.7523200000000002e-05, "loss": 0.844, "step": 13690 }, { "epoch": 0.44, "learning_rate": 1.7529600000000002e-05, "loss": 0.8374, "step": 13695 }, { "epoch": 0.44, "learning_rate": 1.7536000000000003e-05, "loss": 0.8283, "step": 13700 }, { "epoch": 0.44, "learning_rate": 1.75424e-05, "loss": 0.8344, "step": 13705 }, { "epoch": 0.44, "learning_rate": 1.75488e-05, "loss": 0.827, "step": 13710 }, { "epoch": 0.44, "learning_rate": 1.75552e-05, "loss": 0.8313, "step": 13715 }, { "epoch": 0.44, "learning_rate": 1.75616e-05, "loss": 0.8432, "step": 13720 }, { "epoch": 0.44, "learning_rate": 1.7568000000000002e-05, "loss": 0.8406, "step": 13725 }, { "epoch": 0.44, "learning_rate": 1.75744e-05, "loss": 0.8435, "step": 13730 }, { "epoch": 0.44, "learning_rate": 1.7580800000000003e-05, "loss": 0.8322, "step": 13735 }, { "epoch": 0.44, "learning_rate": 1.7587200000000003e-05, "loss": 0.8353, "step": 13740 }, { "epoch": 0.44, "learning_rate": 1.75936e-05, "loss": 0.8315, "step": 13745 }, { "epoch": 0.44, "learning_rate": 1.76e-05, "loss": 0.8392, "step": 13750 }, { "epoch": 0.44, "learning_rate": 1.76064e-05, "loss": 0.8329, "step": 13755 }, { "epoch": 0.44, "learning_rate": 1.7612800000000002e-05, "loss": 0.8362, "step": 13760 }, { "epoch": 0.44, "learning_rate": 1.7619200000000002e-05, "loss": 0.809, "step": 13765 }, { "epoch": 0.44, "learning_rate": 1.76256e-05, "loss": 0.8346, "step": 13770 }, { "epoch": 0.44, "learning_rate": 1.7632000000000003e-05, "loss": 0.8344, "step": 13775 }, { "epoch": 0.44, "learning_rate": 1.7638400000000004e-05, "loss": 0.8157, "step": 13780 }, { "epoch": 0.44, "learning_rate": 1.76448e-05, "loss": 0.8401, "step": 13785 }, { "epoch": 0.44, "learning_rate": 1.76512e-05, "loss": 0.8476, "step": 13790 }, { "epoch": 0.44, "learning_rate": 1.7657600000000002e-05, "loss": 0.8206, "step": 13795 }, { "epoch": 0.44, "learning_rate": 1.7664000000000002e-05, "loss": 0.8315, "step": 13800 }, { "epoch": 0.44, "learning_rate": 1.76704e-05, "loss": 0.8308, "step": 13805 }, { "epoch": 0.44, "learning_rate": 1.76768e-05, "loss": 0.8367, "step": 13810 }, { "epoch": 0.44, "learning_rate": 1.76832e-05, "loss": 0.8209, "step": 13815 }, { "epoch": 0.44, "learning_rate": 1.76896e-05, "loss": 0.8276, "step": 13820 }, { "epoch": 0.44, "learning_rate": 1.7696e-05, "loss": 0.8253, "step": 13825 }, { "epoch": 0.44, "learning_rate": 1.7702400000000002e-05, "loss": 0.8285, "step": 13830 }, { "epoch": 0.44, "learning_rate": 1.7708800000000002e-05, "loss": 0.8152, "step": 13835 }, { "epoch": 0.44, "learning_rate": 1.7715200000000003e-05, "loss": 0.8225, "step": 13840 }, { "epoch": 0.44, "learning_rate": 1.77216e-05, "loss": 0.8245, "step": 13845 }, { "epoch": 0.44, "learning_rate": 1.7728e-05, "loss": 0.8366, "step": 13850 }, { "epoch": 0.44, "learning_rate": 1.77344e-05, "loss": 0.8314, "step": 13855 }, { "epoch": 0.44, "learning_rate": 1.77408e-05, "loss": 0.8294, "step": 13860 }, { "epoch": 0.44, "learning_rate": 1.7747200000000002e-05, "loss": 0.8377, "step": 13865 }, { "epoch": 0.44, "learning_rate": 1.7753600000000002e-05, "loss": 0.8382, "step": 13870 }, { "epoch": 0.44, "learning_rate": 1.7760000000000003e-05, "loss": 0.8231, "step": 13875 }, { "epoch": 0.44, "learning_rate": 1.77664e-05, "loss": 0.8425, "step": 13880 }, { "epoch": 0.44, "learning_rate": 1.77728e-05, "loss": 0.8297, "step": 13885 }, { "epoch": 0.44, "learning_rate": 1.77792e-05, "loss": 0.8363, "step": 13890 }, { "epoch": 0.44, "learning_rate": 1.77856e-05, "loss": 0.8457, "step": 13895 }, { "epoch": 0.44, "learning_rate": 1.7792000000000002e-05, "loss": 0.8423, "step": 13900 }, { "epoch": 0.44, "learning_rate": 1.7798400000000002e-05, "loss": 0.8165, "step": 13905 }, { "epoch": 0.45, "learning_rate": 1.7804800000000003e-05, "loss": 0.831, "step": 13910 }, { "epoch": 0.45, "learning_rate": 1.7811200000000003e-05, "loss": 0.8165, "step": 13915 }, { "epoch": 0.45, "learning_rate": 1.78176e-05, "loss": 0.8331, "step": 13920 }, { "epoch": 0.45, "learning_rate": 1.7824e-05, "loss": 0.8325, "step": 13925 }, { "epoch": 0.45, "learning_rate": 1.78304e-05, "loss": 0.8252, "step": 13930 }, { "epoch": 0.45, "learning_rate": 1.7836800000000002e-05, "loss": 0.8264, "step": 13935 }, { "epoch": 0.45, "learning_rate": 1.78432e-05, "loss": 0.8399, "step": 13940 }, { "epoch": 0.45, "learning_rate": 1.7849600000000003e-05, "loss": 0.8421, "step": 13945 }, { "epoch": 0.45, "learning_rate": 1.7856000000000003e-05, "loss": 0.8385, "step": 13950 }, { "epoch": 0.45, "learning_rate": 1.78624e-05, "loss": 0.8377, "step": 13955 }, { "epoch": 0.45, "learning_rate": 1.78688e-05, "loss": 0.8317, "step": 13960 }, { "epoch": 0.45, "learning_rate": 1.78752e-05, "loss": 0.8353, "step": 13965 }, { "epoch": 0.45, "learning_rate": 1.7881600000000002e-05, "loss": 0.8298, "step": 13970 }, { "epoch": 0.45, "learning_rate": 1.7888000000000002e-05, "loss": 0.8283, "step": 13975 }, { "epoch": 0.45, "learning_rate": 1.78944e-05, "loss": 0.8425, "step": 13980 }, { "epoch": 0.45, "learning_rate": 1.79008e-05, "loss": 0.8288, "step": 13985 }, { "epoch": 0.45, "learning_rate": 1.7907200000000004e-05, "loss": 0.8473, "step": 13990 }, { "epoch": 0.45, "learning_rate": 1.79136e-05, "loss": 0.8394, "step": 13995 }, { "epoch": 0.45, "learning_rate": 1.792e-05, "loss": 0.8262, "step": 14000 }, { "epoch": 0.45, "learning_rate": 1.7926400000000002e-05, "loss": 0.837, "step": 14005 }, { "epoch": 0.45, "learning_rate": 1.7932800000000002e-05, "loss": 0.8411, "step": 14010 }, { "epoch": 0.45, "learning_rate": 1.7939200000000003e-05, "loss": 0.8244, "step": 14015 }, { "epoch": 0.45, "learning_rate": 1.79456e-05, "loss": 0.8164, "step": 14020 }, { "epoch": 0.45, "learning_rate": 1.7952e-05, "loss": 0.8266, "step": 14025 }, { "epoch": 0.45, "learning_rate": 1.7958400000000004e-05, "loss": 0.8267, "step": 14030 }, { "epoch": 0.45, "learning_rate": 1.79648e-05, "loss": 0.8274, "step": 14035 }, { "epoch": 0.45, "learning_rate": 1.79712e-05, "loss": 0.8357, "step": 14040 }, { "epoch": 0.45, "learning_rate": 1.7977600000000002e-05, "loss": 0.8345, "step": 14045 }, { "epoch": 0.45, "learning_rate": 1.7984000000000003e-05, "loss": 0.8204, "step": 14050 }, { "epoch": 0.45, "learning_rate": 1.79904e-05, "loss": 0.8326, "step": 14055 }, { "epoch": 0.45, "learning_rate": 1.79968e-05, "loss": 0.8247, "step": 14060 }, { "epoch": 0.45, "learning_rate": 1.80032e-05, "loss": 0.824, "step": 14065 }, { "epoch": 0.45, "learning_rate": 1.80096e-05, "loss": 0.8242, "step": 14070 }, { "epoch": 0.45, "learning_rate": 1.8016e-05, "loss": 0.845, "step": 14075 }, { "epoch": 0.45, "learning_rate": 1.8022400000000002e-05, "loss": 0.8278, "step": 14080 }, { "epoch": 0.45, "learning_rate": 1.8028800000000003e-05, "loss": 0.8275, "step": 14085 }, { "epoch": 0.45, "learning_rate": 1.8035200000000003e-05, "loss": 0.8284, "step": 14090 }, { "epoch": 0.45, "learning_rate": 1.80416e-05, "loss": 0.8216, "step": 14095 }, { "epoch": 0.45, "learning_rate": 1.8048e-05, "loss": 0.8265, "step": 14100 }, { "epoch": 0.45, "learning_rate": 1.80544e-05, "loss": 0.8289, "step": 14105 }, { "epoch": 0.45, "learning_rate": 1.80608e-05, "loss": 0.8176, "step": 14110 }, { "epoch": 0.45, "learning_rate": 1.8067200000000002e-05, "loss": 0.8307, "step": 14115 }, { "epoch": 0.45, "learning_rate": 1.8073600000000003e-05, "loss": 0.8193, "step": 14120 }, { "epoch": 0.45, "learning_rate": 1.8080000000000003e-05, "loss": 0.81, "step": 14125 }, { "epoch": 0.45, "learning_rate": 1.80864e-05, "loss": 0.8343, "step": 14130 }, { "epoch": 0.45, "learning_rate": 1.80928e-05, "loss": 0.8357, "step": 14135 }, { "epoch": 0.45, "learning_rate": 1.80992e-05, "loss": 0.8303, "step": 14140 }, { "epoch": 0.45, "learning_rate": 1.81056e-05, "loss": 0.8301, "step": 14145 }, { "epoch": 0.45, "learning_rate": 1.8112000000000002e-05, "loss": 0.8367, "step": 14150 }, { "epoch": 0.45, "learning_rate": 1.81184e-05, "loss": 0.8317, "step": 14155 }, { "epoch": 0.45, "learning_rate": 1.8124800000000003e-05, "loss": 0.8385, "step": 14160 }, { "epoch": 0.45, "learning_rate": 1.8131200000000004e-05, "loss": 0.826, "step": 14165 }, { "epoch": 0.45, "learning_rate": 1.81376e-05, "loss": 0.8383, "step": 14170 }, { "epoch": 0.45, "learning_rate": 1.8144e-05, "loss": 0.832, "step": 14175 }, { "epoch": 0.45, "learning_rate": 1.81504e-05, "loss": 0.8251, "step": 14180 }, { "epoch": 0.45, "learning_rate": 1.8156800000000002e-05, "loss": 0.822, "step": 14185 }, { "epoch": 0.45, "learning_rate": 1.81632e-05, "loss": 0.8238, "step": 14190 }, { "epoch": 0.45, "learning_rate": 1.81696e-05, "loss": 0.8259, "step": 14195 }, { "epoch": 0.45, "learning_rate": 1.8176000000000004e-05, "loss": 0.8203, "step": 14200 }, { "epoch": 0.45, "learning_rate": 1.81824e-05, "loss": 0.8335, "step": 14205 }, { "epoch": 0.45, "learning_rate": 1.81888e-05, "loss": 0.8195, "step": 14210 }, { "epoch": 0.45, "learning_rate": 1.81952e-05, "loss": 0.8292, "step": 14215 }, { "epoch": 0.46, "learning_rate": 1.8201600000000002e-05, "loss": 0.8102, "step": 14220 }, { "epoch": 0.46, "learning_rate": 1.8208000000000003e-05, "loss": 0.8244, "step": 14225 }, { "epoch": 0.46, "learning_rate": 1.82144e-05, "loss": 0.8269, "step": 14230 }, { "epoch": 0.46, "learning_rate": 1.82208e-05, "loss": 0.8148, "step": 14235 }, { "epoch": 0.46, "learning_rate": 1.82272e-05, "loss": 0.8124, "step": 14240 }, { "epoch": 0.46, "learning_rate": 1.82336e-05, "loss": 0.8362, "step": 14245 }, { "epoch": 0.46, "learning_rate": 1.824e-05, "loss": 0.8217, "step": 14250 }, { "epoch": 0.46, "learning_rate": 1.8246400000000002e-05, "loss": 0.8276, "step": 14255 }, { "epoch": 0.46, "learning_rate": 1.8252800000000003e-05, "loss": 0.832, "step": 14260 }, { "epoch": 0.46, "learning_rate": 1.8259200000000003e-05, "loss": 0.82, "step": 14265 }, { "epoch": 0.46, "learning_rate": 1.82656e-05, "loss": 0.8157, "step": 14270 }, { "epoch": 0.46, "learning_rate": 1.8272e-05, "loss": 0.8223, "step": 14275 }, { "epoch": 0.46, "learning_rate": 1.82784e-05, "loss": 0.8264, "step": 14280 }, { "epoch": 0.46, "learning_rate": 1.82848e-05, "loss": 0.8374, "step": 14285 }, { "epoch": 0.46, "learning_rate": 1.8291200000000002e-05, "loss": 0.8347, "step": 14290 }, { "epoch": 0.46, "learning_rate": 1.8297600000000002e-05, "loss": 0.834, "step": 14295 }, { "epoch": 0.46, "learning_rate": 1.8304000000000003e-05, "loss": 0.8229, "step": 14300 }, { "epoch": 0.46, "learning_rate": 1.83104e-05, "loss": 0.8201, "step": 14305 }, { "epoch": 0.46, "learning_rate": 1.83168e-05, "loss": 0.8185, "step": 14310 }, { "epoch": 0.46, "learning_rate": 1.83232e-05, "loss": 0.8217, "step": 14315 }, { "epoch": 0.46, "learning_rate": 1.83296e-05, "loss": 0.8258, "step": 14320 }, { "epoch": 0.46, "learning_rate": 1.8336000000000002e-05, "loss": 0.8282, "step": 14325 }, { "epoch": 0.46, "learning_rate": 1.8342400000000002e-05, "loss": 0.8146, "step": 14330 }, { "epoch": 0.46, "learning_rate": 1.8348800000000003e-05, "loss": 0.8165, "step": 14335 }, { "epoch": 0.46, "learning_rate": 1.8355200000000003e-05, "loss": 0.8282, "step": 14340 }, { "epoch": 0.46, "learning_rate": 1.83616e-05, "loss": 0.8401, "step": 14345 }, { "epoch": 0.46, "learning_rate": 1.8368e-05, "loss": 0.8248, "step": 14350 }, { "epoch": 0.46, "learning_rate": 1.83744e-05, "loss": 0.8189, "step": 14355 }, { "epoch": 0.46, "learning_rate": 1.8380800000000002e-05, "loss": 0.821, "step": 14360 }, { "epoch": 0.46, "learning_rate": 1.83872e-05, "loss": 0.8285, "step": 14365 }, { "epoch": 0.46, "learning_rate": 1.8393600000000003e-05, "loss": 0.833, "step": 14370 }, { "epoch": 0.46, "learning_rate": 1.8400000000000003e-05, "loss": 0.8169, "step": 14375 }, { "epoch": 0.46, "learning_rate": 1.84064e-05, "loss": 0.8324, "step": 14380 }, { "epoch": 0.46, "learning_rate": 1.84128e-05, "loss": 0.8258, "step": 14385 }, { "epoch": 0.46, "learning_rate": 1.84192e-05, "loss": 0.8041, "step": 14390 }, { "epoch": 0.46, "learning_rate": 1.8425600000000002e-05, "loss": 0.8109, "step": 14395 }, { "epoch": 0.46, "learning_rate": 1.8432000000000002e-05, "loss": 0.8242, "step": 14400 }, { "epoch": 0.46, "learning_rate": 1.84384e-05, "loss": 0.8168, "step": 14405 }, { "epoch": 0.46, "learning_rate": 1.84448e-05, "loss": 0.8191, "step": 14410 }, { "epoch": 0.46, "learning_rate": 1.8451200000000004e-05, "loss": 0.832, "step": 14415 }, { "epoch": 0.46, "learning_rate": 1.84576e-05, "loss": 0.8185, "step": 14420 }, { "epoch": 0.46, "learning_rate": 1.8464e-05, "loss": 0.8364, "step": 14425 }, { "epoch": 0.46, "learning_rate": 1.8470400000000002e-05, "loss": 0.8067, "step": 14430 }, { "epoch": 0.46, "learning_rate": 1.8476800000000002e-05, "loss": 0.83, "step": 14435 }, { "epoch": 0.46, "learning_rate": 1.84832e-05, "loss": 0.8221, "step": 14440 }, { "epoch": 0.46, "learning_rate": 1.84896e-05, "loss": 0.8158, "step": 14445 }, { "epoch": 0.46, "learning_rate": 1.8496e-05, "loss": 0.816, "step": 14450 }, { "epoch": 0.46, "learning_rate": 1.85024e-05, "loss": 0.8217, "step": 14455 }, { "epoch": 0.46, "learning_rate": 1.85088e-05, "loss": 0.8166, "step": 14460 }, { "epoch": 0.46, "learning_rate": 1.8515200000000002e-05, "loss": 0.8211, "step": 14465 }, { "epoch": 0.46, "learning_rate": 1.8521600000000002e-05, "loss": 0.8156, "step": 14470 }, { "epoch": 0.46, "learning_rate": 1.8528000000000003e-05, "loss": 0.8404, "step": 14475 }, { "epoch": 0.46, "learning_rate": 1.85344e-05, "loss": 0.8224, "step": 14480 }, { "epoch": 0.46, "learning_rate": 1.85408e-05, "loss": 0.8208, "step": 14485 }, { "epoch": 0.46, "learning_rate": 1.85472e-05, "loss": 0.8342, "step": 14490 }, { "epoch": 0.46, "learning_rate": 1.85536e-05, "loss": 0.8169, "step": 14495 }, { "epoch": 0.46, "learning_rate": 1.8560000000000002e-05, "loss": 0.8162, "step": 14500 }, { "epoch": 0.46, "learning_rate": 1.8566400000000002e-05, "loss": 0.8226, "step": 14505 }, { "epoch": 0.46, "learning_rate": 1.8572800000000003e-05, "loss": 0.8195, "step": 14510 }, { "epoch": 0.46, "learning_rate": 1.8579200000000003e-05, "loss": 0.823, "step": 14515 }, { "epoch": 0.46, "learning_rate": 1.85856e-05, "loss": 0.8294, "step": 14520 }, { "epoch": 0.46, "learning_rate": 1.8592e-05, "loss": 0.8119, "step": 14525 }, { "epoch": 0.46, "learning_rate": 1.85984e-05, "loss": 0.8194, "step": 14530 }, { "epoch": 0.47, "learning_rate": 1.8604800000000002e-05, "loss": 0.8173, "step": 14535 }, { "epoch": 0.47, "learning_rate": 1.8611200000000002e-05, "loss": 0.8379, "step": 14540 }, { "epoch": 0.47, "learning_rate": 1.8617600000000003e-05, "loss": 0.8357, "step": 14545 }, { "epoch": 0.47, "learning_rate": 1.8624000000000003e-05, "loss": 0.8291, "step": 14550 }, { "epoch": 0.47, "learning_rate": 1.86304e-05, "loss": 0.8102, "step": 14555 }, { "epoch": 0.47, "learning_rate": 1.86368e-05, "loss": 0.8192, "step": 14560 }, { "epoch": 0.47, "learning_rate": 1.86432e-05, "loss": 0.8203, "step": 14565 }, { "epoch": 0.47, "learning_rate": 1.8649600000000002e-05, "loss": 0.8047, "step": 14570 }, { "epoch": 0.47, "learning_rate": 1.8656000000000002e-05, "loss": 0.824, "step": 14575 }, { "epoch": 0.47, "learning_rate": 1.86624e-05, "loss": 0.8291, "step": 14580 }, { "epoch": 0.47, "learning_rate": 1.8668800000000003e-05, "loss": 0.8011, "step": 14585 }, { "epoch": 0.47, "learning_rate": 1.8675200000000004e-05, "loss": 0.8259, "step": 14590 }, { "epoch": 0.47, "learning_rate": 1.86816e-05, "loss": 0.8334, "step": 14595 }, { "epoch": 0.47, "learning_rate": 1.8688e-05, "loss": 0.8105, "step": 14600 }, { "epoch": 0.47, "learning_rate": 1.8694400000000002e-05, "loss": 0.8151, "step": 14605 }, { "epoch": 0.47, "learning_rate": 1.8700800000000002e-05, "loss": 0.8265, "step": 14610 }, { "epoch": 0.47, "learning_rate": 1.87072e-05, "loss": 0.8152, "step": 14615 }, { "epoch": 0.47, "learning_rate": 1.87136e-05, "loss": 0.8142, "step": 14620 }, { "epoch": 0.47, "learning_rate": 1.8720000000000004e-05, "loss": 0.8174, "step": 14625 }, { "epoch": 0.47, "learning_rate": 1.87264e-05, "loss": 0.8227, "step": 14630 }, { "epoch": 0.47, "learning_rate": 1.87328e-05, "loss": 0.8242, "step": 14635 }, { "epoch": 0.47, "learning_rate": 1.8739200000000002e-05, "loss": 0.813, "step": 14640 }, { "epoch": 0.47, "learning_rate": 1.8745600000000002e-05, "loss": 0.8191, "step": 14645 }, { "epoch": 0.47, "learning_rate": 1.8752000000000003e-05, "loss": 0.8163, "step": 14650 }, { "epoch": 0.47, "learning_rate": 1.87584e-05, "loss": 0.8222, "step": 14655 }, { "epoch": 0.47, "learning_rate": 1.87648e-05, "loss": 0.8249, "step": 14660 }, { "epoch": 0.47, "learning_rate": 1.87712e-05, "loss": 0.8192, "step": 14665 }, { "epoch": 0.47, "learning_rate": 1.87776e-05, "loss": 0.8249, "step": 14670 }, { "epoch": 0.47, "learning_rate": 1.8784000000000002e-05, "loss": 0.8122, "step": 14675 }, { "epoch": 0.47, "learning_rate": 1.8790400000000002e-05, "loss": 0.8147, "step": 14680 }, { "epoch": 0.47, "learning_rate": 1.8796800000000003e-05, "loss": 0.8354, "step": 14685 }, { "epoch": 0.47, "learning_rate": 1.88032e-05, "loss": 0.8265, "step": 14690 }, { "epoch": 0.47, "learning_rate": 1.88096e-05, "loss": 0.8261, "step": 14695 }, { "epoch": 0.47, "learning_rate": 1.8816e-05, "loss": 0.8129, "step": 14700 }, { "epoch": 0.47, "learning_rate": 1.88224e-05, "loss": 0.8254, "step": 14705 }, { "epoch": 0.47, "learning_rate": 1.8828800000000002e-05, "loss": 0.8266, "step": 14710 }, { "epoch": 0.47, "learning_rate": 1.8835200000000002e-05, "loss": 0.8103, "step": 14715 }, { "epoch": 0.47, "learning_rate": 1.8841600000000003e-05, "loss": 0.8131, "step": 14720 }, { "epoch": 0.47, "learning_rate": 1.8848000000000003e-05, "loss": 0.8187, "step": 14725 }, { "epoch": 0.47, "learning_rate": 1.88544e-05, "loss": 0.8266, "step": 14730 }, { "epoch": 0.47, "learning_rate": 1.88608e-05, "loss": 0.8159, "step": 14735 }, { "epoch": 0.47, "learning_rate": 1.88672e-05, "loss": 0.8238, "step": 14740 }, { "epoch": 0.47, "learning_rate": 1.8873600000000002e-05, "loss": 0.8262, "step": 14745 }, { "epoch": 0.47, "learning_rate": 1.8880000000000002e-05, "loss": 0.8193, "step": 14750 }, { "epoch": 0.47, "learning_rate": 1.8886400000000003e-05, "loss": 0.8217, "step": 14755 }, { "epoch": 0.47, "learning_rate": 1.8892800000000003e-05, "loss": 0.8167, "step": 14760 }, { "epoch": 0.47, "learning_rate": 1.8899200000000004e-05, "loss": 0.8317, "step": 14765 }, { "epoch": 0.47, "learning_rate": 1.89056e-05, "loss": 0.8183, "step": 14770 }, { "epoch": 0.47, "learning_rate": 1.8912e-05, "loss": 0.814, "step": 14775 }, { "epoch": 0.47, "learning_rate": 1.89184e-05, "loss": 0.8142, "step": 14780 }, { "epoch": 0.47, "learning_rate": 1.8924800000000002e-05, "loss": 0.8178, "step": 14785 }, { "epoch": 0.47, "learning_rate": 1.89312e-05, "loss": 0.8218, "step": 14790 }, { "epoch": 0.47, "learning_rate": 1.8937600000000003e-05, "loss": 0.8264, "step": 14795 }, { "epoch": 0.47, "learning_rate": 1.8944000000000004e-05, "loss": 0.8231, "step": 14800 }, { "epoch": 0.47, "learning_rate": 1.89504e-05, "loss": 0.8124, "step": 14805 }, { "epoch": 0.47, "learning_rate": 1.89568e-05, "loss": 0.821, "step": 14810 }, { "epoch": 0.47, "learning_rate": 1.89632e-05, "loss": 0.8452, "step": 14815 }, { "epoch": 0.47, "learning_rate": 1.8969600000000002e-05, "loss": 0.7973, "step": 14820 }, { "epoch": 0.47, "learning_rate": 1.8976000000000003e-05, "loss": 0.8171, "step": 14825 }, { "epoch": 0.47, "learning_rate": 1.89824e-05, "loss": 0.8168, "step": 14830 }, { "epoch": 0.47, "learning_rate": 1.89888e-05, "loss": 0.8293, "step": 14835 }, { "epoch": 0.47, "learning_rate": 1.8995200000000004e-05, "loss": 0.8081, "step": 14840 }, { "epoch": 0.48, "learning_rate": 1.90016e-05, "loss": 0.8286, "step": 14845 }, { "epoch": 0.48, "learning_rate": 1.9008e-05, "loss": 0.8109, "step": 14850 }, { "epoch": 0.48, "learning_rate": 1.9014400000000002e-05, "loss": 0.8159, "step": 14855 }, { "epoch": 0.48, "learning_rate": 1.9020800000000003e-05, "loss": 0.8288, "step": 14860 }, { "epoch": 0.48, "learning_rate": 1.90272e-05, "loss": 0.8245, "step": 14865 }, { "epoch": 0.48, "learning_rate": 1.90336e-05, "loss": 0.8048, "step": 14870 }, { "epoch": 0.48, "learning_rate": 1.904e-05, "loss": 0.8285, "step": 14875 }, { "epoch": 0.48, "learning_rate": 1.90464e-05, "loss": 0.8262, "step": 14880 }, { "epoch": 0.48, "learning_rate": 1.90528e-05, "loss": 0.8195, "step": 14885 }, { "epoch": 0.48, "learning_rate": 1.9059200000000002e-05, "loss": 0.82, "step": 14890 }, { "epoch": 0.48, "learning_rate": 1.9065600000000003e-05, "loss": 0.808, "step": 14895 }, { "epoch": 0.48, "learning_rate": 1.9072000000000003e-05, "loss": 0.8213, "step": 14900 }, { "epoch": 0.48, "learning_rate": 1.90784e-05, "loss": 0.8193, "step": 14905 }, { "epoch": 0.48, "learning_rate": 1.90848e-05, "loss": 0.8236, "step": 14910 }, { "epoch": 0.48, "learning_rate": 1.90912e-05, "loss": 0.8113, "step": 14915 }, { "epoch": 0.48, "learning_rate": 1.90976e-05, "loss": 0.8313, "step": 14920 }, { "epoch": 0.48, "learning_rate": 1.9104000000000002e-05, "loss": 0.814, "step": 14925 }, { "epoch": 0.48, "learning_rate": 1.9110400000000003e-05, "loss": 0.8084, "step": 14930 }, { "epoch": 0.48, "learning_rate": 1.9116800000000003e-05, "loss": 0.8003, "step": 14935 }, { "epoch": 0.48, "learning_rate": 1.91232e-05, "loss": 0.816, "step": 14940 }, { "epoch": 0.48, "learning_rate": 1.91296e-05, "loss": 0.8159, "step": 14945 }, { "epoch": 0.48, "learning_rate": 1.9136e-05, "loss": 0.8166, "step": 14950 }, { "epoch": 0.48, "learning_rate": 1.91424e-05, "loss": 0.8202, "step": 14955 }, { "epoch": 0.48, "learning_rate": 1.9148800000000002e-05, "loss": 0.8206, "step": 14960 }, { "epoch": 0.48, "learning_rate": 1.91552e-05, "loss": 0.8203, "step": 14965 }, { "epoch": 0.48, "learning_rate": 1.9161600000000003e-05, "loss": 0.8355, "step": 14970 }, { "epoch": 0.48, "learning_rate": 1.9168000000000004e-05, "loss": 0.8197, "step": 14975 }, { "epoch": 0.48, "learning_rate": 1.91744e-05, "loss": 0.8188, "step": 14980 }, { "epoch": 0.48, "learning_rate": 1.91808e-05, "loss": 0.8269, "step": 14985 }, { "epoch": 0.48, "learning_rate": 1.91872e-05, "loss": 0.8194, "step": 14990 }, { "epoch": 0.48, "learning_rate": 1.9193600000000002e-05, "loss": 0.823, "step": 14995 }, { "epoch": 0.48, "learning_rate": 1.9200000000000003e-05, "loss": 0.8193, "step": 15000 }, { "epoch": 0.48, "learning_rate": 1.92064e-05, "loss": 0.8409, "step": 15005 }, { "epoch": 0.48, "learning_rate": 1.9212800000000003e-05, "loss": 0.8122, "step": 15010 }, { "epoch": 0.48, "learning_rate": 1.9219200000000004e-05, "loss": 0.8158, "step": 15015 }, { "epoch": 0.48, "learning_rate": 1.92256e-05, "loss": 0.8234, "step": 15020 }, { "epoch": 0.48, "learning_rate": 1.9232e-05, "loss": 0.8141, "step": 15025 }, { "epoch": 0.48, "learning_rate": 1.9238400000000002e-05, "loss": 0.8137, "step": 15030 }, { "epoch": 0.48, "learning_rate": 1.9244800000000002e-05, "loss": 0.8033, "step": 15035 }, { "epoch": 0.48, "learning_rate": 1.92512e-05, "loss": 0.8187, "step": 15040 }, { "epoch": 0.48, "learning_rate": 1.92576e-05, "loss": 0.8124, "step": 15045 }, { "epoch": 0.48, "learning_rate": 1.9264e-05, "loss": 0.8189, "step": 15050 }, { "epoch": 0.48, "learning_rate": 1.92704e-05, "loss": 0.7961, "step": 15055 }, { "epoch": 0.48, "learning_rate": 1.92768e-05, "loss": 0.8208, "step": 15060 }, { "epoch": 0.48, "learning_rate": 1.9283200000000002e-05, "loss": 0.8329, "step": 15065 }, { "epoch": 0.48, "learning_rate": 1.9289600000000002e-05, "loss": 0.825, "step": 15070 }, { "epoch": 0.48, "learning_rate": 1.9296000000000003e-05, "loss": 0.8111, "step": 15075 }, { "epoch": 0.48, "learning_rate": 1.93024e-05, "loss": 0.8215, "step": 15080 }, { "epoch": 0.48, "learning_rate": 1.93088e-05, "loss": 0.8053, "step": 15085 }, { "epoch": 0.48, "learning_rate": 1.93152e-05, "loss": 0.8189, "step": 15090 }, { "epoch": 0.48, "learning_rate": 1.93216e-05, "loss": 0.8149, "step": 15095 }, { "epoch": 0.48, "learning_rate": 1.9328000000000002e-05, "loss": 0.8291, "step": 15100 }, { "epoch": 0.48, "learning_rate": 1.9334400000000002e-05, "loss": 0.8115, "step": 15105 }, { "epoch": 0.48, "learning_rate": 1.9340800000000003e-05, "loss": 0.8223, "step": 15110 }, { "epoch": 0.48, "learning_rate": 1.93472e-05, "loss": 0.8199, "step": 15115 }, { "epoch": 0.48, "learning_rate": 1.93536e-05, "loss": 0.8097, "step": 15120 }, { "epoch": 0.48, "learning_rate": 1.936e-05, "loss": 0.8141, "step": 15125 }, { "epoch": 0.48, "learning_rate": 1.93664e-05, "loss": 0.822, "step": 15130 }, { "epoch": 0.48, "learning_rate": 1.9372800000000002e-05, "loss": 0.813, "step": 15135 }, { "epoch": 0.48, "learning_rate": 1.9379200000000002e-05, "loss": 0.8085, "step": 15140 }, { "epoch": 0.48, "learning_rate": 1.9385600000000003e-05, "loss": 0.8092, "step": 15145 }, { "epoch": 0.48, "learning_rate": 1.9392000000000003e-05, "loss": 0.8128, "step": 15150 }, { "epoch": 0.48, "learning_rate": 1.93984e-05, "loss": 0.8244, "step": 15155 }, { "epoch": 0.49, "learning_rate": 1.94048e-05, "loss": 0.8262, "step": 15160 }, { "epoch": 0.49, "learning_rate": 1.94112e-05, "loss": 0.815, "step": 15165 }, { "epoch": 0.49, "learning_rate": 1.9417600000000002e-05, "loss": 0.819, "step": 15170 }, { "epoch": 0.49, "learning_rate": 1.9424e-05, "loss": 0.8138, "step": 15175 }, { "epoch": 0.49, "learning_rate": 1.9430400000000003e-05, "loss": 0.8208, "step": 15180 }, { "epoch": 0.49, "learning_rate": 1.9436800000000003e-05, "loss": 0.8094, "step": 15185 }, { "epoch": 0.49, "learning_rate": 1.94432e-05, "loss": 0.8128, "step": 15190 }, { "epoch": 0.49, "learning_rate": 1.94496e-05, "loss": 0.8044, "step": 15195 }, { "epoch": 0.49, "learning_rate": 1.9456e-05, "loss": 0.8114, "step": 15200 }, { "epoch": 0.49, "learning_rate": 1.9462400000000002e-05, "loss": 0.7994, "step": 15205 }, { "epoch": 0.49, "learning_rate": 1.9468800000000002e-05, "loss": 0.8119, "step": 15210 }, { "epoch": 0.49, "learning_rate": 1.94752e-05, "loss": 0.8175, "step": 15215 }, { "epoch": 0.49, "learning_rate": 1.94816e-05, "loss": 0.8117, "step": 15220 }, { "epoch": 0.49, "learning_rate": 1.9488000000000004e-05, "loss": 0.8078, "step": 15225 }, { "epoch": 0.49, "learning_rate": 1.94944e-05, "loss": 0.8044, "step": 15230 }, { "epoch": 0.49, "learning_rate": 1.95008e-05, "loss": 0.8112, "step": 15235 }, { "epoch": 0.49, "learning_rate": 1.9507200000000002e-05, "loss": 0.8014, "step": 15240 }, { "epoch": 0.49, "learning_rate": 1.9513600000000002e-05, "loss": 0.8117, "step": 15245 }, { "epoch": 0.49, "learning_rate": 1.9520000000000003e-05, "loss": 0.8116, "step": 15250 }, { "epoch": 0.49, "learning_rate": 1.95264e-05, "loss": 0.8038, "step": 15255 }, { "epoch": 0.49, "learning_rate": 1.95328e-05, "loss": 0.8122, "step": 15260 }, { "epoch": 0.49, "learning_rate": 1.9539200000000004e-05, "loss": 0.821, "step": 15265 }, { "epoch": 0.49, "learning_rate": 1.95456e-05, "loss": 0.8156, "step": 15270 }, { "epoch": 0.49, "learning_rate": 1.9552000000000002e-05, "loss": 0.8174, "step": 15275 }, { "epoch": 0.49, "learning_rate": 1.9558400000000002e-05, "loss": 0.8201, "step": 15280 }, { "epoch": 0.49, "learning_rate": 1.9564800000000003e-05, "loss": 0.8094, "step": 15285 }, { "epoch": 0.49, "learning_rate": 1.95712e-05, "loss": 0.8115, "step": 15290 }, { "epoch": 0.49, "learning_rate": 1.95776e-05, "loss": 0.8136, "step": 15295 }, { "epoch": 0.49, "learning_rate": 1.9584e-05, "loss": 0.8165, "step": 15300 }, { "epoch": 0.49, "learning_rate": 1.95904e-05, "loss": 0.8034, "step": 15305 }, { "epoch": 0.49, "learning_rate": 1.9596800000000002e-05, "loss": 0.8141, "step": 15310 }, { "epoch": 0.49, "learning_rate": 1.9603200000000002e-05, "loss": 0.8227, "step": 15315 }, { "epoch": 0.49, "learning_rate": 1.9609600000000003e-05, "loss": 0.8107, "step": 15320 }, { "epoch": 0.49, "learning_rate": 1.9616000000000003e-05, "loss": 0.8058, "step": 15325 }, { "epoch": 0.49, "learning_rate": 1.96224e-05, "loss": 0.8095, "step": 15330 }, { "epoch": 0.49, "learning_rate": 1.96288e-05, "loss": 0.8046, "step": 15335 }, { "epoch": 0.49, "learning_rate": 1.96352e-05, "loss": 0.804, "step": 15340 }, { "epoch": 0.49, "learning_rate": 1.9641600000000002e-05, "loss": 0.8001, "step": 15345 }, { "epoch": 0.49, "learning_rate": 1.9648000000000002e-05, "loss": 0.8179, "step": 15350 }, { "epoch": 0.49, "learning_rate": 1.9654400000000003e-05, "loss": 0.8088, "step": 15355 }, { "epoch": 0.49, "learning_rate": 1.9660800000000003e-05, "loss": 0.8192, "step": 15360 }, { "epoch": 0.49, "learning_rate": 1.96672e-05, "loss": 0.8096, "step": 15365 }, { "epoch": 0.49, "learning_rate": 1.96736e-05, "loss": 0.8134, "step": 15370 }, { "epoch": 0.49, "learning_rate": 1.968e-05, "loss": 0.816, "step": 15375 }, { "epoch": 0.49, "learning_rate": 1.9686400000000002e-05, "loss": 0.8206, "step": 15380 }, { "epoch": 0.49, "learning_rate": 1.9692800000000002e-05, "loss": 0.8196, "step": 15385 }, { "epoch": 0.49, "learning_rate": 1.96992e-05, "loss": 0.8118, "step": 15390 }, { "epoch": 0.49, "learning_rate": 1.9705600000000003e-05, "loss": 0.8125, "step": 15395 }, { "epoch": 0.49, "learning_rate": 1.9712000000000004e-05, "loss": 0.81, "step": 15400 }, { "epoch": 0.49, "learning_rate": 1.97184e-05, "loss": 0.8187, "step": 15405 }, { "epoch": 0.49, "learning_rate": 1.97248e-05, "loss": 0.8041, "step": 15410 }, { "epoch": 0.49, "learning_rate": 1.9731200000000002e-05, "loss": 0.8132, "step": 15415 }, { "epoch": 0.49, "learning_rate": 1.9737600000000002e-05, "loss": 0.8071, "step": 15420 }, { "epoch": 0.49, "learning_rate": 1.9744e-05, "loss": 0.8211, "step": 15425 }, { "epoch": 0.49, "learning_rate": 1.97504e-05, "loss": 0.8091, "step": 15430 }, { "epoch": 0.49, "learning_rate": 1.9756800000000004e-05, "loss": 0.802, "step": 15435 }, { "epoch": 0.49, "learning_rate": 1.97632e-05, "loss": 0.7965, "step": 15440 }, { "epoch": 0.49, "learning_rate": 1.97696e-05, "loss": 0.8086, "step": 15445 }, { "epoch": 0.49, "learning_rate": 1.9776000000000002e-05, "loss": 0.8325, "step": 15450 }, { "epoch": 0.49, "learning_rate": 1.9782400000000002e-05, "loss": 0.8133, "step": 15455 }, { "epoch": 0.49, "learning_rate": 1.9788800000000003e-05, "loss": 0.8049, "step": 15460 }, { "epoch": 0.49, "learning_rate": 1.97952e-05, "loss": 0.8062, "step": 15465 }, { "epoch": 0.5, "learning_rate": 1.98016e-05, "loss": 0.8196, "step": 15470 }, { "epoch": 0.5, "learning_rate": 1.9808e-05, "loss": 0.8209, "step": 15475 }, { "epoch": 0.5, "learning_rate": 1.98144e-05, "loss": 0.8192, "step": 15480 }, { "epoch": 0.5, "learning_rate": 1.9820800000000002e-05, "loss": 0.8127, "step": 15485 }, { "epoch": 0.5, "learning_rate": 1.9827200000000002e-05, "loss": 0.8146, "step": 15490 }, { "epoch": 0.5, "learning_rate": 1.9833600000000003e-05, "loss": 0.8263, "step": 15495 }, { "epoch": 0.5, "learning_rate": 1.9840000000000003e-05, "loss": 0.8107, "step": 15500 }, { "epoch": 0.5, "learning_rate": 1.98464e-05, "loss": 0.8219, "step": 15505 }, { "epoch": 0.5, "learning_rate": 1.98528e-05, "loss": 0.8127, "step": 15510 }, { "epoch": 0.5, "learning_rate": 1.98592e-05, "loss": 0.8284, "step": 15515 }, { "epoch": 0.5, "learning_rate": 1.9865600000000002e-05, "loss": 0.806, "step": 15520 }, { "epoch": 0.5, "learning_rate": 1.9872000000000002e-05, "loss": 0.8063, "step": 15525 }, { "epoch": 0.5, "learning_rate": 1.9878400000000003e-05, "loss": 0.8135, "step": 15530 }, { "epoch": 0.5, "learning_rate": 1.9884800000000003e-05, "loss": 0.8099, "step": 15535 }, { "epoch": 0.5, "learning_rate": 1.98912e-05, "loss": 0.7989, "step": 15540 }, { "epoch": 0.5, "learning_rate": 1.98976e-05, "loss": 0.8064, "step": 15545 }, { "epoch": 0.5, "learning_rate": 1.9904e-05, "loss": 0.7978, "step": 15550 }, { "epoch": 0.5, "learning_rate": 1.99104e-05, "loss": 0.8143, "step": 15555 }, { "epoch": 0.5, "learning_rate": 1.9916800000000002e-05, "loss": 0.832, "step": 15560 }, { "epoch": 0.5, "learning_rate": 1.9923200000000003e-05, "loss": 0.821, "step": 15565 }, { "epoch": 0.5, "learning_rate": 1.9929600000000003e-05, "loss": 0.8074, "step": 15570 }, { "epoch": 0.5, "learning_rate": 1.9936000000000004e-05, "loss": 0.8159, "step": 15575 }, { "epoch": 0.5, "learning_rate": 1.99424e-05, "loss": 0.8129, "step": 15580 }, { "epoch": 0.5, "learning_rate": 1.99488e-05, "loss": 0.8072, "step": 15585 }, { "epoch": 0.5, "learning_rate": 1.99552e-05, "loss": 0.8191, "step": 15590 }, { "epoch": 0.5, "learning_rate": 1.9961600000000002e-05, "loss": 0.8145, "step": 15595 }, { "epoch": 0.5, "learning_rate": 1.9968e-05, "loss": 0.8192, "step": 15600 }, { "epoch": 0.5, "learning_rate": 1.9974400000000003e-05, "loss": 0.8088, "step": 15605 }, { "epoch": 0.5, "learning_rate": 1.9980800000000004e-05, "loss": 0.8024, "step": 15610 }, { "epoch": 0.5, "learning_rate": 1.99872e-05, "loss": 0.8031, "step": 15615 }, { "epoch": 0.5, "learning_rate": 1.99936e-05, "loss": 0.8081, "step": 15620 }, { "epoch": 0.5, "learning_rate": 2e-05, "loss": 0.812, "step": 15625 }, { "epoch": 0.5, "learning_rate": 1.9999999937614355e-05, "loss": 0.8161, "step": 15630 }, { "epoch": 0.5, "learning_rate": 1.9999999750457414e-05, "loss": 0.8073, "step": 15635 }, { "epoch": 0.5, "learning_rate": 1.999999943852918e-05, "loss": 0.8099, "step": 15640 }, { "epoch": 0.5, "learning_rate": 1.9999999001829658e-05, "loss": 0.7946, "step": 15645 }, { "epoch": 0.5, "learning_rate": 1.9999998440358852e-05, "loss": 0.8048, "step": 15650 }, { "epoch": 0.5, "learning_rate": 1.9999997754116774e-05, "loss": 0.7974, "step": 15655 }, { "epoch": 0.5, "learning_rate": 1.9999996943103425e-05, "loss": 0.8168, "step": 15660 }, { "epoch": 0.5, "learning_rate": 1.9999996007318823e-05, "loss": 0.8126, "step": 15665 }, { "epoch": 0.5, "learning_rate": 1.9999994946762974e-05, "loss": 0.8016, "step": 15670 }, { "epoch": 0.5, "learning_rate": 1.9999993761435893e-05, "loss": 0.8118, "step": 15675 }, { "epoch": 0.5, "learning_rate": 1.9999992451337596e-05, "loss": 0.8062, "step": 15680 }, { "epoch": 0.5, "learning_rate": 1.9999991016468096e-05, "loss": 0.8151, "step": 15685 }, { "epoch": 0.5, "learning_rate": 1.9999989456827415e-05, "loss": 0.8158, "step": 15690 }, { "epoch": 0.5, "learning_rate": 1.9999987772415568e-05, "loss": 0.8143, "step": 15695 }, { "epoch": 0.5, "learning_rate": 1.9999985963232583e-05, "loss": 0.7976, "step": 15700 }, { "epoch": 0.5, "learning_rate": 1.9999984029278474e-05, "loss": 0.8105, "step": 15705 }, { "epoch": 0.5, "learning_rate": 1.999998197055327e-05, "loss": 0.796, "step": 15710 }, { "epoch": 0.5, "learning_rate": 1.9999979787056998e-05, "loss": 0.8051, "step": 15715 }, { "epoch": 0.5, "learning_rate": 1.9999977478789682e-05, "loss": 0.804, "step": 15720 }, { "epoch": 0.5, "learning_rate": 1.9999975045751353e-05, "loss": 0.8058, "step": 15725 }, { "epoch": 0.5, "learning_rate": 1.9999972487942035e-05, "loss": 0.7975, "step": 15730 }, { "epoch": 0.5, "learning_rate": 1.9999969805361772e-05, "loss": 0.8125, "step": 15735 }, { "epoch": 0.5, "learning_rate": 1.999996699801059e-05, "loss": 0.8174, "step": 15740 }, { "epoch": 0.5, "learning_rate": 1.999996406588852e-05, "loss": 0.8169, "step": 15745 }, { "epoch": 0.5, "learning_rate": 1.9999961008995607e-05, "loss": 0.8072, "step": 15750 }, { "epoch": 0.5, "learning_rate": 1.9999957827331883e-05, "loss": 0.8119, "step": 15755 }, { "epoch": 0.5, "learning_rate": 1.9999954520897394e-05, "loss": 0.8049, "step": 15760 }, { "epoch": 0.5, "learning_rate": 1.9999951089692174e-05, "loss": 0.7939, "step": 15765 }, { "epoch": 0.5, "learning_rate": 1.999994753371627e-05, "loss": 0.8087, "step": 15770 }, { "epoch": 0.5, "learning_rate": 1.999994385296973e-05, "loss": 0.818, "step": 15775 }, { "epoch": 0.5, "learning_rate": 1.999994004745259e-05, "loss": 0.8049, "step": 15780 }, { "epoch": 0.51, "learning_rate": 1.9999936117164904e-05, "loss": 0.8091, "step": 15785 }, { "epoch": 0.51, "learning_rate": 1.999993206210672e-05, "loss": 0.7908, "step": 15790 }, { "epoch": 0.51, "learning_rate": 1.9999927882278092e-05, "loss": 0.8107, "step": 15795 }, { "epoch": 0.51, "learning_rate": 1.9999923577679066e-05, "loss": 0.8138, "step": 15800 }, { "epoch": 0.51, "learning_rate": 1.99999191483097e-05, "loss": 0.8172, "step": 15805 }, { "epoch": 0.51, "learning_rate": 1.9999914594170044e-05, "loss": 0.8231, "step": 15810 }, { "epoch": 0.51, "learning_rate": 1.999990991526016e-05, "loss": 0.804, "step": 15815 }, { "epoch": 0.51, "learning_rate": 1.9999905111580106e-05, "loss": 0.7954, "step": 15820 }, { "epoch": 0.51, "learning_rate": 1.9999900183129944e-05, "loss": 0.805, "step": 15825 }, { "epoch": 0.51, "learning_rate": 1.999989512990973e-05, "loss": 0.8058, "step": 15830 }, { "epoch": 0.51, "learning_rate": 1.9999889951919527e-05, "loss": 0.7999, "step": 15835 }, { "epoch": 0.51, "learning_rate": 1.9999884649159404e-05, "loss": 0.8072, "step": 15840 }, { "epoch": 0.51, "learning_rate": 1.9999879221629427e-05, "loss": 0.7836, "step": 15845 }, { "epoch": 0.51, "learning_rate": 1.999987366932966e-05, "loss": 0.8084, "step": 15850 }, { "epoch": 0.51, "learning_rate": 1.9999867992260173e-05, "loss": 0.7962, "step": 15855 }, { "epoch": 0.51, "learning_rate": 1.999986219042104e-05, "loss": 0.8081, "step": 15860 }, { "epoch": 0.51, "learning_rate": 1.9999856263812333e-05, "loss": 0.8021, "step": 15865 }, { "epoch": 0.51, "learning_rate": 1.9999850212434123e-05, "loss": 0.8116, "step": 15870 }, { "epoch": 0.51, "learning_rate": 1.9999844036286483e-05, "loss": 0.7887, "step": 15875 }, { "epoch": 0.51, "learning_rate": 1.9999837735369497e-05, "loss": 0.8014, "step": 15880 }, { "epoch": 0.51, "learning_rate": 1.999983130968324e-05, "loss": 0.8128, "step": 15885 }, { "epoch": 0.51, "learning_rate": 1.9999824759227794e-05, "loss": 0.7902, "step": 15890 }, { "epoch": 0.51, "learning_rate": 1.9999818084003243e-05, "loss": 0.8068, "step": 15895 }, { "epoch": 0.51, "learning_rate": 1.999981128400966e-05, "loss": 0.8007, "step": 15900 }, { "epoch": 0.51, "learning_rate": 1.9999804359247143e-05, "loss": 0.8065, "step": 15905 }, { "epoch": 0.51, "learning_rate": 1.9999797309715764e-05, "loss": 0.8123, "step": 15910 }, { "epoch": 0.51, "learning_rate": 1.9999790135415625e-05, "loss": 0.8061, "step": 15915 }, { "epoch": 0.51, "learning_rate": 1.999978283634681e-05, "loss": 0.8218, "step": 15920 }, { "epoch": 0.51, "learning_rate": 1.9999775412509405e-05, "loss": 0.8129, "step": 15925 }, { "epoch": 0.51, "learning_rate": 1.999976786390351e-05, "loss": 0.7972, "step": 15930 }, { "epoch": 0.51, "learning_rate": 1.9999760190529214e-05, "loss": 0.8042, "step": 15935 }, { "epoch": 0.51, "learning_rate": 1.999975239238662e-05, "loss": 0.8006, "step": 15940 }, { "epoch": 0.51, "learning_rate": 1.999974446947582e-05, "loss": 0.8065, "step": 15945 }, { "epoch": 0.51, "learning_rate": 1.9999736421796908e-05, "loss": 0.8079, "step": 15950 }, { "epoch": 0.51, "learning_rate": 1.9999728249349994e-05, "loss": 0.8058, "step": 15955 }, { "epoch": 0.51, "learning_rate": 1.9999719952135173e-05, "loss": 0.8074, "step": 15960 }, { "epoch": 0.51, "learning_rate": 1.9999711530152553e-05, "loss": 0.8038, "step": 15965 }, { "epoch": 0.51, "learning_rate": 1.9999702983402236e-05, "loss": 0.8037, "step": 15970 }, { "epoch": 0.51, "learning_rate": 1.999969431188433e-05, "loss": 0.8069, "step": 15975 }, { "epoch": 0.51, "learning_rate": 1.9999685515598943e-05, "loss": 0.7963, "step": 15980 }, { "epoch": 0.51, "learning_rate": 1.9999676594546187e-05, "loss": 0.798, "step": 15985 }, { "epoch": 0.51, "learning_rate": 1.999966754872617e-05, "loss": 0.7953, "step": 15990 }, { "epoch": 0.51, "learning_rate": 1.9999658378139007e-05, "loss": 0.7928, "step": 15995 }, { "epoch": 0.51, "learning_rate": 1.9999649082784807e-05, "loss": 0.812, "step": 16000 }, { "epoch": 0.51, "learning_rate": 1.9999639662663694e-05, "loss": 0.801, "step": 16005 }, { "epoch": 0.51, "learning_rate": 1.9999630117775784e-05, "loss": 0.8012, "step": 16010 }, { "epoch": 0.51, "learning_rate": 1.999962044812119e-05, "loss": 0.8092, "step": 16015 }, { "epoch": 0.51, "learning_rate": 1.9999610653700037e-05, "loss": 0.7979, "step": 16020 }, { "epoch": 0.51, "learning_rate": 1.999960073451245e-05, "loss": 0.813, "step": 16025 }, { "epoch": 0.51, "learning_rate": 1.9999590690558545e-05, "loss": 0.8182, "step": 16030 }, { "epoch": 0.51, "learning_rate": 1.999958052183846e-05, "loss": 0.804, "step": 16035 }, { "epoch": 0.51, "learning_rate": 1.9999570228352305e-05, "loss": 0.7902, "step": 16040 }, { "epoch": 0.51, "learning_rate": 1.9999559810100222e-05, "loss": 0.8077, "step": 16045 }, { "epoch": 0.51, "learning_rate": 1.9999549267082337e-05, "loss": 0.7958, "step": 16050 }, { "epoch": 0.51, "learning_rate": 1.999953859929878e-05, "loss": 0.8167, "step": 16055 }, { "epoch": 0.51, "learning_rate": 1.999952780674968e-05, "loss": 0.8166, "step": 16060 }, { "epoch": 0.51, "learning_rate": 1.9999516889435184e-05, "loss": 0.7958, "step": 16065 }, { "epoch": 0.51, "learning_rate": 1.9999505847355417e-05, "loss": 0.7823, "step": 16070 }, { "epoch": 0.51, "learning_rate": 1.999949468051052e-05, "loss": 0.7901, "step": 16075 }, { "epoch": 0.51, "learning_rate": 1.9999483388900633e-05, "loss": 0.8043, "step": 16080 }, { "epoch": 0.51, "learning_rate": 1.9999471972525897e-05, "loss": 0.7981, "step": 16085 }, { "epoch": 0.51, "learning_rate": 1.9999460431386458e-05, "loss": 0.806, "step": 16090 }, { "epoch": 0.52, "learning_rate": 1.9999448765482453e-05, "loss": 0.8109, "step": 16095 }, { "epoch": 0.52, "learning_rate": 1.999943697481403e-05, "loss": 0.8082, "step": 16100 }, { "epoch": 0.52, "learning_rate": 1.9999425059381335e-05, "loss": 0.8006, "step": 16105 }, { "epoch": 0.52, "learning_rate": 1.9999413019184523e-05, "loss": 0.8063, "step": 16110 }, { "epoch": 0.52, "learning_rate": 1.999940085422374e-05, "loss": 0.8109, "step": 16115 }, { "epoch": 0.52, "learning_rate": 1.9999388564499135e-05, "loss": 0.7764, "step": 16120 }, { "epoch": 0.52, "learning_rate": 1.9999376150010868e-05, "loss": 0.7937, "step": 16125 }, { "epoch": 0.52, "learning_rate": 1.9999363610759082e-05, "loss": 0.7925, "step": 16130 }, { "epoch": 0.52, "learning_rate": 1.9999350946743948e-05, "loss": 0.7932, "step": 16135 }, { "epoch": 0.52, "learning_rate": 1.9999338157965618e-05, "loss": 0.7925, "step": 16140 }, { "epoch": 0.52, "learning_rate": 1.9999325244424247e-05, "loss": 0.7932, "step": 16145 }, { "epoch": 0.52, "learning_rate": 1.9999312206120002e-05, "loss": 0.8033, "step": 16150 }, { "epoch": 0.52, "learning_rate": 1.9999299043053046e-05, "loss": 0.8026, "step": 16155 }, { "epoch": 0.52, "learning_rate": 1.9999285755223536e-05, "loss": 0.8036, "step": 16160 }, { "epoch": 0.52, "learning_rate": 1.9999272342631644e-05, "loss": 0.805, "step": 16165 }, { "epoch": 0.52, "learning_rate": 1.999925880527754e-05, "loss": 0.8061, "step": 16170 }, { "epoch": 0.52, "learning_rate": 1.999924514316138e-05, "loss": 0.8002, "step": 16175 }, { "epoch": 0.52, "learning_rate": 1.999923135628335e-05, "loss": 0.8003, "step": 16180 }, { "epoch": 0.52, "learning_rate": 1.9999217444643616e-05, "loss": 0.8034, "step": 16185 }, { "epoch": 0.52, "learning_rate": 1.999920340824235e-05, "loss": 0.8001, "step": 16190 }, { "epoch": 0.52, "learning_rate": 1.9999189247079727e-05, "loss": 0.8051, "step": 16195 }, { "epoch": 0.52, "learning_rate": 1.9999174961155928e-05, "loss": 0.81, "step": 16200 }, { "epoch": 0.52, "learning_rate": 1.999916055047112e-05, "loss": 0.8035, "step": 16205 }, { "epoch": 0.52, "learning_rate": 1.9999146015025503e-05, "loss": 0.8204, "step": 16210 }, { "epoch": 0.52, "learning_rate": 1.9999131354819236e-05, "loss": 0.7889, "step": 16215 }, { "epoch": 0.52, "learning_rate": 1.9999116569852518e-05, "loss": 0.808, "step": 16220 }, { "epoch": 0.52, "learning_rate": 1.9999101660125525e-05, "loss": 0.8148, "step": 16225 }, { "epoch": 0.52, "learning_rate": 1.9999086625638445e-05, "loss": 0.8018, "step": 16230 }, { "epoch": 0.52, "learning_rate": 1.999907146639147e-05, "loss": 0.8026, "step": 16235 }, { "epoch": 0.52, "learning_rate": 1.999905618238478e-05, "loss": 0.8034, "step": 16240 }, { "epoch": 0.52, "learning_rate": 1.9999040773618578e-05, "loss": 0.7854, "step": 16245 }, { "epoch": 0.52, "learning_rate": 1.9999025240093045e-05, "loss": 0.7926, "step": 16250 }, { "epoch": 0.52, "learning_rate": 1.999900958180838e-05, "loss": 0.8031, "step": 16255 }, { "epoch": 0.52, "learning_rate": 1.9998993798764775e-05, "loss": 0.8155, "step": 16260 }, { "epoch": 0.52, "learning_rate": 1.9998977890962434e-05, "loss": 0.7911, "step": 16265 }, { "epoch": 0.52, "learning_rate": 1.9998961858401545e-05, "loss": 0.8107, "step": 16270 }, { "epoch": 0.52, "learning_rate": 1.9998945701082322e-05, "loss": 0.7884, "step": 16275 }, { "epoch": 0.52, "learning_rate": 1.9998929419004954e-05, "loss": 0.7931, "step": 16280 }, { "epoch": 0.52, "learning_rate": 1.9998913012169646e-05, "loss": 0.8023, "step": 16285 }, { "epoch": 0.52, "learning_rate": 1.999889648057661e-05, "loss": 0.8034, "step": 16290 }, { "epoch": 0.52, "learning_rate": 1.9998879824226048e-05, "loss": 0.795, "step": 16295 }, { "epoch": 0.52, "learning_rate": 1.9998863043118163e-05, "loss": 0.8051, "step": 16300 }, { "epoch": 0.52, "learning_rate": 1.9998846137253173e-05, "loss": 0.8022, "step": 16305 }, { "epoch": 0.52, "learning_rate": 1.9998829106631285e-05, "loss": 0.795, "step": 16310 }, { "epoch": 0.52, "learning_rate": 1.999881195125271e-05, "loss": 0.8107, "step": 16315 }, { "epoch": 0.52, "learning_rate": 1.9998794671117664e-05, "loss": 0.8018, "step": 16320 }, { "epoch": 0.52, "learning_rate": 1.999877726622636e-05, "loss": 0.8064, "step": 16325 }, { "epoch": 0.52, "learning_rate": 1.9998759736579018e-05, "loss": 0.8018, "step": 16330 }, { "epoch": 0.52, "learning_rate": 1.999874208217586e-05, "loss": 0.8011, "step": 16335 }, { "epoch": 0.52, "learning_rate": 1.99987243030171e-05, "loss": 0.8013, "step": 16340 }, { "epoch": 0.52, "learning_rate": 1.999870639910296e-05, "loss": 0.8062, "step": 16345 }, { "epoch": 0.52, "learning_rate": 1.9998688370433667e-05, "loss": 0.7988, "step": 16350 }, { "epoch": 0.52, "learning_rate": 1.999867021700944e-05, "loss": 0.7937, "step": 16355 }, { "epoch": 0.52, "learning_rate": 1.9998651938830517e-05, "loss": 0.8087, "step": 16360 }, { "epoch": 0.52, "learning_rate": 1.9998633535897114e-05, "loss": 0.8028, "step": 16365 }, { "epoch": 0.52, "learning_rate": 1.9998615008209467e-05, "loss": 0.7911, "step": 16370 }, { "epoch": 0.52, "learning_rate": 1.9998596355767805e-05, "loss": 0.7958, "step": 16375 }, { "epoch": 0.52, "learning_rate": 1.9998577578572362e-05, "loss": 0.7933, "step": 16380 }, { "epoch": 0.52, "learning_rate": 1.9998558676623373e-05, "loss": 0.8002, "step": 16385 }, { "epoch": 0.52, "learning_rate": 1.999853964992107e-05, "loss": 0.7892, "step": 16390 }, { "epoch": 0.52, "learning_rate": 1.9998520498465696e-05, "loss": 0.7978, "step": 16395 }, { "epoch": 0.52, "learning_rate": 1.9998501222257486e-05, "loss": 0.7932, "step": 16400 }, { "epoch": 0.52, "learning_rate": 1.999848182129668e-05, "loss": 0.7964, "step": 16405 }, { "epoch": 0.53, "learning_rate": 1.9998462295583522e-05, "loss": 0.7962, "step": 16410 }, { "epoch": 0.53, "learning_rate": 1.9998442645118253e-05, "loss": 0.7919, "step": 16415 }, { "epoch": 0.53, "learning_rate": 1.9998422869901124e-05, "loss": 0.7992, "step": 16420 }, { "epoch": 0.53, "learning_rate": 1.9998402969932376e-05, "loss": 0.7978, "step": 16425 }, { "epoch": 0.53, "learning_rate": 1.9998382945212264e-05, "loss": 0.8122, "step": 16430 }, { "epoch": 0.53, "learning_rate": 1.9998362795741027e-05, "loss": 0.8033, "step": 16435 }, { "epoch": 0.53, "learning_rate": 1.9998342521518924e-05, "loss": 0.8104, "step": 16440 }, { "epoch": 0.53, "learning_rate": 1.9998322122546208e-05, "loss": 0.8012, "step": 16445 }, { "epoch": 0.53, "learning_rate": 1.999830159882313e-05, "loss": 0.7953, "step": 16450 }, { "epoch": 0.53, "learning_rate": 1.999828095034995e-05, "loss": 0.7918, "step": 16455 }, { "epoch": 0.53, "learning_rate": 1.9998260177126924e-05, "loss": 0.7934, "step": 16460 }, { "epoch": 0.53, "learning_rate": 1.9998239279154312e-05, "loss": 0.8083, "step": 16465 }, { "epoch": 0.53, "learning_rate": 1.999821825643237e-05, "loss": 0.7969, "step": 16470 }, { "epoch": 0.53, "learning_rate": 1.999819710896137e-05, "loss": 0.7886, "step": 16475 }, { "epoch": 0.53, "learning_rate": 1.9998175836741564e-05, "loss": 0.7856, "step": 16480 }, { "epoch": 0.53, "learning_rate": 1.9998154439773227e-05, "loss": 0.7983, "step": 16485 }, { "epoch": 0.53, "learning_rate": 1.9998132918056618e-05, "loss": 0.7917, "step": 16490 }, { "epoch": 0.53, "learning_rate": 1.9998111271592015e-05, "loss": 0.7987, "step": 16495 }, { "epoch": 0.53, "learning_rate": 1.999808950037968e-05, "loss": 0.7993, "step": 16500 }, { "epoch": 0.53, "learning_rate": 1.9998067604419886e-05, "loss": 0.7989, "step": 16505 }, { "epoch": 0.53, "learning_rate": 1.9998045583712912e-05, "loss": 0.7924, "step": 16510 }, { "epoch": 0.53, "learning_rate": 1.9998023438259025e-05, "loss": 0.8027, "step": 16515 }, { "epoch": 0.53, "learning_rate": 1.9998001168058506e-05, "loss": 0.8022, "step": 16520 }, { "epoch": 0.53, "learning_rate": 1.999797877311163e-05, "loss": 0.8021, "step": 16525 }, { "epoch": 0.53, "learning_rate": 1.999795625341868e-05, "loss": 0.7978, "step": 16530 }, { "epoch": 0.53, "learning_rate": 1.9997933608979935e-05, "loss": 0.7946, "step": 16535 }, { "epoch": 0.53, "learning_rate": 1.999791083979568e-05, "loss": 0.791, "step": 16540 }, { "epoch": 0.53, "learning_rate": 1.9997887945866193e-05, "loss": 0.7827, "step": 16545 }, { "epoch": 0.53, "learning_rate": 1.9997864927191763e-05, "loss": 0.8033, "step": 16550 }, { "epoch": 0.53, "learning_rate": 1.9997841783772677e-05, "loss": 0.8018, "step": 16555 }, { "epoch": 0.53, "learning_rate": 1.999781851560923e-05, "loss": 0.7866, "step": 16560 }, { "epoch": 0.53, "learning_rate": 1.99977951227017e-05, "loss": 0.791, "step": 16565 }, { "epoch": 0.53, "learning_rate": 1.999777160505039e-05, "loss": 0.7873, "step": 16570 }, { "epoch": 0.53, "learning_rate": 1.999774796265559e-05, "loss": 0.7936, "step": 16575 }, { "epoch": 0.53, "learning_rate": 1.999772419551759e-05, "loss": 0.7932, "step": 16580 }, { "epoch": 0.53, "learning_rate": 1.999770030363669e-05, "loss": 0.79, "step": 16585 }, { "epoch": 0.53, "learning_rate": 1.9997676287013192e-05, "loss": 0.8021, "step": 16590 }, { "epoch": 0.53, "learning_rate": 1.9997652145647392e-05, "loss": 0.7878, "step": 16595 }, { "epoch": 0.53, "learning_rate": 1.999762787953959e-05, "loss": 0.777, "step": 16600 }, { "epoch": 0.53, "learning_rate": 1.999760348869009e-05, "loss": 0.799, "step": 16605 }, { "epoch": 0.53, "learning_rate": 1.9997578973099198e-05, "loss": 0.7981, "step": 16610 }, { "epoch": 0.53, "learning_rate": 1.9997554332767214e-05, "loss": 0.7854, "step": 16615 }, { "epoch": 0.53, "learning_rate": 1.9997529567694457e-05, "loss": 0.7926, "step": 16620 }, { "epoch": 0.53, "learning_rate": 1.9997504677881224e-05, "loss": 0.7918, "step": 16625 }, { "epoch": 0.53, "learning_rate": 1.999747966332783e-05, "loss": 0.7897, "step": 16630 }, { "epoch": 0.53, "learning_rate": 1.999745452403459e-05, "loss": 0.8022, "step": 16635 }, { "epoch": 0.53, "learning_rate": 1.9997429260001814e-05, "loss": 0.7988, "step": 16640 }, { "epoch": 0.53, "learning_rate": 1.999740387122982e-05, "loss": 0.7887, "step": 16645 }, { "epoch": 0.53, "learning_rate": 1.9997378357718923e-05, "loss": 0.7911, "step": 16650 }, { "epoch": 0.53, "learning_rate": 1.999735271946944e-05, "loss": 0.7977, "step": 16655 }, { "epoch": 0.53, "learning_rate": 1.9997326956481693e-05, "loss": 0.7926, "step": 16660 }, { "epoch": 0.53, "learning_rate": 1.9997301068756e-05, "loss": 0.7915, "step": 16665 }, { "epoch": 0.53, "learning_rate": 1.9997275056292692e-05, "loss": 0.7975, "step": 16670 }, { "epoch": 0.53, "learning_rate": 1.9997248919092087e-05, "loss": 0.7834, "step": 16675 }, { "epoch": 0.53, "learning_rate": 1.9997222657154512e-05, "loss": 0.7915, "step": 16680 }, { "epoch": 0.53, "learning_rate": 1.9997196270480295e-05, "loss": 0.7949, "step": 16685 }, { "epoch": 0.53, "learning_rate": 1.9997169759069766e-05, "loss": 0.8013, "step": 16690 }, { "epoch": 0.53, "learning_rate": 1.9997143122923254e-05, "loss": 0.7742, "step": 16695 }, { "epoch": 0.53, "learning_rate": 1.9997116362041095e-05, "loss": 0.7995, "step": 16700 }, { "epoch": 0.53, "learning_rate": 1.9997089476423617e-05, "loss": 0.7932, "step": 16705 }, { "epoch": 0.53, "learning_rate": 1.9997062466071163e-05, "loss": 0.7954, "step": 16710 }, { "epoch": 0.53, "learning_rate": 1.999703533098406e-05, "loss": 0.8034, "step": 16715 }, { "epoch": 0.54, "learning_rate": 1.999700807116266e-05, "loss": 0.8046, "step": 16720 }, { "epoch": 0.54, "learning_rate": 1.9996980686607293e-05, "loss": 0.7854, "step": 16725 }, { "epoch": 0.54, "learning_rate": 1.99969531773183e-05, "loss": 0.7747, "step": 16730 }, { "epoch": 0.54, "learning_rate": 1.9996925543296033e-05, "loss": 0.7984, "step": 16735 }, { "epoch": 0.54, "learning_rate": 1.999689778454083e-05, "loss": 0.8052, "step": 16740 }, { "epoch": 0.54, "learning_rate": 1.9996869901053033e-05, "loss": 0.7937, "step": 16745 }, { "epoch": 0.54, "learning_rate": 1.9996841892833e-05, "loss": 0.7886, "step": 16750 }, { "epoch": 0.54, "learning_rate": 1.9996813759881077e-05, "loss": 0.7856, "step": 16755 }, { "epoch": 0.54, "learning_rate": 1.9996785502197612e-05, "loss": 0.7923, "step": 16760 }, { "epoch": 0.54, "learning_rate": 1.9996757119782965e-05, "loss": 0.8013, "step": 16765 }, { "epoch": 0.54, "learning_rate": 1.9996728612637478e-05, "loss": 0.7776, "step": 16770 }, { "epoch": 0.54, "learning_rate": 1.9996699980761515e-05, "loss": 0.7908, "step": 16775 }, { "epoch": 0.54, "learning_rate": 1.9996671224155433e-05, "loss": 0.7996, "step": 16780 }, { "epoch": 0.54, "learning_rate": 1.999664234281959e-05, "loss": 0.792, "step": 16785 }, { "epoch": 0.54, "learning_rate": 1.9996613336754347e-05, "loss": 0.7879, "step": 16790 }, { "epoch": 0.54, "learning_rate": 1.9996584205960063e-05, "loss": 0.7953, "step": 16795 }, { "epoch": 0.54, "learning_rate": 1.9996554950437105e-05, "loss": 0.7925, "step": 16800 }, { "epoch": 0.54, "learning_rate": 1.999652557018583e-05, "loss": 0.7896, "step": 16805 }, { "epoch": 0.54, "learning_rate": 1.9996496065206615e-05, "loss": 0.7841, "step": 16810 }, { "epoch": 0.54, "learning_rate": 1.999646643549983e-05, "loss": 0.7986, "step": 16815 }, { "epoch": 0.54, "learning_rate": 1.9996436681065832e-05, "loss": 0.7807, "step": 16820 }, { "epoch": 0.54, "learning_rate": 1.9996406801905e-05, "loss": 0.7994, "step": 16825 }, { "epoch": 0.54, "learning_rate": 1.9996376798017703e-05, "loss": 0.7908, "step": 16830 }, { "epoch": 0.54, "learning_rate": 1.9996346669404324e-05, "loss": 0.7914, "step": 16835 }, { "epoch": 0.54, "learning_rate": 1.999631641606523e-05, "loss": 0.7935, "step": 16840 }, { "epoch": 0.54, "learning_rate": 1.9996286038000804e-05, "loss": 0.8017, "step": 16845 }, { "epoch": 0.54, "learning_rate": 1.999625553521142e-05, "loss": 0.7787, "step": 16850 }, { "epoch": 0.54, "learning_rate": 1.9996224907697463e-05, "loss": 0.7809, "step": 16855 }, { "epoch": 0.54, "learning_rate": 1.999619415545931e-05, "loss": 0.7966, "step": 16860 }, { "epoch": 0.54, "learning_rate": 1.999616327849735e-05, "loss": 0.7997, "step": 16865 }, { "epoch": 0.54, "learning_rate": 1.9996132276811967e-05, "loss": 0.7927, "step": 16870 }, { "epoch": 0.54, "learning_rate": 1.9996101150403543e-05, "loss": 0.8082, "step": 16875 }, { "epoch": 0.54, "learning_rate": 1.9996069899272473e-05, "loss": 0.7971, "step": 16880 }, { "epoch": 0.54, "learning_rate": 1.9996038523419148e-05, "loss": 0.8072, "step": 16885 }, { "epoch": 0.54, "learning_rate": 1.9996007022843952e-05, "loss": 0.795, "step": 16890 }, { "epoch": 0.54, "learning_rate": 1.999597539754728e-05, "loss": 0.7845, "step": 16895 }, { "epoch": 0.54, "learning_rate": 1.9995943647529533e-05, "loss": 0.8029, "step": 16900 }, { "epoch": 0.54, "learning_rate": 1.9995911772791102e-05, "loss": 0.7906, "step": 16905 }, { "epoch": 0.54, "learning_rate": 1.9995879773332386e-05, "loss": 0.7852, "step": 16910 }, { "epoch": 0.54, "learning_rate": 1.999584764915378e-05, "loss": 0.7807, "step": 16915 }, { "epoch": 0.54, "learning_rate": 1.9995815400255692e-05, "loss": 0.8018, "step": 16920 }, { "epoch": 0.54, "learning_rate": 1.999578302663852e-05, "loss": 0.7903, "step": 16925 }, { "epoch": 0.54, "learning_rate": 1.9995750528302668e-05, "loss": 0.8071, "step": 16930 }, { "epoch": 0.54, "learning_rate": 1.999571790524854e-05, "loss": 0.7847, "step": 16935 }, { "epoch": 0.54, "learning_rate": 1.999568515747655e-05, "loss": 0.7888, "step": 16940 }, { "epoch": 0.54, "learning_rate": 1.9995652284987096e-05, "loss": 0.8046, "step": 16945 }, { "epoch": 0.54, "learning_rate": 1.99956192877806e-05, "loss": 0.7917, "step": 16950 }, { "epoch": 0.54, "learning_rate": 1.999558616585746e-05, "loss": 0.8026, "step": 16955 }, { "epoch": 0.54, "learning_rate": 1.9995552919218106e-05, "loss": 0.7967, "step": 16960 }, { "epoch": 0.54, "learning_rate": 1.9995519547862937e-05, "loss": 0.797, "step": 16965 }, { "epoch": 0.54, "learning_rate": 1.999548605179238e-05, "loss": 0.7935, "step": 16970 }, { "epoch": 0.54, "learning_rate": 1.9995452431006844e-05, "loss": 0.7889, "step": 16975 }, { "epoch": 0.54, "learning_rate": 1.999541868550676e-05, "loss": 0.7921, "step": 16980 }, { "epoch": 0.54, "learning_rate": 1.9995384815292537e-05, "loss": 0.8021, "step": 16985 }, { "epoch": 0.54, "learning_rate": 1.9995350820364608e-05, "loss": 0.7878, "step": 16990 }, { "epoch": 0.54, "learning_rate": 1.9995316700723393e-05, "loss": 0.7911, "step": 16995 }, { "epoch": 0.54, "learning_rate": 1.9995282456369313e-05, "loss": 0.7908, "step": 17000 }, { "epoch": 0.54, "learning_rate": 1.99952480873028e-05, "loss": 0.7852, "step": 17005 }, { "epoch": 0.54, "learning_rate": 1.9995213593524284e-05, "loss": 0.7886, "step": 17010 }, { "epoch": 0.54, "learning_rate": 1.9995178975034192e-05, "loss": 0.8128, "step": 17015 }, { "epoch": 0.54, "learning_rate": 1.999514423183296e-05, "loss": 0.7891, "step": 17020 }, { "epoch": 0.54, "learning_rate": 1.9995109363921017e-05, "loss": 0.7979, "step": 17025 }, { "epoch": 0.54, "learning_rate": 1.99950743712988e-05, "loss": 0.7899, "step": 17030 }, { "epoch": 0.55, "learning_rate": 1.9995039253966747e-05, "loss": 0.7863, "step": 17035 }, { "epoch": 0.55, "learning_rate": 1.9995004011925294e-05, "loss": 0.7946, "step": 17040 }, { "epoch": 0.55, "learning_rate": 1.9994968645174882e-05, "loss": 0.8047, "step": 17045 }, { "epoch": 0.55, "learning_rate": 1.999493315371595e-05, "loss": 0.7986, "step": 17050 }, { "epoch": 0.55, "learning_rate": 1.9994897537548944e-05, "loss": 0.7912, "step": 17055 }, { "epoch": 0.55, "learning_rate": 1.9994861796674308e-05, "loss": 0.7776, "step": 17060 }, { "epoch": 0.55, "learning_rate": 1.9994825931092486e-05, "loss": 0.7861, "step": 17065 }, { "epoch": 0.55, "learning_rate": 1.9994789940803926e-05, "loss": 0.7856, "step": 17070 }, { "epoch": 0.55, "learning_rate": 1.999475382580908e-05, "loss": 0.7942, "step": 17075 }, { "epoch": 0.55, "learning_rate": 1.9994717586108395e-05, "loss": 0.783, "step": 17080 }, { "epoch": 0.55, "learning_rate": 1.9994681221702324e-05, "loss": 0.7999, "step": 17085 }, { "epoch": 0.55, "learning_rate": 1.9994644732591322e-05, "loss": 0.7919, "step": 17090 }, { "epoch": 0.55, "learning_rate": 1.999460811877584e-05, "loss": 0.7913, "step": 17095 }, { "epoch": 0.55, "learning_rate": 1.9994571380256343e-05, "loss": 0.7873, "step": 17100 }, { "epoch": 0.55, "learning_rate": 1.999453451703328e-05, "loss": 0.781, "step": 17105 }, { "epoch": 0.55, "learning_rate": 1.9994497529107118e-05, "loss": 0.7837, "step": 17110 }, { "epoch": 0.55, "learning_rate": 1.9994460416478315e-05, "loss": 0.7863, "step": 17115 }, { "epoch": 0.55, "learning_rate": 1.9994423179147335e-05, "loss": 0.7935, "step": 17120 }, { "epoch": 0.55, "learning_rate": 1.9994385817114644e-05, "loss": 0.7906, "step": 17125 }, { "epoch": 0.55, "learning_rate": 1.9994348330380706e-05, "loss": 0.7967, "step": 17130 }, { "epoch": 0.55, "learning_rate": 1.999431071894599e-05, "loss": 0.7842, "step": 17135 }, { "epoch": 0.55, "learning_rate": 1.9994272982810966e-05, "loss": 0.8055, "step": 17140 }, { "epoch": 0.55, "learning_rate": 1.9994235121976104e-05, "loss": 0.7899, "step": 17145 }, { "epoch": 0.55, "learning_rate": 1.9994197136441874e-05, "loss": 0.8048, "step": 17150 }, { "epoch": 0.55, "learning_rate": 1.999415902620875e-05, "loss": 0.7852, "step": 17155 }, { "epoch": 0.55, "learning_rate": 1.9994120791277214e-05, "loss": 0.7933, "step": 17160 }, { "epoch": 0.55, "learning_rate": 1.9994082431647735e-05, "loss": 0.7959, "step": 17165 }, { "epoch": 0.55, "learning_rate": 1.9994043947320797e-05, "loss": 0.7917, "step": 17170 }, { "epoch": 0.55, "learning_rate": 1.999400533829688e-05, "loss": 0.7864, "step": 17175 }, { "epoch": 0.55, "learning_rate": 1.9993966604576463e-05, "loss": 0.7963, "step": 17180 }, { "epoch": 0.55, "learning_rate": 1.999392774616003e-05, "loss": 0.7757, "step": 17185 }, { "epoch": 0.55, "learning_rate": 1.9993888763048068e-05, "loss": 0.7946, "step": 17190 }, { "epoch": 0.55, "learning_rate": 1.9993849655241058e-05, "loss": 0.7849, "step": 17195 }, { "epoch": 0.55, "learning_rate": 1.9993810422739496e-05, "loss": 0.788, "step": 17200 }, { "epoch": 0.55, "learning_rate": 1.9993771065543862e-05, "loss": 0.8009, "step": 17205 }, { "epoch": 0.55, "learning_rate": 1.9993731583654655e-05, "loss": 0.8047, "step": 17210 }, { "epoch": 0.55, "learning_rate": 1.9993691977072366e-05, "loss": 0.7931, "step": 17215 }, { "epoch": 0.55, "learning_rate": 1.999365224579749e-05, "loss": 0.7869, "step": 17220 }, { "epoch": 0.55, "learning_rate": 1.9993612389830516e-05, "loss": 0.8, "step": 17225 }, { "epoch": 0.55, "learning_rate": 1.9993572409171945e-05, "loss": 0.7887, "step": 17230 }, { "epoch": 0.55, "learning_rate": 1.999353230382228e-05, "loss": 0.8025, "step": 17235 }, { "epoch": 0.55, "learning_rate": 1.999349207378202e-05, "loss": 0.7926, "step": 17240 }, { "epoch": 0.55, "learning_rate": 1.9993451719051663e-05, "loss": 0.7856, "step": 17245 }, { "epoch": 0.55, "learning_rate": 1.9993411239631713e-05, "loss": 0.7885, "step": 17250 }, { "epoch": 0.55, "learning_rate": 1.9993370635522676e-05, "loss": 0.7891, "step": 17255 }, { "epoch": 0.55, "learning_rate": 1.9993329906725066e-05, "loss": 0.7792, "step": 17260 }, { "epoch": 0.55, "learning_rate": 1.999328905323938e-05, "loss": 0.7941, "step": 17265 }, { "epoch": 0.55, "learning_rate": 1.9993248075066135e-05, "loss": 0.7877, "step": 17270 }, { "epoch": 0.55, "learning_rate": 1.9993206972205836e-05, "loss": 0.7872, "step": 17275 }, { "epoch": 0.55, "learning_rate": 1.9993165744659e-05, "loss": 0.7769, "step": 17280 }, { "epoch": 0.55, "learning_rate": 1.9993124392426142e-05, "loss": 0.7763, "step": 17285 }, { "epoch": 0.55, "learning_rate": 1.9993082915507776e-05, "loss": 0.7893, "step": 17290 }, { "epoch": 0.55, "learning_rate": 1.9993041313904422e-05, "loss": 0.792, "step": 17295 }, { "epoch": 0.55, "learning_rate": 1.99929995876166e-05, "loss": 0.7964, "step": 17300 }, { "epoch": 0.55, "learning_rate": 1.999295773664482e-05, "loss": 0.8055, "step": 17305 }, { "epoch": 0.55, "learning_rate": 1.9992915760989617e-05, "loss": 0.7838, "step": 17310 }, { "epoch": 0.55, "learning_rate": 1.9992873660651512e-05, "loss": 0.7795, "step": 17315 }, { "epoch": 0.55, "learning_rate": 1.9992831435631024e-05, "loss": 0.7923, "step": 17320 }, { "epoch": 0.55, "learning_rate": 1.9992789085928686e-05, "loss": 0.7888, "step": 17325 }, { "epoch": 0.55, "learning_rate": 1.9992746611545027e-05, "loss": 0.7942, "step": 17330 }, { "epoch": 0.55, "learning_rate": 1.999270401248057e-05, "loss": 0.7993, "step": 17335 }, { "epoch": 0.55, "learning_rate": 1.999266128873585e-05, "loss": 0.7932, "step": 17340 }, { "epoch": 0.56, "learning_rate": 1.9992618440311407e-05, "loss": 0.7697, "step": 17345 }, { "epoch": 0.56, "learning_rate": 1.9992575467207765e-05, "loss": 0.785, "step": 17350 }, { "epoch": 0.56, "learning_rate": 1.9992532369425468e-05, "loss": 0.7809, "step": 17355 }, { "epoch": 0.56, "learning_rate": 1.999248914696505e-05, "loss": 0.7794, "step": 17360 }, { "epoch": 0.56, "learning_rate": 1.999244579982705e-05, "loss": 0.7813, "step": 17365 }, { "epoch": 0.56, "learning_rate": 1.999240232801201e-05, "loss": 0.7972, "step": 17370 }, { "epoch": 0.56, "learning_rate": 1.999235873152047e-05, "loss": 0.7865, "step": 17375 }, { "epoch": 0.56, "learning_rate": 1.9992315010352978e-05, "loss": 0.7781, "step": 17380 }, { "epoch": 0.56, "learning_rate": 1.9992271164510077e-05, "loss": 0.7833, "step": 17385 }, { "epoch": 0.56, "learning_rate": 1.9992227193992316e-05, "loss": 0.7826, "step": 17390 }, { "epoch": 0.56, "learning_rate": 1.999218309880024e-05, "loss": 0.7971, "step": 17395 }, { "epoch": 0.56, "learning_rate": 1.9992138878934405e-05, "loss": 0.8041, "step": 17400 }, { "epoch": 0.56, "learning_rate": 1.9992094534395358e-05, "loss": 0.7839, "step": 17405 }, { "epoch": 0.56, "learning_rate": 1.999205006518365e-05, "loss": 0.7784, "step": 17410 }, { "epoch": 0.56, "learning_rate": 1.9992005471299843e-05, "loss": 0.7738, "step": 17415 }, { "epoch": 0.56, "learning_rate": 1.9991960752744487e-05, "loss": 0.7821, "step": 17420 }, { "epoch": 0.56, "learning_rate": 1.9991915909518146e-05, "loss": 0.8009, "step": 17425 }, { "epoch": 0.56, "learning_rate": 1.9991870941621373e-05, "loss": 0.7956, "step": 17430 }, { "epoch": 0.56, "learning_rate": 1.9991825849054736e-05, "loss": 0.7858, "step": 17435 }, { "epoch": 0.56, "learning_rate": 1.999178063181879e-05, "loss": 0.7937, "step": 17440 }, { "epoch": 0.56, "learning_rate": 1.999173528991411e-05, "loss": 0.7911, "step": 17445 }, { "epoch": 0.56, "learning_rate": 1.9991689823341246e-05, "loss": 0.7851, "step": 17450 }, { "epoch": 0.56, "learning_rate": 1.9991644232100777e-05, "loss": 0.7952, "step": 17455 }, { "epoch": 0.56, "learning_rate": 1.999159851619327e-05, "loss": 0.7841, "step": 17460 }, { "epoch": 0.56, "learning_rate": 1.9991552675619295e-05, "loss": 0.7903, "step": 17465 }, { "epoch": 0.56, "learning_rate": 1.9991506710379424e-05, "loss": 0.7887, "step": 17470 }, { "epoch": 0.56, "learning_rate": 1.9991460620474226e-05, "loss": 0.789, "step": 17475 }, { "epoch": 0.56, "learning_rate": 1.9991414405904285e-05, "loss": 0.7943, "step": 17480 }, { "epoch": 0.56, "learning_rate": 1.999136806667017e-05, "loss": 0.7921, "step": 17485 }, { "epoch": 0.56, "learning_rate": 1.999132160277246e-05, "loss": 0.7916, "step": 17490 }, { "epoch": 0.56, "learning_rate": 1.999127501421174e-05, "loss": 0.7846, "step": 17495 }, { "epoch": 0.56, "learning_rate": 1.9991228300988586e-05, "loss": 0.7849, "step": 17500 }, { "epoch": 0.56, "learning_rate": 1.9991181463103582e-05, "loss": 0.7762, "step": 17505 }, { "epoch": 0.56, "learning_rate": 1.9991134500557314e-05, "loss": 0.7766, "step": 17510 }, { "epoch": 0.56, "learning_rate": 1.9991087413350367e-05, "loss": 0.7789, "step": 17515 }, { "epoch": 0.56, "learning_rate": 1.9991040201483326e-05, "loss": 0.7817, "step": 17520 }, { "epoch": 0.56, "learning_rate": 1.9990992864956785e-05, "loss": 0.7826, "step": 17525 }, { "epoch": 0.56, "learning_rate": 1.9990945403771334e-05, "loss": 0.7854, "step": 17530 }, { "epoch": 0.56, "learning_rate": 1.999089781792756e-05, "loss": 0.7736, "step": 17535 }, { "epoch": 0.56, "learning_rate": 1.999085010742606e-05, "loss": 0.7784, "step": 17540 }, { "epoch": 0.56, "learning_rate": 1.9990802272267432e-05, "loss": 0.7852, "step": 17545 }, { "epoch": 0.56, "learning_rate": 1.9990754312452266e-05, "loss": 0.793, "step": 17550 }, { "epoch": 0.56, "learning_rate": 1.999070622798117e-05, "loss": 0.793, "step": 17555 }, { "epoch": 0.56, "learning_rate": 1.9990658018854737e-05, "loss": 0.7967, "step": 17560 }, { "epoch": 0.56, "learning_rate": 1.999060968507357e-05, "loss": 0.7935, "step": 17565 }, { "epoch": 0.56, "learning_rate": 1.999056122663827e-05, "loss": 0.7738, "step": 17570 }, { "epoch": 0.56, "learning_rate": 1.9990512643549444e-05, "loss": 0.7943, "step": 17575 }, { "epoch": 0.56, "learning_rate": 1.99904639358077e-05, "loss": 0.7765, "step": 17580 }, { "epoch": 0.56, "learning_rate": 1.999041510341364e-05, "loss": 0.7782, "step": 17585 }, { "epoch": 0.56, "learning_rate": 1.999036614636788e-05, "loss": 0.7819, "step": 17590 }, { "epoch": 0.56, "learning_rate": 1.999031706467103e-05, "loss": 0.7797, "step": 17595 }, { "epoch": 0.56, "learning_rate": 1.9990267858323697e-05, "loss": 0.7859, "step": 17600 }, { "epoch": 0.56, "learning_rate": 1.99902185273265e-05, "loss": 0.7792, "step": 17605 }, { "epoch": 0.56, "learning_rate": 1.999016907168005e-05, "loss": 0.7817, "step": 17610 }, { "epoch": 0.56, "learning_rate": 1.999011949138497e-05, "loss": 0.7855, "step": 17615 }, { "epoch": 0.56, "learning_rate": 1.9990069786441874e-05, "loss": 0.7691, "step": 17620 }, { "epoch": 0.56, "learning_rate": 1.9990019956851384e-05, "loss": 0.7852, "step": 17625 }, { "epoch": 0.56, "learning_rate": 1.9989970002614118e-05, "loss": 0.7847, "step": 17630 }, { "epoch": 0.56, "learning_rate": 1.998991992373071e-05, "loss": 0.7722, "step": 17635 }, { "epoch": 0.56, "learning_rate": 1.998986972020177e-05, "loss": 0.7866, "step": 17640 }, { "epoch": 0.56, "learning_rate": 1.998981939202793e-05, "loss": 0.7912, "step": 17645 }, { "epoch": 0.56, "learning_rate": 1.9989768939209826e-05, "loss": 0.7878, "step": 17650 }, { "epoch": 0.56, "learning_rate": 1.9989718361748082e-05, "loss": 0.7918, "step": 17655 }, { "epoch": 0.57, "learning_rate": 1.9989667659643322e-05, "loss": 0.7751, "step": 17660 }, { "epoch": 0.57, "learning_rate": 1.998961683289619e-05, "loss": 0.7902, "step": 17665 }, { "epoch": 0.57, "learning_rate": 1.9989565881507317e-05, "loss": 0.7958, "step": 17670 }, { "epoch": 0.57, "learning_rate": 1.9989514805477332e-05, "loss": 0.7786, "step": 17675 }, { "epoch": 0.57, "learning_rate": 1.998946360480688e-05, "loss": 0.7785, "step": 17680 }, { "epoch": 0.57, "learning_rate": 1.998941227949659e-05, "loss": 0.7763, "step": 17685 }, { "epoch": 0.57, "learning_rate": 1.9989360829547117e-05, "loss": 0.7854, "step": 17690 }, { "epoch": 0.57, "learning_rate": 1.9989309254959096e-05, "loss": 0.7791, "step": 17695 }, { "epoch": 0.57, "learning_rate": 1.9989257555733164e-05, "loss": 0.7901, "step": 17700 }, { "epoch": 0.57, "learning_rate": 1.9989205731869977e-05, "loss": 0.7867, "step": 17705 }, { "epoch": 0.57, "learning_rate": 1.998915378337017e-05, "loss": 0.7873, "step": 17710 }, { "epoch": 0.57, "learning_rate": 1.9989101710234403e-05, "loss": 0.8055, "step": 17715 }, { "epoch": 0.57, "learning_rate": 1.998904951246332e-05, "loss": 0.791, "step": 17720 }, { "epoch": 0.57, "learning_rate": 1.9988997190057574e-05, "loss": 0.7741, "step": 17725 }, { "epoch": 0.57, "learning_rate": 1.9988944743017814e-05, "loss": 0.7945, "step": 17730 }, { "epoch": 0.57, "learning_rate": 1.9988892171344698e-05, "loss": 0.7847, "step": 17735 }, { "epoch": 0.57, "learning_rate": 1.998883947503888e-05, "loss": 0.7916, "step": 17740 }, { "epoch": 0.57, "learning_rate": 1.9988786654101016e-05, "loss": 0.7865, "step": 17745 }, { "epoch": 0.57, "learning_rate": 1.9988733708531772e-05, "loss": 0.7945, "step": 17750 }, { "epoch": 0.57, "learning_rate": 1.99886806383318e-05, "loss": 0.7809, "step": 17755 }, { "epoch": 0.57, "learning_rate": 1.998862744350177e-05, "loss": 0.7709, "step": 17760 }, { "epoch": 0.57, "learning_rate": 1.998857412404234e-05, "loss": 0.7882, "step": 17765 }, { "epoch": 0.57, "learning_rate": 1.9988520679954175e-05, "loss": 0.7893, "step": 17770 }, { "epoch": 0.57, "learning_rate": 1.9988467111237947e-05, "loss": 0.7949, "step": 17775 }, { "epoch": 0.57, "learning_rate": 1.9988413417894322e-05, "loss": 0.7723, "step": 17780 }, { "epoch": 0.57, "learning_rate": 1.9988359599923964e-05, "loss": 0.7767, "step": 17785 }, { "epoch": 0.57, "learning_rate": 1.9988305657327552e-05, "loss": 0.7874, "step": 17790 }, { "epoch": 0.57, "learning_rate": 1.998825159010576e-05, "loss": 0.7961, "step": 17795 }, { "epoch": 0.57, "learning_rate": 1.9988197398259257e-05, "loss": 0.7845, "step": 17800 }, { "epoch": 0.57, "learning_rate": 1.9988143081788722e-05, "loss": 0.787, "step": 17805 }, { "epoch": 0.57, "learning_rate": 1.998808864069483e-05, "loss": 0.7909, "step": 17810 }, { "epoch": 0.57, "learning_rate": 1.9988034074978268e-05, "loss": 0.7986, "step": 17815 }, { "epoch": 0.57, "learning_rate": 1.998797938463971e-05, "loss": 0.7742, "step": 17820 }, { "epoch": 0.57, "learning_rate": 1.9987924569679836e-05, "loss": 0.7799, "step": 17825 }, { "epoch": 0.57, "learning_rate": 1.9987869630099333e-05, "loss": 0.7805, "step": 17830 }, { "epoch": 0.57, "learning_rate": 1.9987814565898894e-05, "loss": 0.7886, "step": 17835 }, { "epoch": 0.57, "learning_rate": 1.9987759377079193e-05, "loss": 0.7778, "step": 17840 }, { "epoch": 0.57, "learning_rate": 1.9987704063640925e-05, "loss": 0.7831, "step": 17845 }, { "epoch": 0.57, "learning_rate": 1.9987648625584785e-05, "loss": 0.7849, "step": 17850 }, { "epoch": 0.57, "learning_rate": 1.9987593062911457e-05, "loss": 0.7729, "step": 17855 }, { "epoch": 0.57, "learning_rate": 1.9987537375621635e-05, "loss": 0.7932, "step": 17860 }, { "epoch": 0.57, "learning_rate": 1.9987481563716015e-05, "loss": 0.789, "step": 17865 }, { "epoch": 0.57, "learning_rate": 1.99874256271953e-05, "loss": 0.7778, "step": 17870 }, { "epoch": 0.57, "learning_rate": 1.998736956606018e-05, "loss": 0.7953, "step": 17875 }, { "epoch": 0.57, "learning_rate": 1.9987313380311352e-05, "loss": 0.7918, "step": 17880 }, { "epoch": 0.57, "learning_rate": 1.9987257069949522e-05, "loss": 0.7737, "step": 17885 }, { "epoch": 0.57, "learning_rate": 1.9987200634975397e-05, "loss": 0.7828, "step": 17890 }, { "epoch": 0.57, "learning_rate": 1.9987144075389674e-05, "loss": 0.7836, "step": 17895 }, { "epoch": 0.57, "learning_rate": 1.998708739119306e-05, "loss": 0.7735, "step": 17900 }, { "epoch": 0.57, "learning_rate": 1.9987030582386264e-05, "loss": 0.7686, "step": 17905 }, { "epoch": 0.57, "learning_rate": 1.9986973648969996e-05, "loss": 0.7814, "step": 17910 }, { "epoch": 0.57, "learning_rate": 1.9986916590944964e-05, "loss": 0.7792, "step": 17915 }, { "epoch": 0.57, "learning_rate": 1.9986859408311878e-05, "loss": 0.783, "step": 17920 }, { "epoch": 0.57, "learning_rate": 1.9986802101071453e-05, "loss": 0.7787, "step": 17925 }, { "epoch": 0.57, "learning_rate": 1.998674466922441e-05, "loss": 0.7809, "step": 17930 }, { "epoch": 0.57, "learning_rate": 1.9986687112771457e-05, "loss": 0.7825, "step": 17935 }, { "epoch": 0.57, "learning_rate": 1.9986629431713315e-05, "loss": 0.7737, "step": 17940 }, { "epoch": 0.57, "learning_rate": 1.9986571626050705e-05, "loss": 0.7896, "step": 17945 }, { "epoch": 0.57, "learning_rate": 1.998651369578435e-05, "loss": 0.7813, "step": 17950 }, { "epoch": 0.57, "learning_rate": 1.9986455640914967e-05, "loss": 0.7751, "step": 17955 }, { "epoch": 0.57, "learning_rate": 1.9986397461443286e-05, "loss": 0.7832, "step": 17960 }, { "epoch": 0.57, "learning_rate": 1.9986339157370026e-05, "loss": 0.7842, "step": 17965 }, { "epoch": 0.58, "learning_rate": 1.9986280728695923e-05, "loss": 0.7829, "step": 17970 }, { "epoch": 0.58, "learning_rate": 1.9986222175421704e-05, "loss": 0.7832, "step": 17975 }, { "epoch": 0.58, "learning_rate": 1.9986163497548096e-05, "loss": 0.7913, "step": 17980 }, { "epoch": 0.58, "learning_rate": 1.9986104695075832e-05, "loss": 0.7809, "step": 17985 }, { "epoch": 0.58, "learning_rate": 1.9986045768005645e-05, "loss": 0.7859, "step": 17990 }, { "epoch": 0.58, "learning_rate": 1.9985986716338274e-05, "loss": 0.7821, "step": 17995 }, { "epoch": 0.58, "learning_rate": 1.9985927540074453e-05, "loss": 0.7691, "step": 18000 }, { "epoch": 0.58, "learning_rate": 1.9985868239214922e-05, "loss": 0.7877, "step": 18005 }, { "epoch": 0.58, "learning_rate": 1.998580881376042e-05, "loss": 0.781, "step": 18010 }, { "epoch": 0.58, "learning_rate": 1.9985749263711685e-05, "loss": 0.7697, "step": 18015 }, { "epoch": 0.58, "learning_rate": 1.9985689589069467e-05, "loss": 0.7816, "step": 18020 }, { "epoch": 0.58, "learning_rate": 1.9985629789834503e-05, "loss": 0.7736, "step": 18025 }, { "epoch": 0.58, "learning_rate": 1.9985569866007545e-05, "loss": 0.781, "step": 18030 }, { "epoch": 0.58, "learning_rate": 1.9985509817589338e-05, "loss": 0.7733, "step": 18035 }, { "epoch": 0.58, "learning_rate": 1.9985449644580635e-05, "loss": 0.7856, "step": 18040 }, { "epoch": 0.58, "learning_rate": 1.998538934698218e-05, "loss": 0.781, "step": 18045 }, { "epoch": 0.58, "learning_rate": 1.9985328924794732e-05, "loss": 0.7725, "step": 18050 }, { "epoch": 0.58, "learning_rate": 1.998526837801904e-05, "loss": 0.7625, "step": 18055 }, { "epoch": 0.58, "learning_rate": 1.998520770665586e-05, "loss": 0.7889, "step": 18060 }, { "epoch": 0.58, "learning_rate": 1.9985146910705954e-05, "loss": 0.783, "step": 18065 }, { "epoch": 0.58, "learning_rate": 1.9985085990170072e-05, "loss": 0.7721, "step": 18070 }, { "epoch": 0.58, "learning_rate": 1.9985024945048982e-05, "loss": 0.7708, "step": 18075 }, { "epoch": 0.58, "learning_rate": 1.998496377534344e-05, "loss": 0.7721, "step": 18080 }, { "epoch": 0.58, "learning_rate": 1.9984902481054217e-05, "loss": 0.7922, "step": 18085 }, { "epoch": 0.58, "learning_rate": 1.998484106218207e-05, "loss": 0.7676, "step": 18090 }, { "epoch": 0.58, "learning_rate": 1.998477951872777e-05, "loss": 0.7756, "step": 18095 }, { "epoch": 0.58, "learning_rate": 1.998471785069208e-05, "loss": 0.7706, "step": 18100 }, { "epoch": 0.58, "learning_rate": 1.9984656058075772e-05, "loss": 0.7932, "step": 18105 }, { "epoch": 0.58, "learning_rate": 1.998459414087962e-05, "loss": 0.783, "step": 18110 }, { "epoch": 0.58, "learning_rate": 1.998453209910439e-05, "loss": 0.766, "step": 18115 }, { "epoch": 0.58, "learning_rate": 1.9984469932750862e-05, "loss": 0.7776, "step": 18120 }, { "epoch": 0.58, "learning_rate": 1.9984407641819812e-05, "loss": 0.7832, "step": 18125 }, { "epoch": 0.58, "learning_rate": 1.9984345226312012e-05, "loss": 0.7855, "step": 18130 }, { "epoch": 0.58, "learning_rate": 1.9984282686228244e-05, "loss": 0.7837, "step": 18135 }, { "epoch": 0.58, "learning_rate": 1.998422002156929e-05, "loss": 0.7945, "step": 18140 }, { "epoch": 0.58, "learning_rate": 1.9984157232335926e-05, "loss": 0.7823, "step": 18145 }, { "epoch": 0.58, "learning_rate": 1.9984094318528943e-05, "loss": 0.7739, "step": 18150 }, { "epoch": 0.58, "learning_rate": 1.9984031280149122e-05, "loss": 0.784, "step": 18155 }, { "epoch": 0.58, "learning_rate": 1.9983968117197247e-05, "loss": 0.7687, "step": 18160 }, { "epoch": 0.58, "learning_rate": 1.9983904829674113e-05, "loss": 0.7749, "step": 18165 }, { "epoch": 0.58, "learning_rate": 1.99838414175805e-05, "loss": 0.7871, "step": 18170 }, { "epoch": 0.58, "learning_rate": 1.998377788091721e-05, "loss": 0.785, "step": 18175 }, { "epoch": 0.58, "learning_rate": 1.9983714219685027e-05, "loss": 0.7903, "step": 18180 }, { "epoch": 0.58, "learning_rate": 1.998365043388475e-05, "loss": 0.7881, "step": 18185 }, { "epoch": 0.58, "learning_rate": 1.9983586523517175e-05, "loss": 0.7811, "step": 18190 }, { "epoch": 0.58, "learning_rate": 1.9983522488583095e-05, "loss": 0.7674, "step": 18195 }, { "epoch": 0.58, "learning_rate": 1.9983458329083313e-05, "loss": 0.7784, "step": 18200 }, { "epoch": 0.58, "learning_rate": 1.9983394045018628e-05, "loss": 0.7572, "step": 18205 }, { "epoch": 0.58, "learning_rate": 1.9983329636389844e-05, "loss": 0.772, "step": 18210 }, { "epoch": 0.58, "learning_rate": 1.9983265103197764e-05, "loss": 0.7824, "step": 18215 }, { "epoch": 0.58, "learning_rate": 1.998320044544319e-05, "loss": 0.7781, "step": 18220 }, { "epoch": 0.58, "learning_rate": 1.9983135663126937e-05, "loss": 0.7825, "step": 18225 }, { "epoch": 0.58, "learning_rate": 1.9983070756249802e-05, "loss": 0.7669, "step": 18230 }, { "epoch": 0.58, "learning_rate": 1.99830057248126e-05, "loss": 0.7682, "step": 18235 }, { "epoch": 0.58, "learning_rate": 1.9982940568816147e-05, "loss": 0.7862, "step": 18240 }, { "epoch": 0.58, "learning_rate": 1.9982875288261246e-05, "loss": 0.7574, "step": 18245 }, { "epoch": 0.58, "learning_rate": 1.998280988314872e-05, "loss": 0.7726, "step": 18250 }, { "epoch": 0.58, "learning_rate": 1.9982744353479383e-05, "loss": 0.7774, "step": 18255 }, { "epoch": 0.58, "learning_rate": 1.9982678699254054e-05, "loss": 0.7779, "step": 18260 }, { "epoch": 0.58, "learning_rate": 1.9982612920473547e-05, "loss": 0.7687, "step": 18265 }, { "epoch": 0.58, "learning_rate": 1.9982547017138688e-05, "loss": 0.7738, "step": 18270 }, { "epoch": 0.58, "learning_rate": 1.9982480989250293e-05, "loss": 0.7755, "step": 18275 }, { "epoch": 0.58, "learning_rate": 1.998241483680919e-05, "loss": 0.7638, "step": 18280 }, { "epoch": 0.59, "learning_rate": 1.998234855981621e-05, "loss": 0.7847, "step": 18285 }, { "epoch": 0.59, "learning_rate": 1.9982282158272173e-05, "loss": 0.7699, "step": 18290 }, { "epoch": 0.59, "learning_rate": 1.9982215632177905e-05, "loss": 0.7734, "step": 18295 }, { "epoch": 0.59, "learning_rate": 1.998214898153424e-05, "loss": 0.7749, "step": 18300 }, { "epoch": 0.59, "learning_rate": 1.9982082206342014e-05, "loss": 0.771, "step": 18305 }, { "epoch": 0.59, "learning_rate": 1.998201530660205e-05, "loss": 0.784, "step": 18310 }, { "epoch": 0.59, "learning_rate": 1.9981948282315194e-05, "loss": 0.7818, "step": 18315 }, { "epoch": 0.59, "learning_rate": 1.9981881133482273e-05, "loss": 0.7738, "step": 18320 }, { "epoch": 0.59, "learning_rate": 1.998181386010413e-05, "loss": 0.773, "step": 18325 }, { "epoch": 0.59, "learning_rate": 1.99817464621816e-05, "loss": 0.7871, "step": 18330 }, { "epoch": 0.59, "learning_rate": 1.9981678939715528e-05, "loss": 0.7758, "step": 18335 }, { "epoch": 0.59, "learning_rate": 1.998161129270676e-05, "loss": 0.7792, "step": 18340 }, { "epoch": 0.59, "learning_rate": 1.998154352115613e-05, "loss": 0.7832, "step": 18345 }, { "epoch": 0.59, "learning_rate": 1.998147562506449e-05, "loss": 0.7741, "step": 18350 }, { "epoch": 0.59, "learning_rate": 1.9981407604432686e-05, "loss": 0.7716, "step": 18355 }, { "epoch": 0.59, "learning_rate": 1.9981339459261567e-05, "loss": 0.7788, "step": 18360 }, { "epoch": 0.59, "learning_rate": 1.9981271189551983e-05, "loss": 0.776, "step": 18365 }, { "epoch": 0.59, "learning_rate": 1.9981202795304787e-05, "loss": 0.7827, "step": 18370 }, { "epoch": 0.59, "learning_rate": 1.9981134276520828e-05, "loss": 0.7732, "step": 18375 }, { "epoch": 0.59, "learning_rate": 1.9981065633200966e-05, "loss": 0.7686, "step": 18380 }, { "epoch": 0.59, "learning_rate": 1.9980996865346057e-05, "loss": 0.7664, "step": 18385 }, { "epoch": 0.59, "learning_rate": 1.9980927972956952e-05, "loss": 0.7757, "step": 18390 }, { "epoch": 0.59, "learning_rate": 1.9980858956034523e-05, "loss": 0.782, "step": 18395 }, { "epoch": 0.59, "learning_rate": 1.9980789814579622e-05, "loss": 0.7716, "step": 18400 }, { "epoch": 0.59, "learning_rate": 1.998072054859311e-05, "loss": 0.7846, "step": 18405 }, { "epoch": 0.59, "learning_rate": 1.998065115807586e-05, "loss": 0.7947, "step": 18410 }, { "epoch": 0.59, "learning_rate": 1.9980581643028732e-05, "loss": 0.7732, "step": 18415 }, { "epoch": 0.59, "learning_rate": 1.9980512003452593e-05, "loss": 0.7669, "step": 18420 }, { "epoch": 0.59, "learning_rate": 1.9980442239348313e-05, "loss": 0.7637, "step": 18425 }, { "epoch": 0.59, "learning_rate": 1.9980372350716766e-05, "loss": 0.7702, "step": 18430 }, { "epoch": 0.59, "learning_rate": 1.998030233755882e-05, "loss": 0.7664, "step": 18435 }, { "epoch": 0.59, "learning_rate": 1.9980232199875343e-05, "loss": 0.779, "step": 18440 }, { "epoch": 0.59, "learning_rate": 1.9980161937667223e-05, "loss": 0.7699, "step": 18445 }, { "epoch": 0.59, "learning_rate": 1.998009155093533e-05, "loss": 0.7792, "step": 18450 }, { "epoch": 0.59, "learning_rate": 1.998002103968054e-05, "loss": 0.7805, "step": 18455 }, { "epoch": 0.59, "learning_rate": 1.9979950403903732e-05, "loss": 0.7716, "step": 18460 }, { "epoch": 0.59, "learning_rate": 1.99798796436058e-05, "loss": 0.783, "step": 18465 }, { "epoch": 0.59, "learning_rate": 1.9979808758787608e-05, "loss": 0.7766, "step": 18470 }, { "epoch": 0.59, "learning_rate": 1.997973774945005e-05, "loss": 0.7756, "step": 18475 }, { "epoch": 0.59, "learning_rate": 1.9979666615594017e-05, "loss": 0.7746, "step": 18480 }, { "epoch": 0.59, "learning_rate": 1.9979595357220388e-05, "loss": 0.7724, "step": 18485 }, { "epoch": 0.59, "learning_rate": 1.9979523974330056e-05, "loss": 0.7666, "step": 18490 }, { "epoch": 0.59, "learning_rate": 1.9979452466923913e-05, "loss": 0.782, "step": 18495 }, { "epoch": 0.59, "learning_rate": 1.9979380835002846e-05, "loss": 0.7774, "step": 18500 }, { "epoch": 0.59, "learning_rate": 1.9979309078567756e-05, "loss": 0.7661, "step": 18505 }, { "epoch": 0.59, "learning_rate": 1.997923719761953e-05, "loss": 0.7799, "step": 18510 }, { "epoch": 0.59, "learning_rate": 1.9979165192159068e-05, "loss": 0.7618, "step": 18515 }, { "epoch": 0.59, "learning_rate": 1.9979093062187273e-05, "loss": 0.7753, "step": 18520 }, { "epoch": 0.59, "learning_rate": 1.9979020807705043e-05, "loss": 0.7724, "step": 18525 }, { "epoch": 0.59, "learning_rate": 1.9978948428713276e-05, "loss": 0.7846, "step": 18530 }, { "epoch": 0.59, "learning_rate": 1.9978875925212876e-05, "loss": 0.7761, "step": 18535 }, { "epoch": 0.59, "learning_rate": 1.997880329720475e-05, "loss": 0.7746, "step": 18540 }, { "epoch": 0.59, "learning_rate": 1.9978730544689803e-05, "loss": 0.7699, "step": 18545 }, { "epoch": 0.59, "learning_rate": 1.9978657667668945e-05, "loss": 0.7656, "step": 18550 }, { "epoch": 0.59, "learning_rate": 1.997858466614308e-05, "loss": 0.7729, "step": 18555 }, { "epoch": 0.59, "learning_rate": 1.9978511540113122e-05, "loss": 0.783, "step": 18560 }, { "epoch": 0.59, "learning_rate": 1.9978438289579984e-05, "loss": 0.7778, "step": 18565 }, { "epoch": 0.59, "learning_rate": 1.997836491454458e-05, "loss": 0.7675, "step": 18570 }, { "epoch": 0.59, "learning_rate": 1.997829141500782e-05, "loss": 0.7762, "step": 18575 }, { "epoch": 0.59, "learning_rate": 1.9978217790970633e-05, "loss": 0.7723, "step": 18580 }, { "epoch": 0.59, "learning_rate": 1.9978144042433926e-05, "loss": 0.7802, "step": 18585 }, { "epoch": 0.59, "learning_rate": 1.9978070169398626e-05, "loss": 0.7696, "step": 18590 }, { "epoch": 0.6, "learning_rate": 1.997799617186565e-05, "loss": 0.7659, "step": 18595 }, { "epoch": 0.6, "learning_rate": 1.9977922049835926e-05, "loss": 0.7762, "step": 18600 }, { "epoch": 0.6, "learning_rate": 1.9977847803310376e-05, "loss": 0.777, "step": 18605 }, { "epoch": 0.6, "learning_rate": 1.9977773432289926e-05, "loss": 0.7876, "step": 18610 }, { "epoch": 0.6, "learning_rate": 1.9977698936775503e-05, "loss": 0.7681, "step": 18615 }, { "epoch": 0.6, "learning_rate": 1.997762431676804e-05, "loss": 0.7774, "step": 18620 }, { "epoch": 0.6, "learning_rate": 1.997754957226847e-05, "loss": 0.7636, "step": 18625 }, { "epoch": 0.6, "learning_rate": 1.9977474703277716e-05, "loss": 0.7647, "step": 18630 }, { "epoch": 0.6, "learning_rate": 1.997739970979672e-05, "loss": 0.7675, "step": 18635 }, { "epoch": 0.6, "learning_rate": 1.9977324591826415e-05, "loss": 0.764, "step": 18640 }, { "epoch": 0.6, "learning_rate": 1.997724934936774e-05, "loss": 0.7801, "step": 18645 }, { "epoch": 0.6, "learning_rate": 1.997717398242163e-05, "loss": 0.7612, "step": 18650 }, { "epoch": 0.6, "learning_rate": 1.9977098490989035e-05, "loss": 0.7747, "step": 18655 }, { "epoch": 0.6, "learning_rate": 1.9977022875070885e-05, "loss": 0.7594, "step": 18660 }, { "epoch": 0.6, "learning_rate": 1.997694713466813e-05, "loss": 0.7751, "step": 18665 }, { "epoch": 0.6, "learning_rate": 1.9976871269781714e-05, "loss": 0.7744, "step": 18670 }, { "epoch": 0.6, "learning_rate": 1.997679528041258e-05, "loss": 0.7688, "step": 18675 }, { "epoch": 0.6, "learning_rate": 1.997671916656168e-05, "loss": 0.7768, "step": 18680 }, { "epoch": 0.6, "learning_rate": 1.9976642928229965e-05, "loss": 0.7793, "step": 18685 }, { "epoch": 0.6, "learning_rate": 1.9976566565418383e-05, "loss": 0.7845, "step": 18690 }, { "epoch": 0.6, "learning_rate": 1.997649007812789e-05, "loss": 0.7827, "step": 18695 }, { "epoch": 0.6, "learning_rate": 1.9976413466359437e-05, "loss": 0.7606, "step": 18700 }, { "epoch": 0.6, "learning_rate": 1.997633673011398e-05, "loss": 0.7717, "step": 18705 }, { "epoch": 0.6, "learning_rate": 1.997625986939248e-05, "loss": 0.7697, "step": 18710 }, { "epoch": 0.6, "learning_rate": 1.9976182884195892e-05, "loss": 0.7663, "step": 18715 }, { "epoch": 0.6, "learning_rate": 1.997610577452518e-05, "loss": 0.7781, "step": 18720 }, { "epoch": 0.6, "learning_rate": 1.9976028540381304e-05, "loss": 0.7785, "step": 18725 }, { "epoch": 0.6, "learning_rate": 1.9975951181765226e-05, "loss": 0.7779, "step": 18730 }, { "epoch": 0.6, "learning_rate": 1.9975873698677914e-05, "loss": 0.7792, "step": 18735 }, { "epoch": 0.6, "learning_rate": 1.9975796091120333e-05, "loss": 0.7655, "step": 18740 }, { "epoch": 0.6, "learning_rate": 1.9975718359093453e-05, "loss": 0.7638, "step": 18745 }, { "epoch": 0.6, "learning_rate": 1.9975640502598243e-05, "loss": 0.7833, "step": 18750 }, { "epoch": 0.6, "learning_rate": 1.9975562521635678e-05, "loss": 0.7668, "step": 18755 }, { "epoch": 0.6, "learning_rate": 1.9975484416206723e-05, "loss": 0.7619, "step": 18760 }, { "epoch": 0.6, "learning_rate": 1.997540618631236e-05, "loss": 0.7721, "step": 18765 }, { "epoch": 0.6, "learning_rate": 1.997532783195356e-05, "loss": 0.762, "step": 18770 }, { "epoch": 0.6, "learning_rate": 1.9975249353131304e-05, "loss": 0.7724, "step": 18775 }, { "epoch": 0.6, "learning_rate": 1.997517074984657e-05, "loss": 0.7809, "step": 18780 }, { "epoch": 0.6, "learning_rate": 1.997509202210034e-05, "loss": 0.7667, "step": 18785 }, { "epoch": 0.6, "learning_rate": 1.9975013169893593e-05, "loss": 0.7661, "step": 18790 }, { "epoch": 0.6, "learning_rate": 1.9974934193227315e-05, "loss": 0.778, "step": 18795 }, { "epoch": 0.6, "learning_rate": 1.997485509210249e-05, "loss": 0.7694, "step": 18800 }, { "epoch": 0.6, "learning_rate": 1.997477586652011e-05, "loss": 0.7692, "step": 18805 }, { "epoch": 0.6, "learning_rate": 1.9974696516481158e-05, "loss": 0.7676, "step": 18810 }, { "epoch": 0.6, "learning_rate": 1.9974617041986627e-05, "loss": 0.7791, "step": 18815 }, { "epoch": 0.6, "learning_rate": 1.9974537443037504e-05, "loss": 0.7748, "step": 18820 }, { "epoch": 0.6, "learning_rate": 1.997445771963479e-05, "loss": 0.7713, "step": 18825 }, { "epoch": 0.6, "learning_rate": 1.9974377871779472e-05, "loss": 0.7651, "step": 18830 }, { "epoch": 0.6, "learning_rate": 1.997429789947255e-05, "loss": 0.7716, "step": 18835 }, { "epoch": 0.6, "learning_rate": 1.9974217802715024e-05, "loss": 0.7727, "step": 18840 }, { "epoch": 0.6, "learning_rate": 1.997413758150789e-05, "loss": 0.7516, "step": 18845 }, { "epoch": 0.6, "learning_rate": 1.9974057235852148e-05, "loss": 0.7719, "step": 18850 }, { "epoch": 0.6, "learning_rate": 1.9973976765748803e-05, "loss": 0.7647, "step": 18855 }, { "epoch": 0.6, "learning_rate": 1.9973896171198858e-05, "loss": 0.764, "step": 18860 }, { "epoch": 0.6, "learning_rate": 1.9973815452203314e-05, "loss": 0.767, "step": 18865 }, { "epoch": 0.6, "learning_rate": 1.997373460876319e-05, "loss": 0.7818, "step": 18870 }, { "epoch": 0.6, "learning_rate": 1.9973653640879486e-05, "loss": 0.7703, "step": 18875 }, { "epoch": 0.6, "learning_rate": 1.9973572548553215e-05, "loss": 0.7616, "step": 18880 }, { "epoch": 0.6, "learning_rate": 1.9973491331785384e-05, "loss": 0.7724, "step": 18885 }, { "epoch": 0.6, "learning_rate": 1.9973409990577014e-05, "loss": 0.7678, "step": 18890 }, { "epoch": 0.6, "learning_rate": 1.9973328524929113e-05, "loss": 0.7691, "step": 18895 }, { "epoch": 0.6, "learning_rate": 1.99732469348427e-05, "loss": 0.7775, "step": 18900 }, { "epoch": 0.6, "learning_rate": 1.9973165220318797e-05, "loss": 0.7597, "step": 18905 }, { "epoch": 0.61, "learning_rate": 1.997308338135842e-05, "loss": 0.7806, "step": 18910 }, { "epoch": 0.61, "learning_rate": 1.9973001417962586e-05, "loss": 0.7739, "step": 18915 }, { "epoch": 0.61, "learning_rate": 1.9972919330132326e-05, "loss": 0.7714, "step": 18920 }, { "epoch": 0.61, "learning_rate": 1.9972837117868657e-05, "loss": 0.7745, "step": 18925 }, { "epoch": 0.61, "learning_rate": 1.997275478117261e-05, "loss": 0.7742, "step": 18930 }, { "epoch": 0.61, "learning_rate": 1.997267232004521e-05, "loss": 0.7666, "step": 18935 }, { "epoch": 0.61, "learning_rate": 1.9972589734487485e-05, "loss": 0.794, "step": 18940 }, { "epoch": 0.61, "learning_rate": 1.9972507024500463e-05, "loss": 0.7598, "step": 18945 }, { "epoch": 0.61, "learning_rate": 1.9972424190085186e-05, "loss": 0.7586, "step": 18950 }, { "epoch": 0.61, "learning_rate": 1.9972341231242675e-05, "loss": 0.7678, "step": 18955 }, { "epoch": 0.61, "learning_rate": 1.9972258147973976e-05, "loss": 0.7576, "step": 18960 }, { "epoch": 0.61, "learning_rate": 1.9972174940280118e-05, "loss": 0.7733, "step": 18965 }, { "epoch": 0.61, "learning_rate": 1.997209160816214e-05, "loss": 0.7643, "step": 18970 }, { "epoch": 0.61, "learning_rate": 1.9972008151621086e-05, "loss": 0.7718, "step": 18975 }, { "epoch": 0.61, "learning_rate": 1.9971924570657996e-05, "loss": 0.7775, "step": 18980 }, { "epoch": 0.61, "learning_rate": 1.997184086527391e-05, "loss": 0.7647, "step": 18985 }, { "epoch": 0.61, "learning_rate": 1.9971757035469874e-05, "loss": 0.7547, "step": 18990 }, { "epoch": 0.61, "learning_rate": 1.9971673081246936e-05, "loss": 0.7677, "step": 18995 }, { "epoch": 0.61, "learning_rate": 1.997158900260614e-05, "loss": 0.7569, "step": 19000 }, { "epoch": 0.61, "learning_rate": 1.997150479954854e-05, "loss": 0.7683, "step": 19005 }, { "epoch": 0.61, "learning_rate": 1.997142047207518e-05, "loss": 0.7662, "step": 19010 }, { "epoch": 0.61, "learning_rate": 1.9971336020187114e-05, "loss": 0.7727, "step": 19015 }, { "epoch": 0.61, "learning_rate": 1.99712514438854e-05, "loss": 0.7742, "step": 19020 }, { "epoch": 0.61, "learning_rate": 1.997116674317109e-05, "loss": 0.7698, "step": 19025 }, { "epoch": 0.61, "learning_rate": 1.997108191804524e-05, "loss": 0.7806, "step": 19030 }, { "epoch": 0.61, "learning_rate": 1.9970996968508908e-05, "loss": 0.7785, "step": 19035 }, { "epoch": 0.61, "learning_rate": 1.997091189456316e-05, "loss": 0.7665, "step": 19040 }, { "epoch": 0.61, "learning_rate": 1.997082669620905e-05, "loss": 0.7701, "step": 19045 }, { "epoch": 0.61, "learning_rate": 1.9970741373447645e-05, "loss": 0.7717, "step": 19050 }, { "epoch": 0.61, "learning_rate": 1.997065592628001e-05, "loss": 0.7688, "step": 19055 }, { "epoch": 0.61, "learning_rate": 1.997057035470721e-05, "loss": 0.7412, "step": 19060 }, { "epoch": 0.61, "learning_rate": 1.997048465873031e-05, "loss": 0.7745, "step": 19065 }, { "epoch": 0.61, "learning_rate": 1.997039883835038e-05, "loss": 0.7613, "step": 19070 }, { "epoch": 0.61, "learning_rate": 1.9970312893568497e-05, "loss": 0.7666, "step": 19075 }, { "epoch": 0.61, "learning_rate": 1.9970226824385728e-05, "loss": 0.7644, "step": 19080 }, { "epoch": 0.61, "learning_rate": 1.9970140630803145e-05, "loss": 0.762, "step": 19085 }, { "epoch": 0.61, "learning_rate": 1.997005431282183e-05, "loss": 0.7598, "step": 19090 }, { "epoch": 0.61, "learning_rate": 1.996996787044285e-05, "loss": 0.7699, "step": 19095 }, { "epoch": 0.61, "learning_rate": 1.9969881303667296e-05, "loss": 0.7787, "step": 19100 }, { "epoch": 0.61, "learning_rate": 1.996979461249624e-05, "loss": 0.778, "step": 19105 }, { "epoch": 0.61, "learning_rate": 1.9969707796930768e-05, "loss": 0.7649, "step": 19110 }, { "epoch": 0.61, "learning_rate": 1.9969620856971955e-05, "loss": 0.7654, "step": 19115 }, { "epoch": 0.61, "learning_rate": 1.9969533792620895e-05, "loss": 0.7714, "step": 19120 }, { "epoch": 0.61, "learning_rate": 1.9969446603878673e-05, "loss": 0.7586, "step": 19125 }, { "epoch": 0.61, "learning_rate": 1.996935929074637e-05, "loss": 0.7638, "step": 19130 }, { "epoch": 0.61, "learning_rate": 1.9969271853225083e-05, "loss": 0.76, "step": 19135 }, { "epoch": 0.61, "learning_rate": 1.99691842913159e-05, "loss": 0.7905, "step": 19140 }, { "epoch": 0.61, "learning_rate": 1.996909660501991e-05, "loss": 0.7799, "step": 19145 }, { "epoch": 0.61, "learning_rate": 1.9969008794338214e-05, "loss": 0.7528, "step": 19150 }, { "epoch": 0.61, "learning_rate": 1.9968920859271905e-05, "loss": 0.7562, "step": 19155 }, { "epoch": 0.61, "learning_rate": 1.9968832799822077e-05, "loss": 0.7776, "step": 19160 }, { "epoch": 0.61, "learning_rate": 1.996874461598983e-05, "loss": 0.7703, "step": 19165 }, { "epoch": 0.61, "learning_rate": 1.996865630777627e-05, "loss": 0.7593, "step": 19170 }, { "epoch": 0.61, "learning_rate": 1.9968567875182492e-05, "loss": 0.7627, "step": 19175 }, { "epoch": 0.61, "learning_rate": 1.9968479318209603e-05, "loss": 0.7513, "step": 19180 }, { "epoch": 0.61, "learning_rate": 1.9968390636858706e-05, "loss": 0.7595, "step": 19185 }, { "epoch": 0.61, "learning_rate": 1.9968301831130906e-05, "loss": 0.7761, "step": 19190 }, { "epoch": 0.61, "learning_rate": 1.9968212901027316e-05, "loss": 0.7635, "step": 19195 }, { "epoch": 0.61, "learning_rate": 1.996812384654904e-05, "loss": 0.7626, "step": 19200 }, { "epoch": 0.61, "learning_rate": 1.9968034667697193e-05, "loss": 0.7652, "step": 19205 }, { "epoch": 0.61, "learning_rate": 1.9967945364472885e-05, "loss": 0.7585, "step": 19210 }, { "epoch": 0.61, "learning_rate": 1.9967855936877237e-05, "loss": 0.7631, "step": 19215 }, { "epoch": 0.62, "learning_rate": 1.9967766384911357e-05, "loss": 0.7661, "step": 19220 }, { "epoch": 0.62, "learning_rate": 1.9967676708576362e-05, "loss": 0.7701, "step": 19225 }, { "epoch": 0.62, "learning_rate": 1.9967586907873376e-05, "loss": 0.7597, "step": 19230 }, { "epoch": 0.62, "learning_rate": 1.9967496982803517e-05, "loss": 0.7587, "step": 19235 }, { "epoch": 0.62, "learning_rate": 1.9967406933367906e-05, "loss": 0.7568, "step": 19240 }, { "epoch": 0.62, "learning_rate": 1.9967316759567673e-05, "loss": 0.781, "step": 19245 }, { "epoch": 0.62, "learning_rate": 1.9967226461403934e-05, "loss": 0.759, "step": 19250 }, { "epoch": 0.62, "learning_rate": 1.996713603887782e-05, "loss": 0.776, "step": 19255 }, { "epoch": 0.62, "learning_rate": 1.996704549199046e-05, "loss": 0.7502, "step": 19260 }, { "epoch": 0.62, "learning_rate": 1.996695482074298e-05, "loss": 0.7634, "step": 19265 }, { "epoch": 0.62, "learning_rate": 1.9966864025136518e-05, "loss": 0.7659, "step": 19270 }, { "epoch": 0.62, "learning_rate": 1.99667731051722e-05, "loss": 0.7609, "step": 19275 }, { "epoch": 0.62, "learning_rate": 1.9966682060851163e-05, "loss": 0.7731, "step": 19280 }, { "epoch": 0.62, "learning_rate": 1.9966590892174544e-05, "loss": 0.7647, "step": 19285 }, { "epoch": 0.62, "learning_rate": 1.996649959914348e-05, "loss": 0.7616, "step": 19290 }, { "epoch": 0.62, "learning_rate": 1.996640818175911e-05, "loss": 0.76, "step": 19295 }, { "epoch": 0.62, "learning_rate": 1.9966316640022577e-05, "loss": 0.7579, "step": 19300 }, { "epoch": 0.62, "learning_rate": 1.9966224973935014e-05, "loss": 0.7702, "step": 19305 }, { "epoch": 0.62, "learning_rate": 1.9966133183497578e-05, "loss": 0.7618, "step": 19310 }, { "epoch": 0.62, "learning_rate": 1.9966041268711404e-05, "loss": 0.7619, "step": 19315 }, { "epoch": 0.62, "learning_rate": 1.996594922957764e-05, "loss": 0.7632, "step": 19320 }, { "epoch": 0.62, "learning_rate": 1.9965857066097444e-05, "loss": 0.761, "step": 19325 }, { "epoch": 0.62, "learning_rate": 1.9965764778271954e-05, "loss": 0.751, "step": 19330 }, { "epoch": 0.62, "learning_rate": 1.9965672366102325e-05, "loss": 0.7748, "step": 19335 }, { "epoch": 0.62, "learning_rate": 1.9965579829589713e-05, "loss": 0.7642, "step": 19340 }, { "epoch": 0.62, "learning_rate": 1.9965487168735273e-05, "loss": 0.7597, "step": 19345 }, { "epoch": 0.62, "learning_rate": 1.9965394383540158e-05, "loss": 0.7553, "step": 19350 }, { "epoch": 0.62, "learning_rate": 1.996530147400553e-05, "loss": 0.7664, "step": 19355 }, { "epoch": 0.62, "learning_rate": 1.9965208440132538e-05, "loss": 0.764, "step": 19360 }, { "epoch": 0.62, "learning_rate": 1.9965115281922354e-05, "loss": 0.7648, "step": 19365 }, { "epoch": 0.62, "learning_rate": 1.9965021999376133e-05, "loss": 0.7651, "step": 19370 }, { "epoch": 0.62, "learning_rate": 1.9964928592495046e-05, "loss": 0.764, "step": 19375 }, { "epoch": 0.62, "learning_rate": 1.9964835061280253e-05, "loss": 0.7552, "step": 19380 }, { "epoch": 0.62, "learning_rate": 1.996474140573292e-05, "loss": 0.758, "step": 19385 }, { "epoch": 0.62, "learning_rate": 1.996464762585422e-05, "loss": 0.764, "step": 19390 }, { "epoch": 0.62, "learning_rate": 1.9964553721645322e-05, "loss": 0.7608, "step": 19395 }, { "epoch": 0.62, "learning_rate": 1.9964459693107396e-05, "loss": 0.7669, "step": 19400 }, { "epoch": 0.62, "learning_rate": 1.9964365540241614e-05, "loss": 0.7527, "step": 19405 }, { "epoch": 0.62, "learning_rate": 1.9964271263049157e-05, "loss": 0.7619, "step": 19410 }, { "epoch": 0.62, "learning_rate": 1.9964176861531196e-05, "loss": 0.7653, "step": 19415 }, { "epoch": 0.62, "learning_rate": 1.996408233568891e-05, "loss": 0.7707, "step": 19420 }, { "epoch": 0.62, "learning_rate": 1.9963987685523475e-05, "loss": 0.7721, "step": 19425 }, { "epoch": 0.62, "learning_rate": 1.9963892911036077e-05, "loss": 0.7563, "step": 19430 }, { "epoch": 0.62, "learning_rate": 1.9963798012227898e-05, "loss": 0.7595, "step": 19435 }, { "epoch": 0.62, "learning_rate": 1.996370298910012e-05, "loss": 0.7696, "step": 19440 }, { "epoch": 0.62, "learning_rate": 1.9963607841653928e-05, "loss": 0.7586, "step": 19445 }, { "epoch": 0.62, "learning_rate": 1.9963512569890512e-05, "loss": 0.7654, "step": 19450 }, { "epoch": 0.62, "learning_rate": 1.996341717381106e-05, "loss": 0.7665, "step": 19455 }, { "epoch": 0.62, "learning_rate": 1.9963321653416764e-05, "loss": 0.7559, "step": 19460 }, { "epoch": 0.62, "learning_rate": 1.996322600870881e-05, "loss": 0.758, "step": 19465 }, { "epoch": 0.62, "learning_rate": 1.9963130239688397e-05, "loss": 0.7677, "step": 19470 }, { "epoch": 0.62, "learning_rate": 1.9963034346356714e-05, "loss": 0.7574, "step": 19475 }, { "epoch": 0.62, "learning_rate": 1.9962938328714966e-05, "loss": 0.7735, "step": 19480 }, { "epoch": 0.62, "learning_rate": 1.996284218676434e-05, "loss": 0.7566, "step": 19485 }, { "epoch": 0.62, "learning_rate": 1.996274592050605e-05, "loss": 0.7588, "step": 19490 }, { "epoch": 0.62, "learning_rate": 1.9962649529941283e-05, "loss": 0.7699, "step": 19495 }, { "epoch": 0.62, "learning_rate": 1.996255301507125e-05, "loss": 0.7653, "step": 19500 }, { "epoch": 0.62, "learning_rate": 1.996245637589715e-05, "loss": 0.7713, "step": 19505 }, { "epoch": 0.62, "learning_rate": 1.9962359612420195e-05, "loss": 0.7727, "step": 19510 }, { "epoch": 0.62, "learning_rate": 1.9962262724641585e-05, "loss": 0.7612, "step": 19515 }, { "epoch": 0.62, "learning_rate": 1.9962165712562538e-05, "loss": 0.7773, "step": 19520 }, { "epoch": 0.62, "learning_rate": 1.9962068576184258e-05, "loss": 0.7574, "step": 19525 }, { "epoch": 0.62, "learning_rate": 1.9961971315507955e-05, "loss": 0.7599, "step": 19530 }, { "epoch": 0.63, "learning_rate": 1.996187393053485e-05, "loss": 0.7653, "step": 19535 }, { "epoch": 0.63, "learning_rate": 1.996177642126615e-05, "loss": 0.7613, "step": 19540 }, { "epoch": 0.63, "learning_rate": 1.996167878770308e-05, "loss": 0.7711, "step": 19545 }, { "epoch": 0.63, "learning_rate": 1.996158102984685e-05, "loss": 0.741, "step": 19550 }, { "epoch": 0.63, "learning_rate": 1.9961483147698682e-05, "loss": 0.7531, "step": 19555 }, { "epoch": 0.63, "learning_rate": 1.9961385141259804e-05, "loss": 0.7742, "step": 19560 }, { "epoch": 0.63, "learning_rate": 1.996128701053143e-05, "loss": 0.7611, "step": 19565 }, { "epoch": 0.63, "learning_rate": 1.996118875551479e-05, "loss": 0.7453, "step": 19570 }, { "epoch": 0.63, "learning_rate": 1.9961090376211107e-05, "loss": 0.7636, "step": 19575 }, { "epoch": 0.63, "learning_rate": 1.9960991872621605e-05, "loss": 0.7659, "step": 19580 }, { "epoch": 0.63, "learning_rate": 1.9960893244747525e-05, "loss": 0.7558, "step": 19585 }, { "epoch": 0.63, "learning_rate": 1.9960794492590087e-05, "loss": 0.7626, "step": 19590 }, { "epoch": 0.63, "learning_rate": 1.9960695616150526e-05, "loss": 0.761, "step": 19595 }, { "epoch": 0.63, "learning_rate": 1.9960596615430076e-05, "loss": 0.7618, "step": 19600 }, { "epoch": 0.63, "learning_rate": 1.9960497490429967e-05, "loss": 0.7638, "step": 19605 }, { "epoch": 0.63, "learning_rate": 1.996039824115145e-05, "loss": 0.7757, "step": 19610 }, { "epoch": 0.63, "learning_rate": 1.996029886759575e-05, "loss": 0.7667, "step": 19615 }, { "epoch": 0.63, "learning_rate": 1.9960199369764108e-05, "loss": 0.7751, "step": 19620 }, { "epoch": 0.63, "learning_rate": 1.9960099747657774e-05, "loss": 0.7624, "step": 19625 }, { "epoch": 0.63, "learning_rate": 1.9960000001277985e-05, "loss": 0.767, "step": 19630 }, { "epoch": 0.63, "learning_rate": 1.995990013062598e-05, "loss": 0.7533, "step": 19635 }, { "epoch": 0.63, "learning_rate": 1.9959800135703018e-05, "loss": 0.7736, "step": 19640 }, { "epoch": 0.63, "learning_rate": 1.9959700016510337e-05, "loss": 0.7558, "step": 19645 }, { "epoch": 0.63, "learning_rate": 1.9959599773049188e-05, "loss": 0.781, "step": 19650 }, { "epoch": 0.63, "learning_rate": 1.9959499405320825e-05, "loss": 0.7573, "step": 19655 }, { "epoch": 0.63, "learning_rate": 1.99593989133265e-05, "loss": 0.7641, "step": 19660 }, { "epoch": 0.63, "learning_rate": 1.9959298297067463e-05, "loss": 0.7696, "step": 19665 }, { "epoch": 0.63, "learning_rate": 1.9959197556544972e-05, "loss": 0.7607, "step": 19670 }, { "epoch": 0.63, "learning_rate": 1.9959096691760284e-05, "loss": 0.7722, "step": 19675 }, { "epoch": 0.63, "learning_rate": 1.9958995702714653e-05, "loss": 0.7746, "step": 19680 }, { "epoch": 0.63, "learning_rate": 1.9958894589409343e-05, "loss": 0.771, "step": 19685 }, { "epoch": 0.63, "learning_rate": 1.995879335184562e-05, "loss": 0.7464, "step": 19690 }, { "epoch": 0.63, "learning_rate": 1.995869199002474e-05, "loss": 0.7708, "step": 19695 }, { "epoch": 0.63, "learning_rate": 1.9958590503947973e-05, "loss": 0.7592, "step": 19700 }, { "epoch": 0.63, "learning_rate": 1.9958488893616577e-05, "loss": 0.7622, "step": 19705 }, { "epoch": 0.63, "learning_rate": 1.995838715903183e-05, "loss": 0.7576, "step": 19710 }, { "epoch": 0.63, "learning_rate": 1.9958285300194996e-05, "loss": 0.7676, "step": 19715 }, { "epoch": 0.63, "learning_rate": 1.9958183317107345e-05, "loss": 0.7792, "step": 19720 }, { "epoch": 0.63, "learning_rate": 1.9958081209770155e-05, "loss": 0.7621, "step": 19725 }, { "epoch": 0.63, "learning_rate": 1.995797897818469e-05, "loss": 0.7542, "step": 19730 }, { "epoch": 0.63, "learning_rate": 1.9957876622352235e-05, "loss": 0.7638, "step": 19735 }, { "epoch": 0.63, "learning_rate": 1.9957774142274067e-05, "loss": 0.7735, "step": 19740 }, { "epoch": 0.63, "learning_rate": 1.995767153795146e-05, "loss": 0.7545, "step": 19745 }, { "epoch": 0.63, "learning_rate": 1.9957568809385693e-05, "loss": 0.7682, "step": 19750 }, { "epoch": 0.63, "learning_rate": 1.995746595657805e-05, "loss": 0.7553, "step": 19755 }, { "epoch": 0.63, "learning_rate": 1.995736297952982e-05, "loss": 0.7529, "step": 19760 }, { "epoch": 0.63, "learning_rate": 1.9957259878242277e-05, "loss": 0.7565, "step": 19765 }, { "epoch": 0.63, "learning_rate": 1.9957156652716717e-05, "loss": 0.7673, "step": 19770 }, { "epoch": 0.63, "learning_rate": 1.9957053302954422e-05, "loss": 0.7601, "step": 19775 }, { "epoch": 0.63, "learning_rate": 1.995694982895668e-05, "loss": 0.7601, "step": 19780 }, { "epoch": 0.63, "learning_rate": 1.9956846230724793e-05, "loss": 0.7525, "step": 19785 }, { "epoch": 0.63, "learning_rate": 1.995674250826004e-05, "loss": 0.7469, "step": 19790 }, { "epoch": 0.63, "learning_rate": 1.9956638661563725e-05, "loss": 0.7623, "step": 19795 }, { "epoch": 0.63, "learning_rate": 1.9956534690637137e-05, "loss": 0.7706, "step": 19800 }, { "epoch": 0.63, "learning_rate": 1.995643059548158e-05, "loss": 0.7583, "step": 19805 }, { "epoch": 0.63, "learning_rate": 1.9956326376098345e-05, "loss": 0.7609, "step": 19810 }, { "epoch": 0.63, "learning_rate": 1.995622203248874e-05, "loss": 0.7644, "step": 19815 }, { "epoch": 0.63, "learning_rate": 1.9956117564654064e-05, "loss": 0.7574, "step": 19820 }, { "epoch": 0.63, "learning_rate": 1.9956012972595617e-05, "loss": 0.7598, "step": 19825 }, { "epoch": 0.63, "learning_rate": 1.9955908256314706e-05, "loss": 0.7519, "step": 19830 }, { "epoch": 0.63, "learning_rate": 1.995580341581264e-05, "loss": 0.7533, "step": 19835 }, { "epoch": 0.63, "learning_rate": 1.9955698451090727e-05, "loss": 0.7571, "step": 19840 }, { "epoch": 0.64, "learning_rate": 1.995559336215027e-05, "loss": 0.7532, "step": 19845 }, { "epoch": 0.64, "learning_rate": 1.9955488148992593e-05, "loss": 0.7702, "step": 19850 }, { "epoch": 0.64, "learning_rate": 1.9955382811618994e-05, "loss": 0.7661, "step": 19855 }, { "epoch": 0.64, "learning_rate": 1.99552773500308e-05, "loss": 0.7627, "step": 19860 }, { "epoch": 0.64, "learning_rate": 1.9955171764229316e-05, "loss": 0.7629, "step": 19865 }, { "epoch": 0.64, "learning_rate": 1.9955066054215867e-05, "loss": 0.7553, "step": 19870 }, { "epoch": 0.64, "learning_rate": 1.995496021999177e-05, "loss": 0.755, "step": 19875 }, { "epoch": 0.64, "learning_rate": 1.9954854261558348e-05, "loss": 0.7572, "step": 19880 }, { "epoch": 0.64, "learning_rate": 1.9954748178916915e-05, "loss": 0.7503, "step": 19885 }, { "epoch": 0.64, "learning_rate": 1.9954641972068806e-05, "loss": 0.764, "step": 19890 }, { "epoch": 0.64, "learning_rate": 1.9954535641015333e-05, "loss": 0.7498, "step": 19895 }, { "epoch": 0.64, "learning_rate": 1.9954429185757835e-05, "loss": 0.7619, "step": 19900 }, { "epoch": 0.64, "learning_rate": 1.9954322606297632e-05, "loss": 0.773, "step": 19905 }, { "epoch": 0.64, "learning_rate": 1.9954215902636056e-05, "loss": 0.766, "step": 19910 }, { "epoch": 0.64, "learning_rate": 1.9954109074774443e-05, "loss": 0.7509, "step": 19915 }, { "epoch": 0.64, "learning_rate": 1.9954002122714116e-05, "loss": 0.7628, "step": 19920 }, { "epoch": 0.64, "learning_rate": 1.995389504645642e-05, "loss": 0.7527, "step": 19925 }, { "epoch": 0.64, "learning_rate": 1.9953787846002687e-05, "loss": 0.7692, "step": 19930 }, { "epoch": 0.64, "learning_rate": 1.995368052135425e-05, "loss": 0.7639, "step": 19935 }, { "epoch": 0.64, "learning_rate": 1.995357307251246e-05, "loss": 0.7639, "step": 19940 }, { "epoch": 0.64, "learning_rate": 1.995346549947864e-05, "loss": 0.7587, "step": 19945 }, { "epoch": 0.64, "learning_rate": 1.9953357802254147e-05, "loss": 0.7507, "step": 19950 }, { "epoch": 0.64, "learning_rate": 1.9953249980840322e-05, "loss": 0.7694, "step": 19955 }, { "epoch": 0.64, "learning_rate": 1.9953142035238504e-05, "loss": 0.7696, "step": 19960 }, { "epoch": 0.64, "learning_rate": 1.9953033965450044e-05, "loss": 0.7663, "step": 19965 }, { "epoch": 0.64, "learning_rate": 1.995292577147629e-05, "loss": 0.7558, "step": 19970 }, { "epoch": 0.64, "learning_rate": 1.9952817453318592e-05, "loss": 0.7504, "step": 19975 }, { "epoch": 0.64, "learning_rate": 1.9952709010978307e-05, "loss": 0.7558, "step": 19980 }, { "epoch": 0.64, "learning_rate": 1.995260044445678e-05, "loss": 0.7484, "step": 19985 }, { "epoch": 0.64, "learning_rate": 1.9952491753755366e-05, "loss": 0.7685, "step": 19990 }, { "epoch": 0.64, "learning_rate": 1.9952382938875425e-05, "loss": 0.7633, "step": 19995 }, { "epoch": 0.64, "learning_rate": 1.9952273999818312e-05, "loss": 0.7555, "step": 20000 }, { "epoch": 0.64, "learning_rate": 1.995216493658539e-05, "loss": 0.7522, "step": 20005 }, { "epoch": 0.64, "learning_rate": 1.9952055749178018e-05, "loss": 0.7594, "step": 20010 }, { "epoch": 0.64, "learning_rate": 1.9951946437597553e-05, "loss": 0.7537, "step": 20015 }, { "epoch": 0.64, "learning_rate": 1.9951837001845365e-05, "loss": 0.7442, "step": 20020 }, { "epoch": 0.64, "learning_rate": 1.9951727441922823e-05, "loss": 0.754, "step": 20025 }, { "epoch": 0.64, "learning_rate": 1.9951617757831285e-05, "loss": 0.7598, "step": 20030 }, { "epoch": 0.64, "learning_rate": 1.995150794957212e-05, "loss": 0.751, "step": 20035 }, { "epoch": 0.64, "learning_rate": 1.9951398017146706e-05, "loss": 0.7587, "step": 20040 }, { "epoch": 0.64, "learning_rate": 1.995128796055641e-05, "loss": 0.7514, "step": 20045 }, { "epoch": 0.64, "learning_rate": 1.9951177779802604e-05, "loss": 0.7731, "step": 20050 }, { "epoch": 0.64, "learning_rate": 1.9951067474886666e-05, "loss": 0.7627, "step": 20055 }, { "epoch": 0.64, "learning_rate": 1.995095704580997e-05, "loss": 0.758, "step": 20060 }, { "epoch": 0.64, "learning_rate": 1.9950846492573892e-05, "loss": 0.7678, "step": 20065 }, { "epoch": 0.64, "learning_rate": 1.9950735815179817e-05, "loss": 0.7498, "step": 20070 }, { "epoch": 0.64, "learning_rate": 1.995062501362912e-05, "loss": 0.7654, "step": 20075 }, { "epoch": 0.64, "learning_rate": 1.9950514087923185e-05, "loss": 0.7546, "step": 20080 }, { "epoch": 0.64, "learning_rate": 1.99504030380634e-05, "loss": 0.7527, "step": 20085 }, { "epoch": 0.64, "learning_rate": 1.9950291864051147e-05, "loss": 0.7616, "step": 20090 }, { "epoch": 0.64, "learning_rate": 1.9950180565887814e-05, "loss": 0.7514, "step": 20095 }, { "epoch": 0.64, "learning_rate": 1.9950069143574787e-05, "loss": 0.7529, "step": 20100 }, { "epoch": 0.64, "learning_rate": 1.9949957597113463e-05, "loss": 0.7537, "step": 20105 }, { "epoch": 0.64, "learning_rate": 1.9949845926505227e-05, "loss": 0.7503, "step": 20110 }, { "epoch": 0.64, "learning_rate": 1.9949734131751475e-05, "loss": 0.7693, "step": 20115 }, { "epoch": 0.64, "learning_rate": 1.9949622212853603e-05, "loss": 0.7645, "step": 20120 }, { "epoch": 0.64, "learning_rate": 1.9949510169813006e-05, "loss": 0.7689, "step": 20125 }, { "epoch": 0.64, "learning_rate": 1.994939800263108e-05, "loss": 0.7709, "step": 20130 }, { "epoch": 0.64, "learning_rate": 1.9949285711309224e-05, "loss": 0.7488, "step": 20135 }, { "epoch": 0.64, "learning_rate": 1.994917329584885e-05, "loss": 0.7458, "step": 20140 }, { "epoch": 0.64, "learning_rate": 1.9949060756251347e-05, "loss": 0.7625, "step": 20145 }, { "epoch": 0.64, "learning_rate": 1.994894809251812e-05, "loss": 0.7495, "step": 20150 }, { "epoch": 0.64, "learning_rate": 1.994883530465059e-05, "loss": 0.7622, "step": 20155 }, { "epoch": 0.65, "learning_rate": 1.9948722392650147e-05, "loss": 0.7713, "step": 20160 }, { "epoch": 0.65, "learning_rate": 1.9948609356518206e-05, "loss": 0.7567, "step": 20165 }, { "epoch": 0.65, "learning_rate": 1.9948496196256178e-05, "loss": 0.7527, "step": 20170 }, { "epoch": 0.65, "learning_rate": 1.994838291186548e-05, "loss": 0.7649, "step": 20175 }, { "epoch": 0.65, "learning_rate": 1.9948269503347515e-05, "loss": 0.7619, "step": 20180 }, { "epoch": 0.65, "learning_rate": 1.9948155970703705e-05, "loss": 0.7586, "step": 20185 }, { "epoch": 0.65, "learning_rate": 1.9948042313935463e-05, "loss": 0.7546, "step": 20190 }, { "epoch": 0.65, "learning_rate": 1.994792853304421e-05, "loss": 0.7613, "step": 20195 }, { "epoch": 0.65, "learning_rate": 1.9947814628031363e-05, "loss": 0.7662, "step": 20200 }, { "epoch": 0.65, "learning_rate": 1.9947700598898344e-05, "loss": 0.7497, "step": 20205 }, { "epoch": 0.65, "learning_rate": 1.994758644564658e-05, "loss": 0.736, "step": 20210 }, { "epoch": 0.65, "learning_rate": 1.994747216827749e-05, "loss": 0.7649, "step": 20215 }, { "epoch": 0.65, "learning_rate": 1.99473577667925e-05, "loss": 0.7403, "step": 20220 }, { "epoch": 0.65, "learning_rate": 1.994724324119304e-05, "loss": 0.7585, "step": 20225 }, { "epoch": 0.65, "learning_rate": 1.9947128591480536e-05, "loss": 0.7609, "step": 20230 }, { "epoch": 0.65, "learning_rate": 1.9947013817656425e-05, "loss": 0.7493, "step": 20235 }, { "epoch": 0.65, "learning_rate": 1.994689891972213e-05, "loss": 0.7581, "step": 20240 }, { "epoch": 0.65, "learning_rate": 1.994678389767909e-05, "loss": 0.7328, "step": 20245 }, { "epoch": 0.65, "learning_rate": 1.9946668751528745e-05, "loss": 0.754, "step": 20250 }, { "epoch": 0.65, "learning_rate": 1.994655348127252e-05, "loss": 0.7686, "step": 20255 }, { "epoch": 0.65, "learning_rate": 1.9946438086911855e-05, "loss": 0.757, "step": 20260 }, { "epoch": 0.65, "learning_rate": 1.99463225684482e-05, "loss": 0.7637, "step": 20265 }, { "epoch": 0.65, "learning_rate": 1.9946206925882992e-05, "loss": 0.751, "step": 20270 }, { "epoch": 0.65, "learning_rate": 1.9946091159217668e-05, "loss": 0.7393, "step": 20275 }, { "epoch": 0.65, "learning_rate": 1.994597526845368e-05, "loss": 0.7449, "step": 20280 }, { "epoch": 0.65, "learning_rate": 1.994585925359247e-05, "loss": 0.759, "step": 20285 }, { "epoch": 0.65, "learning_rate": 1.994574311463548e-05, "loss": 0.7524, "step": 20290 }, { "epoch": 0.65, "learning_rate": 1.994562685158417e-05, "loss": 0.7746, "step": 20295 }, { "epoch": 0.65, "learning_rate": 1.9945510464439984e-05, "loss": 0.7499, "step": 20300 }, { "epoch": 0.65, "learning_rate": 1.9945393953204378e-05, "loss": 0.753, "step": 20305 }, { "epoch": 0.65, "learning_rate": 1.9945277317878808e-05, "loss": 0.7546, "step": 20310 }, { "epoch": 0.65, "learning_rate": 1.9945160558464717e-05, "loss": 0.7579, "step": 20315 }, { "epoch": 0.65, "learning_rate": 1.9945043674963575e-05, "loss": 0.7449, "step": 20320 }, { "epoch": 0.65, "learning_rate": 1.9944926667376833e-05, "loss": 0.7658, "step": 20325 }, { "epoch": 0.65, "learning_rate": 1.9944809535705954e-05, "loss": 0.7615, "step": 20330 }, { "epoch": 0.65, "learning_rate": 1.9944692279952396e-05, "loss": 0.7602, "step": 20335 }, { "epoch": 0.65, "learning_rate": 1.9944574900117625e-05, "loss": 0.7592, "step": 20340 }, { "epoch": 0.65, "learning_rate": 1.9944457396203108e-05, "loss": 0.7551, "step": 20345 }, { "epoch": 0.65, "learning_rate": 1.994433976821031e-05, "loss": 0.7421, "step": 20350 }, { "epoch": 0.65, "learning_rate": 1.9944222016140692e-05, "loss": 0.757, "step": 20355 }, { "epoch": 0.65, "learning_rate": 1.9944104139995727e-05, "loss": 0.7556, "step": 20360 }, { "epoch": 0.65, "learning_rate": 1.994398613977689e-05, "loss": 0.7651, "step": 20365 }, { "epoch": 0.65, "learning_rate": 1.994386801548565e-05, "loss": 0.7561, "step": 20370 }, { "epoch": 0.65, "learning_rate": 1.994374976712348e-05, "loss": 0.755, "step": 20375 }, { "epoch": 0.65, "learning_rate": 1.994363139469186e-05, "loss": 0.7451, "step": 20380 }, { "epoch": 0.65, "learning_rate": 1.9943512898192263e-05, "loss": 0.7576, "step": 20385 }, { "epoch": 0.65, "learning_rate": 1.994339427762616e-05, "loss": 0.7399, "step": 20390 }, { "epoch": 0.65, "learning_rate": 1.994327553299505e-05, "loss": 0.7573, "step": 20395 }, { "epoch": 0.65, "learning_rate": 1.9943156664300394e-05, "loss": 0.7508, "step": 20400 }, { "epoch": 0.65, "learning_rate": 1.994303767154369e-05, "loss": 0.7579, "step": 20405 }, { "epoch": 0.65, "learning_rate": 1.9942918554726415e-05, "loss": 0.7491, "step": 20410 }, { "epoch": 0.65, "learning_rate": 1.994279931385006e-05, "loss": 0.7433, "step": 20415 }, { "epoch": 0.65, "learning_rate": 1.9942679948916107e-05, "loss": 0.7433, "step": 20420 }, { "epoch": 0.65, "learning_rate": 1.994256045992605e-05, "loss": 0.7557, "step": 20425 }, { "epoch": 0.65, "learning_rate": 1.9942440846881383e-05, "loss": 0.7545, "step": 20430 }, { "epoch": 0.65, "learning_rate": 1.9942321109783586e-05, "loss": 0.7474, "step": 20435 }, { "epoch": 0.65, "learning_rate": 1.9942201248634165e-05, "loss": 0.7594, "step": 20440 }, { "epoch": 0.65, "learning_rate": 1.994208126343461e-05, "loss": 0.753, "step": 20445 }, { "epoch": 0.65, "learning_rate": 1.9941961154186424e-05, "loss": 0.7359, "step": 20450 }, { "epoch": 0.65, "learning_rate": 1.99418409208911e-05, "loss": 0.7487, "step": 20455 }, { "epoch": 0.65, "learning_rate": 1.9941720563550136e-05, "loss": 0.7452, "step": 20460 }, { "epoch": 0.65, "learning_rate": 1.9941600082165037e-05, "loss": 0.7582, "step": 20465 }, { "epoch": 0.66, "learning_rate": 1.994147947673731e-05, "loss": 0.7478, "step": 20470 }, { "epoch": 0.66, "learning_rate": 1.9941358747268455e-05, "loss": 0.7505, "step": 20475 }, { "epoch": 0.66, "learning_rate": 1.9941237893759976e-05, "loss": 0.7588, "step": 20480 }, { "epoch": 0.66, "learning_rate": 1.994111691621339e-05, "loss": 0.7559, "step": 20485 }, { "epoch": 0.66, "learning_rate": 1.9940995814630194e-05, "loss": 0.765, "step": 20490 }, { "epoch": 0.66, "learning_rate": 1.9940874589011912e-05, "loss": 0.7553, "step": 20495 }, { "epoch": 0.66, "learning_rate": 1.9940753239360047e-05, "loss": 0.754, "step": 20500 }, { "epoch": 0.66, "learning_rate": 1.994063176567612e-05, "loss": 0.7531, "step": 20505 }, { "epoch": 0.66, "learning_rate": 1.994051016796164e-05, "loss": 0.754, "step": 20510 }, { "epoch": 0.66, "learning_rate": 1.9940388446218126e-05, "loss": 0.7445, "step": 20515 }, { "epoch": 0.66, "learning_rate": 1.99402666004471e-05, "loss": 0.7673, "step": 20520 }, { "epoch": 0.66, "learning_rate": 1.9940144630650083e-05, "loss": 0.767, "step": 20525 }, { "epoch": 0.66, "learning_rate": 1.994002253682859e-05, "loss": 0.7436, "step": 20530 }, { "epoch": 0.66, "learning_rate": 1.993990031898415e-05, "loss": 0.7479, "step": 20535 }, { "epoch": 0.66, "learning_rate": 1.9939777977118287e-05, "loss": 0.7516, "step": 20540 }, { "epoch": 0.66, "learning_rate": 1.9939655511232527e-05, "loss": 0.7559, "step": 20545 }, { "epoch": 0.66, "learning_rate": 1.9939532921328398e-05, "loss": 0.7493, "step": 20550 }, { "epoch": 0.66, "learning_rate": 1.9939410207407427e-05, "loss": 0.7585, "step": 20555 }, { "epoch": 0.66, "learning_rate": 1.993928736947115e-05, "loss": 0.7563, "step": 20560 }, { "epoch": 0.66, "learning_rate": 1.99391644075211e-05, "loss": 0.7461, "step": 20565 }, { "epoch": 0.66, "learning_rate": 1.99390413215588e-05, "loss": 0.7544, "step": 20570 }, { "epoch": 0.66, "learning_rate": 1.9938918111585805e-05, "loss": 0.7483, "step": 20575 }, { "epoch": 0.66, "learning_rate": 1.9938794777603635e-05, "loss": 0.7547, "step": 20580 }, { "epoch": 0.66, "learning_rate": 1.993867131961384e-05, "loss": 0.7632, "step": 20585 }, { "epoch": 0.66, "learning_rate": 1.993854773761795e-05, "loss": 0.7554, "step": 20590 }, { "epoch": 0.66, "learning_rate": 1.9938424031617515e-05, "loss": 0.7448, "step": 20595 }, { "epoch": 0.66, "learning_rate": 1.9938300201614077e-05, "loss": 0.7525, "step": 20600 }, { "epoch": 0.66, "learning_rate": 1.9938176247609183e-05, "loss": 0.7465, "step": 20605 }, { "epoch": 0.66, "learning_rate": 1.9938052169604375e-05, "loss": 0.7537, "step": 20610 }, { "epoch": 0.66, "learning_rate": 1.9937927967601204e-05, "loss": 0.7499, "step": 20615 }, { "epoch": 0.66, "learning_rate": 1.9937803641601215e-05, "loss": 0.7677, "step": 20620 }, { "epoch": 0.66, "learning_rate": 1.9937679191605964e-05, "loss": 0.7475, "step": 20625 }, { "epoch": 0.66, "learning_rate": 1.9937554617617005e-05, "loss": 0.762, "step": 20630 }, { "epoch": 0.66, "learning_rate": 1.9937429919635888e-05, "loss": 0.7583, "step": 20635 }, { "epoch": 0.66, "learning_rate": 1.9937305097664176e-05, "loss": 0.7431, "step": 20640 }, { "epoch": 0.66, "learning_rate": 1.9937180151703416e-05, "loss": 0.7521, "step": 20645 }, { "epoch": 0.66, "learning_rate": 1.9937055081755172e-05, "loss": 0.742, "step": 20650 }, { "epoch": 0.66, "learning_rate": 1.9936929887821007e-05, "loss": 0.746, "step": 20655 }, { "epoch": 0.66, "learning_rate": 1.9936804569902482e-05, "loss": 0.7737, "step": 20660 }, { "epoch": 0.66, "learning_rate": 1.993667912800116e-05, "loss": 0.7451, "step": 20665 }, { "epoch": 0.66, "learning_rate": 1.9936553562118602e-05, "loss": 0.7507, "step": 20670 }, { "epoch": 0.66, "learning_rate": 1.993642787225638e-05, "loss": 0.7498, "step": 20675 }, { "epoch": 0.66, "learning_rate": 1.993630205841606e-05, "loss": 0.7428, "step": 20680 }, { "epoch": 0.66, "learning_rate": 1.9936176120599214e-05, "loss": 0.7458, "step": 20685 }, { "epoch": 0.66, "learning_rate": 1.9936050058807414e-05, "loss": 0.7563, "step": 20690 }, { "epoch": 0.66, "learning_rate": 1.9935923873042225e-05, "loss": 0.7516, "step": 20695 }, { "epoch": 0.66, "learning_rate": 1.9935797563305233e-05, "loss": 0.7459, "step": 20700 }, { "epoch": 0.66, "learning_rate": 1.9935671129598003e-05, "loss": 0.752, "step": 20705 }, { "epoch": 0.66, "learning_rate": 1.9935544571922124e-05, "loss": 0.7541, "step": 20710 }, { "epoch": 0.66, "learning_rate": 1.9935417890279162e-05, "loss": 0.7419, "step": 20715 }, { "epoch": 0.66, "learning_rate": 1.993529108467071e-05, "loss": 0.7506, "step": 20720 }, { "epoch": 0.66, "learning_rate": 1.993516415509834e-05, "loss": 0.7525, "step": 20725 }, { "epoch": 0.66, "learning_rate": 1.993503710156364e-05, "loss": 0.7559, "step": 20730 }, { "epoch": 0.66, "learning_rate": 1.9934909924068198e-05, "loss": 0.7533, "step": 20735 }, { "epoch": 0.66, "learning_rate": 1.9934782622613596e-05, "loss": 0.7562, "step": 20740 }, { "epoch": 0.66, "learning_rate": 1.9934655197201428e-05, "loss": 0.7544, "step": 20745 }, { "epoch": 0.66, "learning_rate": 1.9934527647833276e-05, "loss": 0.7553, "step": 20750 }, { "epoch": 0.66, "learning_rate": 1.993439997451074e-05, "loss": 0.7656, "step": 20755 }, { "epoch": 0.66, "learning_rate": 1.9934272177235407e-05, "loss": 0.7323, "step": 20760 }, { "epoch": 0.66, "learning_rate": 1.9934144256008878e-05, "loss": 0.7614, "step": 20765 }, { "epoch": 0.66, "learning_rate": 1.9934016210832738e-05, "loss": 0.7423, "step": 20770 }, { "epoch": 0.66, "learning_rate": 1.9933888041708593e-05, "loss": 0.7552, "step": 20775 }, { "epoch": 0.66, "learning_rate": 1.9933759748638043e-05, "loss": 0.7572, "step": 20780 }, { "epoch": 0.67, "learning_rate": 1.9933631331622686e-05, "loss": 0.7553, "step": 20785 }, { "epoch": 0.67, "learning_rate": 1.993350279066412e-05, "loss": 0.7397, "step": 20790 }, { "epoch": 0.67, "learning_rate": 1.993337412576396e-05, "loss": 0.7449, "step": 20795 }, { "epoch": 0.67, "learning_rate": 1.9933245336923798e-05, "loss": 0.7519, "step": 20800 }, { "epoch": 0.67, "learning_rate": 1.993311642414525e-05, "loss": 0.752, "step": 20805 }, { "epoch": 0.67, "learning_rate": 1.9932987387429924e-05, "loss": 0.7341, "step": 20810 }, { "epoch": 0.67, "learning_rate": 1.9932858226779426e-05, "loss": 0.75, "step": 20815 }, { "epoch": 0.67, "learning_rate": 1.993272894219537e-05, "loss": 0.7529, "step": 20820 }, { "epoch": 0.67, "learning_rate": 1.993259953367937e-05, "loss": 0.7608, "step": 20825 }, { "epoch": 0.67, "learning_rate": 1.993247000123304e-05, "loss": 0.7517, "step": 20830 }, { "epoch": 0.67, "learning_rate": 1.993234034485799e-05, "loss": 0.7501, "step": 20835 }, { "epoch": 0.67, "learning_rate": 1.993221056455585e-05, "loss": 0.7485, "step": 20840 }, { "epoch": 0.67, "learning_rate": 1.993208066032823e-05, "loss": 0.7538, "step": 20845 }, { "epoch": 0.67, "learning_rate": 1.9931950632176753e-05, "loss": 0.7591, "step": 20850 }, { "epoch": 0.67, "learning_rate": 1.9931820480103037e-05, "loss": 0.7675, "step": 20855 }, { "epoch": 0.67, "learning_rate": 1.9931690204108716e-05, "loss": 0.7677, "step": 20860 }, { "epoch": 0.67, "learning_rate": 1.9931559804195413e-05, "loss": 0.7464, "step": 20865 }, { "epoch": 0.67, "learning_rate": 1.9931429280364747e-05, "loss": 0.7474, "step": 20870 }, { "epoch": 0.67, "learning_rate": 1.9931298632618355e-05, "loss": 0.7398, "step": 20875 }, { "epoch": 0.67, "learning_rate": 1.9931167860957864e-05, "loss": 0.7535, "step": 20880 }, { "epoch": 0.67, "learning_rate": 1.99310369653849e-05, "loss": 0.7442, "step": 20885 }, { "epoch": 0.67, "learning_rate": 1.9930905945901106e-05, "loss": 0.7478, "step": 20890 }, { "epoch": 0.67, "learning_rate": 1.9930774802508113e-05, "loss": 0.7484, "step": 20895 }, { "epoch": 0.67, "learning_rate": 1.9930643535207556e-05, "loss": 0.7555, "step": 20900 }, { "epoch": 0.67, "learning_rate": 1.9930512144001074e-05, "loss": 0.7462, "step": 20905 }, { "epoch": 0.67, "learning_rate": 1.9930380628890305e-05, "loss": 0.7631, "step": 20910 }, { "epoch": 0.67, "learning_rate": 1.993024898987689e-05, "loss": 0.7579, "step": 20915 }, { "epoch": 0.67, "learning_rate": 1.9930117226962475e-05, "loss": 0.7509, "step": 20920 }, { "epoch": 0.67, "learning_rate": 1.99299853401487e-05, "loss": 0.7524, "step": 20925 }, { "epoch": 0.67, "learning_rate": 1.992985332943721e-05, "loss": 0.748, "step": 20930 }, { "epoch": 0.67, "learning_rate": 1.9929721194829657e-05, "loss": 0.7531, "step": 20935 }, { "epoch": 0.67, "learning_rate": 1.9929588936327686e-05, "loss": 0.746, "step": 20940 }, { "epoch": 0.67, "learning_rate": 1.992945655393295e-05, "loss": 0.7464, "step": 20945 }, { "epoch": 0.67, "learning_rate": 1.9929324047647095e-05, "loss": 0.7463, "step": 20950 }, { "epoch": 0.67, "learning_rate": 1.992919141747178e-05, "loss": 0.7512, "step": 20955 }, { "epoch": 0.67, "learning_rate": 1.9929058663408656e-05, "loss": 0.7466, "step": 20960 }, { "epoch": 0.67, "learning_rate": 1.9928925785459385e-05, "loss": 0.7504, "step": 20965 }, { "epoch": 0.67, "learning_rate": 1.9928792783625615e-05, "loss": 0.7537, "step": 20970 }, { "epoch": 0.67, "learning_rate": 1.992865965790902e-05, "loss": 0.7646, "step": 20975 }, { "epoch": 0.67, "learning_rate": 1.9928526408311245e-05, "loss": 0.7401, "step": 20980 }, { "epoch": 0.67, "learning_rate": 1.9928393034833964e-05, "loss": 0.7527, "step": 20985 }, { "epoch": 0.67, "learning_rate": 1.9928259537478832e-05, "loss": 0.7539, "step": 20990 }, { "epoch": 0.67, "learning_rate": 1.9928125916247528e-05, "loss": 0.7515, "step": 20995 }, { "epoch": 0.67, "learning_rate": 1.9927992171141707e-05, "loss": 0.7422, "step": 21000 }, { "epoch": 0.67, "learning_rate": 1.9927858302163044e-05, "loss": 0.7408, "step": 21005 }, { "epoch": 0.67, "learning_rate": 1.9927724309313205e-05, "loss": 0.756, "step": 21010 }, { "epoch": 0.67, "learning_rate": 1.9927590192593867e-05, "loss": 0.7471, "step": 21015 }, { "epoch": 0.67, "learning_rate": 1.9927455952006695e-05, "loss": 0.756, "step": 21020 }, { "epoch": 0.67, "learning_rate": 1.9927321587553378e-05, "loss": 0.7339, "step": 21025 }, { "epoch": 0.67, "learning_rate": 1.9927187099235577e-05, "loss": 0.7436, "step": 21030 }, { "epoch": 0.67, "learning_rate": 1.992705248705498e-05, "loss": 0.743, "step": 21035 }, { "epoch": 0.67, "learning_rate": 1.9926917751013262e-05, "loss": 0.7502, "step": 21040 }, { "epoch": 0.67, "learning_rate": 1.9926782891112103e-05, "loss": 0.7494, "step": 21045 }, { "epoch": 0.67, "learning_rate": 1.9926647907353198e-05, "loss": 0.7562, "step": 21050 }, { "epoch": 0.67, "learning_rate": 1.992651279973821e-05, "loss": 0.7415, "step": 21055 }, { "epoch": 0.67, "learning_rate": 1.992637756826884e-05, "loss": 0.7481, "step": 21060 }, { "epoch": 0.67, "learning_rate": 1.9926242212946777e-05, "loss": 0.7561, "step": 21065 }, { "epoch": 0.67, "learning_rate": 1.99261067337737e-05, "loss": 0.7392, "step": 21070 }, { "epoch": 0.67, "learning_rate": 1.99259711307513e-05, "loss": 0.7388, "step": 21075 }, { "epoch": 0.67, "learning_rate": 1.992583540388128e-05, "loss": 0.7475, "step": 21080 }, { "epoch": 0.67, "learning_rate": 1.9925699553165324e-05, "loss": 0.7446, "step": 21085 }, { "epoch": 0.67, "learning_rate": 1.992556357860513e-05, "loss": 0.7507, "step": 21090 }, { "epoch": 0.68, "learning_rate": 1.992542748020239e-05, "loss": 0.7611, "step": 21095 }, { "epoch": 0.68, "learning_rate": 1.992529125795881e-05, "loss": 0.7403, "step": 21100 }, { "epoch": 0.68, "learning_rate": 1.9925154911876085e-05, "loss": 0.7435, "step": 21105 }, { "epoch": 0.68, "learning_rate": 1.9925018441955916e-05, "loss": 0.758, "step": 21110 }, { "epoch": 0.68, "learning_rate": 1.9924881848200007e-05, "loss": 0.7523, "step": 21115 }, { "epoch": 0.68, "learning_rate": 1.992474513061006e-05, "loss": 0.7495, "step": 21120 }, { "epoch": 0.68, "learning_rate": 1.9924608289187786e-05, "loss": 0.7477, "step": 21125 }, { "epoch": 0.68, "learning_rate": 1.9924471323934885e-05, "loss": 0.75, "step": 21130 }, { "epoch": 0.68, "learning_rate": 1.9924334234853076e-05, "loss": 0.7493, "step": 21135 }, { "epoch": 0.68, "learning_rate": 1.992419702194406e-05, "loss": 0.7628, "step": 21140 }, { "epoch": 0.68, "learning_rate": 1.9924059685209548e-05, "loss": 0.7462, "step": 21145 }, { "epoch": 0.68, "learning_rate": 1.9923922224651265e-05, "loss": 0.7555, "step": 21150 }, { "epoch": 0.68, "learning_rate": 1.9923784640270914e-05, "loss": 0.7566, "step": 21155 }, { "epoch": 0.68, "learning_rate": 1.9923646932070223e-05, "loss": 0.7514, "step": 21160 }, { "epoch": 0.68, "learning_rate": 1.9923509100050903e-05, "loss": 0.7528, "step": 21165 }, { "epoch": 0.68, "learning_rate": 1.992337114421467e-05, "loss": 0.7454, "step": 21170 }, { "epoch": 0.68, "learning_rate": 1.9923233064563253e-05, "loss": 0.7561, "step": 21175 }, { "epoch": 0.68, "learning_rate": 1.9923094861098372e-05, "loss": 0.7446, "step": 21180 }, { "epoch": 0.68, "learning_rate": 1.992295653382175e-05, "loss": 0.7527, "step": 21185 }, { "epoch": 0.68, "learning_rate": 1.9922818082735116e-05, "loss": 0.7444, "step": 21190 }, { "epoch": 0.68, "learning_rate": 1.9922679507840197e-05, "loss": 0.7492, "step": 21195 }, { "epoch": 0.68, "learning_rate": 1.9922540809138716e-05, "loss": 0.7507, "step": 21200 }, { "epoch": 0.68, "learning_rate": 1.9922401986632414e-05, "loss": 0.7476, "step": 21205 }, { "epoch": 0.68, "learning_rate": 1.9922263040323013e-05, "loss": 0.7543, "step": 21210 }, { "epoch": 0.68, "learning_rate": 1.9922123970212256e-05, "loss": 0.7479, "step": 21215 }, { "epoch": 0.68, "learning_rate": 1.9921984776301867e-05, "loss": 0.7459, "step": 21220 }, { "epoch": 0.68, "learning_rate": 1.9921845458593595e-05, "loss": 0.7333, "step": 21225 }, { "epoch": 0.68, "learning_rate": 1.992170601708917e-05, "loss": 0.7551, "step": 21230 }, { "epoch": 0.68, "learning_rate": 1.992156645179033e-05, "loss": 0.7441, "step": 21235 }, { "epoch": 0.68, "learning_rate": 1.9921426762698827e-05, "loss": 0.7508, "step": 21240 }, { "epoch": 0.68, "learning_rate": 1.9921286949816394e-05, "loss": 0.7423, "step": 21245 }, { "epoch": 0.68, "learning_rate": 1.9921147013144782e-05, "loss": 0.7407, "step": 21250 }, { "epoch": 0.68, "learning_rate": 1.992100695268573e-05, "loss": 0.7472, "step": 21255 }, { "epoch": 0.68, "learning_rate": 1.9920866768440993e-05, "loss": 0.7344, "step": 21260 }, { "epoch": 0.68, "learning_rate": 1.9920726460412312e-05, "loss": 0.7512, "step": 21265 }, { "epoch": 0.68, "learning_rate": 1.9920586028601445e-05, "loss": 0.754, "step": 21270 }, { "epoch": 0.68, "learning_rate": 1.992044547301014e-05, "loss": 0.7401, "step": 21275 }, { "epoch": 0.68, "learning_rate": 1.9920304793640155e-05, "loss": 0.7535, "step": 21280 }, { "epoch": 0.68, "learning_rate": 1.992016399049324e-05, "loss": 0.7521, "step": 21285 }, { "epoch": 0.68, "learning_rate": 1.9920023063571153e-05, "loss": 0.7449, "step": 21290 }, { "epoch": 0.68, "learning_rate": 1.9919882012875656e-05, "loss": 0.755, "step": 21295 }, { "epoch": 0.68, "learning_rate": 1.9919740838408506e-05, "loss": 0.7436, "step": 21300 }, { "epoch": 0.68, "learning_rate": 1.9919599540171466e-05, "loss": 0.7507, "step": 21305 }, { "epoch": 0.68, "learning_rate": 1.9919458118166297e-05, "loss": 0.7493, "step": 21310 }, { "epoch": 0.68, "learning_rate": 1.9919316572394764e-05, "loss": 0.747, "step": 21315 }, { "epoch": 0.68, "learning_rate": 1.9919174902858632e-05, "loss": 0.7504, "step": 21320 }, { "epoch": 0.68, "learning_rate": 1.9919033109559677e-05, "loss": 0.7523, "step": 21325 }, { "epoch": 0.68, "learning_rate": 1.991889119249965e-05, "loss": 0.7427, "step": 21330 }, { "epoch": 0.68, "learning_rate": 1.991874915168034e-05, "loss": 0.7415, "step": 21335 }, { "epoch": 0.68, "learning_rate": 1.9918606987103515e-05, "loss": 0.7398, "step": 21340 }, { "epoch": 0.68, "learning_rate": 1.9918464698770944e-05, "loss": 0.7481, "step": 21345 }, { "epoch": 0.68, "learning_rate": 1.9918322286684402e-05, "loss": 0.7391, "step": 21350 }, { "epoch": 0.68, "learning_rate": 1.991817975084567e-05, "loss": 0.7516, "step": 21355 }, { "epoch": 0.68, "learning_rate": 1.9918037091256527e-05, "loss": 0.7411, "step": 21360 }, { "epoch": 0.68, "learning_rate": 1.9917894307918745e-05, "loss": 0.7472, "step": 21365 }, { "epoch": 0.68, "learning_rate": 1.9917751400834114e-05, "loss": 0.7569, "step": 21370 }, { "epoch": 0.68, "learning_rate": 1.9917608370004417e-05, "loss": 0.7466, "step": 21375 }, { "epoch": 0.68, "learning_rate": 1.9917465215431434e-05, "loss": 0.7383, "step": 21380 }, { "epoch": 0.68, "learning_rate": 1.9917321937116955e-05, "loss": 0.7354, "step": 21385 }, { "epoch": 0.68, "learning_rate": 1.9917178535062764e-05, "loss": 0.7418, "step": 21390 }, { "epoch": 0.68, "learning_rate": 1.9917035009270652e-05, "loss": 0.7549, "step": 21395 }, { "epoch": 0.68, "learning_rate": 1.991689135974241e-05, "loss": 0.7441, "step": 21400 }, { "epoch": 0.68, "learning_rate": 1.991674758647983e-05, "loss": 0.7462, "step": 21405 }, { "epoch": 0.69, "learning_rate": 1.9916603689484707e-05, "loss": 0.7466, "step": 21410 }, { "epoch": 0.69, "learning_rate": 1.9916459668758837e-05, "loss": 0.758, "step": 21415 }, { "epoch": 0.69, "learning_rate": 1.991631552430401e-05, "loss": 0.7412, "step": 21420 }, { "epoch": 0.69, "learning_rate": 1.9916171256122036e-05, "loss": 0.7408, "step": 21425 }, { "epoch": 0.69, "learning_rate": 1.9916026864214707e-05, "loss": 0.7451, "step": 21430 }, { "epoch": 0.69, "learning_rate": 1.9915882348583827e-05, "loss": 0.7312, "step": 21435 }, { "epoch": 0.69, "learning_rate": 1.99157377092312e-05, "loss": 0.7475, "step": 21440 }, { "epoch": 0.69, "learning_rate": 1.9915592946158626e-05, "loss": 0.7532, "step": 21445 }, { "epoch": 0.69, "learning_rate": 1.9915448059367916e-05, "loss": 0.744, "step": 21450 }, { "epoch": 0.69, "learning_rate": 1.9915303048860876e-05, "loss": 0.7455, "step": 21455 }, { "epoch": 0.69, "learning_rate": 1.991515791463932e-05, "loss": 0.7555, "step": 21460 }, { "epoch": 0.69, "learning_rate": 1.991501265670505e-05, "loss": 0.7522, "step": 21465 }, { "epoch": 0.69, "learning_rate": 1.9914867275059887e-05, "loss": 0.7358, "step": 21470 }, { "epoch": 0.69, "learning_rate": 1.9914721769705637e-05, "loss": 0.7435, "step": 21475 }, { "epoch": 0.69, "learning_rate": 1.991457614064412e-05, "loss": 0.7526, "step": 21480 }, { "epoch": 0.69, "learning_rate": 1.9914430387877155e-05, "loss": 0.7473, "step": 21485 }, { "epoch": 0.69, "learning_rate": 1.9914284511406557e-05, "loss": 0.7292, "step": 21490 }, { "epoch": 0.69, "learning_rate": 1.9914138511234145e-05, "loss": 0.7544, "step": 21495 }, { "epoch": 0.69, "learning_rate": 1.9913992387361747e-05, "loss": 0.7402, "step": 21500 }, { "epoch": 0.69, "learning_rate": 1.991384613979118e-05, "loss": 0.7463, "step": 21505 }, { "epoch": 0.69, "learning_rate": 1.991369976852427e-05, "loss": 0.7579, "step": 21510 }, { "epoch": 0.69, "learning_rate": 1.9913553273562846e-05, "loss": 0.7417, "step": 21515 }, { "epoch": 0.69, "learning_rate": 1.9913406654908732e-05, "loss": 0.7432, "step": 21520 }, { "epoch": 0.69, "learning_rate": 1.9913259912563762e-05, "loss": 0.7408, "step": 21525 }, { "epoch": 0.69, "learning_rate": 1.9913113046529762e-05, "loss": 0.7525, "step": 21530 }, { "epoch": 0.69, "learning_rate": 1.991296605680857e-05, "loss": 0.7534, "step": 21535 }, { "epoch": 0.69, "learning_rate": 1.9912818943402013e-05, "loss": 0.7328, "step": 21540 }, { "epoch": 0.69, "learning_rate": 1.991267170631193e-05, "loss": 0.7535, "step": 21545 }, { "epoch": 0.69, "learning_rate": 1.9912524345540164e-05, "loss": 0.7405, "step": 21550 }, { "epoch": 0.69, "learning_rate": 1.991237686108854e-05, "loss": 0.7383, "step": 21555 }, { "epoch": 0.69, "learning_rate": 1.9912229252958914e-05, "loss": 0.7365, "step": 21560 }, { "epoch": 0.69, "learning_rate": 1.9912081521153114e-05, "loss": 0.7566, "step": 21565 }, { "epoch": 0.69, "learning_rate": 1.9911933665672993e-05, "loss": 0.7426, "step": 21570 }, { "epoch": 0.69, "learning_rate": 1.991178568652039e-05, "loss": 0.7391, "step": 21575 }, { "epoch": 0.69, "learning_rate": 1.9911637583697155e-05, "loss": 0.7313, "step": 21580 }, { "epoch": 0.69, "learning_rate": 1.991148935720513e-05, "loss": 0.7476, "step": 21585 }, { "epoch": 0.69, "learning_rate": 1.9911341007046175e-05, "loss": 0.7496, "step": 21590 }, { "epoch": 0.69, "learning_rate": 1.991119253322213e-05, "loss": 0.7421, "step": 21595 }, { "epoch": 0.69, "learning_rate": 1.9911043935734855e-05, "loss": 0.744, "step": 21600 }, { "epoch": 0.69, "learning_rate": 1.9910895214586198e-05, "loss": 0.7467, "step": 21605 }, { "epoch": 0.69, "learning_rate": 1.991074636977802e-05, "loss": 0.756, "step": 21610 }, { "epoch": 0.69, "learning_rate": 1.9910597401312176e-05, "loss": 0.7465, "step": 21615 }, { "epoch": 0.69, "learning_rate": 1.9910448309190525e-05, "loss": 0.7468, "step": 21620 }, { "epoch": 0.69, "learning_rate": 1.991029909341493e-05, "loss": 0.7523, "step": 21625 }, { "epoch": 0.69, "learning_rate": 1.9910149753987244e-05, "loss": 0.7619, "step": 21630 }, { "epoch": 0.69, "learning_rate": 1.9910000290909343e-05, "loss": 0.7455, "step": 21635 }, { "epoch": 0.69, "learning_rate": 1.990985070418308e-05, "loss": 0.7539, "step": 21640 }, { "epoch": 0.69, "learning_rate": 1.9909700993810327e-05, "loss": 0.7573, "step": 21645 }, { "epoch": 0.69, "learning_rate": 1.990955115979295e-05, "loss": 0.7484, "step": 21650 }, { "epoch": 0.69, "learning_rate": 1.9909401202132824e-05, "loss": 0.7373, "step": 21655 }, { "epoch": 0.69, "learning_rate": 1.9909251120831813e-05, "loss": 0.7402, "step": 21660 }, { "epoch": 0.69, "learning_rate": 1.9909100915891795e-05, "loss": 0.7406, "step": 21665 }, { "epoch": 0.69, "learning_rate": 1.990895058731464e-05, "loss": 0.7625, "step": 21670 }, { "epoch": 0.69, "learning_rate": 1.990880013510222e-05, "loss": 0.7369, "step": 21675 }, { "epoch": 0.69, "learning_rate": 1.9908649559256426e-05, "loss": 0.7432, "step": 21680 }, { "epoch": 0.69, "learning_rate": 1.9908498859779125e-05, "loss": 0.7486, "step": 21685 }, { "epoch": 0.69, "learning_rate": 1.9908348036672202e-05, "loss": 0.7473, "step": 21690 }, { "epoch": 0.69, "learning_rate": 1.9908197089937534e-05, "loss": 0.7395, "step": 21695 }, { "epoch": 0.69, "learning_rate": 1.990804601957701e-05, "loss": 0.7524, "step": 21700 }, { "epoch": 0.69, "learning_rate": 1.9907894825592514e-05, "loss": 0.749, "step": 21705 }, { "epoch": 0.69, "learning_rate": 1.9907743507985926e-05, "loss": 0.7343, "step": 21710 }, { "epoch": 0.69, "learning_rate": 1.9907592066759146e-05, "loss": 0.745, "step": 21715 }, { "epoch": 0.7, "learning_rate": 1.9907440501914053e-05, "loss": 0.7319, "step": 21720 }, { "epoch": 0.7, "learning_rate": 1.990728881345254e-05, "loss": 0.7519, "step": 21725 }, { "epoch": 0.7, "learning_rate": 1.9907137001376506e-05, "loss": 0.7428, "step": 21730 }, { "epoch": 0.7, "learning_rate": 1.9906985065687835e-05, "loss": 0.7515, "step": 21735 }, { "epoch": 0.7, "learning_rate": 1.9906833006388435e-05, "loss": 0.7365, "step": 21740 }, { "epoch": 0.7, "learning_rate": 1.9906680823480192e-05, "loss": 0.7501, "step": 21745 }, { "epoch": 0.7, "learning_rate": 1.990652851696501e-05, "loss": 0.7409, "step": 21750 }, { "epoch": 0.7, "learning_rate": 1.990637608684479e-05, "loss": 0.7494, "step": 21755 }, { "epoch": 0.7, "learning_rate": 1.9906223533121435e-05, "loss": 0.7548, "step": 21760 }, { "epoch": 0.7, "learning_rate": 1.9906070855796842e-05, "loss": 0.7475, "step": 21765 }, { "epoch": 0.7, "learning_rate": 1.990591805487292e-05, "loss": 0.7504, "step": 21770 }, { "epoch": 0.7, "learning_rate": 1.9905765130351577e-05, "loss": 0.7441, "step": 21775 }, { "epoch": 0.7, "learning_rate": 1.990561208223472e-05, "loss": 0.7542, "step": 21780 }, { "epoch": 0.7, "learning_rate": 1.9905458910524256e-05, "loss": 0.7541, "step": 21785 }, { "epoch": 0.7, "learning_rate": 1.9905305615222104e-05, "loss": 0.7489, "step": 21790 }, { "epoch": 0.7, "learning_rate": 1.9905152196330168e-05, "loss": 0.7349, "step": 21795 }, { "epoch": 0.7, "learning_rate": 1.990499865385036e-05, "loss": 0.7535, "step": 21800 }, { "epoch": 0.7, "learning_rate": 1.990484498778461e-05, "loss": 0.7445, "step": 21805 }, { "epoch": 0.7, "learning_rate": 1.990469119813482e-05, "loss": 0.7434, "step": 21810 }, { "epoch": 0.7, "learning_rate": 1.9904537284902917e-05, "loss": 0.749, "step": 21815 }, { "epoch": 0.7, "learning_rate": 1.9904383248090823e-05, "loss": 0.7475, "step": 21820 }, { "epoch": 0.7, "learning_rate": 1.9904229087700454e-05, "loss": 0.7442, "step": 21825 }, { "epoch": 0.7, "learning_rate": 1.9904074803733735e-05, "loss": 0.7376, "step": 21830 }, { "epoch": 0.7, "learning_rate": 1.9903920396192592e-05, "loss": 0.741, "step": 21835 }, { "epoch": 0.7, "learning_rate": 1.9903765865078952e-05, "loss": 0.7407, "step": 21840 }, { "epoch": 0.7, "learning_rate": 1.990361121039474e-05, "loss": 0.7428, "step": 21845 }, { "epoch": 0.7, "learning_rate": 1.9903456432141898e-05, "loss": 0.7466, "step": 21850 }, { "epoch": 0.7, "learning_rate": 1.990330153032234e-05, "loss": 0.7467, "step": 21855 }, { "epoch": 0.7, "learning_rate": 1.9903146504938005e-05, "loss": 0.7546, "step": 21860 }, { "epoch": 0.7, "learning_rate": 1.9902991355990832e-05, "loss": 0.7433, "step": 21865 }, { "epoch": 0.7, "learning_rate": 1.990283608348275e-05, "loss": 0.7391, "step": 21870 }, { "epoch": 0.7, "learning_rate": 1.9902680687415704e-05, "loss": 0.7386, "step": 21875 }, { "epoch": 0.7, "learning_rate": 1.9902525167791626e-05, "loss": 0.7452, "step": 21880 }, { "epoch": 0.7, "learning_rate": 1.990236952461246e-05, "loss": 0.7432, "step": 21885 }, { "epoch": 0.7, "learning_rate": 1.9902213757880147e-05, "loss": 0.7407, "step": 21890 }, { "epoch": 0.7, "learning_rate": 1.9902057867596633e-05, "loss": 0.7528, "step": 21895 }, { "epoch": 0.7, "learning_rate": 1.9901901853763857e-05, "loss": 0.7354, "step": 21900 }, { "epoch": 0.7, "learning_rate": 1.9901745716383773e-05, "loss": 0.7481, "step": 21905 }, { "epoch": 0.7, "learning_rate": 1.9901589455458322e-05, "loss": 0.7438, "step": 21910 }, { "epoch": 0.7, "learning_rate": 1.9901433070989458e-05, "loss": 0.734, "step": 21915 }, { "epoch": 0.7, "learning_rate": 1.990127656297913e-05, "loss": 0.7508, "step": 21920 }, { "epoch": 0.7, "learning_rate": 1.9901119931429294e-05, "loss": 0.7374, "step": 21925 }, { "epoch": 0.7, "learning_rate": 1.9900963176341902e-05, "loss": 0.7486, "step": 21930 }, { "epoch": 0.7, "learning_rate": 1.9900806297718912e-05, "loss": 0.751, "step": 21935 }, { "epoch": 0.7, "learning_rate": 1.9900649295562275e-05, "loss": 0.7366, "step": 21940 }, { "epoch": 0.7, "learning_rate": 1.9900492169873957e-05, "loss": 0.7401, "step": 21945 }, { "epoch": 0.7, "learning_rate": 1.990033492065592e-05, "loss": 0.7289, "step": 21950 }, { "epoch": 0.7, "learning_rate": 1.9900177547910116e-05, "loss": 0.7459, "step": 21955 }, { "epoch": 0.7, "learning_rate": 1.9900020051638517e-05, "loss": 0.7398, "step": 21960 }, { "epoch": 0.7, "learning_rate": 1.9899862431843087e-05, "loss": 0.7425, "step": 21965 }, { "epoch": 0.7, "learning_rate": 1.989970468852579e-05, "loss": 0.7455, "step": 21970 }, { "epoch": 0.7, "learning_rate": 1.9899546821688597e-05, "loss": 0.7408, "step": 21975 }, { "epoch": 0.7, "learning_rate": 1.9899388831333475e-05, "loss": 0.7512, "step": 21980 }, { "epoch": 0.7, "learning_rate": 1.9899230717462398e-05, "loss": 0.744, "step": 21985 }, { "epoch": 0.7, "learning_rate": 1.9899072480077337e-05, "loss": 0.7425, "step": 21990 }, { "epoch": 0.7, "learning_rate": 1.9898914119180265e-05, "loss": 0.7343, "step": 21995 }, { "epoch": 0.7, "learning_rate": 1.989875563477316e-05, "loss": 0.737, "step": 22000 }, { "epoch": 0.7, "learning_rate": 1.9898597026858e-05, "loss": 0.7428, "step": 22005 }, { "epoch": 0.7, "learning_rate": 1.989843829543676e-05, "loss": 0.7307, "step": 22010 }, { "epoch": 0.7, "learning_rate": 1.989827944051143e-05, "loss": 0.7353, "step": 22015 }, { "epoch": 0.7, "learning_rate": 1.9898120462083977e-05, "loss": 0.7449, "step": 22020 }, { "epoch": 0.7, "learning_rate": 1.9897961360156398e-05, "loss": 0.7391, "step": 22025 }, { "epoch": 0.7, "learning_rate": 1.9897802134730673e-05, "loss": 0.7261, "step": 22030 }, { "epoch": 0.71, "learning_rate": 1.989764278580879e-05, "loss": 0.7459, "step": 22035 }, { "epoch": 0.71, "learning_rate": 1.9897483313392735e-05, "loss": 0.7344, "step": 22040 }, { "epoch": 0.71, "learning_rate": 1.98973237174845e-05, "loss": 0.7396, "step": 22045 }, { "epoch": 0.71, "learning_rate": 1.9897163998086076e-05, "loss": 0.7376, "step": 22050 }, { "epoch": 0.71, "learning_rate": 1.9897004155199452e-05, "loss": 0.7331, "step": 22055 }, { "epoch": 0.71, "learning_rate": 1.989684418882663e-05, "loss": 0.7517, "step": 22060 }, { "epoch": 0.71, "learning_rate": 1.9896684098969598e-05, "loss": 0.7413, "step": 22065 }, { "epoch": 0.71, "learning_rate": 1.9896523885630356e-05, "loss": 0.7488, "step": 22070 }, { "epoch": 0.71, "learning_rate": 1.9896363548810905e-05, "loss": 0.7415, "step": 22075 }, { "epoch": 0.71, "learning_rate": 1.9896203088513245e-05, "loss": 0.7442, "step": 22080 }, { "epoch": 0.71, "learning_rate": 1.9896042504739377e-05, "loss": 0.7391, "step": 22085 }, { "epoch": 0.71, "learning_rate": 1.9895881797491307e-05, "loss": 0.7602, "step": 22090 }, { "epoch": 0.71, "learning_rate": 1.9895720966771034e-05, "loss": 0.7378, "step": 22095 }, { "epoch": 0.71, "learning_rate": 1.9895560012580574e-05, "loss": 0.7416, "step": 22100 }, { "epoch": 0.71, "learning_rate": 1.9895398934921927e-05, "loss": 0.7429, "step": 22105 }, { "epoch": 0.71, "learning_rate": 1.9895237733797107e-05, "loss": 0.7442, "step": 22110 }, { "epoch": 0.71, "learning_rate": 1.989507640920812e-05, "loss": 0.745, "step": 22115 }, { "epoch": 0.71, "learning_rate": 1.989491496115699e-05, "loss": 0.7458, "step": 22120 }, { "epoch": 0.71, "learning_rate": 1.9894753389645723e-05, "loss": 0.7415, "step": 22125 }, { "epoch": 0.71, "learning_rate": 1.9894591694676334e-05, "loss": 0.7358, "step": 22130 }, { "epoch": 0.71, "learning_rate": 1.9894429876250844e-05, "loss": 0.7338, "step": 22135 }, { "epoch": 0.71, "learning_rate": 1.9894267934371273e-05, "loss": 0.7483, "step": 22140 }, { "epoch": 0.71, "learning_rate": 1.9894105869039636e-05, "loss": 0.7427, "step": 22145 }, { "epoch": 0.71, "learning_rate": 1.9893943680257964e-05, "loss": 0.7357, "step": 22150 }, { "epoch": 0.71, "learning_rate": 1.9893781368028274e-05, "loss": 0.7382, "step": 22155 }, { "epoch": 0.71, "learning_rate": 1.989361893235259e-05, "loss": 0.7373, "step": 22160 }, { "epoch": 0.71, "learning_rate": 1.9893456373232944e-05, "loss": 0.7276, "step": 22165 }, { "epoch": 0.71, "learning_rate": 1.989329369067136e-05, "loss": 0.7338, "step": 22170 }, { "epoch": 0.71, "learning_rate": 1.989313088466987e-05, "loss": 0.7416, "step": 22175 }, { "epoch": 0.71, "learning_rate": 1.9892967955230504e-05, "loss": 0.733, "step": 22180 }, { "epoch": 0.71, "learning_rate": 1.9892804902355293e-05, "loss": 0.7419, "step": 22185 }, { "epoch": 0.71, "learning_rate": 1.9892641726046277e-05, "loss": 0.7412, "step": 22190 }, { "epoch": 0.71, "learning_rate": 1.9892478426305492e-05, "loss": 0.7458, "step": 22195 }, { "epoch": 0.71, "learning_rate": 1.9892315003134968e-05, "loss": 0.726, "step": 22200 }, { "epoch": 0.71, "learning_rate": 1.989215145653675e-05, "loss": 0.7427, "step": 22205 }, { "epoch": 0.71, "learning_rate": 1.989198778651288e-05, "loss": 0.7497, "step": 22210 }, { "epoch": 0.71, "learning_rate": 1.9891823993065393e-05, "loss": 0.7308, "step": 22215 }, { "epoch": 0.71, "learning_rate": 1.9891660076196338e-05, "loss": 0.7517, "step": 22220 }, { "epoch": 0.71, "learning_rate": 1.989149603590776e-05, "loss": 0.7437, "step": 22225 }, { "epoch": 0.71, "learning_rate": 1.9891331872201707e-05, "loss": 0.7504, "step": 22230 }, { "epoch": 0.71, "learning_rate": 1.9891167585080226e-05, "loss": 0.7558, "step": 22235 }, { "epoch": 0.71, "learning_rate": 1.989100317454536e-05, "loss": 0.7384, "step": 22240 }, { "epoch": 0.71, "learning_rate": 1.989083864059917e-05, "loss": 0.7518, "step": 22245 }, { "epoch": 0.71, "learning_rate": 1.9890673983243708e-05, "loss": 0.7517, "step": 22250 }, { "epoch": 0.71, "learning_rate": 1.989050920248102e-05, "loss": 0.7406, "step": 22255 }, { "epoch": 0.71, "learning_rate": 1.9890344298313175e-05, "loss": 0.7296, "step": 22260 }, { "epoch": 0.71, "learning_rate": 1.9890179270742217e-05, "loss": 0.7422, "step": 22265 }, { "epoch": 0.71, "learning_rate": 1.9890014119770214e-05, "loss": 0.7461, "step": 22270 }, { "epoch": 0.71, "learning_rate": 1.9889848845399226e-05, "loss": 0.7561, "step": 22275 }, { "epoch": 0.71, "learning_rate": 1.988968344763131e-05, "loss": 0.7494, "step": 22280 }, { "epoch": 0.71, "learning_rate": 1.9889517926468534e-05, "loss": 0.7431, "step": 22285 }, { "epoch": 0.71, "learning_rate": 1.9889352281912963e-05, "loss": 0.7364, "step": 22290 }, { "epoch": 0.71, "learning_rate": 1.988918651396666e-05, "loss": 0.7455, "step": 22295 }, { "epoch": 0.71, "learning_rate": 1.98890206226317e-05, "loss": 0.7318, "step": 22300 }, { "epoch": 0.71, "learning_rate": 1.988885460791015e-05, "loss": 0.7369, "step": 22305 }, { "epoch": 0.71, "learning_rate": 1.9888688469804075e-05, "loss": 0.7461, "step": 22310 }, { "epoch": 0.71, "learning_rate": 1.9888522208315557e-05, "loss": 0.743, "step": 22315 }, { "epoch": 0.71, "learning_rate": 1.988835582344667e-05, "loss": 0.7438, "step": 22320 }, { "epoch": 0.71, "learning_rate": 1.988818931519948e-05, "loss": 0.7326, "step": 22325 }, { "epoch": 0.71, "learning_rate": 1.9888022683576073e-05, "loss": 0.7356, "step": 22330 }, { "epoch": 0.71, "learning_rate": 1.9887855928578527e-05, "loss": 0.7334, "step": 22335 }, { "epoch": 0.71, "learning_rate": 1.9887689050208924e-05, "loss": 0.742, "step": 22340 }, { "epoch": 0.72, "learning_rate": 1.9887522048469342e-05, "loss": 0.743, "step": 22345 }, { "epoch": 0.72, "learning_rate": 1.988735492336187e-05, "loss": 0.7406, "step": 22350 }, { "epoch": 0.72, "learning_rate": 1.9887187674888587e-05, "loss": 0.7334, "step": 22355 }, { "epoch": 0.72, "learning_rate": 1.9887020303051586e-05, "loss": 0.7201, "step": 22360 }, { "epoch": 0.72, "learning_rate": 1.988685280785295e-05, "loss": 0.7406, "step": 22365 }, { "epoch": 0.72, "learning_rate": 1.988668518929477e-05, "loss": 0.7312, "step": 22370 }, { "epoch": 0.72, "learning_rate": 1.988651744737914e-05, "loss": 0.7424, "step": 22375 }, { "epoch": 0.72, "learning_rate": 1.9886349582108154e-05, "loss": 0.7396, "step": 22380 }, { "epoch": 0.72, "learning_rate": 1.98861815934839e-05, "loss": 0.7373, "step": 22385 }, { "epoch": 0.72, "learning_rate": 1.988601348150848e-05, "loss": 0.7389, "step": 22390 }, { "epoch": 0.72, "learning_rate": 1.988584524618399e-05, "loss": 0.7361, "step": 22395 }, { "epoch": 0.72, "learning_rate": 1.988567688751253e-05, "loss": 0.7269, "step": 22400 }, { "epoch": 0.72, "learning_rate": 1.9885508405496193e-05, "loss": 0.7258, "step": 22405 }, { "epoch": 0.72, "learning_rate": 1.9885339800137094e-05, "loss": 0.757, "step": 22410 }, { "epoch": 0.72, "learning_rate": 1.9885171071437327e-05, "loss": 0.7379, "step": 22415 }, { "epoch": 0.72, "learning_rate": 1.9885002219399e-05, "loss": 0.7412, "step": 22420 }, { "epoch": 0.72, "learning_rate": 1.9884833244024226e-05, "loss": 0.7325, "step": 22425 }, { "epoch": 0.72, "learning_rate": 1.98846641453151e-05, "loss": 0.7347, "step": 22430 }, { "epoch": 0.72, "learning_rate": 1.9884494923273742e-05, "loss": 0.7194, "step": 22435 }, { "epoch": 0.72, "learning_rate": 1.9884325577902262e-05, "loss": 0.7506, "step": 22440 }, { "epoch": 0.72, "learning_rate": 1.988415610920277e-05, "loss": 0.731, "step": 22445 }, { "epoch": 0.72, "learning_rate": 1.9883986517177382e-05, "loss": 0.7321, "step": 22450 }, { "epoch": 0.72, "learning_rate": 1.9883816801828216e-05, "loss": 0.7339, "step": 22455 }, { "epoch": 0.72, "learning_rate": 1.988364696315739e-05, "loss": 0.7262, "step": 22460 }, { "epoch": 0.72, "learning_rate": 1.9883477001167012e-05, "loss": 0.7422, "step": 22465 }, { "epoch": 0.72, "learning_rate": 1.988330691585922e-05, "loss": 0.732, "step": 22470 }, { "epoch": 0.72, "learning_rate": 1.9883136707236127e-05, "loss": 0.7321, "step": 22475 }, { "epoch": 0.72, "learning_rate": 1.9882966375299854e-05, "loss": 0.7416, "step": 22480 }, { "epoch": 0.72, "learning_rate": 1.9882795920052532e-05, "loss": 0.749, "step": 22485 }, { "epoch": 0.72, "learning_rate": 1.9882625341496285e-05, "loss": 0.7347, "step": 22490 }, { "epoch": 0.72, "learning_rate": 1.988245463963324e-05, "loss": 0.7553, "step": 22495 }, { "epoch": 0.72, "learning_rate": 1.988228381446553e-05, "loss": 0.7413, "step": 22500 }, { "epoch": 0.72, "learning_rate": 1.9882112865995284e-05, "loss": 0.7365, "step": 22505 }, { "epoch": 0.72, "learning_rate": 1.9881941794224636e-05, "loss": 0.7411, "step": 22510 }, { "epoch": 0.72, "learning_rate": 1.9881770599155726e-05, "loss": 0.737, "step": 22515 }, { "epoch": 0.72, "learning_rate": 1.988159928079068e-05, "loss": 0.752, "step": 22520 }, { "epoch": 0.72, "learning_rate": 1.9881427839131637e-05, "loss": 0.7335, "step": 22525 }, { "epoch": 0.72, "learning_rate": 1.9881256274180745e-05, "loss": 0.7475, "step": 22530 }, { "epoch": 0.72, "learning_rate": 1.9881084585940135e-05, "loss": 0.7385, "step": 22535 }, { "epoch": 0.72, "learning_rate": 1.9880912774411955e-05, "loss": 0.7372, "step": 22540 }, { "epoch": 0.72, "learning_rate": 1.9880740839598346e-05, "loss": 0.7352, "step": 22545 }, { "epoch": 0.72, "learning_rate": 1.9880568781501454e-05, "loss": 0.7248, "step": 22550 }, { "epoch": 0.72, "learning_rate": 1.9880396600123425e-05, "loss": 0.7408, "step": 22555 }, { "epoch": 0.72, "learning_rate": 1.988022429546641e-05, "loss": 0.7553, "step": 22560 }, { "epoch": 0.72, "learning_rate": 1.9880051867532556e-05, "loss": 0.7317, "step": 22565 }, { "epoch": 0.72, "learning_rate": 1.9879879316324015e-05, "loss": 0.7316, "step": 22570 }, { "epoch": 0.72, "learning_rate": 1.987970664184294e-05, "loss": 0.7351, "step": 22575 }, { "epoch": 0.72, "learning_rate": 1.987953384409149e-05, "loss": 0.7291, "step": 22580 }, { "epoch": 0.72, "learning_rate": 1.9879360923071812e-05, "loss": 0.7223, "step": 22585 }, { "epoch": 0.72, "learning_rate": 1.9879187878786067e-05, "loss": 0.7425, "step": 22590 }, { "epoch": 0.72, "learning_rate": 1.987901471123642e-05, "loss": 0.7431, "step": 22595 }, { "epoch": 0.72, "learning_rate": 1.9878841420425023e-05, "loss": 0.7328, "step": 22600 }, { "epoch": 0.72, "learning_rate": 1.9878668006354044e-05, "loss": 0.7363, "step": 22605 }, { "epoch": 0.72, "learning_rate": 1.9878494469025646e-05, "loss": 0.7335, "step": 22610 }, { "epoch": 0.72, "learning_rate": 1.9878320808441994e-05, "loss": 0.7388, "step": 22615 }, { "epoch": 0.72, "learning_rate": 1.987814702460525e-05, "loss": 0.7355, "step": 22620 }, { "epoch": 0.72, "learning_rate": 1.987797311751759e-05, "loss": 0.7352, "step": 22625 }, { "epoch": 0.72, "learning_rate": 1.987779908718118e-05, "loss": 0.7416, "step": 22630 }, { "epoch": 0.72, "learning_rate": 1.987762493359819e-05, "loss": 0.7338, "step": 22635 }, { "epoch": 0.72, "learning_rate": 1.9877450656770794e-05, "loss": 0.7339, "step": 22640 }, { "epoch": 0.72, "learning_rate": 1.987727625670117e-05, "loss": 0.7248, "step": 22645 }, { "epoch": 0.72, "learning_rate": 1.987710173339149e-05, "loss": 0.7397, "step": 22650 }, { "epoch": 0.72, "learning_rate": 1.987692708684393e-05, "loss": 0.7482, "step": 22655 }, { "epoch": 0.73, "learning_rate": 1.9876752317060676e-05, "loss": 0.7455, "step": 22660 }, { "epoch": 0.73, "learning_rate": 1.98765774240439e-05, "loss": 0.762, "step": 22665 }, { "epoch": 0.73, "learning_rate": 1.987640240779579e-05, "loss": 0.7369, "step": 22670 }, { "epoch": 0.73, "learning_rate": 1.987622726831853e-05, "loss": 0.7299, "step": 22675 }, { "epoch": 0.73, "learning_rate": 1.98760520056143e-05, "loss": 0.7314, "step": 22680 }, { "epoch": 0.73, "learning_rate": 1.9875876619685294e-05, "loss": 0.7276, "step": 22685 }, { "epoch": 0.73, "learning_rate": 1.9875701110533693e-05, "loss": 0.7434, "step": 22690 }, { "epoch": 0.73, "learning_rate": 1.987552547816169e-05, "loss": 0.7272, "step": 22695 }, { "epoch": 0.73, "learning_rate": 1.987534972257148e-05, "loss": 0.7213, "step": 22700 }, { "epoch": 0.73, "learning_rate": 1.9875173843765252e-05, "loss": 0.7402, "step": 22705 }, { "epoch": 0.73, "learning_rate": 1.9874997841745202e-05, "loss": 0.7382, "step": 22710 }, { "epoch": 0.73, "learning_rate": 1.987482171651352e-05, "loss": 0.7446, "step": 22715 }, { "epoch": 0.73, "learning_rate": 1.9874645468072417e-05, "loss": 0.7345, "step": 22720 }, { "epoch": 0.73, "learning_rate": 1.9874469096424075e-05, "loss": 0.7389, "step": 22725 }, { "epoch": 0.73, "learning_rate": 1.987429260157071e-05, "loss": 0.7371, "step": 22730 }, { "epoch": 0.73, "learning_rate": 1.9874115983514513e-05, "loss": 0.7424, "step": 22735 }, { "epoch": 0.73, "learning_rate": 1.9873939242257694e-05, "loss": 0.7268, "step": 22740 }, { "epoch": 0.73, "learning_rate": 1.9873762377802453e-05, "loss": 0.7375, "step": 22745 }, { "epoch": 0.73, "learning_rate": 1.9873585390151003e-05, "loss": 0.7337, "step": 22750 }, { "epoch": 0.73, "learning_rate": 1.987340827930555e-05, "loss": 0.7388, "step": 22755 }, { "epoch": 0.73, "learning_rate": 1.9873231045268303e-05, "loss": 0.7341, "step": 22760 }, { "epoch": 0.73, "learning_rate": 1.9873053688041474e-05, "loss": 0.7263, "step": 22765 }, { "epoch": 0.73, "learning_rate": 1.9872876207627276e-05, "loss": 0.7549, "step": 22770 }, { "epoch": 0.73, "learning_rate": 1.9872698604027924e-05, "loss": 0.7168, "step": 22775 }, { "epoch": 0.73, "learning_rate": 1.9872520877245628e-05, "loss": 0.7477, "step": 22780 }, { "epoch": 0.73, "learning_rate": 1.9872343027282617e-05, "loss": 0.7286, "step": 22785 }, { "epoch": 0.73, "learning_rate": 1.98721650541411e-05, "loss": 0.7367, "step": 22790 }, { "epoch": 0.73, "learning_rate": 1.98719869578233e-05, "loss": 0.7403, "step": 22795 }, { "epoch": 0.73, "learning_rate": 1.987180873833144e-05, "loss": 0.7308, "step": 22800 }, { "epoch": 0.73, "learning_rate": 1.9871630395667748e-05, "loss": 0.733, "step": 22805 }, { "epoch": 0.73, "learning_rate": 1.9871451929834443e-05, "loss": 0.7312, "step": 22810 }, { "epoch": 0.73, "learning_rate": 1.9871273340833752e-05, "loss": 0.7434, "step": 22815 }, { "epoch": 0.73, "learning_rate": 1.9871094628667905e-05, "loss": 0.7418, "step": 22820 }, { "epoch": 0.73, "learning_rate": 1.9870915793339137e-05, "loss": 0.7237, "step": 22825 }, { "epoch": 0.73, "learning_rate": 1.987073683484967e-05, "loss": 0.7344, "step": 22830 }, { "epoch": 0.73, "learning_rate": 1.9870557753201742e-05, "loss": 0.74, "step": 22835 }, { "epoch": 0.73, "learning_rate": 1.9870378548397585e-05, "loss": 0.7391, "step": 22840 }, { "epoch": 0.73, "learning_rate": 1.9870199220439442e-05, "loss": 0.7389, "step": 22845 }, { "epoch": 0.73, "learning_rate": 1.987001976932954e-05, "loss": 0.7268, "step": 22850 }, { "epoch": 0.73, "learning_rate": 1.9869840195070126e-05, "loss": 0.7376, "step": 22855 }, { "epoch": 0.73, "learning_rate": 1.9869660497663435e-05, "loss": 0.7411, "step": 22860 }, { "epoch": 0.73, "learning_rate": 1.9869480677111713e-05, "loss": 0.7225, "step": 22865 }, { "epoch": 0.73, "learning_rate": 1.9869300733417206e-05, "loss": 0.7406, "step": 22870 }, { "epoch": 0.73, "learning_rate": 1.9869120666582153e-05, "loss": 0.7297, "step": 22875 }, { "epoch": 0.73, "learning_rate": 1.9868940476608802e-05, "loss": 0.7318, "step": 22880 }, { "epoch": 0.73, "learning_rate": 1.9868760163499405e-05, "loss": 0.7396, "step": 22885 }, { "epoch": 0.73, "learning_rate": 1.9868579727256208e-05, "loss": 0.7269, "step": 22890 }, { "epoch": 0.73, "learning_rate": 1.986839916788146e-05, "loss": 0.7407, "step": 22895 }, { "epoch": 0.73, "learning_rate": 1.9868218485377424e-05, "loss": 0.7422, "step": 22900 }, { "epoch": 0.73, "learning_rate": 1.9868037679746347e-05, "loss": 0.7348, "step": 22905 }, { "epoch": 0.73, "learning_rate": 1.9867856750990483e-05, "loss": 0.7299, "step": 22910 }, { "epoch": 0.73, "learning_rate": 1.9867675699112095e-05, "loss": 0.733, "step": 22915 }, { "epoch": 0.73, "learning_rate": 1.9867494524113436e-05, "loss": 0.7428, "step": 22920 }, { "epoch": 0.73, "learning_rate": 1.9867313225996773e-05, "loss": 0.7427, "step": 22925 }, { "epoch": 0.73, "learning_rate": 1.9867131804764366e-05, "loss": 0.7314, "step": 22930 }, { "epoch": 0.73, "learning_rate": 1.9866950260418475e-05, "loss": 0.7192, "step": 22935 }, { "epoch": 0.73, "learning_rate": 1.9866768592961366e-05, "loss": 0.7274, "step": 22940 }, { "epoch": 0.73, "learning_rate": 1.9866586802395313e-05, "loss": 0.7452, "step": 22945 }, { "epoch": 0.73, "learning_rate": 1.9866404888722575e-05, "loss": 0.7245, "step": 22950 }, { "epoch": 0.73, "learning_rate": 1.986622285194543e-05, "loss": 0.7313, "step": 22955 }, { "epoch": 0.73, "learning_rate": 1.9866040692066137e-05, "loss": 0.7285, "step": 22960 }, { "epoch": 0.73, "learning_rate": 1.9865858409086984e-05, "loss": 0.7407, "step": 22965 }, { "epoch": 0.74, "learning_rate": 1.9865676003010233e-05, "loss": 0.7259, "step": 22970 }, { "epoch": 0.74, "learning_rate": 1.9865493473838168e-05, "loss": 0.7279, "step": 22975 }, { "epoch": 0.74, "learning_rate": 1.9865310821573063e-05, "loss": 0.7427, "step": 22980 }, { "epoch": 0.74, "learning_rate": 1.9865128046217195e-05, "loss": 0.7392, "step": 22985 }, { "epoch": 0.74, "learning_rate": 1.986494514777285e-05, "loss": 0.7402, "step": 22990 }, { "epoch": 0.74, "learning_rate": 1.98647621262423e-05, "loss": 0.7414, "step": 22995 }, { "epoch": 0.74, "learning_rate": 1.9864578981627844e-05, "loss": 0.7378, "step": 23000 }, { "epoch": 0.74, "learning_rate": 1.9864395713931754e-05, "loss": 0.7275, "step": 23005 }, { "epoch": 0.74, "learning_rate": 1.9864212323156322e-05, "loss": 0.7377, "step": 23010 }, { "epoch": 0.74, "learning_rate": 1.9864028809303838e-05, "loss": 0.7419, "step": 23015 }, { "epoch": 0.74, "learning_rate": 1.9863845172376586e-05, "loss": 0.7546, "step": 23020 }, { "epoch": 0.74, "learning_rate": 1.986366141237686e-05, "loss": 0.7394, "step": 23025 }, { "epoch": 0.74, "learning_rate": 1.9863477529306956e-05, "loss": 0.7151, "step": 23030 }, { "epoch": 0.74, "learning_rate": 1.9863293523169162e-05, "loss": 0.725, "step": 23035 }, { "epoch": 0.74, "learning_rate": 1.9863109393965782e-05, "loss": 0.7434, "step": 23040 }, { "epoch": 0.74, "learning_rate": 1.9862925141699106e-05, "loss": 0.7545, "step": 23045 }, { "epoch": 0.74, "learning_rate": 1.9862740766371434e-05, "loss": 0.7446, "step": 23050 }, { "epoch": 0.74, "learning_rate": 1.986255626798507e-05, "loss": 0.7247, "step": 23055 }, { "epoch": 0.74, "learning_rate": 1.9862371646542314e-05, "loss": 0.7348, "step": 23060 }, { "epoch": 0.74, "learning_rate": 1.986218690204547e-05, "loss": 0.7357, "step": 23065 }, { "epoch": 0.74, "learning_rate": 1.9862002034496846e-05, "loss": 0.7409, "step": 23070 }, { "epoch": 0.74, "learning_rate": 1.9861817043898743e-05, "loss": 0.7297, "step": 23075 }, { "epoch": 0.74, "learning_rate": 1.9861631930253468e-05, "loss": 0.7367, "step": 23080 }, { "epoch": 0.74, "learning_rate": 1.986144669356334e-05, "loss": 0.7444, "step": 23085 }, { "epoch": 0.74, "learning_rate": 1.9861261333830662e-05, "loss": 0.7532, "step": 23090 }, { "epoch": 0.74, "learning_rate": 1.9861075851057747e-05, "loss": 0.7471, "step": 23095 }, { "epoch": 0.74, "learning_rate": 1.9860890245246915e-05, "loss": 0.7361, "step": 23100 }, { "epoch": 0.74, "learning_rate": 1.986070451640048e-05, "loss": 0.7359, "step": 23105 }, { "epoch": 0.74, "learning_rate": 1.9860518664520752e-05, "loss": 0.7309, "step": 23110 }, { "epoch": 0.74, "learning_rate": 1.986033268961006e-05, "loss": 0.7426, "step": 23115 }, { "epoch": 0.74, "learning_rate": 1.9860146591670717e-05, "loss": 0.7241, "step": 23120 }, { "epoch": 0.74, "learning_rate": 1.985996037070505e-05, "loss": 0.7322, "step": 23125 }, { "epoch": 0.74, "learning_rate": 1.985977402671538e-05, "loss": 0.7338, "step": 23130 }, { "epoch": 0.74, "learning_rate": 1.9859587559704033e-05, "loss": 0.7236, "step": 23135 }, { "epoch": 0.74, "learning_rate": 1.9859400969673338e-05, "loss": 0.7234, "step": 23140 }, { "epoch": 0.74, "learning_rate": 1.9859214256625616e-05, "loss": 0.7372, "step": 23145 }, { "epoch": 0.74, "learning_rate": 1.9859027420563203e-05, "loss": 0.7377, "step": 23150 }, { "epoch": 0.74, "learning_rate": 1.9858840461488425e-05, "loss": 0.7324, "step": 23155 }, { "epoch": 0.74, "learning_rate": 1.9858653379403623e-05, "loss": 0.7277, "step": 23160 }, { "epoch": 0.74, "learning_rate": 1.985846617431112e-05, "loss": 0.7281, "step": 23165 }, { "epoch": 0.74, "learning_rate": 1.9858278846213266e-05, "loss": 0.7304, "step": 23170 }, { "epoch": 0.74, "learning_rate": 1.9858091395112383e-05, "loss": 0.7322, "step": 23175 }, { "epoch": 0.74, "learning_rate": 1.985790382101082e-05, "loss": 0.7301, "step": 23180 }, { "epoch": 0.74, "learning_rate": 1.9857716123910913e-05, "loss": 0.7442, "step": 23185 }, { "epoch": 0.74, "learning_rate": 1.9857528303815008e-05, "loss": 0.7227, "step": 23190 }, { "epoch": 0.74, "learning_rate": 1.9857340360725447e-05, "loss": 0.7389, "step": 23195 }, { "epoch": 0.74, "learning_rate": 1.9857152294644567e-05, "loss": 0.7135, "step": 23200 }, { "epoch": 0.74, "learning_rate": 1.9856964105574727e-05, "loss": 0.7364, "step": 23205 }, { "epoch": 0.74, "learning_rate": 1.9856775793518267e-05, "loss": 0.7145, "step": 23210 }, { "epoch": 0.74, "learning_rate": 1.985658735847754e-05, "loss": 0.7239, "step": 23215 }, { "epoch": 0.74, "learning_rate": 1.9856398800454893e-05, "loss": 0.7353, "step": 23220 }, { "epoch": 0.74, "learning_rate": 1.9856210119452685e-05, "loss": 0.7284, "step": 23225 }, { "epoch": 0.74, "learning_rate": 1.9856021315473266e-05, "loss": 0.7482, "step": 23230 }, { "epoch": 0.74, "learning_rate": 1.9855832388518995e-05, "loss": 0.7383, "step": 23235 }, { "epoch": 0.74, "learning_rate": 1.9855643338592223e-05, "loss": 0.7322, "step": 23240 }, { "epoch": 0.74, "learning_rate": 1.9855454165695315e-05, "loss": 0.74, "step": 23245 }, { "epoch": 0.74, "learning_rate": 1.985526486983063e-05, "loss": 0.72, "step": 23250 }, { "epoch": 0.74, "learning_rate": 1.985507545100053e-05, "loss": 0.7229, "step": 23255 }, { "epoch": 0.74, "learning_rate": 1.9854885909207372e-05, "loss": 0.7239, "step": 23260 }, { "epoch": 0.74, "learning_rate": 1.985469624445353e-05, "loss": 0.7278, "step": 23265 }, { "epoch": 0.74, "learning_rate": 1.9854506456741366e-05, "loss": 0.7367, "step": 23270 }, { "epoch": 0.74, "learning_rate": 1.985431654607325e-05, "loss": 0.736, "step": 23275 }, { "epoch": 0.74, "learning_rate": 1.985412651245155e-05, "loss": 0.7341, "step": 23280 }, { "epoch": 0.75, "learning_rate": 1.9853936355878635e-05, "loss": 0.7357, "step": 23285 }, { "epoch": 0.75, "learning_rate": 1.9853746076356878e-05, "loss": 0.7429, "step": 23290 }, { "epoch": 0.75, "learning_rate": 1.985355567388866e-05, "loss": 0.7394, "step": 23295 }, { "epoch": 0.75, "learning_rate": 1.985336514847635e-05, "loss": 0.7319, "step": 23300 }, { "epoch": 0.75, "learning_rate": 1.985317450012233e-05, "loss": 0.7371, "step": 23305 }, { "epoch": 0.75, "learning_rate": 1.9852983728828972e-05, "loss": 0.7366, "step": 23310 }, { "epoch": 0.75, "learning_rate": 1.985279283459866e-05, "loss": 0.7307, "step": 23315 }, { "epoch": 0.75, "learning_rate": 1.9852601817433777e-05, "loss": 0.7248, "step": 23320 }, { "epoch": 0.75, "learning_rate": 1.9852410677336707e-05, "loss": 0.7244, "step": 23325 }, { "epoch": 0.75, "learning_rate": 1.9852219414309833e-05, "loss": 0.732, "step": 23330 }, { "epoch": 0.75, "learning_rate": 1.9852028028355538e-05, "loss": 0.7417, "step": 23335 }, { "epoch": 0.75, "learning_rate": 1.9851836519476217e-05, "loss": 0.735, "step": 23340 }, { "epoch": 0.75, "learning_rate": 1.9851644887674254e-05, "loss": 0.7374, "step": 23345 }, { "epoch": 0.75, "learning_rate": 1.9851453132952042e-05, "loss": 0.7262, "step": 23350 }, { "epoch": 0.75, "learning_rate": 1.9851261255311974e-05, "loss": 0.7089, "step": 23355 }, { "epoch": 0.75, "learning_rate": 1.9851069254756444e-05, "loss": 0.7319, "step": 23360 }, { "epoch": 0.75, "learning_rate": 1.9850877131287844e-05, "loss": 0.731, "step": 23365 }, { "epoch": 0.75, "learning_rate": 1.9850684884908577e-05, "loss": 0.7409, "step": 23370 }, { "epoch": 0.75, "learning_rate": 1.9850492515621038e-05, "loss": 0.7355, "step": 23375 }, { "epoch": 0.75, "learning_rate": 1.9850300023427632e-05, "loss": 0.7363, "step": 23380 }, { "epoch": 0.75, "learning_rate": 1.9850107408330752e-05, "loss": 0.722, "step": 23385 }, { "epoch": 0.75, "learning_rate": 1.9849914670332807e-05, "loss": 0.7396, "step": 23390 }, { "epoch": 0.75, "learning_rate": 1.9849721809436202e-05, "loss": 0.73, "step": 23395 }, { "epoch": 0.75, "learning_rate": 1.9849528825643346e-05, "loss": 0.7283, "step": 23400 }, { "epoch": 0.75, "learning_rate": 1.9849335718956638e-05, "loss": 0.7281, "step": 23405 }, { "epoch": 0.75, "learning_rate": 1.9849142489378494e-05, "loss": 0.7252, "step": 23410 }, { "epoch": 0.75, "learning_rate": 1.9848949136911325e-05, "loss": 0.7277, "step": 23415 }, { "epoch": 0.75, "learning_rate": 1.9848755661557542e-05, "loss": 0.7457, "step": 23420 }, { "epoch": 0.75, "learning_rate": 1.984856206331956e-05, "loss": 0.739, "step": 23425 }, { "epoch": 0.75, "learning_rate": 1.984836834219979e-05, "loss": 0.7445, "step": 23430 }, { "epoch": 0.75, "learning_rate": 1.9848174498200656e-05, "loss": 0.7234, "step": 23435 }, { "epoch": 0.75, "learning_rate": 1.9847980531324573e-05, "loss": 0.7361, "step": 23440 }, { "epoch": 0.75, "learning_rate": 1.984778644157396e-05, "loss": 0.7365, "step": 23445 }, { "epoch": 0.75, "learning_rate": 1.984759222895124e-05, "loss": 0.7351, "step": 23450 }, { "epoch": 0.75, "learning_rate": 1.984739789345884e-05, "loss": 0.7112, "step": 23455 }, { "epoch": 0.75, "learning_rate": 1.9847203435099182e-05, "loss": 0.7287, "step": 23460 }, { "epoch": 0.75, "learning_rate": 1.9847008853874687e-05, "loss": 0.7191, "step": 23465 }, { "epoch": 0.75, "learning_rate": 1.984681414978779e-05, "loss": 0.7248, "step": 23470 }, { "epoch": 0.75, "learning_rate": 1.9846619322840915e-05, "loss": 0.7421, "step": 23475 }, { "epoch": 0.75, "learning_rate": 1.98464243730365e-05, "loss": 0.7302, "step": 23480 }, { "epoch": 0.75, "learning_rate": 1.9846229300376968e-05, "loss": 0.7388, "step": 23485 }, { "epoch": 0.75, "learning_rate": 1.984603410486476e-05, "loss": 0.7329, "step": 23490 }, { "epoch": 0.75, "learning_rate": 1.9845838786502312e-05, "loss": 0.722, "step": 23495 }, { "epoch": 0.75, "learning_rate": 1.9845643345292055e-05, "loss": 0.7307, "step": 23500 }, { "epoch": 0.75, "learning_rate": 1.984544778123643e-05, "loss": 0.7173, "step": 23505 }, { "epoch": 0.75, "learning_rate": 1.9845252094337884e-05, "loss": 0.7229, "step": 23510 }, { "epoch": 0.75, "learning_rate": 1.9845056284598846e-05, "loss": 0.7303, "step": 23515 }, { "epoch": 0.75, "learning_rate": 1.9844860352021768e-05, "loss": 0.7287, "step": 23520 }, { "epoch": 0.75, "learning_rate": 1.9844664296609096e-05, "loss": 0.7452, "step": 23525 }, { "epoch": 0.75, "learning_rate": 1.9844468118363268e-05, "loss": 0.7311, "step": 23530 }, { "epoch": 0.75, "learning_rate": 1.984427181728674e-05, "loss": 0.7295, "step": 23535 }, { "epoch": 0.75, "learning_rate": 1.9844075393381955e-05, "loss": 0.724, "step": 23540 }, { "epoch": 0.75, "learning_rate": 1.9843878846651367e-05, "loss": 0.7262, "step": 23545 }, { "epoch": 0.75, "learning_rate": 1.9843682177097427e-05, "loss": 0.7343, "step": 23550 }, { "epoch": 0.75, "learning_rate": 1.984348538472259e-05, "loss": 0.7339, "step": 23555 }, { "epoch": 0.75, "learning_rate": 1.9843288469529313e-05, "loss": 0.7332, "step": 23560 }, { "epoch": 0.75, "learning_rate": 1.9843091431520053e-05, "loss": 0.7311, "step": 23565 }, { "epoch": 0.75, "learning_rate": 1.984289427069726e-05, "loss": 0.734, "step": 23570 }, { "epoch": 0.75, "learning_rate": 1.9842696987063402e-05, "loss": 0.7287, "step": 23575 }, { "epoch": 0.75, "learning_rate": 1.9842499580620945e-05, "loss": 0.7295, "step": 23580 }, { "epoch": 0.75, "learning_rate": 1.9842302051372342e-05, "loss": 0.7305, "step": 23585 }, { "epoch": 0.75, "learning_rate": 1.984210439932006e-05, "loss": 0.7328, "step": 23590 }, { "epoch": 0.76, "learning_rate": 1.984190662446657e-05, "loss": 0.7246, "step": 23595 }, { "epoch": 0.76, "learning_rate": 1.9841708726814336e-05, "loss": 0.7302, "step": 23600 }, { "epoch": 0.76, "learning_rate": 1.9841510706365824e-05, "loss": 0.7306, "step": 23605 }, { "epoch": 0.76, "learning_rate": 1.984131256312351e-05, "loss": 0.732, "step": 23610 }, { "epoch": 0.76, "learning_rate": 1.9841114297089868e-05, "loss": 0.7377, "step": 23615 }, { "epoch": 0.76, "learning_rate": 1.9840915908267367e-05, "loss": 0.7272, "step": 23620 }, { "epoch": 0.76, "learning_rate": 1.9840717396658483e-05, "loss": 0.7272, "step": 23625 }, { "epoch": 0.76, "learning_rate": 1.9840518762265695e-05, "loss": 0.7339, "step": 23630 }, { "epoch": 0.76, "learning_rate": 1.984032000509148e-05, "loss": 0.7385, "step": 23635 }, { "epoch": 0.76, "learning_rate": 1.9840121125138317e-05, "loss": 0.7266, "step": 23640 }, { "epoch": 0.76, "learning_rate": 1.9839922122408688e-05, "loss": 0.7471, "step": 23645 }, { "epoch": 0.76, "learning_rate": 1.9839722996905076e-05, "loss": 0.7169, "step": 23650 }, { "epoch": 0.76, "learning_rate": 1.9839523748629967e-05, "loss": 0.7369, "step": 23655 }, { "epoch": 0.76, "learning_rate": 1.9839324377585845e-05, "loss": 0.7259, "step": 23660 }, { "epoch": 0.76, "learning_rate": 1.98391248837752e-05, "loss": 0.7256, "step": 23665 }, { "epoch": 0.76, "learning_rate": 1.9838925267200517e-05, "loss": 0.731, "step": 23670 }, { "epoch": 0.76, "learning_rate": 1.983872552786429e-05, "loss": 0.7374, "step": 23675 }, { "epoch": 0.76, "learning_rate": 1.9838525665769013e-05, "loss": 0.7307, "step": 23680 }, { "epoch": 0.76, "learning_rate": 1.9838325680917177e-05, "loss": 0.733, "step": 23685 }, { "epoch": 0.76, "learning_rate": 1.9838125573311276e-05, "loss": 0.7294, "step": 23690 }, { "epoch": 0.76, "learning_rate": 1.9837925342953808e-05, "loss": 0.7277, "step": 23695 }, { "epoch": 0.76, "learning_rate": 1.983772498984727e-05, "loss": 0.7152, "step": 23700 }, { "epoch": 0.76, "learning_rate": 1.9837524513994165e-05, "loss": 0.74, "step": 23705 }, { "epoch": 0.76, "learning_rate": 1.9837323915396994e-05, "loss": 0.7278, "step": 23710 }, { "epoch": 0.76, "learning_rate": 1.9837123194058257e-05, "loss": 0.7226, "step": 23715 }, { "epoch": 0.76, "learning_rate": 1.983692234998046e-05, "loss": 0.7283, "step": 23720 }, { "epoch": 0.76, "learning_rate": 1.983672138316611e-05, "loss": 0.7174, "step": 23725 }, { "epoch": 0.76, "learning_rate": 1.983652029361771e-05, "loss": 0.7212, "step": 23730 }, { "epoch": 0.76, "learning_rate": 1.9836319081337776e-05, "loss": 0.7294, "step": 23735 }, { "epoch": 0.76, "learning_rate": 1.9836117746328815e-05, "loss": 0.722, "step": 23740 }, { "epoch": 0.76, "learning_rate": 1.983591628859334e-05, "loss": 0.7319, "step": 23745 }, { "epoch": 0.76, "learning_rate": 1.983571470813386e-05, "loss": 0.7327, "step": 23750 }, { "epoch": 0.76, "learning_rate": 1.9835513004952895e-05, "loss": 0.7356, "step": 23755 }, { "epoch": 0.76, "learning_rate": 1.9835311179052963e-05, "loss": 0.735, "step": 23760 }, { "epoch": 0.76, "learning_rate": 1.9835109230436578e-05, "loss": 0.7339, "step": 23765 }, { "epoch": 0.76, "learning_rate": 1.9834907159106264e-05, "loss": 0.7256, "step": 23770 }, { "epoch": 0.76, "learning_rate": 1.9834704965064535e-05, "loss": 0.7319, "step": 23775 }, { "epoch": 0.76, "learning_rate": 1.983450264831392e-05, "loss": 0.7345, "step": 23780 }, { "epoch": 0.76, "learning_rate": 1.9834300208856943e-05, "loss": 0.7329, "step": 23785 }, { "epoch": 0.76, "learning_rate": 1.9834097646696125e-05, "loss": 0.736, "step": 23790 }, { "epoch": 0.76, "learning_rate": 1.9833894961834003e-05, "loss": 0.7148, "step": 23795 }, { "epoch": 0.76, "learning_rate": 1.9833692154273097e-05, "loss": 0.7292, "step": 23800 }, { "epoch": 0.76, "learning_rate": 1.9833489224015944e-05, "loss": 0.7269, "step": 23805 }, { "epoch": 0.76, "learning_rate": 1.9833286171065067e-05, "loss": 0.7207, "step": 23810 }, { "epoch": 0.76, "learning_rate": 1.983308299542301e-05, "loss": 0.7147, "step": 23815 }, { "epoch": 0.76, "learning_rate": 1.9832879697092297e-05, "loss": 0.7183, "step": 23820 }, { "epoch": 0.76, "learning_rate": 1.9832676276075476e-05, "loss": 0.7508, "step": 23825 }, { "epoch": 0.76, "learning_rate": 1.9832472732375078e-05, "loss": 0.7316, "step": 23830 }, { "epoch": 0.76, "learning_rate": 1.9832269065993643e-05, "loss": 0.7206, "step": 23835 }, { "epoch": 0.76, "learning_rate": 1.9832065276933716e-05, "loss": 0.7305, "step": 23840 }, { "epoch": 0.76, "learning_rate": 1.9831861365197834e-05, "loss": 0.7215, "step": 23845 }, { "epoch": 0.76, "learning_rate": 1.983165733078855e-05, "loss": 0.7265, "step": 23850 }, { "epoch": 0.76, "learning_rate": 1.9831453173708398e-05, "loss": 0.7326, "step": 23855 }, { "epoch": 0.76, "learning_rate": 1.9831248893959937e-05, "loss": 0.7289, "step": 23860 }, { "epoch": 0.76, "learning_rate": 1.983104449154571e-05, "loss": 0.73, "step": 23865 }, { "epoch": 0.76, "learning_rate": 1.9830839966468262e-05, "loss": 0.7316, "step": 23870 }, { "epoch": 0.76, "learning_rate": 1.9830635318730155e-05, "loss": 0.7308, "step": 23875 }, { "epoch": 0.76, "learning_rate": 1.983043054833394e-05, "loss": 0.728, "step": 23880 }, { "epoch": 0.76, "learning_rate": 1.9830225655282164e-05, "loss": 0.7221, "step": 23885 }, { "epoch": 0.76, "learning_rate": 1.9830020639577397e-05, "loss": 0.7317, "step": 23890 }, { "epoch": 0.76, "learning_rate": 1.9829815501222184e-05, "loss": 0.7328, "step": 23895 }, { "epoch": 0.76, "learning_rate": 1.982961024021909e-05, "loss": 0.7305, "step": 23900 }, { "epoch": 0.76, "learning_rate": 1.982940485657068e-05, "loss": 0.7318, "step": 23905 }, { "epoch": 0.77, "learning_rate": 1.982919935027951e-05, "loss": 0.7376, "step": 23910 }, { "epoch": 0.77, "learning_rate": 1.9828993721348146e-05, "loss": 0.7381, "step": 23915 }, { "epoch": 0.77, "learning_rate": 1.982878796977915e-05, "loss": 0.736, "step": 23920 }, { "epoch": 0.77, "learning_rate": 1.9828582095575104e-05, "loss": 0.7373, "step": 23925 }, { "epoch": 0.77, "learning_rate": 1.982837609873856e-05, "loss": 0.7325, "step": 23930 }, { "epoch": 0.77, "learning_rate": 1.9828169979272096e-05, "loss": 0.7319, "step": 23935 }, { "epoch": 0.77, "learning_rate": 1.9827963737178282e-05, "loss": 0.7268, "step": 23940 }, { "epoch": 0.77, "learning_rate": 1.9827757372459695e-05, "loss": 0.7394, "step": 23945 }, { "epoch": 0.77, "learning_rate": 1.9827550885118902e-05, "loss": 0.7353, "step": 23950 }, { "epoch": 0.77, "learning_rate": 1.9827344275158486e-05, "loss": 0.7279, "step": 23955 }, { "epoch": 0.77, "learning_rate": 1.9827137542581022e-05, "loss": 0.7338, "step": 23960 }, { "epoch": 0.77, "learning_rate": 1.9826930687389094e-05, "loss": 0.7236, "step": 23965 }, { "epoch": 0.77, "learning_rate": 1.9826723709585274e-05, "loss": 0.7292, "step": 23970 }, { "epoch": 0.77, "learning_rate": 1.982651660917215e-05, "loss": 0.7223, "step": 23975 }, { "epoch": 0.77, "learning_rate": 1.982630938615231e-05, "loss": 0.7318, "step": 23980 }, { "epoch": 0.77, "learning_rate": 1.9826102040528333e-05, "loss": 0.7232, "step": 23985 }, { "epoch": 0.77, "learning_rate": 1.9825894572302808e-05, "loss": 0.7331, "step": 23990 }, { "epoch": 0.77, "learning_rate": 1.9825686981478324e-05, "loss": 0.7398, "step": 23995 }, { "epoch": 0.77, "learning_rate": 1.982547926805747e-05, "loss": 0.728, "step": 24000 }, { "epoch": 0.77, "learning_rate": 1.9825271432042838e-05, "loss": 0.7241, "step": 24005 }, { "epoch": 0.77, "learning_rate": 1.9825063473437024e-05, "loss": 0.7336, "step": 24010 }, { "epoch": 0.77, "learning_rate": 1.9824855392242622e-05, "loss": 0.7336, "step": 24015 }, { "epoch": 0.77, "learning_rate": 1.9824647188462224e-05, "loss": 0.7115, "step": 24020 }, { "epoch": 0.77, "learning_rate": 1.9824438862098435e-05, "loss": 0.729, "step": 24025 }, { "epoch": 0.77, "learning_rate": 1.9824230413153843e-05, "loss": 0.7295, "step": 24030 }, { "epoch": 0.77, "learning_rate": 1.9824021841631062e-05, "loss": 0.738, "step": 24035 }, { "epoch": 0.77, "learning_rate": 1.9823813147532686e-05, "loss": 0.7152, "step": 24040 }, { "epoch": 0.77, "learning_rate": 1.982360433086132e-05, "loss": 0.7457, "step": 24045 }, { "epoch": 0.77, "learning_rate": 1.9823395391619575e-05, "loss": 0.7193, "step": 24050 }, { "epoch": 0.77, "learning_rate": 1.982318632981005e-05, "loss": 0.7186, "step": 24055 }, { "epoch": 0.77, "learning_rate": 1.9822977145435357e-05, "loss": 0.7187, "step": 24060 }, { "epoch": 0.77, "learning_rate": 1.9822767838498107e-05, "loss": 0.7342, "step": 24065 }, { "epoch": 0.77, "learning_rate": 1.9822558409000908e-05, "loss": 0.709, "step": 24070 }, { "epoch": 0.77, "learning_rate": 1.982234885694638e-05, "loss": 0.7281, "step": 24075 }, { "epoch": 0.77, "learning_rate": 1.982213918233713e-05, "loss": 0.7366, "step": 24080 }, { "epoch": 0.77, "learning_rate": 1.982192938517578e-05, "loss": 0.7384, "step": 24085 }, { "epoch": 0.77, "learning_rate": 1.9821719465464942e-05, "loss": 0.7323, "step": 24090 }, { "epoch": 0.77, "learning_rate": 1.982150942320724e-05, "loss": 0.7202, "step": 24095 }, { "epoch": 0.77, "learning_rate": 1.9821299258405297e-05, "loss": 0.7261, "step": 24100 }, { "epoch": 0.77, "learning_rate": 1.9821088971061725e-05, "loss": 0.7334, "step": 24105 }, { "epoch": 0.77, "learning_rate": 1.9820878561179157e-05, "loss": 0.7267, "step": 24110 }, { "epoch": 0.77, "learning_rate": 1.9820668028760215e-05, "loss": 0.7191, "step": 24115 }, { "epoch": 0.77, "learning_rate": 1.9820457373807525e-05, "loss": 0.7301, "step": 24120 }, { "epoch": 0.77, "learning_rate": 1.982024659632372e-05, "loss": 0.726, "step": 24125 }, { "epoch": 0.77, "learning_rate": 1.9820035696311423e-05, "loss": 0.725, "step": 24130 }, { "epoch": 0.77, "learning_rate": 1.981982467377327e-05, "loss": 0.7304, "step": 24135 }, { "epoch": 0.77, "learning_rate": 1.9819613528711896e-05, "loss": 0.7251, "step": 24140 }, { "epoch": 0.77, "learning_rate": 1.9819402261129928e-05, "loss": 0.7216, "step": 24145 }, { "epoch": 0.77, "learning_rate": 1.9819190871030005e-05, "loss": 0.7225, "step": 24150 }, { "epoch": 0.77, "learning_rate": 1.981897935841477e-05, "loss": 0.7254, "step": 24155 }, { "epoch": 0.77, "learning_rate": 1.9818767723286855e-05, "loss": 0.7277, "step": 24160 }, { "epoch": 0.77, "learning_rate": 1.9818555965648907e-05, "loss": 0.7143, "step": 24165 }, { "epoch": 0.77, "learning_rate": 1.981834408550356e-05, "loss": 0.7208, "step": 24170 }, { "epoch": 0.77, "learning_rate": 1.9818132082853466e-05, "loss": 0.7178, "step": 24175 }, { "epoch": 0.77, "learning_rate": 1.981791995770127e-05, "loss": 0.7289, "step": 24180 }, { "epoch": 0.77, "learning_rate": 1.981770771004961e-05, "loss": 0.7271, "step": 24185 }, { "epoch": 0.77, "learning_rate": 1.981749533990114e-05, "loss": 0.7216, "step": 24190 }, { "epoch": 0.77, "learning_rate": 1.9817282847258507e-05, "loss": 0.7305, "step": 24195 }, { "epoch": 0.77, "learning_rate": 1.981707023212437e-05, "loss": 0.7222, "step": 24200 }, { "epoch": 0.77, "learning_rate": 1.9816857494501374e-05, "loss": 0.7192, "step": 24205 }, { "epoch": 0.77, "learning_rate": 1.9816644634392173e-05, "loss": 0.7183, "step": 24210 }, { "epoch": 0.77, "learning_rate": 1.981643165179943e-05, "loss": 0.7284, "step": 24215 }, { "epoch": 0.78, "learning_rate": 1.9816218546725796e-05, "loss": 0.7232, "step": 24220 }, { "epoch": 0.78, "learning_rate": 1.9816005319173932e-05, "loss": 0.7154, "step": 24225 }, { "epoch": 0.78, "learning_rate": 1.9815791969146495e-05, "loss": 0.7223, "step": 24230 }, { "epoch": 0.78, "learning_rate": 1.9815578496646158e-05, "loss": 0.7233, "step": 24235 }, { "epoch": 0.78, "learning_rate": 1.9815364901675573e-05, "loss": 0.7298, "step": 24240 }, { "epoch": 0.78, "learning_rate": 1.9815151184237407e-05, "loss": 0.7278, "step": 24245 }, { "epoch": 0.78, "learning_rate": 1.981493734433433e-05, "loss": 0.749, "step": 24250 }, { "epoch": 0.78, "learning_rate": 1.981472338196901e-05, "loss": 0.7455, "step": 24255 }, { "epoch": 0.78, "learning_rate": 1.9814509297144114e-05, "loss": 0.7256, "step": 24260 }, { "epoch": 0.78, "learning_rate": 1.9814295089862316e-05, "loss": 0.7281, "step": 24265 }, { "epoch": 0.78, "learning_rate": 1.9814080760126285e-05, "loss": 0.7142, "step": 24270 }, { "epoch": 0.78, "learning_rate": 1.98138663079387e-05, "loss": 0.7326, "step": 24275 }, { "epoch": 0.78, "learning_rate": 1.9813651733302232e-05, "loss": 0.7188, "step": 24280 }, { "epoch": 0.78, "learning_rate": 1.9813437036219563e-05, "loss": 0.7339, "step": 24285 }, { "epoch": 0.78, "learning_rate": 1.9813222216693365e-05, "loss": 0.7191, "step": 24290 }, { "epoch": 0.78, "learning_rate": 1.9813007274726325e-05, "loss": 0.7274, "step": 24295 }, { "epoch": 0.78, "learning_rate": 1.9812792210321123e-05, "loss": 0.7322, "step": 24300 }, { "epoch": 0.78, "learning_rate": 1.9812577023480442e-05, "loss": 0.7389, "step": 24305 }, { "epoch": 0.78, "learning_rate": 1.9812361714206963e-05, "loss": 0.7266, "step": 24310 }, { "epoch": 0.78, "learning_rate": 1.9812146282503383e-05, "loss": 0.7298, "step": 24315 }, { "epoch": 0.78, "learning_rate": 1.981193072837238e-05, "loss": 0.7233, "step": 24320 }, { "epoch": 0.78, "learning_rate": 1.9811715051816644e-05, "loss": 0.7312, "step": 24325 }, { "epoch": 0.78, "learning_rate": 1.9811499252838873e-05, "loss": 0.7203, "step": 24330 }, { "epoch": 0.78, "learning_rate": 1.981128333144175e-05, "loss": 0.7252, "step": 24335 }, { "epoch": 0.78, "learning_rate": 1.9811067287627978e-05, "loss": 0.726, "step": 24340 }, { "epoch": 0.78, "learning_rate": 1.9810851121400248e-05, "loss": 0.7169, "step": 24345 }, { "epoch": 0.78, "learning_rate": 1.9810634832761258e-05, "loss": 0.7223, "step": 24350 }, { "epoch": 0.78, "learning_rate": 1.9810418421713708e-05, "loss": 0.716, "step": 24355 }, { "epoch": 0.78, "learning_rate": 1.9810201888260295e-05, "loss": 0.7222, "step": 24360 }, { "epoch": 0.78, "learning_rate": 1.9809985232403727e-05, "loss": 0.7243, "step": 24365 }, { "epoch": 0.78, "learning_rate": 1.9809768454146697e-05, "loss": 0.7323, "step": 24370 }, { "epoch": 0.78, "learning_rate": 1.9809551553491918e-05, "loss": 0.7194, "step": 24375 }, { "epoch": 0.78, "learning_rate": 1.980933453044209e-05, "loss": 0.7041, "step": 24380 }, { "epoch": 0.78, "learning_rate": 1.980911738499993e-05, "loss": 0.7282, "step": 24385 }, { "epoch": 0.78, "learning_rate": 1.9808900117168142e-05, "loss": 0.7218, "step": 24390 }, { "epoch": 0.78, "learning_rate": 1.9808682726949435e-05, "loss": 0.7241, "step": 24395 }, { "epoch": 0.78, "learning_rate": 1.9808465214346525e-05, "loss": 0.7245, "step": 24400 }, { "epoch": 0.78, "learning_rate": 1.9808247579362123e-05, "loss": 0.7286, "step": 24405 }, { "epoch": 0.78, "learning_rate": 1.9808029821998946e-05, "loss": 0.7271, "step": 24410 }, { "epoch": 0.78, "learning_rate": 1.980781194225971e-05, "loss": 0.7094, "step": 24415 }, { "epoch": 0.78, "learning_rate": 1.9807593940147138e-05, "loss": 0.7228, "step": 24420 }, { "epoch": 0.78, "learning_rate": 1.9807375815663944e-05, "loss": 0.7295, "step": 24425 }, { "epoch": 0.78, "learning_rate": 1.9807157568812848e-05, "loss": 0.7227, "step": 24430 }, { "epoch": 0.78, "learning_rate": 1.980693919959658e-05, "loss": 0.7277, "step": 24435 }, { "epoch": 0.78, "learning_rate": 1.9806720708017862e-05, "loss": 0.724, "step": 24440 }, { "epoch": 0.78, "learning_rate": 1.980650209407942e-05, "loss": 0.7264, "step": 24445 }, { "epoch": 0.78, "learning_rate": 1.980628335778398e-05, "loss": 0.7223, "step": 24450 }, { "epoch": 0.78, "learning_rate": 1.9806064499134274e-05, "loss": 0.7282, "step": 24455 }, { "epoch": 0.78, "learning_rate": 1.980584551813303e-05, "loss": 0.7335, "step": 24460 }, { "epoch": 0.78, "learning_rate": 1.9805626414782985e-05, "loss": 0.7238, "step": 24465 }, { "epoch": 0.78, "learning_rate": 1.9805407189086866e-05, "loss": 0.725, "step": 24470 }, { "epoch": 0.78, "learning_rate": 1.9805187841047412e-05, "loss": 0.7244, "step": 24475 }, { "epoch": 0.78, "learning_rate": 1.980496837066736e-05, "loss": 0.7163, "step": 24480 }, { "epoch": 0.78, "learning_rate": 1.980474877794945e-05, "loss": 0.7206, "step": 24485 }, { "epoch": 0.78, "learning_rate": 1.9804529062896417e-05, "loss": 0.7304, "step": 24490 }, { "epoch": 0.78, "learning_rate": 1.9804309225511003e-05, "loss": 0.7234, "step": 24495 }, { "epoch": 0.78, "learning_rate": 1.980408926579596e-05, "loss": 0.7284, "step": 24500 }, { "epoch": 0.78, "learning_rate": 1.980386918375402e-05, "loss": 0.7283, "step": 24505 }, { "epoch": 0.78, "learning_rate": 1.9803648979387936e-05, "loss": 0.7242, "step": 24510 }, { "epoch": 0.78, "learning_rate": 1.9803428652700452e-05, "loss": 0.7252, "step": 24515 }, { "epoch": 0.78, "learning_rate": 1.9803208203694323e-05, "loss": 0.714, "step": 24520 }, { "epoch": 0.78, "learning_rate": 1.9802987632372296e-05, "loss": 0.7245, "step": 24525 }, { "epoch": 0.78, "learning_rate": 1.9802766938737118e-05, "loss": 0.7318, "step": 24530 }, { "epoch": 0.79, "learning_rate": 1.9802546122791552e-05, "loss": 0.7227, "step": 24535 }, { "epoch": 0.79, "learning_rate": 1.9802325184538345e-05, "loss": 0.7249, "step": 24540 }, { "epoch": 0.79, "learning_rate": 1.9802104123980262e-05, "loss": 0.7334, "step": 24545 }, { "epoch": 0.79, "learning_rate": 1.980188294112005e-05, "loss": 0.719, "step": 24550 }, { "epoch": 0.79, "learning_rate": 1.9801661635960482e-05, "loss": 0.7042, "step": 24555 }, { "epoch": 0.79, "learning_rate": 1.980144020850431e-05, "loss": 0.7134, "step": 24560 }, { "epoch": 0.79, "learning_rate": 1.9801218658754296e-05, "loss": 0.7194, "step": 24565 }, { "epoch": 0.79, "learning_rate": 1.980099698671321e-05, "loss": 0.7281, "step": 24570 }, { "epoch": 0.79, "learning_rate": 1.980077519238382e-05, "loss": 0.7175, "step": 24575 }, { "epoch": 0.79, "learning_rate": 1.9800553275768882e-05, "loss": 0.7055, "step": 24580 }, { "epoch": 0.79, "learning_rate": 1.9800331236871174e-05, "loss": 0.729, "step": 24585 }, { "epoch": 0.79, "learning_rate": 1.9800109075693465e-05, "loss": 0.7287, "step": 24590 }, { "epoch": 0.79, "learning_rate": 1.9799886792238523e-05, "loss": 0.7184, "step": 24595 }, { "epoch": 0.79, "learning_rate": 1.9799664386509127e-05, "loss": 0.7204, "step": 24600 }, { "epoch": 0.79, "learning_rate": 1.979944185850805e-05, "loss": 0.7258, "step": 24605 }, { "epoch": 0.79, "learning_rate": 1.9799219208238063e-05, "loss": 0.7309, "step": 24610 }, { "epoch": 0.79, "learning_rate": 1.9798996435701954e-05, "loss": 0.7351, "step": 24615 }, { "epoch": 0.79, "learning_rate": 1.9798773540902494e-05, "loss": 0.7255, "step": 24620 }, { "epoch": 0.79, "learning_rate": 1.979855052384247e-05, "loss": 0.7322, "step": 24625 }, { "epoch": 0.79, "learning_rate": 1.979832738452466e-05, "loss": 0.7216, "step": 24630 }, { "epoch": 0.79, "learning_rate": 1.9798104122951854e-05, "loss": 0.714, "step": 24635 }, { "epoch": 0.79, "learning_rate": 1.9797880739126833e-05, "loss": 0.7124, "step": 24640 }, { "epoch": 0.79, "learning_rate": 1.9797657233052382e-05, "loss": 0.7248, "step": 24645 }, { "epoch": 0.79, "learning_rate": 1.9797433604731297e-05, "loss": 0.7328, "step": 24650 }, { "epoch": 0.79, "learning_rate": 1.979720985416636e-05, "loss": 0.7216, "step": 24655 }, { "epoch": 0.79, "learning_rate": 1.9796985981360368e-05, "loss": 0.7191, "step": 24660 }, { "epoch": 0.79, "learning_rate": 1.9796761986316114e-05, "loss": 0.7241, "step": 24665 }, { "epoch": 0.79, "learning_rate": 1.979653786903639e-05, "loss": 0.7298, "step": 24670 }, { "epoch": 0.79, "learning_rate": 1.9796313629524e-05, "loss": 0.7132, "step": 24675 }, { "epoch": 0.79, "learning_rate": 1.9796089267781733e-05, "loss": 0.7138, "step": 24680 }, { "epoch": 0.79, "learning_rate": 1.979586478381239e-05, "loss": 0.7203, "step": 24685 }, { "epoch": 0.79, "learning_rate": 1.9795640177618777e-05, "loss": 0.7336, "step": 24690 }, { "epoch": 0.79, "learning_rate": 1.9795415449203688e-05, "loss": 0.7229, "step": 24695 }, { "epoch": 0.79, "learning_rate": 1.9795190598569936e-05, "loss": 0.7269, "step": 24700 }, { "epoch": 0.79, "learning_rate": 1.9794965625720318e-05, "loss": 0.7182, "step": 24705 }, { "epoch": 0.79, "learning_rate": 1.979474053065765e-05, "loss": 0.7339, "step": 24710 }, { "epoch": 0.79, "learning_rate": 1.9794515313384734e-05, "loss": 0.7137, "step": 24715 }, { "epoch": 0.79, "learning_rate": 1.9794289973904382e-05, "loss": 0.7248, "step": 24720 }, { "epoch": 0.79, "learning_rate": 1.979406451221941e-05, "loss": 0.7297, "step": 24725 }, { "epoch": 0.79, "learning_rate": 1.979383892833262e-05, "loss": 0.7206, "step": 24730 }, { "epoch": 0.79, "learning_rate": 1.9793613222246838e-05, "loss": 0.7334, "step": 24735 }, { "epoch": 0.79, "learning_rate": 1.9793387393964873e-05, "loss": 0.7194, "step": 24740 }, { "epoch": 0.79, "learning_rate": 1.9793161443489547e-05, "loss": 0.7238, "step": 24745 }, { "epoch": 0.79, "learning_rate": 1.9792935370823676e-05, "loss": 0.7201, "step": 24750 }, { "epoch": 0.79, "learning_rate": 1.979270917597008e-05, "loss": 0.7341, "step": 24755 }, { "epoch": 0.79, "learning_rate": 1.9792482858931586e-05, "loss": 0.7276, "step": 24760 }, { "epoch": 0.79, "learning_rate": 1.979225641971102e-05, "loss": 0.7258, "step": 24765 }, { "epoch": 0.79, "learning_rate": 1.9792029858311193e-05, "loss": 0.7286, "step": 24770 }, { "epoch": 0.79, "learning_rate": 1.9791803174734946e-05, "loss": 0.7297, "step": 24775 }, { "epoch": 0.79, "learning_rate": 1.9791576368985102e-05, "loss": 0.7122, "step": 24780 }, { "epoch": 0.79, "learning_rate": 1.9791349441064495e-05, "loss": 0.7112, "step": 24785 }, { "epoch": 0.79, "learning_rate": 1.979112239097595e-05, "loss": 0.7254, "step": 24790 }, { "epoch": 0.79, "learning_rate": 1.9790895218722305e-05, "loss": 0.7348, "step": 24795 }, { "epoch": 0.79, "learning_rate": 1.979066792430639e-05, "loss": 0.7162, "step": 24800 }, { "epoch": 0.79, "learning_rate": 1.9790440507731046e-05, "loss": 0.7231, "step": 24805 }, { "epoch": 0.79, "learning_rate": 1.9790212968999104e-05, "loss": 0.7204, "step": 24810 }, { "epoch": 0.79, "learning_rate": 1.978998530811341e-05, "loss": 0.7307, "step": 24815 }, { "epoch": 0.79, "learning_rate": 1.9789757525076802e-05, "loss": 0.7196, "step": 24820 }, { "epoch": 0.79, "learning_rate": 1.978952961989212e-05, "loss": 0.718, "step": 24825 }, { "epoch": 0.79, "learning_rate": 1.978930159256221e-05, "loss": 0.7262, "step": 24830 }, { "epoch": 0.79, "learning_rate": 1.9789073443089914e-05, "loss": 0.7253, "step": 24835 }, { "epoch": 0.79, "learning_rate": 1.9788845171478082e-05, "loss": 0.7256, "step": 24840 }, { "epoch": 0.8, "learning_rate": 1.9788616777729565e-05, "loss": 0.733, "step": 24845 }, { "epoch": 0.8, "learning_rate": 1.9788388261847204e-05, "loss": 0.7234, "step": 24850 }, { "epoch": 0.8, "learning_rate": 1.9788159623833856e-05, "loss": 0.7084, "step": 24855 }, { "epoch": 0.8, "learning_rate": 1.9787930863692374e-05, "loss": 0.7158, "step": 24860 }, { "epoch": 0.8, "learning_rate": 1.978770198142561e-05, "loss": 0.7288, "step": 24865 }, { "epoch": 0.8, "learning_rate": 1.978747297703642e-05, "loss": 0.7243, "step": 24870 }, { "epoch": 0.8, "learning_rate": 1.9787243850527663e-05, "loss": 0.7176, "step": 24875 }, { "epoch": 0.8, "learning_rate": 1.97870146019022e-05, "loss": 0.7227, "step": 24880 }, { "epoch": 0.8, "learning_rate": 1.9786785231162885e-05, "loss": 0.7164, "step": 24885 }, { "epoch": 0.8, "learning_rate": 1.9786555738312584e-05, "loss": 0.7098, "step": 24890 }, { "epoch": 0.8, "learning_rate": 1.9786326123354162e-05, "loss": 0.717, "step": 24895 }, { "epoch": 0.8, "learning_rate": 1.978609638629048e-05, "loss": 0.7234, "step": 24900 }, { "epoch": 0.8, "learning_rate": 1.9785866527124405e-05, "loss": 0.7275, "step": 24905 }, { "epoch": 0.8, "learning_rate": 1.9785636545858807e-05, "loss": 0.7273, "step": 24910 }, { "epoch": 0.8, "learning_rate": 1.9785406442496553e-05, "loss": 0.724, "step": 24915 }, { "epoch": 0.8, "learning_rate": 1.9785176217040516e-05, "loss": 0.7179, "step": 24920 }, { "epoch": 0.8, "learning_rate": 1.9784945869493568e-05, "loss": 0.7189, "step": 24925 }, { "epoch": 0.8, "learning_rate": 1.9784715399858587e-05, "loss": 0.7296, "step": 24930 }, { "epoch": 0.8, "learning_rate": 1.978448480813844e-05, "loss": 0.7116, "step": 24935 }, { "epoch": 0.8, "learning_rate": 1.978425409433601e-05, "loss": 0.7279, "step": 24940 }, { "epoch": 0.8, "learning_rate": 1.9784023258454176e-05, "loss": 0.7318, "step": 24945 }, { "epoch": 0.8, "learning_rate": 1.9783792300495817e-05, "loss": 0.7295, "step": 24950 }, { "epoch": 0.8, "learning_rate": 1.9783561220463813e-05, "loss": 0.7301, "step": 24955 }, { "epoch": 0.8, "learning_rate": 1.978333001836105e-05, "loss": 0.7178, "step": 24960 }, { "epoch": 0.8, "learning_rate": 1.9783098694190414e-05, "loss": 0.715, "step": 24965 }, { "epoch": 0.8, "learning_rate": 1.9782867247954783e-05, "loss": 0.7102, "step": 24970 }, { "epoch": 0.8, "learning_rate": 1.9782635679657053e-05, "loss": 0.7227, "step": 24975 }, { "epoch": 0.8, "learning_rate": 1.978240398930011e-05, "loss": 0.7278, "step": 24980 }, { "epoch": 0.8, "learning_rate": 1.9782172176886848e-05, "loss": 0.7247, "step": 24985 }, { "epoch": 0.8, "learning_rate": 1.9781940242420156e-05, "loss": 0.7358, "step": 24990 }, { "epoch": 0.8, "learning_rate": 1.9781708185902925e-05, "loss": 0.7253, "step": 24995 }, { "epoch": 0.8, "learning_rate": 1.9781476007338058e-05, "loss": 0.72, "step": 25000 }, { "epoch": 0.8, "learning_rate": 1.978124370672845e-05, "loss": 0.7065, "step": 25005 }, { "epoch": 0.8, "learning_rate": 1.978101128407699e-05, "loss": 0.7275, "step": 25010 }, { "epoch": 0.8, "learning_rate": 1.978077873938659e-05, "loss": 0.7278, "step": 25015 }, { "epoch": 0.8, "learning_rate": 1.978054607266015e-05, "loss": 0.7216, "step": 25020 }, { "epoch": 0.8, "learning_rate": 1.9780313283900568e-05, "loss": 0.7178, "step": 25025 }, { "epoch": 0.8, "learning_rate": 1.978008037311075e-05, "loss": 0.7196, "step": 25030 }, { "epoch": 0.8, "learning_rate": 1.9779847340293605e-05, "loss": 0.727, "step": 25035 }, { "epoch": 0.8, "learning_rate": 1.9779614185452034e-05, "loss": 0.7242, "step": 25040 }, { "epoch": 0.8, "learning_rate": 1.9779380908588954e-05, "loss": 0.7126, "step": 25045 }, { "epoch": 0.8, "learning_rate": 1.9779147509707267e-05, "loss": 0.7237, "step": 25050 }, { "epoch": 0.8, "learning_rate": 1.9778913988809895e-05, "loss": 0.7226, "step": 25055 }, { "epoch": 0.8, "learning_rate": 1.9778680345899744e-05, "loss": 0.7212, "step": 25060 }, { "epoch": 0.8, "learning_rate": 1.9778446580979735e-05, "loss": 0.7286, "step": 25065 }, { "epoch": 0.8, "learning_rate": 1.977821269405278e-05, "loss": 0.7134, "step": 25070 }, { "epoch": 0.8, "learning_rate": 1.97779786851218e-05, "loss": 0.7286, "step": 25075 }, { "epoch": 0.8, "learning_rate": 1.9777744554189713e-05, "loss": 0.7195, "step": 25080 }, { "epoch": 0.8, "learning_rate": 1.9777510301259437e-05, "loss": 0.7198, "step": 25085 }, { "epoch": 0.8, "learning_rate": 1.9777275926333903e-05, "loss": 0.7191, "step": 25090 }, { "epoch": 0.8, "learning_rate": 1.9777041429416034e-05, "loss": 0.729, "step": 25095 }, { "epoch": 0.8, "learning_rate": 1.9776806810508748e-05, "loss": 0.7165, "step": 25100 }, { "epoch": 0.8, "learning_rate": 1.9776572069614978e-05, "loss": 0.7196, "step": 25105 }, { "epoch": 0.8, "learning_rate": 1.9776337206737653e-05, "loss": 0.7269, "step": 25110 }, { "epoch": 0.8, "learning_rate": 1.9776102221879702e-05, "loss": 0.7413, "step": 25115 }, { "epoch": 0.8, "learning_rate": 1.9775867115044057e-05, "loss": 0.7156, "step": 25120 }, { "epoch": 0.8, "learning_rate": 1.9775631886233655e-05, "loss": 0.7235, "step": 25125 }, { "epoch": 0.8, "learning_rate": 1.9775396535451423e-05, "loss": 0.7209, "step": 25130 }, { "epoch": 0.8, "learning_rate": 1.9775161062700306e-05, "loss": 0.7263, "step": 25135 }, { "epoch": 0.8, "learning_rate": 1.9774925467983238e-05, "loss": 0.7235, "step": 25140 }, { "epoch": 0.8, "learning_rate": 1.977468975130316e-05, "loss": 0.7205, "step": 25145 }, { "epoch": 0.8, "learning_rate": 1.977445391266301e-05, "loss": 0.7076, "step": 25150 }, { "epoch": 0.8, "learning_rate": 1.9774217952065735e-05, "loss": 0.7106, "step": 25155 }, { "epoch": 0.81, "learning_rate": 1.9773981869514274e-05, "loss": 0.7171, "step": 25160 }, { "epoch": 0.81, "learning_rate": 1.9773745665011577e-05, "loss": 0.7249, "step": 25165 }, { "epoch": 0.81, "learning_rate": 1.977350933856059e-05, "loss": 0.7157, "step": 25170 }, { "epoch": 0.81, "learning_rate": 1.9773272890164264e-05, "loss": 0.7215, "step": 25175 }, { "epoch": 0.81, "learning_rate": 1.9773036319825543e-05, "loss": 0.7205, "step": 25180 }, { "epoch": 0.81, "learning_rate": 1.9772799627547383e-05, "loss": 0.7233, "step": 25185 }, { "epoch": 0.81, "learning_rate": 1.9772562813332736e-05, "loss": 0.7384, "step": 25190 }, { "epoch": 0.81, "learning_rate": 1.9772325877184558e-05, "loss": 0.7239, "step": 25195 }, { "epoch": 0.81, "learning_rate": 1.9772088819105804e-05, "loss": 0.714, "step": 25200 }, { "epoch": 0.81, "learning_rate": 1.9771851639099432e-05, "loss": 0.7327, "step": 25205 }, { "epoch": 0.81, "learning_rate": 1.9771614337168404e-05, "loss": 0.7293, "step": 25210 }, { "epoch": 0.81, "learning_rate": 1.9771376913315677e-05, "loss": 0.7346, "step": 25215 }, { "epoch": 0.81, "learning_rate": 1.9771139367544212e-05, "loss": 0.7217, "step": 25220 }, { "epoch": 0.81, "learning_rate": 1.9770901699856978e-05, "loss": 0.721, "step": 25225 }, { "epoch": 0.81, "learning_rate": 1.977066391025694e-05, "loss": 0.7212, "step": 25230 }, { "epoch": 0.81, "learning_rate": 1.977042599874706e-05, "loss": 0.7216, "step": 25235 }, { "epoch": 0.81, "learning_rate": 1.977018796533031e-05, "loss": 0.713, "step": 25240 }, { "epoch": 0.81, "learning_rate": 1.976994981000966e-05, "loss": 0.7287, "step": 25245 }, { "epoch": 0.81, "learning_rate": 1.9769711532788083e-05, "loss": 0.7189, "step": 25250 }, { "epoch": 0.81, "learning_rate": 1.976947313366855e-05, "loss": 0.7122, "step": 25255 }, { "epoch": 0.81, "learning_rate": 1.976923461265403e-05, "loss": 0.7238, "step": 25260 }, { "epoch": 0.81, "learning_rate": 1.9768995969747513e-05, "loss": 0.7196, "step": 25265 }, { "epoch": 0.81, "learning_rate": 1.976875720495196e-05, "loss": 0.7225, "step": 25270 }, { "epoch": 0.81, "learning_rate": 1.976851831827036e-05, "loss": 0.7267, "step": 25275 }, { "epoch": 0.81, "learning_rate": 1.97682793097057e-05, "loss": 0.7299, "step": 25280 }, { "epoch": 0.81, "learning_rate": 1.9768040179260944e-05, "loss": 0.7266, "step": 25285 }, { "epoch": 0.81, "learning_rate": 1.976780092693909e-05, "loss": 0.7055, "step": 25290 }, { "epoch": 0.81, "learning_rate": 1.9767561552743117e-05, "loss": 0.7121, "step": 25295 }, { "epoch": 0.81, "learning_rate": 1.9767322056676018e-05, "loss": 0.7269, "step": 25300 }, { "epoch": 0.81, "learning_rate": 1.9767082438740776e-05, "loss": 0.7321, "step": 25305 }, { "epoch": 0.81, "learning_rate": 1.9766842698940377e-05, "loss": 0.7167, "step": 25310 }, { "epoch": 0.81, "learning_rate": 1.9766602837277818e-05, "loss": 0.7099, "step": 25315 }, { "epoch": 0.81, "learning_rate": 1.9766362853756092e-05, "loss": 0.7216, "step": 25320 }, { "epoch": 0.81, "learning_rate": 1.976612274837819e-05, "loss": 0.7357, "step": 25325 }, { "epoch": 0.81, "learning_rate": 1.9765882521147115e-05, "loss": 0.7271, "step": 25330 }, { "epoch": 0.81, "learning_rate": 1.9765642172065857e-05, "loss": 0.718, "step": 25335 }, { "epoch": 0.81, "learning_rate": 1.9765401701137416e-05, "loss": 0.7129, "step": 25340 }, { "epoch": 0.81, "learning_rate": 1.976516110836479e-05, "loss": 0.7196, "step": 25345 }, { "epoch": 0.81, "learning_rate": 1.976492039375099e-05, "loss": 0.7189, "step": 25350 }, { "epoch": 0.81, "learning_rate": 1.9764679557299005e-05, "loss": 0.7248, "step": 25355 }, { "epoch": 0.81, "learning_rate": 1.976443859901186e-05, "loss": 0.7178, "step": 25360 }, { "epoch": 0.81, "learning_rate": 1.9764197518892544e-05, "loss": 0.7318, "step": 25365 }, { "epoch": 0.81, "learning_rate": 1.9763956316944068e-05, "loss": 0.7097, "step": 25370 }, { "epoch": 0.81, "learning_rate": 1.976371499316945e-05, "loss": 0.72, "step": 25375 }, { "epoch": 0.81, "learning_rate": 1.9763473547571693e-05, "loss": 0.7177, "step": 25380 }, { "epoch": 0.81, "learning_rate": 1.9763231980153813e-05, "loss": 0.7302, "step": 25385 }, { "epoch": 0.81, "learning_rate": 1.9762990290918825e-05, "loss": 0.7062, "step": 25390 }, { "epoch": 0.81, "learning_rate": 1.976274847986974e-05, "loss": 0.7214, "step": 25395 }, { "epoch": 0.81, "learning_rate": 1.976250654700958e-05, "loss": 0.7086, "step": 25400 }, { "epoch": 0.81, "learning_rate": 1.976226449234136e-05, "loss": 0.7134, "step": 25405 }, { "epoch": 0.81, "learning_rate": 1.97620223158681e-05, "loss": 0.7186, "step": 25410 }, { "epoch": 0.81, "learning_rate": 1.9761780017592827e-05, "loss": 0.7185, "step": 25415 }, { "epoch": 0.81, "learning_rate": 1.9761537597518557e-05, "loss": 0.7308, "step": 25420 }, { "epoch": 0.81, "learning_rate": 1.9761295055648323e-05, "loss": 0.7089, "step": 25425 }, { "epoch": 0.81, "learning_rate": 1.9761052391985145e-05, "loss": 0.7085, "step": 25430 }, { "epoch": 0.81, "learning_rate": 1.9760809606532054e-05, "loss": 0.7211, "step": 25435 }, { "epoch": 0.81, "learning_rate": 1.976056669929207e-05, "loss": 0.7112, "step": 25440 }, { "epoch": 0.81, "learning_rate": 1.9760323670268238e-05, "loss": 0.725, "step": 25445 }, { "epoch": 0.81, "learning_rate": 1.976008051946358e-05, "loss": 0.7275, "step": 25450 }, { "epoch": 0.81, "learning_rate": 1.9759837246881134e-05, "loss": 0.7163, "step": 25455 }, { "epoch": 0.81, "learning_rate": 1.9759593852523937e-05, "loss": 0.7136, "step": 25460 }, { "epoch": 0.81, "learning_rate": 1.975935033639502e-05, "loss": 0.7054, "step": 25465 }, { "epoch": 0.82, "learning_rate": 1.975910669849743e-05, "loss": 0.7163, "step": 25470 }, { "epoch": 0.82, "learning_rate": 1.97588629388342e-05, "loss": 0.718, "step": 25475 }, { "epoch": 0.82, "learning_rate": 1.9758619057408372e-05, "loss": 0.7224, "step": 25480 }, { "epoch": 0.82, "learning_rate": 1.9758375054222992e-05, "loss": 0.7172, "step": 25485 }, { "epoch": 0.82, "learning_rate": 1.9758130929281102e-05, "loss": 0.7175, "step": 25490 }, { "epoch": 0.82, "learning_rate": 1.9757886682585744e-05, "loss": 0.7251, "step": 25495 }, { "epoch": 0.82, "learning_rate": 1.9757642314139977e-05, "loss": 0.7241, "step": 25500 }, { "epoch": 0.82, "learning_rate": 1.975739782394684e-05, "loss": 0.7185, "step": 25505 }, { "epoch": 0.82, "learning_rate": 1.9757153212009388e-05, "loss": 0.7185, "step": 25510 }, { "epoch": 0.82, "learning_rate": 1.975690847833067e-05, "loss": 0.7141, "step": 25515 }, { "epoch": 0.82, "learning_rate": 1.9756663622913744e-05, "loss": 0.7332, "step": 25520 }, { "epoch": 0.82, "learning_rate": 1.975641864576166e-05, "loss": 0.7026, "step": 25525 }, { "epoch": 0.82, "learning_rate": 1.975617354687748e-05, "loss": 0.7253, "step": 25530 }, { "epoch": 0.82, "learning_rate": 1.9755928326264255e-05, "loss": 0.7169, "step": 25535 }, { "epoch": 0.82, "learning_rate": 1.9755682983925054e-05, "loss": 0.7272, "step": 25540 }, { "epoch": 0.82, "learning_rate": 1.975543751986293e-05, "loss": 0.7206, "step": 25545 }, { "epoch": 0.82, "learning_rate": 1.975519193408095e-05, "loss": 0.7266, "step": 25550 }, { "epoch": 0.82, "learning_rate": 1.9754946226582176e-05, "loss": 0.7251, "step": 25555 }, { "epoch": 0.82, "learning_rate": 1.9754700397369674e-05, "loss": 0.7136, "step": 25560 }, { "epoch": 0.82, "learning_rate": 1.9754454446446512e-05, "loss": 0.7093, "step": 25565 }, { "epoch": 0.82, "learning_rate": 1.9754208373815758e-05, "loss": 0.7218, "step": 25570 }, { "epoch": 0.82, "learning_rate": 1.9753962179480485e-05, "loss": 0.7208, "step": 25575 }, { "epoch": 0.82, "learning_rate": 1.975371586344376e-05, "loss": 0.7129, "step": 25580 }, { "epoch": 0.82, "learning_rate": 1.975346942570866e-05, "loss": 0.7278, "step": 25585 }, { "epoch": 0.82, "learning_rate": 1.9753222866278264e-05, "loss": 0.7151, "step": 25590 }, { "epoch": 0.82, "learning_rate": 1.9752976185155635e-05, "loss": 0.7098, "step": 25595 }, { "epoch": 0.82, "learning_rate": 1.9752729382343866e-05, "loss": 0.7351, "step": 25600 }, { "epoch": 0.82, "learning_rate": 1.9752482457846026e-05, "loss": 0.6999, "step": 25605 }, { "epoch": 0.82, "learning_rate": 1.9752235411665198e-05, "loss": 0.7226, "step": 25610 }, { "epoch": 0.82, "learning_rate": 1.975198824380447e-05, "loss": 0.7221, "step": 25615 }, { "epoch": 0.82, "learning_rate": 1.975174095426692e-05, "loss": 0.706, "step": 25620 }, { "epoch": 0.82, "learning_rate": 1.9751493543055634e-05, "loss": 0.7156, "step": 25625 }, { "epoch": 0.82, "learning_rate": 1.97512460101737e-05, "loss": 0.7167, "step": 25630 }, { "epoch": 0.82, "learning_rate": 1.975099835562421e-05, "loss": 0.7097, "step": 25635 }, { "epoch": 0.82, "learning_rate": 1.975075057941025e-05, "loss": 0.7305, "step": 25640 }, { "epoch": 0.82, "learning_rate": 1.975050268153491e-05, "loss": 0.7228, "step": 25645 }, { "epoch": 0.82, "learning_rate": 1.9750254662001284e-05, "loss": 0.713, "step": 25650 }, { "epoch": 0.82, "learning_rate": 1.975000652081247e-05, "loss": 0.7103, "step": 25655 }, { "epoch": 0.82, "learning_rate": 1.9749758257971562e-05, "loss": 0.734, "step": 25660 }, { "epoch": 0.82, "learning_rate": 1.974950987348166e-05, "loss": 0.7157, "step": 25665 }, { "epoch": 0.82, "learning_rate": 1.9749261367345857e-05, "loss": 0.7144, "step": 25670 }, { "epoch": 0.82, "learning_rate": 1.9749012739567258e-05, "loss": 0.7229, "step": 25675 }, { "epoch": 0.82, "learning_rate": 1.9748763990148964e-05, "loss": 0.7178, "step": 25680 }, { "epoch": 0.82, "learning_rate": 1.9748515119094083e-05, "loss": 0.7212, "step": 25685 }, { "epoch": 0.82, "learning_rate": 1.9748266126405714e-05, "loss": 0.7145, "step": 25690 }, { "epoch": 0.82, "learning_rate": 1.9748017012086965e-05, "loss": 0.7102, "step": 25695 }, { "epoch": 0.82, "learning_rate": 1.974776777614095e-05, "loss": 0.7259, "step": 25700 }, { "epoch": 0.82, "learning_rate": 1.974751841857077e-05, "loss": 0.7203, "step": 25705 }, { "epoch": 0.82, "learning_rate": 1.974726893937954e-05, "loss": 0.7126, "step": 25710 }, { "epoch": 0.82, "learning_rate": 1.9747019338570373e-05, "loss": 0.7132, "step": 25715 }, { "epoch": 0.82, "learning_rate": 1.9746769616146383e-05, "loss": 0.7166, "step": 25720 }, { "epoch": 0.82, "learning_rate": 1.9746519772110688e-05, "loss": 0.7243, "step": 25725 }, { "epoch": 0.82, "learning_rate": 1.9746269806466404e-05, "loss": 0.7168, "step": 25730 }, { "epoch": 0.82, "learning_rate": 1.974601971921665e-05, "loss": 0.7238, "step": 25735 }, { "epoch": 0.82, "learning_rate": 1.9745769510364546e-05, "loss": 0.7247, "step": 25740 }, { "epoch": 0.82, "learning_rate": 1.9745519179913214e-05, "loss": 0.7097, "step": 25745 }, { "epoch": 0.82, "learning_rate": 1.9745268727865774e-05, "loss": 0.718, "step": 25750 }, { "epoch": 0.82, "learning_rate": 1.9745018154225354e-05, "loss": 0.7193, "step": 25755 }, { "epoch": 0.82, "learning_rate": 1.9744767458995083e-05, "loss": 0.7072, "step": 25760 }, { "epoch": 0.82, "learning_rate": 1.9744516642178087e-05, "loss": 0.7104, "step": 25765 }, { "epoch": 0.82, "learning_rate": 1.974426570377749e-05, "loss": 0.7034, "step": 25770 }, { "epoch": 0.82, "learning_rate": 1.9744014643796435e-05, "loss": 0.7174, "step": 25775 }, { "epoch": 0.82, "learning_rate": 1.9743763462238044e-05, "loss": 0.7205, "step": 25780 }, { "epoch": 0.83, "learning_rate": 1.9743512159105454e-05, "loss": 0.7052, "step": 25785 }, { "epoch": 0.83, "learning_rate": 1.97432607344018e-05, "loss": 0.7202, "step": 25790 }, { "epoch": 0.83, "learning_rate": 1.974300918813022e-05, "loss": 0.7215, "step": 25795 }, { "epoch": 0.83, "learning_rate": 1.9742757520293856e-05, "loss": 0.7116, "step": 25800 }, { "epoch": 0.83, "learning_rate": 1.9742505730895843e-05, "loss": 0.7114, "step": 25805 }, { "epoch": 0.83, "learning_rate": 1.974225381993932e-05, "loss": 0.7218, "step": 25810 }, { "epoch": 0.83, "learning_rate": 1.9742001787427443e-05, "loss": 0.7119, "step": 25815 }, { "epoch": 0.83, "learning_rate": 1.9741749633363342e-05, "loss": 0.7119, "step": 25820 }, { "epoch": 0.83, "learning_rate": 1.974149735775017e-05, "loss": 0.7101, "step": 25825 }, { "epoch": 0.83, "learning_rate": 1.9741244960591074e-05, "loss": 0.7113, "step": 25830 }, { "epoch": 0.83, "learning_rate": 1.9740992441889205e-05, "loss": 0.7234, "step": 25835 }, { "epoch": 0.83, "learning_rate": 1.974073980164771e-05, "loss": 0.7126, "step": 25840 }, { "epoch": 0.83, "learning_rate": 1.9740487039869746e-05, "loss": 0.708, "step": 25845 }, { "epoch": 0.83, "learning_rate": 1.9740234156558463e-05, "loss": 0.7133, "step": 25850 }, { "epoch": 0.83, "learning_rate": 1.9739981151717017e-05, "loss": 0.7053, "step": 25855 }, { "epoch": 0.83, "learning_rate": 1.9739728025348562e-05, "loss": 0.7104, "step": 25860 }, { "epoch": 0.83, "learning_rate": 1.9739474777456257e-05, "loss": 0.6985, "step": 25865 }, { "epoch": 0.83, "learning_rate": 1.973922140804327e-05, "loss": 0.7128, "step": 25870 }, { "epoch": 0.83, "learning_rate": 1.9738967917112752e-05, "loss": 0.723, "step": 25875 }, { "epoch": 0.83, "learning_rate": 1.9738714304667874e-05, "loss": 0.7216, "step": 25880 }, { "epoch": 0.83, "learning_rate": 1.9738460570711794e-05, "loss": 0.7094, "step": 25885 }, { "epoch": 0.83, "learning_rate": 1.9738206715247682e-05, "loss": 0.7269, "step": 25890 }, { "epoch": 0.83, "learning_rate": 1.97379527382787e-05, "loss": 0.711, "step": 25895 }, { "epoch": 0.83, "learning_rate": 1.9737698639808024e-05, "loss": 0.7184, "step": 25900 }, { "epoch": 0.83, "learning_rate": 1.973744441983882e-05, "loss": 0.7158, "step": 25905 }, { "epoch": 0.83, "learning_rate": 1.973719007837426e-05, "loss": 0.7135, "step": 25910 }, { "epoch": 0.83, "learning_rate": 1.9736935615417517e-05, "loss": 0.7241, "step": 25915 }, { "epoch": 0.83, "learning_rate": 1.973668103097177e-05, "loss": 0.7166, "step": 25920 }, { "epoch": 0.83, "learning_rate": 1.9736426325040194e-05, "loss": 0.7133, "step": 25925 }, { "epoch": 0.83, "learning_rate": 1.9736171497625968e-05, "loss": 0.7173, "step": 25930 }, { "epoch": 0.83, "learning_rate": 1.9735916548732262e-05, "loss": 0.7129, "step": 25935 }, { "epoch": 0.83, "learning_rate": 1.973566147836227e-05, "loss": 0.7097, "step": 25940 }, { "epoch": 0.83, "learning_rate": 1.9735406286519168e-05, "loss": 0.7121, "step": 25945 }, { "epoch": 0.83, "learning_rate": 1.973515097320614e-05, "loss": 0.712, "step": 25950 }, { "epoch": 0.83, "learning_rate": 1.9734895538426372e-05, "loss": 0.7166, "step": 25955 }, { "epoch": 0.83, "learning_rate": 1.9734639982183053e-05, "loss": 0.7173, "step": 25960 }, { "epoch": 0.83, "learning_rate": 1.9734384304479367e-05, "loss": 0.7183, "step": 25965 }, { "epoch": 0.83, "learning_rate": 1.9734128505318512e-05, "loss": 0.7229, "step": 25970 }, { "epoch": 0.83, "learning_rate": 1.9733872584703673e-05, "loss": 0.7094, "step": 25975 }, { "epoch": 0.83, "learning_rate": 1.9733616542638045e-05, "loss": 0.7229, "step": 25980 }, { "epoch": 0.83, "learning_rate": 1.9733360379124822e-05, "loss": 0.7059, "step": 25985 }, { "epoch": 0.83, "learning_rate": 1.9733104094167204e-05, "loss": 0.7267, "step": 25990 }, { "epoch": 0.83, "learning_rate": 1.9732847687768385e-05, "loss": 0.715, "step": 25995 }, { "epoch": 0.83, "learning_rate": 1.9732591159931564e-05, "loss": 0.7281, "step": 26000 }, { "epoch": 0.83, "learning_rate": 1.9732334510659942e-05, "loss": 0.7234, "step": 26005 }, { "epoch": 0.83, "learning_rate": 1.9732077739956725e-05, "loss": 0.7227, "step": 26010 }, { "epoch": 0.83, "learning_rate": 1.973182084782511e-05, "loss": 0.713, "step": 26015 }, { "epoch": 0.83, "learning_rate": 1.9731563834268308e-05, "loss": 0.7061, "step": 26020 }, { "epoch": 0.83, "learning_rate": 1.9731306699289522e-05, "loss": 0.7169, "step": 26025 }, { "epoch": 0.83, "learning_rate": 1.9731049442891965e-05, "loss": 0.7051, "step": 26030 }, { "epoch": 0.83, "learning_rate": 1.973079206507884e-05, "loss": 0.7237, "step": 26035 }, { "epoch": 0.83, "learning_rate": 1.9730534565853364e-05, "loss": 0.7268, "step": 26040 }, { "epoch": 0.83, "learning_rate": 1.973027694521875e-05, "loss": 0.7253, "step": 26045 }, { "epoch": 0.83, "learning_rate": 1.973001920317821e-05, "loss": 0.7119, "step": 26050 }, { "epoch": 0.83, "learning_rate": 1.972976133973496e-05, "loss": 0.7248, "step": 26055 }, { "epoch": 0.83, "learning_rate": 1.9729503354892215e-05, "loss": 0.707, "step": 26060 }, { "epoch": 0.83, "learning_rate": 1.97292452486532e-05, "loss": 0.7145, "step": 26065 }, { "epoch": 0.83, "learning_rate": 1.972898702102113e-05, "loss": 0.691, "step": 26070 }, { "epoch": 0.83, "learning_rate": 1.972872867199923e-05, "loss": 0.7114, "step": 26075 }, { "epoch": 0.83, "learning_rate": 1.9728470201590725e-05, "loss": 0.7066, "step": 26080 }, { "epoch": 0.83, "learning_rate": 1.9728211609798835e-05, "loss": 0.706, "step": 26085 }, { "epoch": 0.83, "learning_rate": 1.9727952896626788e-05, "loss": 0.7112, "step": 26090 }, { "epoch": 0.84, "learning_rate": 1.9727694062077813e-05, "loss": 0.7131, "step": 26095 }, { "epoch": 0.84, "learning_rate": 1.972743510615514e-05, "loss": 0.7141, "step": 26100 }, { "epoch": 0.84, "learning_rate": 1.9727176028862e-05, "loss": 0.7122, "step": 26105 }, { "epoch": 0.84, "learning_rate": 1.9726916830201626e-05, "loss": 0.7206, "step": 26110 }, { "epoch": 0.84, "learning_rate": 1.9726657510177246e-05, "loss": 0.7126, "step": 26115 }, { "epoch": 0.84, "learning_rate": 1.972639806879211e-05, "loss": 0.7035, "step": 26120 }, { "epoch": 0.84, "learning_rate": 1.9726138506049438e-05, "loss": 0.7141, "step": 26125 }, { "epoch": 0.84, "learning_rate": 1.9725878821952478e-05, "loss": 0.7073, "step": 26130 }, { "epoch": 0.84, "learning_rate": 1.9725619016504466e-05, "loss": 0.7022, "step": 26135 }, { "epoch": 0.84, "learning_rate": 1.972535908970865e-05, "loss": 0.7232, "step": 26140 }, { "epoch": 0.84, "learning_rate": 1.972509904156827e-05, "loss": 0.7103, "step": 26145 }, { "epoch": 0.84, "learning_rate": 1.9724838872086568e-05, "loss": 0.7149, "step": 26150 }, { "epoch": 0.84, "learning_rate": 1.9724578581266793e-05, "loss": 0.7188, "step": 26155 }, { "epoch": 0.84, "learning_rate": 1.9724318169112187e-05, "loss": 0.7136, "step": 26160 }, { "epoch": 0.84, "learning_rate": 1.9724057635626008e-05, "loss": 0.7275, "step": 26165 }, { "epoch": 0.84, "learning_rate": 1.9723796980811503e-05, "loss": 0.7032, "step": 26170 }, { "epoch": 0.84, "learning_rate": 1.9723536204671922e-05, "loss": 0.7073, "step": 26175 }, { "epoch": 0.84, "learning_rate": 1.972327530721052e-05, "loss": 0.7227, "step": 26180 }, { "epoch": 0.84, "learning_rate": 1.9723014288430557e-05, "loss": 0.7072, "step": 26185 }, { "epoch": 0.84, "learning_rate": 1.972275314833528e-05, "loss": 0.7012, "step": 26190 }, { "epoch": 0.84, "learning_rate": 1.972249188692796e-05, "loss": 0.7119, "step": 26195 }, { "epoch": 0.84, "learning_rate": 1.9722230504211843e-05, "loss": 0.7167, "step": 26200 }, { "epoch": 0.84, "learning_rate": 1.97219690001902e-05, "loss": 0.7065, "step": 26205 }, { "epoch": 0.84, "learning_rate": 1.972170737486629e-05, "loss": 0.7175, "step": 26210 }, { "epoch": 0.84, "learning_rate": 1.9721445628243375e-05, "loss": 0.7083, "step": 26215 }, { "epoch": 0.84, "learning_rate": 1.972118376032473e-05, "loss": 0.7112, "step": 26220 }, { "epoch": 0.84, "learning_rate": 1.972092177111361e-05, "loss": 0.7144, "step": 26225 }, { "epoch": 0.84, "learning_rate": 1.9720659660613298e-05, "loss": 0.7059, "step": 26230 }, { "epoch": 0.84, "learning_rate": 1.9720397428827052e-05, "loss": 0.7114, "step": 26235 }, { "epoch": 0.84, "learning_rate": 1.972013507575815e-05, "loss": 0.7076, "step": 26240 }, { "epoch": 0.84, "learning_rate": 1.9719872601409863e-05, "loss": 0.716, "step": 26245 }, { "epoch": 0.84, "learning_rate": 1.9719610005785466e-05, "loss": 0.7034, "step": 26250 }, { "epoch": 0.84, "learning_rate": 1.971934728888823e-05, "loss": 0.719, "step": 26255 }, { "epoch": 0.84, "learning_rate": 1.971908445072145e-05, "loss": 0.7179, "step": 26260 }, { "epoch": 0.84, "learning_rate": 1.9718821491288392e-05, "loss": 0.7065, "step": 26265 }, { "epoch": 0.84, "learning_rate": 1.9718558410592336e-05, "loss": 0.7042, "step": 26270 }, { "epoch": 0.84, "learning_rate": 1.971829520863657e-05, "loss": 0.7204, "step": 26275 }, { "epoch": 0.84, "learning_rate": 1.9718031885424378e-05, "loss": 0.7159, "step": 26280 }, { "epoch": 0.84, "learning_rate": 1.9717768440959042e-05, "loss": 0.7124, "step": 26285 }, { "epoch": 0.84, "learning_rate": 1.971750487524385e-05, "loss": 0.7193, "step": 26290 }, { "epoch": 0.84, "learning_rate": 1.9717241188282092e-05, "loss": 0.7173, "step": 26295 }, { "epoch": 0.84, "learning_rate": 1.9716977380077058e-05, "loss": 0.7115, "step": 26300 }, { "epoch": 0.84, "learning_rate": 1.971671345063204e-05, "loss": 0.7174, "step": 26305 }, { "epoch": 0.84, "learning_rate": 1.9716449399950327e-05, "loss": 0.7161, "step": 26310 }, { "epoch": 0.84, "learning_rate": 1.971618522803522e-05, "loss": 0.7121, "step": 26315 }, { "epoch": 0.84, "learning_rate": 1.9715920934890007e-05, "loss": 0.7117, "step": 26320 }, { "epoch": 0.84, "learning_rate": 1.9715656520517993e-05, "loss": 0.727, "step": 26325 }, { "epoch": 0.84, "learning_rate": 1.9715391984922474e-05, "loss": 0.7156, "step": 26330 }, { "epoch": 0.84, "learning_rate": 1.971512732810675e-05, "loss": 0.7107, "step": 26335 }, { "epoch": 0.84, "learning_rate": 1.971486255007413e-05, "loss": 0.7092, "step": 26340 }, { "epoch": 0.84, "learning_rate": 1.9714597650827903e-05, "loss": 0.7106, "step": 26345 }, { "epoch": 0.84, "learning_rate": 1.9714332630371385e-05, "loss": 0.7192, "step": 26350 }, { "epoch": 0.84, "learning_rate": 1.9714067488707888e-05, "loss": 0.7158, "step": 26355 }, { "epoch": 0.84, "learning_rate": 1.9713802225840705e-05, "loss": 0.7126, "step": 26360 }, { "epoch": 0.84, "learning_rate": 1.9713536841773156e-05, "loss": 0.703, "step": 26365 }, { "epoch": 0.84, "learning_rate": 1.9713271336508552e-05, "loss": 0.7093, "step": 26370 }, { "epoch": 0.84, "learning_rate": 1.9713005710050203e-05, "loss": 0.7107, "step": 26375 }, { "epoch": 0.84, "learning_rate": 1.9712739962401422e-05, "loss": 0.7114, "step": 26380 }, { "epoch": 0.84, "learning_rate": 1.9712474093565526e-05, "loss": 0.7065, "step": 26385 }, { "epoch": 0.84, "learning_rate": 1.9712208103545837e-05, "loss": 0.7166, "step": 26390 }, { "epoch": 0.84, "learning_rate": 1.9711941992345666e-05, "loss": 0.7023, "step": 26395 }, { "epoch": 0.84, "learning_rate": 1.971167575996834e-05, "loss": 0.7154, "step": 26400 }, { "epoch": 0.84, "learning_rate": 1.9711409406417176e-05, "loss": 0.7117, "step": 26405 }, { "epoch": 0.85, "learning_rate": 1.97111429316955e-05, "loss": 0.7176, "step": 26410 }, { "epoch": 0.85, "learning_rate": 1.9710876335806634e-05, "loss": 0.7235, "step": 26415 }, { "epoch": 0.85, "learning_rate": 1.9710609618753907e-05, "loss": 0.7155, "step": 26420 }, { "epoch": 0.85, "learning_rate": 1.971034278054065e-05, "loss": 0.7175, "step": 26425 }, { "epoch": 0.85, "learning_rate": 1.9710075821170183e-05, "loss": 0.7215, "step": 26430 }, { "epoch": 0.85, "learning_rate": 1.9709808740645847e-05, "loss": 0.7105, "step": 26435 }, { "epoch": 0.85, "learning_rate": 1.9709541538970968e-05, "loss": 0.7066, "step": 26440 }, { "epoch": 0.85, "learning_rate": 1.9709274216148883e-05, "loss": 0.7134, "step": 26445 }, { "epoch": 0.85, "learning_rate": 1.9709006772182926e-05, "loss": 0.717, "step": 26450 }, { "epoch": 0.85, "learning_rate": 1.970873920707643e-05, "loss": 0.7116, "step": 26455 }, { "epoch": 0.85, "learning_rate": 1.9708471520832743e-05, "loss": 0.7175, "step": 26460 }, { "epoch": 0.85, "learning_rate": 1.9708203713455198e-05, "loss": 0.7187, "step": 26465 }, { "epoch": 0.85, "learning_rate": 1.9707935784947137e-05, "loss": 0.7104, "step": 26470 }, { "epoch": 0.85, "learning_rate": 1.9707667735311908e-05, "loss": 0.7172, "step": 26475 }, { "epoch": 0.85, "learning_rate": 1.9707399564552844e-05, "loss": 0.7195, "step": 26480 }, { "epoch": 0.85, "learning_rate": 1.9707131272673307e-05, "loss": 0.7217, "step": 26485 }, { "epoch": 0.85, "learning_rate": 1.970686285967663e-05, "loss": 0.7226, "step": 26490 }, { "epoch": 0.85, "learning_rate": 1.970659432556617e-05, "loss": 0.7151, "step": 26495 }, { "epoch": 0.85, "learning_rate": 1.9706325670345276e-05, "loss": 0.7256, "step": 26500 }, { "epoch": 0.85, "learning_rate": 1.97060568940173e-05, "loss": 0.7089, "step": 26505 }, { "epoch": 0.85, "learning_rate": 1.9705787996585594e-05, "loss": 0.7106, "step": 26510 }, { "epoch": 0.85, "learning_rate": 1.9705518978053513e-05, "loss": 0.7075, "step": 26515 }, { "epoch": 0.85, "learning_rate": 1.9705249838424416e-05, "loss": 0.71, "step": 26520 }, { "epoch": 0.85, "learning_rate": 1.970498057770166e-05, "loss": 0.7218, "step": 26525 }, { "epoch": 0.85, "learning_rate": 1.9704711195888605e-05, "loss": 0.7154, "step": 26530 }, { "epoch": 0.85, "learning_rate": 1.970444169298861e-05, "loss": 0.7168, "step": 26535 }, { "epoch": 0.85, "learning_rate": 1.9704172069005044e-05, "loss": 0.7129, "step": 26540 }, { "epoch": 0.85, "learning_rate": 1.970390232394126e-05, "loss": 0.7129, "step": 26545 }, { "epoch": 0.85, "learning_rate": 1.9703632457800633e-05, "loss": 0.6966, "step": 26550 }, { "epoch": 0.85, "learning_rate": 1.970336247058653e-05, "loss": 0.7261, "step": 26555 }, { "epoch": 0.85, "learning_rate": 1.9703092362302313e-05, "loss": 0.7261, "step": 26560 }, { "epoch": 0.85, "learning_rate": 1.9702822132951356e-05, "loss": 0.7268, "step": 26565 }, { "epoch": 0.85, "learning_rate": 1.9702551782537032e-05, "loss": 0.7175, "step": 26570 }, { "epoch": 0.85, "learning_rate": 1.9702281311062713e-05, "loss": 0.721, "step": 26575 }, { "epoch": 0.85, "learning_rate": 1.9702010718531774e-05, "loss": 0.7121, "step": 26580 }, { "epoch": 0.85, "learning_rate": 1.970174000494759e-05, "loss": 0.7119, "step": 26585 }, { "epoch": 0.85, "learning_rate": 1.9701469170313538e-05, "loss": 0.705, "step": 26590 }, { "epoch": 0.85, "learning_rate": 1.9701198214633e-05, "loss": 0.7161, "step": 26595 }, { "epoch": 0.85, "learning_rate": 1.9700927137909358e-05, "loss": 0.7082, "step": 26600 }, { "epoch": 0.85, "learning_rate": 1.970065594014599e-05, "loss": 0.6984, "step": 26605 }, { "epoch": 0.85, "learning_rate": 1.9700384621346282e-05, "loss": 0.7177, "step": 26610 }, { "epoch": 0.85, "learning_rate": 1.9700113181513618e-05, "loss": 0.7184, "step": 26615 }, { "epoch": 0.85, "learning_rate": 1.9699841620651384e-05, "loss": 0.7018, "step": 26620 }, { "epoch": 0.85, "learning_rate": 1.9699569938762975e-05, "loss": 0.7195, "step": 26625 }, { "epoch": 0.85, "learning_rate": 1.9699298135851773e-05, "loss": 0.7042, "step": 26630 }, { "epoch": 0.85, "learning_rate": 1.9699026211921172e-05, "loss": 0.7199, "step": 26635 }, { "epoch": 0.85, "learning_rate": 1.9698754166974564e-05, "loss": 0.7159, "step": 26640 }, { "epoch": 0.85, "learning_rate": 1.9698482001015344e-05, "loss": 0.7176, "step": 26645 }, { "epoch": 0.85, "learning_rate": 1.969820971404691e-05, "loss": 0.7268, "step": 26650 }, { "epoch": 0.85, "learning_rate": 1.9697937306072656e-05, "loss": 0.715, "step": 26655 }, { "epoch": 0.85, "learning_rate": 1.9697664777095982e-05, "loss": 0.7077, "step": 26660 }, { "epoch": 0.85, "learning_rate": 1.9697392127120293e-05, "loss": 0.7169, "step": 26665 }, { "epoch": 0.85, "learning_rate": 1.9697119356148982e-05, "loss": 0.702, "step": 26670 }, { "epoch": 0.85, "learning_rate": 1.969684646418546e-05, "loss": 0.702, "step": 26675 }, { "epoch": 0.85, "learning_rate": 1.9696573451233126e-05, "loss": 0.706, "step": 26680 }, { "epoch": 0.85, "learning_rate": 1.969630031729539e-05, "loss": 0.7262, "step": 26685 }, { "epoch": 0.85, "learning_rate": 1.969602706237566e-05, "loss": 0.7122, "step": 26690 }, { "epoch": 0.85, "learning_rate": 1.9695753686477347e-05, "loss": 0.7188, "step": 26695 }, { "epoch": 0.85, "learning_rate": 1.9695480189603856e-05, "loss": 0.7105, "step": 26700 }, { "epoch": 0.85, "learning_rate": 1.9695206571758604e-05, "loss": 0.6986, "step": 26705 }, { "epoch": 0.85, "learning_rate": 1.9694932832945005e-05, "loss": 0.7104, "step": 26710 }, { "epoch": 0.85, "learning_rate": 1.9694658973166468e-05, "loss": 0.6998, "step": 26715 }, { "epoch": 0.86, "learning_rate": 1.9694384992426422e-05, "loss": 0.7084, "step": 26720 }, { "epoch": 0.86, "learning_rate": 1.969411089072828e-05, "loss": 0.7121, "step": 26725 }, { "epoch": 0.86, "learning_rate": 1.9693836668075458e-05, "loss": 0.7208, "step": 26730 }, { "epoch": 0.86, "learning_rate": 1.969356232447138e-05, "loss": 0.7044, "step": 26735 }, { "epoch": 0.86, "learning_rate": 1.969328785991947e-05, "loss": 0.7174, "step": 26740 }, { "epoch": 0.86, "learning_rate": 1.9693013274423155e-05, "loss": 0.7162, "step": 26745 }, { "epoch": 0.86, "learning_rate": 1.9692738567985853e-05, "loss": 0.7106, "step": 26750 }, { "epoch": 0.86, "learning_rate": 1.9692463740611e-05, "loss": 0.7062, "step": 26755 }, { "epoch": 0.86, "learning_rate": 1.969218879230202e-05, "loss": 0.7172, "step": 26760 }, { "epoch": 0.86, "learning_rate": 1.969191372306235e-05, "loss": 0.706, "step": 26765 }, { "epoch": 0.86, "learning_rate": 1.969163853289541e-05, "loss": 0.7155, "step": 26770 }, { "epoch": 0.86, "learning_rate": 1.9691363221804645e-05, "loss": 0.711, "step": 26775 }, { "epoch": 0.86, "learning_rate": 1.9691087789793486e-05, "loss": 0.7139, "step": 26780 }, { "epoch": 0.86, "learning_rate": 1.969081223686537e-05, "loss": 0.709, "step": 26785 }, { "epoch": 0.86, "learning_rate": 1.969053656302373e-05, "loss": 0.7077, "step": 26790 }, { "epoch": 0.86, "learning_rate": 1.969026076827202e-05, "loss": 0.7116, "step": 26795 }, { "epoch": 0.86, "learning_rate": 1.9689984852613664e-05, "loss": 0.7099, "step": 26800 }, { "epoch": 0.86, "learning_rate": 1.9689708816052115e-05, "loss": 0.7129, "step": 26805 }, { "epoch": 0.86, "learning_rate": 1.9689432658590813e-05, "loss": 0.7045, "step": 26810 }, { "epoch": 0.86, "learning_rate": 1.9689156380233206e-05, "loss": 0.713, "step": 26815 }, { "epoch": 0.86, "learning_rate": 1.9688879980982737e-05, "loss": 0.699, "step": 26820 }, { "epoch": 0.86, "learning_rate": 1.9688603460842862e-05, "loss": 0.7026, "step": 26825 }, { "epoch": 0.86, "learning_rate": 1.9688326819817023e-05, "loss": 0.7229, "step": 26830 }, { "epoch": 0.86, "learning_rate": 1.9688050057908677e-05, "loss": 0.7094, "step": 26835 }, { "epoch": 0.86, "learning_rate": 1.9687773175121278e-05, "loss": 0.7002, "step": 26840 }, { "epoch": 0.86, "learning_rate": 1.9687496171458276e-05, "loss": 0.7107, "step": 26845 }, { "epoch": 0.86, "learning_rate": 1.968721904692313e-05, "loss": 0.7123, "step": 26850 }, { "epoch": 0.86, "learning_rate": 1.96869418015193e-05, "loss": 0.7008, "step": 26855 }, { "epoch": 0.86, "learning_rate": 1.968666443525024e-05, "loss": 0.7089, "step": 26860 }, { "epoch": 0.86, "learning_rate": 1.9686386948119414e-05, "loss": 0.7024, "step": 26865 }, { "epoch": 0.86, "learning_rate": 1.9686109340130284e-05, "loss": 0.7134, "step": 26870 }, { "epoch": 0.86, "learning_rate": 1.9685831611286312e-05, "loss": 0.7107, "step": 26875 }, { "epoch": 0.86, "learning_rate": 1.9685553761590967e-05, "loss": 0.6984, "step": 26880 }, { "epoch": 0.86, "learning_rate": 1.9685275791047713e-05, "loss": 0.7097, "step": 26885 }, { "epoch": 0.86, "learning_rate": 1.9684997699660016e-05, "loss": 0.7108, "step": 26890 }, { "epoch": 0.86, "learning_rate": 1.968471948743135e-05, "loss": 0.6984, "step": 26895 }, { "epoch": 0.86, "learning_rate": 1.9684441154365185e-05, "loss": 0.711, "step": 26900 }, { "epoch": 0.86, "learning_rate": 1.9684162700464995e-05, "loss": 0.7113, "step": 26905 }, { "epoch": 0.86, "learning_rate": 1.968388412573425e-05, "loss": 0.7174, "step": 26910 }, { "epoch": 0.86, "learning_rate": 1.9683605430176432e-05, "loss": 0.7062, "step": 26915 }, { "epoch": 0.86, "learning_rate": 1.968332661379501e-05, "loss": 0.707, "step": 26920 }, { "epoch": 0.86, "learning_rate": 1.9683047676593475e-05, "loss": 0.7147, "step": 26925 }, { "epoch": 0.86, "learning_rate": 1.9682768618575296e-05, "loss": 0.7005, "step": 26930 }, { "epoch": 0.86, "learning_rate": 1.9682489439743958e-05, "loss": 0.7151, "step": 26935 }, { "epoch": 0.86, "learning_rate": 1.968221014010295e-05, "loss": 0.7122, "step": 26940 }, { "epoch": 0.86, "learning_rate": 1.9681930719655747e-05, "loss": 0.7102, "step": 26945 }, { "epoch": 0.86, "learning_rate": 1.9681651178405844e-05, "loss": 0.7184, "step": 26950 }, { "epoch": 0.86, "learning_rate": 1.968137151635672e-05, "loss": 0.7203, "step": 26955 }, { "epoch": 0.86, "learning_rate": 1.9681091733511876e-05, "loss": 0.6984, "step": 26960 }, { "epoch": 0.86, "learning_rate": 1.9680811829874794e-05, "loss": 0.7209, "step": 26965 }, { "epoch": 0.86, "learning_rate": 1.9680531805448973e-05, "loss": 0.7011, "step": 26970 }, { "epoch": 0.86, "learning_rate": 1.9680251660237898e-05, "loss": 0.7138, "step": 26975 }, { "epoch": 0.86, "learning_rate": 1.9679971394245074e-05, "loss": 0.7199, "step": 26980 }, { "epoch": 0.86, "learning_rate": 1.9679691007473988e-05, "loss": 0.7129, "step": 26985 }, { "epoch": 0.86, "learning_rate": 1.9679410499928147e-05, "loss": 0.7058, "step": 26990 }, { "epoch": 0.86, "learning_rate": 1.9679129871611047e-05, "loss": 0.7185, "step": 26995 }, { "epoch": 0.86, "learning_rate": 1.967884912252619e-05, "loss": 0.7158, "step": 27000 }, { "epoch": 0.86, "learning_rate": 1.9678568252677078e-05, "loss": 0.7097, "step": 27005 }, { "epoch": 0.86, "learning_rate": 1.967828726206722e-05, "loss": 0.7174, "step": 27010 }, { "epoch": 0.86, "learning_rate": 1.9678006150700114e-05, "loss": 0.6988, "step": 27015 }, { "epoch": 0.86, "learning_rate": 1.9677724918579274e-05, "loss": 0.7121, "step": 27020 }, { "epoch": 0.86, "learning_rate": 1.9677443565708206e-05, "loss": 0.7031, "step": 27025 }, { "epoch": 0.86, "learning_rate": 1.9677162092090423e-05, "loss": 0.7124, "step": 27030 }, { "epoch": 0.87, "learning_rate": 1.9676880497729435e-05, "loss": 0.7128, "step": 27035 }, { "epoch": 0.87, "learning_rate": 1.9676598782628755e-05, "loss": 0.7186, "step": 27040 }, { "epoch": 0.87, "learning_rate": 1.9676316946791897e-05, "loss": 0.6943, "step": 27045 }, { "epoch": 0.87, "learning_rate": 1.9676034990222382e-05, "loss": 0.7139, "step": 27050 }, { "epoch": 0.87, "learning_rate": 1.9675752912923726e-05, "loss": 0.6994, "step": 27055 }, { "epoch": 0.87, "learning_rate": 1.967547071489945e-05, "loss": 0.7103, "step": 27060 }, { "epoch": 0.87, "learning_rate": 1.967518839615307e-05, "loss": 0.7093, "step": 27065 }, { "epoch": 0.87, "learning_rate": 1.9674905956688112e-05, "loss": 0.7054, "step": 27070 }, { "epoch": 0.87, "learning_rate": 1.9674623396508095e-05, "loss": 0.7133, "step": 27075 }, { "epoch": 0.87, "learning_rate": 1.9674340715616553e-05, "loss": 0.7064, "step": 27080 }, { "epoch": 0.87, "learning_rate": 1.967405791401701e-05, "loss": 0.7034, "step": 27085 }, { "epoch": 0.87, "learning_rate": 1.9673774991712992e-05, "loss": 0.707, "step": 27090 }, { "epoch": 0.87, "learning_rate": 1.9673491948708034e-05, "loss": 0.7021, "step": 27095 }, { "epoch": 0.87, "learning_rate": 1.9673208785005658e-05, "loss": 0.6885, "step": 27100 }, { "epoch": 0.87, "learning_rate": 1.967292550060941e-05, "loss": 0.7111, "step": 27105 }, { "epoch": 0.87, "learning_rate": 1.9672642095522813e-05, "loss": 0.7142, "step": 27110 }, { "epoch": 0.87, "learning_rate": 1.967235856974941e-05, "loss": 0.719, "step": 27115 }, { "epoch": 0.87, "learning_rate": 1.9672074923292736e-05, "loss": 0.7043, "step": 27120 }, { "epoch": 0.87, "learning_rate": 1.967179115615633e-05, "loss": 0.6975, "step": 27125 }, { "epoch": 0.87, "learning_rate": 1.9671507268343736e-05, "loss": 0.7082, "step": 27130 }, { "epoch": 0.87, "learning_rate": 1.967122325985849e-05, "loss": 0.7063, "step": 27135 }, { "epoch": 0.87, "learning_rate": 1.9670939130704138e-05, "loss": 0.7158, "step": 27140 }, { "epoch": 0.87, "learning_rate": 1.967065488088423e-05, "loss": 0.7102, "step": 27145 }, { "epoch": 0.87, "learning_rate": 1.9670370510402306e-05, "loss": 0.7135, "step": 27150 }, { "epoch": 0.87, "learning_rate": 1.9670086019261917e-05, "loss": 0.7072, "step": 27155 }, { "epoch": 0.87, "learning_rate": 1.9669801407466614e-05, "loss": 0.7049, "step": 27160 }, { "epoch": 0.87, "learning_rate": 1.9669516675019945e-05, "loss": 0.7077, "step": 27165 }, { "epoch": 0.87, "learning_rate": 1.9669231821925464e-05, "loss": 0.7149, "step": 27170 }, { "epoch": 0.87, "learning_rate": 1.9668946848186728e-05, "loss": 0.7052, "step": 27175 }, { "epoch": 0.87, "learning_rate": 1.966866175380729e-05, "loss": 0.7189, "step": 27180 }, { "epoch": 0.87, "learning_rate": 1.9668376538790706e-05, "loss": 0.7084, "step": 27185 }, { "epoch": 0.87, "learning_rate": 1.9668091203140535e-05, "loss": 0.7139, "step": 27190 }, { "epoch": 0.87, "learning_rate": 1.966780574686034e-05, "loss": 0.7128, "step": 27195 }, { "epoch": 0.87, "learning_rate": 1.9667520169953677e-05, "loss": 0.7048, "step": 27200 }, { "epoch": 0.87, "learning_rate": 1.9667234472424115e-05, "loss": 0.6966, "step": 27205 }, { "epoch": 0.87, "learning_rate": 1.966694865427522e-05, "loss": 0.7087, "step": 27210 }, { "epoch": 0.87, "learning_rate": 1.966666271551055e-05, "loss": 0.7064, "step": 27215 }, { "epoch": 0.87, "learning_rate": 1.9666376656133676e-05, "loss": 0.7066, "step": 27220 }, { "epoch": 0.87, "learning_rate": 1.966609047614817e-05, "loss": 0.7184, "step": 27225 }, { "epoch": 0.87, "learning_rate": 1.9665804175557605e-05, "loss": 0.7148, "step": 27230 }, { "epoch": 0.87, "learning_rate": 1.9665517754365547e-05, "loss": 0.7078, "step": 27235 }, { "epoch": 0.87, "learning_rate": 1.9665231212575574e-05, "loss": 0.6987, "step": 27240 }, { "epoch": 0.87, "learning_rate": 1.966494455019126e-05, "loss": 0.7102, "step": 27245 }, { "epoch": 0.87, "learning_rate": 1.9664657767216176e-05, "loss": 0.7165, "step": 27250 }, { "epoch": 0.87, "learning_rate": 1.966437086365391e-05, "loss": 0.7104, "step": 27255 }, { "epoch": 0.87, "learning_rate": 1.9664083839508036e-05, "loss": 0.7035, "step": 27260 }, { "epoch": 0.87, "learning_rate": 1.9663796694782138e-05, "loss": 0.7124, "step": 27265 }, { "epoch": 0.87, "learning_rate": 1.9663509429479796e-05, "loss": 0.7059, "step": 27270 }, { "epoch": 0.87, "learning_rate": 1.9663222043604594e-05, "loss": 0.7074, "step": 27275 }, { "epoch": 0.87, "learning_rate": 1.966293453716012e-05, "loss": 0.7124, "step": 27280 }, { "epoch": 0.87, "learning_rate": 1.966264691014996e-05, "loss": 0.7041, "step": 27285 }, { "epoch": 0.87, "learning_rate": 1.9662359162577706e-05, "loss": 0.7022, "step": 27290 }, { "epoch": 0.87, "learning_rate": 1.966207129444694e-05, "loss": 0.7116, "step": 27295 }, { "epoch": 0.87, "learning_rate": 1.9661783305761264e-05, "loss": 0.7123, "step": 27300 }, { "epoch": 0.87, "learning_rate": 1.9661495196524266e-05, "loss": 0.7174, "step": 27305 }, { "epoch": 0.87, "learning_rate": 1.966120696673954e-05, "loss": 0.7067, "step": 27310 }, { "epoch": 0.87, "learning_rate": 1.9660918616410686e-05, "loss": 0.7039, "step": 27315 }, { "epoch": 0.87, "learning_rate": 1.9660630145541292e-05, "loss": 0.7077, "step": 27320 }, { "epoch": 0.87, "learning_rate": 1.9660341554134972e-05, "loss": 0.7103, "step": 27325 }, { "epoch": 0.87, "learning_rate": 1.9660052842195315e-05, "loss": 0.7184, "step": 27330 }, { "epoch": 0.87, "learning_rate": 1.965976400972593e-05, "loss": 0.7169, "step": 27335 }, { "epoch": 0.87, "learning_rate": 1.965947505673042e-05, "loss": 0.7108, "step": 27340 }, { "epoch": 0.88, "learning_rate": 1.9659185983212388e-05, "loss": 0.712, "step": 27345 }, { "epoch": 0.88, "learning_rate": 1.965889678917544e-05, "loss": 0.704, "step": 27350 }, { "epoch": 0.88, "learning_rate": 1.9658607474623187e-05, "loss": 0.7111, "step": 27355 }, { "epoch": 0.88, "learning_rate": 1.9658318039559238e-05, "loss": 0.7024, "step": 27360 }, { "epoch": 0.88, "learning_rate": 1.9658028483987203e-05, "loss": 0.7058, "step": 27365 }, { "epoch": 0.88, "learning_rate": 1.9657738807910695e-05, "loss": 0.7115, "step": 27370 }, { "epoch": 0.88, "learning_rate": 1.9657449011333328e-05, "loss": 0.6965, "step": 27375 }, { "epoch": 0.88, "learning_rate": 1.9657159094258724e-05, "loss": 0.6931, "step": 27380 }, { "epoch": 0.88, "learning_rate": 1.9656869056690492e-05, "loss": 0.7142, "step": 27385 }, { "epoch": 0.88, "learning_rate": 1.9656578898632257e-05, "loss": 0.712, "step": 27390 }, { "epoch": 0.88, "learning_rate": 1.9656288620087634e-05, "loss": 0.6977, "step": 27395 }, { "epoch": 0.88, "learning_rate": 1.965599822106025e-05, "loss": 0.7103, "step": 27400 }, { "epoch": 0.88, "learning_rate": 1.9655707701553722e-05, "loss": 0.6949, "step": 27405 }, { "epoch": 0.88, "learning_rate": 1.965541706157168e-05, "loss": 0.6963, "step": 27410 }, { "epoch": 0.88, "learning_rate": 1.9655126301117748e-05, "loss": 0.7054, "step": 27415 }, { "epoch": 0.88, "learning_rate": 1.965483542019556e-05, "loss": 0.7197, "step": 27420 }, { "epoch": 0.88, "learning_rate": 1.9654544418808732e-05, "loss": 0.7061, "step": 27425 }, { "epoch": 0.88, "learning_rate": 1.965425329696091e-05, "loss": 0.7106, "step": 27430 }, { "epoch": 0.88, "learning_rate": 1.9653962054655714e-05, "loss": 0.709, "step": 27435 }, { "epoch": 0.88, "learning_rate": 1.9653670691896785e-05, "loss": 0.6915, "step": 27440 }, { "epoch": 0.88, "learning_rate": 1.965337920868776e-05, "loss": 0.7164, "step": 27445 }, { "epoch": 0.88, "learning_rate": 1.965308760503227e-05, "loss": 0.7114, "step": 27450 }, { "epoch": 0.88, "learning_rate": 1.9652795880933956e-05, "loss": 0.7158, "step": 27455 }, { "epoch": 0.88, "learning_rate": 1.9652504036396456e-05, "loss": 0.7083, "step": 27460 }, { "epoch": 0.88, "learning_rate": 1.9652212071423415e-05, "loss": 0.7136, "step": 27465 }, { "epoch": 0.88, "learning_rate": 1.9651919986018473e-05, "loss": 0.7255, "step": 27470 }, { "epoch": 0.88, "learning_rate": 1.9651627780185277e-05, "loss": 0.6957, "step": 27475 }, { "epoch": 0.88, "learning_rate": 1.965133545392747e-05, "loss": 0.7105, "step": 27480 }, { "epoch": 0.88, "learning_rate": 1.96510430072487e-05, "loss": 0.719, "step": 27485 }, { "epoch": 0.88, "learning_rate": 1.965075044015262e-05, "loss": 0.7048, "step": 27490 }, { "epoch": 0.88, "learning_rate": 1.9650457752642872e-05, "loss": 0.7047, "step": 27495 }, { "epoch": 0.88, "learning_rate": 1.9650164944723116e-05, "loss": 0.7132, "step": 27500 }, { "epoch": 0.88, "learning_rate": 1.9649872016397e-05, "loss": 0.7058, "step": 27505 }, { "epoch": 0.88, "learning_rate": 1.9649578967668185e-05, "loss": 0.7172, "step": 27510 }, { "epoch": 0.88, "learning_rate": 1.9649285798540322e-05, "loss": 0.709, "step": 27515 }, { "epoch": 0.88, "learning_rate": 1.964899250901707e-05, "loss": 0.7048, "step": 27520 }, { "epoch": 0.88, "learning_rate": 1.964869909910209e-05, "loss": 0.7032, "step": 27525 }, { "epoch": 0.88, "learning_rate": 1.964840556879904e-05, "loss": 0.7015, "step": 27530 }, { "epoch": 0.88, "learning_rate": 1.9648111918111584e-05, "loss": 0.6965, "step": 27535 }, { "epoch": 0.88, "learning_rate": 1.9647818147043386e-05, "loss": 0.7046, "step": 27540 }, { "epoch": 0.88, "learning_rate": 1.9647524255598114e-05, "loss": 0.7074, "step": 27545 }, { "epoch": 0.88, "learning_rate": 1.9647230243779432e-05, "loss": 0.7102, "step": 27550 }, { "epoch": 0.88, "learning_rate": 1.9646936111591005e-05, "loss": 0.7016, "step": 27555 }, { "epoch": 0.88, "learning_rate": 1.9646641859036513e-05, "loss": 0.7087, "step": 27560 }, { "epoch": 0.88, "learning_rate": 1.9646347486119615e-05, "loss": 0.6943, "step": 27565 }, { "epoch": 0.88, "learning_rate": 1.9646052992843994e-05, "loss": 0.7147, "step": 27570 }, { "epoch": 0.88, "learning_rate": 1.964575837921332e-05, "loss": 0.7014, "step": 27575 }, { "epoch": 0.88, "learning_rate": 1.964546364523127e-05, "loss": 0.7117, "step": 27580 }, { "epoch": 0.88, "learning_rate": 1.9645168790901523e-05, "loss": 0.7016, "step": 27585 }, { "epoch": 0.88, "learning_rate": 1.964487381622775e-05, "loss": 0.6993, "step": 27590 }, { "epoch": 0.88, "learning_rate": 1.964457872121364e-05, "loss": 0.7099, "step": 27595 }, { "epoch": 0.88, "learning_rate": 1.9644283505862877e-05, "loss": 0.7101, "step": 27600 }, { "epoch": 0.88, "learning_rate": 1.9643988170179135e-05, "loss": 0.7232, "step": 27605 }, { "epoch": 0.88, "learning_rate": 1.9643692714166103e-05, "loss": 0.6992, "step": 27610 }, { "epoch": 0.88, "learning_rate": 1.964339713782747e-05, "loss": 0.7165, "step": 27615 }, { "epoch": 0.88, "learning_rate": 1.9643101441166924e-05, "loss": 0.7104, "step": 27620 }, { "epoch": 0.88, "learning_rate": 1.964280562418815e-05, "loss": 0.7181, "step": 27625 }, { "epoch": 0.88, "learning_rate": 1.964250968689484e-05, "loss": 0.6977, "step": 27630 }, { "epoch": 0.88, "learning_rate": 1.964221362929069e-05, "loss": 0.7, "step": 27635 }, { "epoch": 0.88, "learning_rate": 1.964191745137939e-05, "loss": 0.7074, "step": 27640 }, { "epoch": 0.88, "learning_rate": 1.964162115316464e-05, "loss": 0.7128, "step": 27645 }, { "epoch": 0.88, "learning_rate": 1.9641324734650134e-05, "loss": 0.7009, "step": 27650 }, { "epoch": 0.88, "learning_rate": 1.9641028195839568e-05, "loss": 0.7045, "step": 27655 }, { "epoch": 0.89, "learning_rate": 1.964073153673665e-05, "loss": 0.7047, "step": 27660 }, { "epoch": 0.89, "learning_rate": 1.964043475734507e-05, "loss": 0.7227, "step": 27665 }, { "epoch": 0.89, "learning_rate": 1.964013785766854e-05, "loss": 0.7198, "step": 27670 }, { "epoch": 0.89, "learning_rate": 1.963984083771076e-05, "loss": 0.7198, "step": 27675 }, { "epoch": 0.89, "learning_rate": 1.963954369747544e-05, "loss": 0.701, "step": 27680 }, { "epoch": 0.89, "learning_rate": 1.9639246436966285e-05, "loss": 0.7103, "step": 27685 }, { "epoch": 0.89, "learning_rate": 1.9638949056187e-05, "loss": 0.7025, "step": 27690 }, { "epoch": 0.89, "learning_rate": 1.9638651555141302e-05, "loss": 0.7136, "step": 27695 }, { "epoch": 0.89, "learning_rate": 1.9638353933832902e-05, "loss": 0.7104, "step": 27700 }, { "epoch": 0.89, "learning_rate": 1.963805619226551e-05, "loss": 0.7005, "step": 27705 }, { "epoch": 0.89, "learning_rate": 1.9637758330442845e-05, "loss": 0.7126, "step": 27710 }, { "epoch": 0.89, "learning_rate": 1.9637460348368615e-05, "loss": 0.7192, "step": 27715 }, { "epoch": 0.89, "learning_rate": 1.963716224604655e-05, "loss": 0.7146, "step": 27720 }, { "epoch": 0.89, "learning_rate": 1.9636864023480363e-05, "loss": 0.7037, "step": 27725 }, { "epoch": 0.89, "learning_rate": 1.9636565680673774e-05, "loss": 0.6933, "step": 27730 }, { "epoch": 0.89, "learning_rate": 1.9636267217630506e-05, "loss": 0.6951, "step": 27735 }, { "epoch": 0.89, "learning_rate": 1.9635968634354286e-05, "loss": 0.6975, "step": 27740 }, { "epoch": 0.89, "learning_rate": 1.9635669930848837e-05, "loss": 0.6993, "step": 27745 }, { "epoch": 0.89, "learning_rate": 1.963537110711789e-05, "loss": 0.706, "step": 27750 }, { "epoch": 0.89, "learning_rate": 1.9635072163165164e-05, "loss": 0.7042, "step": 27755 }, { "epoch": 0.89, "learning_rate": 1.9634773098994397e-05, "loss": 0.71, "step": 27760 }, { "epoch": 0.89, "learning_rate": 1.9634473914609316e-05, "loss": 0.7015, "step": 27765 }, { "epoch": 0.89, "learning_rate": 1.9634174610013662e-05, "loss": 0.7075, "step": 27770 }, { "epoch": 0.89, "learning_rate": 1.963387518521116e-05, "loss": 0.7046, "step": 27775 }, { "epoch": 0.89, "learning_rate": 1.963357564020555e-05, "loss": 0.6948, "step": 27780 }, { "epoch": 0.89, "learning_rate": 1.963327597500057e-05, "loss": 0.7087, "step": 27785 }, { "epoch": 0.89, "learning_rate": 1.9632976189599957e-05, "loss": 0.7062, "step": 27790 }, { "epoch": 0.89, "learning_rate": 1.9632676284007454e-05, "loss": 0.7115, "step": 27795 }, { "epoch": 0.89, "learning_rate": 1.96323762582268e-05, "loss": 0.7032, "step": 27800 }, { "epoch": 0.89, "learning_rate": 1.963207611226174e-05, "loss": 0.702, "step": 27805 }, { "epoch": 0.89, "learning_rate": 1.963177584611602e-05, "loss": 0.7061, "step": 27810 }, { "epoch": 0.89, "learning_rate": 1.9631475459793385e-05, "loss": 0.7038, "step": 27815 }, { "epoch": 0.89, "learning_rate": 1.9631174953297582e-05, "loss": 0.6882, "step": 27820 }, { "epoch": 0.89, "learning_rate": 1.9630874326632365e-05, "loss": 0.6991, "step": 27825 }, { "epoch": 0.89, "learning_rate": 1.963057357980148e-05, "loss": 0.7046, "step": 27830 }, { "epoch": 0.89, "learning_rate": 1.9630272712808682e-05, "loss": 0.7114, "step": 27835 }, { "epoch": 0.89, "learning_rate": 1.9629971725657724e-05, "loss": 0.7158, "step": 27840 }, { "epoch": 0.89, "learning_rate": 1.962967061835236e-05, "loss": 0.7154, "step": 27845 }, { "epoch": 0.89, "learning_rate": 1.962936939089635e-05, "loss": 0.7, "step": 27850 }, { "epoch": 0.89, "learning_rate": 1.9629068043293454e-05, "loss": 0.7074, "step": 27855 }, { "epoch": 0.89, "learning_rate": 1.9628766575547423e-05, "loss": 0.6952, "step": 27860 }, { "epoch": 0.89, "learning_rate": 1.962846498766203e-05, "loss": 0.6958, "step": 27865 }, { "epoch": 0.89, "learning_rate": 1.962816327964103e-05, "loss": 0.6996, "step": 27870 }, { "epoch": 0.89, "learning_rate": 1.962786145148819e-05, "loss": 0.715, "step": 27875 }, { "epoch": 0.89, "learning_rate": 1.9627559503207278e-05, "loss": 0.6997, "step": 27880 }, { "epoch": 0.89, "learning_rate": 1.9627257434802053e-05, "loss": 0.7042, "step": 27885 }, { "epoch": 0.89, "learning_rate": 1.9626955246276297e-05, "loss": 0.6894, "step": 27890 }, { "epoch": 0.89, "learning_rate": 1.962665293763377e-05, "loss": 0.7059, "step": 27895 }, { "epoch": 0.89, "learning_rate": 1.962635050887825e-05, "loss": 0.7096, "step": 27900 }, { "epoch": 0.89, "learning_rate": 1.9626047960013505e-05, "loss": 0.7026, "step": 27905 }, { "epoch": 0.89, "learning_rate": 1.9625745291043316e-05, "loss": 0.7075, "step": 27910 }, { "epoch": 0.89, "learning_rate": 1.9625442501971455e-05, "loss": 0.7166, "step": 27915 }, { "epoch": 0.89, "learning_rate": 1.96251395928017e-05, "loss": 0.7084, "step": 27920 }, { "epoch": 0.89, "learning_rate": 1.9624836563537837e-05, "loss": 0.7174, "step": 27925 }, { "epoch": 0.89, "learning_rate": 1.9624533414183636e-05, "loss": 0.707, "step": 27930 }, { "epoch": 0.89, "learning_rate": 1.9624230144742887e-05, "loss": 0.7035, "step": 27935 }, { "epoch": 0.89, "learning_rate": 1.9623926755219375e-05, "loss": 0.7034, "step": 27940 }, { "epoch": 0.89, "learning_rate": 1.962362324561688e-05, "loss": 0.7081, "step": 27945 }, { "epoch": 0.89, "learning_rate": 1.9623319615939192e-05, "loss": 0.7145, "step": 27950 }, { "epoch": 0.89, "learning_rate": 1.9623015866190098e-05, "loss": 0.7173, "step": 27955 }, { "epoch": 0.89, "learning_rate": 1.9622711996373388e-05, "loss": 0.7109, "step": 27960 }, { "epoch": 0.89, "learning_rate": 1.9622408006492855e-05, "loss": 0.7008, "step": 27965 }, { "epoch": 0.9, "learning_rate": 1.9622103896552294e-05, "loss": 0.7052, "step": 27970 }, { "epoch": 0.9, "learning_rate": 1.9621799666555495e-05, "loss": 0.6995, "step": 27975 }, { "epoch": 0.9, "learning_rate": 1.9621495316506253e-05, "loss": 0.7009, "step": 27980 }, { "epoch": 0.9, "learning_rate": 1.9621190846408373e-05, "loss": 0.7147, "step": 27985 }, { "epoch": 0.9, "learning_rate": 1.9620886256265646e-05, "loss": 0.6961, "step": 27990 }, { "epoch": 0.9, "learning_rate": 1.9620581546081875e-05, "loss": 0.7161, "step": 27995 }, { "epoch": 0.9, "learning_rate": 1.962027671586086e-05, "loss": 0.7141, "step": 28000 }, { "epoch": 0.9, "learning_rate": 1.961997176560641e-05, "loss": 0.7008, "step": 28005 }, { "epoch": 0.9, "learning_rate": 1.9619666695322324e-05, "loss": 0.6965, "step": 28010 }, { "epoch": 0.9, "learning_rate": 1.9619361505012414e-05, "loss": 0.6987, "step": 28015 }, { "epoch": 0.9, "learning_rate": 1.961905619468048e-05, "loss": 0.7051, "step": 28020 }, { "epoch": 0.9, "learning_rate": 1.961875076433034e-05, "loss": 0.7056, "step": 28025 }, { "epoch": 0.9, "learning_rate": 1.96184452139658e-05, "loss": 0.7049, "step": 28030 }, { "epoch": 0.9, "learning_rate": 1.9618139543590676e-05, "loss": 0.6997, "step": 28035 }, { "epoch": 0.9, "learning_rate": 1.9617833753208775e-05, "loss": 0.7087, "step": 28040 }, { "epoch": 0.9, "learning_rate": 1.961752784282392e-05, "loss": 0.6991, "step": 28045 }, { "epoch": 0.9, "learning_rate": 1.9617221812439925e-05, "loss": 0.6901, "step": 28050 }, { "epoch": 0.9, "learning_rate": 1.9616915662060606e-05, "loss": 0.7069, "step": 28055 }, { "epoch": 0.9, "learning_rate": 1.9616609391689786e-05, "loss": 0.6824, "step": 28060 }, { "epoch": 0.9, "learning_rate": 1.9616303001331284e-05, "loss": 0.7105, "step": 28065 }, { "epoch": 0.9, "learning_rate": 1.961599649098892e-05, "loss": 0.6949, "step": 28070 }, { "epoch": 0.9, "learning_rate": 1.961568986066653e-05, "loss": 0.7021, "step": 28075 }, { "epoch": 0.9, "learning_rate": 1.961538311036793e-05, "loss": 0.7066, "step": 28080 }, { "epoch": 0.9, "learning_rate": 1.961507624009695e-05, "loss": 0.7148, "step": 28085 }, { "epoch": 0.9, "learning_rate": 1.961476924985742e-05, "loss": 0.7109, "step": 28090 }, { "epoch": 0.9, "learning_rate": 1.9614462139653164e-05, "loss": 0.7047, "step": 28095 }, { "epoch": 0.9, "learning_rate": 1.961415490948802e-05, "loss": 0.6999, "step": 28100 }, { "epoch": 0.9, "learning_rate": 1.961384755936582e-05, "loss": 0.7001, "step": 28105 }, { "epoch": 0.9, "learning_rate": 1.9613540089290402e-05, "loss": 0.6976, "step": 28110 }, { "epoch": 0.9, "learning_rate": 1.9613232499265598e-05, "loss": 0.7021, "step": 28115 }, { "epoch": 0.9, "learning_rate": 1.961292478929525e-05, "loss": 0.706, "step": 28120 }, { "epoch": 0.9, "learning_rate": 1.961261695938319e-05, "loss": 0.7109, "step": 28125 }, { "epoch": 0.9, "learning_rate": 1.9612309009533264e-05, "loss": 0.6956, "step": 28130 }, { "epoch": 0.9, "learning_rate": 1.9612000939749317e-05, "loss": 0.7031, "step": 28135 }, { "epoch": 0.9, "learning_rate": 1.9611692750035188e-05, "loss": 0.7046, "step": 28140 }, { "epoch": 0.9, "learning_rate": 1.961138444039472e-05, "loss": 0.716, "step": 28145 }, { "epoch": 0.9, "learning_rate": 1.961107601083177e-05, "loss": 0.7092, "step": 28150 }, { "epoch": 0.9, "learning_rate": 1.9610767461350174e-05, "loss": 0.6933, "step": 28155 }, { "epoch": 0.9, "learning_rate": 1.9610458791953793e-05, "loss": 0.7093, "step": 28160 }, { "epoch": 0.9, "learning_rate": 1.9610150002646467e-05, "loss": 0.7115, "step": 28165 }, { "epoch": 0.9, "learning_rate": 1.960984109343206e-05, "loss": 0.7152, "step": 28170 }, { "epoch": 0.9, "learning_rate": 1.960953206431442e-05, "loss": 0.6995, "step": 28175 }, { "epoch": 0.9, "learning_rate": 1.9609222915297405e-05, "loss": 0.6993, "step": 28180 }, { "epoch": 0.9, "learning_rate": 1.960891364638487e-05, "loss": 0.7071, "step": 28185 }, { "epoch": 0.9, "learning_rate": 1.9608604257580674e-05, "loss": 0.714, "step": 28190 }, { "epoch": 0.9, "learning_rate": 1.960829474888868e-05, "loss": 0.7124, "step": 28195 }, { "epoch": 0.9, "learning_rate": 1.9607985120312744e-05, "loss": 0.6928, "step": 28200 }, { "epoch": 0.9, "learning_rate": 1.960767537185674e-05, "loss": 0.7075, "step": 28205 }, { "epoch": 0.9, "learning_rate": 1.960736550352452e-05, "loss": 0.7178, "step": 28210 }, { "epoch": 0.9, "learning_rate": 1.9607055515319962e-05, "loss": 0.7023, "step": 28215 }, { "epoch": 0.9, "learning_rate": 1.9606745407246925e-05, "loss": 0.7027, "step": 28220 }, { "epoch": 0.9, "learning_rate": 1.9606435179309284e-05, "loss": 0.6945, "step": 28225 }, { "epoch": 0.9, "learning_rate": 1.9606124831510903e-05, "loss": 0.701, "step": 28230 }, { "epoch": 0.9, "learning_rate": 1.9605814363855663e-05, "loss": 0.7042, "step": 28235 }, { "epoch": 0.9, "learning_rate": 1.960550377634743e-05, "loss": 0.7012, "step": 28240 }, { "epoch": 0.9, "learning_rate": 1.9605193068990082e-05, "loss": 0.7095, "step": 28245 }, { "epoch": 0.9, "learning_rate": 1.96048822417875e-05, "loss": 0.7026, "step": 28250 }, { "epoch": 0.9, "learning_rate": 1.9604571294743555e-05, "loss": 0.6911, "step": 28255 }, { "epoch": 0.9, "learning_rate": 1.960426022786213e-05, "loss": 0.7079, "step": 28260 }, { "epoch": 0.9, "learning_rate": 1.9603949041147107e-05, "loss": 0.705, "step": 28265 }, { "epoch": 0.9, "learning_rate": 1.960363773460237e-05, "loss": 0.6901, "step": 28270 }, { "epoch": 0.9, "learning_rate": 1.96033263082318e-05, "loss": 0.7036, "step": 28275 }, { "epoch": 0.9, "learning_rate": 1.9603014762039286e-05, "loss": 0.7058, "step": 28280 }, { "epoch": 0.91, "learning_rate": 1.960270309602871e-05, "loss": 0.7041, "step": 28285 }, { "epoch": 0.91, "learning_rate": 1.9602391310203966e-05, "loss": 0.6907, "step": 28290 }, { "epoch": 0.91, "learning_rate": 1.9602079404568942e-05, "loss": 0.6996, "step": 28295 }, { "epoch": 0.91, "learning_rate": 1.9601767379127528e-05, "loss": 0.7134, "step": 28300 }, { "epoch": 0.91, "learning_rate": 1.960145523388362e-05, "loss": 0.697, "step": 28305 }, { "epoch": 0.91, "learning_rate": 1.9601142968841112e-05, "loss": 0.7031, "step": 28310 }, { "epoch": 0.91, "learning_rate": 1.96008305840039e-05, "loss": 0.7055, "step": 28315 }, { "epoch": 0.91, "learning_rate": 1.960051807937588e-05, "loss": 0.6952, "step": 28320 }, { "epoch": 0.91, "learning_rate": 1.9600205454960952e-05, "loss": 0.7039, "step": 28325 }, { "epoch": 0.91, "learning_rate": 1.959989271076302e-05, "loss": 0.6986, "step": 28330 }, { "epoch": 0.91, "learning_rate": 1.959957984678598e-05, "loss": 0.7093, "step": 28335 }, { "epoch": 0.91, "learning_rate": 1.9599266863033743e-05, "loss": 0.7075, "step": 28340 }, { "epoch": 0.91, "learning_rate": 1.959895375951021e-05, "loss": 0.7096, "step": 28345 }, { "epoch": 0.91, "learning_rate": 1.9598640536219288e-05, "loss": 0.7063, "step": 28350 }, { "epoch": 0.91, "learning_rate": 1.959832719316488e-05, "loss": 0.6836, "step": 28355 }, { "epoch": 0.91, "learning_rate": 1.9598013730350906e-05, "loss": 0.694, "step": 28360 }, { "epoch": 0.91, "learning_rate": 1.959770014778127e-05, "loss": 0.6988, "step": 28365 }, { "epoch": 0.91, "learning_rate": 1.9597386445459883e-05, "loss": 0.7105, "step": 28370 }, { "epoch": 0.91, "learning_rate": 1.9597072623390668e-05, "loss": 0.7125, "step": 28375 }, { "epoch": 0.91, "learning_rate": 1.9596758681577533e-05, "loss": 0.7098, "step": 28380 }, { "epoch": 0.91, "learning_rate": 1.95964446200244e-05, "loss": 0.7004, "step": 28385 }, { "epoch": 0.91, "learning_rate": 1.9596130438735178e-05, "loss": 0.7045, "step": 28390 }, { "epoch": 0.91, "learning_rate": 1.9595816137713798e-05, "loss": 0.7068, "step": 28395 }, { "epoch": 0.91, "learning_rate": 1.9595501716964176e-05, "loss": 0.7069, "step": 28400 }, { "epoch": 0.91, "learning_rate": 1.9595187176490237e-05, "loss": 0.7032, "step": 28405 }, { "epoch": 0.91, "learning_rate": 1.9594872516295907e-05, "loss": 0.6978, "step": 28410 }, { "epoch": 0.91, "learning_rate": 1.9594557736385107e-05, "loss": 0.6982, "step": 28415 }, { "epoch": 0.91, "learning_rate": 1.959424283676177e-05, "loss": 0.7054, "step": 28420 }, { "epoch": 0.91, "learning_rate": 1.959392781742982e-05, "loss": 0.6924, "step": 28425 }, { "epoch": 0.91, "learning_rate": 1.959361267839319e-05, "loss": 0.7021, "step": 28430 }, { "epoch": 0.91, "learning_rate": 1.9593297419655815e-05, "loss": 0.697, "step": 28435 }, { "epoch": 0.91, "learning_rate": 1.9592982041221625e-05, "loss": 0.7028, "step": 28440 }, { "epoch": 0.91, "learning_rate": 1.9592666543094558e-05, "loss": 0.6965, "step": 28445 }, { "epoch": 0.91, "learning_rate": 1.9592350925278546e-05, "loss": 0.7079, "step": 28450 }, { "epoch": 0.91, "learning_rate": 1.959203518777753e-05, "loss": 0.709, "step": 28455 }, { "epoch": 0.91, "learning_rate": 1.9591719330595444e-05, "loss": 0.7044, "step": 28460 }, { "epoch": 0.91, "learning_rate": 1.9591403353736238e-05, "loss": 0.7064, "step": 28465 }, { "epoch": 0.91, "learning_rate": 1.959108725720385e-05, "loss": 0.7109, "step": 28470 }, { "epoch": 0.91, "learning_rate": 1.9590771041002225e-05, "loss": 0.7046, "step": 28475 }, { "epoch": 0.91, "learning_rate": 1.9590454705135307e-05, "loss": 0.6909, "step": 28480 }, { "epoch": 0.91, "learning_rate": 1.959013824960704e-05, "loss": 0.694, "step": 28485 }, { "epoch": 0.91, "learning_rate": 1.9589821674421382e-05, "loss": 0.6941, "step": 28490 }, { "epoch": 0.91, "learning_rate": 1.9589504979582274e-05, "loss": 0.7018, "step": 28495 }, { "epoch": 0.91, "learning_rate": 1.958918816509367e-05, "loss": 0.707, "step": 28500 }, { "epoch": 0.91, "learning_rate": 1.9588871230959524e-05, "loss": 0.7036, "step": 28505 }, { "epoch": 0.91, "learning_rate": 1.9588554177183794e-05, "loss": 0.6899, "step": 28510 }, { "epoch": 0.91, "learning_rate": 1.9588237003770426e-05, "loss": 0.6886, "step": 28515 }, { "epoch": 0.91, "learning_rate": 1.9587919710723385e-05, "loss": 0.7054, "step": 28520 }, { "epoch": 0.91, "learning_rate": 1.958760229804663e-05, "loss": 0.6793, "step": 28525 }, { "epoch": 0.91, "learning_rate": 1.9587284765744118e-05, "loss": 0.6968, "step": 28530 }, { "epoch": 0.91, "learning_rate": 1.9586967113819812e-05, "loss": 0.7083, "step": 28535 }, { "epoch": 0.91, "learning_rate": 1.9586649342277676e-05, "loss": 0.7023, "step": 28540 }, { "epoch": 0.91, "learning_rate": 1.9586331451121678e-05, "loss": 0.7028, "step": 28545 }, { "epoch": 0.91, "learning_rate": 1.9586013440355774e-05, "loss": 0.6978, "step": 28550 }, { "epoch": 0.91, "learning_rate": 1.9585695309983946e-05, "loss": 0.712, "step": 28555 }, { "epoch": 0.91, "learning_rate": 1.9585377060010154e-05, "loss": 0.7031, "step": 28560 }, { "epoch": 0.91, "learning_rate": 1.9585058690438366e-05, "loss": 0.706, "step": 28565 }, { "epoch": 0.91, "learning_rate": 1.9584740201272567e-05, "loss": 0.7008, "step": 28570 }, { "epoch": 0.91, "learning_rate": 1.9584421592516717e-05, "loss": 0.6958, "step": 28575 }, { "epoch": 0.91, "learning_rate": 1.9584102864174804e-05, "loss": 0.693, "step": 28580 }, { "epoch": 0.91, "learning_rate": 1.9583784016250795e-05, "loss": 0.7013, "step": 28585 }, { "epoch": 0.91, "learning_rate": 1.958346504874867e-05, "loss": 0.7131, "step": 28590 }, { "epoch": 0.92, "learning_rate": 1.958314596167241e-05, "loss": 0.6996, "step": 28595 }, { "epoch": 0.92, "learning_rate": 1.9582826755026002e-05, "loss": 0.7065, "step": 28600 }, { "epoch": 0.92, "learning_rate": 1.958250742881342e-05, "loss": 0.7138, "step": 28605 }, { "epoch": 0.92, "learning_rate": 1.958218798303865e-05, "loss": 0.6975, "step": 28610 }, { "epoch": 0.92, "learning_rate": 1.9581868417705684e-05, "loss": 0.7008, "step": 28615 }, { "epoch": 0.92, "learning_rate": 1.9581548732818503e-05, "loss": 0.7037, "step": 28620 }, { "epoch": 0.92, "learning_rate": 1.95812289283811e-05, "loss": 0.7074, "step": 28625 }, { "epoch": 0.92, "learning_rate": 1.958090900439746e-05, "loss": 0.7006, "step": 28630 }, { "epoch": 0.92, "learning_rate": 1.9580588960871577e-05, "loss": 0.6943, "step": 28635 }, { "epoch": 0.92, "learning_rate": 1.9580268797807447e-05, "loss": 0.6954, "step": 28640 }, { "epoch": 0.92, "learning_rate": 1.957994851520906e-05, "loss": 0.7092, "step": 28645 }, { "epoch": 0.92, "learning_rate": 1.9579628113080414e-05, "loss": 0.6977, "step": 28650 }, { "epoch": 0.92, "learning_rate": 1.9579307591425512e-05, "loss": 0.6905, "step": 28655 }, { "epoch": 0.92, "learning_rate": 1.9578986950248345e-05, "loss": 0.6923, "step": 28660 }, { "epoch": 0.92, "learning_rate": 1.957866618955292e-05, "loss": 0.7055, "step": 28665 }, { "epoch": 0.92, "learning_rate": 1.9578345309343234e-05, "loss": 0.7013, "step": 28670 }, { "epoch": 0.92, "learning_rate": 1.9578024309623296e-05, "loss": 0.7019, "step": 28675 }, { "epoch": 0.92, "learning_rate": 1.9577703190397105e-05, "loss": 0.6951, "step": 28680 }, { "epoch": 0.92, "learning_rate": 1.9577381951668673e-05, "loss": 0.6935, "step": 28685 }, { "epoch": 0.92, "learning_rate": 1.9577060593442006e-05, "loss": 0.7024, "step": 28690 }, { "epoch": 0.92, "learning_rate": 1.9576739115721115e-05, "loss": 0.6898, "step": 28695 }, { "epoch": 0.92, "learning_rate": 1.9576417518510007e-05, "loss": 0.7008, "step": 28700 }, { "epoch": 0.92, "learning_rate": 1.95760958018127e-05, "loss": 0.71, "step": 28705 }, { "epoch": 0.92, "learning_rate": 1.9575773965633202e-05, "loss": 0.6978, "step": 28710 }, { "epoch": 0.92, "learning_rate": 1.9575452009975535e-05, "loss": 0.6864, "step": 28715 }, { "epoch": 0.92, "learning_rate": 1.9575129934843712e-05, "loss": 0.7105, "step": 28720 }, { "epoch": 0.92, "learning_rate": 1.9574807740241754e-05, "loss": 0.7031, "step": 28725 }, { "epoch": 0.92, "learning_rate": 1.957448542617368e-05, "loss": 0.7065, "step": 28730 }, { "epoch": 0.92, "learning_rate": 1.957416299264351e-05, "loss": 0.698, "step": 28735 }, { "epoch": 0.92, "learning_rate": 1.9573840439655272e-05, "loss": 0.6977, "step": 28740 }, { "epoch": 0.92, "learning_rate": 1.9573517767212982e-05, "loss": 0.6932, "step": 28745 }, { "epoch": 0.92, "learning_rate": 1.9573194975320672e-05, "loss": 0.7033, "step": 28750 }, { "epoch": 0.92, "learning_rate": 1.9572872063982372e-05, "loss": 0.6968, "step": 28755 }, { "epoch": 0.92, "learning_rate": 1.9572549033202106e-05, "loss": 0.7074, "step": 28760 }, { "epoch": 0.92, "learning_rate": 1.9572225882983903e-05, "loss": 0.6979, "step": 28765 }, { "epoch": 0.92, "learning_rate": 1.9571902613331804e-05, "loss": 0.6879, "step": 28770 }, { "epoch": 0.92, "learning_rate": 1.957157922424983e-05, "loss": 0.7069, "step": 28775 }, { "epoch": 0.92, "learning_rate": 1.9571255715742028e-05, "loss": 0.7023, "step": 28780 }, { "epoch": 0.92, "learning_rate": 1.9570932087812428e-05, "loss": 0.6973, "step": 28785 }, { "epoch": 0.92, "learning_rate": 1.9570608340465066e-05, "loss": 0.6961, "step": 28790 }, { "epoch": 0.92, "learning_rate": 1.9570284473703983e-05, "loss": 0.7064, "step": 28795 }, { "epoch": 0.92, "learning_rate": 1.9569960487533226e-05, "loss": 0.7065, "step": 28800 }, { "epoch": 0.92, "learning_rate": 1.956963638195683e-05, "loss": 0.7045, "step": 28805 }, { "epoch": 0.92, "learning_rate": 1.9569312156978843e-05, "loss": 0.7006, "step": 28810 }, { "epoch": 0.92, "learning_rate": 1.9568987812603307e-05, "loss": 0.7137, "step": 28815 }, { "epoch": 0.92, "learning_rate": 1.956866334883427e-05, "loss": 0.6949, "step": 28820 }, { "epoch": 0.92, "learning_rate": 1.9568338765675786e-05, "loss": 0.6884, "step": 28825 }, { "epoch": 0.92, "learning_rate": 1.9568014063131898e-05, "loss": 0.6997, "step": 28830 }, { "epoch": 0.92, "learning_rate": 1.9567689241206658e-05, "loss": 0.6988, "step": 28835 }, { "epoch": 0.92, "learning_rate": 1.956736429990412e-05, "loss": 0.7049, "step": 28840 }, { "epoch": 0.92, "learning_rate": 1.956703923922834e-05, "loss": 0.6851, "step": 28845 }, { "epoch": 0.92, "learning_rate": 1.9566714059183373e-05, "loss": 0.6901, "step": 28850 }, { "epoch": 0.92, "learning_rate": 1.9566388759773277e-05, "loss": 0.6993, "step": 28855 }, { "epoch": 0.92, "learning_rate": 1.9566063341002106e-05, "loss": 0.7113, "step": 28860 }, { "epoch": 0.92, "learning_rate": 1.9565737802873927e-05, "loss": 0.7004, "step": 28865 }, { "epoch": 0.92, "learning_rate": 1.9565412145392796e-05, "loss": 0.7029, "step": 28870 }, { "epoch": 0.92, "learning_rate": 1.956508636856278e-05, "loss": 0.7187, "step": 28875 }, { "epoch": 0.92, "learning_rate": 1.9564760472387944e-05, "loss": 0.6982, "step": 28880 }, { "epoch": 0.92, "learning_rate": 1.956443445687235e-05, "loss": 0.6879, "step": 28885 }, { "epoch": 0.92, "learning_rate": 1.956410832202007e-05, "loss": 0.705, "step": 28890 }, { "epoch": 0.92, "learning_rate": 1.9563782067835174e-05, "loss": 0.7103, "step": 28895 }, { "epoch": 0.92, "learning_rate": 1.956345569432173e-05, "loss": 0.6996, "step": 28900 }, { "epoch": 0.92, "learning_rate": 1.9563129201483807e-05, "loss": 0.6929, "step": 28905 }, { "epoch": 0.93, "learning_rate": 1.9562802589325488e-05, "loss": 0.6989, "step": 28910 }, { "epoch": 0.93, "learning_rate": 1.956247585785084e-05, "loss": 0.7083, "step": 28915 }, { "epoch": 0.93, "learning_rate": 1.956214900706394e-05, "loss": 0.7114, "step": 28920 }, { "epoch": 0.93, "learning_rate": 1.956182203696887e-05, "loss": 0.6912, "step": 28925 }, { "epoch": 0.93, "learning_rate": 1.956149494756971e-05, "loss": 0.6995, "step": 28930 }, { "epoch": 0.93, "learning_rate": 1.9561167738870538e-05, "loss": 0.7179, "step": 28935 }, { "epoch": 0.93, "learning_rate": 1.956084041087544e-05, "loss": 0.7051, "step": 28940 }, { "epoch": 0.93, "learning_rate": 1.9560512963588495e-05, "loss": 0.7009, "step": 28945 }, { "epoch": 0.93, "learning_rate": 1.9560185397013794e-05, "loss": 0.6937, "step": 28950 }, { "epoch": 0.93, "learning_rate": 1.955985771115542e-05, "loss": 0.6949, "step": 28955 }, { "epoch": 0.93, "learning_rate": 1.9559529906017466e-05, "loss": 0.7006, "step": 28960 }, { "epoch": 0.93, "learning_rate": 1.9559201981604016e-05, "loss": 0.7012, "step": 28965 }, { "epoch": 0.93, "learning_rate": 1.955887393791917e-05, "loss": 0.6984, "step": 28970 }, { "epoch": 0.93, "learning_rate": 1.9558545774967007e-05, "loss": 0.691, "step": 28975 }, { "epoch": 0.93, "learning_rate": 1.9558217492751637e-05, "loss": 0.6967, "step": 28980 }, { "epoch": 0.93, "learning_rate": 1.955788909127715e-05, "loss": 0.6892, "step": 28985 }, { "epoch": 0.93, "learning_rate": 1.955756057054764e-05, "loss": 0.6912, "step": 28990 }, { "epoch": 0.93, "learning_rate": 1.9557231930567212e-05, "loss": 0.6891, "step": 28995 }, { "epoch": 0.93, "learning_rate": 1.9556903171339963e-05, "loss": 0.6953, "step": 29000 }, { "epoch": 0.93, "learning_rate": 1.955657429286999e-05, "loss": 0.7024, "step": 29005 }, { "epoch": 0.93, "learning_rate": 1.9556245295161408e-05, "loss": 0.6928, "step": 29010 }, { "epoch": 0.93, "learning_rate": 1.9555916178218315e-05, "loss": 0.6899, "step": 29015 }, { "epoch": 0.93, "learning_rate": 1.955558694204482e-05, "loss": 0.6992, "step": 29020 }, { "epoch": 0.93, "learning_rate": 1.9555257586645026e-05, "loss": 0.6996, "step": 29025 }, { "epoch": 0.93, "learning_rate": 1.9554928112023046e-05, "loss": 0.7109, "step": 29030 }, { "epoch": 0.93, "learning_rate": 1.955459851818299e-05, "loss": 0.6915, "step": 29035 }, { "epoch": 0.93, "learning_rate": 1.9554268805128973e-05, "loss": 0.6912, "step": 29040 }, { "epoch": 0.93, "learning_rate": 1.9553938972865106e-05, "loss": 0.6986, "step": 29045 }, { "epoch": 0.93, "learning_rate": 1.9553609021395507e-05, "loss": 0.6931, "step": 29050 }, { "epoch": 0.93, "learning_rate": 1.955327895072429e-05, "loss": 0.7033, "step": 29055 }, { "epoch": 0.93, "learning_rate": 1.955294876085557e-05, "loss": 0.6862, "step": 29060 }, { "epoch": 0.93, "learning_rate": 1.955261845179348e-05, "loss": 0.6848, "step": 29065 }, { "epoch": 0.93, "learning_rate": 1.955228802354212e-05, "loss": 0.7036, "step": 29070 }, { "epoch": 0.93, "learning_rate": 1.9551957476105637e-05, "loss": 0.6989, "step": 29075 }, { "epoch": 0.93, "learning_rate": 1.955162680948814e-05, "loss": 0.6985, "step": 29080 }, { "epoch": 0.93, "learning_rate": 1.9551296023693754e-05, "loss": 0.702, "step": 29085 }, { "epoch": 0.93, "learning_rate": 1.9550965118726613e-05, "loss": 0.7026, "step": 29090 }, { "epoch": 0.93, "learning_rate": 1.9550634094590844e-05, "loss": 0.7079, "step": 29095 }, { "epoch": 0.93, "learning_rate": 1.955030295129058e-05, "loss": 0.6955, "step": 29100 }, { "epoch": 0.93, "learning_rate": 1.9549971688829946e-05, "loss": 0.7023, "step": 29105 }, { "epoch": 0.93, "learning_rate": 1.954964030721308e-05, "loss": 0.6975, "step": 29110 }, { "epoch": 0.93, "learning_rate": 1.9549308806444112e-05, "loss": 0.6999, "step": 29115 }, { "epoch": 0.93, "learning_rate": 1.9548977186527184e-05, "loss": 0.6993, "step": 29120 }, { "epoch": 0.93, "learning_rate": 1.9548645447466433e-05, "loss": 0.6932, "step": 29125 }, { "epoch": 0.93, "learning_rate": 1.954831358926599e-05, "loss": 0.6929, "step": 29130 }, { "epoch": 0.93, "learning_rate": 1.9547981611930006e-05, "loss": 0.6993, "step": 29135 }, { "epoch": 0.93, "learning_rate": 1.9547649515462618e-05, "loss": 0.6965, "step": 29140 }, { "epoch": 0.93, "learning_rate": 1.954731729986797e-05, "loss": 0.7047, "step": 29145 }, { "epoch": 0.93, "learning_rate": 1.9546984965150212e-05, "loss": 0.6979, "step": 29150 }, { "epoch": 0.93, "learning_rate": 1.954665251131348e-05, "loss": 0.6965, "step": 29155 }, { "epoch": 0.93, "learning_rate": 1.9546319938361935e-05, "loss": 0.7002, "step": 29160 }, { "epoch": 0.93, "learning_rate": 1.9545987246299715e-05, "loss": 0.7062, "step": 29165 }, { "epoch": 0.93, "learning_rate": 1.9545654435130975e-05, "loss": 0.7129, "step": 29170 }, { "epoch": 0.93, "learning_rate": 1.9545321504859875e-05, "loss": 0.7058, "step": 29175 }, { "epoch": 0.93, "learning_rate": 1.9544988455490555e-05, "loss": 0.6949, "step": 29180 }, { "epoch": 0.93, "learning_rate": 1.954465528702718e-05, "loss": 0.6898, "step": 29185 }, { "epoch": 0.93, "learning_rate": 1.9544321999473907e-05, "loss": 0.6894, "step": 29190 }, { "epoch": 0.93, "learning_rate": 1.9543988592834892e-05, "loss": 0.7039, "step": 29195 }, { "epoch": 0.93, "learning_rate": 1.9543655067114294e-05, "loss": 0.6905, "step": 29200 }, { "epoch": 0.93, "learning_rate": 1.9543321422316276e-05, "loss": 0.7155, "step": 29205 }, { "epoch": 0.93, "learning_rate": 1.9542987658445002e-05, "loss": 0.6957, "step": 29210 }, { "epoch": 0.93, "learning_rate": 1.9542653775504633e-05, "loss": 0.6958, "step": 29215 }, { "epoch": 0.94, "learning_rate": 1.9542319773499337e-05, "loss": 0.7128, "step": 29220 }, { "epoch": 0.94, "learning_rate": 1.9541985652433283e-05, "loss": 0.6959, "step": 29225 }, { "epoch": 0.94, "learning_rate": 1.9541651412310637e-05, "loss": 0.6881, "step": 29230 }, { "epoch": 0.94, "learning_rate": 1.9541317053135575e-05, "loss": 0.7027, "step": 29235 }, { "epoch": 0.94, "learning_rate": 1.9540982574912258e-05, "loss": 0.7084, "step": 29240 }, { "epoch": 0.94, "learning_rate": 1.954064797764487e-05, "loss": 0.6854, "step": 29245 }, { "epoch": 0.94, "learning_rate": 1.954031326133758e-05, "loss": 0.6922, "step": 29250 }, { "epoch": 0.94, "learning_rate": 1.953997842599457e-05, "loss": 0.6835, "step": 29255 }, { "epoch": 0.94, "learning_rate": 1.9539643471620006e-05, "loss": 0.6871, "step": 29260 }, { "epoch": 0.94, "learning_rate": 1.9539308398218083e-05, "loss": 0.699, "step": 29265 }, { "epoch": 0.94, "learning_rate": 1.9538973205792967e-05, "loss": 0.7041, "step": 29270 }, { "epoch": 0.94, "learning_rate": 1.9538637894348852e-05, "loss": 0.688, "step": 29275 }, { "epoch": 0.94, "learning_rate": 1.9538302463889914e-05, "loss": 0.6984, "step": 29280 }, { "epoch": 0.94, "learning_rate": 1.9537966914420343e-05, "loss": 0.7134, "step": 29285 }, { "epoch": 0.94, "learning_rate": 1.9537631245944323e-05, "loss": 0.7064, "step": 29290 }, { "epoch": 0.94, "learning_rate": 1.9537295458466042e-05, "loss": 0.7078, "step": 29295 }, { "epoch": 0.94, "learning_rate": 1.9536959551989692e-05, "loss": 0.6979, "step": 29300 }, { "epoch": 0.94, "learning_rate": 1.953662352651946e-05, "loss": 0.6999, "step": 29305 }, { "epoch": 0.94, "learning_rate": 1.9536287382059543e-05, "loss": 0.6946, "step": 29310 }, { "epoch": 0.94, "learning_rate": 1.953595111861413e-05, "loss": 0.6951, "step": 29315 }, { "epoch": 0.94, "learning_rate": 1.9535614736187425e-05, "loss": 0.6773, "step": 29320 }, { "epoch": 0.94, "learning_rate": 1.953527823478362e-05, "loss": 0.6963, "step": 29325 }, { "epoch": 0.94, "learning_rate": 1.953494161440691e-05, "loss": 0.7047, "step": 29330 }, { "epoch": 0.94, "learning_rate": 1.95346048750615e-05, "loss": 0.6947, "step": 29335 }, { "epoch": 0.94, "learning_rate": 1.953426801675159e-05, "loss": 0.7114, "step": 29340 }, { "epoch": 0.94, "learning_rate": 1.9533931039481386e-05, "loss": 0.6926, "step": 29345 }, { "epoch": 0.94, "learning_rate": 1.9533593943255087e-05, "loss": 0.6994, "step": 29350 }, { "epoch": 0.94, "learning_rate": 1.95332567280769e-05, "loss": 0.6939, "step": 29355 }, { "epoch": 0.94, "learning_rate": 1.953291939395104e-05, "loss": 0.7154, "step": 29360 }, { "epoch": 0.94, "learning_rate": 1.9532581940881706e-05, "loss": 0.6941, "step": 29365 }, { "epoch": 0.94, "learning_rate": 1.9532244368873114e-05, "loss": 0.6986, "step": 29370 }, { "epoch": 0.94, "learning_rate": 1.9531906677929472e-05, "loss": 0.697, "step": 29375 }, { "epoch": 0.94, "learning_rate": 1.9531568868054997e-05, "loss": 0.6989, "step": 29380 }, { "epoch": 0.94, "learning_rate": 1.9531230939253906e-05, "loss": 0.6795, "step": 29385 }, { "epoch": 0.94, "learning_rate": 1.9530892891530408e-05, "loss": 0.6862, "step": 29390 }, { "epoch": 0.94, "learning_rate": 1.953055472488873e-05, "loss": 0.6959, "step": 29395 }, { "epoch": 0.94, "learning_rate": 1.9530216439333085e-05, "loss": 0.7144, "step": 29400 }, { "epoch": 0.94, "learning_rate": 1.9529878034867692e-05, "loss": 0.6926, "step": 29405 }, { "epoch": 0.94, "learning_rate": 1.9529539511496776e-05, "loss": 0.7083, "step": 29410 }, { "epoch": 0.94, "learning_rate": 1.9529200869224566e-05, "loss": 0.6962, "step": 29415 }, { "epoch": 0.94, "learning_rate": 1.952886210805528e-05, "loss": 0.6932, "step": 29420 }, { "epoch": 0.94, "learning_rate": 1.952852322799315e-05, "loss": 0.6985, "step": 29425 }, { "epoch": 0.94, "learning_rate": 1.9528184229042398e-05, "loss": 0.6977, "step": 29430 }, { "epoch": 0.94, "learning_rate": 1.952784511120726e-05, "loss": 0.7137, "step": 29435 }, { "epoch": 0.94, "learning_rate": 1.9527505874491962e-05, "loss": 0.6853, "step": 29440 }, { "epoch": 0.94, "learning_rate": 1.952716651890074e-05, "loss": 0.6881, "step": 29445 }, { "epoch": 0.94, "learning_rate": 1.9526827044437833e-05, "loss": 0.6913, "step": 29450 }, { "epoch": 0.94, "learning_rate": 1.9526487451107465e-05, "loss": 0.702, "step": 29455 }, { "epoch": 0.94, "learning_rate": 1.9526147738913882e-05, "loss": 0.7016, "step": 29460 }, { "epoch": 0.94, "learning_rate": 1.9525807907861322e-05, "loss": 0.71, "step": 29465 }, { "epoch": 0.94, "learning_rate": 1.952546795795402e-05, "loss": 0.6946, "step": 29470 }, { "epoch": 0.94, "learning_rate": 1.952512788919622e-05, "loss": 0.7067, "step": 29475 }, { "epoch": 0.94, "learning_rate": 1.9524787701592167e-05, "loss": 0.6961, "step": 29480 }, { "epoch": 0.94, "learning_rate": 1.9524447395146105e-05, "loss": 0.6901, "step": 29485 }, { "epoch": 0.94, "learning_rate": 1.952410696986228e-05, "loss": 0.6842, "step": 29490 }, { "epoch": 0.94, "learning_rate": 1.9523766425744937e-05, "loss": 0.6856, "step": 29495 }, { "epoch": 0.94, "learning_rate": 1.9523425762798328e-05, "loss": 0.695, "step": 29500 }, { "epoch": 0.94, "learning_rate": 1.9523084981026704e-05, "loss": 0.6841, "step": 29505 }, { "epoch": 0.94, "learning_rate": 1.9522744080434312e-05, "loss": 0.6967, "step": 29510 }, { "epoch": 0.94, "learning_rate": 1.9522403061025413e-05, "loss": 0.6885, "step": 29515 }, { "epoch": 0.94, "learning_rate": 1.9522061922804253e-05, "loss": 0.7001, "step": 29520 }, { "epoch": 0.94, "learning_rate": 1.9521720665775098e-05, "loss": 0.701, "step": 29525 }, { "epoch": 0.94, "learning_rate": 1.95213792899422e-05, "loss": 0.6877, "step": 29530 }, { "epoch": 0.95, "learning_rate": 1.952103779530982e-05, "loss": 0.6861, "step": 29535 }, { "epoch": 0.95, "learning_rate": 1.9520696181882216e-05, "loss": 0.6908, "step": 29540 }, { "epoch": 0.95, "learning_rate": 1.9520354449663653e-05, "loss": 0.7054, "step": 29545 }, { "epoch": 0.95, "learning_rate": 1.9520012598658397e-05, "loss": 0.6925, "step": 29550 }, { "epoch": 0.95, "learning_rate": 1.9519670628870708e-05, "loss": 0.6985, "step": 29555 }, { "epoch": 0.95, "learning_rate": 1.951932854030486e-05, "loss": 0.7116, "step": 29560 }, { "epoch": 0.95, "learning_rate": 1.951898633296511e-05, "loss": 0.7004, "step": 29565 }, { "epoch": 0.95, "learning_rate": 1.951864400685574e-05, "loss": 0.7016, "step": 29570 }, { "epoch": 0.95, "learning_rate": 1.9518301561981016e-05, "loss": 0.6956, "step": 29575 }, { "epoch": 0.95, "learning_rate": 1.951795899834521e-05, "loss": 0.693, "step": 29580 }, { "epoch": 0.95, "learning_rate": 1.9517616315952598e-05, "loss": 0.7004, "step": 29585 }, { "epoch": 0.95, "learning_rate": 1.951727351480745e-05, "loss": 0.6908, "step": 29590 }, { "epoch": 0.95, "learning_rate": 1.9516930594914053e-05, "loss": 0.7007, "step": 29595 }, { "epoch": 0.95, "learning_rate": 1.9516587556276677e-05, "loss": 0.6948, "step": 29600 }, { "epoch": 0.95, "learning_rate": 1.9516244398899607e-05, "loss": 0.7053, "step": 29605 }, { "epoch": 0.95, "learning_rate": 1.9515901122787126e-05, "loss": 0.7007, "step": 29610 }, { "epoch": 0.95, "learning_rate": 1.9515557727943512e-05, "loss": 0.6967, "step": 29615 }, { "epoch": 0.95, "learning_rate": 1.9515214214373052e-05, "loss": 0.6876, "step": 29620 }, { "epoch": 0.95, "learning_rate": 1.951487058208003e-05, "loss": 0.7033, "step": 29625 }, { "epoch": 0.95, "learning_rate": 1.951452683106874e-05, "loss": 0.6975, "step": 29630 }, { "epoch": 0.95, "learning_rate": 1.9514182961343463e-05, "loss": 0.6997, "step": 29635 }, { "epoch": 0.95, "learning_rate": 1.9513838972908498e-05, "loss": 0.7077, "step": 29640 }, { "epoch": 0.95, "learning_rate": 1.951349486576813e-05, "loss": 0.704, "step": 29645 }, { "epoch": 0.95, "learning_rate": 1.951315063992665e-05, "loss": 0.7011, "step": 29650 }, { "epoch": 0.95, "learning_rate": 1.951280629538836e-05, "loss": 0.6926, "step": 29655 }, { "epoch": 0.95, "learning_rate": 1.9512461832157554e-05, "loss": 0.6906, "step": 29660 }, { "epoch": 0.95, "learning_rate": 1.9512117250238533e-05, "loss": 0.6801, "step": 29665 }, { "epoch": 0.95, "learning_rate": 1.951177254963559e-05, "loss": 0.7152, "step": 29670 }, { "epoch": 0.95, "learning_rate": 1.951142773035303e-05, "loss": 0.702, "step": 29675 }, { "epoch": 0.95, "learning_rate": 1.9511082792395152e-05, "loss": 0.6997, "step": 29680 }, { "epoch": 0.95, "learning_rate": 1.9510737735766266e-05, "loss": 0.6987, "step": 29685 }, { "epoch": 0.95, "learning_rate": 1.951039256047067e-05, "loss": 0.6907, "step": 29690 }, { "epoch": 0.95, "learning_rate": 1.9510047266512676e-05, "loss": 0.6991, "step": 29695 }, { "epoch": 0.95, "learning_rate": 1.950970185389659e-05, "loss": 0.7025, "step": 29700 }, { "epoch": 0.95, "learning_rate": 1.9509356322626728e-05, "loss": 0.6759, "step": 29705 }, { "epoch": 0.95, "learning_rate": 1.950901067270739e-05, "loss": 0.6858, "step": 29710 }, { "epoch": 0.95, "learning_rate": 1.9508664904142897e-05, "loss": 0.6951, "step": 29715 }, { "epoch": 0.95, "learning_rate": 1.950831901693756e-05, "loss": 0.693, "step": 29720 }, { "epoch": 0.95, "learning_rate": 1.950797301109569e-05, "loss": 0.6941, "step": 29725 }, { "epoch": 0.95, "learning_rate": 1.9507626886621618e-05, "loss": 0.6987, "step": 29730 }, { "epoch": 0.95, "learning_rate": 1.950728064351965e-05, "loss": 0.695, "step": 29735 }, { "epoch": 0.95, "learning_rate": 1.950693428179411e-05, "loss": 0.6885, "step": 29740 }, { "epoch": 0.95, "learning_rate": 1.950658780144932e-05, "loss": 0.7051, "step": 29745 }, { "epoch": 0.95, "learning_rate": 1.95062412024896e-05, "loss": 0.697, "step": 29750 }, { "epoch": 0.95, "learning_rate": 1.950589448491928e-05, "loss": 0.6886, "step": 29755 }, { "epoch": 0.95, "learning_rate": 1.9505547648742687e-05, "loss": 0.6947, "step": 29760 }, { "epoch": 0.95, "learning_rate": 1.950520069396414e-05, "loss": 0.6936, "step": 29765 }, { "epoch": 0.95, "learning_rate": 1.9504853620587977e-05, "loss": 0.6851, "step": 29770 }, { "epoch": 0.95, "learning_rate": 1.950450642861852e-05, "loss": 0.6811, "step": 29775 }, { "epoch": 0.95, "learning_rate": 1.950415911806011e-05, "loss": 0.6854, "step": 29780 }, { "epoch": 0.95, "learning_rate": 1.950381168891707e-05, "loss": 0.6876, "step": 29785 }, { "epoch": 0.95, "learning_rate": 1.9503464141193747e-05, "loss": 0.7096, "step": 29790 }, { "epoch": 0.95, "learning_rate": 1.9503116474894467e-05, "loss": 0.6945, "step": 29795 }, { "epoch": 0.95, "learning_rate": 1.9502768690023574e-05, "loss": 0.6954, "step": 29800 }, { "epoch": 0.95, "learning_rate": 1.9502420786585406e-05, "loss": 0.6979, "step": 29805 }, { "epoch": 0.95, "learning_rate": 1.9502072764584303e-05, "loss": 0.6893, "step": 29810 }, { "epoch": 0.95, "learning_rate": 1.9501724624024608e-05, "loss": 0.6898, "step": 29815 }, { "epoch": 0.95, "learning_rate": 1.9501376364910664e-05, "loss": 0.6868, "step": 29820 }, { "epoch": 0.95, "learning_rate": 1.9501027987246813e-05, "loss": 0.7001, "step": 29825 }, { "epoch": 0.95, "learning_rate": 1.950067949103741e-05, "loss": 0.692, "step": 29830 }, { "epoch": 0.95, "learning_rate": 1.9500330876286798e-05, "loss": 0.7014, "step": 29835 }, { "epoch": 0.95, "learning_rate": 1.9499982142999325e-05, "loss": 0.6905, "step": 29840 }, { "epoch": 0.96, "learning_rate": 1.949963329117935e-05, "loss": 0.6934, "step": 29845 }, { "epoch": 0.96, "learning_rate": 1.9499284320831213e-05, "loss": 0.6943, "step": 29850 }, { "epoch": 0.96, "learning_rate": 1.949893523195928e-05, "loss": 0.7038, "step": 29855 }, { "epoch": 0.96, "learning_rate": 1.94985860245679e-05, "loss": 0.6836, "step": 29860 }, { "epoch": 0.96, "learning_rate": 1.9498236698661433e-05, "loss": 0.7001, "step": 29865 }, { "epoch": 0.96, "learning_rate": 1.9497887254244237e-05, "loss": 0.6944, "step": 29870 }, { "epoch": 0.96, "learning_rate": 1.949753769132067e-05, "loss": 0.7058, "step": 29875 }, { "epoch": 0.96, "learning_rate": 1.9497188009895097e-05, "loss": 0.6932, "step": 29880 }, { "epoch": 0.96, "learning_rate": 1.9496838209971878e-05, "loss": 0.6916, "step": 29885 }, { "epoch": 0.96, "learning_rate": 1.949648829155538e-05, "loss": 0.6858, "step": 29890 }, { "epoch": 0.96, "learning_rate": 1.9496138254649968e-05, "loss": 0.6954, "step": 29895 }, { "epoch": 0.96, "learning_rate": 1.9495788099260008e-05, "loss": 0.694, "step": 29900 }, { "epoch": 0.96, "learning_rate": 1.949543782538987e-05, "loss": 0.6968, "step": 29905 }, { "epoch": 0.96, "learning_rate": 1.9495087433043928e-05, "loss": 0.7111, "step": 29910 }, { "epoch": 0.96, "learning_rate": 1.9494736922226546e-05, "loss": 0.6957, "step": 29915 }, { "epoch": 0.96, "learning_rate": 1.9494386292942102e-05, "loss": 0.7045, "step": 29920 }, { "epoch": 0.96, "learning_rate": 1.9494035545194975e-05, "loss": 0.6927, "step": 29925 }, { "epoch": 0.96, "learning_rate": 1.9493684678989534e-05, "loss": 0.696, "step": 29930 }, { "epoch": 0.96, "learning_rate": 1.9493333694330158e-05, "loss": 0.7051, "step": 29935 }, { "epoch": 0.96, "learning_rate": 1.949298259122123e-05, "loss": 0.6936, "step": 29940 }, { "epoch": 0.96, "learning_rate": 1.949263136966713e-05, "loss": 0.6895, "step": 29945 }, { "epoch": 0.96, "learning_rate": 1.9492280029672237e-05, "loss": 0.6987, "step": 29950 }, { "epoch": 0.96, "learning_rate": 1.9491928571240936e-05, "loss": 0.6972, "step": 29955 }, { "epoch": 0.96, "learning_rate": 1.9491576994377618e-05, "loss": 0.6918, "step": 29960 }, { "epoch": 0.96, "learning_rate": 1.949122529908666e-05, "loss": 0.6971, "step": 29965 }, { "epoch": 0.96, "learning_rate": 1.9490873485372457e-05, "loss": 0.6913, "step": 29970 }, { "epoch": 0.96, "learning_rate": 1.9490521553239397e-05, "loss": 0.6963, "step": 29975 }, { "epoch": 0.96, "learning_rate": 1.949016950269187e-05, "loss": 0.6921, "step": 29980 }, { "epoch": 0.96, "learning_rate": 1.9489817333734265e-05, "loss": 0.6933, "step": 29985 }, { "epoch": 0.96, "learning_rate": 1.9489465046370986e-05, "loss": 0.6894, "step": 29990 }, { "epoch": 0.96, "learning_rate": 1.948911264060642e-05, "loss": 0.6889, "step": 29995 }, { "epoch": 0.96, "learning_rate": 1.9488760116444966e-05, "loss": 0.7077, "step": 30000 }, { "epoch": 0.96, "learning_rate": 1.9488407473891024e-05, "loss": 0.701, "step": 30005 }, { "epoch": 0.96, "learning_rate": 1.9488054712948995e-05, "loss": 0.6996, "step": 30010 }, { "epoch": 0.96, "learning_rate": 1.948770183362328e-05, "loss": 0.6912, "step": 30015 }, { "epoch": 0.96, "learning_rate": 1.9487348835918273e-05, "loss": 0.6934, "step": 30020 }, { "epoch": 0.96, "learning_rate": 1.9486995719838392e-05, "loss": 0.7003, "step": 30025 }, { "epoch": 0.96, "learning_rate": 1.9486642485388035e-05, "loss": 0.7021, "step": 30030 }, { "epoch": 0.96, "learning_rate": 1.9486289132571613e-05, "loss": 0.6917, "step": 30035 }, { "epoch": 0.96, "learning_rate": 1.9485935661393532e-05, "loss": 0.688, "step": 30040 }, { "epoch": 0.96, "learning_rate": 1.9485582071858202e-05, "loss": 0.6983, "step": 30045 }, { "epoch": 0.96, "learning_rate": 1.9485228363970038e-05, "loss": 0.6834, "step": 30050 }, { "epoch": 0.96, "learning_rate": 1.9484874537733448e-05, "loss": 0.7053, "step": 30055 }, { "epoch": 0.96, "learning_rate": 1.9484520593152854e-05, "loss": 0.6945, "step": 30060 }, { "epoch": 0.96, "learning_rate": 1.9484166530232666e-05, "loss": 0.6912, "step": 30065 }, { "epoch": 0.96, "learning_rate": 1.9483812348977307e-05, "loss": 0.6887, "step": 30070 }, { "epoch": 0.96, "learning_rate": 1.9483458049391188e-05, "loss": 0.6833, "step": 30075 }, { "epoch": 0.96, "learning_rate": 1.948310363147874e-05, "loss": 0.7071, "step": 30080 }, { "epoch": 0.96, "learning_rate": 1.948274909524438e-05, "loss": 0.6747, "step": 30085 }, { "epoch": 0.96, "learning_rate": 1.948239444069253e-05, "loss": 0.6994, "step": 30090 }, { "epoch": 0.96, "learning_rate": 1.9482039667827614e-05, "loss": 0.6911, "step": 30095 }, { "epoch": 0.96, "learning_rate": 1.948168477665406e-05, "loss": 0.6863, "step": 30100 }, { "epoch": 0.96, "learning_rate": 1.9481329767176303e-05, "loss": 0.6882, "step": 30105 }, { "epoch": 0.96, "learning_rate": 1.9480974639398762e-05, "loss": 0.682, "step": 30110 }, { "epoch": 0.96, "learning_rate": 1.9480619393325875e-05, "loss": 0.6924, "step": 30115 }, { "epoch": 0.96, "learning_rate": 1.948026402896207e-05, "loss": 0.6911, "step": 30120 }, { "epoch": 0.96, "learning_rate": 1.9479908546311783e-05, "loss": 0.687, "step": 30125 }, { "epoch": 0.96, "learning_rate": 1.9479552945379454e-05, "loss": 0.6909, "step": 30130 }, { "epoch": 0.96, "learning_rate": 1.947919722616951e-05, "loss": 0.6996, "step": 30135 }, { "epoch": 0.96, "learning_rate": 1.9478841388686397e-05, "loss": 0.6915, "step": 30140 }, { "epoch": 0.96, "learning_rate": 1.9478485432934554e-05, "loss": 0.686, "step": 30145 }, { "epoch": 0.96, "learning_rate": 1.947812935891842e-05, "loss": 0.6933, "step": 30150 }, { "epoch": 0.96, "learning_rate": 1.9477773166642434e-05, "loss": 0.6796, "step": 30155 }, { "epoch": 0.97, "learning_rate": 1.9477416856111048e-05, "loss": 0.6922, "step": 30160 }, { "epoch": 0.97, "learning_rate": 1.9477060427328705e-05, "loss": 0.6911, "step": 30165 }, { "epoch": 0.97, "learning_rate": 1.9476703880299852e-05, "loss": 0.6833, "step": 30170 }, { "epoch": 0.97, "learning_rate": 1.947634721502894e-05, "loss": 0.7039, "step": 30175 }, { "epoch": 0.97, "learning_rate": 1.947599043152041e-05, "loss": 0.701, "step": 30180 }, { "epoch": 0.97, "learning_rate": 1.9475633529778726e-05, "loss": 0.7022, "step": 30185 }, { "epoch": 0.97, "learning_rate": 1.9475276509808332e-05, "loss": 0.6924, "step": 30190 }, { "epoch": 0.97, "learning_rate": 1.9474919371613687e-05, "loss": 0.7013, "step": 30195 }, { "epoch": 0.97, "learning_rate": 1.9474562115199246e-05, "loss": 0.6909, "step": 30200 }, { "epoch": 0.97, "learning_rate": 1.9474204740569466e-05, "loss": 0.688, "step": 30205 }, { "epoch": 0.97, "learning_rate": 1.947384724772881e-05, "loss": 0.6774, "step": 30210 }, { "epoch": 0.97, "learning_rate": 1.947348963668173e-05, "loss": 0.6947, "step": 30215 }, { "epoch": 0.97, "learning_rate": 1.9473131907432695e-05, "loss": 0.7061, "step": 30220 }, { "epoch": 0.97, "learning_rate": 1.947277405998617e-05, "loss": 0.6943, "step": 30225 }, { "epoch": 0.97, "learning_rate": 1.947241609434661e-05, "loss": 0.6904, "step": 30230 }, { "epoch": 0.97, "learning_rate": 1.947205801051849e-05, "loss": 0.683, "step": 30235 }, { "epoch": 0.97, "learning_rate": 1.9471699808506276e-05, "loss": 0.7006, "step": 30240 }, { "epoch": 0.97, "learning_rate": 1.947134148831444e-05, "loss": 0.7021, "step": 30245 }, { "epoch": 0.97, "learning_rate": 1.9470983049947446e-05, "loss": 0.6998, "step": 30250 }, { "epoch": 0.97, "learning_rate": 1.947062449340977e-05, "loss": 0.6938, "step": 30255 }, { "epoch": 0.97, "learning_rate": 1.9470265818705885e-05, "loss": 0.6973, "step": 30260 }, { "epoch": 0.97, "learning_rate": 1.946990702584027e-05, "loss": 0.7047, "step": 30265 }, { "epoch": 0.97, "learning_rate": 1.9469548114817395e-05, "loss": 0.6991, "step": 30270 }, { "epoch": 0.97, "learning_rate": 1.9469189085641743e-05, "loss": 0.6845, "step": 30275 }, { "epoch": 0.97, "learning_rate": 1.9468829938317798e-05, "loss": 0.6874, "step": 30280 }, { "epoch": 0.97, "learning_rate": 1.9468470672850027e-05, "loss": 0.6912, "step": 30285 }, { "epoch": 0.97, "learning_rate": 1.9468111289242925e-05, "loss": 0.6955, "step": 30290 }, { "epoch": 0.97, "learning_rate": 1.9467751787500974e-05, "loss": 0.7039, "step": 30295 }, { "epoch": 0.97, "learning_rate": 1.9467392167628655e-05, "loss": 0.6855, "step": 30300 }, { "epoch": 0.97, "learning_rate": 1.9467032429630462e-05, "loss": 0.6909, "step": 30305 }, { "epoch": 0.97, "learning_rate": 1.9466672573510875e-05, "loss": 0.6952, "step": 30310 }, { "epoch": 0.97, "learning_rate": 1.946631259927439e-05, "loss": 0.6877, "step": 30315 }, { "epoch": 0.97, "learning_rate": 1.9465952506925497e-05, "loss": 0.7036, "step": 30320 }, { "epoch": 0.97, "learning_rate": 1.946559229646869e-05, "loss": 0.6774, "step": 30325 }, { "epoch": 0.97, "learning_rate": 1.946523196790846e-05, "loss": 0.6999, "step": 30330 }, { "epoch": 0.97, "learning_rate": 1.9464871521249305e-05, "loss": 0.6767, "step": 30335 }, { "epoch": 0.97, "learning_rate": 1.9464510956495724e-05, "loss": 0.6865, "step": 30340 }, { "epoch": 0.97, "learning_rate": 1.9464150273652214e-05, "loss": 0.6874, "step": 30345 }, { "epoch": 0.97, "learning_rate": 1.9463789472723272e-05, "loss": 0.6899, "step": 30350 }, { "epoch": 0.97, "learning_rate": 1.9463428553713407e-05, "loss": 0.6848, "step": 30355 }, { "epoch": 0.97, "learning_rate": 1.9463067516627116e-05, "loss": 0.692, "step": 30360 }, { "epoch": 0.97, "learning_rate": 1.9462706361468907e-05, "loss": 0.6968, "step": 30365 }, { "epoch": 0.97, "learning_rate": 1.9462345088243287e-05, "loss": 0.7147, "step": 30370 }, { "epoch": 0.97, "learning_rate": 1.946198369695476e-05, "loss": 0.6994, "step": 30375 }, { "epoch": 0.97, "learning_rate": 1.9461622187607837e-05, "loss": 0.6918, "step": 30380 }, { "epoch": 0.97, "learning_rate": 1.946126056020703e-05, "loss": 0.6965, "step": 30385 }, { "epoch": 0.97, "learning_rate": 1.9460898814756848e-05, "loss": 0.7039, "step": 30390 }, { "epoch": 0.97, "learning_rate": 1.9460536951261808e-05, "loss": 0.6973, "step": 30395 }, { "epoch": 0.97, "learning_rate": 1.946017496972642e-05, "loss": 0.6834, "step": 30400 }, { "epoch": 0.97, "learning_rate": 1.945981287015521e-05, "loss": 0.6906, "step": 30405 }, { "epoch": 0.97, "learning_rate": 1.9459450652552684e-05, "loss": 0.7102, "step": 30410 }, { "epoch": 0.97, "learning_rate": 1.9459088316923373e-05, "loss": 0.6969, "step": 30415 }, { "epoch": 0.97, "learning_rate": 1.9458725863271784e-05, "loss": 0.6979, "step": 30420 }, { "epoch": 0.97, "learning_rate": 1.9458363291602455e-05, "loss": 0.6963, "step": 30425 }, { "epoch": 0.97, "learning_rate": 1.94580006019199e-05, "loss": 0.6908, "step": 30430 }, { "epoch": 0.97, "learning_rate": 1.9457637794228645e-05, "loss": 0.6882, "step": 30435 }, { "epoch": 0.97, "learning_rate": 1.9457274868533218e-05, "loss": 0.6861, "step": 30440 }, { "epoch": 0.97, "learning_rate": 1.945691182483815e-05, "loss": 0.7041, "step": 30445 }, { "epoch": 0.97, "learning_rate": 1.9456548663147966e-05, "loss": 0.6929, "step": 30450 }, { "epoch": 0.97, "learning_rate": 1.94561853834672e-05, "loss": 0.6983, "step": 30455 }, { "epoch": 0.97, "learning_rate": 1.9455821985800388e-05, "loss": 0.6902, "step": 30460 }, { "epoch": 0.97, "learning_rate": 1.9455458470152057e-05, "loss": 0.6866, "step": 30465 }, { "epoch": 0.98, "learning_rate": 1.945509483652675e-05, "loss": 0.7003, "step": 30470 }, { "epoch": 0.98, "learning_rate": 1.9454731084928995e-05, "loss": 0.682, "step": 30475 }, { "epoch": 0.98, "learning_rate": 1.945436721536334e-05, "loss": 0.7025, "step": 30480 }, { "epoch": 0.98, "learning_rate": 1.945400322783432e-05, "loss": 0.696, "step": 30485 }, { "epoch": 0.98, "learning_rate": 1.9453639122346475e-05, "loss": 0.6965, "step": 30490 }, { "epoch": 0.98, "learning_rate": 1.945327489890435e-05, "loss": 0.7038, "step": 30495 }, { "epoch": 0.98, "learning_rate": 1.9452910557512497e-05, "loss": 0.6898, "step": 30500 }, { "epoch": 0.98, "learning_rate": 1.9452546098175448e-05, "loss": 0.6879, "step": 30505 }, { "epoch": 0.98, "learning_rate": 1.945218152089776e-05, "loss": 0.6739, "step": 30510 }, { "epoch": 0.98, "learning_rate": 1.945181682568398e-05, "loss": 0.6999, "step": 30515 }, { "epoch": 0.98, "learning_rate": 1.9451452012538653e-05, "loss": 0.6957, "step": 30520 }, { "epoch": 0.98, "learning_rate": 1.9451087081466337e-05, "loss": 0.6868, "step": 30525 }, { "epoch": 0.98, "learning_rate": 1.9450722032471584e-05, "loss": 0.686, "step": 30530 }, { "epoch": 0.98, "learning_rate": 1.945035686555895e-05, "loss": 0.6918, "step": 30535 }, { "epoch": 0.98, "learning_rate": 1.944999158073299e-05, "loss": 0.6956, "step": 30540 }, { "epoch": 0.98, "learning_rate": 1.9449626177998257e-05, "loss": 0.6954, "step": 30545 }, { "epoch": 0.98, "learning_rate": 1.9449260657359317e-05, "loss": 0.6808, "step": 30550 }, { "epoch": 0.98, "learning_rate": 1.944889501882073e-05, "loss": 0.6935, "step": 30555 }, { "epoch": 0.98, "learning_rate": 1.9448529262387054e-05, "loss": 0.6912, "step": 30560 }, { "epoch": 0.98, "learning_rate": 1.9448163388062853e-05, "loss": 0.6916, "step": 30565 }, { "epoch": 0.98, "learning_rate": 1.9447797395852698e-05, "loss": 0.6854, "step": 30570 }, { "epoch": 0.98, "learning_rate": 1.9447431285761148e-05, "loss": 0.7037, "step": 30575 }, { "epoch": 0.98, "learning_rate": 1.9447065057792777e-05, "loss": 0.6875, "step": 30580 }, { "epoch": 0.98, "learning_rate": 1.944669871195215e-05, "loss": 0.7006, "step": 30585 }, { "epoch": 0.98, "learning_rate": 1.9446332248243844e-05, "loss": 0.6798, "step": 30590 }, { "epoch": 0.98, "learning_rate": 1.944596566667242e-05, "loss": 0.7042, "step": 30595 }, { "epoch": 0.98, "learning_rate": 1.9445598967242464e-05, "loss": 0.6801, "step": 30600 }, { "epoch": 0.98, "learning_rate": 1.9445232149958543e-05, "loss": 0.6868, "step": 30605 }, { "epoch": 0.98, "learning_rate": 1.944486521482524e-05, "loss": 0.6858, "step": 30610 }, { "epoch": 0.98, "learning_rate": 1.944449816184713e-05, "loss": 0.6835, "step": 30615 }, { "epoch": 0.98, "learning_rate": 1.9444130991028793e-05, "loss": 0.6962, "step": 30620 }, { "epoch": 0.98, "learning_rate": 1.944376370237481e-05, "loss": 0.6896, "step": 30625 }, { "epoch": 0.98, "learning_rate": 1.9443396295889767e-05, "loss": 0.6898, "step": 30630 }, { "epoch": 0.98, "learning_rate": 1.9443028771578243e-05, "loss": 0.6853, "step": 30635 }, { "epoch": 0.98, "learning_rate": 1.9442661129444828e-05, "loss": 0.6951, "step": 30640 }, { "epoch": 0.98, "learning_rate": 1.9442293369494108e-05, "loss": 0.6958, "step": 30645 }, { "epoch": 0.98, "learning_rate": 1.944192549173067e-05, "loss": 0.6999, "step": 30650 }, { "epoch": 0.98, "learning_rate": 1.9441557496159103e-05, "loss": 0.6993, "step": 30655 }, { "epoch": 0.98, "learning_rate": 1.9441189382784e-05, "loss": 0.6949, "step": 30660 }, { "epoch": 0.98, "learning_rate": 1.9440821151609956e-05, "loss": 0.697, "step": 30665 }, { "epoch": 0.98, "learning_rate": 1.9440452802641567e-05, "loss": 0.6905, "step": 30670 }, { "epoch": 0.98, "learning_rate": 1.944008433588342e-05, "loss": 0.6957, "step": 30675 }, { "epoch": 0.98, "learning_rate": 1.943971575134012e-05, "loss": 0.6994, "step": 30680 }, { "epoch": 0.98, "learning_rate": 1.9439347049016266e-05, "loss": 0.684, "step": 30685 }, { "epoch": 0.98, "learning_rate": 1.9438978228916456e-05, "loss": 0.7001, "step": 30690 }, { "epoch": 0.98, "learning_rate": 1.943860929104529e-05, "loss": 0.705, "step": 30695 }, { "epoch": 0.98, "learning_rate": 1.9438240235407375e-05, "loss": 0.6911, "step": 30700 }, { "epoch": 0.98, "learning_rate": 1.9437871062007314e-05, "loss": 0.6947, "step": 30705 }, { "epoch": 0.98, "learning_rate": 1.9437501770849714e-05, "loss": 0.7019, "step": 30710 }, { "epoch": 0.98, "learning_rate": 1.9437132361939182e-05, "loss": 0.6957, "step": 30715 }, { "epoch": 0.98, "learning_rate": 1.9436762835280327e-05, "loss": 0.6934, "step": 30720 }, { "epoch": 0.98, "learning_rate": 1.943639319087776e-05, "loss": 0.6864, "step": 30725 }, { "epoch": 0.98, "learning_rate": 1.9436023428736095e-05, "loss": 0.7007, "step": 30730 }, { "epoch": 0.98, "learning_rate": 1.9435653548859944e-05, "loss": 0.6899, "step": 30735 }, { "epoch": 0.98, "learning_rate": 1.943528355125392e-05, "loss": 0.6904, "step": 30740 }, { "epoch": 0.98, "learning_rate": 1.943491343592264e-05, "loss": 0.7039, "step": 30745 }, { "epoch": 0.98, "learning_rate": 1.9434543202870726e-05, "loss": 0.6771, "step": 30750 }, { "epoch": 0.98, "learning_rate": 1.9434172852102793e-05, "loss": 0.6927, "step": 30755 }, { "epoch": 0.98, "learning_rate": 1.9433802383623464e-05, "loss": 0.6987, "step": 30760 }, { "epoch": 0.98, "learning_rate": 1.943343179743736e-05, "loss": 0.6946, "step": 30765 }, { "epoch": 0.98, "learning_rate": 1.943306109354911e-05, "loss": 0.6944, "step": 30770 }, { "epoch": 0.98, "learning_rate": 1.9432690271963327e-05, "loss": 0.6886, "step": 30775 }, { "epoch": 0.98, "learning_rate": 1.9432319332684654e-05, "loss": 0.6914, "step": 30780 }, { "epoch": 0.99, "learning_rate": 1.9431948275717706e-05, "loss": 0.6978, "step": 30785 }, { "epoch": 0.99, "learning_rate": 1.943157710106712e-05, "loss": 0.6871, "step": 30790 }, { "epoch": 0.99, "learning_rate": 1.943120580873753e-05, "loss": 0.6858, "step": 30795 }, { "epoch": 0.99, "learning_rate": 1.9430834398733557e-05, "loss": 0.6887, "step": 30800 }, { "epoch": 0.99, "learning_rate": 1.9430462871059842e-05, "loss": 0.6741, "step": 30805 }, { "epoch": 0.99, "learning_rate": 1.943009122572102e-05, "loss": 0.6924, "step": 30810 }, { "epoch": 0.99, "learning_rate": 1.9429719462721732e-05, "loss": 0.6877, "step": 30815 }, { "epoch": 0.99, "learning_rate": 1.9429347582066614e-05, "loss": 0.6956, "step": 30820 }, { "epoch": 0.99, "learning_rate": 1.9428975583760303e-05, "loss": 0.6966, "step": 30825 }, { "epoch": 0.99, "learning_rate": 1.942860346780744e-05, "loss": 0.7065, "step": 30830 }, { "epoch": 0.99, "learning_rate": 1.9428231234212673e-05, "loss": 0.699, "step": 30835 }, { "epoch": 0.99, "learning_rate": 1.9427858882980645e-05, "loss": 0.6878, "step": 30840 }, { "epoch": 0.99, "learning_rate": 1.9427486414116e-05, "loss": 0.7103, "step": 30845 }, { "epoch": 0.99, "learning_rate": 1.9427113827623385e-05, "loss": 0.6879, "step": 30850 }, { "epoch": 0.99, "learning_rate": 1.942674112350745e-05, "loss": 0.6895, "step": 30855 }, { "epoch": 0.99, "learning_rate": 1.9426368301772848e-05, "loss": 0.6946, "step": 30860 }, { "epoch": 0.99, "learning_rate": 1.9425995362424225e-05, "loss": 0.6946, "step": 30865 }, { "epoch": 0.99, "learning_rate": 1.942562230546624e-05, "loss": 0.6826, "step": 30870 }, { "epoch": 0.99, "learning_rate": 1.9425249130903544e-05, "loss": 0.6892, "step": 30875 }, { "epoch": 0.99, "learning_rate": 1.9424875838740792e-05, "loss": 0.704, "step": 30880 }, { "epoch": 0.99, "learning_rate": 1.9424502428982644e-05, "loss": 0.7032, "step": 30885 }, { "epoch": 0.99, "learning_rate": 1.942412890163376e-05, "loss": 0.6946, "step": 30890 }, { "epoch": 0.99, "learning_rate": 1.94237552566988e-05, "loss": 0.6866, "step": 30895 }, { "epoch": 0.99, "learning_rate": 1.9423381494182422e-05, "loss": 0.6775, "step": 30900 }, { "epoch": 0.99, "learning_rate": 1.9423007614089294e-05, "loss": 0.6945, "step": 30905 }, { "epoch": 0.99, "learning_rate": 1.9422633616424083e-05, "loss": 0.7001, "step": 30910 }, { "epoch": 0.99, "learning_rate": 1.9422259501191448e-05, "loss": 0.6903, "step": 30915 }, { "epoch": 0.99, "learning_rate": 1.9421885268396064e-05, "loss": 0.6696, "step": 30920 }, { "epoch": 0.99, "learning_rate": 1.9421510918042593e-05, "loss": 0.6946, "step": 30925 }, { "epoch": 0.99, "learning_rate": 1.9421136450135715e-05, "loss": 0.6918, "step": 30930 }, { "epoch": 0.99, "learning_rate": 1.9420761864680095e-05, "loss": 0.6908, "step": 30935 }, { "epoch": 0.99, "learning_rate": 1.942038716168041e-05, "loss": 0.6876, "step": 30940 }, { "epoch": 0.99, "learning_rate": 1.9420012341141334e-05, "loss": 0.6799, "step": 30945 }, { "epoch": 0.99, "learning_rate": 1.9419637403067547e-05, "loss": 0.6858, "step": 30950 }, { "epoch": 0.99, "learning_rate": 1.9419262347463718e-05, "loss": 0.6901, "step": 30955 }, { "epoch": 0.99, "learning_rate": 1.9418887174334538e-05, "loss": 0.6952, "step": 30960 }, { "epoch": 0.99, "learning_rate": 1.941851188368468e-05, "loss": 0.6925, "step": 30965 }, { "epoch": 0.99, "learning_rate": 1.9418136475518833e-05, "loss": 0.7038, "step": 30970 }, { "epoch": 0.99, "learning_rate": 1.9417760949841672e-05, "loss": 0.6917, "step": 30975 }, { "epoch": 0.99, "learning_rate": 1.9417385306657894e-05, "loss": 0.678, "step": 30980 }, { "epoch": 0.99, "learning_rate": 1.9417009545972178e-05, "loss": 0.6858, "step": 30985 }, { "epoch": 0.99, "learning_rate": 1.9416633667789212e-05, "loss": 0.6846, "step": 30990 }, { "epoch": 0.99, "learning_rate": 1.9416257672113693e-05, "loss": 0.6806, "step": 30995 }, { "epoch": 0.99, "learning_rate": 1.9415881558950302e-05, "loss": 0.699, "step": 31000 }, { "epoch": 0.99, "learning_rate": 1.941550532830374e-05, "loss": 0.6902, "step": 31005 }, { "epoch": 0.99, "learning_rate": 1.94151289801787e-05, "loss": 0.6807, "step": 31010 }, { "epoch": 0.99, "learning_rate": 1.9414752514579876e-05, "loss": 0.6894, "step": 31015 }, { "epoch": 0.99, "learning_rate": 1.9414375931511965e-05, "loss": 0.6938, "step": 31020 }, { "epoch": 0.99, "learning_rate": 1.9413999230979666e-05, "loss": 0.6846, "step": 31025 }, { "epoch": 0.99, "learning_rate": 1.941362241298768e-05, "loss": 0.696, "step": 31030 }, { "epoch": 0.99, "learning_rate": 1.9413245477540708e-05, "loss": 0.6952, "step": 31035 }, { "epoch": 0.99, "learning_rate": 1.9412868424643452e-05, "loss": 0.6884, "step": 31040 }, { "epoch": 0.99, "learning_rate": 1.941249125430062e-05, "loss": 0.6919, "step": 31045 }, { "epoch": 0.99, "learning_rate": 1.941211396651691e-05, "loss": 0.6936, "step": 31050 }, { "epoch": 0.99, "learning_rate": 1.9411736561297043e-05, "loss": 0.6885, "step": 31055 }, { "epoch": 0.99, "learning_rate": 1.9411359038645715e-05, "loss": 0.6955, "step": 31060 }, { "epoch": 0.99, "learning_rate": 1.9410981398567642e-05, "loss": 0.6869, "step": 31065 }, { "epoch": 0.99, "learning_rate": 1.9410603641067537e-05, "loss": 0.6859, "step": 31070 }, { "epoch": 0.99, "learning_rate": 1.941022576615011e-05, "loss": 0.6955, "step": 31075 }, { "epoch": 0.99, "learning_rate": 1.940984777382008e-05, "loss": 0.6881, "step": 31080 }, { "epoch": 0.99, "learning_rate": 1.940946966408216e-05, "loss": 0.6787, "step": 31085 }, { "epoch": 0.99, "learning_rate": 1.9409091436941067e-05, "loss": 0.6915, "step": 31090 }, { "epoch": 1.0, "learning_rate": 1.9408713092401525e-05, "loss": 0.6834, "step": 31095 }, { "epoch": 1.0, "learning_rate": 1.9408334630468247e-05, "loss": 0.6873, "step": 31100 }, { "epoch": 1.0, "learning_rate": 1.940795605114596e-05, "loss": 0.7059, "step": 31105 }, { "epoch": 1.0, "learning_rate": 1.940757735443939e-05, "loss": 0.6817, "step": 31110 }, { "epoch": 1.0, "learning_rate": 1.9407198540353258e-05, "loss": 0.6926, "step": 31115 }, { "epoch": 1.0, "learning_rate": 1.9406819608892288e-05, "loss": 0.7024, "step": 31120 }, { "epoch": 1.0, "learning_rate": 1.9406440560061214e-05, "loss": 0.6873, "step": 31125 }, { "epoch": 1.0, "learning_rate": 1.9406061393864764e-05, "loss": 0.6941, "step": 31130 }, { "epoch": 1.0, "learning_rate": 1.9405682110307668e-05, "loss": 0.6937, "step": 31135 }, { "epoch": 1.0, "learning_rate": 1.9405302709394658e-05, "loss": 0.6838, "step": 31140 }, { "epoch": 1.0, "learning_rate": 1.9404923191130468e-05, "loss": 0.6824, "step": 31145 }, { "epoch": 1.0, "learning_rate": 1.940454355551983e-05, "loss": 0.6908, "step": 31150 }, { "epoch": 1.0, "learning_rate": 1.9404163802567487e-05, "loss": 0.6843, "step": 31155 }, { "epoch": 1.0, "learning_rate": 1.9403783932278176e-05, "loss": 0.6951, "step": 31160 }, { "epoch": 1.0, "learning_rate": 1.9403403944656635e-05, "loss": 0.6924, "step": 31165 }, { "epoch": 1.0, "learning_rate": 1.9403023839707603e-05, "loss": 0.6865, "step": 31170 }, { "epoch": 1.0, "learning_rate": 1.9402643617435824e-05, "loss": 0.6886, "step": 31175 }, { "epoch": 1.0, "learning_rate": 1.9402263277846046e-05, "loss": 0.6936, "step": 31180 }, { "epoch": 1.0, "learning_rate": 1.940188282094301e-05, "loss": 0.6842, "step": 31185 }, { "epoch": 1.0, "learning_rate": 1.9401502246731464e-05, "loss": 0.6774, "step": 31190 }, { "epoch": 1.0, "learning_rate": 1.940112155521616e-05, "loss": 0.6841, "step": 31195 }, { "epoch": 1.0, "learning_rate": 1.940074074640184e-05, "loss": 0.6917, "step": 31200 }, { "epoch": 1.0, "learning_rate": 1.9400359820293265e-05, "loss": 0.6831, "step": 31205 }, { "epoch": 1.0, "learning_rate": 1.9399978776895177e-05, "loss": 0.6859, "step": 31210 }, { "epoch": 1.0, "learning_rate": 1.9399597616212344e-05, "loss": 0.7006, "step": 31215 }, { "epoch": 1.0, "learning_rate": 1.9399216338249508e-05, "loss": 0.6939, "step": 31220 }, { "epoch": 1.0, "learning_rate": 1.9398834943011434e-05, "loss": 0.6969, "step": 31225 }, { "epoch": 1.0, "learning_rate": 1.939845343050288e-05, "loss": 0.692, "step": 31230 }, { "epoch": 1.0, "learning_rate": 1.9398071800728608e-05, "loss": 0.6937, "step": 31235 }, { "epoch": 1.0, "learning_rate": 1.9397690053693373e-05, "loss": 0.6834, "step": 31240 }, { "epoch": 1.0, "learning_rate": 1.9397308189401944e-05, "loss": 0.6963, "step": 31245 }, { "epoch": 1.0, "learning_rate": 1.9396926207859085e-05, "loss": 0.6806, "step": 31250 }, { "epoch": 1.0, "learning_rate": 1.9396544109069563e-05, "loss": 0.6842, "step": 31255 }, { "epoch": 1.0, "learning_rate": 1.9396161893038138e-05, "loss": 0.6963, "step": 31260 }, { "epoch": 1.0, "learning_rate": 1.9395779559769584e-05, "loss": 0.678, "step": 31265 }, { "epoch": 1.0, "learning_rate": 1.9395397109268676e-05, "loss": 0.6752, "step": 31270 }, { "epoch": 1.0, "learning_rate": 1.939501454154018e-05, "loss": 0.7012, "step": 31275 }, { "epoch": 1.0, "learning_rate": 1.939463185658887e-05, "loss": 0.6822, "step": 31280 }, { "epoch": 1.0, "learning_rate": 1.939424905441952e-05, "loss": 0.6843, "step": 31285 }, { "epoch": 1.0, "learning_rate": 1.939386613503691e-05, "loss": 0.6932, "step": 31290 }, { "epoch": 1.0, "learning_rate": 1.9393483098445815e-05, "loss": 0.6933, "step": 31295 }, { "epoch": 1.0, "learning_rate": 1.9393099944651017e-05, "loss": 0.6832, "step": 31300 }, { "epoch": 1.0, "learning_rate": 1.9392716673657292e-05, "loss": 0.676, "step": 31305 }, { "epoch": 1.0, "learning_rate": 1.9392333285469427e-05, "loss": 0.6707, "step": 31310 }, { "epoch": 1.0, "learning_rate": 1.93919497800922e-05, "loss": 0.6884, "step": 31315 }, { "epoch": 1.0, "learning_rate": 1.9391566157530404e-05, "loss": 0.6701, "step": 31320 }, { "epoch": 1.0, "learning_rate": 1.9391182417788816e-05, "loss": 0.6781, "step": 31325 }, { "epoch": 1.0, "learning_rate": 1.9390798560872233e-05, "loss": 0.6824, "step": 31330 }, { "epoch": 1.0, "learning_rate": 1.9390414586785437e-05, "loss": 0.6842, "step": 31335 }, { "epoch": 1.0, "learning_rate": 1.9390030495533225e-05, "loss": 0.6822, "step": 31340 }, { "epoch": 1.0, "learning_rate": 1.9389646287120385e-05, "loss": 0.6862, "step": 31345 }, { "epoch": 1.0, "learning_rate": 1.938926196155171e-05, "loss": 0.6875, "step": 31350 }, { "epoch": 1.0, "learning_rate": 1.9388877518832e-05, "loss": 0.6818, "step": 31355 }, { "epoch": 1.0, "learning_rate": 1.938849295896605e-05, "loss": 0.6905, "step": 31360 }, { "epoch": 1.0, "learning_rate": 1.9388108281958654e-05, "loss": 0.6978, "step": 31365 }, { "epoch": 1.0, "learning_rate": 1.938772348781462e-05, "loss": 0.6946, "step": 31370 }, { "epoch": 1.0, "learning_rate": 1.9387338576538743e-05, "loss": 0.6868, "step": 31375 }, { "epoch": 1.0, "learning_rate": 1.9386953548135824e-05, "loss": 0.695, "step": 31380 }, { "epoch": 1.0, "learning_rate": 1.9386568402610675e-05, "loss": 0.6934, "step": 31385 }, { "epoch": 1.0, "learning_rate": 1.9386183139968093e-05, "loss": 0.6895, "step": 31390 }, { "epoch": 1.0, "learning_rate": 1.938579776021289e-05, "loss": 0.6888, "step": 31395 }, { "epoch": 1.0, "learning_rate": 1.938541226334987e-05, "loss": 0.6932, "step": 31400 }, { "epoch": 1.0, "learning_rate": 1.9385026649383846e-05, "loss": 0.696, "step": 31405 }, { "epoch": 1.01, "learning_rate": 1.9384640918319633e-05, "loss": 0.6908, "step": 31410 }, { "epoch": 1.01, "learning_rate": 1.9384255070162036e-05, "loss": 0.6927, "step": 31415 }, { "epoch": 1.01, "learning_rate": 1.9383869104915877e-05, "loss": 0.6782, "step": 31420 }, { "epoch": 1.01, "learning_rate": 1.9383483022585966e-05, "loss": 0.6727, "step": 31425 }, { "epoch": 1.01, "learning_rate": 1.938309682317712e-05, "loss": 0.6922, "step": 31430 }, { "epoch": 1.01, "learning_rate": 1.938271050669416e-05, "loss": 0.685, "step": 31435 }, { "epoch": 1.01, "learning_rate": 1.938232407314191e-05, "loss": 0.6733, "step": 31440 }, { "epoch": 1.01, "learning_rate": 1.9381937522525185e-05, "loss": 0.6784, "step": 31445 }, { "epoch": 1.01, "learning_rate": 1.9381550854848812e-05, "loss": 0.6762, "step": 31450 }, { "epoch": 1.01, "learning_rate": 1.938116407011761e-05, "loss": 0.6848, "step": 31455 }, { "epoch": 1.01, "learning_rate": 1.9380777168336414e-05, "loss": 0.6775, "step": 31460 }, { "epoch": 1.01, "learning_rate": 1.9380390149510044e-05, "loss": 0.6827, "step": 31465 }, { "epoch": 1.01, "learning_rate": 1.9380003013643328e-05, "loss": 0.6839, "step": 31470 }, { "epoch": 1.01, "learning_rate": 1.9379615760741108e-05, "loss": 0.688, "step": 31475 }, { "epoch": 1.01, "learning_rate": 1.93792283908082e-05, "loss": 0.6985, "step": 31480 }, { "epoch": 1.01, "learning_rate": 1.937884090384945e-05, "loss": 0.6826, "step": 31485 }, { "epoch": 1.01, "learning_rate": 1.9378453299869683e-05, "loss": 0.6825, "step": 31490 }, { "epoch": 1.01, "learning_rate": 1.9378065578873742e-05, "loss": 0.6685, "step": 31495 }, { "epoch": 1.01, "learning_rate": 1.937767774086646e-05, "loss": 0.6808, "step": 31500 }, { "epoch": 1.01, "learning_rate": 1.937728978585268e-05, "loss": 0.684, "step": 31505 }, { "epoch": 1.01, "learning_rate": 1.937690171383724e-05, "loss": 0.6835, "step": 31510 }, { "epoch": 1.01, "learning_rate": 1.9376513524824987e-05, "loss": 0.6993, "step": 31515 }, { "epoch": 1.01, "learning_rate": 1.9376125218820758e-05, "loss": 0.6895, "step": 31520 }, { "epoch": 1.01, "learning_rate": 1.9375736795829402e-05, "loss": 0.6631, "step": 31525 }, { "epoch": 1.01, "learning_rate": 1.937534825585576e-05, "loss": 0.6862, "step": 31530 }, { "epoch": 1.01, "learning_rate": 1.9374959598904686e-05, "loss": 0.6832, "step": 31535 }, { "epoch": 1.01, "learning_rate": 1.9374570824981028e-05, "loss": 0.6863, "step": 31540 }, { "epoch": 1.01, "learning_rate": 1.9374181934089635e-05, "loss": 0.6895, "step": 31545 }, { "epoch": 1.01, "learning_rate": 1.9373792926235358e-05, "loss": 0.6817, "step": 31550 }, { "epoch": 1.01, "learning_rate": 1.9373403801423054e-05, "loss": 0.6859, "step": 31555 }, { "epoch": 1.01, "learning_rate": 1.9373014559657576e-05, "loss": 0.6856, "step": 31560 }, { "epoch": 1.01, "learning_rate": 1.9372625200943784e-05, "loss": 0.6728, "step": 31565 }, { "epoch": 1.01, "learning_rate": 1.9372235725286533e-05, "loss": 0.684, "step": 31570 }, { "epoch": 1.01, "learning_rate": 1.937184613269068e-05, "loss": 0.674, "step": 31575 }, { "epoch": 1.01, "learning_rate": 1.9371456423161095e-05, "loss": 0.6892, "step": 31580 }, { "epoch": 1.01, "learning_rate": 1.937106659670263e-05, "loss": 0.6801, "step": 31585 }, { "epoch": 1.01, "learning_rate": 1.9370676653320153e-05, "loss": 0.7087, "step": 31590 }, { "epoch": 1.01, "learning_rate": 1.9370286593018532e-05, "loss": 0.6894, "step": 31595 }, { "epoch": 1.01, "learning_rate": 1.936989641580263e-05, "loss": 0.6772, "step": 31600 }, { "epoch": 1.01, "learning_rate": 1.936950612167732e-05, "loss": 0.6819, "step": 31605 }, { "epoch": 1.01, "learning_rate": 1.9369115710647465e-05, "loss": 0.6801, "step": 31610 }, { "epoch": 1.01, "learning_rate": 1.9368725182717944e-05, "loss": 0.6776, "step": 31615 }, { "epoch": 1.01, "learning_rate": 1.936833453789362e-05, "loss": 0.6885, "step": 31620 }, { "epoch": 1.01, "learning_rate": 1.936794377617938e-05, "loss": 0.6825, "step": 31625 }, { "epoch": 1.01, "learning_rate": 1.936755289758009e-05, "loss": 0.6824, "step": 31630 }, { "epoch": 1.01, "learning_rate": 1.9367161902100626e-05, "loss": 0.6812, "step": 31635 }, { "epoch": 1.01, "learning_rate": 1.9366770789745873e-05, "loss": 0.6912, "step": 31640 }, { "epoch": 1.01, "learning_rate": 1.9366379560520706e-05, "loss": 0.6877, "step": 31645 }, { "epoch": 1.01, "learning_rate": 1.936598821443001e-05, "loss": 0.6915, "step": 31650 }, { "epoch": 1.01, "learning_rate": 1.9365596751478665e-05, "loss": 0.6986, "step": 31655 }, { "epoch": 1.01, "learning_rate": 1.9365205171671558e-05, "loss": 0.6947, "step": 31660 }, { "epoch": 1.01, "learning_rate": 1.936481347501357e-05, "loss": 0.6864, "step": 31665 }, { "epoch": 1.01, "learning_rate": 1.9364421661509592e-05, "loss": 0.6901, "step": 31670 }, { "epoch": 1.01, "learning_rate": 1.9364029731164517e-05, "loss": 0.6839, "step": 31675 }, { "epoch": 1.01, "learning_rate": 1.9363637683983225e-05, "loss": 0.6925, "step": 31680 }, { "epoch": 1.01, "learning_rate": 1.9363245519970613e-05, "loss": 0.6788, "step": 31685 }, { "epoch": 1.01, "learning_rate": 1.936285323913158e-05, "loss": 0.6803, "step": 31690 }, { "epoch": 1.01, "learning_rate": 1.936246084147101e-05, "loss": 0.6788, "step": 31695 }, { "epoch": 1.01, "learning_rate": 1.9362068326993804e-05, "loss": 0.6836, "step": 31700 }, { "epoch": 1.01, "learning_rate": 1.936167569570486e-05, "loss": 0.6882, "step": 31705 }, { "epoch": 1.01, "learning_rate": 1.9361282947609075e-05, "loss": 0.6887, "step": 31710 }, { "epoch": 1.01, "learning_rate": 1.9360890082711353e-05, "loss": 0.6972, "step": 31715 }, { "epoch": 1.02, "learning_rate": 1.936049710101659e-05, "loss": 0.683, "step": 31720 }, { "epoch": 1.02, "learning_rate": 1.9360104002529693e-05, "loss": 0.687, "step": 31725 }, { "epoch": 1.02, "learning_rate": 1.9359710787255567e-05, "loss": 0.6935, "step": 31730 }, { "epoch": 1.02, "learning_rate": 1.9359317455199117e-05, "loss": 0.6844, "step": 31735 }, { "epoch": 1.02, "learning_rate": 1.935892400636525e-05, "loss": 0.6733, "step": 31740 }, { "epoch": 1.02, "learning_rate": 1.935853044075888e-05, "loss": 0.6823, "step": 31745 }, { "epoch": 1.02, "learning_rate": 1.935813675838491e-05, "loss": 0.6806, "step": 31750 }, { "epoch": 1.02, "learning_rate": 1.9357742959248256e-05, "loss": 0.6826, "step": 31755 }, { "epoch": 1.02, "learning_rate": 1.9357349043353832e-05, "loss": 0.6811, "step": 31760 }, { "epoch": 1.02, "learning_rate": 1.9356955010706552e-05, "loss": 0.6884, "step": 31765 }, { "epoch": 1.02, "learning_rate": 1.9356560861311332e-05, "loss": 0.6902, "step": 31770 }, { "epoch": 1.02, "learning_rate": 1.9356166595173094e-05, "loss": 0.6713, "step": 31775 }, { "epoch": 1.02, "learning_rate": 1.9355772212296752e-05, "loss": 0.6848, "step": 31780 }, { "epoch": 1.02, "learning_rate": 1.9355377712687228e-05, "loss": 0.6796, "step": 31785 }, { "epoch": 1.02, "learning_rate": 1.9354983096349446e-05, "loss": 0.6766, "step": 31790 }, { "epoch": 1.02, "learning_rate": 1.9354588363288324e-05, "loss": 0.6825, "step": 31795 }, { "epoch": 1.02, "learning_rate": 1.9354193513508794e-05, "loss": 0.6849, "step": 31800 }, { "epoch": 1.02, "learning_rate": 1.9353798547015784e-05, "loss": 0.6925, "step": 31805 }, { "epoch": 1.02, "learning_rate": 1.935340346381421e-05, "loss": 0.6861, "step": 31810 }, { "epoch": 1.02, "learning_rate": 1.9353008263909016e-05, "loss": 0.6938, "step": 31815 }, { "epoch": 1.02, "learning_rate": 1.935261294730513e-05, "loss": 0.6858, "step": 31820 }, { "epoch": 1.02, "learning_rate": 1.935221751400747e-05, "loss": 0.6848, "step": 31825 }, { "epoch": 1.02, "learning_rate": 1.9351821964020988e-05, "loss": 0.6777, "step": 31830 }, { "epoch": 1.02, "learning_rate": 1.935142629735061e-05, "loss": 0.6827, "step": 31835 }, { "epoch": 1.02, "learning_rate": 1.935103051400128e-05, "loss": 0.6865, "step": 31840 }, { "epoch": 1.02, "learning_rate": 1.9350634613977924e-05, "loss": 0.6876, "step": 31845 }, { "epoch": 1.02, "learning_rate": 1.9350238597285497e-05, "loss": 0.682, "step": 31850 }, { "epoch": 1.02, "learning_rate": 1.9349842463928924e-05, "loss": 0.6906, "step": 31855 }, { "epoch": 1.02, "learning_rate": 1.934944621391316e-05, "loss": 0.7, "step": 31860 }, { "epoch": 1.02, "learning_rate": 1.9349049847243145e-05, "loss": 0.6752, "step": 31865 }, { "epoch": 1.02, "learning_rate": 1.9348653363923828e-05, "loss": 0.6782, "step": 31870 }, { "epoch": 1.02, "learning_rate": 1.9348256763960146e-05, "loss": 0.6798, "step": 31875 }, { "epoch": 1.02, "learning_rate": 1.9347860047357055e-05, "loss": 0.6724, "step": 31880 }, { "epoch": 1.02, "learning_rate": 1.9347463214119507e-05, "loss": 0.684, "step": 31885 }, { "epoch": 1.02, "learning_rate": 1.9347066264252447e-05, "loss": 0.6897, "step": 31890 }, { "epoch": 1.02, "learning_rate": 1.934666919776083e-05, "loss": 0.6765, "step": 31895 }, { "epoch": 1.02, "learning_rate": 1.9346272014649613e-05, "loss": 0.6833, "step": 31900 }, { "epoch": 1.02, "learning_rate": 1.934587471492375e-05, "loss": 0.6889, "step": 31905 }, { "epoch": 1.02, "learning_rate": 1.9345477298588194e-05, "loss": 0.6793, "step": 31910 }, { "epoch": 1.02, "learning_rate": 1.9345079765647912e-05, "loss": 0.6881, "step": 31915 }, { "epoch": 1.02, "learning_rate": 1.9344682116107856e-05, "loss": 0.685, "step": 31920 }, { "epoch": 1.02, "learning_rate": 1.9344284349972994e-05, "loss": 0.6832, "step": 31925 }, { "epoch": 1.02, "learning_rate": 1.9343886467248288e-05, "loss": 0.6885, "step": 31930 }, { "epoch": 1.02, "learning_rate": 1.9343488467938696e-05, "loss": 0.6735, "step": 31935 }, { "epoch": 1.02, "learning_rate": 1.934309035204919e-05, "loss": 0.6855, "step": 31940 }, { "epoch": 1.02, "learning_rate": 1.9342692119584737e-05, "loss": 0.6837, "step": 31945 }, { "epoch": 1.02, "learning_rate": 1.93422937705503e-05, "loss": 0.6872, "step": 31950 }, { "epoch": 1.02, "learning_rate": 1.934189530495086e-05, "loss": 0.6942, "step": 31955 }, { "epoch": 1.02, "learning_rate": 1.934149672279138e-05, "loss": 0.6826, "step": 31960 }, { "epoch": 1.02, "learning_rate": 1.9341098024076835e-05, "loss": 0.6897, "step": 31965 }, { "epoch": 1.02, "learning_rate": 1.93406992088122e-05, "loss": 0.6812, "step": 31970 }, { "epoch": 1.02, "learning_rate": 1.9340300277002452e-05, "loss": 0.6858, "step": 31975 }, { "epoch": 1.02, "learning_rate": 1.9339901228652567e-05, "loss": 0.6957, "step": 31980 }, { "epoch": 1.02, "learning_rate": 1.9339502063767526e-05, "loss": 0.6716, "step": 31985 }, { "epoch": 1.02, "learning_rate": 1.9339102782352307e-05, "loss": 0.6878, "step": 31990 }, { "epoch": 1.02, "learning_rate": 1.9338703384411893e-05, "loss": 0.6907, "step": 31995 }, { "epoch": 1.02, "learning_rate": 1.933830386995127e-05, "loss": 0.692, "step": 32000 }, { "epoch": 1.02, "learning_rate": 1.933790423897542e-05, "loss": 0.6958, "step": 32005 }, { "epoch": 1.02, "learning_rate": 1.9337504491489326e-05, "loss": 0.6694, "step": 32010 }, { "epoch": 1.02, "learning_rate": 1.933710462749798e-05, "loss": 0.6838, "step": 32015 }, { "epoch": 1.02, "learning_rate": 1.9336704647006376e-05, "loss": 0.6781, "step": 32020 }, { "epoch": 1.02, "learning_rate": 1.9336304550019493e-05, "loss": 0.6783, "step": 32025 }, { "epoch": 1.02, "learning_rate": 1.933590433654233e-05, "loss": 0.6837, "step": 32030 }, { "epoch": 1.03, "learning_rate": 1.9335504006579883e-05, "loss": 0.6777, "step": 32035 }, { "epoch": 1.03, "learning_rate": 1.9335103560137137e-05, "loss": 0.6808, "step": 32040 }, { "epoch": 1.03, "learning_rate": 1.93347029972191e-05, "loss": 0.6931, "step": 32045 }, { "epoch": 1.03, "learning_rate": 1.9334302317830764e-05, "loss": 0.6804, "step": 32050 }, { "epoch": 1.03, "learning_rate": 1.933390152197713e-05, "loss": 0.6816, "step": 32055 }, { "epoch": 1.03, "learning_rate": 1.9333500609663196e-05, "loss": 0.6921, "step": 32060 }, { "epoch": 1.03, "learning_rate": 1.933309958089397e-05, "loss": 0.6805, "step": 32065 }, { "epoch": 1.03, "learning_rate": 1.933269843567445e-05, "loss": 0.6727, "step": 32070 }, { "epoch": 1.03, "learning_rate": 1.933229717400964e-05, "loss": 0.6918, "step": 32075 }, { "epoch": 1.03, "learning_rate": 1.933189579590455e-05, "loss": 0.6958, "step": 32080 }, { "epoch": 1.03, "learning_rate": 1.9331494301364192e-05, "loss": 0.6769, "step": 32085 }, { "epoch": 1.03, "learning_rate": 1.9331092690393567e-05, "loss": 0.6769, "step": 32090 }, { "epoch": 1.03, "learning_rate": 1.9330690962997694e-05, "loss": 0.6816, "step": 32095 }, { "epoch": 1.03, "learning_rate": 1.9330289119181578e-05, "loss": 0.6988, "step": 32100 }, { "epoch": 1.03, "learning_rate": 1.932988715895024e-05, "loss": 0.6831, "step": 32105 }, { "epoch": 1.03, "learning_rate": 1.932948508230869e-05, "loss": 0.6662, "step": 32110 }, { "epoch": 1.03, "learning_rate": 1.932908288926194e-05, "loss": 0.6846, "step": 32115 }, { "epoch": 1.03, "learning_rate": 1.9328680579815024e-05, "loss": 0.6859, "step": 32120 }, { "epoch": 1.03, "learning_rate": 1.9328278153972947e-05, "loss": 0.6895, "step": 32125 }, { "epoch": 1.03, "learning_rate": 1.9327875611740737e-05, "loss": 0.6774, "step": 32130 }, { "epoch": 1.03, "learning_rate": 1.9327472953123415e-05, "loss": 0.6746, "step": 32135 }, { "epoch": 1.03, "learning_rate": 1.9327070178126005e-05, "loss": 0.6835, "step": 32140 }, { "epoch": 1.03, "learning_rate": 1.9326667286753533e-05, "loss": 0.6851, "step": 32145 }, { "epoch": 1.03, "learning_rate": 1.9326264279011026e-05, "loss": 0.6732, "step": 32150 }, { "epoch": 1.03, "learning_rate": 1.932586115490351e-05, "loss": 0.6723, "step": 32155 }, { "epoch": 1.03, "learning_rate": 1.9325457914436016e-05, "loss": 0.679, "step": 32160 }, { "epoch": 1.03, "learning_rate": 1.932505455761358e-05, "loss": 0.6773, "step": 32165 }, { "epoch": 1.03, "learning_rate": 1.9324651084441227e-05, "loss": 0.6783, "step": 32170 }, { "epoch": 1.03, "learning_rate": 1.9324247494923996e-05, "loss": 0.6771, "step": 32175 }, { "epoch": 1.03, "learning_rate": 1.9323843789066922e-05, "loss": 0.6846, "step": 32180 }, { "epoch": 1.03, "learning_rate": 1.9323439966875043e-05, "loss": 0.6769, "step": 32185 }, { "epoch": 1.03, "learning_rate": 1.932303602835339e-05, "loss": 0.6824, "step": 32190 }, { "epoch": 1.03, "learning_rate": 1.9322631973507016e-05, "loss": 0.678, "step": 32195 }, { "epoch": 1.03, "learning_rate": 1.9322227802340955e-05, "loss": 0.6741, "step": 32200 }, { "epoch": 1.03, "learning_rate": 1.9321823514860247e-05, "loss": 0.6738, "step": 32205 }, { "epoch": 1.03, "learning_rate": 1.9321419111069943e-05, "loss": 0.6847, "step": 32210 }, { "epoch": 1.03, "learning_rate": 1.9321014590975082e-05, "loss": 0.6874, "step": 32215 }, { "epoch": 1.03, "learning_rate": 1.9320609954580714e-05, "loss": 0.6777, "step": 32220 }, { "epoch": 1.03, "learning_rate": 1.9320205201891894e-05, "loss": 0.6855, "step": 32225 }, { "epoch": 1.03, "learning_rate": 1.9319800332913667e-05, "loss": 0.687, "step": 32230 }, { "epoch": 1.03, "learning_rate": 1.9319395347651076e-05, "loss": 0.6915, "step": 32235 }, { "epoch": 1.03, "learning_rate": 1.931899024610919e-05, "loss": 0.6719, "step": 32240 }, { "epoch": 1.03, "learning_rate": 1.9318585028293056e-05, "loss": 0.676, "step": 32245 }, { "epoch": 1.03, "learning_rate": 1.9318179694207726e-05, "loss": 0.6831, "step": 32250 }, { "epoch": 1.03, "learning_rate": 1.9317774243858264e-05, "loss": 0.6886, "step": 32255 }, { "epoch": 1.03, "learning_rate": 1.9317368677249724e-05, "loss": 0.6721, "step": 32260 }, { "epoch": 1.03, "learning_rate": 1.9316962994387167e-05, "loss": 0.688, "step": 32265 }, { "epoch": 1.03, "learning_rate": 1.931655719527566e-05, "loss": 0.6856, "step": 32270 }, { "epoch": 1.03, "learning_rate": 1.931615127992026e-05, "loss": 0.6843, "step": 32275 }, { "epoch": 1.03, "learning_rate": 1.9315745248326037e-05, "loss": 0.6827, "step": 32280 }, { "epoch": 1.03, "learning_rate": 1.9315339100498048e-05, "loss": 0.689, "step": 32285 }, { "epoch": 1.03, "learning_rate": 1.9314932836441374e-05, "loss": 0.6934, "step": 32290 }, { "epoch": 1.03, "learning_rate": 1.931452645616107e-05, "loss": 0.6879, "step": 32295 }, { "epoch": 1.03, "learning_rate": 1.9314119959662218e-05, "loss": 0.6777, "step": 32300 }, { "epoch": 1.03, "learning_rate": 1.9313713346949886e-05, "loss": 0.6862, "step": 32305 }, { "epoch": 1.03, "learning_rate": 1.9313306618029143e-05, "loss": 0.6679, "step": 32310 }, { "epoch": 1.03, "learning_rate": 1.931289977290507e-05, "loss": 0.6974, "step": 32315 }, { "epoch": 1.03, "learning_rate": 1.9312492811582735e-05, "loss": 0.6805, "step": 32320 }, { "epoch": 1.03, "learning_rate": 1.9312085734067226e-05, "loss": 0.688, "step": 32325 }, { "epoch": 1.03, "learning_rate": 1.9311678540363615e-05, "loss": 0.6739, "step": 32330 }, { "epoch": 1.03, "learning_rate": 1.9311271230476987e-05, "loss": 0.6814, "step": 32335 }, { "epoch": 1.03, "learning_rate": 1.931086380441242e-05, "loss": 0.6824, "step": 32340 }, { "epoch": 1.04, "learning_rate": 1.9310456262175004e-05, "loss": 0.6729, "step": 32345 }, { "epoch": 1.04, "learning_rate": 1.9310048603769816e-05, "loss": 0.678, "step": 32350 }, { "epoch": 1.04, "learning_rate": 1.9309640829201947e-05, "loss": 0.6699, "step": 32355 }, { "epoch": 1.04, "learning_rate": 1.9309232938476482e-05, "loss": 0.682, "step": 32360 }, { "epoch": 1.04, "learning_rate": 1.9308824931598514e-05, "loss": 0.6938, "step": 32365 }, { "epoch": 1.04, "learning_rate": 1.930841680857313e-05, "loss": 0.6898, "step": 32370 }, { "epoch": 1.04, "learning_rate": 1.9308008569405424e-05, "loss": 0.6847, "step": 32375 }, { "epoch": 1.04, "learning_rate": 1.930760021410049e-05, "loss": 0.6849, "step": 32380 }, { "epoch": 1.04, "learning_rate": 1.9307191742663424e-05, "loss": 0.6733, "step": 32385 }, { "epoch": 1.04, "learning_rate": 1.9306783155099322e-05, "loss": 0.6895, "step": 32390 }, { "epoch": 1.04, "learning_rate": 1.9306374451413278e-05, "loss": 0.684, "step": 32395 }, { "epoch": 1.04, "learning_rate": 1.9305965631610397e-05, "loss": 0.6697, "step": 32400 }, { "epoch": 1.04, "learning_rate": 1.9305556695695776e-05, "loss": 0.676, "step": 32405 }, { "epoch": 1.04, "learning_rate": 1.9305147643674524e-05, "loss": 0.6787, "step": 32410 }, { "epoch": 1.04, "learning_rate": 1.9304738475551733e-05, "loss": 0.6869, "step": 32415 }, { "epoch": 1.04, "learning_rate": 1.9304329191332522e-05, "loss": 0.6889, "step": 32420 }, { "epoch": 1.04, "learning_rate": 1.9303919791021984e-05, "loss": 0.6851, "step": 32425 }, { "epoch": 1.04, "learning_rate": 1.930351027462524e-05, "loss": 0.6723, "step": 32430 }, { "epoch": 1.04, "learning_rate": 1.9303100642147388e-05, "loss": 0.6903, "step": 32435 }, { "epoch": 1.04, "learning_rate": 1.930269089359355e-05, "loss": 0.6838, "step": 32440 }, { "epoch": 1.04, "learning_rate": 1.9302281028968826e-05, "loss": 0.6872, "step": 32445 }, { "epoch": 1.04, "learning_rate": 1.9301871048278343e-05, "loss": 0.6717, "step": 32450 }, { "epoch": 1.04, "learning_rate": 1.930146095152721e-05, "loss": 0.6939, "step": 32455 }, { "epoch": 1.04, "learning_rate": 1.930105073872054e-05, "loss": 0.6796, "step": 32460 }, { "epoch": 1.04, "learning_rate": 1.9300640409863457e-05, "loss": 0.6664, "step": 32465 }, { "epoch": 1.04, "learning_rate": 1.930022996496108e-05, "loss": 0.6818, "step": 32470 }, { "epoch": 1.04, "learning_rate": 1.929981940401853e-05, "loss": 0.6814, "step": 32475 }, { "epoch": 1.04, "learning_rate": 1.929940872704093e-05, "loss": 0.6836, "step": 32480 }, { "epoch": 1.04, "learning_rate": 1.92989979340334e-05, "loss": 0.6748, "step": 32485 }, { "epoch": 1.04, "learning_rate": 1.929858702500107e-05, "loss": 0.6904, "step": 32490 }, { "epoch": 1.04, "learning_rate": 1.9298175999949068e-05, "loss": 0.6793, "step": 32495 }, { "epoch": 1.04, "learning_rate": 1.9297764858882516e-05, "loss": 0.6823, "step": 32500 }, { "epoch": 1.04, "learning_rate": 1.929735360180655e-05, "loss": 0.6856, "step": 32505 }, { "epoch": 1.04, "learning_rate": 1.9296942228726295e-05, "loss": 0.6829, "step": 32510 }, { "epoch": 1.04, "learning_rate": 1.9296530739646892e-05, "loss": 0.6843, "step": 32515 }, { "epoch": 1.04, "learning_rate": 1.9296119134573473e-05, "loss": 0.6888, "step": 32520 }, { "epoch": 1.04, "learning_rate": 1.9295707413511166e-05, "loss": 0.6826, "step": 32525 }, { "epoch": 1.04, "learning_rate": 1.929529557646512e-05, "loss": 0.658, "step": 32530 }, { "epoch": 1.04, "learning_rate": 1.929488362344046e-05, "loss": 0.6874, "step": 32535 }, { "epoch": 1.04, "learning_rate": 1.9294471554442336e-05, "loss": 0.67, "step": 32540 }, { "epoch": 1.04, "learning_rate": 1.929405936947589e-05, "loss": 0.6766, "step": 32545 }, { "epoch": 1.04, "learning_rate": 1.9293647068546263e-05, "loss": 0.6709, "step": 32550 }, { "epoch": 1.04, "learning_rate": 1.929323465165859e-05, "loss": 0.6822, "step": 32555 }, { "epoch": 1.04, "learning_rate": 1.929282211881803e-05, "loss": 0.6848, "step": 32560 }, { "epoch": 1.04, "learning_rate": 1.9292409470029726e-05, "loss": 0.6825, "step": 32565 }, { "epoch": 1.04, "learning_rate": 1.9291996705298826e-05, "loss": 0.6763, "step": 32570 }, { "epoch": 1.04, "learning_rate": 1.9291583824630478e-05, "loss": 0.6865, "step": 32575 }, { "epoch": 1.04, "learning_rate": 1.9291170828029835e-05, "loss": 0.6802, "step": 32580 }, { "epoch": 1.04, "learning_rate": 1.929075771550205e-05, "loss": 0.6845, "step": 32585 }, { "epoch": 1.04, "learning_rate": 1.9290344487052277e-05, "loss": 0.6789, "step": 32590 }, { "epoch": 1.04, "learning_rate": 1.9289931142685673e-05, "loss": 0.6883, "step": 32595 }, { "epoch": 1.04, "learning_rate": 1.9289517682407397e-05, "loss": 0.6732, "step": 32600 }, { "epoch": 1.04, "learning_rate": 1.9289104106222606e-05, "loss": 0.6758, "step": 32605 }, { "epoch": 1.04, "learning_rate": 1.9288690414136458e-05, "loss": 0.6863, "step": 32610 }, { "epoch": 1.04, "learning_rate": 1.9288276606154118e-05, "loss": 0.6791, "step": 32615 }, { "epoch": 1.04, "learning_rate": 1.9287862682280748e-05, "loss": 0.6893, "step": 32620 }, { "epoch": 1.04, "learning_rate": 1.9287448642521513e-05, "loss": 0.6821, "step": 32625 }, { "epoch": 1.04, "learning_rate": 1.928703448688158e-05, "loss": 0.6711, "step": 32630 }, { "epoch": 1.04, "learning_rate": 1.928662021536611e-05, "loss": 0.6815, "step": 32635 }, { "epoch": 1.04, "learning_rate": 1.928620582798028e-05, "loss": 0.6774, "step": 32640 }, { "epoch": 1.04, "learning_rate": 1.9285791324729257e-05, "loss": 0.6781, "step": 32645 }, { "epoch": 1.04, "learning_rate": 1.9285376705618216e-05, "loss": 0.6758, "step": 32650 }, { "epoch": 1.04, "learning_rate": 1.9284961970652323e-05, "loss": 0.6797, "step": 32655 }, { "epoch": 1.05, "learning_rate": 1.928454711983676e-05, "loss": 0.688, "step": 32660 }, { "epoch": 1.05, "learning_rate": 1.92841321531767e-05, "loss": 0.6763, "step": 32665 }, { "epoch": 1.05, "learning_rate": 1.928371707067732e-05, "loss": 0.6864, "step": 32670 }, { "epoch": 1.05, "learning_rate": 1.9283301872343798e-05, "loss": 0.6794, "step": 32675 }, { "epoch": 1.05, "learning_rate": 1.928288655818132e-05, "loss": 0.6819, "step": 32680 }, { "epoch": 1.05, "learning_rate": 1.9282471128195063e-05, "loss": 0.6812, "step": 32685 }, { "epoch": 1.05, "learning_rate": 1.9282055582390208e-05, "loss": 0.6842, "step": 32690 }, { "epoch": 1.05, "learning_rate": 1.9281639920771948e-05, "loss": 0.6898, "step": 32695 }, { "epoch": 1.05, "learning_rate": 1.928122414334546e-05, "loss": 0.6829, "step": 32700 }, { "epoch": 1.05, "learning_rate": 1.928080825011594e-05, "loss": 0.6873, "step": 32705 }, { "epoch": 1.05, "learning_rate": 1.9280392241088576e-05, "loss": 0.6806, "step": 32710 }, { "epoch": 1.05, "learning_rate": 1.927997611626855e-05, "loss": 0.6766, "step": 32715 }, { "epoch": 1.05, "learning_rate": 1.9279559875661067e-05, "loss": 0.6757, "step": 32720 }, { "epoch": 1.05, "learning_rate": 1.927914351927131e-05, "loss": 0.6887, "step": 32725 }, { "epoch": 1.05, "learning_rate": 1.9278727047104477e-05, "loss": 0.6716, "step": 32730 }, { "epoch": 1.05, "learning_rate": 1.9278310459165765e-05, "loss": 0.6838, "step": 32735 }, { "epoch": 1.05, "learning_rate": 1.9277893755460373e-05, "loss": 0.6891, "step": 32740 }, { "epoch": 1.05, "learning_rate": 1.9277476935993498e-05, "loss": 0.6856, "step": 32745 }, { "epoch": 1.05, "learning_rate": 1.9277060000770342e-05, "loss": 0.6721, "step": 32750 }, { "epoch": 1.05, "learning_rate": 1.927664294979611e-05, "loss": 0.6774, "step": 32755 }, { "epoch": 1.05, "learning_rate": 1.9276225783076002e-05, "loss": 0.6924, "step": 32760 }, { "epoch": 1.05, "learning_rate": 1.927580850061522e-05, "loss": 0.6899, "step": 32765 }, { "epoch": 1.05, "learning_rate": 1.9275391102418976e-05, "loss": 0.6789, "step": 32770 }, { "epoch": 1.05, "learning_rate": 1.9274973588492475e-05, "loss": 0.681, "step": 32775 }, { "epoch": 1.05, "learning_rate": 1.927455595884093e-05, "loss": 0.6982, "step": 32780 }, { "epoch": 1.05, "learning_rate": 1.9274138213469548e-05, "loss": 0.6736, "step": 32785 }, { "epoch": 1.05, "learning_rate": 1.9273720352383544e-05, "loss": 0.6877, "step": 32790 }, { "epoch": 1.05, "learning_rate": 1.9273302375588127e-05, "loss": 0.6825, "step": 32795 }, { "epoch": 1.05, "learning_rate": 1.9272884283088517e-05, "loss": 0.675, "step": 32800 }, { "epoch": 1.05, "learning_rate": 1.927246607488993e-05, "loss": 0.6817, "step": 32805 }, { "epoch": 1.05, "learning_rate": 1.927204775099758e-05, "loss": 0.6851, "step": 32810 }, { "epoch": 1.05, "learning_rate": 1.9271629311416687e-05, "loss": 0.6895, "step": 32815 }, { "epoch": 1.05, "learning_rate": 1.9271210756152482e-05, "loss": 0.6738, "step": 32820 }, { "epoch": 1.05, "learning_rate": 1.9270792085210176e-05, "loss": 0.678, "step": 32825 }, { "epoch": 1.05, "learning_rate": 1.9270373298594998e-05, "loss": 0.6671, "step": 32830 }, { "epoch": 1.05, "learning_rate": 1.926995439631217e-05, "loss": 0.6783, "step": 32835 }, { "epoch": 1.05, "learning_rate": 1.926953537836692e-05, "loss": 0.6799, "step": 32840 }, { "epoch": 1.05, "learning_rate": 1.926911624476448e-05, "loss": 0.6781, "step": 32845 }, { "epoch": 1.05, "learning_rate": 1.926869699551007e-05, "loss": 0.6712, "step": 32850 }, { "epoch": 1.05, "learning_rate": 1.9268277630608935e-05, "loss": 0.6799, "step": 32855 }, { "epoch": 1.05, "learning_rate": 1.9267858150066297e-05, "loss": 0.6779, "step": 32860 }, { "epoch": 1.05, "learning_rate": 1.926743855388739e-05, "loss": 0.6655, "step": 32865 }, { "epoch": 1.05, "learning_rate": 1.9267018842077455e-05, "loss": 0.682, "step": 32870 }, { "epoch": 1.05, "learning_rate": 1.9266599014641724e-05, "loss": 0.6749, "step": 32875 }, { "epoch": 1.05, "learning_rate": 1.926617907158544e-05, "loss": 0.6799, "step": 32880 }, { "epoch": 1.05, "learning_rate": 1.9265759012913836e-05, "loss": 0.687, "step": 32885 }, { "epoch": 1.05, "learning_rate": 1.9265338838632156e-05, "loss": 0.6744, "step": 32890 }, { "epoch": 1.05, "learning_rate": 1.9264918548745645e-05, "loss": 0.6783, "step": 32895 }, { "epoch": 1.05, "learning_rate": 1.9264498143259546e-05, "loss": 0.6987, "step": 32900 }, { "epoch": 1.05, "learning_rate": 1.9264077622179105e-05, "loss": 0.685, "step": 32905 }, { "epoch": 1.05, "learning_rate": 1.926365698550957e-05, "loss": 0.689, "step": 32910 }, { "epoch": 1.05, "learning_rate": 1.926323623325618e-05, "loss": 0.6874, "step": 32915 }, { "epoch": 1.05, "learning_rate": 1.92628153654242e-05, "loss": 0.6793, "step": 32920 }, { "epoch": 1.05, "learning_rate": 1.9262394382018867e-05, "loss": 0.671, "step": 32925 }, { "epoch": 1.05, "learning_rate": 1.9261973283045443e-05, "loss": 0.6773, "step": 32930 }, { "epoch": 1.05, "learning_rate": 1.9261552068509174e-05, "loss": 0.6841, "step": 32935 }, { "epoch": 1.05, "learning_rate": 1.9261130738415327e-05, "loss": 0.6842, "step": 32940 }, { "epoch": 1.05, "learning_rate": 1.9260709292769147e-05, "loss": 0.6894, "step": 32945 }, { "epoch": 1.05, "learning_rate": 1.9260287731575902e-05, "loss": 0.6733, "step": 32950 }, { "epoch": 1.05, "learning_rate": 1.925986605484085e-05, "loss": 0.6837, "step": 32955 }, { "epoch": 1.05, "learning_rate": 1.9259444262569244e-05, "loss": 0.6783, "step": 32960 }, { "epoch": 1.05, "learning_rate": 1.9259022354766353e-05, "loss": 0.6743, "step": 32965 }, { "epoch": 1.06, "learning_rate": 1.9258600331437445e-05, "loss": 0.6773, "step": 32970 }, { "epoch": 1.06, "learning_rate": 1.925817819258778e-05, "loss": 0.6816, "step": 32975 }, { "epoch": 1.06, "learning_rate": 1.9257755938222628e-05, "loss": 0.6867, "step": 32980 }, { "epoch": 1.06, "learning_rate": 1.9257333568347256e-05, "loss": 0.681, "step": 32985 }, { "epoch": 1.06, "learning_rate": 1.925691108296693e-05, "loss": 0.6759, "step": 32990 }, { "epoch": 1.06, "learning_rate": 1.925648848208693e-05, "loss": 0.6882, "step": 32995 }, { "epoch": 1.06, "learning_rate": 1.9256065765712524e-05, "loss": 0.6723, "step": 33000 }, { "epoch": 1.06, "learning_rate": 1.9255642933848983e-05, "loss": 0.6877, "step": 33005 }, { "epoch": 1.06, "learning_rate": 1.925521998650159e-05, "loss": 0.6896, "step": 33010 }, { "epoch": 1.06, "learning_rate": 1.925479692367562e-05, "loss": 0.686, "step": 33015 }, { "epoch": 1.06, "learning_rate": 1.925437374537635e-05, "loss": 0.6838, "step": 33020 }, { "epoch": 1.06, "learning_rate": 1.925395045160906e-05, "loss": 0.6762, "step": 33025 }, { "epoch": 1.06, "learning_rate": 1.925352704237903e-05, "loss": 0.6875, "step": 33030 }, { "epoch": 1.06, "learning_rate": 1.9253103517691543e-05, "loss": 0.6817, "step": 33035 }, { "epoch": 1.06, "learning_rate": 1.925267987755189e-05, "loss": 0.6772, "step": 33040 }, { "epoch": 1.06, "learning_rate": 1.9252256121965346e-05, "loss": 0.6792, "step": 33045 }, { "epoch": 1.06, "learning_rate": 1.925183225093721e-05, "loss": 0.6783, "step": 33050 }, { "epoch": 1.06, "learning_rate": 1.9251408264472758e-05, "loss": 0.6792, "step": 33055 }, { "epoch": 1.06, "learning_rate": 1.9250984162577297e-05, "loss": 0.677, "step": 33060 }, { "epoch": 1.06, "learning_rate": 1.92505599452561e-05, "loss": 0.6801, "step": 33065 }, { "epoch": 1.06, "learning_rate": 1.925013561251447e-05, "loss": 0.6756, "step": 33070 }, { "epoch": 1.06, "learning_rate": 1.9249711164357704e-05, "loss": 0.6797, "step": 33075 }, { "epoch": 1.06, "learning_rate": 1.924928660079109e-05, "loss": 0.6734, "step": 33080 }, { "epoch": 1.06, "learning_rate": 1.9248861921819934e-05, "loss": 0.6856, "step": 33085 }, { "epoch": 1.06, "learning_rate": 1.9248437127449525e-05, "loss": 0.6666, "step": 33090 }, { "epoch": 1.06, "learning_rate": 1.924801221768517e-05, "loss": 0.6755, "step": 33095 }, { "epoch": 1.06, "learning_rate": 1.9247587192532167e-05, "loss": 0.6781, "step": 33100 }, { "epoch": 1.06, "learning_rate": 1.9247162051995826e-05, "loss": 0.6762, "step": 33105 }, { "epoch": 1.06, "learning_rate": 1.9246736796081444e-05, "loss": 0.6822, "step": 33110 }, { "epoch": 1.06, "learning_rate": 1.9246311424794327e-05, "loss": 0.6719, "step": 33115 }, { "epoch": 1.06, "learning_rate": 1.924588593813979e-05, "loss": 0.6879, "step": 33120 }, { "epoch": 1.06, "learning_rate": 1.9245460336123136e-05, "loss": 0.6896, "step": 33125 }, { "epoch": 1.06, "learning_rate": 1.9245034618749673e-05, "loss": 0.693, "step": 33130 }, { "epoch": 1.06, "learning_rate": 1.9244608786024715e-05, "loss": 0.6702, "step": 33135 }, { "epoch": 1.06, "learning_rate": 1.924418283795358e-05, "loss": 0.6809, "step": 33140 }, { "epoch": 1.06, "learning_rate": 1.9243756774541574e-05, "loss": 0.6712, "step": 33145 }, { "epoch": 1.06, "learning_rate": 1.924333059579402e-05, "loss": 0.6782, "step": 33150 }, { "epoch": 1.06, "learning_rate": 1.9242904301716235e-05, "loss": 0.6795, "step": 33155 }, { "epoch": 1.06, "learning_rate": 1.9242477892313534e-05, "loss": 0.6842, "step": 33160 }, { "epoch": 1.06, "learning_rate": 1.9242051367591238e-05, "loss": 0.6734, "step": 33165 }, { "epoch": 1.06, "learning_rate": 1.9241624727554672e-05, "loss": 0.6838, "step": 33170 }, { "epoch": 1.06, "learning_rate": 1.9241197972209157e-05, "loss": 0.6816, "step": 33175 }, { "epoch": 1.06, "learning_rate": 1.924077110156002e-05, "loss": 0.6883, "step": 33180 }, { "epoch": 1.06, "learning_rate": 1.9240344115612584e-05, "loss": 0.6796, "step": 33185 }, { "epoch": 1.06, "learning_rate": 1.923991701437218e-05, "loss": 0.6768, "step": 33190 }, { "epoch": 1.06, "learning_rate": 1.9239489797844132e-05, "loss": 0.6741, "step": 33195 }, { "epoch": 1.06, "learning_rate": 1.923906246603377e-05, "loss": 0.6981, "step": 33200 }, { "epoch": 1.06, "learning_rate": 1.9238635018946438e-05, "loss": 0.6699, "step": 33205 }, { "epoch": 1.06, "learning_rate": 1.9238207456587453e-05, "loss": 0.6904, "step": 33210 }, { "epoch": 1.06, "learning_rate": 1.923777977896216e-05, "loss": 0.6775, "step": 33215 }, { "epoch": 1.06, "learning_rate": 1.923735198607589e-05, "loss": 0.6797, "step": 33220 }, { "epoch": 1.06, "learning_rate": 1.9236924077933988e-05, "loss": 0.6699, "step": 33225 }, { "epoch": 1.06, "learning_rate": 1.9236496054541783e-05, "loss": 0.6668, "step": 33230 }, { "epoch": 1.06, "learning_rate": 1.9236067915904624e-05, "loss": 0.7048, "step": 33235 }, { "epoch": 1.06, "learning_rate": 1.923563966202785e-05, "loss": 0.6844, "step": 33240 }, { "epoch": 1.06, "learning_rate": 1.92352112929168e-05, "loss": 0.6733, "step": 33245 }, { "epoch": 1.06, "learning_rate": 1.9234782808576823e-05, "loss": 0.6725, "step": 33250 }, { "epoch": 1.06, "learning_rate": 1.9234354209013268e-05, "loss": 0.6737, "step": 33255 }, { "epoch": 1.06, "learning_rate": 1.9233925494231477e-05, "loss": 0.6821, "step": 33260 }, { "epoch": 1.06, "learning_rate": 1.9233496664236804e-05, "loss": 0.6763, "step": 33265 }, { "epoch": 1.06, "learning_rate": 1.9233067719034597e-05, "loss": 0.6627, "step": 33270 }, { "epoch": 1.06, "learning_rate": 1.923263865863021e-05, "loss": 0.6798, "step": 33275 }, { "epoch": 1.06, "learning_rate": 1.923220948302899e-05, "loss": 0.6758, "step": 33280 }, { "epoch": 1.07, "learning_rate": 1.92317801922363e-05, "loss": 0.6782, "step": 33285 }, { "epoch": 1.07, "learning_rate": 1.9231350786257493e-05, "loss": 0.6738, "step": 33290 }, { "epoch": 1.07, "learning_rate": 1.9230921265097928e-05, "loss": 0.6659, "step": 33295 }, { "epoch": 1.07, "learning_rate": 1.923049162876296e-05, "loss": 0.6741, "step": 33300 }, { "epoch": 1.07, "learning_rate": 1.9230061877257957e-05, "loss": 0.6728, "step": 33305 }, { "epoch": 1.07, "learning_rate": 1.922963201058827e-05, "loss": 0.6872, "step": 33310 }, { "epoch": 1.07, "learning_rate": 1.9229202028759273e-05, "loss": 0.6714, "step": 33315 }, { "epoch": 1.07, "learning_rate": 1.922877193177633e-05, "loss": 0.6718, "step": 33320 }, { "epoch": 1.07, "learning_rate": 1.92283417196448e-05, "loss": 0.6691, "step": 33325 }, { "epoch": 1.07, "learning_rate": 1.9227911392370055e-05, "loss": 0.6726, "step": 33330 }, { "epoch": 1.07, "learning_rate": 1.9227480949957466e-05, "loss": 0.6766, "step": 33335 }, { "epoch": 1.07, "learning_rate": 1.92270503924124e-05, "loss": 0.6717, "step": 33340 }, { "epoch": 1.07, "learning_rate": 1.9226619719740235e-05, "loss": 0.6833, "step": 33345 }, { "epoch": 1.07, "learning_rate": 1.9226188931946343e-05, "loss": 0.673, "step": 33350 }, { "epoch": 1.07, "learning_rate": 1.9225758029036093e-05, "loss": 0.6793, "step": 33355 }, { "epoch": 1.07, "learning_rate": 1.922532701101486e-05, "loss": 0.6784, "step": 33360 }, { "epoch": 1.07, "learning_rate": 1.9224895877888036e-05, "loss": 0.6834, "step": 33365 }, { "epoch": 1.07, "learning_rate": 1.922446462966099e-05, "loss": 0.6757, "step": 33370 }, { "epoch": 1.07, "learning_rate": 1.9224033266339103e-05, "loss": 0.6835, "step": 33375 }, { "epoch": 1.07, "learning_rate": 1.9223601787927757e-05, "loss": 0.6706, "step": 33380 }, { "epoch": 1.07, "learning_rate": 1.9223170194432338e-05, "loss": 0.6859, "step": 33385 }, { "epoch": 1.07, "learning_rate": 1.922273848585823e-05, "loss": 0.6775, "step": 33390 }, { "epoch": 1.07, "learning_rate": 1.922230666221082e-05, "loss": 0.6857, "step": 33395 }, { "epoch": 1.07, "learning_rate": 1.9221874723495494e-05, "loss": 0.6709, "step": 33400 }, { "epoch": 1.07, "learning_rate": 1.9221442669717645e-05, "loss": 0.6805, "step": 33405 }, { "epoch": 1.07, "learning_rate": 1.9221010500882662e-05, "loss": 0.6699, "step": 33410 }, { "epoch": 1.07, "learning_rate": 1.9220578216995936e-05, "loss": 0.6814, "step": 33415 }, { "epoch": 1.07, "learning_rate": 1.9220145818062857e-05, "loss": 0.6744, "step": 33420 }, { "epoch": 1.07, "learning_rate": 1.9219713304088833e-05, "loss": 0.6704, "step": 33425 }, { "epoch": 1.07, "learning_rate": 1.9219280675079244e-05, "loss": 0.6782, "step": 33430 }, { "epoch": 1.07, "learning_rate": 1.92188479310395e-05, "loss": 0.6838, "step": 33435 }, { "epoch": 1.07, "learning_rate": 1.9218415071974998e-05, "loss": 0.6878, "step": 33440 }, { "epoch": 1.07, "learning_rate": 1.9217982097891136e-05, "loss": 0.6821, "step": 33445 }, { "epoch": 1.07, "learning_rate": 1.9217549008793318e-05, "loss": 0.6659, "step": 33450 }, { "epoch": 1.07, "learning_rate": 1.9217115804686945e-05, "loss": 0.6681, "step": 33455 }, { "epoch": 1.07, "learning_rate": 1.9216682485577425e-05, "loss": 0.6723, "step": 33460 }, { "epoch": 1.07, "learning_rate": 1.9216249051470165e-05, "loss": 0.6764, "step": 33465 }, { "epoch": 1.07, "learning_rate": 1.9215815502370573e-05, "loss": 0.6697, "step": 33470 }, { "epoch": 1.07, "learning_rate": 1.9215381838284056e-05, "loss": 0.6762, "step": 33475 }, { "epoch": 1.07, "learning_rate": 1.921494805921603e-05, "loss": 0.6656, "step": 33480 }, { "epoch": 1.07, "learning_rate": 1.92145141651719e-05, "loss": 0.6623, "step": 33485 }, { "epoch": 1.07, "learning_rate": 1.9214080156157085e-05, "loss": 0.669, "step": 33490 }, { "epoch": 1.07, "learning_rate": 1.9213646032176997e-05, "loss": 0.681, "step": 33495 }, { "epoch": 1.07, "learning_rate": 1.9213211793237056e-05, "loss": 0.6767, "step": 33500 }, { "epoch": 1.07, "learning_rate": 1.9212777439342675e-05, "loss": 0.6893, "step": 33505 }, { "epoch": 1.07, "learning_rate": 1.921234297049928e-05, "loss": 0.68, "step": 33510 }, { "epoch": 1.07, "learning_rate": 1.921190838671229e-05, "loss": 0.6661, "step": 33515 }, { "epoch": 1.07, "learning_rate": 1.9211473687987123e-05, "loss": 0.6777, "step": 33520 }, { "epoch": 1.07, "learning_rate": 1.9211038874329208e-05, "loss": 0.6834, "step": 33525 }, { "epoch": 1.07, "learning_rate": 1.9210603945743965e-05, "loss": 0.6825, "step": 33530 }, { "epoch": 1.07, "learning_rate": 1.921016890223683e-05, "loss": 0.6884, "step": 33535 }, { "epoch": 1.07, "learning_rate": 1.9209733743813218e-05, "loss": 0.6836, "step": 33540 }, { "epoch": 1.07, "learning_rate": 1.920929847047857e-05, "loss": 0.6715, "step": 33545 }, { "epoch": 1.07, "learning_rate": 1.920886308223831e-05, "loss": 0.686, "step": 33550 }, { "epoch": 1.07, "learning_rate": 1.9208427579097874e-05, "loss": 0.6803, "step": 33555 }, { "epoch": 1.07, "learning_rate": 1.9207991961062693e-05, "loss": 0.676, "step": 33560 }, { "epoch": 1.07, "learning_rate": 1.9207556228138206e-05, "loss": 0.6743, "step": 33565 }, { "epoch": 1.07, "learning_rate": 1.9207120380329844e-05, "loss": 0.676, "step": 33570 }, { "epoch": 1.07, "learning_rate": 1.9206684417643052e-05, "loss": 0.6755, "step": 33575 }, { "epoch": 1.07, "learning_rate": 1.9206248340083268e-05, "loss": 0.6741, "step": 33580 }, { "epoch": 1.07, "learning_rate": 1.9205812147655926e-05, "loss": 0.6819, "step": 33585 }, { "epoch": 1.07, "learning_rate": 1.9205375840366475e-05, "loss": 0.6907, "step": 33590 }, { "epoch": 1.08, "learning_rate": 1.920493941822036e-05, "loss": 0.686, "step": 33595 }, { "epoch": 1.08, "learning_rate": 1.9204502881223023e-05, "loss": 0.6778, "step": 33600 }, { "epoch": 1.08, "learning_rate": 1.9204066229379912e-05, "loss": 0.6646, "step": 33605 }, { "epoch": 1.08, "learning_rate": 1.9203629462696473e-05, "loss": 0.685, "step": 33610 }, { "epoch": 1.08, "learning_rate": 1.920319258117816e-05, "loss": 0.6792, "step": 33615 }, { "epoch": 1.08, "learning_rate": 1.9202755584830418e-05, "loss": 0.6722, "step": 33620 }, { "epoch": 1.08, "learning_rate": 1.9202318473658707e-05, "loss": 0.674, "step": 33625 }, { "epoch": 1.08, "learning_rate": 1.920188124766847e-05, "loss": 0.6647, "step": 33630 }, { "epoch": 1.08, "learning_rate": 1.9201443906865176e-05, "loss": 0.6728, "step": 33635 }, { "epoch": 1.08, "learning_rate": 1.9201006451254273e-05, "loss": 0.6771, "step": 33640 }, { "epoch": 1.08, "learning_rate": 1.9200568880841217e-05, "loss": 0.6818, "step": 33645 }, { "epoch": 1.08, "learning_rate": 1.9200131195631476e-05, "loss": 0.6776, "step": 33650 }, { "epoch": 1.08, "learning_rate": 1.9199693395630502e-05, "loss": 0.6878, "step": 33655 }, { "epoch": 1.08, "learning_rate": 1.919925548084377e-05, "loss": 0.6835, "step": 33660 }, { "epoch": 1.08, "learning_rate": 1.9198817451276728e-05, "loss": 0.6763, "step": 33665 }, { "epoch": 1.08, "learning_rate": 1.9198379306934855e-05, "loss": 0.6692, "step": 33670 }, { "epoch": 1.08, "learning_rate": 1.9197941047823606e-05, "loss": 0.683, "step": 33675 }, { "epoch": 1.08, "learning_rate": 1.9197502673948462e-05, "loss": 0.6733, "step": 33680 }, { "epoch": 1.08, "learning_rate": 1.9197064185314882e-05, "loss": 0.6719, "step": 33685 }, { "epoch": 1.08, "learning_rate": 1.9196625581928342e-05, "loss": 0.6795, "step": 33690 }, { "epoch": 1.08, "learning_rate": 1.9196186863794316e-05, "loss": 0.688, "step": 33695 }, { "epoch": 1.08, "learning_rate": 1.9195748030918272e-05, "loss": 0.6754, "step": 33700 }, { "epoch": 1.08, "learning_rate": 1.919530908330569e-05, "loss": 0.6793, "step": 33705 }, { "epoch": 1.08, "learning_rate": 1.919487002096205e-05, "loss": 0.6704, "step": 33710 }, { "epoch": 1.08, "learning_rate": 1.919443084389282e-05, "loss": 0.6709, "step": 33715 }, { "epoch": 1.08, "learning_rate": 1.9193991552103486e-05, "loss": 0.6714, "step": 33720 }, { "epoch": 1.08, "learning_rate": 1.9193552145599533e-05, "loss": 0.6768, "step": 33725 }, { "epoch": 1.08, "learning_rate": 1.9193112624386438e-05, "loss": 0.6802, "step": 33730 }, { "epoch": 1.08, "learning_rate": 1.9192672988469682e-05, "loss": 0.6766, "step": 33735 }, { "epoch": 1.08, "learning_rate": 1.9192233237854762e-05, "loss": 0.6757, "step": 33740 }, { "epoch": 1.08, "learning_rate": 1.9191793372547153e-05, "loss": 0.6787, "step": 33745 }, { "epoch": 1.08, "learning_rate": 1.9191353392552346e-05, "loss": 0.6653, "step": 33750 }, { "epoch": 1.08, "learning_rate": 1.9190913297875834e-05, "loss": 0.6825, "step": 33755 }, { "epoch": 1.08, "learning_rate": 1.919047308852311e-05, "loss": 0.6734, "step": 33760 }, { "epoch": 1.08, "learning_rate": 1.9190032764499658e-05, "loss": 0.6659, "step": 33765 }, { "epoch": 1.08, "learning_rate": 1.918959232581098e-05, "loss": 0.6961, "step": 33770 }, { "epoch": 1.08, "learning_rate": 1.9189151772462567e-05, "loss": 0.6761, "step": 33775 }, { "epoch": 1.08, "learning_rate": 1.918871110445992e-05, "loss": 0.678, "step": 33780 }, { "epoch": 1.08, "learning_rate": 1.918827032180853e-05, "loss": 0.6886, "step": 33785 }, { "epoch": 1.08, "learning_rate": 1.9187829424513908e-05, "loss": 0.6789, "step": 33790 }, { "epoch": 1.08, "learning_rate": 1.918738841258154e-05, "loss": 0.6771, "step": 33795 }, { "epoch": 1.08, "learning_rate": 1.918694728601694e-05, "loss": 0.6792, "step": 33800 }, { "epoch": 1.08, "learning_rate": 1.9186506044825614e-05, "loss": 0.6757, "step": 33805 }, { "epoch": 1.08, "learning_rate": 1.918606468901306e-05, "loss": 0.674, "step": 33810 }, { "epoch": 1.08, "learning_rate": 1.9185623218584785e-05, "loss": 0.6677, "step": 33815 }, { "epoch": 1.08, "learning_rate": 1.91851816335463e-05, "loss": 0.6793, "step": 33820 }, { "epoch": 1.08, "learning_rate": 1.9184739933903114e-05, "loss": 0.6618, "step": 33825 }, { "epoch": 1.08, "learning_rate": 1.918429811966074e-05, "loss": 0.6858, "step": 33830 }, { "epoch": 1.08, "learning_rate": 1.918385619082469e-05, "loss": 0.6819, "step": 33835 }, { "epoch": 1.08, "learning_rate": 1.9183414147400475e-05, "loss": 0.6744, "step": 33840 }, { "epoch": 1.08, "learning_rate": 1.9182971989393612e-05, "loss": 0.6756, "step": 33845 }, { "epoch": 1.08, "learning_rate": 1.9182529716809618e-05, "loss": 0.6863, "step": 33850 }, { "epoch": 1.08, "learning_rate": 1.9182087329654013e-05, "loss": 0.6755, "step": 33855 }, { "epoch": 1.08, "learning_rate": 1.9181644827932317e-05, "loss": 0.6854, "step": 33860 }, { "epoch": 1.08, "learning_rate": 1.9181202211650044e-05, "loss": 0.6721, "step": 33865 }, { "epoch": 1.08, "learning_rate": 1.918075948081273e-05, "loss": 0.6893, "step": 33870 }, { "epoch": 1.08, "learning_rate": 1.9180316635425883e-05, "loss": 0.676, "step": 33875 }, { "epoch": 1.08, "learning_rate": 1.917987367549504e-05, "loss": 0.6839, "step": 33880 }, { "epoch": 1.08, "learning_rate": 1.9179430601025723e-05, "loss": 0.6763, "step": 33885 }, { "epoch": 1.08, "learning_rate": 1.9178987412023465e-05, "loss": 0.6778, "step": 33890 }, { "epoch": 1.08, "learning_rate": 1.9178544108493787e-05, "loss": 0.6808, "step": 33895 }, { "epoch": 1.08, "learning_rate": 1.9178100690442233e-05, "loss": 0.6744, "step": 33900 }, { "epoch": 1.08, "learning_rate": 1.9177657157874324e-05, "loss": 0.6744, "step": 33905 }, { "epoch": 1.09, "learning_rate": 1.9177213510795594e-05, "loss": 0.6747, "step": 33910 }, { "epoch": 1.09, "learning_rate": 1.9176769749211586e-05, "loss": 0.6786, "step": 33915 }, { "epoch": 1.09, "learning_rate": 1.9176325873127837e-05, "loss": 0.6793, "step": 33920 }, { "epoch": 1.09, "learning_rate": 1.9175881882549877e-05, "loss": 0.676, "step": 33925 }, { "epoch": 1.09, "learning_rate": 1.9175437777483252e-05, "loss": 0.6843, "step": 33930 }, { "epoch": 1.09, "learning_rate": 1.9174993557933504e-05, "loss": 0.6809, "step": 33935 }, { "epoch": 1.09, "learning_rate": 1.9174549223906168e-05, "loss": 0.6763, "step": 33940 }, { "epoch": 1.09, "learning_rate": 1.91741047754068e-05, "loss": 0.6707, "step": 33945 }, { "epoch": 1.09, "learning_rate": 1.917366021244093e-05, "loss": 0.6744, "step": 33950 }, { "epoch": 1.09, "learning_rate": 1.9173215535014123e-05, "loss": 0.6882, "step": 33955 }, { "epoch": 1.09, "learning_rate": 1.9172770743131913e-05, "loss": 0.6886, "step": 33960 }, { "epoch": 1.09, "learning_rate": 1.9172325836799852e-05, "loss": 0.6636, "step": 33965 }, { "epoch": 1.09, "learning_rate": 1.91718808160235e-05, "loss": 0.668, "step": 33970 }, { "epoch": 1.09, "learning_rate": 1.9171435680808396e-05, "loss": 0.6654, "step": 33975 }, { "epoch": 1.09, "learning_rate": 1.9170990431160105e-05, "loss": 0.6808, "step": 33980 }, { "epoch": 1.09, "learning_rate": 1.9170545067084178e-05, "loss": 0.6754, "step": 33985 }, { "epoch": 1.09, "learning_rate": 1.9170099588586175e-05, "loss": 0.6743, "step": 33990 }, { "epoch": 1.09, "learning_rate": 1.916965399567165e-05, "loss": 0.6851, "step": 33995 }, { "epoch": 1.09, "learning_rate": 1.9169208288346168e-05, "loss": 0.6713, "step": 34000 }, { "epoch": 1.09, "learning_rate": 1.916876246661528e-05, "loss": 0.6775, "step": 34005 }, { "epoch": 1.09, "learning_rate": 1.9168316530484563e-05, "loss": 0.6735, "step": 34010 }, { "epoch": 1.09, "learning_rate": 1.9167870479959566e-05, "loss": 0.6746, "step": 34015 }, { "epoch": 1.09, "learning_rate": 1.9167424315045866e-05, "loss": 0.6726, "step": 34020 }, { "epoch": 1.09, "learning_rate": 1.9166978035749023e-05, "loss": 0.6856, "step": 34025 }, { "epoch": 1.09, "learning_rate": 1.916653164207461e-05, "loss": 0.6901, "step": 34030 }, { "epoch": 1.09, "learning_rate": 1.9166085134028197e-05, "loss": 0.6665, "step": 34035 }, { "epoch": 1.09, "learning_rate": 1.9165638511615346e-05, "loss": 0.6872, "step": 34040 }, { "epoch": 1.09, "learning_rate": 1.916519177484164e-05, "loss": 0.6865, "step": 34045 }, { "epoch": 1.09, "learning_rate": 1.916474492371265e-05, "loss": 0.6835, "step": 34050 }, { "epoch": 1.09, "learning_rate": 1.9164297958233954e-05, "loss": 0.6763, "step": 34055 }, { "epoch": 1.09, "learning_rate": 1.9163850878411118e-05, "loss": 0.6885, "step": 34060 }, { "epoch": 1.09, "learning_rate": 1.9163403684249734e-05, "loss": 0.6733, "step": 34065 }, { "epoch": 1.09, "learning_rate": 1.916295637575537e-05, "loss": 0.6922, "step": 34070 }, { "epoch": 1.09, "learning_rate": 1.916250895293362e-05, "loss": 0.6781, "step": 34075 }, { "epoch": 1.09, "learning_rate": 1.9162061415790053e-05, "loss": 0.6725, "step": 34080 }, { "epoch": 1.09, "learning_rate": 1.9161613764330265e-05, "loss": 0.687, "step": 34085 }, { "epoch": 1.09, "learning_rate": 1.916116599855983e-05, "loss": 0.6803, "step": 34090 }, { "epoch": 1.09, "learning_rate": 1.916071811848434e-05, "loss": 0.6862, "step": 34095 }, { "epoch": 1.09, "learning_rate": 1.9160270124109386e-05, "loss": 0.6814, "step": 34100 }, { "epoch": 1.09, "learning_rate": 1.915982201544056e-05, "loss": 0.6788, "step": 34105 }, { "epoch": 1.09, "learning_rate": 1.9159373792483444e-05, "loss": 0.6795, "step": 34110 }, { "epoch": 1.09, "learning_rate": 1.9158925455243637e-05, "loss": 0.6764, "step": 34115 }, { "epoch": 1.09, "learning_rate": 1.9158477003726728e-05, "loss": 0.6816, "step": 34120 }, { "epoch": 1.09, "learning_rate": 1.9158028437938316e-05, "loss": 0.6819, "step": 34125 }, { "epoch": 1.09, "learning_rate": 1.9157579757883997e-05, "loss": 0.6809, "step": 34130 }, { "epoch": 1.09, "learning_rate": 1.9157130963569372e-05, "loss": 0.6795, "step": 34135 }, { "epoch": 1.09, "learning_rate": 1.9156682055000034e-05, "loss": 0.6698, "step": 34140 }, { "epoch": 1.09, "learning_rate": 1.9156233032181592e-05, "loss": 0.6812, "step": 34145 }, { "epoch": 1.09, "learning_rate": 1.9155783895119642e-05, "loss": 0.6757, "step": 34150 }, { "epoch": 1.09, "learning_rate": 1.915533464381979e-05, "loss": 0.6685, "step": 34155 }, { "epoch": 1.09, "learning_rate": 1.9154885278287648e-05, "loss": 0.6644, "step": 34160 }, { "epoch": 1.09, "learning_rate": 1.915443579852881e-05, "loss": 0.672, "step": 34165 }, { "epoch": 1.09, "learning_rate": 1.9153986204548897e-05, "loss": 0.6875, "step": 34170 }, { "epoch": 1.09, "learning_rate": 1.9153536496353505e-05, "loss": 0.6897, "step": 34175 }, { "epoch": 1.09, "learning_rate": 1.915308667394826e-05, "loss": 0.6802, "step": 34180 }, { "epoch": 1.09, "learning_rate": 1.9152636737338764e-05, "loss": 0.6751, "step": 34185 }, { "epoch": 1.09, "learning_rate": 1.9152186686530634e-05, "loss": 0.6738, "step": 34190 }, { "epoch": 1.09, "learning_rate": 1.9151736521529485e-05, "loss": 0.665, "step": 34195 }, { "epoch": 1.09, "learning_rate": 1.9151286242340936e-05, "loss": 0.6766, "step": 34200 }, { "epoch": 1.09, "learning_rate": 1.9150835848970605e-05, "loss": 0.6779, "step": 34205 }, { "epoch": 1.09, "learning_rate": 1.9150385341424105e-05, "loss": 0.6758, "step": 34210 }, { "epoch": 1.09, "learning_rate": 1.9149934719707067e-05, "loss": 0.6727, "step": 34215 }, { "epoch": 1.1, "learning_rate": 1.9149483983825106e-05, "loss": 0.6652, "step": 34220 }, { "epoch": 1.1, "learning_rate": 1.914903313378385e-05, "loss": 0.6749, "step": 34225 }, { "epoch": 1.1, "learning_rate": 1.914858216958892e-05, "loss": 0.6766, "step": 34230 }, { "epoch": 1.1, "learning_rate": 1.914813109124595e-05, "loss": 0.6817, "step": 34235 }, { "epoch": 1.1, "learning_rate": 1.9147679898760557e-05, "loss": 0.6727, "step": 34240 }, { "epoch": 1.1, "learning_rate": 1.9147228592138384e-05, "loss": 0.6714, "step": 34245 }, { "epoch": 1.1, "learning_rate": 1.914677717138505e-05, "loss": 0.6567, "step": 34250 }, { "epoch": 1.1, "learning_rate": 1.9146325636506196e-05, "loss": 0.6815, "step": 34255 }, { "epoch": 1.1, "learning_rate": 1.914587398750745e-05, "loss": 0.674, "step": 34260 }, { "epoch": 1.1, "learning_rate": 1.9145422224394452e-05, "loss": 0.6785, "step": 34265 }, { "epoch": 1.1, "learning_rate": 1.9144970347172837e-05, "loss": 0.6736, "step": 34270 }, { "epoch": 1.1, "learning_rate": 1.9144518355848243e-05, "loss": 0.6772, "step": 34275 }, { "epoch": 1.1, "learning_rate": 1.9144066250426306e-05, "loss": 0.6819, "step": 34280 }, { "epoch": 1.1, "learning_rate": 1.9143614030912673e-05, "loss": 0.6694, "step": 34285 }, { "epoch": 1.1, "learning_rate": 1.9143161697312986e-05, "loss": 0.6745, "step": 34290 }, { "epoch": 1.1, "learning_rate": 1.914270924963288e-05, "loss": 0.6665, "step": 34295 }, { "epoch": 1.1, "learning_rate": 1.9142256687878012e-05, "loss": 0.6682, "step": 34300 }, { "epoch": 1.1, "learning_rate": 1.914180401205402e-05, "loss": 0.6668, "step": 34305 }, { "epoch": 1.1, "learning_rate": 1.9141351222166556e-05, "loss": 0.6707, "step": 34310 }, { "epoch": 1.1, "learning_rate": 1.914089831822127e-05, "loss": 0.6778, "step": 34315 }, { "epoch": 1.1, "learning_rate": 1.914044530022381e-05, "loss": 0.675, "step": 34320 }, { "epoch": 1.1, "learning_rate": 1.9139992168179836e-05, "loss": 0.6862, "step": 34325 }, { "epoch": 1.1, "learning_rate": 1.913953892209499e-05, "loss": 0.6798, "step": 34330 }, { "epoch": 1.1, "learning_rate": 1.9139085561974936e-05, "loss": 0.6787, "step": 34335 }, { "epoch": 1.1, "learning_rate": 1.9138632087825327e-05, "loss": 0.6798, "step": 34340 }, { "epoch": 1.1, "learning_rate": 1.9138178499651826e-05, "loss": 0.6783, "step": 34345 }, { "epoch": 1.1, "learning_rate": 1.9137724797460084e-05, "loss": 0.68, "step": 34350 }, { "epoch": 1.1, "learning_rate": 1.9137270981255765e-05, "loss": 0.6732, "step": 34355 }, { "epoch": 1.1, "learning_rate": 1.9136817051044536e-05, "loss": 0.6602, "step": 34360 }, { "epoch": 1.1, "learning_rate": 1.9136363006832057e-05, "loss": 0.6773, "step": 34365 }, { "epoch": 1.1, "learning_rate": 1.9135908848623993e-05, "loss": 0.668, "step": 34370 }, { "epoch": 1.1, "learning_rate": 1.913545457642601e-05, "loss": 0.6753, "step": 34375 }, { "epoch": 1.1, "learning_rate": 1.913500019024378e-05, "loss": 0.6783, "step": 34380 }, { "epoch": 1.1, "learning_rate": 1.9134545690082968e-05, "loss": 0.6668, "step": 34385 }, { "epoch": 1.1, "learning_rate": 1.9134091075949242e-05, "loss": 0.6866, "step": 34390 }, { "epoch": 1.1, "learning_rate": 1.9133636347848287e-05, "loss": 0.6696, "step": 34395 }, { "epoch": 1.1, "learning_rate": 1.913318150578576e-05, "loss": 0.6677, "step": 34400 }, { "epoch": 1.1, "learning_rate": 1.9132726549767353e-05, "loss": 0.6649, "step": 34405 }, { "epoch": 1.1, "learning_rate": 1.913227147979873e-05, "loss": 0.6628, "step": 34410 }, { "epoch": 1.1, "learning_rate": 1.9131816295885572e-05, "loss": 0.6672, "step": 34415 }, { "epoch": 1.1, "learning_rate": 1.913136099803356e-05, "loss": 0.6627, "step": 34420 }, { "epoch": 1.1, "learning_rate": 1.913090558624838e-05, "loss": 0.664, "step": 34425 }, { "epoch": 1.1, "learning_rate": 1.9130450060535702e-05, "loss": 0.6744, "step": 34430 }, { "epoch": 1.1, "learning_rate": 1.9129994420901217e-05, "loss": 0.6707, "step": 34435 }, { "epoch": 1.1, "learning_rate": 1.9129538667350613e-05, "loss": 0.674, "step": 34440 }, { "epoch": 1.1, "learning_rate": 1.912908279988957e-05, "loss": 0.6842, "step": 34445 }, { "epoch": 1.1, "learning_rate": 1.9128626818523776e-05, "loss": 0.6849, "step": 34450 }, { "epoch": 1.1, "learning_rate": 1.9128170723258925e-05, "loss": 0.677, "step": 34455 }, { "epoch": 1.1, "learning_rate": 1.912771451410071e-05, "loss": 0.6684, "step": 34460 }, { "epoch": 1.1, "learning_rate": 1.9127258191054814e-05, "loss": 0.6778, "step": 34465 }, { "epoch": 1.1, "learning_rate": 1.9126801754126935e-05, "loss": 0.6688, "step": 34470 }, { "epoch": 1.1, "learning_rate": 1.912634520332277e-05, "loss": 0.6732, "step": 34475 }, { "epoch": 1.1, "learning_rate": 1.9125888538648017e-05, "loss": 0.6719, "step": 34480 }, { "epoch": 1.1, "learning_rate": 1.9125431760108366e-05, "loss": 0.6831, "step": 34485 }, { "epoch": 1.1, "learning_rate": 1.9124974867709526e-05, "loss": 0.6768, "step": 34490 }, { "epoch": 1.1, "learning_rate": 1.912451786145719e-05, "loss": 0.6741, "step": 34495 }, { "epoch": 1.1, "learning_rate": 1.9124060741357065e-05, "loss": 0.6818, "step": 34500 }, { "epoch": 1.1, "learning_rate": 1.912360350741485e-05, "loss": 0.664, "step": 34505 }, { "epoch": 1.1, "learning_rate": 1.9123146159636253e-05, "loss": 0.6627, "step": 34510 }, { "epoch": 1.1, "learning_rate": 1.912268869802698e-05, "loss": 0.6754, "step": 34515 }, { "epoch": 1.1, "learning_rate": 1.912223112259274e-05, "loss": 0.6827, "step": 34520 }, { "epoch": 1.1, "learning_rate": 1.912177343333924e-05, "loss": 0.6711, "step": 34525 }, { "epoch": 1.1, "learning_rate": 1.9121315630272192e-05, "loss": 0.6721, "step": 34530 }, { "epoch": 1.11, "learning_rate": 1.912085771339731e-05, "loss": 0.6675, "step": 34535 }, { "epoch": 1.11, "learning_rate": 1.91203996827203e-05, "loss": 0.6718, "step": 34540 }, { "epoch": 1.11, "learning_rate": 1.911994153824688e-05, "loss": 0.6752, "step": 34545 }, { "epoch": 1.11, "learning_rate": 1.911948327998278e-05, "loss": 0.6821, "step": 34550 }, { "epoch": 1.11, "learning_rate": 1.9119024907933698e-05, "loss": 0.6671, "step": 34555 }, { "epoch": 1.11, "learning_rate": 1.911856642210536e-05, "loss": 0.6768, "step": 34560 }, { "epoch": 1.11, "learning_rate": 1.911810782250349e-05, "loss": 0.6847, "step": 34565 }, { "epoch": 1.11, "learning_rate": 1.9117649109133807e-05, "loss": 0.677, "step": 34570 }, { "epoch": 1.11, "learning_rate": 1.911719028200204e-05, "loss": 0.6627, "step": 34575 }, { "epoch": 1.11, "learning_rate": 1.9116731341113904e-05, "loss": 0.6651, "step": 34580 }, { "epoch": 1.11, "learning_rate": 1.9116272286475134e-05, "loss": 0.6696, "step": 34585 }, { "epoch": 1.11, "learning_rate": 1.911581311809145e-05, "loss": 0.6694, "step": 34590 }, { "epoch": 1.11, "learning_rate": 1.9115353835968588e-05, "loss": 0.6719, "step": 34595 }, { "epoch": 1.11, "learning_rate": 1.9114894440112274e-05, "loss": 0.6742, "step": 34600 }, { "epoch": 1.11, "learning_rate": 1.9114434930528242e-05, "loss": 0.6805, "step": 34605 }, { "epoch": 1.11, "learning_rate": 1.9113975307222226e-05, "loss": 0.6693, "step": 34610 }, { "epoch": 1.11, "learning_rate": 1.911351557019996e-05, "loss": 0.6721, "step": 34615 }, { "epoch": 1.11, "learning_rate": 1.9113055719467182e-05, "loss": 0.6813, "step": 34620 }, { "epoch": 1.11, "learning_rate": 1.9112595755029625e-05, "loss": 0.6622, "step": 34625 }, { "epoch": 1.11, "learning_rate": 1.911213567689303e-05, "loss": 0.6607, "step": 34630 }, { "epoch": 1.11, "learning_rate": 1.9111675485063138e-05, "loss": 0.67, "step": 34635 }, { "epoch": 1.11, "learning_rate": 1.911121517954569e-05, "loss": 0.6751, "step": 34640 }, { "epoch": 1.11, "learning_rate": 1.9110754760346434e-05, "loss": 0.677, "step": 34645 }, { "epoch": 1.11, "learning_rate": 1.911029422747111e-05, "loss": 0.6759, "step": 34650 }, { "epoch": 1.11, "learning_rate": 1.9109833580925466e-05, "loss": 0.6703, "step": 34655 }, { "epoch": 1.11, "learning_rate": 1.9109372820715248e-05, "loss": 0.6643, "step": 34660 }, { "epoch": 1.11, "learning_rate": 1.9108911946846205e-05, "loss": 0.6723, "step": 34665 }, { "epoch": 1.11, "learning_rate": 1.9108450959324086e-05, "loss": 0.6781, "step": 34670 }, { "epoch": 1.11, "learning_rate": 1.9107989858154646e-05, "loss": 0.683, "step": 34675 }, { "epoch": 1.11, "learning_rate": 1.9107528643343637e-05, "loss": 0.6863, "step": 34680 }, { "epoch": 1.11, "learning_rate": 1.9107067314896816e-05, "loss": 0.6758, "step": 34685 }, { "epoch": 1.11, "learning_rate": 1.9106605872819935e-05, "loss": 0.6667, "step": 34690 }, { "epoch": 1.11, "learning_rate": 1.9106144317118754e-05, "loss": 0.6846, "step": 34695 }, { "epoch": 1.11, "learning_rate": 1.910568264779903e-05, "loss": 0.6652, "step": 34700 }, { "epoch": 1.11, "learning_rate": 1.9105220864866524e-05, "loss": 0.6611, "step": 34705 }, { "epoch": 1.11, "learning_rate": 1.9104758968327e-05, "loss": 0.6764, "step": 34710 }, { "epoch": 1.11, "learning_rate": 1.9104296958186216e-05, "loss": 0.6675, "step": 34715 }, { "epoch": 1.11, "learning_rate": 1.9103834834449942e-05, "loss": 0.6704, "step": 34720 }, { "epoch": 1.11, "learning_rate": 1.9103372597123944e-05, "loss": 0.6817, "step": 34725 }, { "epoch": 1.11, "learning_rate": 1.9102910246213982e-05, "loss": 0.6637, "step": 34730 }, { "epoch": 1.11, "learning_rate": 1.9102447781725833e-05, "loss": 0.6714, "step": 34735 }, { "epoch": 1.11, "learning_rate": 1.9101985203665267e-05, "loss": 0.6737, "step": 34740 }, { "epoch": 1.11, "learning_rate": 1.910152251203805e-05, "loss": 0.6778, "step": 34745 }, { "epoch": 1.11, "learning_rate": 1.9101059706849957e-05, "loss": 0.6836, "step": 34750 }, { "epoch": 1.11, "learning_rate": 1.9100596788106766e-05, "loss": 0.6778, "step": 34755 }, { "epoch": 1.11, "learning_rate": 1.910013375581425e-05, "loss": 0.665, "step": 34760 }, { "epoch": 1.11, "learning_rate": 1.9099670609978184e-05, "loss": 0.6706, "step": 34765 }, { "epoch": 1.11, "learning_rate": 1.9099207350604353e-05, "loss": 0.6806, "step": 34770 }, { "epoch": 1.11, "learning_rate": 1.909874397769853e-05, "loss": 0.6701, "step": 34775 }, { "epoch": 1.11, "learning_rate": 1.90982804912665e-05, "loss": 0.678, "step": 34780 }, { "epoch": 1.11, "learning_rate": 1.909781689131405e-05, "loss": 0.6733, "step": 34785 }, { "epoch": 1.11, "learning_rate": 1.9097353177846957e-05, "loss": 0.6634, "step": 34790 }, { "epoch": 1.11, "learning_rate": 1.909688935087101e-05, "loss": 0.6868, "step": 34795 }, { "epoch": 1.11, "learning_rate": 1.9096425410392e-05, "loss": 0.6753, "step": 34800 }, { "epoch": 1.11, "learning_rate": 1.909596135641571e-05, "loss": 0.6667, "step": 34805 }, { "epoch": 1.11, "learning_rate": 1.9095497188947933e-05, "loss": 0.6788, "step": 34810 }, { "epoch": 1.11, "learning_rate": 1.909503290799446e-05, "loss": 0.6686, "step": 34815 }, { "epoch": 1.11, "learning_rate": 1.909456851356108e-05, "loss": 0.6725, "step": 34820 }, { "epoch": 1.11, "learning_rate": 1.9094104005653594e-05, "loss": 0.6693, "step": 34825 }, { "epoch": 1.11, "learning_rate": 1.9093639384277794e-05, "loss": 0.6753, "step": 34830 }, { "epoch": 1.11, "learning_rate": 1.9093174649439477e-05, "loss": 0.669, "step": 34835 }, { "epoch": 1.11, "learning_rate": 1.9092709801144445e-05, "loss": 0.6668, "step": 34840 }, { "epoch": 1.12, "learning_rate": 1.9092244839398494e-05, "loss": 0.6821, "step": 34845 }, { "epoch": 1.12, "learning_rate": 1.9091779764207425e-05, "loss": 0.6712, "step": 34850 }, { "epoch": 1.12, "learning_rate": 1.909131457557704e-05, "loss": 0.6688, "step": 34855 }, { "epoch": 1.12, "learning_rate": 1.9090849273513153e-05, "loss": 0.6552, "step": 34860 }, { "epoch": 1.12, "learning_rate": 1.909038385802156e-05, "loss": 0.6755, "step": 34865 }, { "epoch": 1.12, "learning_rate": 1.908991832910807e-05, "loss": 0.6707, "step": 34870 }, { "epoch": 1.12, "learning_rate": 1.908945268677849e-05, "loss": 0.6701, "step": 34875 }, { "epoch": 1.12, "learning_rate": 1.908898693103863e-05, "loss": 0.683, "step": 34880 }, { "epoch": 1.12, "learning_rate": 1.9088521061894306e-05, "loss": 0.6689, "step": 34885 }, { "epoch": 1.12, "learning_rate": 1.908805507935133e-05, "loss": 0.6602, "step": 34890 }, { "epoch": 1.12, "learning_rate": 1.9087588983415508e-05, "loss": 0.6715, "step": 34895 }, { "epoch": 1.12, "learning_rate": 1.9087122774092666e-05, "loss": 0.6737, "step": 34900 }, { "epoch": 1.12, "learning_rate": 1.9086656451388616e-05, "loss": 0.6675, "step": 34905 }, { "epoch": 1.12, "learning_rate": 1.9086190015309175e-05, "loss": 0.6649, "step": 34910 }, { "epoch": 1.12, "learning_rate": 1.9085723465860164e-05, "loss": 0.6778, "step": 34915 }, { "epoch": 1.12, "learning_rate": 1.908525680304741e-05, "loss": 0.6706, "step": 34920 }, { "epoch": 1.12, "learning_rate": 1.908479002687672e-05, "loss": 0.6769, "step": 34925 }, { "epoch": 1.12, "learning_rate": 1.9084323137353937e-05, "loss": 0.6675, "step": 34930 }, { "epoch": 1.12, "learning_rate": 1.9083856134484876e-05, "loss": 0.6625, "step": 34935 }, { "epoch": 1.12, "learning_rate": 1.9083389018275364e-05, "loss": 0.6721, "step": 34940 }, { "epoch": 1.12, "learning_rate": 1.9082921788731233e-05, "loss": 0.684, "step": 34945 }, { "epoch": 1.12, "learning_rate": 1.908245444585831e-05, "loss": 0.6661, "step": 34950 }, { "epoch": 1.12, "learning_rate": 1.9081986989662423e-05, "loss": 0.6907, "step": 34955 }, { "epoch": 1.12, "learning_rate": 1.9081519420149415e-05, "loss": 0.6723, "step": 34960 }, { "epoch": 1.12, "learning_rate": 1.9081051737325106e-05, "loss": 0.6744, "step": 34965 }, { "epoch": 1.12, "learning_rate": 1.9080583941195345e-05, "loss": 0.6682, "step": 34970 }, { "epoch": 1.12, "learning_rate": 1.908011603176596e-05, "loss": 0.6683, "step": 34975 }, { "epoch": 1.12, "learning_rate": 1.907964800904279e-05, "loss": 0.6702, "step": 34980 }, { "epoch": 1.12, "learning_rate": 1.9079179873031676e-05, "loss": 0.6781, "step": 34985 }, { "epoch": 1.12, "learning_rate": 1.9078711623738458e-05, "loss": 0.6631, "step": 34990 }, { "epoch": 1.12, "learning_rate": 1.9078243261168983e-05, "loss": 0.6653, "step": 34995 }, { "epoch": 1.12, "learning_rate": 1.907777478532909e-05, "loss": 0.6813, "step": 35000 }, { "epoch": 1.12, "learning_rate": 1.9077306196224622e-05, "loss": 0.6712, "step": 35005 }, { "epoch": 1.12, "learning_rate": 1.907683749386143e-05, "loss": 0.6754, "step": 35010 }, { "epoch": 1.12, "learning_rate": 1.9076368678245364e-05, "loss": 0.6723, "step": 35015 }, { "epoch": 1.12, "learning_rate": 1.9075899749382268e-05, "loss": 0.6808, "step": 35020 }, { "epoch": 1.12, "learning_rate": 1.9075430707278e-05, "loss": 0.6662, "step": 35025 }, { "epoch": 1.12, "learning_rate": 1.90749615519384e-05, "loss": 0.6706, "step": 35030 }, { "epoch": 1.12, "learning_rate": 1.9074492283369336e-05, "loss": 0.6686, "step": 35035 }, { "epoch": 1.12, "learning_rate": 1.9074022901576656e-05, "loss": 0.6688, "step": 35040 }, { "epoch": 1.12, "learning_rate": 1.9073553406566217e-05, "loss": 0.6886, "step": 35045 }, { "epoch": 1.12, "learning_rate": 1.9073083798343873e-05, "loss": 0.6717, "step": 35050 }, { "epoch": 1.12, "learning_rate": 1.9072614076915494e-05, "loss": 0.674, "step": 35055 }, { "epoch": 1.12, "learning_rate": 1.907214424228693e-05, "loss": 0.6561, "step": 35060 }, { "epoch": 1.12, "learning_rate": 1.9071674294464046e-05, "loss": 0.6818, "step": 35065 }, { "epoch": 1.12, "learning_rate": 1.9071204233452708e-05, "loss": 0.681, "step": 35070 }, { "epoch": 1.12, "learning_rate": 1.9070734059258784e-05, "loss": 0.6765, "step": 35075 }, { "epoch": 1.12, "learning_rate": 1.9070263771888133e-05, "loss": 0.6776, "step": 35080 }, { "epoch": 1.12, "learning_rate": 1.906979337134663e-05, "loss": 0.6687, "step": 35085 }, { "epoch": 1.12, "learning_rate": 1.9069322857640135e-05, "loss": 0.673, "step": 35090 }, { "epoch": 1.12, "learning_rate": 1.9068852230774525e-05, "loss": 0.6717, "step": 35095 }, { "epoch": 1.12, "learning_rate": 1.9068381490755673e-05, "loss": 0.6761, "step": 35100 }, { "epoch": 1.12, "learning_rate": 1.906791063758945e-05, "loss": 0.6654, "step": 35105 }, { "epoch": 1.12, "learning_rate": 1.9067439671281732e-05, "loss": 0.6723, "step": 35110 }, { "epoch": 1.12, "learning_rate": 1.9066968591838395e-05, "loss": 0.6777, "step": 35115 }, { "epoch": 1.12, "learning_rate": 1.906649739926532e-05, "loss": 0.667, "step": 35120 }, { "epoch": 1.12, "learning_rate": 1.906602609356838e-05, "loss": 0.6825, "step": 35125 }, { "epoch": 1.12, "learning_rate": 1.9065554674753456e-05, "loss": 0.6793, "step": 35130 }, { "epoch": 1.12, "learning_rate": 1.9065083142826436e-05, "loss": 0.6704, "step": 35135 }, { "epoch": 1.12, "learning_rate": 1.9064611497793196e-05, "loss": 0.6693, "step": 35140 }, { "epoch": 1.12, "learning_rate": 1.9064139739659628e-05, "loss": 0.6743, "step": 35145 }, { "epoch": 1.12, "learning_rate": 1.9063667868431613e-05, "loss": 0.6807, "step": 35150 }, { "epoch": 1.12, "learning_rate": 1.906319588411504e-05, "loss": 0.666, "step": 35155 }, { "epoch": 1.13, "learning_rate": 1.90627237867158e-05, "loss": 0.674, "step": 35160 }, { "epoch": 1.13, "learning_rate": 1.906225157623978e-05, "loss": 0.6623, "step": 35165 }, { "epoch": 1.13, "learning_rate": 1.9061779252692876e-05, "loss": 0.667, "step": 35170 }, { "epoch": 1.13, "learning_rate": 1.9061306816080974e-05, "loss": 0.6694, "step": 35175 }, { "epoch": 1.13, "learning_rate": 1.9060834266409977e-05, "loss": 0.6756, "step": 35180 }, { "epoch": 1.13, "learning_rate": 1.9060361603685777e-05, "loss": 0.6778, "step": 35185 }, { "epoch": 1.13, "learning_rate": 1.9059888827914273e-05, "loss": 0.668, "step": 35190 }, { "epoch": 1.13, "learning_rate": 1.905941593910136e-05, "loss": 0.6757, "step": 35195 }, { "epoch": 1.13, "learning_rate": 1.9058942937252943e-05, "loss": 0.6775, "step": 35200 }, { "epoch": 1.13, "learning_rate": 1.905846982237492e-05, "loss": 0.6715, "step": 35205 }, { "epoch": 1.13, "learning_rate": 1.90579965944732e-05, "loss": 0.6664, "step": 35210 }, { "epoch": 1.13, "learning_rate": 1.905752325355368e-05, "loss": 0.6931, "step": 35215 }, { "epoch": 1.13, "learning_rate": 1.9057049799622268e-05, "loss": 0.6755, "step": 35220 }, { "epoch": 1.13, "learning_rate": 1.9056576232684878e-05, "loss": 0.6693, "step": 35225 }, { "epoch": 1.13, "learning_rate": 1.9056102552747407e-05, "loss": 0.6702, "step": 35230 }, { "epoch": 1.13, "learning_rate": 1.9055628759815778e-05, "loss": 0.6643, "step": 35235 }, { "epoch": 1.13, "learning_rate": 1.9055154853895894e-05, "loss": 0.6734, "step": 35240 }, { "epoch": 1.13, "learning_rate": 1.905468083499367e-05, "loss": 0.6683, "step": 35245 }, { "epoch": 1.13, "learning_rate": 1.905420670311502e-05, "loss": 0.6693, "step": 35250 }, { "epoch": 1.13, "learning_rate": 1.905373245826586e-05, "loss": 0.6843, "step": 35255 }, { "epoch": 1.13, "learning_rate": 1.9053258100452108e-05, "loss": 0.673, "step": 35260 }, { "epoch": 1.13, "learning_rate": 1.9052783629679684e-05, "loss": 0.6731, "step": 35265 }, { "epoch": 1.13, "learning_rate": 1.9052309045954504e-05, "loss": 0.6801, "step": 35270 }, { "epoch": 1.13, "learning_rate": 1.905183434928249e-05, "loss": 0.6586, "step": 35275 }, { "epoch": 1.13, "learning_rate": 1.9051359539669573e-05, "loss": 0.676, "step": 35280 }, { "epoch": 1.13, "learning_rate": 1.9050884617121667e-05, "loss": 0.6637, "step": 35285 }, { "epoch": 1.13, "learning_rate": 1.90504095816447e-05, "loss": 0.6818, "step": 35290 }, { "epoch": 1.13, "learning_rate": 1.90499344332446e-05, "loss": 0.6749, "step": 35295 }, { "epoch": 1.13, "learning_rate": 1.90494591719273e-05, "loss": 0.6683, "step": 35300 }, { "epoch": 1.13, "learning_rate": 1.9048983797698723e-05, "loss": 0.6673, "step": 35305 }, { "epoch": 1.13, "learning_rate": 1.9048508310564807e-05, "loss": 0.6763, "step": 35310 }, { "epoch": 1.13, "learning_rate": 1.904803271053148e-05, "loss": 0.665, "step": 35315 }, { "epoch": 1.13, "learning_rate": 1.904755699760467e-05, "loss": 0.675, "step": 35320 }, { "epoch": 1.13, "learning_rate": 1.9047081171790327e-05, "loss": 0.6669, "step": 35325 }, { "epoch": 1.13, "learning_rate": 1.904660523309438e-05, "loss": 0.6704, "step": 35330 }, { "epoch": 1.13, "learning_rate": 1.904612918152277e-05, "loss": 0.6809, "step": 35335 }, { "epoch": 1.13, "learning_rate": 1.904565301708143e-05, "loss": 0.6648, "step": 35340 }, { "epoch": 1.13, "learning_rate": 1.9045176739776305e-05, "loss": 0.679, "step": 35345 }, { "epoch": 1.13, "learning_rate": 1.9044700349613344e-05, "loss": 0.67, "step": 35350 }, { "epoch": 1.13, "learning_rate": 1.9044223846598483e-05, "loss": 0.6688, "step": 35355 }, { "epoch": 1.13, "learning_rate": 1.9043747230737667e-05, "loss": 0.676, "step": 35360 }, { "epoch": 1.13, "learning_rate": 1.9043270502036847e-05, "loss": 0.6602, "step": 35365 }, { "epoch": 1.13, "learning_rate": 1.904279366050197e-05, "loss": 0.6648, "step": 35370 }, { "epoch": 1.13, "learning_rate": 1.9042316706138987e-05, "loss": 0.6759, "step": 35375 }, { "epoch": 1.13, "learning_rate": 1.9041839638953847e-05, "loss": 0.6726, "step": 35380 }, { "epoch": 1.13, "learning_rate": 1.9041362458952503e-05, "loss": 0.6731, "step": 35385 }, { "epoch": 1.13, "learning_rate": 1.904088516614091e-05, "loss": 0.681, "step": 35390 }, { "epoch": 1.13, "learning_rate": 1.904040776052502e-05, "loss": 0.6717, "step": 35395 }, { "epoch": 1.13, "learning_rate": 1.903993024211079e-05, "loss": 0.6816, "step": 35400 }, { "epoch": 1.13, "learning_rate": 1.903945261090418e-05, "loss": 0.6643, "step": 35405 }, { "epoch": 1.13, "learning_rate": 1.9038974866911154e-05, "loss": 0.6767, "step": 35410 }, { "epoch": 1.13, "learning_rate": 1.9038497010137666e-05, "loss": 0.6679, "step": 35415 }, { "epoch": 1.13, "learning_rate": 1.9038019040589678e-05, "loss": 0.6749, "step": 35420 }, { "epoch": 1.13, "learning_rate": 1.903754095827316e-05, "loss": 0.6667, "step": 35425 }, { "epoch": 1.13, "learning_rate": 1.9037062763194067e-05, "loss": 0.6668, "step": 35430 }, { "epoch": 1.13, "learning_rate": 1.9036584455358373e-05, "loss": 0.6691, "step": 35435 }, { "epoch": 1.13, "learning_rate": 1.903610603477205e-05, "loss": 0.6729, "step": 35440 }, { "epoch": 1.13, "learning_rate": 1.9035627501441057e-05, "loss": 0.6652, "step": 35445 }, { "epoch": 1.13, "learning_rate": 1.903514885537137e-05, "loss": 0.6727, "step": 35450 }, { "epoch": 1.13, "learning_rate": 1.903467009656896e-05, "loss": 0.6664, "step": 35455 }, { "epoch": 1.13, "learning_rate": 1.9034191225039802e-05, "loss": 0.6758, "step": 35460 }, { "epoch": 1.13, "learning_rate": 1.903371224078987e-05, "loss": 0.6769, "step": 35465 }, { "epoch": 1.14, "learning_rate": 1.9033233143825144e-05, "loss": 0.6759, "step": 35470 }, { "epoch": 1.14, "learning_rate": 1.9032753934151594e-05, "loss": 0.6764, "step": 35475 }, { "epoch": 1.14, "learning_rate": 1.9032274611775204e-05, "loss": 0.6614, "step": 35480 }, { "epoch": 1.14, "learning_rate": 1.9031795176701955e-05, "loss": 0.6701, "step": 35485 }, { "epoch": 1.14, "learning_rate": 1.9031315628937826e-05, "loss": 0.6857, "step": 35490 }, { "epoch": 1.14, "learning_rate": 1.9030835968488805e-05, "loss": 0.661, "step": 35495 }, { "epoch": 1.14, "learning_rate": 1.9030356195360875e-05, "loss": 0.6701, "step": 35500 }, { "epoch": 1.14, "learning_rate": 1.902987630956002e-05, "loss": 0.6696, "step": 35505 }, { "epoch": 1.14, "learning_rate": 1.9029396311092227e-05, "loss": 0.6698, "step": 35510 }, { "epoch": 1.14, "learning_rate": 1.9028916199963486e-05, "loss": 0.6763, "step": 35515 }, { "epoch": 1.14, "learning_rate": 1.902843597617979e-05, "loss": 0.6731, "step": 35520 }, { "epoch": 1.14, "learning_rate": 1.902795563974713e-05, "loss": 0.6671, "step": 35525 }, { "epoch": 1.14, "learning_rate": 1.90274751906715e-05, "loss": 0.6691, "step": 35530 }, { "epoch": 1.14, "learning_rate": 1.902699462895889e-05, "loss": 0.6806, "step": 35535 }, { "epoch": 1.14, "learning_rate": 1.90265139546153e-05, "loss": 0.6721, "step": 35540 }, { "epoch": 1.14, "learning_rate": 1.9026033167646727e-05, "loss": 0.6687, "step": 35545 }, { "epoch": 1.14, "learning_rate": 1.902555226805917e-05, "loss": 0.6705, "step": 35550 }, { "epoch": 1.14, "learning_rate": 1.9025071255858627e-05, "loss": 0.6656, "step": 35555 }, { "epoch": 1.14, "learning_rate": 1.9024590131051098e-05, "loss": 0.6697, "step": 35560 }, { "epoch": 1.14, "learning_rate": 1.9024108893642594e-05, "loss": 0.6808, "step": 35565 }, { "epoch": 1.14, "learning_rate": 1.9023627543639118e-05, "loss": 0.6547, "step": 35570 }, { "epoch": 1.14, "learning_rate": 1.9023146081046664e-05, "loss": 0.6725, "step": 35575 }, { "epoch": 1.14, "learning_rate": 1.9022664505871252e-05, "loss": 0.6679, "step": 35580 }, { "epoch": 1.14, "learning_rate": 1.9022182818118888e-05, "loss": 0.6643, "step": 35585 }, { "epoch": 1.14, "learning_rate": 1.9021701017795577e-05, "loss": 0.6689, "step": 35590 }, { "epoch": 1.14, "learning_rate": 1.9021219104907337e-05, "loss": 0.6746, "step": 35595 }, { "epoch": 1.14, "learning_rate": 1.9020737079460178e-05, "loss": 0.6605, "step": 35600 }, { "epoch": 1.14, "learning_rate": 1.902025494146011e-05, "loss": 0.6665, "step": 35605 }, { "epoch": 1.14, "learning_rate": 1.9019772690913158e-05, "loss": 0.6856, "step": 35610 }, { "epoch": 1.14, "learning_rate": 1.9019290327825334e-05, "loss": 0.6782, "step": 35615 }, { "epoch": 1.14, "learning_rate": 1.901880785220265e-05, "loss": 0.6639, "step": 35620 }, { "epoch": 1.14, "learning_rate": 1.901832526405114e-05, "loss": 0.6655, "step": 35625 }, { "epoch": 1.14, "learning_rate": 1.9017842563376813e-05, "loss": 0.6554, "step": 35630 }, { "epoch": 1.14, "learning_rate": 1.90173597501857e-05, "loss": 0.6742, "step": 35635 }, { "epoch": 1.14, "learning_rate": 1.9016876824483817e-05, "loss": 0.6692, "step": 35640 }, { "epoch": 1.14, "learning_rate": 1.9016393786277202e-05, "loss": 0.6597, "step": 35645 }, { "epoch": 1.14, "learning_rate": 1.901591063557187e-05, "loss": 0.6619, "step": 35650 }, { "epoch": 1.14, "learning_rate": 1.9015427372373852e-05, "loss": 0.6847, "step": 35655 }, { "epoch": 1.14, "learning_rate": 1.901494399668918e-05, "loss": 0.6703, "step": 35660 }, { "epoch": 1.14, "learning_rate": 1.9014460508523883e-05, "loss": 0.6802, "step": 35665 }, { "epoch": 1.14, "learning_rate": 1.9013976907883996e-05, "loss": 0.679, "step": 35670 }, { "epoch": 1.14, "learning_rate": 1.9013493194775553e-05, "loss": 0.6649, "step": 35675 }, { "epoch": 1.14, "learning_rate": 1.9013009369204586e-05, "loss": 0.6622, "step": 35680 }, { "epoch": 1.14, "learning_rate": 1.9012525431177134e-05, "loss": 0.6793, "step": 35685 }, { "epoch": 1.14, "learning_rate": 1.901204138069924e-05, "loss": 0.6812, "step": 35690 }, { "epoch": 1.14, "learning_rate": 1.9011557217776933e-05, "loss": 0.6631, "step": 35695 }, { "epoch": 1.14, "learning_rate": 1.901107294241626e-05, "loss": 0.6803, "step": 35700 }, { "epoch": 1.14, "learning_rate": 1.9010588554623263e-05, "loss": 0.6821, "step": 35705 }, { "epoch": 1.14, "learning_rate": 1.9010104054403988e-05, "loss": 0.6689, "step": 35710 }, { "epoch": 1.14, "learning_rate": 1.9009619441764477e-05, "loss": 0.6687, "step": 35715 }, { "epoch": 1.14, "learning_rate": 1.900913471671078e-05, "loss": 0.6817, "step": 35720 }, { "epoch": 1.14, "learning_rate": 1.9008649879248938e-05, "loss": 0.6754, "step": 35725 }, { "epoch": 1.14, "learning_rate": 1.9008164929385008e-05, "loss": 0.6722, "step": 35730 }, { "epoch": 1.14, "learning_rate": 1.9007679867125037e-05, "loss": 0.6707, "step": 35735 }, { "epoch": 1.14, "learning_rate": 1.9007194692475073e-05, "loss": 0.678, "step": 35740 }, { "epoch": 1.14, "learning_rate": 1.900670940544118e-05, "loss": 0.6645, "step": 35745 }, { "epoch": 1.14, "learning_rate": 1.9006224006029404e-05, "loss": 0.669, "step": 35750 }, { "epoch": 1.14, "learning_rate": 1.9005738494245806e-05, "loss": 0.6923, "step": 35755 }, { "epoch": 1.14, "learning_rate": 1.9005252870096446e-05, "loss": 0.6754, "step": 35760 }, { "epoch": 1.14, "learning_rate": 1.9004767133587373e-05, "loss": 0.6682, "step": 35765 }, { "epoch": 1.14, "learning_rate": 1.900428128472466e-05, "loss": 0.6797, "step": 35770 }, { "epoch": 1.14, "learning_rate": 1.9003795323514363e-05, "loss": 0.6692, "step": 35775 }, { "epoch": 1.14, "learning_rate": 1.9003309249962543e-05, "loss": 0.6783, "step": 35780 }, { "epoch": 1.15, "learning_rate": 1.9002823064075268e-05, "loss": 0.6785, "step": 35785 }, { "epoch": 1.15, "learning_rate": 1.9002336765858603e-05, "loss": 0.6629, "step": 35790 }, { "epoch": 1.15, "learning_rate": 1.900185035531862e-05, "loss": 0.671, "step": 35795 }, { "epoch": 1.15, "learning_rate": 1.9001363832461385e-05, "loss": 0.6799, "step": 35800 }, { "epoch": 1.15, "learning_rate": 1.9000877197292964e-05, "loss": 0.6502, "step": 35805 }, { "epoch": 1.15, "learning_rate": 1.9000390449819433e-05, "loss": 0.6655, "step": 35810 }, { "epoch": 1.15, "learning_rate": 1.8999903590046863e-05, "loss": 0.6694, "step": 35815 }, { "epoch": 1.15, "learning_rate": 1.8999416617981334e-05, "loss": 0.6722, "step": 35820 }, { "epoch": 1.15, "learning_rate": 1.899892953362892e-05, "loss": 0.6722, "step": 35825 }, { "epoch": 1.15, "learning_rate": 1.899844233699569e-05, "loss": 0.6681, "step": 35830 }, { "epoch": 1.15, "learning_rate": 1.8997955028087735e-05, "loss": 0.6642, "step": 35835 }, { "epoch": 1.15, "learning_rate": 1.899746760691113e-05, "loss": 0.6764, "step": 35840 }, { "epoch": 1.15, "learning_rate": 1.8996980073471953e-05, "loss": 0.6772, "step": 35845 }, { "epoch": 1.15, "learning_rate": 1.8996492427776295e-05, "loss": 0.6674, "step": 35850 }, { "epoch": 1.15, "learning_rate": 1.899600466983023e-05, "loss": 0.6693, "step": 35855 }, { "epoch": 1.15, "learning_rate": 1.8995516799639856e-05, "loss": 0.6762, "step": 35860 }, { "epoch": 1.15, "learning_rate": 1.899502881721125e-05, "loss": 0.6789, "step": 35865 }, { "epoch": 1.15, "learning_rate": 1.8994540722550504e-05, "loss": 0.6865, "step": 35870 }, { "epoch": 1.15, "learning_rate": 1.899405251566371e-05, "loss": 0.669, "step": 35875 }, { "epoch": 1.15, "learning_rate": 1.8993564196556962e-05, "loss": 0.6605, "step": 35880 }, { "epoch": 1.15, "learning_rate": 1.8993075765236342e-05, "loss": 0.6679, "step": 35885 }, { "epoch": 1.15, "learning_rate": 1.8992587221707953e-05, "loss": 0.6617, "step": 35890 }, { "epoch": 1.15, "learning_rate": 1.8992098565977893e-05, "loss": 0.6776, "step": 35895 }, { "epoch": 1.15, "learning_rate": 1.899160979805225e-05, "loss": 0.6767, "step": 35900 }, { "epoch": 1.15, "learning_rate": 1.899112091793713e-05, "loss": 0.6645, "step": 35905 }, { "epoch": 1.15, "learning_rate": 1.8990631925638627e-05, "loss": 0.6684, "step": 35910 }, { "epoch": 1.15, "learning_rate": 1.8990142821162848e-05, "loss": 0.659, "step": 35915 }, { "epoch": 1.15, "learning_rate": 1.898965360451589e-05, "loss": 0.6534, "step": 35920 }, { "epoch": 1.15, "learning_rate": 1.8989164275703864e-05, "loss": 0.6757, "step": 35925 }, { "epoch": 1.15, "learning_rate": 1.898867483473287e-05, "loss": 0.6645, "step": 35930 }, { "epoch": 1.15, "learning_rate": 1.8988185281609013e-05, "loss": 0.662, "step": 35935 }, { "epoch": 1.15, "learning_rate": 1.8987695616338405e-05, "loss": 0.6705, "step": 35940 }, { "epoch": 1.15, "learning_rate": 1.8987205838927157e-05, "loss": 0.6775, "step": 35945 }, { "epoch": 1.15, "learning_rate": 1.8986715949381378e-05, "loss": 0.6535, "step": 35950 }, { "epoch": 1.15, "learning_rate": 1.8986225947707177e-05, "loss": 0.6847, "step": 35955 }, { "epoch": 1.15, "learning_rate": 1.8985735833910675e-05, "loss": 0.6733, "step": 35960 }, { "epoch": 1.15, "learning_rate": 1.898524560799798e-05, "loss": 0.6581, "step": 35965 }, { "epoch": 1.15, "learning_rate": 1.8984755269975213e-05, "loss": 0.6691, "step": 35970 }, { "epoch": 1.15, "learning_rate": 1.8984264819848494e-05, "loss": 0.6728, "step": 35975 }, { "epoch": 1.15, "learning_rate": 1.8983774257623934e-05, "loss": 0.6529, "step": 35980 }, { "epoch": 1.15, "learning_rate": 1.8983283583307662e-05, "loss": 0.672, "step": 35985 }, { "epoch": 1.15, "learning_rate": 1.8982792796905797e-05, "loss": 0.6664, "step": 35990 }, { "epoch": 1.15, "learning_rate": 1.8982301898424465e-05, "loss": 0.6677, "step": 35995 }, { "epoch": 1.15, "learning_rate": 1.8981810887869784e-05, "loss": 0.6655, "step": 36000 }, { "epoch": 1.15, "learning_rate": 1.898131976524789e-05, "loss": 0.6789, "step": 36005 }, { "epoch": 1.15, "learning_rate": 1.8980828530564907e-05, "loss": 0.6613, "step": 36010 }, { "epoch": 1.15, "learning_rate": 1.898033718382696e-05, "loss": 0.6697, "step": 36015 }, { "epoch": 1.15, "learning_rate": 1.8979845725040186e-05, "loss": 0.6606, "step": 36020 }, { "epoch": 1.15, "learning_rate": 1.897935415421071e-05, "loss": 0.6677, "step": 36025 }, { "epoch": 1.15, "learning_rate": 1.8978862471344672e-05, "loss": 0.6691, "step": 36030 }, { "epoch": 1.15, "learning_rate": 1.8978370676448205e-05, "loss": 0.6665, "step": 36035 }, { "epoch": 1.15, "learning_rate": 1.8977878769527444e-05, "loss": 0.6656, "step": 36040 }, { "epoch": 1.15, "learning_rate": 1.8977386750588523e-05, "loss": 0.6671, "step": 36045 }, { "epoch": 1.15, "learning_rate": 1.897689461963759e-05, "loss": 0.6753, "step": 36050 }, { "epoch": 1.15, "learning_rate": 1.897640237668078e-05, "loss": 0.6764, "step": 36055 }, { "epoch": 1.15, "learning_rate": 1.897591002172423e-05, "loss": 0.6724, "step": 36060 }, { "epoch": 1.15, "learning_rate": 1.8975417554774093e-05, "loss": 0.6721, "step": 36065 }, { "epoch": 1.15, "learning_rate": 1.8974924975836507e-05, "loss": 0.6626, "step": 36070 }, { "epoch": 1.15, "learning_rate": 1.897443228491762e-05, "loss": 0.6836, "step": 36075 }, { "epoch": 1.15, "learning_rate": 1.897393948202358e-05, "loss": 0.6657, "step": 36080 }, { "epoch": 1.15, "learning_rate": 1.8973446567160535e-05, "loss": 0.6791, "step": 36085 }, { "epoch": 1.15, "learning_rate": 1.8972953540334634e-05, "loss": 0.6675, "step": 36090 }, { "epoch": 1.16, "learning_rate": 1.897246040155203e-05, "loss": 0.6749, "step": 36095 }, { "epoch": 1.16, "learning_rate": 1.897196715081888e-05, "loss": 0.6824, "step": 36100 }, { "epoch": 1.16, "learning_rate": 1.8971473788141327e-05, "loss": 0.67, "step": 36105 }, { "epoch": 1.16, "learning_rate": 1.8970980313525536e-05, "loss": 0.6716, "step": 36110 }, { "epoch": 1.16, "learning_rate": 1.897048672697766e-05, "loss": 0.6763, "step": 36115 }, { "epoch": 1.16, "learning_rate": 1.8969993028503862e-05, "loss": 0.6747, "step": 36120 }, { "epoch": 1.16, "learning_rate": 1.8969499218110302e-05, "loss": 0.6631, "step": 36125 }, { "epoch": 1.16, "learning_rate": 1.8969005295803134e-05, "loss": 0.6757, "step": 36130 }, { "epoch": 1.16, "learning_rate": 1.8968511261588528e-05, "loss": 0.6712, "step": 36135 }, { "epoch": 1.16, "learning_rate": 1.8968017115472646e-05, "loss": 0.6682, "step": 36140 }, { "epoch": 1.16, "learning_rate": 1.8967522857461652e-05, "loss": 0.6683, "step": 36145 }, { "epoch": 1.16, "learning_rate": 1.8967028487561712e-05, "loss": 0.6648, "step": 36150 }, { "epoch": 1.16, "learning_rate": 1.8966534005779e-05, "loss": 0.676, "step": 36155 }, { "epoch": 1.16, "learning_rate": 1.896603941211968e-05, "loss": 0.6775, "step": 36160 }, { "epoch": 1.16, "learning_rate": 1.8965544706589925e-05, "loss": 0.6757, "step": 36165 }, { "epoch": 1.16, "learning_rate": 1.896504988919591e-05, "loss": 0.6727, "step": 36170 }, { "epoch": 1.16, "learning_rate": 1.8964554959943803e-05, "loss": 0.66, "step": 36175 }, { "epoch": 1.16, "learning_rate": 1.8964059918839784e-05, "loss": 0.6809, "step": 36180 }, { "epoch": 1.16, "learning_rate": 1.896356476589003e-05, "loss": 0.6648, "step": 36185 }, { "epoch": 1.16, "learning_rate": 1.8963069501100717e-05, "loss": 0.6777, "step": 36190 }, { "epoch": 1.16, "learning_rate": 1.8962574124478023e-05, "loss": 0.666, "step": 36195 }, { "epoch": 1.16, "learning_rate": 1.8962078636028135e-05, "loss": 0.6665, "step": 36200 }, { "epoch": 1.16, "learning_rate": 1.8961583035757227e-05, "loss": 0.6725, "step": 36205 }, { "epoch": 1.16, "learning_rate": 1.8961087323671487e-05, "loss": 0.657, "step": 36210 }, { "epoch": 1.16, "learning_rate": 1.8960591499777104e-05, "loss": 0.6542, "step": 36215 }, { "epoch": 1.16, "learning_rate": 1.8960095564080258e-05, "loss": 0.6774, "step": 36220 }, { "epoch": 1.16, "learning_rate": 1.895959951658714e-05, "loss": 0.6609, "step": 36225 }, { "epoch": 1.16, "learning_rate": 1.895910335730394e-05, "loss": 0.6573, "step": 36230 }, { "epoch": 1.16, "learning_rate": 1.8958607086236842e-05, "loss": 0.6849, "step": 36235 }, { "epoch": 1.16, "learning_rate": 1.895811070339205e-05, "loss": 0.6641, "step": 36240 }, { "epoch": 1.16, "learning_rate": 1.8957614208775747e-05, "loss": 0.6742, "step": 36245 }, { "epoch": 1.16, "learning_rate": 1.895711760239413e-05, "loss": 0.6715, "step": 36250 }, { "epoch": 1.16, "learning_rate": 1.89566208842534e-05, "loss": 0.6666, "step": 36255 }, { "epoch": 1.16, "learning_rate": 1.895612405435975e-05, "loss": 0.663, "step": 36260 }, { "epoch": 1.16, "learning_rate": 1.895562711271938e-05, "loss": 0.6665, "step": 36265 }, { "epoch": 1.16, "learning_rate": 1.895513005933849e-05, "loss": 0.662, "step": 36270 }, { "epoch": 1.16, "learning_rate": 1.8954632894223285e-05, "loss": 0.6682, "step": 36275 }, { "epoch": 1.16, "learning_rate": 1.895413561737996e-05, "loss": 0.6796, "step": 36280 }, { "epoch": 1.16, "learning_rate": 1.895363822881473e-05, "loss": 0.6623, "step": 36285 }, { "epoch": 1.16, "learning_rate": 1.89531407285338e-05, "loss": 0.6719, "step": 36290 }, { "epoch": 1.16, "learning_rate": 1.8952643116543368e-05, "loss": 0.6548, "step": 36295 }, { "epoch": 1.16, "learning_rate": 1.895214539284965e-05, "loss": 0.6688, "step": 36300 }, { "epoch": 1.16, "learning_rate": 1.8951647557458856e-05, "loss": 0.6704, "step": 36305 }, { "epoch": 1.16, "learning_rate": 1.8951149610377193e-05, "loss": 0.6604, "step": 36310 }, { "epoch": 1.16, "learning_rate": 1.8950651551610878e-05, "loss": 0.6578, "step": 36315 }, { "epoch": 1.16, "learning_rate": 1.8950153381166126e-05, "loss": 0.6605, "step": 36320 }, { "epoch": 1.16, "learning_rate": 1.894965509904915e-05, "loss": 0.6784, "step": 36325 }, { "epoch": 1.16, "learning_rate": 1.894915670526617e-05, "loss": 0.6669, "step": 36330 }, { "epoch": 1.16, "learning_rate": 1.8948658199823402e-05, "loss": 0.6708, "step": 36335 }, { "epoch": 1.16, "learning_rate": 1.8948159582727067e-05, "loss": 0.6679, "step": 36340 }, { "epoch": 1.16, "learning_rate": 1.8947660853983387e-05, "loss": 0.675, "step": 36345 }, { "epoch": 1.16, "learning_rate": 1.894716201359858e-05, "loss": 0.6787, "step": 36350 }, { "epoch": 1.16, "learning_rate": 1.8946663061578877e-05, "loss": 0.6764, "step": 36355 }, { "epoch": 1.16, "learning_rate": 1.89461639979305e-05, "loss": 0.6746, "step": 36360 }, { "epoch": 1.16, "learning_rate": 1.8945664822659675e-05, "loss": 0.6643, "step": 36365 }, { "epoch": 1.16, "learning_rate": 1.8945165535772632e-05, "loss": 0.6739, "step": 36370 }, { "epoch": 1.16, "learning_rate": 1.89446661372756e-05, "loss": 0.6826, "step": 36375 }, { "epoch": 1.16, "learning_rate": 1.894416662717481e-05, "loss": 0.6622, "step": 36380 }, { "epoch": 1.16, "learning_rate": 1.8943667005476498e-05, "loss": 0.6647, "step": 36385 }, { "epoch": 1.16, "learning_rate": 1.894316727218689e-05, "loss": 0.6733, "step": 36390 }, { "epoch": 1.16, "learning_rate": 1.894266742731223e-05, "loss": 0.6666, "step": 36395 }, { "epoch": 1.16, "learning_rate": 1.8942167470858747e-05, "loss": 0.6664, "step": 36400 }, { "epoch": 1.16, "learning_rate": 1.8941667402832683e-05, "loss": 0.6676, "step": 36405 }, { "epoch": 1.17, "learning_rate": 1.8941167223240277e-05, "loss": 0.6574, "step": 36410 }, { "epoch": 1.17, "learning_rate": 1.894066693208777e-05, "loss": 0.6669, "step": 36415 }, { "epoch": 1.17, "learning_rate": 1.894016652938141e-05, "loss": 0.6798, "step": 36420 }, { "epoch": 1.17, "learning_rate": 1.8939666015127424e-05, "loss": 0.6654, "step": 36425 }, { "epoch": 1.17, "learning_rate": 1.893916538933207e-05, "loss": 0.6812, "step": 36430 }, { "epoch": 1.17, "learning_rate": 1.8938664652001596e-05, "loss": 0.6746, "step": 36435 }, { "epoch": 1.17, "learning_rate": 1.8938163803142244e-05, "loss": 0.6689, "step": 36440 }, { "epoch": 1.17, "learning_rate": 1.893766284276026e-05, "loss": 0.6791, "step": 36445 }, { "epoch": 1.17, "learning_rate": 1.8937161770861906e-05, "loss": 0.6782, "step": 36450 }, { "epoch": 1.17, "learning_rate": 1.8936660587453427e-05, "loss": 0.6739, "step": 36455 }, { "epoch": 1.17, "learning_rate": 1.893615929254107e-05, "loss": 0.6711, "step": 36460 }, { "epoch": 1.17, "learning_rate": 1.8935657886131102e-05, "loss": 0.6683, "step": 36465 }, { "epoch": 1.17, "learning_rate": 1.8935156368229773e-05, "loss": 0.6764, "step": 36470 }, { "epoch": 1.17, "learning_rate": 1.893465473884334e-05, "loss": 0.6674, "step": 36475 }, { "epoch": 1.17, "learning_rate": 1.8934152997978065e-05, "loss": 0.6729, "step": 36480 }, { "epoch": 1.17, "learning_rate": 1.89336511456402e-05, "loss": 0.6682, "step": 36485 }, { "epoch": 1.17, "learning_rate": 1.893314918183602e-05, "loss": 0.6662, "step": 36490 }, { "epoch": 1.17, "learning_rate": 1.8932647106571775e-05, "loss": 0.6727, "step": 36495 }, { "epoch": 1.17, "learning_rate": 1.893214491985374e-05, "loss": 0.6533, "step": 36500 }, { "epoch": 1.17, "learning_rate": 1.893164262168817e-05, "loss": 0.6609, "step": 36505 }, { "epoch": 1.17, "learning_rate": 1.893114021208134e-05, "loss": 0.6734, "step": 36510 }, { "epoch": 1.17, "learning_rate": 1.893063769103952e-05, "loss": 0.6769, "step": 36515 }, { "epoch": 1.17, "learning_rate": 1.8930135058568977e-05, "loss": 0.6694, "step": 36520 }, { "epoch": 1.17, "learning_rate": 1.8929632314675982e-05, "loss": 0.6636, "step": 36525 }, { "epoch": 1.17, "learning_rate": 1.8929129459366805e-05, "loss": 0.6729, "step": 36530 }, { "epoch": 1.17, "learning_rate": 1.892862649264773e-05, "loss": 0.6671, "step": 36535 }, { "epoch": 1.17, "learning_rate": 1.8928123414525018e-05, "loss": 0.6701, "step": 36540 }, { "epoch": 1.17, "learning_rate": 1.8927620225004958e-05, "loss": 0.6604, "step": 36545 }, { "epoch": 1.17, "learning_rate": 1.8927116924093824e-05, "loss": 0.6804, "step": 36550 }, { "epoch": 1.17, "learning_rate": 1.8926613511797898e-05, "loss": 0.6725, "step": 36555 }, { "epoch": 1.17, "learning_rate": 1.8926109988123455e-05, "loss": 0.6677, "step": 36560 }, { "epoch": 1.17, "learning_rate": 1.8925606353076787e-05, "loss": 0.6646, "step": 36565 }, { "epoch": 1.17, "learning_rate": 1.892510260666417e-05, "loss": 0.667, "step": 36570 }, { "epoch": 1.17, "learning_rate": 1.8924598748891888e-05, "loss": 0.6546, "step": 36575 }, { "epoch": 1.17, "learning_rate": 1.8924094779766237e-05, "loss": 0.6677, "step": 36580 }, { "epoch": 1.17, "learning_rate": 1.8923590699293497e-05, "loss": 0.6695, "step": 36585 }, { "epoch": 1.17, "learning_rate": 1.8923086507479963e-05, "loss": 0.6752, "step": 36590 }, { "epoch": 1.17, "learning_rate": 1.8922582204331918e-05, "loss": 0.6736, "step": 36595 }, { "epoch": 1.17, "learning_rate": 1.8922077789855665e-05, "loss": 0.6671, "step": 36600 }, { "epoch": 1.17, "learning_rate": 1.8921573264057488e-05, "loss": 0.6684, "step": 36605 }, { "epoch": 1.17, "learning_rate": 1.892106862694369e-05, "loss": 0.6655, "step": 36610 }, { "epoch": 1.17, "learning_rate": 1.8920563878520562e-05, "loss": 0.6726, "step": 36615 }, { "epoch": 1.17, "learning_rate": 1.89200590187944e-05, "loss": 0.6675, "step": 36620 }, { "epoch": 1.17, "learning_rate": 1.8919554047771508e-05, "loss": 0.6704, "step": 36625 }, { "epoch": 1.17, "learning_rate": 1.891904896545819e-05, "loss": 0.664, "step": 36630 }, { "epoch": 1.17, "learning_rate": 1.8918543771860734e-05, "loss": 0.6727, "step": 36635 }, { "epoch": 1.17, "learning_rate": 1.891803846698546e-05, "loss": 0.6644, "step": 36640 }, { "epoch": 1.17, "learning_rate": 1.8917533050838663e-05, "loss": 0.6693, "step": 36645 }, { "epoch": 1.17, "learning_rate": 1.8917027523426648e-05, "loss": 0.6599, "step": 36650 }, { "epoch": 1.17, "learning_rate": 1.891652188475573e-05, "loss": 0.6841, "step": 36655 }, { "epoch": 1.17, "learning_rate": 1.8916016134832213e-05, "loss": 0.6577, "step": 36660 }, { "epoch": 1.17, "learning_rate": 1.8915510273662406e-05, "loss": 0.6729, "step": 36665 }, { "epoch": 1.17, "learning_rate": 1.8915004301252626e-05, "loss": 0.6646, "step": 36670 }, { "epoch": 1.17, "learning_rate": 1.891449821760918e-05, "loss": 0.655, "step": 36675 }, { "epoch": 1.17, "learning_rate": 1.8913992022738386e-05, "loss": 0.6656, "step": 36680 }, { "epoch": 1.17, "learning_rate": 1.891348571664656e-05, "loss": 0.6686, "step": 36685 }, { "epoch": 1.17, "learning_rate": 1.8912979299340016e-05, "loss": 0.6715, "step": 36690 }, { "epoch": 1.17, "learning_rate": 1.891247277082508e-05, "loss": 0.6614, "step": 36695 }, { "epoch": 1.17, "learning_rate": 1.8911966131108064e-05, "loss": 0.6606, "step": 36700 }, { "epoch": 1.17, "learning_rate": 1.8911459380195293e-05, "loss": 0.6557, "step": 36705 }, { "epoch": 1.17, "learning_rate": 1.8910952518093087e-05, "loss": 0.6771, "step": 36710 }, { "epoch": 1.17, "learning_rate": 1.8910445544807774e-05, "loss": 0.6597, "step": 36715 }, { "epoch": 1.18, "learning_rate": 1.8909938460345677e-05, "loss": 0.6653, "step": 36720 }, { "epoch": 1.18, "learning_rate": 1.8909431264713128e-05, "loss": 0.6774, "step": 36725 }, { "epoch": 1.18, "learning_rate": 1.890892395791645e-05, "loss": 0.6688, "step": 36730 }, { "epoch": 1.18, "learning_rate": 1.890841653996197e-05, "loss": 0.6649, "step": 36735 }, { "epoch": 1.18, "learning_rate": 1.890790901085603e-05, "loss": 0.6599, "step": 36740 }, { "epoch": 1.18, "learning_rate": 1.890740137060495e-05, "loss": 0.6728, "step": 36745 }, { "epoch": 1.18, "learning_rate": 1.890689361921507e-05, "loss": 0.6789, "step": 36750 }, { "epoch": 1.18, "learning_rate": 1.8906385756692724e-05, "loss": 0.6658, "step": 36755 }, { "epoch": 1.18, "learning_rate": 1.890587778304425e-05, "loss": 0.6656, "step": 36760 }, { "epoch": 1.18, "learning_rate": 1.890536969827599e-05, "loss": 0.664, "step": 36765 }, { "epoch": 1.18, "learning_rate": 1.8904861502394275e-05, "loss": 0.6735, "step": 36770 }, { "epoch": 1.18, "learning_rate": 1.890435319540545e-05, "loss": 0.6646, "step": 36775 }, { "epoch": 1.18, "learning_rate": 1.8903844777315855e-05, "loss": 0.675, "step": 36780 }, { "epoch": 1.18, "learning_rate": 1.890333624813184e-05, "loss": 0.6635, "step": 36785 }, { "epoch": 1.18, "learning_rate": 1.8902827607859742e-05, "loss": 0.662, "step": 36790 }, { "epoch": 1.18, "learning_rate": 1.8902318856505916e-05, "loss": 0.6626, "step": 36795 }, { "epoch": 1.18, "learning_rate": 1.8901809994076702e-05, "loss": 0.6584, "step": 36800 }, { "epoch": 1.18, "learning_rate": 1.890130102057845e-05, "loss": 0.6758, "step": 36805 }, { "epoch": 1.18, "learning_rate": 1.8900791936017518e-05, "loss": 0.6631, "step": 36810 }, { "epoch": 1.18, "learning_rate": 1.8900282740400247e-05, "loss": 0.6652, "step": 36815 }, { "epoch": 1.18, "learning_rate": 1.8899773433732996e-05, "loss": 0.6706, "step": 36820 }, { "epoch": 1.18, "learning_rate": 1.889926401602212e-05, "loss": 0.6721, "step": 36825 }, { "epoch": 1.18, "learning_rate": 1.8898754487273975e-05, "loss": 0.6634, "step": 36830 }, { "epoch": 1.18, "learning_rate": 1.889824484749492e-05, "loss": 0.6667, "step": 36835 }, { "epoch": 1.18, "learning_rate": 1.889773509669131e-05, "loss": 0.6546, "step": 36840 }, { "epoch": 1.18, "learning_rate": 1.8897225234869505e-05, "loss": 0.6578, "step": 36845 }, { "epoch": 1.18, "learning_rate": 1.889671526203587e-05, "loss": 0.6687, "step": 36850 }, { "epoch": 1.18, "learning_rate": 1.8896205178196766e-05, "loss": 0.6827, "step": 36855 }, { "epoch": 1.18, "learning_rate": 1.889569498335856e-05, "loss": 0.6658, "step": 36860 }, { "epoch": 1.18, "learning_rate": 1.8895184677527615e-05, "loss": 0.6733, "step": 36865 }, { "epoch": 1.18, "learning_rate": 1.8894674260710296e-05, "loss": 0.6607, "step": 36870 }, { "epoch": 1.18, "learning_rate": 1.889416373291298e-05, "loss": 0.6596, "step": 36875 }, { "epoch": 1.18, "learning_rate": 1.8893653094142027e-05, "loss": 0.6526, "step": 36880 }, { "epoch": 1.18, "learning_rate": 1.8893142344403812e-05, "loss": 0.6461, "step": 36885 }, { "epoch": 1.18, "learning_rate": 1.8892631483704708e-05, "loss": 0.669, "step": 36890 }, { "epoch": 1.18, "learning_rate": 1.889212051205109e-05, "loss": 0.6619, "step": 36895 }, { "epoch": 1.18, "learning_rate": 1.8891609429449335e-05, "loss": 0.6767, "step": 36900 }, { "epoch": 1.18, "learning_rate": 1.8891098235905815e-05, "loss": 0.6591, "step": 36905 }, { "epoch": 1.18, "learning_rate": 1.8890586931426912e-05, "loss": 0.6643, "step": 36910 }, { "epoch": 1.18, "learning_rate": 1.8890075516019006e-05, "loss": 0.6621, "step": 36915 }, { "epoch": 1.18, "learning_rate": 1.8889563989688476e-05, "loss": 0.655, "step": 36920 }, { "epoch": 1.18, "learning_rate": 1.8889052352441702e-05, "loss": 0.6691, "step": 36925 }, { "epoch": 1.18, "learning_rate": 1.8888540604285075e-05, "loss": 0.6639, "step": 36930 }, { "epoch": 1.18, "learning_rate": 1.8888028745224973e-05, "loss": 0.6791, "step": 36935 }, { "epoch": 1.18, "learning_rate": 1.8887516775267788e-05, "loss": 0.6662, "step": 36940 }, { "epoch": 1.18, "learning_rate": 1.8887004694419902e-05, "loss": 0.656, "step": 36945 }, { "epoch": 1.18, "learning_rate": 1.888649250268771e-05, "loss": 0.6647, "step": 36950 }, { "epoch": 1.18, "learning_rate": 1.8885980200077595e-05, "loss": 0.6702, "step": 36955 }, { "epoch": 1.18, "learning_rate": 1.888546778659596e-05, "loss": 0.6711, "step": 36960 }, { "epoch": 1.18, "learning_rate": 1.8884955262249193e-05, "loss": 0.6587, "step": 36965 }, { "epoch": 1.18, "learning_rate": 1.8884442627043688e-05, "loss": 0.6563, "step": 36970 }, { "epoch": 1.18, "learning_rate": 1.888392988098584e-05, "loss": 0.6587, "step": 36975 }, { "epoch": 1.18, "learning_rate": 1.8883417024082047e-05, "loss": 0.6828, "step": 36980 }, { "epoch": 1.18, "learning_rate": 1.8882904056338712e-05, "loss": 0.6745, "step": 36985 }, { "epoch": 1.18, "learning_rate": 1.8882390977762234e-05, "loss": 0.664, "step": 36990 }, { "epoch": 1.18, "learning_rate": 1.888187778835901e-05, "loss": 0.6646, "step": 36995 }, { "epoch": 1.18, "learning_rate": 1.8881364488135448e-05, "loss": 0.6614, "step": 37000 }, { "epoch": 1.18, "learning_rate": 1.8880851077097952e-05, "loss": 0.6759, "step": 37005 }, { "epoch": 1.18, "learning_rate": 1.8880337555252923e-05, "loss": 0.6706, "step": 37010 }, { "epoch": 1.18, "learning_rate": 1.8879823922606777e-05, "loss": 0.67, "step": 37015 }, { "epoch": 1.18, "learning_rate": 1.8879310179165915e-05, "loss": 0.6757, "step": 37020 }, { "epoch": 1.18, "learning_rate": 1.8878796324936752e-05, "loss": 0.6597, "step": 37025 }, { "epoch": 1.18, "learning_rate": 1.8878282359925698e-05, "loss": 0.6629, "step": 37030 }, { "epoch": 1.19, "learning_rate": 1.8877768284139164e-05, "loss": 0.6703, "step": 37035 }, { "epoch": 1.19, "learning_rate": 1.8877254097583566e-05, "loss": 0.6724, "step": 37040 }, { "epoch": 1.19, "learning_rate": 1.887673980026532e-05, "loss": 0.6585, "step": 37045 }, { "epoch": 1.19, "learning_rate": 1.887622539219084e-05, "loss": 0.6677, "step": 37050 }, { "epoch": 1.19, "learning_rate": 1.8875710873366545e-05, "loss": 0.6791, "step": 37055 }, { "epoch": 1.19, "learning_rate": 1.8875196243798858e-05, "loss": 0.6647, "step": 37060 }, { "epoch": 1.19, "learning_rate": 1.8874681503494197e-05, "loss": 0.6754, "step": 37065 }, { "epoch": 1.19, "learning_rate": 1.887416665245899e-05, "loss": 0.6721, "step": 37070 }, { "epoch": 1.19, "learning_rate": 1.8873651690699652e-05, "loss": 0.6747, "step": 37075 }, { "epoch": 1.19, "learning_rate": 1.8873136618222615e-05, "loss": 0.6533, "step": 37080 }, { "epoch": 1.19, "learning_rate": 1.88726214350343e-05, "loss": 0.6625, "step": 37085 }, { "epoch": 1.19, "learning_rate": 1.887210614114114e-05, "loss": 0.6599, "step": 37090 }, { "epoch": 1.19, "learning_rate": 1.8871590736549564e-05, "loss": 0.6592, "step": 37095 }, { "epoch": 1.19, "learning_rate": 1.8871075221266003e-05, "loss": 0.6733, "step": 37100 }, { "epoch": 1.19, "learning_rate": 1.8870559595296883e-05, "loss": 0.6702, "step": 37105 }, { "epoch": 1.19, "learning_rate": 1.8870043858648644e-05, "loss": 0.6707, "step": 37110 }, { "epoch": 1.19, "learning_rate": 1.886952801132772e-05, "loss": 0.6651, "step": 37115 }, { "epoch": 1.19, "learning_rate": 1.8869012053340546e-05, "loss": 0.6823, "step": 37120 }, { "epoch": 1.19, "learning_rate": 1.886849598469356e-05, "loss": 0.6845, "step": 37125 }, { "epoch": 1.19, "learning_rate": 1.8867979805393203e-05, "loss": 0.6625, "step": 37130 }, { "epoch": 1.19, "learning_rate": 1.886746351544591e-05, "loss": 0.6745, "step": 37135 }, { "epoch": 1.19, "learning_rate": 1.8866947114858128e-05, "loss": 0.6689, "step": 37140 }, { "epoch": 1.19, "learning_rate": 1.88664306036363e-05, "loss": 0.6562, "step": 37145 }, { "epoch": 1.19, "learning_rate": 1.8865913981786867e-05, "loss": 0.6657, "step": 37150 }, { "epoch": 1.19, "learning_rate": 1.8865397249316277e-05, "loss": 0.6636, "step": 37155 }, { "epoch": 1.19, "learning_rate": 1.886488040623098e-05, "loss": 0.6691, "step": 37160 }, { "epoch": 1.19, "learning_rate": 1.886436345253742e-05, "loss": 0.6654, "step": 37165 }, { "epoch": 1.19, "learning_rate": 1.8863846388242047e-05, "loss": 0.6655, "step": 37170 }, { "epoch": 1.19, "learning_rate": 1.8863329213351318e-05, "loss": 0.6788, "step": 37175 }, { "epoch": 1.19, "learning_rate": 1.8862811927871686e-05, "loss": 0.6551, "step": 37180 }, { "epoch": 1.19, "learning_rate": 1.8862294531809596e-05, "loss": 0.6715, "step": 37185 }, { "epoch": 1.19, "learning_rate": 1.8861777025171512e-05, "loss": 0.6657, "step": 37190 }, { "epoch": 1.19, "learning_rate": 1.8861259407963888e-05, "loss": 0.6769, "step": 37195 }, { "epoch": 1.19, "learning_rate": 1.886074168019318e-05, "loss": 0.6512, "step": 37200 }, { "epoch": 1.19, "learning_rate": 1.8860223841865856e-05, "loss": 0.6724, "step": 37205 }, { "epoch": 1.19, "learning_rate": 1.8859705892988366e-05, "loss": 0.6696, "step": 37210 }, { "epoch": 1.19, "learning_rate": 1.8859187833567182e-05, "loss": 0.6735, "step": 37215 }, { "epoch": 1.19, "learning_rate": 1.8858669663608764e-05, "loss": 0.6598, "step": 37220 }, { "epoch": 1.19, "learning_rate": 1.8858151383119576e-05, "loss": 0.668, "step": 37225 }, { "epoch": 1.19, "learning_rate": 1.8857632992106087e-05, "loss": 0.6681, "step": 37230 }, { "epoch": 1.19, "learning_rate": 1.8857114490574765e-05, "loss": 0.6598, "step": 37235 }, { "epoch": 1.19, "learning_rate": 1.8856595878532074e-05, "loss": 0.6667, "step": 37240 }, { "epoch": 1.19, "learning_rate": 1.8856077155984493e-05, "loss": 0.6681, "step": 37245 }, { "epoch": 1.19, "learning_rate": 1.8855558322938492e-05, "loss": 0.6562, "step": 37250 }, { "epoch": 1.19, "learning_rate": 1.885503937940054e-05, "loss": 0.6551, "step": 37255 }, { "epoch": 1.19, "learning_rate": 1.8854520325377117e-05, "loss": 0.6658, "step": 37260 }, { "epoch": 1.19, "learning_rate": 1.8854001160874696e-05, "loss": 0.6687, "step": 37265 }, { "epoch": 1.19, "learning_rate": 1.8853481885899755e-05, "loss": 0.6648, "step": 37270 }, { "epoch": 1.19, "learning_rate": 1.8852962500458775e-05, "loss": 0.6697, "step": 37275 }, { "epoch": 1.19, "learning_rate": 1.8852443004558237e-05, "loss": 0.6677, "step": 37280 }, { "epoch": 1.19, "learning_rate": 1.8851923398204616e-05, "loss": 0.6726, "step": 37285 }, { "epoch": 1.19, "learning_rate": 1.8851403681404408e-05, "loss": 0.6771, "step": 37290 }, { "epoch": 1.19, "learning_rate": 1.8850883854164083e-05, "loss": 0.6623, "step": 37295 }, { "epoch": 1.19, "learning_rate": 1.8850363916490137e-05, "loss": 0.6664, "step": 37300 }, { "epoch": 1.19, "learning_rate": 1.8849843868389055e-05, "loss": 0.6693, "step": 37305 }, { "epoch": 1.19, "learning_rate": 1.8849323709867324e-05, "loss": 0.6724, "step": 37310 }, { "epoch": 1.19, "learning_rate": 1.8848803440931437e-05, "loss": 0.6616, "step": 37315 }, { "epoch": 1.19, "learning_rate": 1.884828306158788e-05, "loss": 0.66, "step": 37320 }, { "epoch": 1.19, "learning_rate": 1.8847762571843153e-05, "loss": 0.6731, "step": 37325 }, { "epoch": 1.19, "learning_rate": 1.8847241971703743e-05, "loss": 0.6719, "step": 37330 }, { "epoch": 1.19, "learning_rate": 1.8846721261176153e-05, "loss": 0.6562, "step": 37335 }, { "epoch": 1.19, "learning_rate": 1.8846200440266875e-05, "loss": 0.669, "step": 37340 }, { "epoch": 1.2, "learning_rate": 1.8845679508982407e-05, "loss": 0.659, "step": 37345 }, { "epoch": 1.2, "learning_rate": 1.8845158467329248e-05, "loss": 0.6667, "step": 37350 }, { "epoch": 1.2, "learning_rate": 1.8844637315313904e-05, "loss": 0.6514, "step": 37355 }, { "epoch": 1.2, "learning_rate": 1.8844116052942878e-05, "loss": 0.6614, "step": 37360 }, { "epoch": 1.2, "learning_rate": 1.8843594680222667e-05, "loss": 0.6571, "step": 37365 }, { "epoch": 1.2, "learning_rate": 1.8843073197159782e-05, "loss": 0.668, "step": 37370 }, { "epoch": 1.2, "learning_rate": 1.8842551603760725e-05, "loss": 0.6583, "step": 37375 }, { "epoch": 1.2, "learning_rate": 1.8842029900032005e-05, "loss": 0.6669, "step": 37380 }, { "epoch": 1.2, "learning_rate": 1.8841508085980137e-05, "loss": 0.6628, "step": 37385 }, { "epoch": 1.2, "learning_rate": 1.8840986161611626e-05, "loss": 0.6598, "step": 37390 }, { "epoch": 1.2, "learning_rate": 1.8840464126932988e-05, "loss": 0.6732, "step": 37395 }, { "epoch": 1.2, "learning_rate": 1.883994198195073e-05, "loss": 0.6702, "step": 37400 }, { "epoch": 1.2, "learning_rate": 1.8839419726671375e-05, "loss": 0.6652, "step": 37405 }, { "epoch": 1.2, "learning_rate": 1.8838897361101433e-05, "loss": 0.6745, "step": 37410 }, { "epoch": 1.2, "learning_rate": 1.8838374885247426e-05, "loss": 0.6708, "step": 37415 }, { "epoch": 1.2, "learning_rate": 1.883785229911587e-05, "loss": 0.6687, "step": 37420 }, { "epoch": 1.2, "learning_rate": 1.8837329602713286e-05, "loss": 0.6791, "step": 37425 }, { "epoch": 1.2, "learning_rate": 1.8836806796046194e-05, "loss": 0.6676, "step": 37430 }, { "epoch": 1.2, "learning_rate": 1.883628387912112e-05, "loss": 0.659, "step": 37435 }, { "epoch": 1.2, "learning_rate": 1.883576085194459e-05, "loss": 0.6608, "step": 37440 }, { "epoch": 1.2, "learning_rate": 1.8835237714523127e-05, "loss": 0.6629, "step": 37445 }, { "epoch": 1.2, "learning_rate": 1.883471446686326e-05, "loss": 0.673, "step": 37450 }, { "epoch": 1.2, "learning_rate": 1.8834191108971516e-05, "loss": 0.6494, "step": 37455 }, { "epoch": 1.2, "learning_rate": 1.8833667640854423e-05, "loss": 0.6665, "step": 37460 }, { "epoch": 1.2, "learning_rate": 1.8833144062518517e-05, "loss": 0.6623, "step": 37465 }, { "epoch": 1.2, "learning_rate": 1.8832620373970326e-05, "loss": 0.6569, "step": 37470 }, { "epoch": 1.2, "learning_rate": 1.883209657521639e-05, "loss": 0.6601, "step": 37475 }, { "epoch": 1.2, "learning_rate": 1.883157266626324e-05, "loss": 0.6489, "step": 37480 }, { "epoch": 1.2, "learning_rate": 1.8831048647117415e-05, "loss": 0.659, "step": 37485 }, { "epoch": 1.2, "learning_rate": 1.883052451778545e-05, "loss": 0.6613, "step": 37490 }, { "epoch": 1.2, "learning_rate": 1.883000027827389e-05, "loss": 0.6612, "step": 37495 }, { "epoch": 1.2, "learning_rate": 1.8829475928589272e-05, "loss": 0.6553, "step": 37500 }, { "epoch": 1.2, "learning_rate": 1.8828951468738138e-05, "loss": 0.6827, "step": 37505 }, { "epoch": 1.2, "learning_rate": 1.8828426898727035e-05, "loss": 0.6611, "step": 37510 }, { "epoch": 1.2, "learning_rate": 1.8827902218562505e-05, "loss": 0.666, "step": 37515 }, { "epoch": 1.2, "learning_rate": 1.8827377428251096e-05, "loss": 0.671, "step": 37520 }, { "epoch": 1.2, "learning_rate": 1.8826852527799355e-05, "loss": 0.6716, "step": 37525 }, { "epoch": 1.2, "learning_rate": 1.8826327517213835e-05, "loss": 0.6727, "step": 37530 }, { "epoch": 1.2, "learning_rate": 1.882580239650108e-05, "loss": 0.6767, "step": 37535 }, { "epoch": 1.2, "learning_rate": 1.882527716566765e-05, "loss": 0.6731, "step": 37540 }, { "epoch": 1.2, "learning_rate": 1.8824751824720086e-05, "loss": 0.6648, "step": 37545 }, { "epoch": 1.2, "learning_rate": 1.882422637366496e-05, "loss": 0.6685, "step": 37550 }, { "epoch": 1.2, "learning_rate": 1.882370081250881e-05, "loss": 0.6575, "step": 37555 }, { "epoch": 1.2, "learning_rate": 1.882317514125821e-05, "loss": 0.6764, "step": 37560 }, { "epoch": 1.2, "learning_rate": 1.8822649359919704e-05, "loss": 0.6693, "step": 37565 }, { "epoch": 1.2, "learning_rate": 1.8822123468499866e-05, "loss": 0.6562, "step": 37570 }, { "epoch": 1.2, "learning_rate": 1.8821597467005247e-05, "loss": 0.6586, "step": 37575 }, { "epoch": 1.2, "learning_rate": 1.8821071355442417e-05, "loss": 0.6643, "step": 37580 }, { "epoch": 1.2, "learning_rate": 1.8820545133817935e-05, "loss": 0.6618, "step": 37585 }, { "epoch": 1.2, "learning_rate": 1.882001880213837e-05, "loss": 0.6608, "step": 37590 }, { "epoch": 1.2, "learning_rate": 1.8819492360410286e-05, "loss": 0.6822, "step": 37595 }, { "epoch": 1.2, "learning_rate": 1.8818965808640255e-05, "loss": 0.6672, "step": 37600 }, { "epoch": 1.2, "learning_rate": 1.8818439146834845e-05, "loss": 0.6629, "step": 37605 }, { "epoch": 1.2, "learning_rate": 1.881791237500063e-05, "loss": 0.6637, "step": 37610 }, { "epoch": 1.2, "learning_rate": 1.881738549314418e-05, "loss": 0.6562, "step": 37615 }, { "epoch": 1.2, "learning_rate": 1.881685850127207e-05, "loss": 0.6621, "step": 37620 }, { "epoch": 1.2, "learning_rate": 1.881633139939087e-05, "loss": 0.6602, "step": 37625 }, { "epoch": 1.2, "learning_rate": 1.8815804187507166e-05, "loss": 0.6609, "step": 37630 }, { "epoch": 1.2, "learning_rate": 1.881527686562753e-05, "loss": 0.6623, "step": 37635 }, { "epoch": 1.2, "learning_rate": 1.8814749433758544e-05, "loss": 0.6662, "step": 37640 }, { "epoch": 1.2, "learning_rate": 1.8814221891906785e-05, "loss": 0.6606, "step": 37645 }, { "epoch": 1.2, "learning_rate": 1.881369424007884e-05, "loss": 0.6678, "step": 37650 }, { "epoch": 1.2, "learning_rate": 1.881316647828129e-05, "loss": 0.6612, "step": 37655 }, { "epoch": 1.21, "learning_rate": 1.881263860652072e-05, "loss": 0.677, "step": 37660 }, { "epoch": 1.21, "learning_rate": 1.881211062480372e-05, "loss": 0.6778, "step": 37665 }, { "epoch": 1.21, "learning_rate": 1.881158253313687e-05, "loss": 0.6561, "step": 37670 }, { "epoch": 1.21, "learning_rate": 1.881105433152677e-05, "loss": 0.6529, "step": 37675 }, { "epoch": 1.21, "learning_rate": 1.8810526019979996e-05, "loss": 0.6774, "step": 37680 }, { "epoch": 1.21, "learning_rate": 1.8809997598503153e-05, "loss": 0.6652, "step": 37685 }, { "epoch": 1.21, "learning_rate": 1.880946906710283e-05, "loss": 0.6537, "step": 37690 }, { "epoch": 1.21, "learning_rate": 1.880894042578562e-05, "loss": 0.6655, "step": 37695 }, { "epoch": 1.21, "learning_rate": 1.8808411674558114e-05, "loss": 0.6624, "step": 37700 }, { "epoch": 1.21, "learning_rate": 1.880788281342692e-05, "loss": 0.6592, "step": 37705 }, { "epoch": 1.21, "learning_rate": 1.880735384239863e-05, "loss": 0.6626, "step": 37710 }, { "epoch": 1.21, "learning_rate": 1.8806824761479845e-05, "loss": 0.6726, "step": 37715 }, { "epoch": 1.21, "learning_rate": 1.880629557067717e-05, "loss": 0.6786, "step": 37720 }, { "epoch": 1.21, "learning_rate": 1.8805766269997203e-05, "loss": 0.679, "step": 37725 }, { "epoch": 1.21, "learning_rate": 1.8805236859446546e-05, "loss": 0.6692, "step": 37730 }, { "epoch": 1.21, "learning_rate": 1.8804707339031814e-05, "loss": 0.6659, "step": 37735 }, { "epoch": 1.21, "learning_rate": 1.8804177708759605e-05, "loss": 0.6757, "step": 37740 }, { "epoch": 1.21, "learning_rate": 1.880364796863653e-05, "loss": 0.6506, "step": 37745 }, { "epoch": 1.21, "learning_rate": 1.8803118118669203e-05, "loss": 0.6731, "step": 37750 }, { "epoch": 1.21, "learning_rate": 1.880258815886423e-05, "loss": 0.6593, "step": 37755 }, { "epoch": 1.21, "learning_rate": 1.8802058089228222e-05, "loss": 0.6665, "step": 37760 }, { "epoch": 1.21, "learning_rate": 1.88015279097678e-05, "loss": 0.6677, "step": 37765 }, { "epoch": 1.21, "learning_rate": 1.880099762048957e-05, "loss": 0.6765, "step": 37770 }, { "epoch": 1.21, "learning_rate": 1.8800467221400156e-05, "loss": 0.6601, "step": 37775 }, { "epoch": 1.21, "learning_rate": 1.879993671250617e-05, "loss": 0.6703, "step": 37780 }, { "epoch": 1.21, "learning_rate": 1.8799406093814237e-05, "loss": 0.6605, "step": 37785 }, { "epoch": 1.21, "learning_rate": 1.8798875365330974e-05, "loss": 0.6661, "step": 37790 }, { "epoch": 1.21, "learning_rate": 1.8798344527063e-05, "loss": 0.6686, "step": 37795 }, { "epoch": 1.21, "learning_rate": 1.8797813579016948e-05, "loss": 0.6711, "step": 37800 }, { "epoch": 1.21, "learning_rate": 1.8797282521199428e-05, "loss": 0.6603, "step": 37805 }, { "epoch": 1.21, "learning_rate": 1.879675135361708e-05, "loss": 0.6635, "step": 37810 }, { "epoch": 1.21, "learning_rate": 1.879622007627653e-05, "loss": 0.6625, "step": 37815 }, { "epoch": 1.21, "learning_rate": 1.8795688689184398e-05, "loss": 0.6635, "step": 37820 }, { "epoch": 1.21, "learning_rate": 1.879515719234732e-05, "loss": 0.669, "step": 37825 }, { "epoch": 1.21, "learning_rate": 1.8794625585771926e-05, "loss": 0.6568, "step": 37830 }, { "epoch": 1.21, "learning_rate": 1.879409386946485e-05, "loss": 0.6544, "step": 37835 }, { "epoch": 1.21, "learning_rate": 1.8793562043432728e-05, "loss": 0.6511, "step": 37840 }, { "epoch": 1.21, "learning_rate": 1.879303010768219e-05, "loss": 0.6674, "step": 37845 }, { "epoch": 1.21, "learning_rate": 1.879249806221988e-05, "loss": 0.661, "step": 37850 }, { "epoch": 1.21, "learning_rate": 1.8791965907052435e-05, "loss": 0.6741, "step": 37855 }, { "epoch": 1.21, "learning_rate": 1.8791433642186487e-05, "loss": 0.6525, "step": 37860 }, { "epoch": 1.21, "learning_rate": 1.8790901267628685e-05, "loss": 0.6632, "step": 37865 }, { "epoch": 1.21, "learning_rate": 1.879036878338567e-05, "loss": 0.6603, "step": 37870 }, { "epoch": 1.21, "learning_rate": 1.878983618946409e-05, "loss": 0.6649, "step": 37875 }, { "epoch": 1.21, "learning_rate": 1.8789303485870575e-05, "loss": 0.6704, "step": 37880 }, { "epoch": 1.21, "learning_rate": 1.878877067261179e-05, "loss": 0.6616, "step": 37885 }, { "epoch": 1.21, "learning_rate": 1.8788237749694373e-05, "loss": 0.6682, "step": 37890 }, { "epoch": 1.21, "learning_rate": 1.8787704717124975e-05, "loss": 0.6628, "step": 37895 }, { "epoch": 1.21, "learning_rate": 1.878717157491025e-05, "loss": 0.6705, "step": 37900 }, { "epoch": 1.21, "learning_rate": 1.8786638323056846e-05, "loss": 0.6772, "step": 37905 }, { "epoch": 1.21, "learning_rate": 1.8786104961571413e-05, "loss": 0.6697, "step": 37910 }, { "epoch": 1.21, "learning_rate": 1.8785571490460617e-05, "loss": 0.655, "step": 37915 }, { "epoch": 1.21, "learning_rate": 1.8785037909731104e-05, "loss": 0.6614, "step": 37920 }, { "epoch": 1.21, "learning_rate": 1.878450421938954e-05, "loss": 0.6571, "step": 37925 }, { "epoch": 1.21, "learning_rate": 1.8783970419442573e-05, "loss": 0.6669, "step": 37930 }, { "epoch": 1.21, "learning_rate": 1.8783436509896872e-05, "loss": 0.6587, "step": 37935 }, { "epoch": 1.21, "learning_rate": 1.87829024907591e-05, "loss": 0.656, "step": 37940 }, { "epoch": 1.21, "learning_rate": 1.8782368362035913e-05, "loss": 0.6607, "step": 37945 }, { "epoch": 1.21, "learning_rate": 1.8781834123733977e-05, "loss": 0.6653, "step": 37950 }, { "epoch": 1.21, "learning_rate": 1.8781299775859964e-05, "loss": 0.6724, "step": 37955 }, { "epoch": 1.21, "learning_rate": 1.878076531842053e-05, "loss": 0.6677, "step": 37960 }, { "epoch": 1.21, "learning_rate": 1.8780230751422354e-05, "loss": 0.6579, "step": 37965 }, { "epoch": 1.22, "learning_rate": 1.8779696074872103e-05, "loss": 0.6601, "step": 37970 }, { "epoch": 1.22, "learning_rate": 1.8779161288776444e-05, "loss": 0.6643, "step": 37975 }, { "epoch": 1.22, "learning_rate": 1.8778626393142053e-05, "loss": 0.6705, "step": 37980 }, { "epoch": 1.22, "learning_rate": 1.877809138797561e-05, "loss": 0.6681, "step": 37985 }, { "epoch": 1.22, "learning_rate": 1.8777556273283774e-05, "loss": 0.6751, "step": 37990 }, { "epoch": 1.22, "learning_rate": 1.8777021049073237e-05, "loss": 0.6637, "step": 37995 }, { "epoch": 1.22, "learning_rate": 1.8776485715350672e-05, "loss": 0.6705, "step": 38000 }, { "epoch": 1.22, "learning_rate": 1.8775950272122756e-05, "loss": 0.6715, "step": 38005 }, { "epoch": 1.22, "learning_rate": 1.8775414719396173e-05, "loss": 0.6708, "step": 38010 }, { "epoch": 1.22, "learning_rate": 1.8774879057177605e-05, "loss": 0.6757, "step": 38015 }, { "epoch": 1.22, "learning_rate": 1.8774343285473734e-05, "loss": 0.6448, "step": 38020 }, { "epoch": 1.22, "learning_rate": 1.8773807404291244e-05, "loss": 0.6534, "step": 38025 }, { "epoch": 1.22, "learning_rate": 1.8773271413636826e-05, "loss": 0.6551, "step": 38030 }, { "epoch": 1.22, "learning_rate": 1.8772735313517163e-05, "loss": 0.6626, "step": 38035 }, { "epoch": 1.22, "learning_rate": 1.8772199103938946e-05, "loss": 0.6646, "step": 38040 }, { "epoch": 1.22, "learning_rate": 1.8771662784908865e-05, "loss": 0.6468, "step": 38045 }, { "epoch": 1.22, "learning_rate": 1.8771126356433607e-05, "loss": 0.6582, "step": 38050 }, { "epoch": 1.22, "learning_rate": 1.8770589818519873e-05, "loss": 0.6537, "step": 38055 }, { "epoch": 1.22, "learning_rate": 1.8770053171174357e-05, "loss": 0.6702, "step": 38060 }, { "epoch": 1.22, "learning_rate": 1.876951641440375e-05, "loss": 0.664, "step": 38065 }, { "epoch": 1.22, "learning_rate": 1.876897954821475e-05, "loss": 0.6487, "step": 38070 }, { "epoch": 1.22, "learning_rate": 1.8768442572614055e-05, "loss": 0.6801, "step": 38075 }, { "epoch": 1.22, "learning_rate": 1.8767905487608367e-05, "loss": 0.6588, "step": 38080 }, { "epoch": 1.22, "learning_rate": 1.876736829320439e-05, "loss": 0.6749, "step": 38085 }, { "epoch": 1.22, "learning_rate": 1.8766830989408818e-05, "loss": 0.6577, "step": 38090 }, { "epoch": 1.22, "learning_rate": 1.8766293576228363e-05, "loss": 0.6626, "step": 38095 }, { "epoch": 1.22, "learning_rate": 1.876575605366973e-05, "loss": 0.6783, "step": 38100 }, { "epoch": 1.22, "learning_rate": 1.8765218421739623e-05, "loss": 0.6616, "step": 38105 }, { "epoch": 1.22, "learning_rate": 1.8764680680444747e-05, "loss": 0.6707, "step": 38110 }, { "epoch": 1.22, "learning_rate": 1.876414282979182e-05, "loss": 0.6489, "step": 38115 }, { "epoch": 1.22, "learning_rate": 1.8763604869787544e-05, "loss": 0.6626, "step": 38120 }, { "epoch": 1.22, "learning_rate": 1.8763066800438638e-05, "loss": 0.6461, "step": 38125 }, { "epoch": 1.22, "learning_rate": 1.876252862175181e-05, "loss": 0.6674, "step": 38130 }, { "epoch": 1.22, "learning_rate": 1.876199033373378e-05, "loss": 0.6678, "step": 38135 }, { "epoch": 1.22, "learning_rate": 1.8761451936391263e-05, "loss": 0.657, "step": 38140 }, { "epoch": 1.22, "learning_rate": 1.8760913429730972e-05, "loss": 0.659, "step": 38145 }, { "epoch": 1.22, "learning_rate": 1.876037481375963e-05, "loss": 0.6634, "step": 38150 }, { "epoch": 1.22, "learning_rate": 1.875983608848396e-05, "loss": 0.6502, "step": 38155 }, { "epoch": 1.22, "learning_rate": 1.875929725391068e-05, "loss": 0.6657, "step": 38160 }, { "epoch": 1.22, "learning_rate": 1.8758758310046513e-05, "loss": 0.6815, "step": 38165 }, { "epoch": 1.22, "learning_rate": 1.875821925689818e-05, "loss": 0.6665, "step": 38170 }, { "epoch": 1.22, "learning_rate": 1.8757680094472417e-05, "loss": 0.655, "step": 38175 }, { "epoch": 1.22, "learning_rate": 1.8757140822775943e-05, "loss": 0.6588, "step": 38180 }, { "epoch": 1.22, "learning_rate": 1.875660144181549e-05, "loss": 0.6653, "step": 38185 }, { "epoch": 1.22, "learning_rate": 1.8756061951597787e-05, "loss": 0.6613, "step": 38190 }, { "epoch": 1.22, "learning_rate": 1.8755522352129564e-05, "loss": 0.6574, "step": 38195 }, { "epoch": 1.22, "learning_rate": 1.8754982643417553e-05, "loss": 0.661, "step": 38200 }, { "epoch": 1.22, "learning_rate": 1.8754442825468494e-05, "loss": 0.6584, "step": 38205 }, { "epoch": 1.22, "learning_rate": 1.8753902898289115e-05, "loss": 0.6501, "step": 38210 }, { "epoch": 1.22, "learning_rate": 1.8753362861886156e-05, "loss": 0.6593, "step": 38215 }, { "epoch": 1.22, "learning_rate": 1.8752822716266356e-05, "loss": 0.6586, "step": 38220 }, { "epoch": 1.22, "learning_rate": 1.8752282461436456e-05, "loss": 0.6653, "step": 38225 }, { "epoch": 1.22, "learning_rate": 1.875174209740319e-05, "loss": 0.662, "step": 38230 }, { "epoch": 1.22, "learning_rate": 1.8751201624173304e-05, "loss": 0.6799, "step": 38235 }, { "epoch": 1.22, "learning_rate": 1.8750661041753547e-05, "loss": 0.6633, "step": 38240 }, { "epoch": 1.22, "learning_rate": 1.8750120350150657e-05, "loss": 0.6674, "step": 38245 }, { "epoch": 1.22, "learning_rate": 1.874957954937138e-05, "loss": 0.6512, "step": 38250 }, { "epoch": 1.22, "learning_rate": 1.8749038639422465e-05, "loss": 0.6611, "step": 38255 }, { "epoch": 1.22, "learning_rate": 1.8748497620310668e-05, "loss": 0.6675, "step": 38260 }, { "epoch": 1.22, "learning_rate": 1.8747956492042724e-05, "loss": 0.6695, "step": 38265 }, { "epoch": 1.22, "learning_rate": 1.87474152546254e-05, "loss": 0.6564, "step": 38270 }, { "epoch": 1.22, "learning_rate": 1.8746873908065443e-05, "loss": 0.6539, "step": 38275 }, { "epoch": 1.22, "learning_rate": 1.874633245236961e-05, "loss": 0.6755, "step": 38280 }, { "epoch": 1.23, "learning_rate": 1.874579088754465e-05, "loss": 0.6609, "step": 38285 }, { "epoch": 1.23, "learning_rate": 1.8745249213597324e-05, "loss": 0.6671, "step": 38290 }, { "epoch": 1.23, "learning_rate": 1.8744707430534395e-05, "loss": 0.6662, "step": 38295 }, { "epoch": 1.23, "learning_rate": 1.8744165538362615e-05, "loss": 0.6609, "step": 38300 }, { "epoch": 1.23, "learning_rate": 1.874362353708875e-05, "loss": 0.6586, "step": 38305 }, { "epoch": 1.23, "learning_rate": 1.8743081426719564e-05, "loss": 0.6593, "step": 38310 }, { "epoch": 1.23, "learning_rate": 1.8742539207261815e-05, "loss": 0.6502, "step": 38315 }, { "epoch": 1.23, "learning_rate": 1.8741996878722276e-05, "loss": 0.669, "step": 38320 }, { "epoch": 1.23, "learning_rate": 1.874145444110771e-05, "loss": 0.6654, "step": 38325 }, { "epoch": 1.23, "learning_rate": 1.8740911894424883e-05, "loss": 0.683, "step": 38330 }, { "epoch": 1.23, "learning_rate": 1.8740369238680565e-05, "loss": 0.6623, "step": 38335 }, { "epoch": 1.23, "learning_rate": 1.873982647388153e-05, "loss": 0.6614, "step": 38340 }, { "epoch": 1.23, "learning_rate": 1.873928360003455e-05, "loss": 0.6567, "step": 38345 }, { "epoch": 1.23, "learning_rate": 1.8738740617146396e-05, "loss": 0.6691, "step": 38350 }, { "epoch": 1.23, "learning_rate": 1.873819752522384e-05, "loss": 0.6663, "step": 38355 }, { "epoch": 1.23, "learning_rate": 1.8737654324273668e-05, "loss": 0.6589, "step": 38360 }, { "epoch": 1.23, "learning_rate": 1.8737111014302643e-05, "loss": 0.652, "step": 38365 }, { "epoch": 1.23, "learning_rate": 1.873656759531756e-05, "loss": 0.6556, "step": 38370 }, { "epoch": 1.23, "learning_rate": 1.8736024067325188e-05, "loss": 0.6596, "step": 38375 }, { "epoch": 1.23, "learning_rate": 1.8735480430332313e-05, "loss": 0.6643, "step": 38380 }, { "epoch": 1.23, "learning_rate": 1.873493668434572e-05, "loss": 0.6706, "step": 38385 }, { "epoch": 1.23, "learning_rate": 1.8734392829372188e-05, "loss": 0.6728, "step": 38390 }, { "epoch": 1.23, "learning_rate": 1.8733848865418504e-05, "loss": 0.6574, "step": 38395 }, { "epoch": 1.23, "learning_rate": 1.873330479249146e-05, "loss": 0.67, "step": 38400 }, { "epoch": 1.23, "learning_rate": 1.873276061059784e-05, "loss": 0.6684, "step": 38405 }, { "epoch": 1.23, "learning_rate": 1.8732216319744435e-05, "loss": 0.6602, "step": 38410 }, { "epoch": 1.23, "learning_rate": 1.8731671919938038e-05, "loss": 0.6575, "step": 38415 }, { "epoch": 1.23, "learning_rate": 1.8731127411185434e-05, "loss": 0.6593, "step": 38420 }, { "epoch": 1.23, "learning_rate": 1.873058279349343e-05, "loss": 0.6599, "step": 38425 }, { "epoch": 1.23, "learning_rate": 1.873003806686881e-05, "loss": 0.6704, "step": 38430 }, { "epoch": 1.23, "learning_rate": 1.872949323131837e-05, "loss": 0.6604, "step": 38435 }, { "epoch": 1.23, "learning_rate": 1.872894828684892e-05, "loss": 0.6627, "step": 38440 }, { "epoch": 1.23, "learning_rate": 1.8728403233467247e-05, "loss": 0.6615, "step": 38445 }, { "epoch": 1.23, "learning_rate": 1.8727858071180162e-05, "loss": 0.6539, "step": 38450 }, { "epoch": 1.23, "learning_rate": 1.8727312799994455e-05, "loss": 0.6499, "step": 38455 }, { "epoch": 1.23, "learning_rate": 1.872676741991694e-05, "loss": 0.6606, "step": 38460 }, { "epoch": 1.23, "learning_rate": 1.8726221930954418e-05, "loss": 0.6542, "step": 38465 }, { "epoch": 1.23, "learning_rate": 1.8725676333113694e-05, "loss": 0.6725, "step": 38470 }, { "epoch": 1.23, "learning_rate": 1.8725130626401573e-05, "loss": 0.6561, "step": 38475 }, { "epoch": 1.23, "learning_rate": 1.8724584810824874e-05, "loss": 0.65, "step": 38480 }, { "epoch": 1.23, "learning_rate": 1.8724038886390394e-05, "loss": 0.6603, "step": 38485 }, { "epoch": 1.23, "learning_rate": 1.8723492853104956e-05, "loss": 0.658, "step": 38490 }, { "epoch": 1.23, "learning_rate": 1.8722946710975365e-05, "loss": 0.6573, "step": 38495 }, { "epoch": 1.23, "learning_rate": 1.8722400460008437e-05, "loss": 0.658, "step": 38500 }, { "epoch": 1.23, "learning_rate": 1.8721854100210993e-05, "loss": 0.6656, "step": 38505 }, { "epoch": 1.23, "learning_rate": 1.8721307631589845e-05, "loss": 0.6667, "step": 38510 }, { "epoch": 1.23, "learning_rate": 1.872076105415181e-05, "loss": 0.6706, "step": 38515 }, { "epoch": 1.23, "learning_rate": 1.872021436790371e-05, "loss": 0.6648, "step": 38520 }, { "epoch": 1.23, "learning_rate": 1.8719667572852366e-05, "loss": 0.6553, "step": 38525 }, { "epoch": 1.23, "learning_rate": 1.8719120669004606e-05, "loss": 0.6681, "step": 38530 }, { "epoch": 1.23, "learning_rate": 1.871857365636724e-05, "loss": 0.6592, "step": 38535 }, { "epoch": 1.23, "learning_rate": 1.8718026534947107e-05, "loss": 0.663, "step": 38540 }, { "epoch": 1.23, "learning_rate": 1.8717479304751024e-05, "loss": 0.6634, "step": 38545 }, { "epoch": 1.23, "learning_rate": 1.8716931965785826e-05, "loss": 0.6615, "step": 38550 }, { "epoch": 1.23, "learning_rate": 1.871638451805834e-05, "loss": 0.6674, "step": 38555 }, { "epoch": 1.23, "learning_rate": 1.871583696157539e-05, "loss": 0.6662, "step": 38560 }, { "epoch": 1.23, "learning_rate": 1.8715289296343818e-05, "loss": 0.6581, "step": 38565 }, { "epoch": 1.23, "learning_rate": 1.8714741522370454e-05, "loss": 0.6572, "step": 38570 }, { "epoch": 1.23, "learning_rate": 1.871419363966213e-05, "loss": 0.6762, "step": 38575 }, { "epoch": 1.23, "learning_rate": 1.871364564822568e-05, "loss": 0.6665, "step": 38580 }, { "epoch": 1.23, "learning_rate": 1.871309754806795e-05, "loss": 0.6583, "step": 38585 }, { "epoch": 1.23, "learning_rate": 1.871254933919577e-05, "loss": 0.6664, "step": 38590 }, { "epoch": 1.24, "learning_rate": 1.8712001021615985e-05, "loss": 0.6658, "step": 38595 }, { "epoch": 1.24, "learning_rate": 1.8711452595335434e-05, "loss": 0.6658, "step": 38600 }, { "epoch": 1.24, "learning_rate": 1.8710904060360965e-05, "loss": 0.6618, "step": 38605 }, { "epoch": 1.24, "learning_rate": 1.8710355416699413e-05, "loss": 0.6688, "step": 38610 }, { "epoch": 1.24, "learning_rate": 1.870980666435763e-05, "loss": 0.656, "step": 38615 }, { "epoch": 1.24, "learning_rate": 1.870925780334246e-05, "loss": 0.6697, "step": 38620 }, { "epoch": 1.24, "learning_rate": 1.8708708833660755e-05, "loss": 0.6767, "step": 38625 }, { "epoch": 1.24, "learning_rate": 1.8708159755319363e-05, "loss": 0.6726, "step": 38630 }, { "epoch": 1.24, "learning_rate": 1.870761056832513e-05, "loss": 0.6723, "step": 38635 }, { "epoch": 1.24, "learning_rate": 1.8707061272684916e-05, "loss": 0.6682, "step": 38640 }, { "epoch": 1.24, "learning_rate": 1.870651186840557e-05, "loss": 0.6649, "step": 38645 }, { "epoch": 1.24, "learning_rate": 1.8705962355493944e-05, "loss": 0.6705, "step": 38650 }, { "epoch": 1.24, "learning_rate": 1.8705412733956903e-05, "loss": 0.674, "step": 38655 }, { "epoch": 1.24, "learning_rate": 1.8704863003801297e-05, "loss": 0.6608, "step": 38660 }, { "epoch": 1.24, "learning_rate": 1.870431316503399e-05, "loss": 0.6588, "step": 38665 }, { "epoch": 1.24, "learning_rate": 1.870376321766184e-05, "loss": 0.6604, "step": 38670 }, { "epoch": 1.24, "learning_rate": 1.8703213161691708e-05, "loss": 0.6571, "step": 38675 }, { "epoch": 1.24, "learning_rate": 1.870266299713046e-05, "loss": 0.6698, "step": 38680 }, { "epoch": 1.24, "learning_rate": 1.8702112723984957e-05, "loss": 0.6684, "step": 38685 }, { "epoch": 1.24, "learning_rate": 1.870156234226207e-05, "loss": 0.6546, "step": 38690 }, { "epoch": 1.24, "learning_rate": 1.870101185196866e-05, "loss": 0.6501, "step": 38695 }, { "epoch": 1.24, "learning_rate": 1.87004612531116e-05, "loss": 0.6636, "step": 38700 }, { "epoch": 1.24, "learning_rate": 1.869991054569776e-05, "loss": 0.6561, "step": 38705 }, { "epoch": 1.24, "learning_rate": 1.8699359729734002e-05, "loss": 0.6627, "step": 38710 }, { "epoch": 1.24, "learning_rate": 1.8698808805227212e-05, "loss": 0.6626, "step": 38715 }, { "epoch": 1.24, "learning_rate": 1.8698257772184253e-05, "loss": 0.6612, "step": 38720 }, { "epoch": 1.24, "learning_rate": 1.8697706630612013e-05, "loss": 0.6603, "step": 38725 }, { "epoch": 1.24, "learning_rate": 1.8697155380517356e-05, "loss": 0.6589, "step": 38730 }, { "epoch": 1.24, "learning_rate": 1.8696604021907166e-05, "loss": 0.6737, "step": 38735 }, { "epoch": 1.24, "learning_rate": 1.869605255478832e-05, "loss": 0.6523, "step": 38740 }, { "epoch": 1.24, "learning_rate": 1.8695500979167703e-05, "loss": 0.6549, "step": 38745 }, { "epoch": 1.24, "learning_rate": 1.869494929505219e-05, "loss": 0.6604, "step": 38750 }, { "epoch": 1.24, "learning_rate": 1.8694397502448672e-05, "loss": 0.6584, "step": 38755 }, { "epoch": 1.24, "learning_rate": 1.869384560136403e-05, "loss": 0.666, "step": 38760 }, { "epoch": 1.24, "learning_rate": 1.869329359180515e-05, "loss": 0.6549, "step": 38765 }, { "epoch": 1.24, "learning_rate": 1.869274147377892e-05, "loss": 0.6607, "step": 38770 }, { "epoch": 1.24, "learning_rate": 1.869218924729223e-05, "loss": 0.6671, "step": 38775 }, { "epoch": 1.24, "learning_rate": 1.869163691235197e-05, "loss": 0.6665, "step": 38780 }, { "epoch": 1.24, "learning_rate": 1.8691084468965027e-05, "loss": 0.6458, "step": 38785 }, { "epoch": 1.24, "learning_rate": 1.8690531917138298e-05, "loss": 0.672, "step": 38790 }, { "epoch": 1.24, "learning_rate": 1.868997925687868e-05, "loss": 0.6534, "step": 38795 }, { "epoch": 1.24, "learning_rate": 1.8689426488193066e-05, "loss": 0.6583, "step": 38800 }, { "epoch": 1.24, "learning_rate": 1.8688873611088348e-05, "loss": 0.6562, "step": 38805 }, { "epoch": 1.24, "learning_rate": 1.8688320625571433e-05, "loss": 0.6566, "step": 38810 }, { "epoch": 1.24, "learning_rate": 1.8687767531649212e-05, "loss": 0.6646, "step": 38815 }, { "epoch": 1.24, "learning_rate": 1.8687214329328593e-05, "loss": 0.6717, "step": 38820 }, { "epoch": 1.24, "learning_rate": 1.8686661018616478e-05, "loss": 0.6579, "step": 38825 }, { "epoch": 1.24, "learning_rate": 1.8686107599519766e-05, "loss": 0.6565, "step": 38830 }, { "epoch": 1.24, "learning_rate": 1.8685554072045367e-05, "loss": 0.665, "step": 38835 }, { "epoch": 1.24, "learning_rate": 1.868500043620018e-05, "loss": 0.6673, "step": 38840 }, { "epoch": 1.24, "learning_rate": 1.868444669199112e-05, "loss": 0.6566, "step": 38845 }, { "epoch": 1.24, "learning_rate": 1.8683892839425098e-05, "loss": 0.6648, "step": 38850 }, { "epoch": 1.24, "learning_rate": 1.8683338878509015e-05, "loss": 0.6606, "step": 38855 }, { "epoch": 1.24, "learning_rate": 1.8682784809249792e-05, "loss": 0.6537, "step": 38860 }, { "epoch": 1.24, "learning_rate": 1.8682230631654333e-05, "loss": 0.658, "step": 38865 }, { "epoch": 1.24, "learning_rate": 1.8681676345729564e-05, "loss": 0.6636, "step": 38870 }, { "epoch": 1.24, "learning_rate": 1.8681121951482397e-05, "loss": 0.674, "step": 38875 }, { "epoch": 1.24, "learning_rate": 1.868056744891974e-05, "loss": 0.654, "step": 38880 }, { "epoch": 1.24, "learning_rate": 1.8680012838048523e-05, "loss": 0.6515, "step": 38885 }, { "epoch": 1.24, "learning_rate": 1.8679458118875658e-05, "loss": 0.6698, "step": 38890 }, { "epoch": 1.24, "learning_rate": 1.8678903291408075e-05, "loss": 0.6554, "step": 38895 }, { "epoch": 1.24, "learning_rate": 1.867834835565269e-05, "loss": 0.6552, "step": 38900 }, { "epoch": 1.24, "learning_rate": 1.867779331161643e-05, "loss": 0.6598, "step": 38905 }, { "epoch": 1.25, "learning_rate": 1.867723815930621e-05, "loss": 0.6534, "step": 38910 }, { "epoch": 1.25, "learning_rate": 1.867668289872898e-05, "loss": 0.6705, "step": 38915 }, { "epoch": 1.25, "learning_rate": 1.8676127529891645e-05, "loss": 0.6722, "step": 38920 }, { "epoch": 1.25, "learning_rate": 1.8675572052801145e-05, "loss": 0.6598, "step": 38925 }, { "epoch": 1.25, "learning_rate": 1.867501646746441e-05, "loss": 0.6549, "step": 38930 }, { "epoch": 1.25, "learning_rate": 1.867446077388837e-05, "loss": 0.6567, "step": 38935 }, { "epoch": 1.25, "learning_rate": 1.8673904972079956e-05, "loss": 0.6601, "step": 38940 }, { "epoch": 1.25, "learning_rate": 1.8673349062046112e-05, "loss": 0.6528, "step": 38945 }, { "epoch": 1.25, "learning_rate": 1.8672793043793768e-05, "loss": 0.6718, "step": 38950 }, { "epoch": 1.25, "learning_rate": 1.8672236917329857e-05, "loss": 0.6638, "step": 38955 }, { "epoch": 1.25, "learning_rate": 1.867168068266133e-05, "loss": 0.6547, "step": 38960 }, { "epoch": 1.25, "learning_rate": 1.8671124339795118e-05, "loss": 0.6668, "step": 38965 }, { "epoch": 1.25, "learning_rate": 1.867056788873816e-05, "loss": 0.6615, "step": 38970 }, { "epoch": 1.25, "learning_rate": 1.8670011329497408e-05, "loss": 0.6676, "step": 38975 }, { "epoch": 1.25, "learning_rate": 1.8669454662079802e-05, "loss": 0.6562, "step": 38980 }, { "epoch": 1.25, "learning_rate": 1.8668897886492284e-05, "loss": 0.6605, "step": 38985 }, { "epoch": 1.25, "learning_rate": 1.866834100274181e-05, "loss": 0.6505, "step": 38990 }, { "epoch": 1.25, "learning_rate": 1.866778401083532e-05, "loss": 0.6608, "step": 38995 }, { "epoch": 1.25, "learning_rate": 1.8667226910779767e-05, "loss": 0.6595, "step": 39000 }, { "epoch": 1.25, "learning_rate": 1.8666669702582097e-05, "loss": 0.6536, "step": 39005 }, { "epoch": 1.25, "learning_rate": 1.866611238624927e-05, "loss": 0.6632, "step": 39010 }, { "epoch": 1.25, "learning_rate": 1.8665554961788236e-05, "loss": 0.6641, "step": 39015 }, { "epoch": 1.25, "learning_rate": 1.866499742920595e-05, "loss": 0.6623, "step": 39020 }, { "epoch": 1.25, "learning_rate": 1.866443978850937e-05, "loss": 0.6665, "step": 39025 }, { "epoch": 1.25, "learning_rate": 1.8663882039705456e-05, "loss": 0.6619, "step": 39030 }, { "epoch": 1.25, "learning_rate": 1.866332418280116e-05, "loss": 0.6472, "step": 39035 }, { "epoch": 1.25, "learning_rate": 1.8662766217803447e-05, "loss": 0.6646, "step": 39040 }, { "epoch": 1.25, "learning_rate": 1.8662208144719276e-05, "loss": 0.6627, "step": 39045 }, { "epoch": 1.25, "learning_rate": 1.8661649963555616e-05, "loss": 0.6633, "step": 39050 }, { "epoch": 1.25, "learning_rate": 1.8661091674319425e-05, "loss": 0.661, "step": 39055 }, { "epoch": 1.25, "learning_rate": 1.8660533277017672e-05, "loss": 0.6558, "step": 39060 }, { "epoch": 1.25, "learning_rate": 1.8659974771657325e-05, "loss": 0.6563, "step": 39065 }, { "epoch": 1.25, "learning_rate": 1.8659416158245348e-05, "loss": 0.6509, "step": 39070 }, { "epoch": 1.25, "learning_rate": 1.865885743678872e-05, "loss": 0.6507, "step": 39075 }, { "epoch": 1.25, "learning_rate": 1.8658298607294402e-05, "loss": 0.6634, "step": 39080 }, { "epoch": 1.25, "learning_rate": 1.865773966976937e-05, "loss": 0.6622, "step": 39085 }, { "epoch": 1.25, "learning_rate": 1.8657180624220602e-05, "loss": 0.6491, "step": 39090 }, { "epoch": 1.25, "learning_rate": 1.865662147065507e-05, "loss": 0.6735, "step": 39095 }, { "epoch": 1.25, "learning_rate": 1.865606220907975e-05, "loss": 0.6561, "step": 39100 }, { "epoch": 1.25, "learning_rate": 1.865550283950162e-05, "loss": 0.6685, "step": 39105 }, { "epoch": 1.25, "learning_rate": 1.8654943361927662e-05, "loss": 0.6717, "step": 39110 }, { "epoch": 1.25, "learning_rate": 1.8654383776364855e-05, "loss": 0.6594, "step": 39115 }, { "epoch": 1.25, "learning_rate": 1.865382408282018e-05, "loss": 0.658, "step": 39120 }, { "epoch": 1.25, "learning_rate": 1.8653264281300622e-05, "loss": 0.6647, "step": 39125 }, { "epoch": 1.25, "learning_rate": 1.8652704371813165e-05, "loss": 0.6614, "step": 39130 }, { "epoch": 1.25, "learning_rate": 1.8652144354364793e-05, "loss": 0.6768, "step": 39135 }, { "epoch": 1.25, "learning_rate": 1.8651584228962495e-05, "loss": 0.6687, "step": 39140 }, { "epoch": 1.25, "learning_rate": 1.865102399561326e-05, "loss": 0.661, "step": 39145 }, { "epoch": 1.25, "learning_rate": 1.865046365432408e-05, "loss": 0.6569, "step": 39150 }, { "epoch": 1.25, "learning_rate": 1.8649903205101948e-05, "loss": 0.6555, "step": 39155 }, { "epoch": 1.25, "learning_rate": 1.864934264795385e-05, "loss": 0.6501, "step": 39160 }, { "epoch": 1.25, "learning_rate": 1.8648781982886784e-05, "loss": 0.659, "step": 39165 }, { "epoch": 1.25, "learning_rate": 1.8648221209907744e-05, "loss": 0.6599, "step": 39170 }, { "epoch": 1.25, "learning_rate": 1.864766032902373e-05, "loss": 0.6573, "step": 39175 }, { "epoch": 1.25, "learning_rate": 1.8647099340241738e-05, "loss": 0.6638, "step": 39180 }, { "epoch": 1.25, "learning_rate": 1.8646538243568765e-05, "loss": 0.6531, "step": 39185 }, { "epoch": 1.25, "learning_rate": 1.8645977039011818e-05, "loss": 0.6683, "step": 39190 }, { "epoch": 1.25, "learning_rate": 1.8645415726577893e-05, "loss": 0.655, "step": 39195 }, { "epoch": 1.25, "learning_rate": 1.8644854306273997e-05, "loss": 0.6621, "step": 39200 }, { "epoch": 1.25, "learning_rate": 1.8644292778107137e-05, "loss": 0.6662, "step": 39205 }, { "epoch": 1.25, "learning_rate": 1.8643731142084312e-05, "loss": 0.6621, "step": 39210 }, { "epoch": 1.25, "learning_rate": 1.864316939821254e-05, "loss": 0.6528, "step": 39215 }, { "epoch": 1.26, "learning_rate": 1.864260754649882e-05, "loss": 0.6424, "step": 39220 }, { "epoch": 1.26, "learning_rate": 1.8642045586950165e-05, "loss": 0.6567, "step": 39225 }, { "epoch": 1.26, "learning_rate": 1.8641483519573592e-05, "loss": 0.6485, "step": 39230 }, { "epoch": 1.26, "learning_rate": 1.864092134437611e-05, "loss": 0.6682, "step": 39235 }, { "epoch": 1.26, "learning_rate": 1.864035906136473e-05, "loss": 0.662, "step": 39240 }, { "epoch": 1.26, "learning_rate": 1.8639796670546473e-05, "loss": 0.6639, "step": 39245 }, { "epoch": 1.26, "learning_rate": 1.8639234171928355e-05, "loss": 0.6642, "step": 39250 }, { "epoch": 1.26, "learning_rate": 1.8638671565517392e-05, "loss": 0.6725, "step": 39255 }, { "epoch": 1.26, "learning_rate": 1.8638108851320607e-05, "loss": 0.6624, "step": 39260 }, { "epoch": 1.26, "learning_rate": 1.8637546029345018e-05, "loss": 0.6687, "step": 39265 }, { "epoch": 1.26, "learning_rate": 1.8636983099597646e-05, "loss": 0.6756, "step": 39270 }, { "epoch": 1.26, "learning_rate": 1.863642006208552e-05, "loss": 0.6533, "step": 39275 }, { "epoch": 1.26, "learning_rate": 1.8635856916815664e-05, "loss": 0.668, "step": 39280 }, { "epoch": 1.26, "learning_rate": 1.86352936637951e-05, "loss": 0.6633, "step": 39285 }, { "epoch": 1.26, "learning_rate": 1.863473030303086e-05, "loss": 0.6741, "step": 39290 }, { "epoch": 1.26, "learning_rate": 1.863416683452997e-05, "loss": 0.6575, "step": 39295 }, { "epoch": 1.26, "learning_rate": 1.8633603258299464e-05, "loss": 0.6607, "step": 39300 }, { "epoch": 1.26, "learning_rate": 1.8633039574346373e-05, "loss": 0.6596, "step": 39305 }, { "epoch": 1.26, "learning_rate": 1.863247578267773e-05, "loss": 0.6662, "step": 39310 }, { "epoch": 1.26, "learning_rate": 1.8631911883300564e-05, "loss": 0.6689, "step": 39315 }, { "epoch": 1.26, "learning_rate": 1.863134787622192e-05, "loss": 0.6582, "step": 39320 }, { "epoch": 1.26, "learning_rate": 1.8630783761448828e-05, "loss": 0.6562, "step": 39325 }, { "epoch": 1.26, "learning_rate": 1.8630219538988334e-05, "loss": 0.6632, "step": 39330 }, { "epoch": 1.26, "learning_rate": 1.8629655208847465e-05, "loss": 0.6636, "step": 39335 }, { "epoch": 1.26, "learning_rate": 1.8629090771033275e-05, "loss": 0.6609, "step": 39340 }, { "epoch": 1.26, "learning_rate": 1.8628526225552806e-05, "loss": 0.6636, "step": 39345 }, { "epoch": 1.26, "learning_rate": 1.8627961572413094e-05, "loss": 0.6714, "step": 39350 }, { "epoch": 1.26, "learning_rate": 1.862739681162119e-05, "loss": 0.6574, "step": 39355 }, { "epoch": 1.26, "learning_rate": 1.862683194318413e-05, "loss": 0.6606, "step": 39360 }, { "epoch": 1.26, "learning_rate": 1.862626696710898e-05, "loss": 0.6605, "step": 39365 }, { "epoch": 1.26, "learning_rate": 1.8625701883402776e-05, "loss": 0.6633, "step": 39370 }, { "epoch": 1.26, "learning_rate": 1.8625136692072577e-05, "loss": 0.6419, "step": 39375 }, { "epoch": 1.26, "learning_rate": 1.8624571393125425e-05, "loss": 0.664, "step": 39380 }, { "epoch": 1.26, "learning_rate": 1.8624005986568385e-05, "loss": 0.6578, "step": 39385 }, { "epoch": 1.26, "learning_rate": 1.8623440472408497e-05, "loss": 0.6477, "step": 39390 }, { "epoch": 1.26, "learning_rate": 1.8622874850652834e-05, "loss": 0.6674, "step": 39395 }, { "epoch": 1.26, "learning_rate": 1.862230912130844e-05, "loss": 0.6561, "step": 39400 }, { "epoch": 1.26, "learning_rate": 1.862174328438238e-05, "loss": 0.6549, "step": 39405 }, { "epoch": 1.26, "learning_rate": 1.8621177339881712e-05, "loss": 0.6442, "step": 39410 }, { "epoch": 1.26, "learning_rate": 1.86206112878135e-05, "loss": 0.6687, "step": 39415 }, { "epoch": 1.26, "learning_rate": 1.86200451281848e-05, "loss": 0.6558, "step": 39420 }, { "epoch": 1.26, "learning_rate": 1.8619478861002682e-05, "loss": 0.6692, "step": 39425 }, { "epoch": 1.26, "learning_rate": 1.8618912486274214e-05, "loss": 0.6553, "step": 39430 }, { "epoch": 1.26, "learning_rate": 1.8618346004006456e-05, "loss": 0.6594, "step": 39435 }, { "epoch": 1.26, "learning_rate": 1.861777941420648e-05, "loss": 0.6524, "step": 39440 }, { "epoch": 1.26, "learning_rate": 1.861721271688135e-05, "loss": 0.663, "step": 39445 }, { "epoch": 1.26, "learning_rate": 1.8616645912038146e-05, "loss": 0.6586, "step": 39450 }, { "epoch": 1.26, "learning_rate": 1.861607899968393e-05, "loss": 0.6665, "step": 39455 }, { "epoch": 1.26, "learning_rate": 1.8615511979825784e-05, "loss": 0.6594, "step": 39460 }, { "epoch": 1.26, "learning_rate": 1.861494485247078e-05, "loss": 0.6615, "step": 39465 }, { "epoch": 1.26, "learning_rate": 1.8614377617625993e-05, "loss": 0.6606, "step": 39470 }, { "epoch": 1.26, "learning_rate": 1.86138102752985e-05, "loss": 0.6627, "step": 39475 }, { "epoch": 1.26, "learning_rate": 1.861324282549538e-05, "loss": 0.6571, "step": 39480 }, { "epoch": 1.26, "learning_rate": 1.8612675268223717e-05, "loss": 0.6481, "step": 39485 }, { "epoch": 1.26, "learning_rate": 1.861210760349059e-05, "loss": 0.6571, "step": 39490 }, { "epoch": 1.26, "learning_rate": 1.8611539831303074e-05, "loss": 0.6564, "step": 39495 }, { "epoch": 1.26, "learning_rate": 1.8610971951668265e-05, "loss": 0.654, "step": 39500 }, { "epoch": 1.26, "learning_rate": 1.861040396459324e-05, "loss": 0.6607, "step": 39505 }, { "epoch": 1.26, "learning_rate": 1.8609835870085096e-05, "loss": 0.6527, "step": 39510 }, { "epoch": 1.26, "learning_rate": 1.8609267668150913e-05, "loss": 0.6537, "step": 39515 }, { "epoch": 1.26, "learning_rate": 1.860869935879778e-05, "loss": 0.6512, "step": 39520 }, { "epoch": 1.26, "learning_rate": 1.8608130942032792e-05, "loss": 0.6716, "step": 39525 }, { "epoch": 1.26, "learning_rate": 1.8607562417863038e-05, "loss": 0.6491, "step": 39530 }, { "epoch": 1.27, "learning_rate": 1.8606993786295614e-05, "loss": 0.6617, "step": 39535 }, { "epoch": 1.27, "learning_rate": 1.8606425047337616e-05, "loss": 0.6587, "step": 39540 }, { "epoch": 1.27, "learning_rate": 1.8605856200996135e-05, "loss": 0.6489, "step": 39545 }, { "epoch": 1.27, "learning_rate": 1.8605287247278273e-05, "loss": 0.665, "step": 39550 }, { "epoch": 1.27, "learning_rate": 1.8604718186191128e-05, "loss": 0.6683, "step": 39555 }, { "epoch": 1.27, "learning_rate": 1.86041490177418e-05, "loss": 0.6449, "step": 39560 }, { "epoch": 1.27, "learning_rate": 1.8603579741937387e-05, "loss": 0.6628, "step": 39565 }, { "epoch": 1.27, "learning_rate": 1.8603010358785e-05, "loss": 0.6584, "step": 39570 }, { "epoch": 1.27, "learning_rate": 1.8602440868291736e-05, "loss": 0.6451, "step": 39575 }, { "epoch": 1.27, "learning_rate": 1.8601871270464708e-05, "loss": 0.6539, "step": 39580 }, { "epoch": 1.27, "learning_rate": 1.8601301565311012e-05, "loss": 0.668, "step": 39585 }, { "epoch": 1.27, "learning_rate": 1.8600731752837765e-05, "loss": 0.6609, "step": 39590 }, { "epoch": 1.27, "learning_rate": 1.8600161833052074e-05, "loss": 0.6563, "step": 39595 }, { "epoch": 1.27, "learning_rate": 1.8599591805961047e-05, "loss": 0.6634, "step": 39600 }, { "epoch": 1.27, "learning_rate": 1.8599021671571804e-05, "loss": 0.66, "step": 39605 }, { "epoch": 1.27, "learning_rate": 1.8598451429891455e-05, "loss": 0.6632, "step": 39610 }, { "epoch": 1.27, "learning_rate": 1.8597881080927108e-05, "loss": 0.6682, "step": 39615 }, { "epoch": 1.27, "learning_rate": 1.859731062468589e-05, "loss": 0.642, "step": 39620 }, { "epoch": 1.27, "learning_rate": 1.8596740061174912e-05, "loss": 0.6611, "step": 39625 }, { "epoch": 1.27, "learning_rate": 1.85961693904013e-05, "loss": 0.6604, "step": 39630 }, { "epoch": 1.27, "learning_rate": 1.8595598612372162e-05, "loss": 0.6409, "step": 39635 }, { "epoch": 1.27, "learning_rate": 1.8595027727094628e-05, "loss": 0.6629, "step": 39640 }, { "epoch": 1.27, "learning_rate": 1.8594456734575824e-05, "loss": 0.6534, "step": 39645 }, { "epoch": 1.27, "learning_rate": 1.8593885634822866e-05, "loss": 0.6495, "step": 39650 }, { "epoch": 1.27, "learning_rate": 1.8593314427842886e-05, "loss": 0.657, "step": 39655 }, { "epoch": 1.27, "learning_rate": 1.859274311364301e-05, "loss": 0.6561, "step": 39660 }, { "epoch": 1.27, "learning_rate": 1.8592171692230367e-05, "loss": 0.6553, "step": 39665 }, { "epoch": 1.27, "learning_rate": 1.859160016361208e-05, "loss": 0.6748, "step": 39670 }, { "epoch": 1.27, "learning_rate": 1.8591028527795288e-05, "loss": 0.658, "step": 39675 }, { "epoch": 1.27, "learning_rate": 1.8590456784787122e-05, "loss": 0.6571, "step": 39680 }, { "epoch": 1.27, "learning_rate": 1.8589884934594713e-05, "loss": 0.6661, "step": 39685 }, { "epoch": 1.27, "learning_rate": 1.8589312977225196e-05, "loss": 0.6674, "step": 39690 }, { "epoch": 1.27, "learning_rate": 1.858874091268571e-05, "loss": 0.6682, "step": 39695 }, { "epoch": 1.27, "learning_rate": 1.858816874098339e-05, "loss": 0.6663, "step": 39700 }, { "epoch": 1.27, "learning_rate": 1.8587596462125378e-05, "loss": 0.66, "step": 39705 }, { "epoch": 1.27, "learning_rate": 1.8587024076118808e-05, "loss": 0.6686, "step": 39710 }, { "epoch": 1.27, "learning_rate": 1.8586451582970834e-05, "loss": 0.6664, "step": 39715 }, { "epoch": 1.27, "learning_rate": 1.8585878982688588e-05, "loss": 0.6614, "step": 39720 }, { "epoch": 1.27, "learning_rate": 1.858530627527922e-05, "loss": 0.6523, "step": 39725 }, { "epoch": 1.27, "learning_rate": 1.8584733460749872e-05, "loss": 0.658, "step": 39730 }, { "epoch": 1.27, "learning_rate": 1.8584160539107693e-05, "loss": 0.6575, "step": 39735 }, { "epoch": 1.27, "learning_rate": 1.858358751035983e-05, "loss": 0.6556, "step": 39740 }, { "epoch": 1.27, "learning_rate": 1.858301437451344e-05, "loss": 0.6525, "step": 39745 }, { "epoch": 1.27, "learning_rate": 1.8582441131575658e-05, "loss": 0.6564, "step": 39750 }, { "epoch": 1.27, "learning_rate": 1.8581867781553654e-05, "loss": 0.6519, "step": 39755 }, { "epoch": 1.27, "learning_rate": 1.8581294324454573e-05, "loss": 0.6704, "step": 39760 }, { "epoch": 1.27, "learning_rate": 1.858072076028557e-05, "loss": 0.6664, "step": 39765 }, { "epoch": 1.27, "learning_rate": 1.8580147089053805e-05, "loss": 0.6683, "step": 39770 }, { "epoch": 1.27, "learning_rate": 1.857957331076643e-05, "loss": 0.6616, "step": 39775 }, { "epoch": 1.27, "learning_rate": 1.857899942543061e-05, "loss": 0.6494, "step": 39780 }, { "epoch": 1.27, "learning_rate": 1.8578425433053505e-05, "loss": 0.6636, "step": 39785 }, { "epoch": 1.27, "learning_rate": 1.8577851333642273e-05, "loss": 0.6616, "step": 39790 }, { "epoch": 1.27, "learning_rate": 1.8577277127204077e-05, "loss": 0.6629, "step": 39795 }, { "epoch": 1.27, "learning_rate": 1.8576702813746087e-05, "loss": 0.6681, "step": 39800 }, { "epoch": 1.27, "learning_rate": 1.8576128393275463e-05, "loss": 0.6561, "step": 39805 }, { "epoch": 1.27, "learning_rate": 1.8575553865799376e-05, "loss": 0.6578, "step": 39810 }, { "epoch": 1.27, "learning_rate": 1.8574979231324993e-05, "loss": 0.6601, "step": 39815 }, { "epoch": 1.27, "learning_rate": 1.8574404489859483e-05, "loss": 0.6592, "step": 39820 }, { "epoch": 1.27, "learning_rate": 1.857382964141002e-05, "loss": 0.6611, "step": 39825 }, { "epoch": 1.27, "learning_rate": 1.857325468598377e-05, "loss": 0.6469, "step": 39830 }, { "epoch": 1.27, "learning_rate": 1.8572679623587914e-05, "loss": 0.6612, "step": 39835 }, { "epoch": 1.27, "learning_rate": 1.8572104454229626e-05, "loss": 0.6564, "step": 39840 }, { "epoch": 1.28, "learning_rate": 1.8571529177916075e-05, "loss": 0.6494, "step": 39845 }, { "epoch": 1.28, "learning_rate": 1.8570953794654446e-05, "loss": 0.6672, "step": 39850 }, { "epoch": 1.28, "learning_rate": 1.857037830445192e-05, "loss": 0.6577, "step": 39855 }, { "epoch": 1.28, "learning_rate": 1.856980270731567e-05, "loss": 0.6522, "step": 39860 }, { "epoch": 1.28, "learning_rate": 1.8569227003252887e-05, "loss": 0.6521, "step": 39865 }, { "epoch": 1.28, "learning_rate": 1.8568651192270743e-05, "loss": 0.6592, "step": 39870 }, { "epoch": 1.28, "learning_rate": 1.856807527437643e-05, "loss": 0.6617, "step": 39875 }, { "epoch": 1.28, "learning_rate": 1.8567499249577135e-05, "loss": 0.6564, "step": 39880 }, { "epoch": 1.28, "learning_rate": 1.856692311788004e-05, "loss": 0.6454, "step": 39885 }, { "epoch": 1.28, "learning_rate": 1.8566346879292337e-05, "loss": 0.6685, "step": 39890 }, { "epoch": 1.28, "learning_rate": 1.8565770533821213e-05, "loss": 0.6622, "step": 39895 }, { "epoch": 1.28, "learning_rate": 1.8565194081473863e-05, "loss": 0.6516, "step": 39900 }, { "epoch": 1.28, "learning_rate": 1.8564617522257474e-05, "loss": 0.6549, "step": 39905 }, { "epoch": 1.28, "learning_rate": 1.856404085617925e-05, "loss": 0.6411, "step": 39910 }, { "epoch": 1.28, "learning_rate": 1.8563464083246372e-05, "loss": 0.6598, "step": 39915 }, { "epoch": 1.28, "learning_rate": 1.8562887203466044e-05, "loss": 0.6602, "step": 39920 }, { "epoch": 1.28, "learning_rate": 1.8562310216845463e-05, "loss": 0.6661, "step": 39925 }, { "epoch": 1.28, "learning_rate": 1.8561733123391835e-05, "loss": 0.6542, "step": 39930 }, { "epoch": 1.28, "learning_rate": 1.8561155923112347e-05, "loss": 0.6583, "step": 39935 }, { "epoch": 1.28, "learning_rate": 1.8560578616014214e-05, "loss": 0.6509, "step": 39940 }, { "epoch": 1.28, "learning_rate": 1.856000120210463e-05, "loss": 0.6679, "step": 39945 }, { "epoch": 1.28, "learning_rate": 1.8559423681390803e-05, "loss": 0.6515, "step": 39950 }, { "epoch": 1.28, "learning_rate": 1.8558846053879937e-05, "loss": 0.6626, "step": 39955 }, { "epoch": 1.28, "learning_rate": 1.855826831957924e-05, "loss": 0.6554, "step": 39960 }, { "epoch": 1.28, "learning_rate": 1.855769047849592e-05, "loss": 0.6655, "step": 39965 }, { "epoch": 1.28, "learning_rate": 1.8557112530637195e-05, "loss": 0.6664, "step": 39970 }, { "epoch": 1.28, "learning_rate": 1.855653447601026e-05, "loss": 0.6438, "step": 39975 }, { "epoch": 1.28, "learning_rate": 1.855595631462234e-05, "loss": 0.6497, "step": 39980 }, { "epoch": 1.28, "learning_rate": 1.8555378046480647e-05, "loss": 0.6572, "step": 39985 }, { "epoch": 1.28, "learning_rate": 1.855479967159239e-05, "loss": 0.6625, "step": 39990 }, { "epoch": 1.28, "learning_rate": 1.855422118996479e-05, "loss": 0.6453, "step": 39995 }, { "epoch": 1.28, "learning_rate": 1.855364260160507e-05, "loss": 0.6512, "step": 40000 }, { "epoch": 1.28, "learning_rate": 1.855306390652044e-05, "loss": 0.6533, "step": 40005 }, { "epoch": 1.28, "learning_rate": 1.8552485104718122e-05, "loss": 0.6595, "step": 40010 }, { "epoch": 1.28, "learning_rate": 1.855190619620534e-05, "loss": 0.6626, "step": 40015 }, { "epoch": 1.28, "learning_rate": 1.8551327180989318e-05, "loss": 0.6617, "step": 40020 }, { "epoch": 1.28, "learning_rate": 1.8550748059077278e-05, "loss": 0.6529, "step": 40025 }, { "epoch": 1.28, "learning_rate": 1.8550168830476448e-05, "loss": 0.6612, "step": 40030 }, { "epoch": 1.28, "learning_rate": 1.8549589495194058e-05, "loss": 0.657, "step": 40035 }, { "epoch": 1.28, "learning_rate": 1.854901005323733e-05, "loss": 0.6517, "step": 40040 }, { "epoch": 1.28, "learning_rate": 1.8548430504613497e-05, "loss": 0.6569, "step": 40045 }, { "epoch": 1.28, "learning_rate": 1.8547850849329788e-05, "loss": 0.6534, "step": 40050 }, { "epoch": 1.28, "learning_rate": 1.8547271087393436e-05, "loss": 0.6659, "step": 40055 }, { "epoch": 1.28, "learning_rate": 1.854669121881168e-05, "loss": 0.6606, "step": 40060 }, { "epoch": 1.28, "learning_rate": 1.8546111243591746e-05, "loss": 0.6534, "step": 40065 }, { "epoch": 1.28, "learning_rate": 1.854553116174088e-05, "loss": 0.6672, "step": 40070 }, { "epoch": 1.28, "learning_rate": 1.854495097326631e-05, "loss": 0.667, "step": 40075 }, { "epoch": 1.28, "learning_rate": 1.8544370678175282e-05, "loss": 0.6579, "step": 40080 }, { "epoch": 1.28, "learning_rate": 1.8543790276475037e-05, "loss": 0.6479, "step": 40085 }, { "epoch": 1.28, "learning_rate": 1.8543209768172815e-05, "loss": 0.6524, "step": 40090 }, { "epoch": 1.28, "learning_rate": 1.8542629153275854e-05, "loss": 0.6402, "step": 40095 }, { "epoch": 1.28, "learning_rate": 1.8542048431791404e-05, "loss": 0.6499, "step": 40100 }, { "epoch": 1.28, "learning_rate": 1.854146760372671e-05, "loss": 0.6651, "step": 40105 }, { "epoch": 1.28, "learning_rate": 1.854088666908902e-05, "loss": 0.645, "step": 40110 }, { "epoch": 1.28, "learning_rate": 1.854030562788558e-05, "loss": 0.66, "step": 40115 }, { "epoch": 1.28, "learning_rate": 1.853972448012364e-05, "loss": 0.6553, "step": 40120 }, { "epoch": 1.28, "learning_rate": 1.8539143225810453e-05, "loss": 0.6532, "step": 40125 }, { "epoch": 1.28, "learning_rate": 1.853856186495327e-05, "loss": 0.6591, "step": 40130 }, { "epoch": 1.28, "learning_rate": 1.8537980397559342e-05, "loss": 0.6607, "step": 40135 }, { "epoch": 1.28, "learning_rate": 1.853739882363593e-05, "loss": 0.6504, "step": 40140 }, { "epoch": 1.28, "learning_rate": 1.8536817143190284e-05, "loss": 0.6598, "step": 40145 }, { "epoch": 1.28, "learning_rate": 1.8536235356229667e-05, "loss": 0.6638, "step": 40150 }, { "epoch": 1.28, "learning_rate": 1.8535653462761337e-05, "loss": 0.6538, "step": 40155 }, { "epoch": 1.29, "learning_rate": 1.8535071462792557e-05, "loss": 0.6494, "step": 40160 }, { "epoch": 1.29, "learning_rate": 1.8534489356330576e-05, "loss": 0.6646, "step": 40165 }, { "epoch": 1.29, "learning_rate": 1.8533907143382672e-05, "loss": 0.6619, "step": 40170 }, { "epoch": 1.29, "learning_rate": 1.8533324823956104e-05, "loss": 0.6534, "step": 40175 }, { "epoch": 1.29, "learning_rate": 1.8532742398058134e-05, "loss": 0.6508, "step": 40180 }, { "epoch": 1.29, "learning_rate": 1.8532159865696034e-05, "loss": 0.6587, "step": 40185 }, { "epoch": 1.29, "learning_rate": 1.8531577226877068e-05, "loss": 0.6555, "step": 40190 }, { "epoch": 1.29, "learning_rate": 1.853099448160851e-05, "loss": 0.6615, "step": 40195 }, { "epoch": 1.29, "learning_rate": 1.8530411629897628e-05, "loss": 0.6482, "step": 40200 }, { "epoch": 1.29, "learning_rate": 1.85298286717517e-05, "loss": 0.6528, "step": 40205 }, { "epoch": 1.29, "learning_rate": 1.852924560717799e-05, "loss": 0.6524, "step": 40210 }, { "epoch": 1.29, "learning_rate": 1.852866243618378e-05, "loss": 0.654, "step": 40215 }, { "epoch": 1.29, "learning_rate": 1.8528079158776342e-05, "loss": 0.659, "step": 40220 }, { "epoch": 1.29, "learning_rate": 1.852749577496296e-05, "loss": 0.6551, "step": 40225 }, { "epoch": 1.29, "learning_rate": 1.8526912284750908e-05, "loss": 0.6445, "step": 40230 }, { "epoch": 1.29, "learning_rate": 1.8526328688147465e-05, "loss": 0.6555, "step": 40235 }, { "epoch": 1.29, "learning_rate": 1.8525744985159916e-05, "loss": 0.6533, "step": 40240 }, { "epoch": 1.29, "learning_rate": 1.852516117579554e-05, "loss": 0.6716, "step": 40245 }, { "epoch": 1.29, "learning_rate": 1.8524577260061628e-05, "loss": 0.6648, "step": 40250 }, { "epoch": 1.29, "learning_rate": 1.8523993237965458e-05, "loss": 0.6527, "step": 40255 }, { "epoch": 1.29, "learning_rate": 1.8523409109514324e-05, "loss": 0.6575, "step": 40260 }, { "epoch": 1.29, "learning_rate": 1.852282487471551e-05, "loss": 0.6606, "step": 40265 }, { "epoch": 1.29, "learning_rate": 1.8522240533576302e-05, "loss": 0.6574, "step": 40270 }, { "epoch": 1.29, "learning_rate": 1.8521656086103998e-05, "loss": 0.666, "step": 40275 }, { "epoch": 1.29, "learning_rate": 1.852107153230589e-05, "loss": 0.6602, "step": 40280 }, { "epoch": 1.29, "learning_rate": 1.852048687218927e-05, "loss": 0.6456, "step": 40285 }, { "epoch": 1.29, "learning_rate": 1.8519902105761426e-05, "loss": 0.6615, "step": 40290 }, { "epoch": 1.29, "learning_rate": 1.8519317233029664e-05, "loss": 0.6568, "step": 40295 }, { "epoch": 1.29, "learning_rate": 1.8518732254001275e-05, "loss": 0.6625, "step": 40300 }, { "epoch": 1.29, "learning_rate": 1.8518147168683566e-05, "loss": 0.6632, "step": 40305 }, { "epoch": 1.29, "learning_rate": 1.8517561977083825e-05, "loss": 0.6501, "step": 40310 }, { "epoch": 1.29, "learning_rate": 1.851697667920936e-05, "loss": 0.6543, "step": 40315 }, { "epoch": 1.29, "learning_rate": 1.851639127506748e-05, "loss": 0.6629, "step": 40320 }, { "epoch": 1.29, "learning_rate": 1.8515805764665478e-05, "loss": 0.6532, "step": 40325 }, { "epoch": 1.29, "learning_rate": 1.851522014801067e-05, "loss": 0.6588, "step": 40330 }, { "epoch": 1.29, "learning_rate": 1.8514634425110353e-05, "loss": 0.6556, "step": 40335 }, { "epoch": 1.29, "learning_rate": 1.851404859597184e-05, "loss": 0.654, "step": 40340 }, { "epoch": 1.29, "learning_rate": 1.851346266060244e-05, "loss": 0.6637, "step": 40345 }, { "epoch": 1.29, "learning_rate": 1.8512876619009467e-05, "loss": 0.6516, "step": 40350 }, { "epoch": 1.29, "learning_rate": 1.8512290471200225e-05, "loss": 0.6708, "step": 40355 }, { "epoch": 1.29, "learning_rate": 1.8511704217182038e-05, "loss": 0.6613, "step": 40360 }, { "epoch": 1.29, "learning_rate": 1.8511117856962213e-05, "loss": 0.6589, "step": 40365 }, { "epoch": 1.29, "learning_rate": 1.8510531390548067e-05, "loss": 0.6457, "step": 40370 }, { "epoch": 1.29, "learning_rate": 1.850994481794692e-05, "loss": 0.6593, "step": 40375 }, { "epoch": 1.29, "learning_rate": 1.8509358139166088e-05, "loss": 0.6471, "step": 40380 }, { "epoch": 1.29, "learning_rate": 1.8508771354212894e-05, "loss": 0.6585, "step": 40385 }, { "epoch": 1.29, "learning_rate": 1.8508184463094657e-05, "loss": 0.6526, "step": 40390 }, { "epoch": 1.29, "learning_rate": 1.8507597465818702e-05, "loss": 0.6568, "step": 40395 }, { "epoch": 1.29, "learning_rate": 1.8507010362392352e-05, "loss": 0.651, "step": 40400 }, { "epoch": 1.29, "learning_rate": 1.850642315282293e-05, "loss": 0.6581, "step": 40405 }, { "epoch": 1.29, "learning_rate": 1.8505835837117763e-05, "loss": 0.6514, "step": 40410 }, { "epoch": 1.29, "learning_rate": 1.8505248415284186e-05, "loss": 0.6576, "step": 40415 }, { "epoch": 1.29, "learning_rate": 1.850466088732952e-05, "loss": 0.6465, "step": 40420 }, { "epoch": 1.29, "learning_rate": 1.85040732532611e-05, "loss": 0.6597, "step": 40425 }, { "epoch": 1.29, "learning_rate": 1.8503485513086256e-05, "loss": 0.6526, "step": 40430 }, { "epoch": 1.29, "learning_rate": 1.850289766681232e-05, "loss": 0.6524, "step": 40435 }, { "epoch": 1.29, "learning_rate": 1.850230971444663e-05, "loss": 0.6662, "step": 40440 }, { "epoch": 1.29, "learning_rate": 1.850172165599652e-05, "loss": 0.6554, "step": 40445 }, { "epoch": 1.29, "learning_rate": 1.850113349146933e-05, "loss": 0.6532, "step": 40450 }, { "epoch": 1.29, "learning_rate": 1.8500545220872396e-05, "loss": 0.6651, "step": 40455 }, { "epoch": 1.29, "learning_rate": 1.8499956844213058e-05, "loss": 0.6443, "step": 40460 }, { "epoch": 1.29, "learning_rate": 1.849936836149866e-05, "loss": 0.6558, "step": 40465 }, { "epoch": 1.3, "learning_rate": 1.849877977273654e-05, "loss": 0.6435, "step": 40470 }, { "epoch": 1.3, "learning_rate": 1.8498191077934042e-05, "loss": 0.647, "step": 40475 }, { "epoch": 1.3, "learning_rate": 1.8497602277098517e-05, "loss": 0.6554, "step": 40480 }, { "epoch": 1.3, "learning_rate": 1.8497013370237303e-05, "loss": 0.6625, "step": 40485 }, { "epoch": 1.3, "learning_rate": 1.849642435735776e-05, "loss": 0.6514, "step": 40490 }, { "epoch": 1.3, "learning_rate": 1.8495835238467224e-05, "loss": 0.6722, "step": 40495 }, { "epoch": 1.3, "learning_rate": 1.8495246013573057e-05, "loss": 0.649, "step": 40500 }, { "epoch": 1.3, "learning_rate": 1.84946566826826e-05, "loss": 0.6621, "step": 40505 }, { "epoch": 1.3, "learning_rate": 1.8494067245803214e-05, "loss": 0.6607, "step": 40510 }, { "epoch": 1.3, "learning_rate": 1.849347770294225e-05, "loss": 0.6574, "step": 40515 }, { "epoch": 1.3, "learning_rate": 1.8492888054107066e-05, "loss": 0.6526, "step": 40520 }, { "epoch": 1.3, "learning_rate": 1.8492298299305015e-05, "loss": 0.6616, "step": 40525 }, { "epoch": 1.3, "learning_rate": 1.8491708438543465e-05, "loss": 0.6552, "step": 40530 }, { "epoch": 1.3, "learning_rate": 1.849111847182976e-05, "loss": 0.6595, "step": 40535 }, { "epoch": 1.3, "learning_rate": 1.8490528399171278e-05, "loss": 0.6664, "step": 40540 }, { "epoch": 1.3, "learning_rate": 1.848993822057537e-05, "loss": 0.6513, "step": 40545 }, { "epoch": 1.3, "learning_rate": 1.8489347936049403e-05, "loss": 0.6507, "step": 40550 }, { "epoch": 1.3, "learning_rate": 1.8488757545600746e-05, "loss": 0.6621, "step": 40555 }, { "epoch": 1.3, "learning_rate": 1.8488167049236758e-05, "loss": 0.6473, "step": 40560 }, { "epoch": 1.3, "learning_rate": 1.8487576446964812e-05, "loss": 0.6586, "step": 40565 }, { "epoch": 1.3, "learning_rate": 1.8486985738792277e-05, "loss": 0.6622, "step": 40570 }, { "epoch": 1.3, "learning_rate": 1.848639492472652e-05, "loss": 0.6603, "step": 40575 }, { "epoch": 1.3, "learning_rate": 1.8485804004774914e-05, "loss": 0.6512, "step": 40580 }, { "epoch": 1.3, "learning_rate": 1.8485212978944834e-05, "loss": 0.6552, "step": 40585 }, { "epoch": 1.3, "learning_rate": 1.848462184724365e-05, "loss": 0.6604, "step": 40590 }, { "epoch": 1.3, "learning_rate": 1.8484030609678744e-05, "loss": 0.6612, "step": 40595 }, { "epoch": 1.3, "learning_rate": 1.8483439266257485e-05, "loss": 0.6639, "step": 40600 }, { "epoch": 1.3, "learning_rate": 1.848284781698726e-05, "loss": 0.6508, "step": 40605 }, { "epoch": 1.3, "learning_rate": 1.8482256261875442e-05, "loss": 0.6534, "step": 40610 }, { "epoch": 1.3, "learning_rate": 1.8481664600929413e-05, "loss": 0.6471, "step": 40615 }, { "epoch": 1.3, "learning_rate": 1.848107283415656e-05, "loss": 0.6593, "step": 40620 }, { "epoch": 1.3, "learning_rate": 1.848048096156426e-05, "loss": 0.6575, "step": 40625 }, { "epoch": 1.3, "learning_rate": 1.8479888983159903e-05, "loss": 0.6488, "step": 40630 }, { "epoch": 1.3, "learning_rate": 1.8479296898950873e-05, "loss": 0.6602, "step": 40635 }, { "epoch": 1.3, "learning_rate": 1.8478704708944555e-05, "loss": 0.6599, "step": 40640 }, { "epoch": 1.3, "learning_rate": 1.847811241314834e-05, "loss": 0.6514, "step": 40645 }, { "epoch": 1.3, "learning_rate": 1.847752001156962e-05, "loss": 0.6621, "step": 40650 }, { "epoch": 1.3, "learning_rate": 1.8476927504215786e-05, "loss": 0.6587, "step": 40655 }, { "epoch": 1.3, "learning_rate": 1.847633489109423e-05, "loss": 0.6541, "step": 40660 }, { "epoch": 1.3, "learning_rate": 1.8475742172212347e-05, "loss": 0.6461, "step": 40665 }, { "epoch": 1.3, "learning_rate": 1.8475149347577526e-05, "loss": 0.6511, "step": 40670 }, { "epoch": 1.3, "learning_rate": 1.8474556417197175e-05, "loss": 0.6624, "step": 40675 }, { "epoch": 1.3, "learning_rate": 1.8473963381078685e-05, "loss": 0.6658, "step": 40680 }, { "epoch": 1.3, "learning_rate": 1.847337023922945e-05, "loss": 0.6599, "step": 40685 }, { "epoch": 1.3, "learning_rate": 1.8472776991656886e-05, "loss": 0.6706, "step": 40690 }, { "epoch": 1.3, "learning_rate": 1.847218363836838e-05, "loss": 0.645, "step": 40695 }, { "epoch": 1.3, "learning_rate": 1.8471590179371346e-05, "loss": 0.6599, "step": 40700 }, { "epoch": 1.3, "learning_rate": 1.847099661467318e-05, "loss": 0.6652, "step": 40705 }, { "epoch": 1.3, "learning_rate": 1.8470402944281295e-05, "loss": 0.6611, "step": 40710 }, { "epoch": 1.3, "learning_rate": 1.8469809168203093e-05, "loss": 0.6425, "step": 40715 }, { "epoch": 1.3, "learning_rate": 1.846921528644599e-05, "loss": 0.6419, "step": 40720 }, { "epoch": 1.3, "learning_rate": 1.8468621299017388e-05, "loss": 0.6413, "step": 40725 }, { "epoch": 1.3, "learning_rate": 1.84680272059247e-05, "loss": 0.6665, "step": 40730 }, { "epoch": 1.3, "learning_rate": 1.846743300717534e-05, "loss": 0.6614, "step": 40735 }, { "epoch": 1.3, "learning_rate": 1.8466838702776722e-05, "loss": 0.6551, "step": 40740 }, { "epoch": 1.3, "learning_rate": 1.8466244292736267e-05, "loss": 0.6487, "step": 40745 }, { "epoch": 1.3, "learning_rate": 1.8465649777061377e-05, "loss": 0.6511, "step": 40750 }, { "epoch": 1.3, "learning_rate": 1.8465055155759483e-05, "loss": 0.6505, "step": 40755 }, { "epoch": 1.3, "learning_rate": 1.8464460428838002e-05, "loss": 0.6628, "step": 40760 }, { "epoch": 1.3, "learning_rate": 1.846386559630435e-05, "loss": 0.6443, "step": 40765 }, { "epoch": 1.3, "learning_rate": 1.846327065816595e-05, "loss": 0.6618, "step": 40770 }, { "epoch": 1.3, "learning_rate": 1.8462675614430223e-05, "loss": 0.647, "step": 40775 }, { "epoch": 1.3, "learning_rate": 1.8462080465104598e-05, "loss": 0.6585, "step": 40780 }, { "epoch": 1.31, "learning_rate": 1.8461485210196503e-05, "loss": 0.6568, "step": 40785 }, { "epoch": 1.31, "learning_rate": 1.8460889849713357e-05, "loss": 0.6566, "step": 40790 }, { "epoch": 1.31, "learning_rate": 1.8460294383662595e-05, "loss": 0.6625, "step": 40795 }, { "epoch": 1.31, "learning_rate": 1.8459698812051642e-05, "loss": 0.657, "step": 40800 }, { "epoch": 1.31, "learning_rate": 1.8459103134887936e-05, "loss": 0.6601, "step": 40805 }, { "epoch": 1.31, "learning_rate": 1.84585073521789e-05, "loss": 0.6654, "step": 40810 }, { "epoch": 1.31, "learning_rate": 1.8457911463931975e-05, "loss": 0.6613, "step": 40815 }, { "epoch": 1.31, "learning_rate": 1.845731547015459e-05, "loss": 0.6502, "step": 40820 }, { "epoch": 1.31, "learning_rate": 1.845671937085419e-05, "loss": 0.6621, "step": 40825 }, { "epoch": 1.31, "learning_rate": 1.84561231660382e-05, "loss": 0.648, "step": 40830 }, { "epoch": 1.31, "learning_rate": 1.8455526855714074e-05, "loss": 0.6479, "step": 40835 }, { "epoch": 1.31, "learning_rate": 1.845493043988924e-05, "loss": 0.664, "step": 40840 }, { "epoch": 1.31, "learning_rate": 1.8454333918571145e-05, "loss": 0.6421, "step": 40845 }, { "epoch": 1.31, "learning_rate": 1.845373729176723e-05, "loss": 0.664, "step": 40850 }, { "epoch": 1.31, "learning_rate": 1.845314055948494e-05, "loss": 0.6531, "step": 40855 }, { "epoch": 1.31, "learning_rate": 1.8452543721731723e-05, "loss": 0.6533, "step": 40860 }, { "epoch": 1.31, "learning_rate": 1.8451946778515024e-05, "loss": 0.6421, "step": 40865 }, { "epoch": 1.31, "learning_rate": 1.8451349729842288e-05, "loss": 0.6561, "step": 40870 }, { "epoch": 1.31, "learning_rate": 1.8450752575720967e-05, "loss": 0.6491, "step": 40875 }, { "epoch": 1.31, "learning_rate": 1.8450155316158512e-05, "loss": 0.6523, "step": 40880 }, { "epoch": 1.31, "learning_rate": 1.8449557951162376e-05, "loss": 0.674, "step": 40885 }, { "epoch": 1.31, "learning_rate": 1.8448960480740007e-05, "loss": 0.6426, "step": 40890 }, { "epoch": 1.31, "learning_rate": 1.8448362904898868e-05, "loss": 0.6704, "step": 40895 }, { "epoch": 1.31, "learning_rate": 1.844776522364641e-05, "loss": 0.648, "step": 40900 }, { "epoch": 1.31, "learning_rate": 1.8447167436990093e-05, "loss": 0.6602, "step": 40905 }, { "epoch": 1.31, "learning_rate": 1.8446569544937372e-05, "loss": 0.6607, "step": 40910 }, { "epoch": 1.31, "learning_rate": 1.8445971547495707e-05, "loss": 0.6582, "step": 40915 }, { "epoch": 1.31, "learning_rate": 1.8445373444672562e-05, "loss": 0.6498, "step": 40920 }, { "epoch": 1.31, "learning_rate": 1.8444775236475402e-05, "loss": 0.648, "step": 40925 }, { "epoch": 1.31, "learning_rate": 1.8444176922911686e-05, "loss": 0.6457, "step": 40930 }, { "epoch": 1.31, "learning_rate": 1.844357850398888e-05, "loss": 0.6567, "step": 40935 }, { "epoch": 1.31, "learning_rate": 1.8442979979714453e-05, "loss": 0.6589, "step": 40940 }, { "epoch": 1.31, "learning_rate": 1.844238135009587e-05, "loss": 0.6581, "step": 40945 }, { "epoch": 1.31, "learning_rate": 1.8441782615140603e-05, "loss": 0.6613, "step": 40950 }, { "epoch": 1.31, "learning_rate": 1.844118377485612e-05, "loss": 0.6492, "step": 40955 }, { "epoch": 1.31, "learning_rate": 1.8440584829249894e-05, "loss": 0.6513, "step": 40960 }, { "epoch": 1.31, "learning_rate": 1.84399857783294e-05, "loss": 0.6457, "step": 40965 }, { "epoch": 1.31, "learning_rate": 1.8439386622102108e-05, "loss": 0.6629, "step": 40970 }, { "epoch": 1.31, "learning_rate": 1.84387873605755e-05, "loss": 0.6363, "step": 40975 }, { "epoch": 1.31, "learning_rate": 1.8438187993757045e-05, "loss": 0.6463, "step": 40980 }, { "epoch": 1.31, "learning_rate": 1.8437588521654228e-05, "loss": 0.6576, "step": 40985 }, { "epoch": 1.31, "learning_rate": 1.8436988944274522e-05, "loss": 0.6512, "step": 40990 }, { "epoch": 1.31, "learning_rate": 1.843638926162542e-05, "loss": 0.6415, "step": 40995 }, { "epoch": 1.31, "learning_rate": 1.843578947371439e-05, "loss": 0.6552, "step": 41000 }, { "epoch": 1.31, "learning_rate": 1.8435189580548924e-05, "loss": 0.6565, "step": 41005 }, { "epoch": 1.31, "learning_rate": 1.8434589582136503e-05, "loss": 0.6655, "step": 41010 }, { "epoch": 1.31, "learning_rate": 1.8433989478484622e-05, "loss": 0.6557, "step": 41015 }, { "epoch": 1.31, "learning_rate": 1.8433389269600757e-05, "loss": 0.6554, "step": 41020 }, { "epoch": 1.31, "learning_rate": 1.8432788955492404e-05, "loss": 0.6652, "step": 41025 }, { "epoch": 1.31, "learning_rate": 1.843218853616705e-05, "loss": 0.6621, "step": 41030 }, { "epoch": 1.31, "learning_rate": 1.843158801163219e-05, "loss": 0.6552, "step": 41035 }, { "epoch": 1.31, "learning_rate": 1.8430987381895312e-05, "loss": 0.6588, "step": 41040 }, { "epoch": 1.31, "learning_rate": 1.8430386646963915e-05, "loss": 0.6586, "step": 41045 }, { "epoch": 1.31, "learning_rate": 1.842978580684549e-05, "loss": 0.6344, "step": 41050 }, { "epoch": 1.31, "learning_rate": 1.8429184861547537e-05, "loss": 0.6669, "step": 41055 }, { "epoch": 1.31, "learning_rate": 1.842858381107755e-05, "loss": 0.6621, "step": 41060 }, { "epoch": 1.31, "learning_rate": 1.8427982655443034e-05, "loss": 0.6603, "step": 41065 }, { "epoch": 1.31, "learning_rate": 1.8427381394651485e-05, "loss": 0.6602, "step": 41070 }, { "epoch": 1.31, "learning_rate": 1.842678002871041e-05, "loss": 0.6482, "step": 41075 }, { "epoch": 1.31, "learning_rate": 1.8426178557627305e-05, "loss": 0.6649, "step": 41080 }, { "epoch": 1.31, "learning_rate": 1.8425576981409682e-05, "loss": 0.6539, "step": 41085 }, { "epoch": 1.31, "learning_rate": 1.8424975300065046e-05, "loss": 0.6479, "step": 41090 }, { "epoch": 1.32, "learning_rate": 1.8424373513600896e-05, "loss": 0.6557, "step": 41095 }, { "epoch": 1.32, "learning_rate": 1.8423771622024752e-05, "loss": 0.6632, "step": 41100 }, { "epoch": 1.32, "learning_rate": 1.842316962534412e-05, "loss": 0.6628, "step": 41105 }, { "epoch": 1.32, "learning_rate": 1.8422567523566503e-05, "loss": 0.6509, "step": 41110 }, { "epoch": 1.32, "learning_rate": 1.8421965316699424e-05, "loss": 0.6444, "step": 41115 }, { "epoch": 1.32, "learning_rate": 1.8421363004750393e-05, "loss": 0.6552, "step": 41120 }, { "epoch": 1.32, "learning_rate": 1.8420760587726925e-05, "loss": 0.6522, "step": 41125 }, { "epoch": 1.32, "learning_rate": 1.8420158065636538e-05, "loss": 0.6439, "step": 41130 }, { "epoch": 1.32, "learning_rate": 1.8419555438486747e-05, "loss": 0.656, "step": 41135 }, { "epoch": 1.32, "learning_rate": 1.841895270628507e-05, "loss": 0.6583, "step": 41140 }, { "epoch": 1.32, "learning_rate": 1.8418349869039033e-05, "loss": 0.6557, "step": 41145 }, { "epoch": 1.32, "learning_rate": 1.8417746926756157e-05, "loss": 0.656, "step": 41150 }, { "epoch": 1.32, "learning_rate": 1.8417143879443956e-05, "loss": 0.6449, "step": 41155 }, { "epoch": 1.32, "learning_rate": 1.8416540727109967e-05, "loss": 0.6564, "step": 41160 }, { "epoch": 1.32, "learning_rate": 1.8415937469761703e-05, "loss": 0.6538, "step": 41165 }, { "epoch": 1.32, "learning_rate": 1.84153341074067e-05, "loss": 0.6515, "step": 41170 }, { "epoch": 1.32, "learning_rate": 1.841473064005249e-05, "loss": 0.6682, "step": 41175 }, { "epoch": 1.32, "learning_rate": 1.841412706770659e-05, "loss": 0.6564, "step": 41180 }, { "epoch": 1.32, "learning_rate": 1.8413523390376535e-05, "loss": 0.6656, "step": 41185 }, { "epoch": 1.32, "learning_rate": 1.8412919608069862e-05, "loss": 0.6432, "step": 41190 }, { "epoch": 1.32, "learning_rate": 1.8412315720794102e-05, "loss": 0.6496, "step": 41195 }, { "epoch": 1.32, "learning_rate": 1.8411711728556787e-05, "loss": 0.651, "step": 41200 }, { "epoch": 1.32, "learning_rate": 1.8411107631365457e-05, "loss": 0.6563, "step": 41205 }, { "epoch": 1.32, "learning_rate": 1.841050342922765e-05, "loss": 0.6444, "step": 41210 }, { "epoch": 1.32, "learning_rate": 1.8409899122150898e-05, "loss": 0.657, "step": 41215 }, { "epoch": 1.32, "learning_rate": 1.840929471014275e-05, "loss": 0.6521, "step": 41220 }, { "epoch": 1.32, "learning_rate": 1.8408690193210737e-05, "loss": 0.6598, "step": 41225 }, { "epoch": 1.32, "learning_rate": 1.8408085571362412e-05, "loss": 0.6604, "step": 41230 }, { "epoch": 1.32, "learning_rate": 1.8407480844605315e-05, "loss": 0.6487, "step": 41235 }, { "epoch": 1.32, "learning_rate": 1.840687601294699e-05, "loss": 0.6506, "step": 41240 }, { "epoch": 1.32, "learning_rate": 1.8406271076394983e-05, "loss": 0.6451, "step": 41245 }, { "epoch": 1.32, "learning_rate": 1.8405666034956842e-05, "loss": 0.649, "step": 41250 }, { "epoch": 1.32, "learning_rate": 1.8405060888640122e-05, "loss": 0.6531, "step": 41255 }, { "epoch": 1.32, "learning_rate": 1.8404455637452364e-05, "loss": 0.6465, "step": 41260 }, { "epoch": 1.32, "learning_rate": 1.8403850281401128e-05, "loss": 0.6484, "step": 41265 }, { "epoch": 1.32, "learning_rate": 1.8403244820493966e-05, "loss": 0.652, "step": 41270 }, { "epoch": 1.32, "learning_rate": 1.8402639254738422e-05, "loss": 0.6562, "step": 41275 }, { "epoch": 1.32, "learning_rate": 1.8402033584142067e-05, "loss": 0.6464, "step": 41280 }, { "epoch": 1.32, "learning_rate": 1.840142780871245e-05, "loss": 0.6663, "step": 41285 }, { "epoch": 1.32, "learning_rate": 1.8400821928457126e-05, "loss": 0.6537, "step": 41290 }, { "epoch": 1.32, "learning_rate": 1.840021594338366e-05, "loss": 0.6452, "step": 41295 }, { "epoch": 1.32, "learning_rate": 1.8399609853499614e-05, "loss": 0.6464, "step": 41300 }, { "epoch": 1.32, "learning_rate": 1.839900365881255e-05, "loss": 0.6634, "step": 41305 }, { "epoch": 1.32, "learning_rate": 1.8398397359330023e-05, "loss": 0.6433, "step": 41310 }, { "epoch": 1.32, "learning_rate": 1.839779095505961e-05, "loss": 0.6415, "step": 41315 }, { "epoch": 1.32, "learning_rate": 1.8397184446008868e-05, "loss": 0.6455, "step": 41320 }, { "epoch": 1.32, "learning_rate": 1.839657783218537e-05, "loss": 0.6517, "step": 41325 }, { "epoch": 1.32, "learning_rate": 1.839597111359669e-05, "loss": 0.652, "step": 41330 }, { "epoch": 1.32, "learning_rate": 1.8395364290250383e-05, "loss": 0.6569, "step": 41335 }, { "epoch": 1.32, "learning_rate": 1.8394757362154027e-05, "loss": 0.6645, "step": 41340 }, { "epoch": 1.32, "learning_rate": 1.8394150329315203e-05, "loss": 0.6592, "step": 41345 }, { "epoch": 1.32, "learning_rate": 1.8393543191741473e-05, "loss": 0.6524, "step": 41350 }, { "epoch": 1.32, "learning_rate": 1.8392935949440417e-05, "loss": 0.6573, "step": 41355 }, { "epoch": 1.32, "learning_rate": 1.8392328602419617e-05, "loss": 0.6524, "step": 41360 }, { "epoch": 1.32, "learning_rate": 1.8391721150686642e-05, "loss": 0.6551, "step": 41365 }, { "epoch": 1.32, "learning_rate": 1.8391113594249076e-05, "loss": 0.6441, "step": 41370 }, { "epoch": 1.32, "learning_rate": 1.8390505933114503e-05, "loss": 0.6678, "step": 41375 }, { "epoch": 1.32, "learning_rate": 1.8389898167290497e-05, "loss": 0.6493, "step": 41380 }, { "epoch": 1.32, "learning_rate": 1.8389290296784647e-05, "loss": 0.6516, "step": 41385 }, { "epoch": 1.32, "learning_rate": 1.8388682321604535e-05, "loss": 0.654, "step": 41390 }, { "epoch": 1.32, "learning_rate": 1.8388074241757748e-05, "loss": 0.6534, "step": 41395 }, { "epoch": 1.32, "learning_rate": 1.8387466057251872e-05, "loss": 0.66, "step": 41400 }, { "epoch": 1.32, "learning_rate": 1.8386857768094492e-05, "loss": 0.6464, "step": 41405 }, { "epoch": 1.33, "learning_rate": 1.8386249374293208e-05, "loss": 0.6516, "step": 41410 }, { "epoch": 1.33, "learning_rate": 1.83856408758556e-05, "loss": 0.6551, "step": 41415 }, { "epoch": 1.33, "learning_rate": 1.8385032272789266e-05, "loss": 0.6533, "step": 41420 }, { "epoch": 1.33, "learning_rate": 1.8384423565101798e-05, "loss": 0.6634, "step": 41425 }, { "epoch": 1.33, "learning_rate": 1.8383814752800793e-05, "loss": 0.6619, "step": 41430 }, { "epoch": 1.33, "learning_rate": 1.8383205835893845e-05, "loss": 0.6618, "step": 41435 }, { "epoch": 1.33, "learning_rate": 1.838259681438855e-05, "loss": 0.6566, "step": 41440 }, { "epoch": 1.33, "learning_rate": 1.8381987688292514e-05, "loss": 0.6644, "step": 41445 }, { "epoch": 1.33, "learning_rate": 1.8381378457613327e-05, "loss": 0.6562, "step": 41450 }, { "epoch": 1.33, "learning_rate": 1.8380769122358595e-05, "loss": 0.6492, "step": 41455 }, { "epoch": 1.33, "learning_rate": 1.8380159682535925e-05, "loss": 0.6439, "step": 41460 }, { "epoch": 1.33, "learning_rate": 1.8379550138152916e-05, "loss": 0.6521, "step": 41465 }, { "epoch": 1.33, "learning_rate": 1.8378940489217178e-05, "loss": 0.6608, "step": 41470 }, { "epoch": 1.33, "learning_rate": 1.8378330735736313e-05, "loss": 0.6488, "step": 41475 }, { "epoch": 1.33, "learning_rate": 1.8377720877717925e-05, "loss": 0.6548, "step": 41480 }, { "epoch": 1.33, "learning_rate": 1.8377110915169634e-05, "loss": 0.6732, "step": 41485 }, { "epoch": 1.33, "learning_rate": 1.8376500848099043e-05, "loss": 0.6417, "step": 41490 }, { "epoch": 1.33, "learning_rate": 1.8375890676513767e-05, "loss": 0.6435, "step": 41495 }, { "epoch": 1.33, "learning_rate": 1.837528040042142e-05, "loss": 0.6642, "step": 41500 }, { "epoch": 1.33, "learning_rate": 1.8374670019829614e-05, "loss": 0.6418, "step": 41505 }, { "epoch": 1.33, "learning_rate": 1.8374059534745962e-05, "loss": 0.6485, "step": 41510 }, { "epoch": 1.33, "learning_rate": 1.8373448945178086e-05, "loss": 0.6503, "step": 41515 }, { "epoch": 1.33, "learning_rate": 1.8372838251133606e-05, "loss": 0.6531, "step": 41520 }, { "epoch": 1.33, "learning_rate": 1.8372227452620137e-05, "loss": 0.6623, "step": 41525 }, { "epoch": 1.33, "learning_rate": 1.8371616549645303e-05, "loss": 0.6438, "step": 41530 }, { "epoch": 1.33, "learning_rate": 1.8371005542216728e-05, "loss": 0.646, "step": 41535 }, { "epoch": 1.33, "learning_rate": 1.8370394430342027e-05, "loss": 0.6467, "step": 41540 }, { "epoch": 1.33, "learning_rate": 1.8369783214028832e-05, "loss": 0.6584, "step": 41545 }, { "epoch": 1.33, "learning_rate": 1.836917189328477e-05, "loss": 0.64, "step": 41550 }, { "epoch": 1.33, "learning_rate": 1.8368560468117464e-05, "loss": 0.6489, "step": 41555 }, { "epoch": 1.33, "learning_rate": 1.8367948938534547e-05, "loss": 0.6509, "step": 41560 }, { "epoch": 1.33, "learning_rate": 1.836733730454365e-05, "loss": 0.6422, "step": 41565 }, { "epoch": 1.33, "learning_rate": 1.8366725566152394e-05, "loss": 0.6484, "step": 41570 }, { "epoch": 1.33, "learning_rate": 1.836611372336843e-05, "loss": 0.6672, "step": 41575 }, { "epoch": 1.33, "learning_rate": 1.8365501776199375e-05, "loss": 0.6487, "step": 41580 }, { "epoch": 1.33, "learning_rate": 1.8364889724652872e-05, "loss": 0.6642, "step": 41585 }, { "epoch": 1.33, "learning_rate": 1.8364277568736556e-05, "loss": 0.641, "step": 41590 }, { "epoch": 1.33, "learning_rate": 1.8363665308458065e-05, "loss": 0.6585, "step": 41595 }, { "epoch": 1.33, "learning_rate": 1.836305294382504e-05, "loss": 0.6576, "step": 41600 }, { "epoch": 1.33, "learning_rate": 1.8362440474845124e-05, "loss": 0.652, "step": 41605 }, { "epoch": 1.33, "learning_rate": 1.836182790152595e-05, "loss": 0.6445, "step": 41610 }, { "epoch": 1.33, "learning_rate": 1.836121522387517e-05, "loss": 0.6461, "step": 41615 }, { "epoch": 1.33, "learning_rate": 1.8360602441900423e-05, "loss": 0.6485, "step": 41620 }, { "epoch": 1.33, "learning_rate": 1.8359989555609355e-05, "loss": 0.647, "step": 41625 }, { "epoch": 1.33, "learning_rate": 1.8359376565009618e-05, "loss": 0.6461, "step": 41630 }, { "epoch": 1.33, "learning_rate": 1.8358763470108852e-05, "loss": 0.6458, "step": 41635 }, { "epoch": 1.33, "learning_rate": 1.835815027091472e-05, "loss": 0.6526, "step": 41640 }, { "epoch": 1.33, "learning_rate": 1.8357536967434856e-05, "loss": 0.6625, "step": 41645 }, { "epoch": 1.33, "learning_rate": 1.835692355967693e-05, "loss": 0.6536, "step": 41650 }, { "epoch": 1.33, "learning_rate": 1.8356310047648578e-05, "loss": 0.6454, "step": 41655 }, { "epoch": 1.33, "learning_rate": 1.8355696431357465e-05, "loss": 0.6613, "step": 41660 }, { "epoch": 1.33, "learning_rate": 1.835508271081125e-05, "loss": 0.6497, "step": 41665 }, { "epoch": 1.33, "learning_rate": 1.8354468886017582e-05, "loss": 0.6522, "step": 41670 }, { "epoch": 1.33, "learning_rate": 1.8353854956984127e-05, "loss": 0.6565, "step": 41675 }, { "epoch": 1.33, "learning_rate": 1.8353240923718538e-05, "loss": 0.6458, "step": 41680 }, { "epoch": 1.33, "learning_rate": 1.8352626786228486e-05, "loss": 0.6555, "step": 41685 }, { "epoch": 1.33, "learning_rate": 1.835201254452162e-05, "loss": 0.6595, "step": 41690 }, { "epoch": 1.33, "learning_rate": 1.8351398198605617e-05, "loss": 0.6568, "step": 41695 }, { "epoch": 1.33, "learning_rate": 1.8350783748488135e-05, "loss": 0.636, "step": 41700 }, { "epoch": 1.33, "learning_rate": 1.8350169194176846e-05, "loss": 0.6501, "step": 41705 }, { "epoch": 1.33, "learning_rate": 1.8349554535679413e-05, "loss": 0.6478, "step": 41710 }, { "epoch": 1.33, "learning_rate": 1.8348939773003508e-05, "loss": 0.6449, "step": 41715 }, { "epoch": 1.34, "learning_rate": 1.8348324906156796e-05, "loss": 0.6525, "step": 41720 }, { "epoch": 1.34, "learning_rate": 1.8347709935146958e-05, "loss": 0.6468, "step": 41725 }, { "epoch": 1.34, "learning_rate": 1.8347094859981658e-05, "loss": 0.6561, "step": 41730 }, { "epoch": 1.34, "learning_rate": 1.8346479680668575e-05, "loss": 0.6491, "step": 41735 }, { "epoch": 1.34, "learning_rate": 1.8345864397215387e-05, "loss": 0.6638, "step": 41740 }, { "epoch": 1.34, "learning_rate": 1.8345249009629768e-05, "loss": 0.6558, "step": 41745 }, { "epoch": 1.34, "learning_rate": 1.834463351791939e-05, "loss": 0.659, "step": 41750 }, { "epoch": 1.34, "learning_rate": 1.8344017922091944e-05, "loss": 0.6615, "step": 41755 }, { "epoch": 1.34, "learning_rate": 1.8343402222155106e-05, "loss": 0.6521, "step": 41760 }, { "epoch": 1.34, "learning_rate": 1.834278641811656e-05, "loss": 0.6446, "step": 41765 }, { "epoch": 1.34, "learning_rate": 1.8342170509983985e-05, "loss": 0.6497, "step": 41770 }, { "epoch": 1.34, "learning_rate": 1.834155449776507e-05, "loss": 0.6634, "step": 41775 }, { "epoch": 1.34, "learning_rate": 1.8340938381467498e-05, "loss": 0.6468, "step": 41780 }, { "epoch": 1.34, "learning_rate": 1.8340322161098956e-05, "loss": 0.6534, "step": 41785 }, { "epoch": 1.34, "learning_rate": 1.8339705836667135e-05, "loss": 0.6597, "step": 41790 }, { "epoch": 1.34, "learning_rate": 1.8339089408179724e-05, "loss": 0.6503, "step": 41795 }, { "epoch": 1.34, "learning_rate": 1.8338472875644417e-05, "loss": 0.6496, "step": 41800 }, { "epoch": 1.34, "learning_rate": 1.8337856239068902e-05, "loss": 0.6517, "step": 41805 }, { "epoch": 1.34, "learning_rate": 1.8337239498460876e-05, "loss": 0.6538, "step": 41810 }, { "epoch": 1.34, "learning_rate": 1.8336622653828032e-05, "loss": 0.658, "step": 41815 }, { "epoch": 1.34, "learning_rate": 1.8336005705178065e-05, "loss": 0.6507, "step": 41820 }, { "epoch": 1.34, "learning_rate": 1.833538865251868e-05, "loss": 0.6582, "step": 41825 }, { "epoch": 1.34, "learning_rate": 1.833477149585757e-05, "loss": 0.6619, "step": 41830 }, { "epoch": 1.34, "learning_rate": 1.8334154235202434e-05, "loss": 0.6641, "step": 41835 }, { "epoch": 1.34, "learning_rate": 1.8333536870560983e-05, "loss": 0.6635, "step": 41840 }, { "epoch": 1.34, "learning_rate": 1.833291940194091e-05, "loss": 0.6495, "step": 41845 }, { "epoch": 1.34, "learning_rate": 1.8332301829349918e-05, "loss": 0.6563, "step": 41850 }, { "epoch": 1.34, "learning_rate": 1.833168415279572e-05, "loss": 0.661, "step": 41855 }, { "epoch": 1.34, "learning_rate": 1.833106637228602e-05, "loss": 0.6416, "step": 41860 }, { "epoch": 1.34, "learning_rate": 1.833044848782853e-05, "loss": 0.6485, "step": 41865 }, { "epoch": 1.34, "learning_rate": 1.832983049943095e-05, "loss": 0.6486, "step": 41870 }, { "epoch": 1.34, "learning_rate": 1.8329212407100996e-05, "loss": 0.6532, "step": 41875 }, { "epoch": 1.34, "learning_rate": 1.8328594210846382e-05, "loss": 0.6419, "step": 41880 }, { "epoch": 1.34, "learning_rate": 1.832797591067482e-05, "loss": 0.6535, "step": 41885 }, { "epoch": 1.34, "learning_rate": 1.8327357506594023e-05, "loss": 0.6538, "step": 41890 }, { "epoch": 1.34, "learning_rate": 1.8326738998611708e-05, "loss": 0.6564, "step": 41895 }, { "epoch": 1.34, "learning_rate": 1.8326120386735595e-05, "loss": 0.6372, "step": 41900 }, { "epoch": 1.34, "learning_rate": 1.8325501670973397e-05, "loss": 0.6529, "step": 41905 }, { "epoch": 1.34, "learning_rate": 1.8324882851332834e-05, "loss": 0.6555, "step": 41910 }, { "epoch": 1.34, "learning_rate": 1.8324263927821634e-05, "loss": 0.6669, "step": 41915 }, { "epoch": 1.34, "learning_rate": 1.832364490044751e-05, "loss": 0.6521, "step": 41920 }, { "epoch": 1.34, "learning_rate": 1.8323025769218198e-05, "loss": 0.6457, "step": 41925 }, { "epoch": 1.34, "learning_rate": 1.832240653414141e-05, "loss": 0.6625, "step": 41930 }, { "epoch": 1.34, "learning_rate": 1.832178719522488e-05, "loss": 0.6623, "step": 41935 }, { "epoch": 1.34, "learning_rate": 1.8321167752476335e-05, "loss": 0.6697, "step": 41940 }, { "epoch": 1.34, "learning_rate": 1.8320548205903497e-05, "loss": 0.6341, "step": 41945 }, { "epoch": 1.34, "learning_rate": 1.8319928555514108e-05, "loss": 0.6483, "step": 41950 }, { "epoch": 1.34, "learning_rate": 1.831930880131589e-05, "loss": 0.643, "step": 41955 }, { "epoch": 1.34, "learning_rate": 1.8318688943316577e-05, "loss": 0.6533, "step": 41960 }, { "epoch": 1.34, "learning_rate": 1.8318068981523906e-05, "loss": 0.6665, "step": 41965 }, { "epoch": 1.34, "learning_rate": 1.8317448915945613e-05, "loss": 0.6486, "step": 41970 }, { "epoch": 1.34, "learning_rate": 1.831682874658943e-05, "loss": 0.6562, "step": 41975 }, { "epoch": 1.34, "learning_rate": 1.83162084734631e-05, "loss": 0.6488, "step": 41980 }, { "epoch": 1.34, "learning_rate": 1.8315588096574358e-05, "loss": 0.6543, "step": 41985 }, { "epoch": 1.34, "learning_rate": 1.8314967615930948e-05, "loss": 0.6575, "step": 41990 }, { "epoch": 1.34, "learning_rate": 1.831434703154061e-05, "loss": 0.6569, "step": 41995 }, { "epoch": 1.34, "learning_rate": 1.8313726343411085e-05, "loss": 0.6301, "step": 42000 }, { "epoch": 1.34, "learning_rate": 1.8313105551550125e-05, "loss": 0.6437, "step": 42005 }, { "epoch": 1.34, "learning_rate": 1.8312484655965466e-05, "loss": 0.6487, "step": 42010 }, { "epoch": 1.34, "learning_rate": 1.831186365666486e-05, "loss": 0.6587, "step": 42015 }, { "epoch": 1.34, "learning_rate": 1.8311242553656056e-05, "loss": 0.6595, "step": 42020 }, { "epoch": 1.34, "learning_rate": 1.83106213469468e-05, "loss": 0.6386, "step": 42025 }, { "epoch": 1.34, "learning_rate": 1.831000003654485e-05, "loss": 0.6462, "step": 42030 }, { "epoch": 1.35, "learning_rate": 1.830937862245795e-05, "loss": 0.6319, "step": 42035 }, { "epoch": 1.35, "learning_rate": 1.8308757104693854e-05, "loss": 0.6573, "step": 42040 }, { "epoch": 1.35, "learning_rate": 1.8308135483260324e-05, "loss": 0.6556, "step": 42045 }, { "epoch": 1.35, "learning_rate": 1.8307513758165113e-05, "loss": 0.6578, "step": 42050 }, { "epoch": 1.35, "learning_rate": 1.8306891929415973e-05, "loss": 0.6485, "step": 42055 }, { "epoch": 1.35, "learning_rate": 1.8306269997020666e-05, "loss": 0.659, "step": 42060 }, { "epoch": 1.35, "learning_rate": 1.8305647960986958e-05, "loss": 0.654, "step": 42065 }, { "epoch": 1.35, "learning_rate": 1.83050258213226e-05, "loss": 0.6445, "step": 42070 }, { "epoch": 1.35, "learning_rate": 1.830440357803536e-05, "loss": 0.6471, "step": 42075 }, { "epoch": 1.35, "learning_rate": 1.8303781231133e-05, "loss": 0.6465, "step": 42080 }, { "epoch": 1.35, "learning_rate": 1.830315878062329e-05, "loss": 0.6667, "step": 42085 }, { "epoch": 1.35, "learning_rate": 1.8302536226513993e-05, "loss": 0.6563, "step": 42090 }, { "epoch": 1.35, "learning_rate": 1.8301913568812874e-05, "loss": 0.6507, "step": 42095 }, { "epoch": 1.35, "learning_rate": 1.8301290807527703e-05, "loss": 0.6493, "step": 42100 }, { "epoch": 1.35, "learning_rate": 1.8300667942666252e-05, "loss": 0.6493, "step": 42105 }, { "epoch": 1.35, "learning_rate": 1.8300044974236294e-05, "loss": 0.6444, "step": 42110 }, { "epoch": 1.35, "learning_rate": 1.8299421902245598e-05, "loss": 0.6493, "step": 42115 }, { "epoch": 1.35, "learning_rate": 1.8298798726701942e-05, "loss": 0.6529, "step": 42120 }, { "epoch": 1.35, "learning_rate": 1.82981754476131e-05, "loss": 0.6469, "step": 42125 }, { "epoch": 1.35, "learning_rate": 1.8297552064986846e-05, "loss": 0.643, "step": 42130 }, { "epoch": 1.35, "learning_rate": 1.8296928578830963e-05, "loss": 0.6493, "step": 42135 }, { "epoch": 1.35, "learning_rate": 1.8296304989153225e-05, "loss": 0.6562, "step": 42140 }, { "epoch": 1.35, "learning_rate": 1.8295681295961416e-05, "loss": 0.6448, "step": 42145 }, { "epoch": 1.35, "learning_rate": 1.829505749926332e-05, "loss": 0.6478, "step": 42150 }, { "epoch": 1.35, "learning_rate": 1.829443359906671e-05, "loss": 0.6484, "step": 42155 }, { "epoch": 1.35, "learning_rate": 1.8293809595379386e-05, "loss": 0.6403, "step": 42160 }, { "epoch": 1.35, "learning_rate": 1.8293185488209122e-05, "loss": 0.6458, "step": 42165 }, { "epoch": 1.35, "learning_rate": 1.829256127756371e-05, "loss": 0.644, "step": 42170 }, { "epoch": 1.35, "learning_rate": 1.8291936963450933e-05, "loss": 0.6468, "step": 42175 }, { "epoch": 1.35, "learning_rate": 1.8291312545878587e-05, "loss": 0.6404, "step": 42180 }, { "epoch": 1.35, "learning_rate": 1.8290688024854465e-05, "loss": 0.6493, "step": 42185 }, { "epoch": 1.35, "learning_rate": 1.829006340038635e-05, "loss": 0.6433, "step": 42190 }, { "epoch": 1.35, "learning_rate": 1.8289438672482044e-05, "loss": 0.6607, "step": 42195 }, { "epoch": 1.35, "learning_rate": 1.8288813841149333e-05, "loss": 0.6561, "step": 42200 }, { "epoch": 1.35, "learning_rate": 1.8288188906396024e-05, "loss": 0.6421, "step": 42205 }, { "epoch": 1.35, "learning_rate": 1.8287563868229906e-05, "loss": 0.6556, "step": 42210 }, { "epoch": 1.35, "learning_rate": 1.8286938726658778e-05, "loss": 0.6419, "step": 42215 }, { "epoch": 1.35, "learning_rate": 1.8286313481690446e-05, "loss": 0.6558, "step": 42220 }, { "epoch": 1.35, "learning_rate": 1.8285688133332704e-05, "loss": 0.6435, "step": 42225 }, { "epoch": 1.35, "learning_rate": 1.828506268159336e-05, "loss": 0.6559, "step": 42230 }, { "epoch": 1.35, "learning_rate": 1.8284437126480215e-05, "loss": 0.6551, "step": 42235 }, { "epoch": 1.35, "learning_rate": 1.8283811468001078e-05, "loss": 0.6505, "step": 42240 }, { "epoch": 1.35, "learning_rate": 1.8283185706163752e-05, "loss": 0.668, "step": 42245 }, { "epoch": 1.35, "learning_rate": 1.8282559840976043e-05, "loss": 0.643, "step": 42250 }, { "epoch": 1.35, "learning_rate": 1.8281933872445764e-05, "loss": 0.6536, "step": 42255 }, { "epoch": 1.35, "learning_rate": 1.828130780058072e-05, "loss": 0.6427, "step": 42260 }, { "epoch": 1.35, "learning_rate": 1.8280681625388732e-05, "loss": 0.6526, "step": 42265 }, { "epoch": 1.35, "learning_rate": 1.82800553468776e-05, "loss": 0.6462, "step": 42270 }, { "epoch": 1.35, "learning_rate": 1.8279428965055153e-05, "loss": 0.6581, "step": 42275 }, { "epoch": 1.35, "learning_rate": 1.8278802479929197e-05, "loss": 0.6309, "step": 42280 }, { "epoch": 1.35, "learning_rate": 1.8278175891507546e-05, "loss": 0.6608, "step": 42285 }, { "epoch": 1.35, "learning_rate": 1.8277549199798023e-05, "loss": 0.6461, "step": 42290 }, { "epoch": 1.35, "learning_rate": 1.827692240480845e-05, "loss": 0.6502, "step": 42295 }, { "epoch": 1.35, "learning_rate": 1.827629550654664e-05, "loss": 0.6659, "step": 42300 }, { "epoch": 1.35, "learning_rate": 1.8275668505020424e-05, "loss": 0.655, "step": 42305 }, { "epoch": 1.35, "learning_rate": 1.827504140023762e-05, "loss": 0.652, "step": 42310 }, { "epoch": 1.35, "learning_rate": 1.827441419220605e-05, "loss": 0.6436, "step": 42315 }, { "epoch": 1.35, "learning_rate": 1.8273786880933543e-05, "loss": 0.6497, "step": 42320 }, { "epoch": 1.35, "learning_rate": 1.8273159466427926e-05, "loss": 0.6586, "step": 42325 }, { "epoch": 1.35, "learning_rate": 1.8272531948697026e-05, "loss": 0.6614, "step": 42330 }, { "epoch": 1.35, "learning_rate": 1.8271904327748677e-05, "loss": 0.6466, "step": 42335 }, { "epoch": 1.35, "learning_rate": 1.82712766035907e-05, "loss": 0.6389, "step": 42340 }, { "epoch": 1.36, "learning_rate": 1.827064877623094e-05, "loss": 0.65, "step": 42345 }, { "epoch": 1.36, "learning_rate": 1.827002084567722e-05, "loss": 0.6602, "step": 42350 }, { "epoch": 1.36, "learning_rate": 1.8269392811937384e-05, "loss": 0.6594, "step": 42355 }, { "epoch": 1.36, "learning_rate": 1.8268764675019257e-05, "loss": 0.6466, "step": 42360 }, { "epoch": 1.36, "learning_rate": 1.8268136434930687e-05, "loss": 0.6508, "step": 42365 }, { "epoch": 1.36, "learning_rate": 1.8267508091679508e-05, "loss": 0.6595, "step": 42370 }, { "epoch": 1.36, "learning_rate": 1.8266879645273557e-05, "loss": 0.6476, "step": 42375 }, { "epoch": 1.36, "learning_rate": 1.8266251095720677e-05, "loss": 0.6453, "step": 42380 }, { "epoch": 1.36, "learning_rate": 1.8265622443028715e-05, "loss": 0.6508, "step": 42385 }, { "epoch": 1.36, "learning_rate": 1.826499368720551e-05, "loss": 0.6504, "step": 42390 }, { "epoch": 1.36, "learning_rate": 1.8264364828258908e-05, "loss": 0.6516, "step": 42395 }, { "epoch": 1.36, "learning_rate": 1.8263735866196758e-05, "loss": 0.6452, "step": 42400 }, { "epoch": 1.36, "learning_rate": 1.8263106801026903e-05, "loss": 0.6451, "step": 42405 }, { "epoch": 1.36, "learning_rate": 1.8262477632757193e-05, "loss": 0.6529, "step": 42410 }, { "epoch": 1.36, "learning_rate": 1.8261848361395484e-05, "loss": 0.657, "step": 42415 }, { "epoch": 1.36, "learning_rate": 1.8261218986949617e-05, "loss": 0.6501, "step": 42420 }, { "epoch": 1.36, "learning_rate": 1.8260589509427457e-05, "loss": 0.6667, "step": 42425 }, { "epoch": 1.36, "learning_rate": 1.825995992883685e-05, "loss": 0.6412, "step": 42430 }, { "epoch": 1.36, "learning_rate": 1.8259330245185652e-05, "loss": 0.6534, "step": 42435 }, { "epoch": 1.36, "learning_rate": 1.825870045848172e-05, "loss": 0.6578, "step": 42440 }, { "epoch": 1.36, "learning_rate": 1.825807056873292e-05, "loss": 0.6573, "step": 42445 }, { "epoch": 1.36, "learning_rate": 1.8257440575947095e-05, "loss": 0.6463, "step": 42450 }, { "epoch": 1.36, "learning_rate": 1.825681048013212e-05, "loss": 0.6464, "step": 42455 }, { "epoch": 1.36, "learning_rate": 1.825618028129585e-05, "loss": 0.6501, "step": 42460 }, { "epoch": 1.36, "learning_rate": 1.8255549979446148e-05, "loss": 0.6443, "step": 42465 }, { "epoch": 1.36, "learning_rate": 1.825491957459088e-05, "loss": 0.6457, "step": 42470 }, { "epoch": 1.36, "learning_rate": 1.825428906673791e-05, "loss": 0.6429, "step": 42475 }, { "epoch": 1.36, "learning_rate": 1.825365845589511e-05, "loss": 0.6416, "step": 42480 }, { "epoch": 1.36, "learning_rate": 1.8253027742070342e-05, "loss": 0.6516, "step": 42485 }, { "epoch": 1.36, "learning_rate": 1.825239692527148e-05, "loss": 0.6525, "step": 42490 }, { "epoch": 1.36, "learning_rate": 1.8251766005506396e-05, "loss": 0.6356, "step": 42495 }, { "epoch": 1.36, "learning_rate": 1.8251134982782952e-05, "loss": 0.6572, "step": 42500 }, { "epoch": 1.36, "learning_rate": 1.8250503857109033e-05, "loss": 0.6588, "step": 42505 }, { "epoch": 1.36, "learning_rate": 1.8249872628492507e-05, "loss": 0.6519, "step": 42510 }, { "epoch": 1.36, "learning_rate": 1.824924129694125e-05, "loss": 0.655, "step": 42515 }, { "epoch": 1.36, "learning_rate": 1.8248609862463145e-05, "loss": 0.6601, "step": 42520 }, { "epoch": 1.36, "learning_rate": 1.8247978325066063e-05, "loss": 0.6482, "step": 42525 }, { "epoch": 1.36, "learning_rate": 1.824734668475789e-05, "loss": 0.6546, "step": 42530 }, { "epoch": 1.36, "learning_rate": 1.8246714941546507e-05, "loss": 0.6464, "step": 42535 }, { "epoch": 1.36, "learning_rate": 1.8246083095439788e-05, "loss": 0.6492, "step": 42540 }, { "epoch": 1.36, "learning_rate": 1.8245451146445626e-05, "loss": 0.6523, "step": 42545 }, { "epoch": 1.36, "learning_rate": 1.8244819094571897e-05, "loss": 0.6538, "step": 42550 }, { "epoch": 1.36, "learning_rate": 1.8244186939826497e-05, "loss": 0.6542, "step": 42555 }, { "epoch": 1.36, "learning_rate": 1.824355468221731e-05, "loss": 0.6461, "step": 42560 }, { "epoch": 1.36, "learning_rate": 1.8242922321752222e-05, "loss": 0.6615, "step": 42565 }, { "epoch": 1.36, "learning_rate": 1.8242289858439123e-05, "loss": 0.6458, "step": 42570 }, { "epoch": 1.36, "learning_rate": 1.8241657292285907e-05, "loss": 0.652, "step": 42575 }, { "epoch": 1.36, "learning_rate": 1.8241024623300466e-05, "loss": 0.6486, "step": 42580 }, { "epoch": 1.36, "learning_rate": 1.8240391851490696e-05, "loss": 0.6543, "step": 42585 }, { "epoch": 1.36, "learning_rate": 1.8239758976864487e-05, "loss": 0.6447, "step": 42590 }, { "epoch": 1.36, "learning_rate": 1.8239125999429737e-05, "loss": 0.6581, "step": 42595 }, { "epoch": 1.36, "learning_rate": 1.8238492919194347e-05, "loss": 0.6407, "step": 42600 }, { "epoch": 1.36, "learning_rate": 1.8237859736166216e-05, "loss": 0.6482, "step": 42605 }, { "epoch": 1.36, "learning_rate": 1.823722645035324e-05, "loss": 0.6371, "step": 42610 }, { "epoch": 1.36, "learning_rate": 1.823659306176332e-05, "loss": 0.6416, "step": 42615 }, { "epoch": 1.36, "learning_rate": 1.8235959570404364e-05, "loss": 0.6502, "step": 42620 }, { "epoch": 1.36, "learning_rate": 1.8235325976284276e-05, "loss": 0.6403, "step": 42625 }, { "epoch": 1.36, "learning_rate": 1.8234692279410956e-05, "loss": 0.6372, "step": 42630 }, { "epoch": 1.36, "learning_rate": 1.8234058479792317e-05, "loss": 0.6585, "step": 42635 }, { "epoch": 1.36, "learning_rate": 1.823342457743626e-05, "loss": 0.6574, "step": 42640 }, { "epoch": 1.36, "learning_rate": 1.8232790572350705e-05, "loss": 0.6709, "step": 42645 }, { "epoch": 1.36, "learning_rate": 1.823215646454355e-05, "loss": 0.6515, "step": 42650 }, { "epoch": 1.36, "learning_rate": 1.8231522254022714e-05, "loss": 0.6533, "step": 42655 }, { "epoch": 1.37, "learning_rate": 1.823088794079611e-05, "loss": 0.6567, "step": 42660 }, { "epoch": 1.37, "learning_rate": 1.8230253524871652e-05, "loss": 0.6502, "step": 42665 }, { "epoch": 1.37, "learning_rate": 1.8229619006257254e-05, "loss": 0.6429, "step": 42670 }, { "epoch": 1.37, "learning_rate": 1.8228984384960832e-05, "loss": 0.6546, "step": 42675 }, { "epoch": 1.37, "learning_rate": 1.822834966099031e-05, "loss": 0.6456, "step": 42680 }, { "epoch": 1.37, "learning_rate": 1.82277148343536e-05, "loss": 0.648, "step": 42685 }, { "epoch": 1.37, "learning_rate": 1.8227079905058627e-05, "loss": 0.6536, "step": 42690 }, { "epoch": 1.37, "learning_rate": 1.8226444873113315e-05, "loss": 0.6588, "step": 42695 }, { "epoch": 1.37, "learning_rate": 1.8225809738525583e-05, "loss": 0.6393, "step": 42700 }, { "epoch": 1.37, "learning_rate": 1.8225174501303357e-05, "loss": 0.6435, "step": 42705 }, { "epoch": 1.37, "learning_rate": 1.8224539161454564e-05, "loss": 0.6535, "step": 42710 }, { "epoch": 1.37, "learning_rate": 1.8223903718987134e-05, "loss": 0.6462, "step": 42715 }, { "epoch": 1.37, "learning_rate": 1.8223268173908988e-05, "loss": 0.6606, "step": 42720 }, { "epoch": 1.37, "learning_rate": 1.822263252622806e-05, "loss": 0.6565, "step": 42725 }, { "epoch": 1.37, "learning_rate": 1.8221996775952285e-05, "loss": 0.6433, "step": 42730 }, { "epoch": 1.37, "learning_rate": 1.822136092308959e-05, "loss": 0.6534, "step": 42735 }, { "epoch": 1.37, "learning_rate": 1.8220724967647907e-05, "loss": 0.6512, "step": 42740 }, { "epoch": 1.37, "learning_rate": 1.8220088909635176e-05, "loss": 0.6446, "step": 42745 }, { "epoch": 1.37, "learning_rate": 1.8219452749059332e-05, "loss": 0.6479, "step": 42750 }, { "epoch": 1.37, "learning_rate": 1.821881648592831e-05, "loss": 0.6507, "step": 42755 }, { "epoch": 1.37, "learning_rate": 1.8218180120250055e-05, "loss": 0.6537, "step": 42760 }, { "epoch": 1.37, "learning_rate": 1.82175436520325e-05, "loss": 0.6501, "step": 42765 }, { "epoch": 1.37, "learning_rate": 1.8216907081283586e-05, "loss": 0.6558, "step": 42770 }, { "epoch": 1.37, "learning_rate": 1.821627040801126e-05, "loss": 0.6469, "step": 42775 }, { "epoch": 1.37, "learning_rate": 1.8215633632223463e-05, "loss": 0.6478, "step": 42780 }, { "epoch": 1.37, "learning_rate": 1.8214996753928143e-05, "loss": 0.6454, "step": 42785 }, { "epoch": 1.37, "learning_rate": 1.8214359773133243e-05, "loss": 0.6482, "step": 42790 }, { "epoch": 1.37, "learning_rate": 1.8213722689846714e-05, "loss": 0.6512, "step": 42795 }, { "epoch": 1.37, "learning_rate": 1.82130855040765e-05, "loss": 0.6464, "step": 42800 }, { "epoch": 1.37, "learning_rate": 1.8212448215830558e-05, "loss": 0.6563, "step": 42805 }, { "epoch": 1.37, "learning_rate": 1.8211810825116835e-05, "loss": 0.6604, "step": 42810 }, { "epoch": 1.37, "learning_rate": 1.8211173331943287e-05, "loss": 0.6454, "step": 42815 }, { "epoch": 1.37, "learning_rate": 1.8210535736317864e-05, "loss": 0.6492, "step": 42820 }, { "epoch": 1.37, "learning_rate": 1.8209898038248523e-05, "loss": 0.6471, "step": 42825 }, { "epoch": 1.37, "learning_rate": 1.820926023774322e-05, "loss": 0.6423, "step": 42830 }, { "epoch": 1.37, "learning_rate": 1.8208622334809915e-05, "loss": 0.6492, "step": 42835 }, { "epoch": 1.37, "learning_rate": 1.8207984329456567e-05, "loss": 0.6541, "step": 42840 }, { "epoch": 1.37, "learning_rate": 1.8207346221691135e-05, "loss": 0.656, "step": 42845 }, { "epoch": 1.37, "learning_rate": 1.820670801152158e-05, "loss": 0.6427, "step": 42850 }, { "epoch": 1.37, "learning_rate": 1.8206069698955867e-05, "loss": 0.6488, "step": 42855 }, { "epoch": 1.37, "learning_rate": 1.8205431284001963e-05, "loss": 0.6444, "step": 42860 }, { "epoch": 1.37, "learning_rate": 1.8204792766667827e-05, "loss": 0.6404, "step": 42865 }, { "epoch": 1.37, "learning_rate": 1.8204154146961428e-05, "loss": 0.645, "step": 42870 }, { "epoch": 1.37, "learning_rate": 1.8203515424890738e-05, "loss": 0.6437, "step": 42875 }, { "epoch": 1.37, "learning_rate": 1.8202876600463722e-05, "loss": 0.6467, "step": 42880 }, { "epoch": 1.37, "learning_rate": 1.8202237673688354e-05, "loss": 0.6395, "step": 42885 }, { "epoch": 1.37, "learning_rate": 1.8201598644572605e-05, "loss": 0.6433, "step": 42890 }, { "epoch": 1.37, "learning_rate": 1.8200959513124443e-05, "loss": 0.6569, "step": 42895 }, { "epoch": 1.37, "learning_rate": 1.820032027935185e-05, "loss": 0.6472, "step": 42900 }, { "epoch": 1.37, "learning_rate": 1.8199680943262802e-05, "loss": 0.643, "step": 42905 }, { "epoch": 1.37, "learning_rate": 1.8199041504865266e-05, "loss": 0.6487, "step": 42910 }, { "epoch": 1.37, "learning_rate": 1.819840196416723e-05, "loss": 0.6457, "step": 42915 }, { "epoch": 1.37, "learning_rate": 1.8197762321176675e-05, "loss": 0.6383, "step": 42920 }, { "epoch": 1.37, "learning_rate": 1.8197122575901576e-05, "loss": 0.6505, "step": 42925 }, { "epoch": 1.37, "learning_rate": 1.8196482728349915e-05, "loss": 0.6445, "step": 42930 }, { "epoch": 1.37, "learning_rate": 1.8195842778529677e-05, "loss": 0.6656, "step": 42935 }, { "epoch": 1.37, "learning_rate": 1.819520272644885e-05, "loss": 0.6391, "step": 42940 }, { "epoch": 1.37, "learning_rate": 1.8194562572115417e-05, "loss": 0.6517, "step": 42945 }, { "epoch": 1.37, "learning_rate": 1.8193922315537363e-05, "loss": 0.6463, "step": 42950 }, { "epoch": 1.37, "learning_rate": 1.8193281956722683e-05, "loss": 0.6423, "step": 42955 }, { "epoch": 1.37, "learning_rate": 1.8192641495679362e-05, "loss": 0.6584, "step": 42960 }, { "epoch": 1.37, "learning_rate": 1.819200093241539e-05, "loss": 0.6595, "step": 42965 }, { "epoch": 1.38, "learning_rate": 1.8191360266938765e-05, "loss": 0.6437, "step": 42970 }, { "epoch": 1.38, "learning_rate": 1.8190719499257472e-05, "loss": 0.6552, "step": 42975 }, { "epoch": 1.38, "learning_rate": 1.8190078629379514e-05, "loss": 0.6598, "step": 42980 }, { "epoch": 1.38, "learning_rate": 1.8189437657312885e-05, "loss": 0.6431, "step": 42985 }, { "epoch": 1.38, "learning_rate": 1.8188796583065582e-05, "loss": 0.6579, "step": 42990 }, { "epoch": 1.38, "learning_rate": 1.8188155406645603e-05, "loss": 0.6521, "step": 42995 }, { "epoch": 1.38, "learning_rate": 1.8187514128060946e-05, "loss": 0.6576, "step": 43000 }, { "epoch": 1.38, "learning_rate": 1.818687274731962e-05, "loss": 0.6567, "step": 43005 }, { "epoch": 1.38, "learning_rate": 1.8186231264429615e-05, "loss": 0.6557, "step": 43010 }, { "epoch": 1.38, "learning_rate": 1.8185589679398948e-05, "loss": 0.659, "step": 43015 }, { "epoch": 1.38, "learning_rate": 1.818494799223562e-05, "loss": 0.6506, "step": 43020 }, { "epoch": 1.38, "learning_rate": 1.8184306202947635e-05, "loss": 0.6515, "step": 43025 }, { "epoch": 1.38, "learning_rate": 1.8183664311542995e-05, "loss": 0.6451, "step": 43030 }, { "epoch": 1.38, "learning_rate": 1.818302231802972e-05, "loss": 0.6421, "step": 43035 }, { "epoch": 1.38, "learning_rate": 1.818238022241582e-05, "loss": 0.6397, "step": 43040 }, { "epoch": 1.38, "learning_rate": 1.81817380247093e-05, "loss": 0.651, "step": 43045 }, { "epoch": 1.38, "learning_rate": 1.8181095724918173e-05, "loss": 0.6611, "step": 43050 }, { "epoch": 1.38, "learning_rate": 1.8180453323050456e-05, "loss": 0.6377, "step": 43055 }, { "epoch": 1.38, "learning_rate": 1.8179810819114164e-05, "loss": 0.6372, "step": 43060 }, { "epoch": 1.38, "learning_rate": 1.8179168213117314e-05, "loss": 0.6574, "step": 43065 }, { "epoch": 1.38, "learning_rate": 1.8178525505067922e-05, "loss": 0.6537, "step": 43070 }, { "epoch": 1.38, "learning_rate": 1.8177882694974008e-05, "loss": 0.6357, "step": 43075 }, { "epoch": 1.38, "learning_rate": 1.817723978284359e-05, "loss": 0.6529, "step": 43080 }, { "epoch": 1.38, "learning_rate": 1.8176596768684697e-05, "loss": 0.6451, "step": 43085 }, { "epoch": 1.38, "learning_rate": 1.8175953652505344e-05, "loss": 0.6402, "step": 43090 }, { "epoch": 1.38, "learning_rate": 1.8175310434313558e-05, "loss": 0.6535, "step": 43095 }, { "epoch": 1.38, "learning_rate": 1.8174667114117368e-05, "loss": 0.6661, "step": 43100 }, { "epoch": 1.38, "learning_rate": 1.8174023691924794e-05, "loss": 0.6456, "step": 43105 }, { "epoch": 1.38, "learning_rate": 1.8173380167743874e-05, "loss": 0.6496, "step": 43110 }, { "epoch": 1.38, "learning_rate": 1.8172736541582626e-05, "loss": 0.6468, "step": 43115 }, { "epoch": 1.38, "learning_rate": 1.8172092813449083e-05, "loss": 0.6541, "step": 43120 }, { "epoch": 1.38, "learning_rate": 1.8171448983351284e-05, "loss": 0.65, "step": 43125 }, { "epoch": 1.38, "learning_rate": 1.817080505129726e-05, "loss": 0.637, "step": 43130 }, { "epoch": 1.38, "learning_rate": 1.817016101729504e-05, "loss": 0.6544, "step": 43135 }, { "epoch": 1.38, "learning_rate": 1.8169516881352666e-05, "loss": 0.6615, "step": 43140 }, { "epoch": 1.38, "learning_rate": 1.8168872643478172e-05, "loss": 0.6502, "step": 43145 }, { "epoch": 1.38, "learning_rate": 1.816822830367959e-05, "loss": 0.6516, "step": 43150 }, { "epoch": 1.38, "learning_rate": 1.8167583861964968e-05, "loss": 0.6549, "step": 43155 }, { "epoch": 1.38, "learning_rate": 1.8166939318342348e-05, "loss": 0.6557, "step": 43160 }, { "epoch": 1.38, "learning_rate": 1.8166294672819767e-05, "loss": 0.6415, "step": 43165 }, { "epoch": 1.38, "learning_rate": 1.816564992540527e-05, "loss": 0.649, "step": 43170 }, { "epoch": 1.38, "learning_rate": 1.81650050761069e-05, "loss": 0.662, "step": 43175 }, { "epoch": 1.38, "learning_rate": 1.8164360124932703e-05, "loss": 0.6398, "step": 43180 }, { "epoch": 1.38, "learning_rate": 1.816371507189073e-05, "loss": 0.667, "step": 43185 }, { "epoch": 1.38, "learning_rate": 1.8163069916989027e-05, "loss": 0.6607, "step": 43190 }, { "epoch": 1.38, "learning_rate": 1.8162424660235643e-05, "loss": 0.6438, "step": 43195 }, { "epoch": 1.38, "learning_rate": 1.8161779301638626e-05, "loss": 0.6498, "step": 43200 }, { "epoch": 1.38, "learning_rate": 1.8161133841206036e-05, "loss": 0.6497, "step": 43205 }, { "epoch": 1.38, "learning_rate": 1.816048827894592e-05, "loss": 0.6609, "step": 43210 }, { "epoch": 1.38, "learning_rate": 1.8159842614866336e-05, "loss": 0.6341, "step": 43215 }, { "epoch": 1.38, "learning_rate": 1.815919684897534e-05, "loss": 0.6562, "step": 43220 }, { "epoch": 1.38, "learning_rate": 1.8158550981280987e-05, "loss": 0.6592, "step": 43225 }, { "epoch": 1.38, "learning_rate": 1.8157905011791337e-05, "loss": 0.639, "step": 43230 }, { "epoch": 1.38, "learning_rate": 1.815725894051445e-05, "loss": 0.6541, "step": 43235 }, { "epoch": 1.38, "learning_rate": 1.8156612767458387e-05, "loss": 0.6531, "step": 43240 }, { "epoch": 1.38, "learning_rate": 1.815596649263121e-05, "loss": 0.6502, "step": 43245 }, { "epoch": 1.38, "learning_rate": 1.8155320116040983e-05, "loss": 0.6639, "step": 43250 }, { "epoch": 1.38, "learning_rate": 1.815467363769577e-05, "loss": 0.6449, "step": 43255 }, { "epoch": 1.38, "learning_rate": 1.8154027057603638e-05, "loss": 0.654, "step": 43260 }, { "epoch": 1.38, "learning_rate": 1.8153380375772655e-05, "loss": 0.6675, "step": 43265 }, { "epoch": 1.38, "learning_rate": 1.8152733592210888e-05, "loss": 0.6603, "step": 43270 }, { "epoch": 1.38, "learning_rate": 1.815208670692641e-05, "loss": 0.6419, "step": 43275 }, { "epoch": 1.38, "learning_rate": 1.8151439719927292e-05, "loss": 0.6589, "step": 43280 }, { "epoch": 1.39, "learning_rate": 1.81507926312216e-05, "loss": 0.641, "step": 43285 }, { "epoch": 1.39, "learning_rate": 1.8150145440817417e-05, "loss": 0.6537, "step": 43290 }, { "epoch": 1.39, "learning_rate": 1.814949814872281e-05, "loss": 0.6453, "step": 43295 }, { "epoch": 1.39, "learning_rate": 1.8148850754945865e-05, "loss": 0.6528, "step": 43300 }, { "epoch": 1.39, "learning_rate": 1.814820325949465e-05, "loss": 0.6365, "step": 43305 }, { "epoch": 1.39, "learning_rate": 1.8147555662377246e-05, "loss": 0.6559, "step": 43310 }, { "epoch": 1.39, "learning_rate": 1.814690796360174e-05, "loss": 0.6674, "step": 43315 }, { "epoch": 1.39, "learning_rate": 1.8146260163176205e-05, "loss": 0.6567, "step": 43320 }, { "epoch": 1.39, "learning_rate": 1.814561226110873e-05, "loss": 0.6489, "step": 43325 }, { "epoch": 1.39, "learning_rate": 1.8144964257407388e-05, "loss": 0.646, "step": 43330 }, { "epoch": 1.39, "learning_rate": 1.814431615208028e-05, "loss": 0.6526, "step": 43335 }, { "epoch": 1.39, "learning_rate": 1.814366794513548e-05, "loss": 0.6439, "step": 43340 }, { "epoch": 1.39, "learning_rate": 1.8143019636581084e-05, "loss": 0.6577, "step": 43345 }, { "epoch": 1.39, "learning_rate": 1.8142371226425176e-05, "loss": 0.6414, "step": 43350 }, { "epoch": 1.39, "learning_rate": 1.8141722714675846e-05, "loss": 0.6568, "step": 43355 }, { "epoch": 1.39, "learning_rate": 1.814107410134119e-05, "loss": 0.6413, "step": 43360 }, { "epoch": 1.39, "learning_rate": 1.8140425386429297e-05, "loss": 0.633, "step": 43365 }, { "epoch": 1.39, "learning_rate": 1.8139776569948263e-05, "loss": 0.6467, "step": 43370 }, { "epoch": 1.39, "learning_rate": 1.8139127651906183e-05, "loss": 0.6438, "step": 43375 }, { "epoch": 1.39, "learning_rate": 1.813847863231115e-05, "loss": 0.6557, "step": 43380 }, { "epoch": 1.39, "learning_rate": 1.813782951117127e-05, "loss": 0.6499, "step": 43385 }, { "epoch": 1.39, "learning_rate": 1.8137180288494636e-05, "loss": 0.6549, "step": 43390 }, { "epoch": 1.39, "learning_rate": 1.8136530964289348e-05, "loss": 0.6389, "step": 43395 }, { "epoch": 1.39, "learning_rate": 1.813588153856351e-05, "loss": 0.6541, "step": 43400 }, { "epoch": 1.39, "learning_rate": 1.8135232011325223e-05, "loss": 0.653, "step": 43405 }, { "epoch": 1.39, "learning_rate": 1.8134582382582595e-05, "loss": 0.6313, "step": 43410 }, { "epoch": 1.39, "learning_rate": 1.813393265234373e-05, "loss": 0.6458, "step": 43415 }, { "epoch": 1.39, "learning_rate": 1.813328282061673e-05, "loss": 0.641, "step": 43420 }, { "epoch": 1.39, "learning_rate": 1.8132632887409708e-05, "loss": 0.6505, "step": 43425 }, { "epoch": 1.39, "learning_rate": 1.8131982852730775e-05, "loss": 0.6438, "step": 43430 }, { "epoch": 1.39, "learning_rate": 1.8131332716588038e-05, "loss": 0.6434, "step": 43435 }, { "epoch": 1.39, "learning_rate": 1.813068247898961e-05, "loss": 0.6562, "step": 43440 }, { "epoch": 1.39, "learning_rate": 1.8130032139943604e-05, "loss": 0.6455, "step": 43445 }, { "epoch": 1.39, "learning_rate": 1.812938169945813e-05, "loss": 0.6521, "step": 43450 }, { "epoch": 1.39, "learning_rate": 1.812873115754131e-05, "loss": 0.6446, "step": 43455 }, { "epoch": 1.39, "learning_rate": 1.812808051420126e-05, "loss": 0.6483, "step": 43460 }, { "epoch": 1.39, "learning_rate": 1.81274297694461e-05, "loss": 0.654, "step": 43465 }, { "epoch": 1.39, "learning_rate": 1.8126778923283938e-05, "loss": 0.6418, "step": 43470 }, { "epoch": 1.39, "learning_rate": 1.812612797572291e-05, "loss": 0.6354, "step": 43475 }, { "epoch": 1.39, "learning_rate": 1.8125476926771127e-05, "loss": 0.6569, "step": 43480 }, { "epoch": 1.39, "learning_rate": 1.812482577643672e-05, "loss": 0.6535, "step": 43485 }, { "epoch": 1.39, "learning_rate": 1.8124174524727808e-05, "loss": 0.6525, "step": 43490 }, { "epoch": 1.39, "learning_rate": 1.8123523171652514e-05, "loss": 0.6485, "step": 43495 }, { "epoch": 1.39, "learning_rate": 1.812287171721897e-05, "loss": 0.6311, "step": 43500 }, { "epoch": 1.39, "learning_rate": 1.812222016143531e-05, "loss": 0.6469, "step": 43505 }, { "epoch": 1.39, "learning_rate": 1.8121568504309656e-05, "loss": 0.6466, "step": 43510 }, { "epoch": 1.39, "learning_rate": 1.8120916745850134e-05, "loss": 0.6543, "step": 43515 }, { "epoch": 1.39, "learning_rate": 1.8120264886064888e-05, "loss": 0.6395, "step": 43520 }, { "epoch": 1.39, "learning_rate": 1.8119612924962043e-05, "loss": 0.6619, "step": 43525 }, { "epoch": 1.39, "learning_rate": 1.8118960862549735e-05, "loss": 0.6512, "step": 43530 }, { "epoch": 1.39, "learning_rate": 1.81183086988361e-05, "loss": 0.6498, "step": 43535 }, { "epoch": 1.39, "learning_rate": 1.8117656433829283e-05, "loss": 0.648, "step": 43540 }, { "epoch": 1.39, "learning_rate": 1.811700406753741e-05, "loss": 0.6464, "step": 43545 }, { "epoch": 1.39, "learning_rate": 1.8116351599968623e-05, "loss": 0.6423, "step": 43550 }, { "epoch": 1.39, "learning_rate": 1.8115699031131074e-05, "loss": 0.6596, "step": 43555 }, { "epoch": 1.39, "learning_rate": 1.811504636103289e-05, "loss": 0.6514, "step": 43560 }, { "epoch": 1.39, "learning_rate": 1.8114393589682225e-05, "loss": 0.6415, "step": 43565 }, { "epoch": 1.39, "learning_rate": 1.811374071708722e-05, "loss": 0.6452, "step": 43570 }, { "epoch": 1.39, "learning_rate": 1.8113087743256025e-05, "loss": 0.6536, "step": 43575 }, { "epoch": 1.39, "learning_rate": 1.811243466819678e-05, "loss": 0.6413, "step": 43580 }, { "epoch": 1.39, "learning_rate": 1.8111781491917636e-05, "loss": 0.654, "step": 43585 }, { "epoch": 1.39, "learning_rate": 1.8111128214426743e-05, "loss": 0.6465, "step": 43590 }, { "epoch": 1.4, "learning_rate": 1.8110474835732255e-05, "loss": 0.6534, "step": 43595 }, { "epoch": 1.4, "learning_rate": 1.810982135584232e-05, "loss": 0.6508, "step": 43600 }, { "epoch": 1.4, "learning_rate": 1.8109167774765098e-05, "loss": 0.646, "step": 43605 }, { "epoch": 1.4, "learning_rate": 1.8108514092508737e-05, "loss": 0.6524, "step": 43610 }, { "epoch": 1.4, "learning_rate": 1.8107860309081395e-05, "loss": 0.6404, "step": 43615 }, { "epoch": 1.4, "learning_rate": 1.8107206424491227e-05, "loss": 0.6411, "step": 43620 }, { "epoch": 1.4, "learning_rate": 1.81065524387464e-05, "loss": 0.6451, "step": 43625 }, { "epoch": 1.4, "learning_rate": 1.810589835185507e-05, "loss": 0.6511, "step": 43630 }, { "epoch": 1.4, "learning_rate": 1.8105244163825392e-05, "loss": 0.6429, "step": 43635 }, { "epoch": 1.4, "learning_rate": 1.8104589874665533e-05, "loss": 0.6466, "step": 43640 }, { "epoch": 1.4, "learning_rate": 1.810393548438366e-05, "loss": 0.6486, "step": 43645 }, { "epoch": 1.4, "learning_rate": 1.810328099298793e-05, "loss": 0.6502, "step": 43650 }, { "epoch": 1.4, "learning_rate": 1.8102626400486515e-05, "loss": 0.6511, "step": 43655 }, { "epoch": 1.4, "learning_rate": 1.8101971706887583e-05, "loss": 0.6513, "step": 43660 }, { "epoch": 1.4, "learning_rate": 1.8101316912199298e-05, "loss": 0.6509, "step": 43665 }, { "epoch": 1.4, "learning_rate": 1.8100662016429834e-05, "loss": 0.6475, "step": 43670 }, { "epoch": 1.4, "learning_rate": 1.810000701958736e-05, "loss": 0.6299, "step": 43675 }, { "epoch": 1.4, "learning_rate": 1.8099351921680054e-05, "loss": 0.6388, "step": 43680 }, { "epoch": 1.4, "learning_rate": 1.809869672271608e-05, "loss": 0.6499, "step": 43685 }, { "epoch": 1.4, "learning_rate": 1.809804142270362e-05, "loss": 0.6428, "step": 43690 }, { "epoch": 1.4, "learning_rate": 1.809738602165085e-05, "loss": 0.6522, "step": 43695 }, { "epoch": 1.4, "learning_rate": 1.8096730519565945e-05, "loss": 0.6416, "step": 43700 }, { "epoch": 1.4, "learning_rate": 1.8096074916457086e-05, "loss": 0.6422, "step": 43705 }, { "epoch": 1.4, "learning_rate": 1.809541921233245e-05, "loss": 0.6458, "step": 43710 }, { "epoch": 1.4, "learning_rate": 1.8094763407200217e-05, "loss": 0.6437, "step": 43715 }, { "epoch": 1.4, "learning_rate": 1.809410750106858e-05, "loss": 0.6462, "step": 43720 }, { "epoch": 1.4, "learning_rate": 1.809345149394571e-05, "loss": 0.6328, "step": 43725 }, { "epoch": 1.4, "learning_rate": 1.8092795385839798e-05, "loss": 0.6448, "step": 43730 }, { "epoch": 1.4, "learning_rate": 1.809213917675903e-05, "loss": 0.6501, "step": 43735 }, { "epoch": 1.4, "learning_rate": 1.8091482866711595e-05, "loss": 0.6512, "step": 43740 }, { "epoch": 1.4, "learning_rate": 1.8090826455705678e-05, "loss": 0.6456, "step": 43745 }, { "epoch": 1.4, "learning_rate": 1.8090169943749477e-05, "loss": 0.6454, "step": 43750 }, { "epoch": 1.4, "learning_rate": 1.8089513330851173e-05, "loss": 0.6369, "step": 43755 }, { "epoch": 1.4, "learning_rate": 1.8088856617018967e-05, "loss": 0.6393, "step": 43760 }, { "epoch": 1.4, "learning_rate": 1.8088199802261047e-05, "loss": 0.6507, "step": 43765 }, { "epoch": 1.4, "learning_rate": 1.8087542886585612e-05, "loss": 0.6518, "step": 43770 }, { "epoch": 1.4, "learning_rate": 1.8086885870000856e-05, "loss": 0.6491, "step": 43775 }, { "epoch": 1.4, "learning_rate": 1.8086228752514976e-05, "loss": 0.6445, "step": 43780 }, { "epoch": 1.4, "learning_rate": 1.8085571534136174e-05, "loss": 0.6479, "step": 43785 }, { "epoch": 1.4, "learning_rate": 1.808491421487265e-05, "loss": 0.6458, "step": 43790 }, { "epoch": 1.4, "learning_rate": 1.8084256794732605e-05, "loss": 0.6464, "step": 43795 }, { "epoch": 1.4, "learning_rate": 1.8083599273724238e-05, "loss": 0.6549, "step": 43800 }, { "epoch": 1.4, "learning_rate": 1.8082941651855758e-05, "loss": 0.6349, "step": 43805 }, { "epoch": 1.4, "learning_rate": 1.8082283929135368e-05, "loss": 0.6369, "step": 43810 }, { "epoch": 1.4, "learning_rate": 1.8081626105571274e-05, "loss": 0.6389, "step": 43815 }, { "epoch": 1.4, "learning_rate": 1.808096818117169e-05, "loss": 0.6639, "step": 43820 }, { "epoch": 1.4, "learning_rate": 1.808031015594481e-05, "loss": 0.6439, "step": 43825 }, { "epoch": 1.4, "learning_rate": 1.807965202989886e-05, "loss": 0.649, "step": 43830 }, { "epoch": 1.4, "learning_rate": 1.8078993803042046e-05, "loss": 0.6426, "step": 43835 }, { "epoch": 1.4, "learning_rate": 1.8078335475382576e-05, "loss": 0.6395, "step": 43840 }, { "epoch": 1.4, "learning_rate": 1.807767704692867e-05, "loss": 0.6499, "step": 43845 }, { "epoch": 1.4, "learning_rate": 1.8077018517688542e-05, "loss": 0.6623, "step": 43850 }, { "epoch": 1.4, "learning_rate": 1.8076359887670406e-05, "loss": 0.6509, "step": 43855 }, { "epoch": 1.4, "learning_rate": 1.8075701156882485e-05, "loss": 0.6486, "step": 43860 }, { "epoch": 1.4, "learning_rate": 1.8075042325332992e-05, "loss": 0.6485, "step": 43865 }, { "epoch": 1.4, "learning_rate": 1.8074383393030153e-05, "loss": 0.6533, "step": 43870 }, { "epoch": 1.4, "learning_rate": 1.8073724359982184e-05, "loss": 0.6464, "step": 43875 }, { "epoch": 1.4, "learning_rate": 1.8073065226197312e-05, "loss": 0.6523, "step": 43880 }, { "epoch": 1.4, "learning_rate": 1.8072405991683762e-05, "loss": 0.6458, "step": 43885 }, { "epoch": 1.4, "learning_rate": 1.8071746656449752e-05, "loss": 0.6465, "step": 43890 }, { "epoch": 1.4, "learning_rate": 1.8071087220503515e-05, "loss": 0.6492, "step": 43895 }, { "epoch": 1.4, "learning_rate": 1.807042768385328e-05, "loss": 0.6418, "step": 43900 }, { "epoch": 1.4, "learning_rate": 1.8069768046507272e-05, "loss": 0.6479, "step": 43905 }, { "epoch": 1.41, "learning_rate": 1.8069108308473724e-05, "loss": 0.6402, "step": 43910 }, { "epoch": 1.41, "learning_rate": 1.8068448469760867e-05, "loss": 0.6375, "step": 43915 }, { "epoch": 1.41, "learning_rate": 1.806778853037693e-05, "loss": 0.6465, "step": 43920 }, { "epoch": 1.41, "learning_rate": 1.8067128490330153e-05, "loss": 0.6592, "step": 43925 }, { "epoch": 1.41, "learning_rate": 1.8066468349628773e-05, "loss": 0.6468, "step": 43930 }, { "epoch": 1.41, "learning_rate": 1.8065808108281017e-05, "loss": 0.64, "step": 43935 }, { "epoch": 1.41, "learning_rate": 1.806514776629513e-05, "loss": 0.6548, "step": 43940 }, { "epoch": 1.41, "learning_rate": 1.8064487323679354e-05, "loss": 0.6551, "step": 43945 }, { "epoch": 1.41, "learning_rate": 1.806382678044192e-05, "loss": 0.6454, "step": 43950 }, { "epoch": 1.41, "learning_rate": 1.8063166136591077e-05, "loss": 0.6451, "step": 43955 }, { "epoch": 1.41, "learning_rate": 1.8062505392135067e-05, "loss": 0.6558, "step": 43960 }, { "epoch": 1.41, "learning_rate": 1.806184454708213e-05, "loss": 0.6532, "step": 43965 }, { "epoch": 1.41, "learning_rate": 1.8061183601440517e-05, "loss": 0.6504, "step": 43970 }, { "epoch": 1.41, "learning_rate": 1.806052255521847e-05, "loss": 0.6409, "step": 43975 }, { "epoch": 1.41, "learning_rate": 1.8059861408424244e-05, "loss": 0.6551, "step": 43980 }, { "epoch": 1.41, "learning_rate": 1.805920016106608e-05, "loss": 0.6451, "step": 43985 }, { "epoch": 1.41, "learning_rate": 1.8058538813152233e-05, "loss": 0.6467, "step": 43990 }, { "epoch": 1.41, "learning_rate": 1.8057877364690953e-05, "loss": 0.6482, "step": 43995 }, { "epoch": 1.41, "learning_rate": 1.8057215815690494e-05, "loss": 0.6496, "step": 44000 }, { "epoch": 1.41, "learning_rate": 1.805655416615911e-05, "loss": 0.6528, "step": 44005 }, { "epoch": 1.41, "learning_rate": 1.8055892416105053e-05, "loss": 0.6422, "step": 44010 }, { "epoch": 1.41, "learning_rate": 1.805523056553659e-05, "loss": 0.6535, "step": 44015 }, { "epoch": 1.41, "learning_rate": 1.8054568614461966e-05, "loss": 0.6413, "step": 44020 }, { "epoch": 1.41, "learning_rate": 1.805390656288945e-05, "loss": 0.6465, "step": 44025 }, { "epoch": 1.41, "learning_rate": 1.80532444108273e-05, "loss": 0.6427, "step": 44030 }, { "epoch": 1.41, "learning_rate": 1.8052582158283768e-05, "loss": 0.6514, "step": 44035 }, { "epoch": 1.41, "learning_rate": 1.8051919805267136e-05, "loss": 0.6484, "step": 44040 }, { "epoch": 1.41, "learning_rate": 1.805125735178565e-05, "loss": 0.65, "step": 44045 }, { "epoch": 1.41, "learning_rate": 1.8050594797847587e-05, "loss": 0.6445, "step": 44050 }, { "epoch": 1.41, "learning_rate": 1.804993214346121e-05, "loss": 0.651, "step": 44055 }, { "epoch": 1.41, "learning_rate": 1.8049269388634788e-05, "loss": 0.6469, "step": 44060 }, { "epoch": 1.41, "learning_rate": 1.8048606533376588e-05, "loss": 0.6587, "step": 44065 }, { "epoch": 1.41, "learning_rate": 1.8047943577694883e-05, "loss": 0.6443, "step": 44070 }, { "epoch": 1.41, "learning_rate": 1.8047280521597943e-05, "loss": 0.6372, "step": 44075 }, { "epoch": 1.41, "learning_rate": 1.804661736509404e-05, "loss": 0.6643, "step": 44080 }, { "epoch": 1.41, "learning_rate": 1.8045954108191455e-05, "loss": 0.6425, "step": 44085 }, { "epoch": 1.41, "learning_rate": 1.8045290750898456e-05, "loss": 0.6488, "step": 44090 }, { "epoch": 1.41, "learning_rate": 1.8044627293223322e-05, "loss": 0.644, "step": 44095 }, { "epoch": 1.41, "learning_rate": 1.804396373517433e-05, "loss": 0.648, "step": 44100 }, { "epoch": 1.41, "learning_rate": 1.8043300076759763e-05, "loss": 0.6493, "step": 44105 }, { "epoch": 1.41, "learning_rate": 1.8042636317987896e-05, "loss": 0.6481, "step": 44110 }, { "epoch": 1.41, "learning_rate": 1.804197245886702e-05, "loss": 0.6413, "step": 44115 }, { "epoch": 1.41, "learning_rate": 1.8041308499405406e-05, "loss": 0.6577, "step": 44120 }, { "epoch": 1.41, "learning_rate": 1.8040644439611348e-05, "loss": 0.6438, "step": 44125 }, { "epoch": 1.41, "learning_rate": 1.803998027949313e-05, "loss": 0.6366, "step": 44130 }, { "epoch": 1.41, "learning_rate": 1.8039316019059033e-05, "loss": 0.6444, "step": 44135 }, { "epoch": 1.41, "learning_rate": 1.803865165831735e-05, "loss": 0.6447, "step": 44140 }, { "epoch": 1.41, "learning_rate": 1.803798719727637e-05, "loss": 0.6415, "step": 44145 }, { "epoch": 1.41, "learning_rate": 1.8037322635944383e-05, "loss": 0.6519, "step": 44150 }, { "epoch": 1.41, "learning_rate": 1.803665797432968e-05, "loss": 0.6422, "step": 44155 }, { "epoch": 1.41, "learning_rate": 1.803599321244055e-05, "loss": 0.6415, "step": 44160 }, { "epoch": 1.41, "learning_rate": 1.8035328350285298e-05, "loss": 0.6428, "step": 44165 }, { "epoch": 1.41, "learning_rate": 1.8034663387872213e-05, "loss": 0.6494, "step": 44170 }, { "epoch": 1.41, "learning_rate": 1.803399832520959e-05, "loss": 0.6573, "step": 44175 }, { "epoch": 1.41, "learning_rate": 1.8033333162305732e-05, "loss": 0.6418, "step": 44180 }, { "epoch": 1.41, "learning_rate": 1.8032667899168937e-05, "loss": 0.656, "step": 44185 }, { "epoch": 1.41, "learning_rate": 1.80320025358075e-05, "loss": 0.6416, "step": 44190 }, { "epoch": 1.41, "learning_rate": 1.803133707222973e-05, "loss": 0.646, "step": 44195 }, { "epoch": 1.41, "learning_rate": 1.8030671508443928e-05, "loss": 0.6497, "step": 44200 }, { "epoch": 1.41, "learning_rate": 1.80300058444584e-05, "loss": 0.6421, "step": 44205 }, { "epoch": 1.41, "learning_rate": 1.802934008028144e-05, "loss": 0.6443, "step": 44210 }, { "epoch": 1.41, "learning_rate": 1.8028674215921375e-05, "loss": 0.6491, "step": 44215 }, { "epoch": 1.42, "learning_rate": 1.8028008251386493e-05, "loss": 0.6479, "step": 44220 }, { "epoch": 1.42, "learning_rate": 1.8027342186685114e-05, "loss": 0.6553, "step": 44225 }, { "epoch": 1.42, "learning_rate": 1.802667602182555e-05, "loss": 0.6538, "step": 44230 }, { "epoch": 1.42, "learning_rate": 1.8026009756816113e-05, "loss": 0.638, "step": 44235 }, { "epoch": 1.42, "learning_rate": 1.8025343391665107e-05, "loss": 0.6297, "step": 44240 }, { "epoch": 1.42, "learning_rate": 1.8024676926380854e-05, "loss": 0.6542, "step": 44245 }, { "epoch": 1.42, "learning_rate": 1.802401036097167e-05, "loss": 0.6517, "step": 44250 }, { "epoch": 1.42, "learning_rate": 1.8023343695445863e-05, "loss": 0.6556, "step": 44255 }, { "epoch": 1.42, "learning_rate": 1.8022676929811763e-05, "loss": 0.6416, "step": 44260 }, { "epoch": 1.42, "learning_rate": 1.8022010064077685e-05, "loss": 0.642, "step": 44265 }, { "epoch": 1.42, "learning_rate": 1.8021343098251943e-05, "loss": 0.6438, "step": 44270 }, { "epoch": 1.42, "learning_rate": 1.802067603234287e-05, "loss": 0.649, "step": 44275 }, { "epoch": 1.42, "learning_rate": 1.8020008866358782e-05, "loss": 0.6419, "step": 44280 }, { "epoch": 1.42, "learning_rate": 1.8019341600308005e-05, "loss": 0.6557, "step": 44285 }, { "epoch": 1.42, "learning_rate": 1.801867423419886e-05, "loss": 0.6468, "step": 44290 }, { "epoch": 1.42, "learning_rate": 1.8018006768039684e-05, "loss": 0.6479, "step": 44295 }, { "epoch": 1.42, "learning_rate": 1.8017339201838798e-05, "loss": 0.6437, "step": 44300 }, { "epoch": 1.42, "learning_rate": 1.801667153560453e-05, "loss": 0.644, "step": 44305 }, { "epoch": 1.42, "learning_rate": 1.8016003769345216e-05, "loss": 0.6377, "step": 44310 }, { "epoch": 1.42, "learning_rate": 1.8015335903069184e-05, "loss": 0.6488, "step": 44315 }, { "epoch": 1.42, "learning_rate": 1.8014667936784764e-05, "loss": 0.6441, "step": 44320 }, { "epoch": 1.42, "learning_rate": 1.8013999870500298e-05, "loss": 0.6289, "step": 44325 }, { "epoch": 1.42, "learning_rate": 1.8013331704224118e-05, "loss": 0.6422, "step": 44330 }, { "epoch": 1.42, "learning_rate": 1.801266343796456e-05, "loss": 0.641, "step": 44335 }, { "epoch": 1.42, "learning_rate": 1.801199507172996e-05, "loss": 0.6434, "step": 44340 }, { "epoch": 1.42, "learning_rate": 1.8011326605528664e-05, "loss": 0.6464, "step": 44345 }, { "epoch": 1.42, "learning_rate": 1.8010658039369006e-05, "loss": 0.6435, "step": 44350 }, { "epoch": 1.42, "learning_rate": 1.8009989373259334e-05, "loss": 0.6427, "step": 44355 }, { "epoch": 1.42, "learning_rate": 1.8009320607207984e-05, "loss": 0.6376, "step": 44360 }, { "epoch": 1.42, "learning_rate": 1.8008651741223304e-05, "loss": 0.6435, "step": 44365 }, { "epoch": 1.42, "learning_rate": 1.800798277531364e-05, "loss": 0.6314, "step": 44370 }, { "epoch": 1.42, "learning_rate": 1.8007313709487334e-05, "loss": 0.6537, "step": 44375 }, { "epoch": 1.42, "learning_rate": 1.800664454375274e-05, "loss": 0.6524, "step": 44380 }, { "epoch": 1.42, "learning_rate": 1.8005975278118208e-05, "loss": 0.6552, "step": 44385 }, { "epoch": 1.42, "learning_rate": 1.8005305912592087e-05, "loss": 0.6475, "step": 44390 }, { "epoch": 1.42, "learning_rate": 1.8004636447182725e-05, "loss": 0.6398, "step": 44395 }, { "epoch": 1.42, "learning_rate": 1.8003966881898473e-05, "loss": 0.6577, "step": 44400 }, { "epoch": 1.42, "learning_rate": 1.8003297216747694e-05, "loss": 0.6538, "step": 44405 }, { "epoch": 1.42, "learning_rate": 1.800262745173874e-05, "loss": 0.6462, "step": 44410 }, { "epoch": 1.42, "learning_rate": 1.8001957586879965e-05, "loss": 0.6424, "step": 44415 }, { "epoch": 1.42, "learning_rate": 1.8001287622179728e-05, "loss": 0.6559, "step": 44420 }, { "epoch": 1.42, "learning_rate": 1.8000617557646392e-05, "loss": 0.636, "step": 44425 }, { "epoch": 1.42, "learning_rate": 1.799994739328831e-05, "loss": 0.6383, "step": 44430 }, { "epoch": 1.42, "learning_rate": 1.7999277129113855e-05, "loss": 0.6423, "step": 44435 }, { "epoch": 1.42, "learning_rate": 1.799860676513138e-05, "loss": 0.6457, "step": 44440 }, { "epoch": 1.42, "learning_rate": 1.799793630134925e-05, "loss": 0.64, "step": 44445 }, { "epoch": 1.42, "learning_rate": 1.7997265737775837e-05, "loss": 0.6437, "step": 44450 }, { "epoch": 1.42, "learning_rate": 1.79965950744195e-05, "loss": 0.64, "step": 44455 }, { "epoch": 1.42, "learning_rate": 1.7995924311288613e-05, "loss": 0.654, "step": 44460 }, { "epoch": 1.42, "learning_rate": 1.7995253448391543e-05, "loss": 0.6351, "step": 44465 }, { "epoch": 1.42, "learning_rate": 1.7994582485736664e-05, "loss": 0.6488, "step": 44470 }, { "epoch": 1.42, "learning_rate": 1.7993911423332336e-05, "loss": 0.6399, "step": 44475 }, { "epoch": 1.42, "learning_rate": 1.7993240261186945e-05, "loss": 0.6395, "step": 44480 }, { "epoch": 1.42, "learning_rate": 1.7992568999308858e-05, "loss": 0.6428, "step": 44485 }, { "epoch": 1.42, "learning_rate": 1.7991897637706455e-05, "loss": 0.6408, "step": 44490 }, { "epoch": 1.42, "learning_rate": 1.799122617638811e-05, "loss": 0.6441, "step": 44495 }, { "epoch": 1.42, "learning_rate": 1.79905546153622e-05, "loss": 0.6515, "step": 44500 }, { "epoch": 1.42, "learning_rate": 1.7989882954637105e-05, "loss": 0.6423, "step": 44505 }, { "epoch": 1.42, "learning_rate": 1.7989211194221206e-05, "loss": 0.6323, "step": 44510 }, { "epoch": 1.42, "learning_rate": 1.7988539334122882e-05, "loss": 0.6301, "step": 44515 }, { "epoch": 1.42, "learning_rate": 1.798786737435052e-05, "loss": 0.6468, "step": 44520 }, { "epoch": 1.42, "learning_rate": 1.7987195314912504e-05, "loss": 0.6514, "step": 44525 }, { "epoch": 1.42, "learning_rate": 1.798652315581722e-05, "loss": 0.6429, "step": 44530 }, { "epoch": 1.43, "learning_rate": 1.7985850897073045e-05, "loss": 0.6422, "step": 44535 }, { "epoch": 1.43, "learning_rate": 1.798517853868838e-05, "loss": 0.6455, "step": 44540 }, { "epoch": 1.43, "learning_rate": 1.7984506080671608e-05, "loss": 0.6364, "step": 44545 }, { "epoch": 1.43, "learning_rate": 1.7983833523031114e-05, "loss": 0.6417, "step": 44550 }, { "epoch": 1.43, "learning_rate": 1.79831608657753e-05, "loss": 0.6526, "step": 44555 }, { "epoch": 1.43, "learning_rate": 1.7982488108912553e-05, "loss": 0.6593, "step": 44560 }, { "epoch": 1.43, "learning_rate": 1.798181525245127e-05, "loss": 0.6481, "step": 44565 }, { "epoch": 1.43, "learning_rate": 1.798114229639984e-05, "loss": 0.6392, "step": 44570 }, { "epoch": 1.43, "learning_rate": 1.798046924076667e-05, "loss": 0.6483, "step": 44575 }, { "epoch": 1.43, "learning_rate": 1.797979608556015e-05, "loss": 0.6449, "step": 44580 }, { "epoch": 1.43, "learning_rate": 1.7979122830788677e-05, "loss": 0.6459, "step": 44585 }, { "epoch": 1.43, "learning_rate": 1.797844947646066e-05, "loss": 0.6454, "step": 44590 }, { "epoch": 1.43, "learning_rate": 1.797777602258449e-05, "loss": 0.6556, "step": 44595 }, { "epoch": 1.43, "learning_rate": 1.7977102469168578e-05, "loss": 0.6449, "step": 44600 }, { "epoch": 1.43, "learning_rate": 1.7976428816221327e-05, "loss": 0.6327, "step": 44605 }, { "epoch": 1.43, "learning_rate": 1.797575506375114e-05, "loss": 0.6406, "step": 44610 }, { "epoch": 1.43, "learning_rate": 1.7975081211766424e-05, "loss": 0.6371, "step": 44615 }, { "epoch": 1.43, "learning_rate": 1.7974407260275587e-05, "loss": 0.6379, "step": 44620 }, { "epoch": 1.43, "learning_rate": 1.7973733209287036e-05, "loss": 0.6402, "step": 44625 }, { "epoch": 1.43, "learning_rate": 1.7973059058809186e-05, "loss": 0.6496, "step": 44630 }, { "epoch": 1.43, "learning_rate": 1.7972384808850444e-05, "loss": 0.6435, "step": 44635 }, { "epoch": 1.43, "learning_rate": 1.7971710459419226e-05, "loss": 0.6441, "step": 44640 }, { "epoch": 1.43, "learning_rate": 1.7971036010523944e-05, "loss": 0.6482, "step": 44645 }, { "epoch": 1.43, "learning_rate": 1.797036146217301e-05, "loss": 0.6541, "step": 44650 }, { "epoch": 1.43, "learning_rate": 1.796968681437485e-05, "loss": 0.6428, "step": 44655 }, { "epoch": 1.43, "learning_rate": 1.796901206713787e-05, "loss": 0.6406, "step": 44660 }, { "epoch": 1.43, "learning_rate": 1.79683372204705e-05, "loss": 0.6476, "step": 44665 }, { "epoch": 1.43, "learning_rate": 1.7967662274381148e-05, "loss": 0.6503, "step": 44670 }, { "epoch": 1.43, "learning_rate": 1.7966987228878247e-05, "loss": 0.6439, "step": 44675 }, { "epoch": 1.43, "learning_rate": 1.796631208397021e-05, "loss": 0.6276, "step": 44680 }, { "epoch": 1.43, "learning_rate": 1.7965636839665466e-05, "loss": 0.6434, "step": 44685 }, { "epoch": 1.43, "learning_rate": 1.7964961495972443e-05, "loss": 0.6465, "step": 44690 }, { "epoch": 1.43, "learning_rate": 1.796428605289956e-05, "loss": 0.6367, "step": 44695 }, { "epoch": 1.43, "learning_rate": 1.7963610510455254e-05, "loss": 0.65, "step": 44700 }, { "epoch": 1.43, "learning_rate": 1.7962934868647944e-05, "loss": 0.6392, "step": 44705 }, { "epoch": 1.43, "learning_rate": 1.796225912748607e-05, "loss": 0.6328, "step": 44710 }, { "epoch": 1.43, "learning_rate": 1.7961583286978054e-05, "loss": 0.6433, "step": 44715 }, { "epoch": 1.43, "learning_rate": 1.7960907347132332e-05, "loss": 0.6465, "step": 44720 }, { "epoch": 1.43, "learning_rate": 1.7960231307957333e-05, "loss": 0.6363, "step": 44725 }, { "epoch": 1.43, "learning_rate": 1.7959555169461504e-05, "loss": 0.6505, "step": 44730 }, { "epoch": 1.43, "learning_rate": 1.795887893165327e-05, "loss": 0.644, "step": 44735 }, { "epoch": 1.43, "learning_rate": 1.7958202594541078e-05, "loss": 0.6427, "step": 44740 }, { "epoch": 1.43, "learning_rate": 1.7957526158133357e-05, "loss": 0.649, "step": 44745 }, { "epoch": 1.43, "learning_rate": 1.7956849622438554e-05, "loss": 0.6264, "step": 44750 }, { "epoch": 1.43, "learning_rate": 1.7956172987465107e-05, "loss": 0.6376, "step": 44755 }, { "epoch": 1.43, "learning_rate": 1.7955496253221462e-05, "loss": 0.651, "step": 44760 }, { "epoch": 1.43, "learning_rate": 1.795481941971606e-05, "loss": 0.6503, "step": 44765 }, { "epoch": 1.43, "learning_rate": 1.795414248695734e-05, "loss": 0.6267, "step": 44770 }, { "epoch": 1.43, "learning_rate": 1.795346545495376e-05, "loss": 0.6473, "step": 44775 }, { "epoch": 1.43, "learning_rate": 1.7952788323713755e-05, "loss": 0.6398, "step": 44780 }, { "epoch": 1.43, "learning_rate": 1.795211109324579e-05, "loss": 0.6366, "step": 44785 }, { "epoch": 1.43, "learning_rate": 1.7951433763558297e-05, "loss": 0.6472, "step": 44790 }, { "epoch": 1.43, "learning_rate": 1.7950756334659737e-05, "loss": 0.6567, "step": 44795 }, { "epoch": 1.43, "learning_rate": 1.7950078806558565e-05, "loss": 0.653, "step": 44800 }, { "epoch": 1.43, "learning_rate": 1.7949401179263225e-05, "loss": 0.6337, "step": 44805 }, { "epoch": 1.43, "learning_rate": 1.794872345278218e-05, "loss": 0.639, "step": 44810 }, { "epoch": 1.43, "learning_rate": 1.794804562712388e-05, "loss": 0.644, "step": 44815 }, { "epoch": 1.43, "learning_rate": 1.794736770229679e-05, "loss": 0.6555, "step": 44820 }, { "epoch": 1.43, "learning_rate": 1.7946689678309356e-05, "loss": 0.6472, "step": 44825 }, { "epoch": 1.43, "learning_rate": 1.7946011555170053e-05, "loss": 0.6397, "step": 44830 }, { "epoch": 1.43, "learning_rate": 1.7945333332887332e-05, "loss": 0.6477, "step": 44835 }, { "epoch": 1.43, "learning_rate": 1.794465501146966e-05, "loss": 0.645, "step": 44840 }, { "epoch": 1.44, "learning_rate": 1.7943976590925496e-05, "loss": 0.6323, "step": 44845 }, { "epoch": 1.44, "learning_rate": 1.794329807126331e-05, "loss": 0.6519, "step": 44850 }, { "epoch": 1.44, "learning_rate": 1.7942619452491562e-05, "loss": 0.644, "step": 44855 }, { "epoch": 1.44, "learning_rate": 1.7941940734618727e-05, "loss": 0.6458, "step": 44860 }, { "epoch": 1.44, "learning_rate": 1.7941261917653266e-05, "loss": 0.6302, "step": 44865 }, { "epoch": 1.44, "learning_rate": 1.7940583001603653e-05, "loss": 0.6498, "step": 44870 }, { "epoch": 1.44, "learning_rate": 1.7939903986478354e-05, "loss": 0.6397, "step": 44875 }, { "epoch": 1.44, "learning_rate": 1.793922487228585e-05, "loss": 0.6505, "step": 44880 }, { "epoch": 1.44, "learning_rate": 1.7938545659034602e-05, "loss": 0.6453, "step": 44885 }, { "epoch": 1.44, "learning_rate": 1.79378663467331e-05, "loss": 0.6304, "step": 44890 }, { "epoch": 1.44, "learning_rate": 1.7937186935389807e-05, "loss": 0.651, "step": 44895 }, { "epoch": 1.44, "learning_rate": 1.7936507425013204e-05, "loss": 0.6441, "step": 44900 }, { "epoch": 1.44, "learning_rate": 1.7935827815611775e-05, "loss": 0.6479, "step": 44905 }, { "epoch": 1.44, "learning_rate": 1.793514810719399e-05, "loss": 0.6469, "step": 44910 }, { "epoch": 1.44, "learning_rate": 1.7934468299768336e-05, "loss": 0.6277, "step": 44915 }, { "epoch": 1.44, "learning_rate": 1.793378839334329e-05, "loss": 0.641, "step": 44920 }, { "epoch": 1.44, "learning_rate": 1.7933108387927346e-05, "loss": 0.6344, "step": 44925 }, { "epoch": 1.44, "learning_rate": 1.7932428283528976e-05, "loss": 0.6373, "step": 44930 }, { "epoch": 1.44, "learning_rate": 1.7931748080156674e-05, "loss": 0.6519, "step": 44935 }, { "epoch": 1.44, "learning_rate": 1.7931067777818922e-05, "loss": 0.6494, "step": 44940 }, { "epoch": 1.44, "learning_rate": 1.793038737652421e-05, "loss": 0.6519, "step": 44945 }, { "epoch": 1.44, "learning_rate": 1.792970687628103e-05, "loss": 0.6368, "step": 44950 }, { "epoch": 1.44, "learning_rate": 1.792902627709787e-05, "loss": 0.64, "step": 44955 }, { "epoch": 1.44, "learning_rate": 1.792834557898322e-05, "loss": 0.6429, "step": 44960 }, { "epoch": 1.44, "learning_rate": 1.7927664781945573e-05, "loss": 0.6527, "step": 44965 }, { "epoch": 1.44, "learning_rate": 1.7926983885993434e-05, "loss": 0.6385, "step": 44970 }, { "epoch": 1.44, "learning_rate": 1.7926302891135283e-05, "loss": 0.6374, "step": 44975 }, { "epoch": 1.44, "learning_rate": 1.7925621797379626e-05, "loss": 0.651, "step": 44980 }, { "epoch": 1.44, "learning_rate": 1.7924940604734962e-05, "loss": 0.6447, "step": 44985 }, { "epoch": 1.44, "learning_rate": 1.7924259313209787e-05, "loss": 0.6317, "step": 44990 }, { "epoch": 1.44, "learning_rate": 1.7923577922812604e-05, "loss": 0.6408, "step": 44995 }, { "epoch": 1.44, "learning_rate": 1.792289643355191e-05, "loss": 0.6515, "step": 45000 }, { "epoch": 1.44, "learning_rate": 1.792221484543621e-05, "loss": 0.6432, "step": 45005 }, { "epoch": 1.44, "learning_rate": 1.792153315847401e-05, "loss": 0.6323, "step": 45010 }, { "epoch": 1.44, "learning_rate": 1.7920851372673818e-05, "loss": 0.6349, "step": 45015 }, { "epoch": 1.44, "learning_rate": 1.7920169488044138e-05, "loss": 0.6487, "step": 45020 }, { "epoch": 1.44, "learning_rate": 1.7919487504593472e-05, "loss": 0.6522, "step": 45025 }, { "epoch": 1.44, "learning_rate": 1.7918805422330342e-05, "loss": 0.6495, "step": 45030 }, { "epoch": 1.44, "learning_rate": 1.7918123241263247e-05, "loss": 0.6425, "step": 45035 }, { "epoch": 1.44, "learning_rate": 1.7917440961400706e-05, "loss": 0.644, "step": 45040 }, { "epoch": 1.44, "learning_rate": 1.7916758582751227e-05, "loss": 0.6522, "step": 45045 }, { "epoch": 1.44, "learning_rate": 1.7916076105323323e-05, "loss": 0.6382, "step": 45050 }, { "epoch": 1.44, "learning_rate": 1.7915393529125516e-05, "loss": 0.6448, "step": 45055 }, { "epoch": 1.44, "learning_rate": 1.7914710854166317e-05, "loss": 0.643, "step": 45060 }, { "epoch": 1.44, "learning_rate": 1.7914028080454247e-05, "loss": 0.6342, "step": 45065 }, { "epoch": 1.44, "learning_rate": 1.7913345207997824e-05, "loss": 0.6442, "step": 45070 }, { "epoch": 1.44, "learning_rate": 1.791266223680557e-05, "loss": 0.6439, "step": 45075 }, { "epoch": 1.44, "learning_rate": 1.7911979166886e-05, "loss": 0.6492, "step": 45080 }, { "epoch": 1.44, "learning_rate": 1.791129599824764e-05, "loss": 0.6466, "step": 45085 }, { "epoch": 1.44, "learning_rate": 1.7910612730899018e-05, "loss": 0.644, "step": 45090 }, { "epoch": 1.44, "learning_rate": 1.790992936484866e-05, "loss": 0.6418, "step": 45095 }, { "epoch": 1.44, "learning_rate": 1.7909245900105085e-05, "loss": 0.6278, "step": 45100 }, { "epoch": 1.44, "learning_rate": 1.7908562336676826e-05, "loss": 0.6487, "step": 45105 }, { "epoch": 1.44, "learning_rate": 1.790787867457241e-05, "loss": 0.647, "step": 45110 }, { "epoch": 1.44, "learning_rate": 1.7907194913800367e-05, "loss": 0.6445, "step": 45115 }, { "epoch": 1.44, "learning_rate": 1.790651105436923e-05, "loss": 0.6446, "step": 45120 }, { "epoch": 1.44, "learning_rate": 1.7905827096287532e-05, "loss": 0.6519, "step": 45125 }, { "epoch": 1.44, "learning_rate": 1.79051430395638e-05, "loss": 0.6492, "step": 45130 }, { "epoch": 1.44, "learning_rate": 1.790445888420658e-05, "loss": 0.6392, "step": 45135 }, { "epoch": 1.44, "learning_rate": 1.7903774630224404e-05, "loss": 0.6441, "step": 45140 }, { "epoch": 1.44, "learning_rate": 1.7903090277625807e-05, "loss": 0.6353, "step": 45145 }, { "epoch": 1.44, "learning_rate": 1.7902405826419323e-05, "loss": 0.6458, "step": 45150 }, { "epoch": 1.44, "learning_rate": 1.7901721276613506e-05, "loss": 0.6523, "step": 45155 }, { "epoch": 1.45, "learning_rate": 1.7901036628216885e-05, "loss": 0.647, "step": 45160 }, { "epoch": 1.45, "learning_rate": 1.7900351881238013e-05, "loss": 0.6425, "step": 45165 }, { "epoch": 1.45, "learning_rate": 1.789966703568542e-05, "loss": 0.6447, "step": 45170 }, { "epoch": 1.45, "learning_rate": 1.789898209156766e-05, "loss": 0.6324, "step": 45175 }, { "epoch": 1.45, "learning_rate": 1.789829704889328e-05, "loss": 0.6464, "step": 45180 }, { "epoch": 1.45, "learning_rate": 1.7897611907670823e-05, "loss": 0.649, "step": 45185 }, { "epoch": 1.45, "learning_rate": 1.789692666790884e-05, "loss": 0.6413, "step": 45190 }, { "epoch": 1.45, "learning_rate": 1.789624132961588e-05, "loss": 0.6492, "step": 45195 }, { "epoch": 1.45, "learning_rate": 1.7895555892800494e-05, "loss": 0.6451, "step": 45200 }, { "epoch": 1.45, "learning_rate": 1.7894870357471236e-05, "loss": 0.635, "step": 45205 }, { "epoch": 1.45, "learning_rate": 1.7894184723636657e-05, "loss": 0.6435, "step": 45210 }, { "epoch": 1.45, "learning_rate": 1.7893498991305317e-05, "loss": 0.6392, "step": 45215 }, { "epoch": 1.45, "learning_rate": 1.7892813160485762e-05, "loss": 0.641, "step": 45220 }, { "epoch": 1.45, "learning_rate": 1.789212723118656e-05, "loss": 0.6339, "step": 45225 }, { "epoch": 1.45, "learning_rate": 1.7891441203416258e-05, "loss": 0.6448, "step": 45230 }, { "epoch": 1.45, "learning_rate": 1.7890755077183426e-05, "loss": 0.6405, "step": 45235 }, { "epoch": 1.45, "learning_rate": 1.7890068852496624e-05, "loss": 0.649, "step": 45240 }, { "epoch": 1.45, "learning_rate": 1.7889382529364407e-05, "loss": 0.6307, "step": 45245 }, { "epoch": 1.45, "learning_rate": 1.7888696107795343e-05, "loss": 0.6358, "step": 45250 }, { "epoch": 1.45, "learning_rate": 1.7888009587797995e-05, "loss": 0.6411, "step": 45255 }, { "epoch": 1.45, "learning_rate": 1.7887322969380935e-05, "loss": 0.6398, "step": 45260 }, { "epoch": 1.45, "learning_rate": 1.7886636252552717e-05, "loss": 0.636, "step": 45265 }, { "epoch": 1.45, "learning_rate": 1.7885949437321923e-05, "loss": 0.642, "step": 45270 }, { "epoch": 1.45, "learning_rate": 1.7885262523697116e-05, "loss": 0.6323, "step": 45275 }, { "epoch": 1.45, "learning_rate": 1.7884575511686867e-05, "loss": 0.644, "step": 45280 }, { "epoch": 1.45, "learning_rate": 1.788388840129975e-05, "loss": 0.6418, "step": 45285 }, { "epoch": 1.45, "learning_rate": 1.7883201192544332e-05, "loss": 0.6484, "step": 45290 }, { "epoch": 1.45, "learning_rate": 1.7882513885429197e-05, "loss": 0.6381, "step": 45295 }, { "epoch": 1.45, "learning_rate": 1.788182647996291e-05, "loss": 0.648, "step": 45300 }, { "epoch": 1.45, "learning_rate": 1.7881138976154055e-05, "loss": 0.6416, "step": 45305 }, { "epoch": 1.45, "learning_rate": 1.788045137401121e-05, "loss": 0.6447, "step": 45310 }, { "epoch": 1.45, "learning_rate": 1.787976367354295e-05, "loss": 0.6391, "step": 45315 }, { "epoch": 1.45, "learning_rate": 1.787907587475786e-05, "loss": 0.642, "step": 45320 }, { "epoch": 1.45, "learning_rate": 1.7878387977664522e-05, "loss": 0.6387, "step": 45325 }, { "epoch": 1.45, "learning_rate": 1.7877699982271516e-05, "loss": 0.6408, "step": 45330 }, { "epoch": 1.45, "learning_rate": 1.7877011888587427e-05, "loss": 0.6254, "step": 45335 }, { "epoch": 1.45, "learning_rate": 1.7876323696620838e-05, "loss": 0.6452, "step": 45340 }, { "epoch": 1.45, "learning_rate": 1.787563540638034e-05, "loss": 0.6474, "step": 45345 }, { "epoch": 1.45, "learning_rate": 1.787494701787452e-05, "loss": 0.6569, "step": 45350 }, { "epoch": 1.45, "learning_rate": 1.7874258531111963e-05, "loss": 0.648, "step": 45355 }, { "epoch": 1.45, "learning_rate": 1.7873569946101266e-05, "loss": 0.6504, "step": 45360 }, { "epoch": 1.45, "learning_rate": 1.7872881262851018e-05, "loss": 0.6381, "step": 45365 }, { "epoch": 1.45, "learning_rate": 1.787219248136981e-05, "loss": 0.6484, "step": 45370 }, { "epoch": 1.45, "learning_rate": 1.7871503601666233e-05, "loss": 0.6476, "step": 45375 }, { "epoch": 1.45, "learning_rate": 1.787081462374889e-05, "loss": 0.6471, "step": 45380 }, { "epoch": 1.45, "learning_rate": 1.7870125547626372e-05, "loss": 0.6398, "step": 45385 }, { "epoch": 1.45, "learning_rate": 1.7869436373307278e-05, "loss": 0.6501, "step": 45390 }, { "epoch": 1.45, "learning_rate": 1.786874710080021e-05, "loss": 0.6406, "step": 45395 }, { "epoch": 1.45, "learning_rate": 1.7868057730113766e-05, "loss": 0.6387, "step": 45400 }, { "epoch": 1.45, "learning_rate": 1.7867368261256542e-05, "loss": 0.6417, "step": 45405 }, { "epoch": 1.45, "learning_rate": 1.786667869423715e-05, "loss": 0.6506, "step": 45410 }, { "epoch": 1.45, "learning_rate": 1.7865989029064185e-05, "loss": 0.6264, "step": 45415 }, { "epoch": 1.45, "learning_rate": 1.7865299265746257e-05, "loss": 0.6342, "step": 45420 }, { "epoch": 1.45, "learning_rate": 1.7864609404291976e-05, "loss": 0.6481, "step": 45425 }, { "epoch": 1.45, "learning_rate": 1.786391944470994e-05, "loss": 0.6485, "step": 45430 }, { "epoch": 1.45, "learning_rate": 1.7863229387008765e-05, "loss": 0.6509, "step": 45435 }, { "epoch": 1.45, "learning_rate": 1.786253923119706e-05, "loss": 0.6411, "step": 45440 }, { "epoch": 1.45, "learning_rate": 1.786184897728343e-05, "loss": 0.6407, "step": 45445 }, { "epoch": 1.45, "learning_rate": 1.78611586252765e-05, "loss": 0.6371, "step": 45450 }, { "epoch": 1.45, "learning_rate": 1.7860468175184867e-05, "loss": 0.6535, "step": 45455 }, { "epoch": 1.45, "learning_rate": 1.785977762701716e-05, "loss": 0.6382, "step": 45460 }, { "epoch": 1.45, "learning_rate": 1.785908698078199e-05, "loss": 0.6382, "step": 45465 }, { "epoch": 1.46, "learning_rate": 1.785839623648797e-05, "loss": 0.6475, "step": 45470 }, { "epoch": 1.46, "learning_rate": 1.7857705394143726e-05, "loss": 0.6384, "step": 45475 }, { "epoch": 1.46, "learning_rate": 1.785701445375787e-05, "loss": 0.6483, "step": 45480 }, { "epoch": 1.46, "learning_rate": 1.785632341533903e-05, "loss": 0.6511, "step": 45485 }, { "epoch": 1.46, "learning_rate": 1.7855632278895826e-05, "loss": 0.6393, "step": 45490 }, { "epoch": 1.46, "learning_rate": 1.7854941044436883e-05, "loss": 0.6452, "step": 45495 }, { "epoch": 1.46, "learning_rate": 1.785424971197082e-05, "loss": 0.6413, "step": 45500 }, { "epoch": 1.46, "learning_rate": 1.7853558281506267e-05, "loss": 0.6276, "step": 45505 }, { "epoch": 1.46, "learning_rate": 1.785286675305185e-05, "loss": 0.6379, "step": 45510 }, { "epoch": 1.46, "learning_rate": 1.78521751266162e-05, "loss": 0.6458, "step": 45515 }, { "epoch": 1.46, "learning_rate": 1.7851483402207937e-05, "loss": 0.6388, "step": 45520 }, { "epoch": 1.46, "learning_rate": 1.7850791579835703e-05, "loss": 0.6574, "step": 45525 }, { "epoch": 1.46, "learning_rate": 1.7850099659508128e-05, "loss": 0.6356, "step": 45530 }, { "epoch": 1.46, "learning_rate": 1.7849407641233843e-05, "loss": 0.6484, "step": 45535 }, { "epoch": 1.46, "learning_rate": 1.7848715525021482e-05, "loss": 0.6522, "step": 45540 }, { "epoch": 1.46, "learning_rate": 1.7848023310879678e-05, "loss": 0.6524, "step": 45545 }, { "epoch": 1.46, "learning_rate": 1.784733099881707e-05, "loss": 0.6343, "step": 45550 }, { "epoch": 1.46, "learning_rate": 1.7846638588842302e-05, "loss": 0.6301, "step": 45555 }, { "epoch": 1.46, "learning_rate": 1.7845946080964004e-05, "loss": 0.642, "step": 45560 }, { "epoch": 1.46, "learning_rate": 1.7845253475190825e-05, "loss": 0.646, "step": 45565 }, { "epoch": 1.46, "learning_rate": 1.7844560771531397e-05, "loss": 0.6421, "step": 45570 }, { "epoch": 1.46, "learning_rate": 1.7843867969994372e-05, "loss": 0.6521, "step": 45575 }, { "epoch": 1.46, "learning_rate": 1.784317507058839e-05, "loss": 0.6465, "step": 45580 }, { "epoch": 1.46, "learning_rate": 1.7842482073322097e-05, "loss": 0.6418, "step": 45585 }, { "epoch": 1.46, "learning_rate": 1.7841788978204137e-05, "loss": 0.6383, "step": 45590 }, { "epoch": 1.46, "learning_rate": 1.784109578524316e-05, "loss": 0.6536, "step": 45595 }, { "epoch": 1.46, "learning_rate": 1.784040249444782e-05, "loss": 0.6547, "step": 45600 }, { "epoch": 1.46, "learning_rate": 1.783970910582676e-05, "loss": 0.6371, "step": 45605 }, { "epoch": 1.46, "learning_rate": 1.783901561938864e-05, "loss": 0.6372, "step": 45610 }, { "epoch": 1.46, "learning_rate": 1.7838322035142098e-05, "loss": 0.6201, "step": 45615 }, { "epoch": 1.46, "learning_rate": 1.78376283530958e-05, "loss": 0.6474, "step": 45620 }, { "epoch": 1.46, "learning_rate": 1.78369345732584e-05, "loss": 0.6394, "step": 45625 }, { "epoch": 1.46, "learning_rate": 1.783624069563855e-05, "loss": 0.6407, "step": 45630 }, { "epoch": 1.46, "learning_rate": 1.783554672024491e-05, "loss": 0.6413, "step": 45635 }, { "epoch": 1.46, "learning_rate": 1.783485264708614e-05, "loss": 0.642, "step": 45640 }, { "epoch": 1.46, "learning_rate": 1.7834158476170902e-05, "loss": 0.6434, "step": 45645 }, { "epoch": 1.46, "learning_rate": 1.783346420750785e-05, "loss": 0.6297, "step": 45650 }, { "epoch": 1.46, "learning_rate": 1.783276984110565e-05, "loss": 0.6536, "step": 45655 }, { "epoch": 1.46, "learning_rate": 1.7832075376972972e-05, "loss": 0.6382, "step": 45660 }, { "epoch": 1.46, "learning_rate": 1.783138081511847e-05, "loss": 0.6616, "step": 45665 }, { "epoch": 1.46, "learning_rate": 1.7830686155550815e-05, "loss": 0.6326, "step": 45670 }, { "epoch": 1.46, "learning_rate": 1.782999139827868e-05, "loss": 0.6332, "step": 45675 }, { "epoch": 1.46, "learning_rate": 1.7829296543310725e-05, "loss": 0.6305, "step": 45680 }, { "epoch": 1.46, "learning_rate": 1.782860159065562e-05, "loss": 0.6417, "step": 45685 }, { "epoch": 1.46, "learning_rate": 1.782790654032204e-05, "loss": 0.6475, "step": 45690 }, { "epoch": 1.46, "learning_rate": 1.7827211392318662e-05, "loss": 0.6508, "step": 45695 }, { "epoch": 1.46, "learning_rate": 1.782651614665415e-05, "loss": 0.6464, "step": 45700 }, { "epoch": 1.46, "learning_rate": 1.782582080333718e-05, "loss": 0.6295, "step": 45705 }, { "epoch": 1.46, "learning_rate": 1.7825125362376434e-05, "loss": 0.6505, "step": 45710 }, { "epoch": 1.46, "learning_rate": 1.7824429823780586e-05, "loss": 0.655, "step": 45715 }, { "epoch": 1.46, "learning_rate": 1.7823734187558312e-05, "loss": 0.6274, "step": 45720 }, { "epoch": 1.46, "learning_rate": 1.7823038453718293e-05, "loss": 0.643, "step": 45725 }, { "epoch": 1.46, "learning_rate": 1.782234262226921e-05, "loss": 0.6443, "step": 45730 }, { "epoch": 1.46, "learning_rate": 1.7821646693219748e-05, "loss": 0.6421, "step": 45735 }, { "epoch": 1.46, "learning_rate": 1.7820950666578586e-05, "loss": 0.6501, "step": 45740 }, { "epoch": 1.46, "learning_rate": 1.782025454235441e-05, "loss": 0.6423, "step": 45745 }, { "epoch": 1.46, "learning_rate": 1.7819558320555902e-05, "loss": 0.6445, "step": 45750 }, { "epoch": 1.46, "learning_rate": 1.7818862001191754e-05, "loss": 0.6522, "step": 45755 }, { "epoch": 1.46, "learning_rate": 1.781816558427065e-05, "loss": 0.6437, "step": 45760 }, { "epoch": 1.46, "learning_rate": 1.7817469069801287e-05, "loss": 0.6471, "step": 45765 }, { "epoch": 1.46, "learning_rate": 1.7816772457792348e-05, "loss": 0.6426, "step": 45770 }, { "epoch": 1.46, "learning_rate": 1.7816075748252526e-05, "loss": 0.6449, "step": 45775 }, { "epoch": 1.46, "learning_rate": 1.7815378941190514e-05, "loss": 0.6435, "step": 45780 }, { "epoch": 1.47, "learning_rate": 1.781468203661501e-05, "loss": 0.6366, "step": 45785 }, { "epoch": 1.47, "learning_rate": 1.7813985034534704e-05, "loss": 0.6293, "step": 45790 }, { "epoch": 1.47, "learning_rate": 1.7813287934958293e-05, "loss": 0.6471, "step": 45795 }, { "epoch": 1.47, "learning_rate": 1.781259073789448e-05, "loss": 0.648, "step": 45800 }, { "epoch": 1.47, "learning_rate": 1.7811893443351958e-05, "loss": 0.6487, "step": 45805 }, { "epoch": 1.47, "learning_rate": 1.781119605133943e-05, "loss": 0.639, "step": 45810 }, { "epoch": 1.47, "learning_rate": 1.78104985618656e-05, "loss": 0.6521, "step": 45815 }, { "epoch": 1.47, "learning_rate": 1.7809800974939168e-05, "loss": 0.6509, "step": 45820 }, { "epoch": 1.47, "learning_rate": 1.7809103290568832e-05, "loss": 0.636, "step": 45825 }, { "epoch": 1.47, "learning_rate": 1.780840550876331e-05, "loss": 0.6427, "step": 45830 }, { "epoch": 1.47, "learning_rate": 1.7807707629531297e-05, "loss": 0.6372, "step": 45835 }, { "epoch": 1.47, "learning_rate": 1.7807009652881505e-05, "loss": 0.656, "step": 45840 }, { "epoch": 1.47, "learning_rate": 1.7806311578822644e-05, "loss": 0.6503, "step": 45845 }, { "epoch": 1.47, "learning_rate": 1.780561340736342e-05, "loss": 0.6438, "step": 45850 }, { "epoch": 1.47, "learning_rate": 1.780491513851255e-05, "loss": 0.6365, "step": 45855 }, { "epoch": 1.47, "learning_rate": 1.780421677227874e-05, "loss": 0.6337, "step": 45860 }, { "epoch": 1.47, "learning_rate": 1.7803518308670708e-05, "loss": 0.6441, "step": 45865 }, { "epoch": 1.47, "learning_rate": 1.7802819747697172e-05, "loss": 0.6404, "step": 45870 }, { "epoch": 1.47, "learning_rate": 1.780212108936684e-05, "loss": 0.6414, "step": 45875 }, { "epoch": 1.47, "learning_rate": 1.780142233368843e-05, "loss": 0.6447, "step": 45880 }, { "epoch": 1.47, "learning_rate": 1.7800723480670666e-05, "loss": 0.6408, "step": 45885 }, { "epoch": 1.47, "learning_rate": 1.780002453032226e-05, "loss": 0.6438, "step": 45890 }, { "epoch": 1.47, "learning_rate": 1.7799325482651946e-05, "loss": 0.6575, "step": 45895 }, { "epoch": 1.47, "learning_rate": 1.779862633766843e-05, "loss": 0.6377, "step": 45900 }, { "epoch": 1.47, "learning_rate": 1.7797927095380448e-05, "loss": 0.6475, "step": 45905 }, { "epoch": 1.47, "learning_rate": 1.779722775579672e-05, "loss": 0.6476, "step": 45910 }, { "epoch": 1.47, "learning_rate": 1.779652831892597e-05, "loss": 0.6492, "step": 45915 }, { "epoch": 1.47, "learning_rate": 1.779582878477693e-05, "loss": 0.6501, "step": 45920 }, { "epoch": 1.47, "learning_rate": 1.779512915335832e-05, "loss": 0.6494, "step": 45925 }, { "epoch": 1.47, "learning_rate": 1.7794429424678877e-05, "loss": 0.6515, "step": 45930 }, { "epoch": 1.47, "learning_rate": 1.7793729598747327e-05, "loss": 0.6393, "step": 45935 }, { "epoch": 1.47, "learning_rate": 1.7793029675572408e-05, "loss": 0.6515, "step": 45940 }, { "epoch": 1.47, "learning_rate": 1.7792329655162843e-05, "loss": 0.6466, "step": 45945 }, { "epoch": 1.47, "learning_rate": 1.7791629537527373e-05, "loss": 0.6577, "step": 45950 }, { "epoch": 1.47, "learning_rate": 1.7790929322674733e-05, "loss": 0.6427, "step": 45955 }, { "epoch": 1.47, "learning_rate": 1.779022901061366e-05, "loss": 0.6375, "step": 45960 }, { "epoch": 1.47, "learning_rate": 1.7789528601352887e-05, "loss": 0.6522, "step": 45965 }, { "epoch": 1.47, "learning_rate": 1.778882809490116e-05, "loss": 0.6332, "step": 45970 }, { "epoch": 1.47, "learning_rate": 1.7788127491267214e-05, "loss": 0.6466, "step": 45975 }, { "epoch": 1.47, "learning_rate": 1.7787426790459792e-05, "loss": 0.649, "step": 45980 }, { "epoch": 1.47, "learning_rate": 1.7786725992487643e-05, "loss": 0.641, "step": 45985 }, { "epoch": 1.47, "learning_rate": 1.7786025097359502e-05, "loss": 0.649, "step": 45990 }, { "epoch": 1.47, "learning_rate": 1.7785324105084117e-05, "loss": 0.6498, "step": 45995 }, { "epoch": 1.47, "learning_rate": 1.7784623015670237e-05, "loss": 0.6518, "step": 46000 }, { "epoch": 1.47, "learning_rate": 1.7783921829126605e-05, "loss": 0.6459, "step": 46005 }, { "epoch": 1.47, "learning_rate": 1.778322054546197e-05, "loss": 0.6461, "step": 46010 }, { "epoch": 1.47, "learning_rate": 1.778251916468509e-05, "loss": 0.6365, "step": 46015 }, { "epoch": 1.47, "learning_rate": 1.778181768680471e-05, "loss": 0.6411, "step": 46020 }, { "epoch": 1.47, "learning_rate": 1.778111611182958e-05, "loss": 0.634, "step": 46025 }, { "epoch": 1.47, "learning_rate": 1.7780414439768456e-05, "loss": 0.6516, "step": 46030 }, { "epoch": 1.47, "learning_rate": 1.7779712670630097e-05, "loss": 0.644, "step": 46035 }, { "epoch": 1.47, "learning_rate": 1.7779010804423254e-05, "loss": 0.6423, "step": 46040 }, { "epoch": 1.47, "learning_rate": 1.7778308841156687e-05, "loss": 0.6384, "step": 46045 }, { "epoch": 1.47, "learning_rate": 1.7777606780839152e-05, "loss": 0.6475, "step": 46050 }, { "epoch": 1.47, "learning_rate": 1.7776904623479407e-05, "loss": 0.6339, "step": 46055 }, { "epoch": 1.47, "learning_rate": 1.777620236908622e-05, "loss": 0.6475, "step": 46060 }, { "epoch": 1.47, "learning_rate": 1.7775500017668344e-05, "loss": 0.649, "step": 46065 }, { "epoch": 1.47, "learning_rate": 1.7774797569234553e-05, "loss": 0.6426, "step": 46070 }, { "epoch": 1.47, "learning_rate": 1.7774095023793606e-05, "loss": 0.6351, "step": 46075 }, { "epoch": 1.47, "learning_rate": 1.7773392381354267e-05, "loss": 0.6463, "step": 46080 }, { "epoch": 1.47, "learning_rate": 1.77726896419253e-05, "loss": 0.6386, "step": 46085 }, { "epoch": 1.47, "learning_rate": 1.7771986805515485e-05, "loss": 0.6439, "step": 46090 }, { "epoch": 1.48, "learning_rate": 1.7771283872133583e-05, "loss": 0.635, "step": 46095 }, { "epoch": 1.48, "learning_rate": 1.7770580841788364e-05, "loss": 0.6469, "step": 46100 }, { "epoch": 1.48, "learning_rate": 1.77698777144886e-05, "loss": 0.6461, "step": 46105 }, { "epoch": 1.48, "learning_rate": 1.7769174490243068e-05, "loss": 0.6381, "step": 46110 }, { "epoch": 1.48, "learning_rate": 1.7768471169060538e-05, "loss": 0.653, "step": 46115 }, { "epoch": 1.48, "learning_rate": 1.7767767750949784e-05, "loss": 0.6432, "step": 46120 }, { "epoch": 1.48, "learning_rate": 1.7767064235919594e-05, "loss": 0.6457, "step": 46125 }, { "epoch": 1.48, "learning_rate": 1.776636062397873e-05, "loss": 0.6404, "step": 46130 }, { "epoch": 1.48, "learning_rate": 1.7765656915135983e-05, "loss": 0.6439, "step": 46135 }, { "epoch": 1.48, "learning_rate": 1.776495310940013e-05, "loss": 0.6407, "step": 46140 }, { "epoch": 1.48, "learning_rate": 1.776424920677995e-05, "loss": 0.6396, "step": 46145 }, { "epoch": 1.48, "learning_rate": 1.7763545207284226e-05, "loss": 0.6384, "step": 46150 }, { "epoch": 1.48, "learning_rate": 1.7762841110921744e-05, "loss": 0.6376, "step": 46155 }, { "epoch": 1.48, "learning_rate": 1.7762136917701288e-05, "loss": 0.6374, "step": 46160 }, { "epoch": 1.48, "learning_rate": 1.7761432627631644e-05, "loss": 0.6495, "step": 46165 }, { "epoch": 1.48, "learning_rate": 1.77607282407216e-05, "loss": 0.6433, "step": 46170 }, { "epoch": 1.48, "learning_rate": 1.7760023756979944e-05, "loss": 0.6347, "step": 46175 }, { "epoch": 1.48, "learning_rate": 1.775931917641547e-05, "loss": 0.6443, "step": 46180 }, { "epoch": 1.48, "learning_rate": 1.775861449903696e-05, "loss": 0.6492, "step": 46185 }, { "epoch": 1.48, "learning_rate": 1.7757909724853218e-05, "loss": 0.6487, "step": 46190 }, { "epoch": 1.48, "learning_rate": 1.775720485387303e-05, "loss": 0.6335, "step": 46195 }, { "epoch": 1.48, "learning_rate": 1.775649988610519e-05, "loss": 0.641, "step": 46200 }, { "epoch": 1.48, "learning_rate": 1.77557948215585e-05, "loss": 0.6408, "step": 46205 }, { "epoch": 1.48, "learning_rate": 1.775508966024175e-05, "loss": 0.6443, "step": 46210 }, { "epoch": 1.48, "learning_rate": 1.7754384402163746e-05, "loss": 0.6361, "step": 46215 }, { "epoch": 1.48, "learning_rate": 1.775367904733328e-05, "loss": 0.6361, "step": 46220 }, { "epoch": 1.48, "learning_rate": 1.775297359575916e-05, "loss": 0.6408, "step": 46225 }, { "epoch": 1.48, "learning_rate": 1.775226804745018e-05, "loss": 0.6332, "step": 46230 }, { "epoch": 1.48, "learning_rate": 1.7751562402415152e-05, "loss": 0.6468, "step": 46235 }, { "epoch": 1.48, "learning_rate": 1.7750856660662872e-05, "loss": 0.6491, "step": 46240 }, { "epoch": 1.48, "learning_rate": 1.775015082220215e-05, "loss": 0.6386, "step": 46245 }, { "epoch": 1.48, "learning_rate": 1.7749444887041797e-05, "loss": 0.6388, "step": 46250 }, { "epoch": 1.48, "learning_rate": 1.7748738855190615e-05, "loss": 0.6404, "step": 46255 }, { "epoch": 1.48, "learning_rate": 1.7748032726657413e-05, "loss": 0.6382, "step": 46260 }, { "epoch": 1.48, "learning_rate": 1.7747326501451002e-05, "loss": 0.6416, "step": 46265 }, { "epoch": 1.48, "learning_rate": 1.77466201795802e-05, "loss": 0.6318, "step": 46270 }, { "epoch": 1.48, "learning_rate": 1.7745913761053812e-05, "loss": 0.6504, "step": 46275 }, { "epoch": 1.48, "learning_rate": 1.7745207245880654e-05, "loss": 0.6376, "step": 46280 }, { "epoch": 1.48, "learning_rate": 1.7744500634069544e-05, "loss": 0.6435, "step": 46285 }, { "epoch": 1.48, "learning_rate": 1.7743793925629296e-05, "loss": 0.6381, "step": 46290 }, { "epoch": 1.48, "learning_rate": 1.7743087120568727e-05, "loss": 0.6318, "step": 46295 }, { "epoch": 1.48, "learning_rate": 1.7742380218896658e-05, "loss": 0.6455, "step": 46300 }, { "epoch": 1.48, "learning_rate": 1.7741673220621907e-05, "loss": 0.6334, "step": 46305 }, { "epoch": 1.48, "learning_rate": 1.77409661257533e-05, "loss": 0.649, "step": 46310 }, { "epoch": 1.48, "learning_rate": 1.7740258934299654e-05, "loss": 0.6313, "step": 46315 }, { "epoch": 1.48, "learning_rate": 1.7739551646269796e-05, "loss": 0.6525, "step": 46320 }, { "epoch": 1.48, "learning_rate": 1.7738844261672547e-05, "loss": 0.6331, "step": 46325 }, { "epoch": 1.48, "learning_rate": 1.7738136780516738e-05, "loss": 0.6501, "step": 46330 }, { "epoch": 1.48, "learning_rate": 1.7737429202811194e-05, "loss": 0.647, "step": 46335 }, { "epoch": 1.48, "learning_rate": 1.7736721528564747e-05, "loss": 0.6412, "step": 46340 }, { "epoch": 1.48, "learning_rate": 1.773601375778622e-05, "loss": 0.6429, "step": 46345 }, { "epoch": 1.48, "learning_rate": 1.773530589048445e-05, "loss": 0.6437, "step": 46350 }, { "epoch": 1.48, "learning_rate": 1.7734597926668264e-05, "loss": 0.6601, "step": 46355 }, { "epoch": 1.48, "learning_rate": 1.7733889866346497e-05, "loss": 0.6404, "step": 46360 }, { "epoch": 1.48, "learning_rate": 1.7733181709527986e-05, "loss": 0.6493, "step": 46365 }, { "epoch": 1.48, "learning_rate": 1.7732473456221567e-05, "loss": 0.6451, "step": 46370 }, { "epoch": 1.48, "learning_rate": 1.7731765106436073e-05, "loss": 0.643, "step": 46375 }, { "epoch": 1.48, "learning_rate": 1.773105666018035e-05, "loss": 0.6355, "step": 46380 }, { "epoch": 1.48, "learning_rate": 1.7730348117463222e-05, "loss": 0.6476, "step": 46385 }, { "epoch": 1.48, "learning_rate": 1.772963947829355e-05, "loss": 0.6502, "step": 46390 }, { "epoch": 1.48, "learning_rate": 1.7728930742680156e-05, "loss": 0.6404, "step": 46395 }, { "epoch": 1.48, "learning_rate": 1.77282219106319e-05, "loss": 0.6263, "step": 46400 }, { "epoch": 1.48, "learning_rate": 1.772751298215761e-05, "loss": 0.6372, "step": 46405 }, { "epoch": 1.49, "learning_rate": 1.7726803957266146e-05, "loss": 0.6344, "step": 46410 }, { "epoch": 1.49, "learning_rate": 1.772609483596635e-05, "loss": 0.6516, "step": 46415 }, { "epoch": 1.49, "learning_rate": 1.7725385618267065e-05, "loss": 0.6443, "step": 46420 }, { "epoch": 1.49, "learning_rate": 1.7724676304177145e-05, "loss": 0.6449, "step": 46425 }, { "epoch": 1.49, "learning_rate": 1.7723966893705437e-05, "loss": 0.6396, "step": 46430 }, { "epoch": 1.49, "learning_rate": 1.772325738686079e-05, "loss": 0.6398, "step": 46435 }, { "epoch": 1.49, "learning_rate": 1.7722547783652064e-05, "loss": 0.6482, "step": 46440 }, { "epoch": 1.49, "learning_rate": 1.7721838084088113e-05, "loss": 0.6441, "step": 46445 }, { "epoch": 1.49, "learning_rate": 1.7721128288177782e-05, "loss": 0.6411, "step": 46450 }, { "epoch": 1.49, "learning_rate": 1.772041839592994e-05, "loss": 0.6543, "step": 46455 }, { "epoch": 1.49, "learning_rate": 1.771970840735343e-05, "loss": 0.6445, "step": 46460 }, { "epoch": 1.49, "learning_rate": 1.771899832245712e-05, "loss": 0.632, "step": 46465 }, { "epoch": 1.49, "learning_rate": 1.7718288141249873e-05, "loss": 0.6477, "step": 46470 }, { "epoch": 1.49, "learning_rate": 1.771757786374054e-05, "loss": 0.6378, "step": 46475 }, { "epoch": 1.49, "learning_rate": 1.7716867489937995e-05, "loss": 0.6329, "step": 46480 }, { "epoch": 1.49, "learning_rate": 1.771615701985109e-05, "loss": 0.6369, "step": 46485 }, { "epoch": 1.49, "learning_rate": 1.7715446453488696e-05, "loss": 0.6305, "step": 46490 }, { "epoch": 1.49, "learning_rate": 1.7714735790859678e-05, "loss": 0.6465, "step": 46495 }, { "epoch": 1.49, "learning_rate": 1.7714025031972904e-05, "loss": 0.6351, "step": 46500 }, { "epoch": 1.49, "learning_rate": 1.7713314176837237e-05, "loss": 0.6329, "step": 46505 }, { "epoch": 1.49, "learning_rate": 1.771260322546155e-05, "loss": 0.64, "step": 46510 }, { "epoch": 1.49, "learning_rate": 1.7711892177854717e-05, "loss": 0.6454, "step": 46515 }, { "epoch": 1.49, "learning_rate": 1.7711181034025607e-05, "loss": 0.6342, "step": 46520 }, { "epoch": 1.49, "learning_rate": 1.771046979398309e-05, "loss": 0.6338, "step": 46525 }, { "epoch": 1.49, "learning_rate": 1.7709758457736042e-05, "loss": 0.6362, "step": 46530 }, { "epoch": 1.49, "learning_rate": 1.7709047025293344e-05, "loss": 0.6375, "step": 46535 }, { "epoch": 1.49, "learning_rate": 1.7708335496663864e-05, "loss": 0.6377, "step": 46540 }, { "epoch": 1.49, "learning_rate": 1.7707623871856484e-05, "loss": 0.6341, "step": 46545 }, { "epoch": 1.49, "learning_rate": 1.7706912150880083e-05, "loss": 0.6408, "step": 46550 }, { "epoch": 1.49, "learning_rate": 1.770620033374354e-05, "loss": 0.6476, "step": 46555 }, { "epoch": 1.49, "learning_rate": 1.770548842045574e-05, "loss": 0.6463, "step": 46560 }, { "epoch": 1.49, "learning_rate": 1.770477641102556e-05, "loss": 0.641, "step": 46565 }, { "epoch": 1.49, "learning_rate": 1.770406430546189e-05, "loss": 0.642, "step": 46570 }, { "epoch": 1.49, "learning_rate": 1.770335210377361e-05, "loss": 0.6389, "step": 46575 }, { "epoch": 1.49, "learning_rate": 1.7702639805969612e-05, "loss": 0.6431, "step": 46580 }, { "epoch": 1.49, "learning_rate": 1.770192741205878e-05, "loss": 0.6407, "step": 46585 }, { "epoch": 1.49, "learning_rate": 1.7701214922049998e-05, "loss": 0.6425, "step": 46590 }, { "epoch": 1.49, "learning_rate": 1.7700502335952162e-05, "loss": 0.6429, "step": 46595 }, { "epoch": 1.49, "learning_rate": 1.7699789653774157e-05, "loss": 0.6356, "step": 46600 }, { "epoch": 1.49, "learning_rate": 1.769907687552488e-05, "loss": 0.6414, "step": 46605 }, { "epoch": 1.49, "learning_rate": 1.769836400121323e-05, "loss": 0.6329, "step": 46610 }, { "epoch": 1.49, "learning_rate": 1.7697651030848094e-05, "loss": 0.6289, "step": 46615 }, { "epoch": 1.49, "learning_rate": 1.7696937964438366e-05, "loss": 0.6487, "step": 46620 }, { "epoch": 1.49, "learning_rate": 1.7696224801992947e-05, "loss": 0.6345, "step": 46625 }, { "epoch": 1.49, "learning_rate": 1.7695511543520734e-05, "loss": 0.63, "step": 46630 }, { "epoch": 1.49, "learning_rate": 1.769479818903063e-05, "loss": 0.6263, "step": 46635 }, { "epoch": 1.49, "learning_rate": 1.7694084738531527e-05, "loss": 0.6357, "step": 46640 }, { "epoch": 1.49, "learning_rate": 1.7693371192032337e-05, "loss": 0.6389, "step": 46645 }, { "epoch": 1.49, "learning_rate": 1.7692657549541955e-05, "loss": 0.6316, "step": 46650 }, { "epoch": 1.49, "learning_rate": 1.769194381106929e-05, "loss": 0.6503, "step": 46655 }, { "epoch": 1.49, "learning_rate": 1.769122997662325e-05, "loss": 0.6301, "step": 46660 }, { "epoch": 1.49, "learning_rate": 1.7690516046212735e-05, "loss": 0.6453, "step": 46665 }, { "epoch": 1.49, "learning_rate": 1.7689802019846653e-05, "loss": 0.6224, "step": 46670 }, { "epoch": 1.49, "learning_rate": 1.7689087897533916e-05, "loss": 0.6464, "step": 46675 }, { "epoch": 1.49, "learning_rate": 1.7688373679283437e-05, "loss": 0.648, "step": 46680 }, { "epoch": 1.49, "learning_rate": 1.7687659365104117e-05, "loss": 0.6389, "step": 46685 }, { "epoch": 1.49, "learning_rate": 1.768694495500488e-05, "loss": 0.6474, "step": 46690 }, { "epoch": 1.49, "learning_rate": 1.7686230448994637e-05, "loss": 0.6282, "step": 46695 }, { "epoch": 1.49, "learning_rate": 1.76855158470823e-05, "loss": 0.6415, "step": 46700 }, { "epoch": 1.49, "learning_rate": 1.7684801149276784e-05, "loss": 0.6399, "step": 46705 }, { "epoch": 1.49, "learning_rate": 1.768408635558701e-05, "loss": 0.639, "step": 46710 }, { "epoch": 1.49, "learning_rate": 1.7683371466021896e-05, "loss": 0.6358, "step": 46715 }, { "epoch": 1.5, "learning_rate": 1.7682656480590362e-05, "loss": 0.6503, "step": 46720 }, { "epoch": 1.5, "learning_rate": 1.768194139930133e-05, "loss": 0.6535, "step": 46725 }, { "epoch": 1.5, "learning_rate": 1.7681226222163715e-05, "loss": 0.6489, "step": 46730 }, { "epoch": 1.5, "learning_rate": 1.7680510949186447e-05, "loss": 0.6293, "step": 46735 }, { "epoch": 1.5, "learning_rate": 1.7679795580378454e-05, "loss": 0.6367, "step": 46740 }, { "epoch": 1.5, "learning_rate": 1.7679080115748655e-05, "loss": 0.6391, "step": 46745 }, { "epoch": 1.5, "learning_rate": 1.767836455530598e-05, "loss": 0.6367, "step": 46750 }, { "epoch": 1.5, "learning_rate": 1.767764889905935e-05, "loss": 0.6505, "step": 46755 }, { "epoch": 1.5, "learning_rate": 1.7676933147017707e-05, "loss": 0.6434, "step": 46760 }, { "epoch": 1.5, "learning_rate": 1.7676217299189972e-05, "loss": 0.6451, "step": 46765 }, { "epoch": 1.5, "learning_rate": 1.7675501355585075e-05, "loss": 0.6372, "step": 46770 }, { "epoch": 1.5, "learning_rate": 1.7674785316211963e-05, "loss": 0.6376, "step": 46775 }, { "epoch": 1.5, "learning_rate": 1.7674069181079553e-05, "loss": 0.6517, "step": 46780 }, { "epoch": 1.5, "learning_rate": 1.767335295019679e-05, "loss": 0.6545, "step": 46785 }, { "epoch": 1.5, "learning_rate": 1.767263662357261e-05, "loss": 0.6418, "step": 46790 }, { "epoch": 1.5, "learning_rate": 1.767192020121595e-05, "loss": 0.6361, "step": 46795 }, { "epoch": 1.5, "learning_rate": 1.7671203683135747e-05, "loss": 0.6343, "step": 46800 }, { "epoch": 1.5, "learning_rate": 1.7670487069340944e-05, "loss": 0.6325, "step": 46805 }, { "epoch": 1.5, "learning_rate": 1.7669770359840476e-05, "loss": 0.6355, "step": 46810 }, { "epoch": 1.5, "learning_rate": 1.7669053554643298e-05, "loss": 0.6309, "step": 46815 }, { "epoch": 1.5, "learning_rate": 1.7668336653758338e-05, "loss": 0.6292, "step": 46820 }, { "epoch": 1.5, "learning_rate": 1.766761965719455e-05, "loss": 0.6424, "step": 46825 }, { "epoch": 1.5, "learning_rate": 1.766690256496088e-05, "loss": 0.6503, "step": 46830 }, { "epoch": 1.5, "learning_rate": 1.766618537706627e-05, "loss": 0.645, "step": 46835 }, { "epoch": 1.5, "learning_rate": 1.766546809351968e-05, "loss": 0.6473, "step": 46840 }, { "epoch": 1.5, "learning_rate": 1.7664750714330048e-05, "loss": 0.6496, "step": 46845 }, { "epoch": 1.5, "learning_rate": 1.7664033239506327e-05, "loss": 0.64, "step": 46850 }, { "epoch": 1.5, "learning_rate": 1.766331566905747e-05, "loss": 0.6366, "step": 46855 }, { "epoch": 1.5, "learning_rate": 1.7662598002992436e-05, "loss": 0.6442, "step": 46860 }, { "epoch": 1.5, "learning_rate": 1.766188024132017e-05, "loss": 0.6417, "step": 46865 }, { "epoch": 1.5, "learning_rate": 1.7661162384049633e-05, "loss": 0.6487, "step": 46870 }, { "epoch": 1.5, "learning_rate": 1.766044443118978e-05, "loss": 0.635, "step": 46875 }, { "epoch": 1.5, "learning_rate": 1.765972638274957e-05, "loss": 0.6478, "step": 46880 }, { "epoch": 1.5, "learning_rate": 1.7659008238737968e-05, "loss": 0.6435, "step": 46885 }, { "epoch": 1.5, "learning_rate": 1.7658289999163924e-05, "loss": 0.6458, "step": 46890 }, { "epoch": 1.5, "learning_rate": 1.76575716640364e-05, "loss": 0.6474, "step": 46895 }, { "epoch": 1.5, "learning_rate": 1.765685323336437e-05, "loss": 0.6411, "step": 46900 }, { "epoch": 1.5, "learning_rate": 1.765613470715678e-05, "loss": 0.6433, "step": 46905 }, { "epoch": 1.5, "learning_rate": 1.7655416085422613e-05, "loss": 0.6414, "step": 46910 }, { "epoch": 1.5, "learning_rate": 1.765469736817083e-05, "loss": 0.6382, "step": 46915 }, { "epoch": 1.5, "learning_rate": 1.7653978555410394e-05, "loss": 0.6424, "step": 46920 }, { "epoch": 1.5, "learning_rate": 1.7653259647150275e-05, "loss": 0.6454, "step": 46925 }, { "epoch": 1.5, "learning_rate": 1.7652540643399447e-05, "loss": 0.6456, "step": 46930 }, { "epoch": 1.5, "learning_rate": 1.7651821544166878e-05, "loss": 0.6354, "step": 46935 }, { "epoch": 1.5, "learning_rate": 1.765110234946154e-05, "loss": 0.6396, "step": 46940 }, { "epoch": 1.5, "learning_rate": 1.7650383059292408e-05, "loss": 0.635, "step": 46945 }, { "epoch": 1.5, "learning_rate": 1.7649663673668454e-05, "loss": 0.637, "step": 46950 }, { "epoch": 1.5, "learning_rate": 1.7648944192598657e-05, "loss": 0.6429, "step": 46955 }, { "epoch": 1.5, "learning_rate": 1.764822461609199e-05, "loss": 0.6303, "step": 46960 }, { "epoch": 1.5, "learning_rate": 1.7647504944157436e-05, "loss": 0.6515, "step": 46965 }, { "epoch": 1.5, "learning_rate": 1.7646785176803973e-05, "loss": 0.6453, "step": 46970 }, { "epoch": 1.5, "learning_rate": 1.764606531404058e-05, "loss": 0.6325, "step": 46975 }, { "epoch": 1.5, "learning_rate": 1.7645345355876243e-05, "loss": 0.6261, "step": 46980 }, { "epoch": 1.5, "learning_rate": 1.764462530231994e-05, "loss": 0.638, "step": 46985 }, { "epoch": 1.5, "learning_rate": 1.7643905153380658e-05, "loss": 0.6352, "step": 46990 }, { "epoch": 1.5, "learning_rate": 1.7643184909067377e-05, "loss": 0.6445, "step": 46995 }, { "epoch": 1.5, "learning_rate": 1.764246456938909e-05, "loss": 0.6414, "step": 47000 }, { "epoch": 1.5, "learning_rate": 1.7641744134354785e-05, "loss": 0.6452, "step": 47005 }, { "epoch": 1.5, "learning_rate": 1.7641023603973447e-05, "loss": 0.6408, "step": 47010 }, { "epoch": 1.5, "learning_rate": 1.764030297825407e-05, "loss": 0.6428, "step": 47015 }, { "epoch": 1.5, "learning_rate": 1.7639582257205644e-05, "loss": 0.6427, "step": 47020 }, { "epoch": 1.5, "learning_rate": 1.7638861440837157e-05, "loss": 0.6479, "step": 47025 }, { "epoch": 1.5, "learning_rate": 1.763814052915761e-05, "loss": 0.6354, "step": 47030 }, { "epoch": 1.51, "learning_rate": 1.763741952217599e-05, "loss": 0.649, "step": 47035 }, { "epoch": 1.51, "learning_rate": 1.7636698419901304e-05, "loss": 0.631, "step": 47040 }, { "epoch": 1.51, "learning_rate": 1.763597722234254e-05, "loss": 0.6434, "step": 47045 }, { "epoch": 1.51, "learning_rate": 1.76352559295087e-05, "loss": 0.6438, "step": 47050 }, { "epoch": 1.51, "learning_rate": 1.763453454140878e-05, "loss": 0.6294, "step": 47055 }, { "epoch": 1.51, "learning_rate": 1.7633813058051785e-05, "loss": 0.6308, "step": 47060 }, { "epoch": 1.51, "learning_rate": 1.7633091479446717e-05, "loss": 0.6403, "step": 47065 }, { "epoch": 1.51, "learning_rate": 1.763236980560258e-05, "loss": 0.6404, "step": 47070 }, { "epoch": 1.51, "learning_rate": 1.7631648036528374e-05, "loss": 0.6402, "step": 47075 }, { "epoch": 1.51, "learning_rate": 1.7630926172233107e-05, "loss": 0.6368, "step": 47080 }, { "epoch": 1.51, "learning_rate": 1.7630204212725783e-05, "loss": 0.6431, "step": 47085 }, { "epoch": 1.51, "learning_rate": 1.7629482158015418e-05, "loss": 0.6404, "step": 47090 }, { "epoch": 1.51, "learning_rate": 1.7628760008111015e-05, "loss": 0.641, "step": 47095 }, { "epoch": 1.51, "learning_rate": 1.7628037763021586e-05, "loss": 0.6405, "step": 47100 }, { "epoch": 1.51, "learning_rate": 1.762731542275614e-05, "loss": 0.6419, "step": 47105 }, { "epoch": 1.51, "learning_rate": 1.762659298732369e-05, "loss": 0.6465, "step": 47110 }, { "epoch": 1.51, "learning_rate": 1.7625870456733255e-05, "loss": 0.6294, "step": 47115 }, { "epoch": 1.51, "learning_rate": 1.7625147830993847e-05, "loss": 0.6382, "step": 47120 }, { "epoch": 1.51, "learning_rate": 1.762442511011448e-05, "loss": 0.647, "step": 47125 }, { "epoch": 1.51, "learning_rate": 1.7623702294104175e-05, "loss": 0.6384, "step": 47130 }, { "epoch": 1.51, "learning_rate": 1.762297938297195e-05, "loss": 0.6419, "step": 47135 }, { "epoch": 1.51, "learning_rate": 1.762225637672682e-05, "loss": 0.6399, "step": 47140 }, { "epoch": 1.51, "learning_rate": 1.7621533275377815e-05, "loss": 0.64, "step": 47145 }, { "epoch": 1.51, "learning_rate": 1.7620810078933946e-05, "loss": 0.6411, "step": 47150 }, { "epoch": 1.51, "learning_rate": 1.7620086787404253e-05, "loss": 0.6461, "step": 47155 }, { "epoch": 1.51, "learning_rate": 1.7619363400797744e-05, "loss": 0.6418, "step": 47160 }, { "epoch": 1.51, "learning_rate": 1.7618639919123448e-05, "loss": 0.6465, "step": 47165 }, { "epoch": 1.51, "learning_rate": 1.76179163423904e-05, "loss": 0.6447, "step": 47170 }, { "epoch": 1.51, "learning_rate": 1.761719267060762e-05, "loss": 0.6531, "step": 47175 }, { "epoch": 1.51, "learning_rate": 1.761646890378414e-05, "loss": 0.6517, "step": 47180 }, { "epoch": 1.51, "learning_rate": 1.7615745041928996e-05, "loss": 0.643, "step": 47185 }, { "epoch": 1.51, "learning_rate": 1.7615021085051213e-05, "loss": 0.6313, "step": 47190 }, { "epoch": 1.51, "learning_rate": 1.7614297033159826e-05, "loss": 0.6374, "step": 47195 }, { "epoch": 1.51, "learning_rate": 1.7613572886263865e-05, "loss": 0.6446, "step": 47200 }, { "epoch": 1.51, "learning_rate": 1.7612848644372373e-05, "loss": 0.64, "step": 47205 }, { "epoch": 1.51, "learning_rate": 1.761212430749438e-05, "loss": 0.6433, "step": 47210 }, { "epoch": 1.51, "learning_rate": 1.761139987563893e-05, "loss": 0.6428, "step": 47215 }, { "epoch": 1.51, "learning_rate": 1.7610675348815055e-05, "loss": 0.6475, "step": 47220 }, { "epoch": 1.51, "learning_rate": 1.76099507270318e-05, "loss": 0.6359, "step": 47225 }, { "epoch": 1.51, "learning_rate": 1.76092260102982e-05, "loss": 0.6436, "step": 47230 }, { "epoch": 1.51, "learning_rate": 1.760850119862331e-05, "loss": 0.6267, "step": 47235 }, { "epoch": 1.51, "learning_rate": 1.760777629201616e-05, "loss": 0.6354, "step": 47240 }, { "epoch": 1.51, "learning_rate": 1.7607051290485798e-05, "loss": 0.6528, "step": 47245 }, { "epoch": 1.51, "learning_rate": 1.7606326194041274e-05, "loss": 0.646, "step": 47250 }, { "epoch": 1.51, "learning_rate": 1.7605601002691633e-05, "loss": 0.6394, "step": 47255 }, { "epoch": 1.51, "learning_rate": 1.7604875716445925e-05, "loss": 0.6438, "step": 47260 }, { "epoch": 1.51, "learning_rate": 1.7604150335313195e-05, "loss": 0.6266, "step": 47265 }, { "epoch": 1.51, "learning_rate": 1.7603424859302498e-05, "loss": 0.6447, "step": 47270 }, { "epoch": 1.51, "learning_rate": 1.7602699288422885e-05, "loss": 0.643, "step": 47275 }, { "epoch": 1.51, "learning_rate": 1.7601973622683404e-05, "loss": 0.6426, "step": 47280 }, { "epoch": 1.51, "learning_rate": 1.760124786209312e-05, "loss": 0.6392, "step": 47285 }, { "epoch": 1.51, "learning_rate": 1.760052200666108e-05, "loss": 0.6363, "step": 47290 }, { "epoch": 1.51, "learning_rate": 1.759979605639634e-05, "loss": 0.6425, "step": 47295 }, { "epoch": 1.51, "learning_rate": 1.7599070011307965e-05, "loss": 0.6379, "step": 47300 }, { "epoch": 1.51, "learning_rate": 1.7598343871405004e-05, "loss": 0.6439, "step": 47305 }, { "epoch": 1.51, "learning_rate": 1.7597617636696525e-05, "loss": 0.6333, "step": 47310 }, { "epoch": 1.51, "learning_rate": 1.759689130719159e-05, "loss": 0.6405, "step": 47315 }, { "epoch": 1.51, "learning_rate": 1.7596164882899254e-05, "loss": 0.637, "step": 47320 }, { "epoch": 1.51, "learning_rate": 1.7595438363828584e-05, "loss": 0.636, "step": 47325 }, { "epoch": 1.51, "learning_rate": 1.759471174998865e-05, "loss": 0.6462, "step": 47330 }, { "epoch": 1.51, "learning_rate": 1.7593985041388514e-05, "loss": 0.6361, "step": 47335 }, { "epoch": 1.51, "learning_rate": 1.7593258238037242e-05, "loss": 0.6436, "step": 47340 }, { "epoch": 1.52, "learning_rate": 1.75925313399439e-05, "loss": 0.6403, "step": 47345 }, { "epoch": 1.52, "learning_rate": 1.759180434711757e-05, "loss": 0.6409, "step": 47350 }, { "epoch": 1.52, "learning_rate": 1.7591077259567306e-05, "loss": 0.6335, "step": 47355 }, { "epoch": 1.52, "learning_rate": 1.759035007730219e-05, "loss": 0.6402, "step": 47360 }, { "epoch": 1.52, "learning_rate": 1.7589622800331293e-05, "loss": 0.6396, "step": 47365 }, { "epoch": 1.52, "learning_rate": 1.758889542866369e-05, "loss": 0.6414, "step": 47370 }, { "epoch": 1.52, "learning_rate": 1.7588167962308458e-05, "loss": 0.6362, "step": 47375 }, { "epoch": 1.52, "learning_rate": 1.758744040127467e-05, "loss": 0.6399, "step": 47380 }, { "epoch": 1.52, "learning_rate": 1.7586712745571402e-05, "loss": 0.6339, "step": 47385 }, { "epoch": 1.52, "learning_rate": 1.758598499520774e-05, "loss": 0.645, "step": 47390 }, { "epoch": 1.52, "learning_rate": 1.758525715019276e-05, "loss": 0.6414, "step": 47395 }, { "epoch": 1.52, "learning_rate": 1.7584529210535545e-05, "loss": 0.6391, "step": 47400 }, { "epoch": 1.52, "learning_rate": 1.7583801176245176e-05, "loss": 0.6284, "step": 47405 }, { "epoch": 1.52, "learning_rate": 1.7583073047330738e-05, "loss": 0.6293, "step": 47410 }, { "epoch": 1.52, "learning_rate": 1.7582344823801317e-05, "loss": 0.6415, "step": 47415 }, { "epoch": 1.52, "learning_rate": 1.7581616505665996e-05, "loss": 0.6448, "step": 47420 }, { "epoch": 1.52, "learning_rate": 1.7580888092933867e-05, "loss": 0.6408, "step": 47425 }, { "epoch": 1.52, "learning_rate": 1.7580159585614015e-05, "loss": 0.6423, "step": 47430 }, { "epoch": 1.52, "learning_rate": 1.7579430983715525e-05, "loss": 0.6498, "step": 47435 }, { "epoch": 1.52, "learning_rate": 1.7578702287247494e-05, "loss": 0.6301, "step": 47440 }, { "epoch": 1.52, "learning_rate": 1.757797349621902e-05, "loss": 0.6447, "step": 47445 }, { "epoch": 1.52, "learning_rate": 1.7577244610639183e-05, "loss": 0.6441, "step": 47450 }, { "epoch": 1.52, "learning_rate": 1.7576515630517087e-05, "loss": 0.6372, "step": 47455 }, { "epoch": 1.52, "learning_rate": 1.757578655586182e-05, "loss": 0.6608, "step": 47460 }, { "epoch": 1.52, "learning_rate": 1.7575057386682487e-05, "loss": 0.6465, "step": 47465 }, { "epoch": 1.52, "learning_rate": 1.7574328122988183e-05, "loss": 0.6449, "step": 47470 }, { "epoch": 1.52, "learning_rate": 1.7573598764788e-05, "loss": 0.6414, "step": 47475 }, { "epoch": 1.52, "learning_rate": 1.7572869312091052e-05, "loss": 0.641, "step": 47480 }, { "epoch": 1.52, "learning_rate": 1.757213976490643e-05, "loss": 0.6423, "step": 47485 }, { "epoch": 1.52, "learning_rate": 1.7571410123243236e-05, "loss": 0.649, "step": 47490 }, { "epoch": 1.52, "learning_rate": 1.757068038711058e-05, "loss": 0.6338, "step": 47495 }, { "epoch": 1.52, "learning_rate": 1.7569950556517566e-05, "loss": 0.6373, "step": 47500 }, { "epoch": 1.52, "learning_rate": 1.7569220631473297e-05, "loss": 0.6465, "step": 47505 }, { "epoch": 1.52, "learning_rate": 1.7568490611986884e-05, "loss": 0.6449, "step": 47510 }, { "epoch": 1.52, "learning_rate": 1.756776049806743e-05, "loss": 0.6358, "step": 47515 }, { "epoch": 1.52, "learning_rate": 1.756703028972405e-05, "loss": 0.6384, "step": 47520 }, { "epoch": 1.52, "learning_rate": 1.7566299986965855e-05, "loss": 0.6479, "step": 47525 }, { "epoch": 1.52, "learning_rate": 1.7565569589801952e-05, "loss": 0.6416, "step": 47530 }, { "epoch": 1.52, "learning_rate": 1.7564839098241458e-05, "loss": 0.6297, "step": 47535 }, { "epoch": 1.52, "learning_rate": 1.7564108512293487e-05, "loss": 0.636, "step": 47540 }, { "epoch": 1.52, "learning_rate": 1.7563377831967157e-05, "loss": 0.6231, "step": 47545 }, { "epoch": 1.52, "learning_rate": 1.756264705727158e-05, "loss": 0.6417, "step": 47550 }, { "epoch": 1.52, "learning_rate": 1.7561916188215877e-05, "loss": 0.6494, "step": 47555 }, { "epoch": 1.52, "learning_rate": 1.7561185224809164e-05, "loss": 0.6361, "step": 47560 }, { "epoch": 1.52, "learning_rate": 1.756045416706057e-05, "loss": 0.6361, "step": 47565 }, { "epoch": 1.52, "learning_rate": 1.7559723014979205e-05, "loss": 0.6474, "step": 47570 }, { "epoch": 1.52, "learning_rate": 1.7558991768574197e-05, "loss": 0.6353, "step": 47575 }, { "epoch": 1.52, "learning_rate": 1.7558260427854673e-05, "loss": 0.643, "step": 47580 }, { "epoch": 1.52, "learning_rate": 1.755752899282975e-05, "loss": 0.6402, "step": 47585 }, { "epoch": 1.52, "learning_rate": 1.7556797463508565e-05, "loss": 0.6482, "step": 47590 }, { "epoch": 1.52, "learning_rate": 1.7556065839900232e-05, "loss": 0.6282, "step": 47595 }, { "epoch": 1.52, "learning_rate": 1.7555334122013894e-05, "loss": 0.6511, "step": 47600 }, { "epoch": 1.52, "learning_rate": 1.7554602309858674e-05, "loss": 0.6411, "step": 47605 }, { "epoch": 1.52, "learning_rate": 1.7553870403443696e-05, "loss": 0.6463, "step": 47610 }, { "epoch": 1.52, "learning_rate": 1.7553138402778102e-05, "loss": 0.64, "step": 47615 }, { "epoch": 1.52, "learning_rate": 1.7552406307871023e-05, "loss": 0.6329, "step": 47620 }, { "epoch": 1.52, "learning_rate": 1.7551674118731592e-05, "loss": 0.6362, "step": 47625 }, { "epoch": 1.52, "learning_rate": 1.7550941835368945e-05, "loss": 0.6346, "step": 47630 }, { "epoch": 1.52, "learning_rate": 1.755020945779222e-05, "loss": 0.6466, "step": 47635 }, { "epoch": 1.52, "learning_rate": 1.7549476986010552e-05, "loss": 0.6412, "step": 47640 }, { "epoch": 1.52, "learning_rate": 1.7548744420033085e-05, "loss": 0.6342, "step": 47645 }, { "epoch": 1.52, "learning_rate": 1.754801175986895e-05, "loss": 0.6336, "step": 47650 }, { "epoch": 1.52, "learning_rate": 1.7547279005527303e-05, "loss": 0.6369, "step": 47655 }, { "epoch": 1.53, "learning_rate": 1.7546546157017274e-05, "loss": 0.6216, "step": 47660 }, { "epoch": 1.53, "learning_rate": 1.7545813214348012e-05, "loss": 0.6504, "step": 47665 }, { "epoch": 1.53, "learning_rate": 1.754508017752866e-05, "loss": 0.6328, "step": 47670 }, { "epoch": 1.53, "learning_rate": 1.7544347046568363e-05, "loss": 0.6455, "step": 47675 }, { "epoch": 1.53, "learning_rate": 1.7543613821476277e-05, "loss": 0.6384, "step": 47680 }, { "epoch": 1.53, "learning_rate": 1.7542880502261542e-05, "loss": 0.6401, "step": 47685 }, { "epoch": 1.53, "learning_rate": 1.7542147088933307e-05, "loss": 0.6328, "step": 47690 }, { "epoch": 1.53, "learning_rate": 1.754141358150073e-05, "loss": 0.6446, "step": 47695 }, { "epoch": 1.53, "learning_rate": 1.7540679979972958e-05, "loss": 0.6389, "step": 47700 }, { "epoch": 1.53, "learning_rate": 1.7539946284359146e-05, "loss": 0.6301, "step": 47705 }, { "epoch": 1.53, "learning_rate": 1.7539212494668447e-05, "loss": 0.6381, "step": 47710 }, { "epoch": 1.53, "learning_rate": 1.7538478610910016e-05, "loss": 0.6372, "step": 47715 }, { "epoch": 1.53, "learning_rate": 1.7537744633093015e-05, "loss": 0.6446, "step": 47720 }, { "epoch": 1.53, "learning_rate": 1.7537010561226595e-05, "loss": 0.6295, "step": 47725 }, { "epoch": 1.53, "learning_rate": 1.753627639531992e-05, "loss": 0.6468, "step": 47730 }, { "epoch": 1.53, "learning_rate": 1.7535542135382147e-05, "loss": 0.6398, "step": 47735 }, { "epoch": 1.53, "learning_rate": 1.753480778142244e-05, "loss": 0.6383, "step": 47740 }, { "epoch": 1.53, "learning_rate": 1.7534073333449958e-05, "loss": 0.628, "step": 47745 }, { "epoch": 1.53, "learning_rate": 1.7533338791473872e-05, "loss": 0.6262, "step": 47750 }, { "epoch": 1.53, "learning_rate": 1.7532604155503336e-05, "loss": 0.6446, "step": 47755 }, { "epoch": 1.53, "learning_rate": 1.753186942554753e-05, "loss": 0.6362, "step": 47760 }, { "epoch": 1.53, "learning_rate": 1.753113460161561e-05, "loss": 0.6392, "step": 47765 }, { "epoch": 1.53, "learning_rate": 1.7530399683716746e-05, "loss": 0.6405, "step": 47770 }, { "epoch": 1.53, "learning_rate": 1.752966467186011e-05, "loss": 0.6291, "step": 47775 }, { "epoch": 1.53, "learning_rate": 1.7528929566054877e-05, "loss": 0.6312, "step": 47780 }, { "epoch": 1.53, "learning_rate": 1.7528194366310213e-05, "loss": 0.6398, "step": 47785 }, { "epoch": 1.53, "learning_rate": 1.752745907263529e-05, "loss": 0.6313, "step": 47790 }, { "epoch": 1.53, "learning_rate": 1.7526723685039288e-05, "loss": 0.6545, "step": 47795 }, { "epoch": 1.53, "learning_rate": 1.752598820353138e-05, "loss": 0.6311, "step": 47800 }, { "epoch": 1.53, "learning_rate": 1.7525252628120743e-05, "loss": 0.6299, "step": 47805 }, { "epoch": 1.53, "learning_rate": 1.7524516958816555e-05, "loss": 0.6342, "step": 47810 }, { "epoch": 1.53, "learning_rate": 1.752378119562799e-05, "loss": 0.6451, "step": 47815 }, { "epoch": 1.53, "learning_rate": 1.7523045338564237e-05, "loss": 0.6328, "step": 47820 }, { "epoch": 1.53, "learning_rate": 1.7522309387634472e-05, "loss": 0.6409, "step": 47825 }, { "epoch": 1.53, "learning_rate": 1.752157334284788e-05, "loss": 0.6479, "step": 47830 }, { "epoch": 1.53, "learning_rate": 1.752083720421364e-05, "loss": 0.6365, "step": 47835 }, { "epoch": 1.53, "learning_rate": 1.7520100971740942e-05, "loss": 0.6376, "step": 47840 }, { "epoch": 1.53, "learning_rate": 1.7519364645438972e-05, "loss": 0.6494, "step": 47845 }, { "epoch": 1.53, "learning_rate": 1.7518628225316915e-05, "loss": 0.6491, "step": 47850 }, { "epoch": 1.53, "learning_rate": 1.7517891711383957e-05, "loss": 0.6334, "step": 47855 }, { "epoch": 1.53, "learning_rate": 1.7517155103649293e-05, "loss": 0.6371, "step": 47860 }, { "epoch": 1.53, "learning_rate": 1.7516418402122112e-05, "loss": 0.6411, "step": 47865 }, { "epoch": 1.53, "learning_rate": 1.7515681606811602e-05, "loss": 0.6454, "step": 47870 }, { "epoch": 1.53, "learning_rate": 1.7514944717726962e-05, "loss": 0.6293, "step": 47875 }, { "epoch": 1.53, "learning_rate": 1.7514207734877384e-05, "loss": 0.6296, "step": 47880 }, { "epoch": 1.53, "learning_rate": 1.751347065827206e-05, "loss": 0.6476, "step": 47885 }, { "epoch": 1.53, "learning_rate": 1.7512733487920193e-05, "loss": 0.6356, "step": 47890 }, { "epoch": 1.53, "learning_rate": 1.7511996223830974e-05, "loss": 0.647, "step": 47895 }, { "epoch": 1.53, "learning_rate": 1.751125886601361e-05, "loss": 0.6364, "step": 47900 }, { "epoch": 1.53, "learning_rate": 1.7510521414477292e-05, "loss": 0.6435, "step": 47905 }, { "epoch": 1.53, "learning_rate": 1.7509783869231228e-05, "loss": 0.6491, "step": 47910 }, { "epoch": 1.53, "learning_rate": 1.7509046230284616e-05, "loss": 0.6381, "step": 47915 }, { "epoch": 1.53, "learning_rate": 1.7508308497646664e-05, "loss": 0.6437, "step": 47920 }, { "epoch": 1.53, "learning_rate": 1.7507570671326573e-05, "loss": 0.6424, "step": 47925 }, { "epoch": 1.53, "learning_rate": 1.7506832751333553e-05, "loss": 0.6289, "step": 47930 }, { "epoch": 1.53, "learning_rate": 1.7506094737676808e-05, "loss": 0.6252, "step": 47935 }, { "epoch": 1.53, "learning_rate": 1.7505356630365544e-05, "loss": 0.6401, "step": 47940 }, { "epoch": 1.53, "learning_rate": 1.750461842940897e-05, "loss": 0.6468, "step": 47945 }, { "epoch": 1.53, "learning_rate": 1.750388013481631e-05, "loss": 0.6371, "step": 47950 }, { "epoch": 1.53, "learning_rate": 1.7503141746596758e-05, "loss": 0.6351, "step": 47955 }, { "epoch": 1.53, "learning_rate": 1.750240326475954e-05, "loss": 0.6279, "step": 47960 }, { "epoch": 1.53, "learning_rate": 1.750166468931386e-05, "loss": 0.6368, "step": 47965 }, { "epoch": 1.54, "learning_rate": 1.750092602026894e-05, "loss": 0.6238, "step": 47970 }, { "epoch": 1.54, "learning_rate": 1.7500187257634e-05, "loss": 0.6393, "step": 47975 }, { "epoch": 1.54, "learning_rate": 1.7499448401418243e-05, "loss": 0.6476, "step": 47980 }, { "epoch": 1.54, "learning_rate": 1.7498709451630904e-05, "loss": 0.6275, "step": 47985 }, { "epoch": 1.54, "learning_rate": 1.7497970408281192e-05, "loss": 0.6402, "step": 47990 }, { "epoch": 1.54, "learning_rate": 1.7497231271378335e-05, "loss": 0.6296, "step": 47995 }, { "epoch": 1.54, "learning_rate": 1.749649204093155e-05, "loss": 0.6321, "step": 48000 } ], "logging_steps": 5, "max_steps": 156250, "num_train_epochs": 5, "save_steps": 2000, "total_flos": 3.310222499070345e+18, "trial_name": null, "trial_params": null }