{"current_steps": 10, "total_steps": 25254, "loss": 0.5847, "learning_rate": 6.596306068601583e-07, "epoch": 0.0011879306248515087, "percentage": 0.04, "elapsed_time": "0:00:38", "remaining_time": "1 day, 3:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20, "total_steps": 25254, "loss": 0.5711, "learning_rate": 1.3192612137203166e-06, "epoch": 0.0023758612497030173, "percentage": 0.08, "elapsed_time": "0:01:00", "remaining_time": "21:19:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 30, "total_steps": 25254, "loss": 0.5244, "learning_rate": 1.9788918205804753e-06, "epoch": 0.003563791874554526, "percentage": 0.12, "elapsed_time": "0:01:22", "remaining_time": "19:20:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 40, "total_steps": 25254, "loss": 0.4198, "learning_rate": 2.6385224274406333e-06, "epoch": 0.004751722499406035, "percentage": 0.16, "elapsed_time": "0:01:44", "remaining_time": "18:16:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 50, "total_steps": 25254, "loss": 0.3617, "learning_rate": 3.2981530343007917e-06, "epoch": 0.005939653124257543, "percentage": 0.2, "elapsed_time": "0:02:07", "remaining_time": "17:49:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 60, "total_steps": 25254, "loss": 0.3351, "learning_rate": 3.9577836411609505e-06, "epoch": 0.007127583749109052, "percentage": 0.24, "elapsed_time": "0:02:29", "remaining_time": "17:26:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 70, "total_steps": 25254, "loss": 0.3136, "learning_rate": 4.617414248021108e-06, "epoch": 0.00831551437396056, "percentage": 0.28, "elapsed_time": "0:02:50", "remaining_time": "17:05:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 80, "total_steps": 25254, "loss": 0.31, "learning_rate": 5.2770448548812665e-06, "epoch": 0.00950344499881207, "percentage": 0.32, "elapsed_time": "0:03:12", "remaining_time": "16:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 90, "total_steps": 25254, "loss": 0.2947, "learning_rate": 5.936675461741425e-06, "epoch": 0.010691375623663579, "percentage": 0.36, "elapsed_time": "0:03:34", "remaining_time": "16:40:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 100, "total_steps": 25254, "loss": 0.2869, "learning_rate": 6.596306068601583e-06, "epoch": 0.011879306248515086, "percentage": 0.4, "elapsed_time": "0:03:56", "remaining_time": "16:32:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 110, "total_steps": 25254, "loss": 0.2782, "learning_rate": 7.255936675461741e-06, "epoch": 0.013067236873366595, "percentage": 0.44, "elapsed_time": "0:04:19", "remaining_time": "16:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 120, "total_steps": 25254, "loss": 0.2753, "learning_rate": 7.915567282321901e-06, "epoch": 0.014255167498218105, "percentage": 0.48, "elapsed_time": "0:04:41", "remaining_time": "16:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 130, "total_steps": 25254, "loss": 0.2667, "learning_rate": 8.575197889182058e-06, "epoch": 0.015443098123069612, "percentage": 0.51, "elapsed_time": "0:05:03", "remaining_time": "16:17:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 140, "total_steps": 25254, "loss": 0.2591, "learning_rate": 9.234828496042216e-06, "epoch": 0.01663102874792112, "percentage": 0.55, "elapsed_time": "0:05:25", "remaining_time": "16:14:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 150, "total_steps": 25254, "loss": 0.2581, "learning_rate": 9.894459102902375e-06, "epoch": 0.01781895937277263, "percentage": 0.59, "elapsed_time": "0:05:47", "remaining_time": "16:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 160, "total_steps": 25254, "loss": 0.2502, "learning_rate": 1.0554089709762533e-05, "epoch": 0.01900688999762414, "percentage": 0.63, "elapsed_time": "0:06:08", "remaining_time": "16:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 170, "total_steps": 25254, "loss": 0.2468, "learning_rate": 1.1213720316622692e-05, "epoch": 0.020194820622475646, "percentage": 0.67, "elapsed_time": "0:06:30", "remaining_time": "16:00:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 180, "total_steps": 25254, "loss": 0.2457, "learning_rate": 1.187335092348285e-05, "epoch": 0.021382751247327157, "percentage": 0.71, "elapsed_time": "0:06:51", "remaining_time": "15:55:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 190, "total_steps": 25254, "loss": 0.2449, "learning_rate": 1.2532981530343008e-05, "epoch": 0.022570681872178665, "percentage": 0.75, "elapsed_time": "0:07:14", "remaining_time": "15:54:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 200, "total_steps": 25254, "loss": 0.2396, "learning_rate": 1.3192612137203167e-05, "epoch": 0.023758612497030172, "percentage": 0.79, "elapsed_time": "0:07:35", "remaining_time": "15:51:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 210, "total_steps": 25254, "loss": 0.2346, "learning_rate": 1.3852242744063327e-05, "epoch": 0.024946543121881683, "percentage": 0.83, "elapsed_time": "0:07:57", "remaining_time": "15:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 220, "total_steps": 25254, "loss": 0.2341, "learning_rate": 1.4511873350923482e-05, "epoch": 0.02613447374673319, "percentage": 0.87, "elapsed_time": "0:08:19", "remaining_time": "15:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 230, "total_steps": 25254, "loss": 0.2323, "learning_rate": 1.5171503957783642e-05, "epoch": 0.0273224043715847, "percentage": 0.91, "elapsed_time": "0:08:40", "remaining_time": "15:43:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 240, "total_steps": 25254, "loss": 0.2318, "learning_rate": 1.5831134564643802e-05, "epoch": 0.02851033499643621, "percentage": 0.95, "elapsed_time": "0:09:02", "remaining_time": "15:42:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 250, "total_steps": 25254, "loss": 0.2283, "learning_rate": 1.6490765171503957e-05, "epoch": 0.029698265621287717, "percentage": 0.99, "elapsed_time": "0:09:25", "remaining_time": "15:41:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 260, "total_steps": 25254, "loss": 0.2263, "learning_rate": 1.7150395778364116e-05, "epoch": 0.030886196246139225, "percentage": 1.03, "elapsed_time": "0:09:46", "remaining_time": "15:39:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 270, "total_steps": 25254, "loss": 0.2287, "learning_rate": 1.7810026385224277e-05, "epoch": 0.03207412687099073, "percentage": 1.07, "elapsed_time": "0:10:08", "remaining_time": "15:38:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 280, "total_steps": 25254, "loss": 0.2265, "learning_rate": 1.8469656992084432e-05, "epoch": 0.03326205749584224, "percentage": 1.11, "elapsed_time": "0:10:30", "remaining_time": "15:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 290, "total_steps": 25254, "loss": 0.223, "learning_rate": 1.912928759894459e-05, "epoch": 0.034449988120693754, "percentage": 1.15, "elapsed_time": "0:10:52", "remaining_time": "15:36:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 300, "total_steps": 25254, "loss": 0.2194, "learning_rate": 1.978891820580475e-05, "epoch": 0.03563791874554526, "percentage": 1.19, "elapsed_time": "0:11:14", "remaining_time": "15:35:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 310, "total_steps": 25254, "loss": 0.218, "learning_rate": 2.0448548812664908e-05, "epoch": 0.03682584937039677, "percentage": 1.23, "elapsed_time": "0:11:36", "remaining_time": "15:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 320, "total_steps": 25254, "loss": 0.2192, "learning_rate": 2.1108179419525066e-05, "epoch": 0.03801377999524828, "percentage": 1.27, "elapsed_time": "0:11:58", "remaining_time": "15:32:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 330, "total_steps": 25254, "loss": 0.2193, "learning_rate": 2.1767810026385225e-05, "epoch": 0.039201710620099785, "percentage": 1.31, "elapsed_time": "0:12:19", "remaining_time": "15:30:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 340, "total_steps": 25254, "loss": 0.2098, "learning_rate": 2.2427440633245383e-05, "epoch": 0.04038964124495129, "percentage": 1.35, "elapsed_time": "0:12:41", "remaining_time": "15:29:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 350, "total_steps": 25254, "loss": 0.2129, "learning_rate": 2.308707124010554e-05, "epoch": 0.04157757186980281, "percentage": 1.39, "elapsed_time": "0:13:03", "remaining_time": "15:29:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 360, "total_steps": 25254, "loss": 0.211, "learning_rate": 2.37467018469657e-05, "epoch": 0.042765502494654314, "percentage": 1.43, "elapsed_time": "0:13:25", "remaining_time": "15:28:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 370, "total_steps": 25254, "loss": 0.2164, "learning_rate": 2.4406332453825858e-05, "epoch": 0.04395343311950582, "percentage": 1.47, "elapsed_time": "0:13:47", "remaining_time": "15:27:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 380, "total_steps": 25254, "loss": 0.2132, "learning_rate": 2.5065963060686017e-05, "epoch": 0.04514136374435733, "percentage": 1.5, "elapsed_time": "0:14:09", "remaining_time": "15:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 390, "total_steps": 25254, "loss": 0.2091, "learning_rate": 2.572559366754618e-05, "epoch": 0.04632929436920884, "percentage": 1.54, "elapsed_time": "0:14:31", "remaining_time": "15:26:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 400, "total_steps": 25254, "loss": 0.2094, "learning_rate": 2.6385224274406334e-05, "epoch": 0.047517224994060345, "percentage": 1.58, "elapsed_time": "0:14:53", "remaining_time": "15:25:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 410, "total_steps": 25254, "loss": 0.2084, "learning_rate": 2.7044854881266492e-05, "epoch": 0.04870515561891185, "percentage": 1.62, "elapsed_time": "0:15:14", "remaining_time": "15:23:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 420, "total_steps": 25254, "loss": 0.2107, "learning_rate": 2.7704485488126654e-05, "epoch": 0.04989308624376337, "percentage": 1.66, "elapsed_time": "0:15:36", "remaining_time": "15:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 430, "total_steps": 25254, "loss": 0.2062, "learning_rate": 2.836411609498681e-05, "epoch": 0.051081016868614874, "percentage": 1.7, "elapsed_time": "0:15:58", "remaining_time": "15:21:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 440, "total_steps": 25254, "loss": 0.2093, "learning_rate": 2.9023746701846964e-05, "epoch": 0.05226894749346638, "percentage": 1.74, "elapsed_time": "0:16:19", "remaining_time": "15:20:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 450, "total_steps": 25254, "loss": 0.21, "learning_rate": 2.968337730870713e-05, "epoch": 0.05345687811831789, "percentage": 1.78, "elapsed_time": "0:16:41", "remaining_time": "15:19:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 460, "total_steps": 25254, "loss": 0.2054, "learning_rate": 3.0343007915567284e-05, "epoch": 0.0546448087431694, "percentage": 1.82, "elapsed_time": "0:17:03", "remaining_time": "15:19:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 470, "total_steps": 25254, "loss": 0.2025, "learning_rate": 3.100263852242744e-05, "epoch": 0.055832739368020905, "percentage": 1.86, "elapsed_time": "0:17:26", "remaining_time": "15:19:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 480, "total_steps": 25254, "loss": 0.2001, "learning_rate": 3.1662269129287604e-05, "epoch": 0.05702066999287242, "percentage": 1.9, "elapsed_time": "0:17:47", "remaining_time": "15:18:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 490, "total_steps": 25254, "loss": 0.2048, "learning_rate": 3.232189973614776e-05, "epoch": 0.05820860061772393, "percentage": 1.94, "elapsed_time": "0:18:09", "remaining_time": "15:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 500, "total_steps": 25254, "loss": 0.203, "learning_rate": 3.2981530343007914e-05, "epoch": 0.059396531242575434, "percentage": 1.98, "elapsed_time": "0:18:31", "remaining_time": "15:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 510, "total_steps": 25254, "loss": 0.2003, "learning_rate": 3.3641160949868076e-05, "epoch": 0.06058446186742694, "percentage": 2.02, "elapsed_time": "0:18:53", "remaining_time": "15:16:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 520, "total_steps": 25254, "loss": 0.1997, "learning_rate": 3.430079155672823e-05, "epoch": 0.06177239249227845, "percentage": 2.06, "elapsed_time": "0:19:14", "remaining_time": "15:15:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 530, "total_steps": 25254, "loss": 0.2014, "learning_rate": 3.496042216358839e-05, "epoch": 0.06296032311712996, "percentage": 2.1, "elapsed_time": "0:19:36", "remaining_time": "15:14:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 540, "total_steps": 25254, "loss": 0.2037, "learning_rate": 3.5620052770448555e-05, "epoch": 0.06414825374198146, "percentage": 2.14, "elapsed_time": "0:19:58", "remaining_time": "15:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 550, "total_steps": 25254, "loss": 0.2028, "learning_rate": 3.627968337730871e-05, "epoch": 0.06533618436683297, "percentage": 2.18, "elapsed_time": "0:20:19", "remaining_time": "15:12:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 560, "total_steps": 25254, "loss": 0.2013, "learning_rate": 3.6939313984168865e-05, "epoch": 0.06652411499168448, "percentage": 2.22, "elapsed_time": "0:20:40", "remaining_time": "15:11:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 570, "total_steps": 25254, "loss": 0.1974, "learning_rate": 3.759894459102902e-05, "epoch": 0.06771204561653599, "percentage": 2.26, "elapsed_time": "0:21:02", "remaining_time": "15:11:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 580, "total_steps": 25254, "loss": 0.2017, "learning_rate": 3.825857519788918e-05, "epoch": 0.06889997624138751, "percentage": 2.3, "elapsed_time": "0:21:24", "remaining_time": "15:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 590, "total_steps": 25254, "loss": 0.1955, "learning_rate": 3.8918205804749344e-05, "epoch": 0.07008790686623902, "percentage": 2.34, "elapsed_time": "0:21:46", "remaining_time": "15:10:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 600, "total_steps": 25254, "loss": 0.2019, "learning_rate": 3.95778364116095e-05, "epoch": 0.07127583749109052, "percentage": 2.38, "elapsed_time": "0:22:08", "remaining_time": "15:09:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 610, "total_steps": 25254, "loss": 0.1957, "learning_rate": 4.023746701846966e-05, "epoch": 0.07246376811594203, "percentage": 2.42, "elapsed_time": "0:22:29", "remaining_time": "15:08:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 620, "total_steps": 25254, "loss": 0.1967, "learning_rate": 4.0897097625329815e-05, "epoch": 0.07365169874079354, "percentage": 2.46, "elapsed_time": "0:22:50", "remaining_time": "15:07:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 630, "total_steps": 25254, "loss": 0.1937, "learning_rate": 4.155672823218997e-05, "epoch": 0.07483962936564505, "percentage": 2.49, "elapsed_time": "0:23:12", "remaining_time": "15:07:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 640, "total_steps": 25254, "loss": 0.196, "learning_rate": 4.221635883905013e-05, "epoch": 0.07602755999049655, "percentage": 2.53, "elapsed_time": "0:23:34", "remaining_time": "15:06:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 650, "total_steps": 25254, "loss": 0.2008, "learning_rate": 4.2875989445910294e-05, "epoch": 0.07721549061534806, "percentage": 2.57, "elapsed_time": "0:23:55", "remaining_time": "15:05:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 660, "total_steps": 25254, "loss": 0.1957, "learning_rate": 4.353562005277045e-05, "epoch": 0.07840342124019957, "percentage": 2.61, "elapsed_time": "0:24:17", "remaining_time": "15:05:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 670, "total_steps": 25254, "loss": 0.1941, "learning_rate": 4.419525065963061e-05, "epoch": 0.07959135186505108, "percentage": 2.65, "elapsed_time": "0:24:40", "remaining_time": "15:05:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 680, "total_steps": 25254, "loss": 0.1934, "learning_rate": 4.4854881266490766e-05, "epoch": 0.08077928248990258, "percentage": 2.69, "elapsed_time": "0:25:01", "remaining_time": "15:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 690, "total_steps": 25254, "loss": 0.1984, "learning_rate": 4.551451187335092e-05, "epoch": 0.08196721311475409, "percentage": 2.73, "elapsed_time": "0:25:24", "remaining_time": "15:04:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 700, "total_steps": 25254, "loss": 0.1948, "learning_rate": 4.617414248021108e-05, "epoch": 0.08315514373960561, "percentage": 2.77, "elapsed_time": "0:25:46", "remaining_time": "15:03:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 710, "total_steps": 25254, "loss": 0.1896, "learning_rate": 4.6833773087071245e-05, "epoch": 0.08434307436445712, "percentage": 2.81, "elapsed_time": "0:26:08", "remaining_time": "15:03:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 720, "total_steps": 25254, "loss": 0.1957, "learning_rate": 4.74934036939314e-05, "epoch": 0.08553100498930863, "percentage": 2.85, "elapsed_time": "0:26:31", "remaining_time": "15:03:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 730, "total_steps": 25254, "loss": 0.1974, "learning_rate": 4.815303430079156e-05, "epoch": 0.08671893561416014, "percentage": 2.89, "elapsed_time": "0:26:53", "remaining_time": "15:03:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 740, "total_steps": 25254, "loss": 0.1954, "learning_rate": 4.8812664907651717e-05, "epoch": 0.08790686623901164, "percentage": 2.93, "elapsed_time": "0:27:15", "remaining_time": "15:03:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 750, "total_steps": 25254, "loss": 0.1913, "learning_rate": 4.947229551451187e-05, "epoch": 0.08909479686386315, "percentage": 2.97, "elapsed_time": "0:27:38", "remaining_time": "15:03:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 760, "total_steps": 25254, "loss": 0.1938, "learning_rate": 4.999999917760701e-05, "epoch": 0.09028272748871466, "percentage": 3.01, "elapsed_time": "0:28:00", "remaining_time": "15:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 770, "total_steps": 25254, "loss": 0.1933, "learning_rate": 4.999997039385799e-05, "epoch": 0.09147065811356617, "percentage": 3.05, "elapsed_time": "0:28:22", "remaining_time": "15:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 780, "total_steps": 25254, "loss": 0.1921, "learning_rate": 4.999990049051348e-05, "epoch": 0.09265858873841767, "percentage": 3.09, "elapsed_time": "0:28:43", "remaining_time": "15:01:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 790, "total_steps": 25254, "loss": 0.1909, "learning_rate": 4.999978946768849e-05, "epoch": 0.09384651936326918, "percentage": 3.13, "elapsed_time": "0:29:05", "remaining_time": "15:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 800, "total_steps": 25254, "loss": 0.1889, "learning_rate": 4.99996373255656e-05, "epoch": 0.09503444998812069, "percentage": 3.17, "elapsed_time": "0:29:27", "remaining_time": "15:00:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 810, "total_steps": 25254, "loss": 0.1966, "learning_rate": 4.9999444064395065e-05, "epoch": 0.0962223806129722, "percentage": 3.21, "elapsed_time": "0:29:49", "remaining_time": "14:59:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 820, "total_steps": 25254, "loss": 0.1912, "learning_rate": 4.999920968449475e-05, "epoch": 0.0974103112378237, "percentage": 3.25, "elapsed_time": "0:30:11", "remaining_time": "14:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 830, "total_steps": 25254, "loss": 0.1897, "learning_rate": 4.999893418625017e-05, "epoch": 0.09859824186267523, "percentage": 3.29, "elapsed_time": "0:30:34", "remaining_time": "14:59:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 840, "total_steps": 25254, "loss": 0.1858, "learning_rate": 4.999861757011446e-05, "epoch": 0.09978617248752673, "percentage": 3.33, "elapsed_time": "0:30:56", "remaining_time": "14:59:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 850, "total_steps": 25254, "loss": 0.1954, "learning_rate": 4.999825983660837e-05, "epoch": 0.10097410311237824, "percentage": 3.37, "elapsed_time": "0:31:17", "remaining_time": "14:58:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 860, "total_steps": 25254, "loss": 0.1882, "learning_rate": 4.9997860986320314e-05, "epoch": 0.10216203373722975, "percentage": 3.41, "elapsed_time": "0:31:39", "remaining_time": "14:57:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 870, "total_steps": 25254, "loss": 0.1932, "learning_rate": 4.99974210199063e-05, "epoch": 0.10334996436208126, "percentage": 3.44, "elapsed_time": "0:32:01", "remaining_time": "14:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 880, "total_steps": 25254, "loss": 0.1838, "learning_rate": 4.9996939938089994e-05, "epoch": 0.10453789498693276, "percentage": 3.48, "elapsed_time": "0:32:22", "remaining_time": "14:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 890, "total_steps": 25254, "loss": 0.1897, "learning_rate": 4.999641774166265e-05, "epoch": 0.10572582561178427, "percentage": 3.52, "elapsed_time": "0:32:45", "remaining_time": "14:56:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 900, "total_steps": 25254, "loss": 0.1919, "learning_rate": 4.99958544314832e-05, "epoch": 0.10691375623663578, "percentage": 3.56, "elapsed_time": "0:33:07", "remaining_time": "14:56:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 910, "total_steps": 25254, "loss": 0.1874, "learning_rate": 4.9995250008478145e-05, "epoch": 0.10810168686148729, "percentage": 3.6, "elapsed_time": "0:33:28", "remaining_time": "14:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 920, "total_steps": 25254, "loss": 0.1873, "learning_rate": 4.9994604473641635e-05, "epoch": 0.1092896174863388, "percentage": 3.64, "elapsed_time": "0:33:51", "remaining_time": "14:55:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 930, "total_steps": 25254, "loss": 0.189, "learning_rate": 4.9993917828035444e-05, "epoch": 0.1104775481111903, "percentage": 3.68, "elapsed_time": "0:34:13", "remaining_time": "14:55:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 940, "total_steps": 25254, "loss": 0.1871, "learning_rate": 4.999319007278896e-05, "epoch": 0.11166547873604181, "percentage": 3.72, "elapsed_time": "0:34:34", "remaining_time": "14:54:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 950, "total_steps": 25254, "loss": 0.1878, "learning_rate": 4.999242120909916e-05, "epoch": 0.11285340936089332, "percentage": 3.76, "elapsed_time": "0:34:56", "remaining_time": "14:53:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 960, "total_steps": 25254, "loss": 0.1858, "learning_rate": 4.999161123823069e-05, "epoch": 0.11404133998574484, "percentage": 3.8, "elapsed_time": "0:35:18", "remaining_time": "14:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 970, "total_steps": 25254, "loss": 0.1867, "learning_rate": 4.999076016151576e-05, "epoch": 0.11522927061059635, "percentage": 3.84, "elapsed_time": "0:35:40", "remaining_time": "14:53:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 980, "total_steps": 25254, "loss": 0.1878, "learning_rate": 4.998986798035421e-05, "epoch": 0.11641720123544785, "percentage": 3.88, "elapsed_time": "0:36:02", "remaining_time": "14:52:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 990, "total_steps": 25254, "loss": 0.1878, "learning_rate": 4.9988934696213505e-05, "epoch": 0.11760513186029936, "percentage": 3.92, "elapsed_time": "0:36:24", "remaining_time": "14:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1000, "total_steps": 25254, "loss": 0.1894, "learning_rate": 4.998796031062868e-05, "epoch": 0.11879306248515087, "percentage": 3.96, "elapsed_time": "0:36:45", "remaining_time": "14:51:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1010, "total_steps": 25254, "loss": 0.1859, "learning_rate": 4.998694482520239e-05, "epoch": 0.11998099311000238, "percentage": 4.0, "elapsed_time": "0:37:07", "remaining_time": "14:50:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1020, "total_steps": 25254, "loss": 0.1811, "learning_rate": 4.998588824160489e-05, "epoch": 0.12116892373485388, "percentage": 4.04, "elapsed_time": "0:37:29", "remaining_time": "14:50:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1030, "total_steps": 25254, "loss": 0.1855, "learning_rate": 4.998479056157405e-05, "epoch": 0.12235685435970539, "percentage": 4.08, "elapsed_time": "0:37:51", "remaining_time": "14:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1040, "total_steps": 25254, "loss": 0.1841, "learning_rate": 4.9983651786915305e-05, "epoch": 0.1235447849845569, "percentage": 4.12, "elapsed_time": "0:38:13", "remaining_time": "14:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1050, "total_steps": 25254, "loss": 0.1799, "learning_rate": 4.99824719195017e-05, "epoch": 0.1247327156094084, "percentage": 4.16, "elapsed_time": "0:38:35", "remaining_time": "14:49:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1060, "total_steps": 25254, "loss": 0.1848, "learning_rate": 4.9981250961273865e-05, "epoch": 0.12592064623425991, "percentage": 4.2, "elapsed_time": "0:38:58", "remaining_time": "14:49:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1070, "total_steps": 25254, "loss": 0.1828, "learning_rate": 4.997998891424e-05, "epoch": 0.12710857685911142, "percentage": 4.24, "elapsed_time": "0:39:19", "remaining_time": "14:48:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1080, "total_steps": 25254, "loss": 0.1868, "learning_rate": 4.997868578047592e-05, "epoch": 0.12829650748396293, "percentage": 4.28, "elapsed_time": "0:39:41", "remaining_time": "14:48:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1090, "total_steps": 25254, "loss": 0.1828, "learning_rate": 4.9977341562125e-05, "epoch": 0.12948443810881444, "percentage": 4.32, "elapsed_time": "0:40:02", "remaining_time": "14:47:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1100, "total_steps": 25254, "loss": 0.1837, "learning_rate": 4.997595626139818e-05, "epoch": 0.13067236873366594, "percentage": 4.36, "elapsed_time": "0:40:24", "remaining_time": "14:47:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1110, "total_steps": 25254, "loss": 0.1822, "learning_rate": 4.997452988057399e-05, "epoch": 0.13186029935851745, "percentage": 4.4, "elapsed_time": "0:40:45", "remaining_time": "14:46:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1120, "total_steps": 25254, "loss": 0.1774, "learning_rate": 4.9973062421998516e-05, "epoch": 0.13304822998336896, "percentage": 4.43, "elapsed_time": "0:41:07", "remaining_time": "14:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1130, "total_steps": 25254, "loss": 0.1831, "learning_rate": 4.997155388808542e-05, "epoch": 0.13423616060822047, "percentage": 4.47, "elapsed_time": "0:41:28", "remaining_time": "14:45:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1140, "total_steps": 25254, "loss": 0.1811, "learning_rate": 4.997000428131592e-05, "epoch": 0.13542409123307197, "percentage": 4.51, "elapsed_time": "0:41:50", "remaining_time": "14:45:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1150, "total_steps": 25254, "loss": 0.1804, "learning_rate": 4.9968413604238776e-05, "epoch": 0.1366120218579235, "percentage": 4.55, "elapsed_time": "0:42:12", "remaining_time": "14:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1160, "total_steps": 25254, "loss": 0.1773, "learning_rate": 4.996678185947031e-05, "epoch": 0.13779995248277502, "percentage": 4.59, "elapsed_time": "0:42:35", "remaining_time": "14:44:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1170, "total_steps": 25254, "loss": 0.178, "learning_rate": 4.996510904969441e-05, "epoch": 0.13898788310762653, "percentage": 4.63, "elapsed_time": "0:42:56", "remaining_time": "14:43:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1180, "total_steps": 25254, "loss": 0.1799, "learning_rate": 4.996339517766247e-05, "epoch": 0.14017581373247803, "percentage": 4.67, "elapsed_time": "0:43:18", "remaining_time": "14:43:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1190, "total_steps": 25254, "loss": 0.1805, "learning_rate": 4.9961640246193456e-05, "epoch": 0.14136374435732954, "percentage": 4.71, "elapsed_time": "0:43:39", "remaining_time": "14:42:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1200, "total_steps": 25254, "loss": 0.1788, "learning_rate": 4.995984425817385e-05, "epoch": 0.14255167498218105, "percentage": 4.75, "elapsed_time": "0:44:01", "remaining_time": "14:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1210, "total_steps": 25254, "loss": 0.1804, "learning_rate": 4.995800721655766e-05, "epoch": 0.14373960560703256, "percentage": 4.79, "elapsed_time": "0:44:22", "remaining_time": "14:41:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1220, "total_steps": 25254, "loss": 0.1847, "learning_rate": 4.995612912436643e-05, "epoch": 0.14492753623188406, "percentage": 4.83, "elapsed_time": "0:44:44", "remaining_time": "14:41:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1230, "total_steps": 25254, "loss": 0.1801, "learning_rate": 4.995420998468923e-05, "epoch": 0.14611546685673557, "percentage": 4.87, "elapsed_time": "0:45:06", "remaining_time": "14:40:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1240, "total_steps": 25254, "loss": 0.1794, "learning_rate": 4.995224980068263e-05, "epoch": 0.14730339748158708, "percentage": 4.91, "elapsed_time": "0:45:27", "remaining_time": "14:40:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1250, "total_steps": 25254, "loss": 0.176, "learning_rate": 4.995024857557069e-05, "epoch": 0.14849132810643859, "percentage": 4.95, "elapsed_time": "0:45:48", "remaining_time": "14:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1260, "total_steps": 25254, "loss": 0.1762, "learning_rate": 4.994820631264503e-05, "epoch": 0.1496792587312901, "percentage": 4.99, "elapsed_time": "0:46:10", "remaining_time": "14:39:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1270, "total_steps": 25254, "loss": 0.1795, "learning_rate": 4.9946123015264715e-05, "epoch": 0.1508671893561416, "percentage": 5.03, "elapsed_time": "0:46:32", "remaining_time": "14:38:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1280, "total_steps": 25254, "loss": 0.1798, "learning_rate": 4.994399868685633e-05, "epoch": 0.1520551199809931, "percentage": 5.07, "elapsed_time": "0:46:53", "remaining_time": "14:38:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1290, "total_steps": 25254, "loss": 0.1741, "learning_rate": 4.994183333091393e-05, "epoch": 0.15324305060584462, "percentage": 5.11, "elapsed_time": "0:47:15", "remaining_time": "14:37:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1300, "total_steps": 25254, "loss": 0.1775, "learning_rate": 4.9939626950999075e-05, "epoch": 0.15443098123069612, "percentage": 5.15, "elapsed_time": "0:47:37", "remaining_time": "14:37:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1310, "total_steps": 25254, "loss": 0.1791, "learning_rate": 4.9937379550740785e-05, "epoch": 0.15561891185554763, "percentage": 5.19, "elapsed_time": "0:47:59", "remaining_time": "14:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1320, "total_steps": 25254, "loss": 0.1757, "learning_rate": 4.993509113383554e-05, "epoch": 0.15680684248039914, "percentage": 5.23, "elapsed_time": "0:48:20", "remaining_time": "14:36:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1330, "total_steps": 25254, "loss": 0.1809, "learning_rate": 4.993276170404731e-05, "epoch": 0.15799477310525065, "percentage": 5.27, "elapsed_time": "0:48:42", "remaining_time": "14:36:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1340, "total_steps": 25254, "loss": 0.1799, "learning_rate": 4.99303912652075e-05, "epoch": 0.15918270373010215, "percentage": 5.31, "elapsed_time": "0:49:04", "remaining_time": "14:35:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1350, "total_steps": 25254, "loss": 0.1798, "learning_rate": 4.992797982121498e-05, "epoch": 0.16037063435495366, "percentage": 5.35, "elapsed_time": "0:49:26", "remaining_time": "14:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1360, "total_steps": 25254, "loss": 0.1821, "learning_rate": 4.992552737603605e-05, "epoch": 0.16155856497980517, "percentage": 5.39, "elapsed_time": "0:49:47", "remaining_time": "14:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1370, "total_steps": 25254, "loss": 0.1778, "learning_rate": 4.992303393370447e-05, "epoch": 0.16274649560465668, "percentage": 5.42, "elapsed_time": "0:50:09", "remaining_time": "14:34:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1380, "total_steps": 25254, "loss": 0.1816, "learning_rate": 4.992049949832139e-05, "epoch": 0.16393442622950818, "percentage": 5.46, "elapsed_time": "0:50:30", "remaining_time": "14:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1390, "total_steps": 25254, "loss": 0.1747, "learning_rate": 4.991792407405546e-05, "epoch": 0.1651223568543597, "percentage": 5.5, "elapsed_time": "0:50:52", "remaining_time": "14:33:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1400, "total_steps": 25254, "loss": 0.1775, "learning_rate": 4.991530766514265e-05, "epoch": 0.16631028747921123, "percentage": 5.54, "elapsed_time": "0:51:14", "remaining_time": "14:33:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1410, "total_steps": 25254, "loss": 0.1764, "learning_rate": 4.991265027588643e-05, "epoch": 0.16749821810406273, "percentage": 5.58, "elapsed_time": "0:51:36", "remaining_time": "14:32:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1420, "total_steps": 25254, "loss": 0.173, "learning_rate": 4.9909951910657625e-05, "epoch": 0.16868614872891424, "percentage": 5.62, "elapsed_time": "0:51:58", "remaining_time": "14:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1430, "total_steps": 25254, "loss": 0.1766, "learning_rate": 4.990721257389446e-05, "epoch": 0.16987407935376575, "percentage": 5.66, "elapsed_time": "0:52:19", "remaining_time": "14:31:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1440, "total_steps": 25254, "loss": 0.1771, "learning_rate": 4.990443227010256e-05, "epoch": 0.17106200997861726, "percentage": 5.7, "elapsed_time": "0:52:43", "remaining_time": "14:31:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1450, "total_steps": 25254, "loss": 0.1751, "learning_rate": 4.990161100385494e-05, "epoch": 0.17224994060346877, "percentage": 5.74, "elapsed_time": "0:53:05", "remaining_time": "14:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1460, "total_steps": 25254, "loss": 0.1751, "learning_rate": 4.989874877979197e-05, "epoch": 0.17343787122832027, "percentage": 5.78, "elapsed_time": "0:53:26", "remaining_time": "14:31:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1470, "total_steps": 25254, "loss": 0.1787, "learning_rate": 4.9895845602621394e-05, "epoch": 0.17462580185317178, "percentage": 5.82, "elapsed_time": "0:53:48", "remaining_time": "14:30:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1480, "total_steps": 25254, "loss": 0.1753, "learning_rate": 4.989290147711831e-05, "epoch": 0.1758137324780233, "percentage": 5.86, "elapsed_time": "0:54:10", "remaining_time": "14:30:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1490, "total_steps": 25254, "loss": 0.1768, "learning_rate": 4.9889916408125196e-05, "epoch": 0.1770016631028748, "percentage": 5.9, "elapsed_time": "0:54:31", "remaining_time": "14:29:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1500, "total_steps": 25254, "loss": 0.177, "learning_rate": 4.988689040055183e-05, "epoch": 0.1781895937277263, "percentage": 5.94, "elapsed_time": "0:54:53", "remaining_time": "14:29:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1510, "total_steps": 25254, "loss": 0.1762, "learning_rate": 4.988382345937536e-05, "epoch": 0.1793775243525778, "percentage": 5.98, "elapsed_time": "0:55:15", "remaining_time": "14:28:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1520, "total_steps": 25254, "loss": 0.1773, "learning_rate": 4.988071558964023e-05, "epoch": 0.18056545497742932, "percentage": 6.02, "elapsed_time": "0:55:36", "remaining_time": "14:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1530, "total_steps": 25254, "loss": 0.1728, "learning_rate": 4.987756679645823e-05, "epoch": 0.18175338560228083, "percentage": 6.06, "elapsed_time": "0:55:58", "remaining_time": "14:28:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1540, "total_steps": 25254, "loss": 0.1756, "learning_rate": 4.987437708500845e-05, "epoch": 0.18294131622713233, "percentage": 6.1, "elapsed_time": "0:56:20", "remaining_time": "14:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1550, "total_steps": 25254, "loss": 0.1691, "learning_rate": 4.9871146460537285e-05, "epoch": 0.18412924685198384, "percentage": 6.14, "elapsed_time": "0:56:42", "remaining_time": "14:27:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1560, "total_steps": 25254, "loss": 0.1755, "learning_rate": 4.986787492835843e-05, "epoch": 0.18531717747683535, "percentage": 6.18, "elapsed_time": "0:57:04", "remaining_time": "14:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1570, "total_steps": 25254, "loss": 0.1751, "learning_rate": 4.986456249385283e-05, "epoch": 0.18650510810168686, "percentage": 6.22, "elapsed_time": "0:57:26", "remaining_time": "14:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1580, "total_steps": 25254, "loss": 0.1753, "learning_rate": 4.986120916246873e-05, "epoch": 0.18769303872653836, "percentage": 6.26, "elapsed_time": "0:57:47", "remaining_time": "14:25:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1590, "total_steps": 25254, "loss": 0.1768, "learning_rate": 4.9857814939721676e-05, "epoch": 0.18888096935138987, "percentage": 6.3, "elapsed_time": "0:58:09", "remaining_time": "14:25:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1600, "total_steps": 25254, "loss": 0.1748, "learning_rate": 4.985437983119441e-05, "epoch": 0.19006889997624138, "percentage": 6.34, "elapsed_time": "0:58:31", "remaining_time": "14:25:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1610, "total_steps": 25254, "loss": 0.1728, "learning_rate": 4.9850903842536946e-05, "epoch": 0.1912568306010929, "percentage": 6.38, "elapsed_time": "0:58:53", "remaining_time": "14:24:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1620, "total_steps": 25254, "loss": 0.1756, "learning_rate": 4.984738697946656e-05, "epoch": 0.1924447612259444, "percentage": 6.41, "elapsed_time": "0:59:15", "remaining_time": "14:24:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1630, "total_steps": 25254, "loss": 0.1761, "learning_rate": 4.984382924776772e-05, "epoch": 0.1936326918507959, "percentage": 6.45, "elapsed_time": "0:59:36", "remaining_time": "14:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1640, "total_steps": 25254, "loss": 0.1724, "learning_rate": 4.9840230653292144e-05, "epoch": 0.1948206224756474, "percentage": 6.49, "elapsed_time": "0:59:58", "remaining_time": "14:23:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1650, "total_steps": 25254, "loss": 0.1722, "learning_rate": 4.983659120195875e-05, "epoch": 0.19600855310049894, "percentage": 6.53, "elapsed_time": "1:00:20", "remaining_time": "14:23:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1660, "total_steps": 25254, "loss": 0.1729, "learning_rate": 4.9832910899753636e-05, "epoch": 0.19719648372535045, "percentage": 6.57, "elapsed_time": "1:00:42", "remaining_time": "14:22:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1670, "total_steps": 25254, "loss": 0.1724, "learning_rate": 4.9829189752730144e-05, "epoch": 0.19838441435020196, "percentage": 6.61, "elapsed_time": "1:01:04", "remaining_time": "14:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1680, "total_steps": 25254, "loss": 0.171, "learning_rate": 4.982542776700874e-05, "epoch": 0.19957234497505347, "percentage": 6.65, "elapsed_time": "1:01:26", "remaining_time": "14:22:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1690, "total_steps": 25254, "loss": 0.173, "learning_rate": 4.982162494877708e-05, "epoch": 0.20076027559990497, "percentage": 6.69, "elapsed_time": "1:01:48", "remaining_time": "14:21:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1700, "total_steps": 25254, "loss": 0.1753, "learning_rate": 4.9817781304290004e-05, "epoch": 0.20194820622475648, "percentage": 6.73, "elapsed_time": "1:02:10", "remaining_time": "14:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1710, "total_steps": 25254, "loss": 0.1723, "learning_rate": 4.981389683986947e-05, "epoch": 0.203136136849608, "percentage": 6.77, "elapsed_time": "1:02:32", "remaining_time": "14:21:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1720, "total_steps": 25254, "loss": 0.1717, "learning_rate": 4.98099715619046e-05, "epoch": 0.2043240674744595, "percentage": 6.81, "elapsed_time": "1:02:54", "remaining_time": "14:20:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1730, "total_steps": 25254, "loss": 0.1703, "learning_rate": 4.980600547685163e-05, "epoch": 0.205511998099311, "percentage": 6.85, "elapsed_time": "1:03:16", "remaining_time": "14:20:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1740, "total_steps": 25254, "loss": 0.1678, "learning_rate": 4.980199859123392e-05, "epoch": 0.2066999287241625, "percentage": 6.89, "elapsed_time": "1:03:38", "remaining_time": "14:20:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1750, "total_steps": 25254, "loss": 0.1715, "learning_rate": 4.9797950911641933e-05, "epoch": 0.20788785934901402, "percentage": 6.93, "elapsed_time": "1:04:00", "remaining_time": "14:19:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1760, "total_steps": 25254, "loss": 0.1729, "learning_rate": 4.9793862444733254e-05, "epoch": 0.20907578997386553, "percentage": 6.97, "elapsed_time": "1:04:21", "remaining_time": "14:19:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1770, "total_steps": 25254, "loss": 0.1742, "learning_rate": 4.978973319723251e-05, "epoch": 0.21026372059871704, "percentage": 7.01, "elapsed_time": "1:04:42", "remaining_time": "14:18:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1780, "total_steps": 25254, "loss": 0.1735, "learning_rate": 4.978556317593144e-05, "epoch": 0.21145165122356854, "percentage": 7.05, "elapsed_time": "1:05:05", "remaining_time": "14:18:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1790, "total_steps": 25254, "loss": 0.1701, "learning_rate": 4.978135238768884e-05, "epoch": 0.21263958184842005, "percentage": 7.09, "elapsed_time": "1:05:26", "remaining_time": "14:17:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1800, "total_steps": 25254, "loss": 0.1706, "learning_rate": 4.9777100839430543e-05, "epoch": 0.21382751247327156, "percentage": 7.13, "elapsed_time": "1:05:48", "remaining_time": "14:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1810, "total_steps": 25254, "loss": 0.17, "learning_rate": 4.9772808538149455e-05, "epoch": 0.21501544309812307, "percentage": 7.17, "elapsed_time": "1:06:10", "remaining_time": "14:17:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1820, "total_steps": 25254, "loss": 0.1739, "learning_rate": 4.9768475490905474e-05, "epoch": 0.21620337372297457, "percentage": 7.21, "elapsed_time": "1:06:32", "remaining_time": "14:16:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1830, "total_steps": 25254, "loss": 0.1717, "learning_rate": 4.976410170482554e-05, "epoch": 0.21739130434782608, "percentage": 7.25, "elapsed_time": "1:06:54", "remaining_time": "14:16:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1840, "total_steps": 25254, "loss": 0.1691, "learning_rate": 4.9759687187103596e-05, "epoch": 0.2185792349726776, "percentage": 7.29, "elapsed_time": "1:07:16", "remaining_time": "14:16:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1850, "total_steps": 25254, "loss": 0.1717, "learning_rate": 4.9755231945000574e-05, "epoch": 0.2197671655975291, "percentage": 7.33, "elapsed_time": "1:07:38", "remaining_time": "14:15:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1860, "total_steps": 25254, "loss": 0.1728, "learning_rate": 4.97507359858444e-05, "epoch": 0.2209550962223806, "percentage": 7.37, "elapsed_time": "1:08:00", "remaining_time": "14:15:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1870, "total_steps": 25254, "loss": 0.1726, "learning_rate": 4.974619931702995e-05, "epoch": 0.2221430268472321, "percentage": 7.4, "elapsed_time": "1:08:22", "remaining_time": "14:14:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1880, "total_steps": 25254, "loss": 0.1741, "learning_rate": 4.974162194601908e-05, "epoch": 0.22333095747208362, "percentage": 7.44, "elapsed_time": "1:08:43", "remaining_time": "14:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1890, "total_steps": 25254, "loss": 0.1709, "learning_rate": 4.97370038803406e-05, "epoch": 0.22451888809693513, "percentage": 7.48, "elapsed_time": "1:09:05", "remaining_time": "14:14:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1900, "total_steps": 25254, "loss": 0.1689, "learning_rate": 4.973234512759021e-05, "epoch": 0.22570681872178663, "percentage": 7.52, "elapsed_time": "1:09:26", "remaining_time": "14:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1910, "total_steps": 25254, "loss": 0.1725, "learning_rate": 4.972764569543058e-05, "epoch": 0.22689474934663817, "percentage": 7.56, "elapsed_time": "1:09:49", "remaining_time": "14:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1920, "total_steps": 25254, "loss": 0.1678, "learning_rate": 4.972290559159126e-05, "epoch": 0.22808267997148968, "percentage": 7.6, "elapsed_time": "1:10:12", "remaining_time": "14:13:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1930, "total_steps": 25254, "loss": 0.1732, "learning_rate": 4.971812482386872e-05, "epoch": 0.22927061059634118, "percentage": 7.64, "elapsed_time": "1:10:33", "remaining_time": "14:12:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1940, "total_steps": 25254, "loss": 0.1706, "learning_rate": 4.9713303400126274e-05, "epoch": 0.2304585412211927, "percentage": 7.68, "elapsed_time": "1:10:54", "remaining_time": "14:12:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1950, "total_steps": 25254, "loss": 0.1699, "learning_rate": 4.970844132829415e-05, "epoch": 0.2316464718460442, "percentage": 7.72, "elapsed_time": "1:11:17", "remaining_time": "14:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1960, "total_steps": 25254, "loss": 0.169, "learning_rate": 4.97035386163694e-05, "epoch": 0.2328344024708957, "percentage": 7.76, "elapsed_time": "1:11:38", "remaining_time": "14:11:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1970, "total_steps": 25254, "loss": 0.1706, "learning_rate": 4.969859527241596e-05, "epoch": 0.23402233309574721, "percentage": 7.8, "elapsed_time": "1:12:00", "remaining_time": "14:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1980, "total_steps": 25254, "loss": 0.1687, "learning_rate": 4.969361130456455e-05, "epoch": 0.23521026372059872, "percentage": 7.84, "elapsed_time": "1:12:21", "remaining_time": "14:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 1990, "total_steps": 25254, "loss": 0.1755, "learning_rate": 4.968858672101274e-05, "epoch": 0.23639819434545023, "percentage": 7.88, "elapsed_time": "1:12:42", "remaining_time": "14:10:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2000, "total_steps": 25254, "loss": 0.1697, "learning_rate": 4.968352153002488e-05, "epoch": 0.23758612497030174, "percentage": 7.92, "elapsed_time": "1:13:04", "remaining_time": "14:09:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2010, "total_steps": 25254, "loss": 0.1664, "learning_rate": 4.967841573993214e-05, "epoch": 0.23877405559515325, "percentage": 7.96, "elapsed_time": "1:13:25", "remaining_time": "14:09:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2020, "total_steps": 25254, "loss": 0.1712, "learning_rate": 4.9673269359132435e-05, "epoch": 0.23996198622000475, "percentage": 8.0, "elapsed_time": "1:13:46", "remaining_time": "14:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2030, "total_steps": 25254, "loss": 0.1732, "learning_rate": 4.966808239609048e-05, "epoch": 0.24114991684485626, "percentage": 8.04, "elapsed_time": "1:14:09", "remaining_time": "14:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2040, "total_steps": 25254, "loss": 0.1701, "learning_rate": 4.9662854859337696e-05, "epoch": 0.24233784746970777, "percentage": 8.08, "elapsed_time": "1:14:31", "remaining_time": "14:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2050, "total_steps": 25254, "loss": 0.1711, "learning_rate": 4.965758675747226e-05, "epoch": 0.24352577809455928, "percentage": 8.12, "elapsed_time": "1:14:53", "remaining_time": "14:07:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2060, "total_steps": 25254, "loss": 0.1685, "learning_rate": 4.9652278099159097e-05, "epoch": 0.24471370871941078, "percentage": 8.16, "elapsed_time": "1:15:15", "remaining_time": "14:07:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2070, "total_steps": 25254, "loss": 0.1681, "learning_rate": 4.96469288931298e-05, "epoch": 0.2459016393442623, "percentage": 8.2, "elapsed_time": "1:15:36", "remaining_time": "14:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2080, "total_steps": 25254, "loss": 0.1677, "learning_rate": 4.964153914818266e-05, "epoch": 0.2470895699691138, "percentage": 8.24, "elapsed_time": "1:15:58", "remaining_time": "14:06:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2090, "total_steps": 25254, "loss": 0.1707, "learning_rate": 4.963610887318265e-05, "epoch": 0.2482775005939653, "percentage": 8.28, "elapsed_time": "1:16:21", "remaining_time": "14:06:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2100, "total_steps": 25254, "loss": 0.1683, "learning_rate": 4.963063807706142e-05, "epoch": 0.2494654312188168, "percentage": 8.32, "elapsed_time": "1:16:43", "remaining_time": "14:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2110, "total_steps": 25254, "loss": 0.1693, "learning_rate": 4.962512676881725e-05, "epoch": 0.2506533618436683, "percentage": 8.36, "elapsed_time": "1:17:05", "remaining_time": "14:05:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2120, "total_steps": 25254, "loss": 0.1637, "learning_rate": 4.961957495751508e-05, "epoch": 0.25184129246851983, "percentage": 8.39, "elapsed_time": "1:17:27", "remaining_time": "14:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2130, "total_steps": 25254, "loss": 0.1701, "learning_rate": 4.961398265228642e-05, "epoch": 0.25302922309337134, "percentage": 8.43, "elapsed_time": "1:17:48", "remaining_time": "14:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2140, "total_steps": 25254, "loss": 0.1634, "learning_rate": 4.960834986232943e-05, "epoch": 0.25421715371822284, "percentage": 8.47, "elapsed_time": "1:18:11", "remaining_time": "14:04:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2150, "total_steps": 25254, "loss": 0.1671, "learning_rate": 4.960267659690885e-05, "epoch": 0.25540508434307435, "percentage": 8.51, "elapsed_time": "1:18:33", "remaining_time": "14:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2160, "total_steps": 25254, "loss": 0.1669, "learning_rate": 4.959696286535598e-05, "epoch": 0.25659301496792586, "percentage": 8.55, "elapsed_time": "1:18:54", "remaining_time": "14:03:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2170, "total_steps": 25254, "loss": 0.1692, "learning_rate": 4.959120867706867e-05, "epoch": 0.25778094559277737, "percentage": 8.59, "elapsed_time": "1:19:16", "remaining_time": "14:03:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2180, "total_steps": 25254, "loss": 0.1671, "learning_rate": 4.958541404151135e-05, "epoch": 0.2589688762176289, "percentage": 8.63, "elapsed_time": "1:19:38", "remaining_time": "14:03:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2190, "total_steps": 25254, "loss": 0.1718, "learning_rate": 4.957957896821494e-05, "epoch": 0.2601568068424804, "percentage": 8.67, "elapsed_time": "1:20:00", "remaining_time": "14:02:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2200, "total_steps": 25254, "loss": 0.1641, "learning_rate": 4.957370346677688e-05, "epoch": 0.2613447374673319, "percentage": 8.71, "elapsed_time": "1:20:23", "remaining_time": "14:02:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2210, "total_steps": 25254, "loss": 0.1675, "learning_rate": 4.9567787546861135e-05, "epoch": 0.2625326680921834, "percentage": 8.75, "elapsed_time": "1:20:45", "remaining_time": "14:02:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2220, "total_steps": 25254, "loss": 0.1668, "learning_rate": 4.95618312181981e-05, "epoch": 0.2637205987170349, "percentage": 8.79, "elapsed_time": "1:21:07", "remaining_time": "14:01:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2230, "total_steps": 25254, "loss": 0.1674, "learning_rate": 4.9555834490584675e-05, "epoch": 0.2649085293418864, "percentage": 8.83, "elapsed_time": "1:21:29", "remaining_time": "14:01:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2240, "total_steps": 25254, "loss": 0.1664, "learning_rate": 4.954979737388419e-05, "epoch": 0.2660964599667379, "percentage": 8.87, "elapsed_time": "1:21:51", "remaining_time": "14:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2250, "total_steps": 25254, "loss": 0.1647, "learning_rate": 4.954371987802641e-05, "epoch": 0.2672843905915894, "percentage": 8.91, "elapsed_time": "1:22:12", "remaining_time": "14:00:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2260, "total_steps": 25254, "loss": 0.1648, "learning_rate": 4.95376020130075e-05, "epoch": 0.26847232121644093, "percentage": 8.95, "elapsed_time": "1:22:34", "remaining_time": "14:00:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2270, "total_steps": 25254, "loss": 0.1706, "learning_rate": 4.9531443788890054e-05, "epoch": 0.26966025184129244, "percentage": 8.99, "elapsed_time": "1:22:56", "remaining_time": "13:59:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2280, "total_steps": 25254, "loss": 0.1714, "learning_rate": 4.952524521580302e-05, "epoch": 0.27084818246614395, "percentage": 9.03, "elapsed_time": "1:23:18", "remaining_time": "13:59:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2290, "total_steps": 25254, "loss": 0.1687, "learning_rate": 4.951900630394173e-05, "epoch": 0.2720361130909955, "percentage": 9.07, "elapsed_time": "1:23:39", "remaining_time": "13:58:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2300, "total_steps": 25254, "loss": 0.1676, "learning_rate": 4.9512727063567856e-05, "epoch": 0.273224043715847, "percentage": 9.11, "elapsed_time": "1:24:01", "remaining_time": "13:58:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2310, "total_steps": 25254, "loss": 0.1698, "learning_rate": 4.95064075050094e-05, "epoch": 0.27441197434069853, "percentage": 9.15, "elapsed_time": "1:24:23", "remaining_time": "13:58:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2320, "total_steps": 25254, "loss": 0.1686, "learning_rate": 4.950004763866069e-05, "epoch": 0.27559990496555004, "percentage": 9.19, "elapsed_time": "1:24:46", "remaining_time": "13:57:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2330, "total_steps": 25254, "loss": 0.1659, "learning_rate": 4.949364747498233e-05, "epoch": 0.27678783559040154, "percentage": 9.23, "elapsed_time": "1:25:08", "remaining_time": "13:57:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2340, "total_steps": 25254, "loss": 0.1636, "learning_rate": 4.9487207024501236e-05, "epoch": 0.27797576621525305, "percentage": 9.27, "elapsed_time": "1:25:30", "remaining_time": "13:57:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2350, "total_steps": 25254, "loss": 0.1642, "learning_rate": 4.948072629781056e-05, "epoch": 0.27916369684010456, "percentage": 9.31, "elapsed_time": "1:25:54", "remaining_time": "13:57:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2360, "total_steps": 25254, "loss": 0.1658, "learning_rate": 4.947420530556969e-05, "epoch": 0.28035162746495607, "percentage": 9.35, "elapsed_time": "1:26:16", "remaining_time": "13:56:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2370, "total_steps": 25254, "loss": 0.1635, "learning_rate": 4.9467644058504295e-05, "epoch": 0.2815395580898076, "percentage": 9.38, "elapsed_time": "1:26:38", "remaining_time": "13:56:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2380, "total_steps": 25254, "loss": 0.1666, "learning_rate": 4.9461042567406203e-05, "epoch": 0.2827274887146591, "percentage": 9.42, "elapsed_time": "1:27:00", "remaining_time": "13:56:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2390, "total_steps": 25254, "loss": 0.1676, "learning_rate": 4.945440084313345e-05, "epoch": 0.2839154193395106, "percentage": 9.46, "elapsed_time": "1:27:21", "remaining_time": "13:55:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2400, "total_steps": 25254, "loss": 0.1697, "learning_rate": 4.944771889661026e-05, "epoch": 0.2851033499643621, "percentage": 9.5, "elapsed_time": "1:27:43", "remaining_time": "13:55:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2410, "total_steps": 25254, "loss": 0.1658, "learning_rate": 4.9440996738826994e-05, "epoch": 0.2862912805892136, "percentage": 9.54, "elapsed_time": "1:28:04", "remaining_time": "13:54:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2420, "total_steps": 25254, "loss": 0.164, "learning_rate": 4.943423438084017e-05, "epoch": 0.2874792112140651, "percentage": 9.58, "elapsed_time": "1:28:26", "remaining_time": "13:54:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2430, "total_steps": 25254, "loss": 0.1676, "learning_rate": 4.942743183377241e-05, "epoch": 0.2886671418389166, "percentage": 9.62, "elapsed_time": "1:28:49", "remaining_time": "13:54:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2440, "total_steps": 25254, "loss": 0.1678, "learning_rate": 4.942058910881246e-05, "epoch": 0.2898550724637681, "percentage": 9.66, "elapsed_time": "1:29:10", "remaining_time": "13:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2450, "total_steps": 25254, "loss": 0.1662, "learning_rate": 4.941370621721511e-05, "epoch": 0.29104300308861963, "percentage": 9.7, "elapsed_time": "1:29:32", "remaining_time": "13:53:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2460, "total_steps": 25254, "loss": 0.1669, "learning_rate": 4.940678317030127e-05, "epoch": 0.29223093371347114, "percentage": 9.74, "elapsed_time": "1:29:53", "remaining_time": "13:52:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2470, "total_steps": 25254, "loss": 0.1704, "learning_rate": 4.9399819979457854e-05, "epoch": 0.29341886433832265, "percentage": 9.78, "elapsed_time": "1:30:15", "remaining_time": "13:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2480, "total_steps": 25254, "loss": 0.1635, "learning_rate": 4.9392816656137826e-05, "epoch": 0.29460679496317416, "percentage": 9.82, "elapsed_time": "1:30:37", "remaining_time": "13:52:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2490, "total_steps": 25254, "loss": 0.1679, "learning_rate": 4.938577321186014e-05, "epoch": 0.29579472558802566, "percentage": 9.86, "elapsed_time": "1:30:58", "remaining_time": "13:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2500, "total_steps": 25254, "loss": 0.1672, "learning_rate": 4.937868965820977e-05, "epoch": 0.29698265621287717, "percentage": 9.9, "elapsed_time": "1:31:21", "remaining_time": "13:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2510, "total_steps": 25254, "loss": 0.1669, "learning_rate": 4.937156600683764e-05, "epoch": 0.2981705868377287, "percentage": 9.94, "elapsed_time": "1:31:42", "remaining_time": "13:51:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2520, "total_steps": 25254, "loss": 0.1609, "learning_rate": 4.936440226946063e-05, "epoch": 0.2993585174625802, "percentage": 9.98, "elapsed_time": "1:32:04", "remaining_time": "13:50:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2530, "total_steps": 25254, "loss": 0.1676, "learning_rate": 4.935719845786154e-05, "epoch": 0.3005464480874317, "percentage": 10.02, "elapsed_time": "1:32:26", "remaining_time": "13:50:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2540, "total_steps": 25254, "loss": 0.1626, "learning_rate": 4.934995458388911e-05, "epoch": 0.3017343787122832, "percentage": 10.06, "elapsed_time": "1:32:48", "remaining_time": "13:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2550, "total_steps": 25254, "loss": 0.1607, "learning_rate": 4.934267065945797e-05, "epoch": 0.3029223093371347, "percentage": 10.1, "elapsed_time": "1:33:10", "remaining_time": "13:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2560, "total_steps": 25254, "loss": 0.1674, "learning_rate": 4.933534669654859e-05, "epoch": 0.3041102399619862, "percentage": 10.14, "elapsed_time": "1:33:32", "remaining_time": "13:49:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2570, "total_steps": 25254, "loss": 0.1674, "learning_rate": 4.932798270720734e-05, "epoch": 0.3052981705868377, "percentage": 10.18, "elapsed_time": "1:33:53", "remaining_time": "13:48:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2580, "total_steps": 25254, "loss": 0.1638, "learning_rate": 4.9320578703546396e-05, "epoch": 0.30648610121168923, "percentage": 10.22, "elapsed_time": "1:34:17", "remaining_time": "13:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2590, "total_steps": 25254, "loss": 0.1617, "learning_rate": 4.9313134697743756e-05, "epoch": 0.30767403183654074, "percentage": 10.26, "elapsed_time": "1:34:38", "remaining_time": "13:48:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2600, "total_steps": 25254, "loss": 0.1653, "learning_rate": 4.930565070204323e-05, "epoch": 0.30886196246139225, "percentage": 10.3, "elapsed_time": "1:35:01", "remaining_time": "13:47:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2610, "total_steps": 25254, "loss": 0.1685, "learning_rate": 4.9298126728754364e-05, "epoch": 0.31004989308624376, "percentage": 10.33, "elapsed_time": "1:35:23", "remaining_time": "13:47:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2620, "total_steps": 25254, "loss": 0.1642, "learning_rate": 4.9290562790252495e-05, "epoch": 0.31123782371109526, "percentage": 10.37, "elapsed_time": "1:35:44", "remaining_time": "13:47:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2630, "total_steps": 25254, "loss": 0.1663, "learning_rate": 4.928295889897869e-05, "epoch": 0.31242575433594677, "percentage": 10.41, "elapsed_time": "1:36:07", "remaining_time": "13:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2640, "total_steps": 25254, "loss": 0.1665, "learning_rate": 4.9275315067439706e-05, "epoch": 0.3136136849607983, "percentage": 10.45, "elapsed_time": "1:36:29", "remaining_time": "13:46:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2650, "total_steps": 25254, "loss": 0.1646, "learning_rate": 4.926763130820801e-05, "epoch": 0.3148016155856498, "percentage": 10.49, "elapsed_time": "1:36:51", "remaining_time": "13:46:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2660, "total_steps": 25254, "loss": 0.1617, "learning_rate": 4.925990763392175e-05, "epoch": 0.3159895462105013, "percentage": 10.53, "elapsed_time": "1:37:13", "remaining_time": "13:45:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2670, "total_steps": 25254, "loss": 0.1642, "learning_rate": 4.925214405728471e-05, "epoch": 0.3171774768353528, "percentage": 10.57, "elapsed_time": "1:37:35", "remaining_time": "13:45:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2680, "total_steps": 25254, "loss": 0.1608, "learning_rate": 4.9244340591066314e-05, "epoch": 0.3183654074602043, "percentage": 10.61, "elapsed_time": "1:37:58", "remaining_time": "13:45:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2690, "total_steps": 25254, "loss": 0.1649, "learning_rate": 4.923649724810158e-05, "epoch": 0.3195533380850558, "percentage": 10.65, "elapsed_time": "1:38:20", "remaining_time": "13:44:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2700, "total_steps": 25254, "loss": 0.1667, "learning_rate": 4.9228614041291145e-05, "epoch": 0.3207412687099073, "percentage": 10.69, "elapsed_time": "1:38:42", "remaining_time": "13:44:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2710, "total_steps": 25254, "loss": 0.1638, "learning_rate": 4.9220690983601174e-05, "epoch": 0.32192919933475883, "percentage": 10.73, "elapsed_time": "1:39:04", "remaining_time": "13:44:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2720, "total_steps": 25254, "loss": 0.1654, "learning_rate": 4.921272808806342e-05, "epoch": 0.32311712995961034, "percentage": 10.77, "elapsed_time": "1:39:24", "remaining_time": "13:43:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2730, "total_steps": 25254, "loss": 0.1603, "learning_rate": 4.920472536777512e-05, "epoch": 0.32430506058446185, "percentage": 10.81, "elapsed_time": "1:39:46", "remaining_time": "13:43:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2740, "total_steps": 25254, "loss": 0.1659, "learning_rate": 4.919668283589905e-05, "epoch": 0.32549299120931335, "percentage": 10.85, "elapsed_time": "1:40:08", "remaining_time": "13:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2750, "total_steps": 25254, "loss": 0.1649, "learning_rate": 4.9188600505663455e-05, "epoch": 0.32668092183416486, "percentage": 10.89, "elapsed_time": "1:40:30", "remaining_time": "13:42:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2760, "total_steps": 25254, "loss": 0.1658, "learning_rate": 4.9180478390362026e-05, "epoch": 0.32786885245901637, "percentage": 10.93, "elapsed_time": "1:40:51", "remaining_time": "13:42:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2770, "total_steps": 25254, "loss": 0.1685, "learning_rate": 4.917231650335391e-05, "epoch": 0.3290567830838679, "percentage": 10.97, "elapsed_time": "1:41:14", "remaining_time": "13:41:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2780, "total_steps": 25254, "loss": 0.1646, "learning_rate": 4.9164114858063645e-05, "epoch": 0.3302447137087194, "percentage": 11.01, "elapsed_time": "1:41:35", "remaining_time": "13:41:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2790, "total_steps": 25254, "loss": 0.1639, "learning_rate": 4.9155873467981205e-05, "epoch": 0.33143264433357095, "percentage": 11.05, "elapsed_time": "1:41:57", "remaining_time": "13:40:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2800, "total_steps": 25254, "loss": 0.1638, "learning_rate": 4.9147592346661896e-05, "epoch": 0.33262057495842245, "percentage": 11.09, "elapsed_time": "1:42:19", "remaining_time": "13:40:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2810, "total_steps": 25254, "loss": 0.1602, "learning_rate": 4.91392715077264e-05, "epoch": 0.33380850558327396, "percentage": 11.13, "elapsed_time": "1:42:41", "remaining_time": "13:40:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2820, "total_steps": 25254, "loss": 0.165, "learning_rate": 4.91309109648607e-05, "epoch": 0.33499643620812547, "percentage": 11.17, "elapsed_time": "1:43:03", "remaining_time": "13:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2830, "total_steps": 25254, "loss": 0.1638, "learning_rate": 4.912251073181611e-05, "epoch": 0.336184366832977, "percentage": 11.21, "elapsed_time": "1:43:25", "remaining_time": "13:39:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2840, "total_steps": 25254, "loss": 0.1638, "learning_rate": 4.91140708224092e-05, "epoch": 0.3373722974578285, "percentage": 11.25, "elapsed_time": "1:43:47", "remaining_time": "13:39:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2850, "total_steps": 25254, "loss": 0.1675, "learning_rate": 4.9105591250521834e-05, "epoch": 0.33856022808268, "percentage": 11.29, "elapsed_time": "1:44:10", "remaining_time": "13:38:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2860, "total_steps": 25254, "loss": 0.1659, "learning_rate": 4.909707203010107e-05, "epoch": 0.3397481587075315, "percentage": 11.32, "elapsed_time": "1:44:31", "remaining_time": "13:38:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2870, "total_steps": 25254, "loss": 0.159, "learning_rate": 4.908851317515921e-05, "epoch": 0.340936089332383, "percentage": 11.36, "elapsed_time": "1:44:53", "remaining_time": "13:38:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2880, "total_steps": 25254, "loss": 0.1608, "learning_rate": 4.907991469977373e-05, "epoch": 0.3421240199572345, "percentage": 11.4, "elapsed_time": "1:45:15", "remaining_time": "13:37:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2890, "total_steps": 25254, "loss": 0.1642, "learning_rate": 4.90712766180873e-05, "epoch": 0.343311950582086, "percentage": 11.44, "elapsed_time": "1:45:36", "remaining_time": "13:37:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2900, "total_steps": 25254, "loss": 0.1653, "learning_rate": 4.906259894430769e-05, "epoch": 0.34449988120693753, "percentage": 11.48, "elapsed_time": "1:45:57", "remaining_time": "13:36:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2910, "total_steps": 25254, "loss": 0.161, "learning_rate": 4.905388169270782e-05, "epoch": 0.34568781183178904, "percentage": 11.52, "elapsed_time": "1:46:19", "remaining_time": "13:36:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2920, "total_steps": 25254, "loss": 0.1606, "learning_rate": 4.904512487762572e-05, "epoch": 0.34687574245664055, "percentage": 11.56, "elapsed_time": "1:46:42", "remaining_time": "13:36:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2930, "total_steps": 25254, "loss": 0.1597, "learning_rate": 4.903632851346445e-05, "epoch": 0.34806367308149205, "percentage": 11.6, "elapsed_time": "1:47:04", "remaining_time": "13:35:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2940, "total_steps": 25254, "loss": 0.162, "learning_rate": 4.902749261469216e-05, "epoch": 0.34925160370634356, "percentage": 11.64, "elapsed_time": "1:47:25", "remaining_time": "13:35:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2950, "total_steps": 25254, "loss": 0.1654, "learning_rate": 4.9018617195842e-05, "epoch": 0.35043953433119507, "percentage": 11.68, "elapsed_time": "1:47:47", "remaining_time": "13:34:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2960, "total_steps": 25254, "loss": 0.1618, "learning_rate": 4.9009702271512134e-05, "epoch": 0.3516274649560466, "percentage": 11.72, "elapsed_time": "1:48:08", "remaining_time": "13:34:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2970, "total_steps": 25254, "loss": 0.1691, "learning_rate": 4.900074785636572e-05, "epoch": 0.3528153955808981, "percentage": 11.76, "elapsed_time": "1:48:30", "remaining_time": "13:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2980, "total_steps": 25254, "loss": 0.1627, "learning_rate": 4.899175396513083e-05, "epoch": 0.3540033262057496, "percentage": 11.8, "elapsed_time": "1:48:52", "remaining_time": "13:33:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 2990, "total_steps": 25254, "loss": 0.164, "learning_rate": 4.89827206126005e-05, "epoch": 0.3551912568306011, "percentage": 11.84, "elapsed_time": "1:49:13", "remaining_time": "13:33:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3000, "total_steps": 25254, "loss": 0.164, "learning_rate": 4.897364781363266e-05, "epoch": 0.3563791874554526, "percentage": 11.88, "elapsed_time": "1:49:35", "remaining_time": "13:32:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3010, "total_steps": 25254, "loss": 0.1634, "learning_rate": 4.896453558315011e-05, "epoch": 0.3575671180803041, "percentage": 11.92, "elapsed_time": "1:49:57", "remaining_time": "13:32:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3020, "total_steps": 25254, "loss": 0.1663, "learning_rate": 4.895538393614053e-05, "epoch": 0.3587550487051556, "percentage": 11.96, "elapsed_time": "1:50:19", "remaining_time": "13:32:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3030, "total_steps": 25254, "loss": 0.1653, "learning_rate": 4.894619288765642e-05, "epoch": 0.35994297933000713, "percentage": 12.0, "elapsed_time": "1:50:41", "remaining_time": "13:31:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3040, "total_steps": 25254, "loss": 0.1614, "learning_rate": 4.8936962452815064e-05, "epoch": 0.36113090995485864, "percentage": 12.04, "elapsed_time": "1:51:02", "remaining_time": "13:31:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3050, "total_steps": 25254, "loss": 0.1643, "learning_rate": 4.8927692646798574e-05, "epoch": 0.36231884057971014, "percentage": 12.08, "elapsed_time": "1:51:24", "remaining_time": "13:31:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3060, "total_steps": 25254, "loss": 0.1612, "learning_rate": 4.8918383484853784e-05, "epoch": 0.36350677120456165, "percentage": 12.12, "elapsed_time": "1:51:46", "remaining_time": "13:30:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3070, "total_steps": 25254, "loss": 0.1615, "learning_rate": 4.890903498229228e-05, "epoch": 0.36469470182941316, "percentage": 12.16, "elapsed_time": "1:52:08", "remaining_time": "13:30:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3080, "total_steps": 25254, "loss": 0.1623, "learning_rate": 4.889964715449033e-05, "epoch": 0.36588263245426467, "percentage": 12.2, "elapsed_time": "1:52:30", "remaining_time": "13:30:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3090, "total_steps": 25254, "loss": 0.1674, "learning_rate": 4.889022001688891e-05, "epoch": 0.3670705630791162, "percentage": 12.24, "elapsed_time": "1:52:52", "remaining_time": "13:29:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3100, "total_steps": 25254, "loss": 0.1625, "learning_rate": 4.888075358499364e-05, "epoch": 0.3682584937039677, "percentage": 12.28, "elapsed_time": "1:53:14", "remaining_time": "13:29:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3110, "total_steps": 25254, "loss": 0.1671, "learning_rate": 4.887124787437478e-05, "epoch": 0.3694464243288192, "percentage": 12.31, "elapsed_time": "1:53:35", "remaining_time": "13:28:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3120, "total_steps": 25254, "loss": 0.1642, "learning_rate": 4.8861702900667174e-05, "epoch": 0.3706343549536707, "percentage": 12.35, "elapsed_time": "1:53:58", "remaining_time": "13:28:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3130, "total_steps": 25254, "loss": 0.1631, "learning_rate": 4.8852118679570267e-05, "epoch": 0.3718222855785222, "percentage": 12.39, "elapsed_time": "1:54:21", "remaining_time": "13:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3140, "total_steps": 25254, "loss": 0.165, "learning_rate": 4.884249522684805e-05, "epoch": 0.3730102162033737, "percentage": 12.43, "elapsed_time": "1:54:42", "remaining_time": "13:27:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3150, "total_steps": 25254, "loss": 0.165, "learning_rate": 4.883283255832904e-05, "epoch": 0.3741981468282252, "percentage": 12.47, "elapsed_time": "1:55:04", "remaining_time": "13:27:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3160, "total_steps": 25254, "loss": 0.1598, "learning_rate": 4.882313068990625e-05, "epoch": 0.3753860774530767, "percentage": 12.51, "elapsed_time": "1:55:25", "remaining_time": "13:27:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3170, "total_steps": 25254, "loss": 0.1607, "learning_rate": 4.8813389637537175e-05, "epoch": 0.37657400807792824, "percentage": 12.55, "elapsed_time": "1:55:46", "remaining_time": "13:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3180, "total_steps": 25254, "loss": 0.1623, "learning_rate": 4.880360941724378e-05, "epoch": 0.37776193870277974, "percentage": 12.59, "elapsed_time": "1:56:08", "remaining_time": "13:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3190, "total_steps": 25254, "loss": 0.1627, "learning_rate": 4.879379004511241e-05, "epoch": 0.37894986932763125, "percentage": 12.63, "elapsed_time": "1:56:29", "remaining_time": "13:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3200, "total_steps": 25254, "loss": 0.1648, "learning_rate": 4.878393153729383e-05, "epoch": 0.38013779995248276, "percentage": 12.67, "elapsed_time": "1:56:51", "remaining_time": "13:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3210, "total_steps": 25254, "loss": 0.1595, "learning_rate": 4.877403391000318e-05, "epoch": 0.38132573057733427, "percentage": 12.71, "elapsed_time": "1:57:13", "remaining_time": "13:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3220, "total_steps": 25254, "loss": 0.1639, "learning_rate": 4.876409717951994e-05, "epoch": 0.3825136612021858, "percentage": 12.75, "elapsed_time": "1:57:34", "remaining_time": "13:24:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3230, "total_steps": 25254, "loss": 0.1613, "learning_rate": 4.87541213621879e-05, "epoch": 0.3837015918270373, "percentage": 12.79, "elapsed_time": "1:57:56", "remaining_time": "13:24:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3240, "total_steps": 25254, "loss": 0.1595, "learning_rate": 4.8744106474415134e-05, "epoch": 0.3848895224518888, "percentage": 12.83, "elapsed_time": "1:58:18", "remaining_time": "13:23:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3250, "total_steps": 25254, "loss": 0.1613, "learning_rate": 4.8734052532674e-05, "epoch": 0.3860774530767403, "percentage": 12.87, "elapsed_time": "1:58:39", "remaining_time": "13:23:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3260, "total_steps": 25254, "loss": 0.1594, "learning_rate": 4.872395955350106e-05, "epoch": 0.3872653837015918, "percentage": 12.91, "elapsed_time": "1:59:01", "remaining_time": "13:22:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3270, "total_steps": 25254, "loss": 0.1609, "learning_rate": 4.871382755349712e-05, "epoch": 0.3884533143264433, "percentage": 12.95, "elapsed_time": "1:59:24", "remaining_time": "13:22:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3280, "total_steps": 25254, "loss": 0.1613, "learning_rate": 4.870365654932716e-05, "epoch": 0.3896412449512948, "percentage": 12.99, "elapsed_time": "1:59:45", "remaining_time": "13:22:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3290, "total_steps": 25254, "loss": 0.161, "learning_rate": 4.869344655772027e-05, "epoch": 0.3908291755761463, "percentage": 13.03, "elapsed_time": "2:00:07", "remaining_time": "13:21:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3300, "total_steps": 25254, "loss": 0.1627, "learning_rate": 4.868319759546972e-05, "epoch": 0.3920171062009979, "percentage": 13.07, "elapsed_time": "2:00:29", "remaining_time": "13:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3310, "total_steps": 25254, "loss": 0.1561, "learning_rate": 4.8672909679432846e-05, "epoch": 0.3932050368258494, "percentage": 13.11, "elapsed_time": "2:00:51", "remaining_time": "13:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3320, "total_steps": 25254, "loss": 0.1578, "learning_rate": 4.866258282653108e-05, "epoch": 0.3943929674507009, "percentage": 13.15, "elapsed_time": "2:01:14", "remaining_time": "13:20:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3330, "total_steps": 25254, "loss": 0.161, "learning_rate": 4.865221705374987e-05, "epoch": 0.3955808980755524, "percentage": 13.19, "elapsed_time": "2:01:36", "remaining_time": "13:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3340, "total_steps": 25254, "loss": 0.1637, "learning_rate": 4.8641812378138695e-05, "epoch": 0.3967688287004039, "percentage": 13.23, "elapsed_time": "2:01:57", "remaining_time": "13:20:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3350, "total_steps": 25254, "loss": 0.1634, "learning_rate": 4.863136881681103e-05, "epoch": 0.3979567593252554, "percentage": 13.27, "elapsed_time": "2:02:19", "remaining_time": "13:19:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3360, "total_steps": 25254, "loss": 0.1596, "learning_rate": 4.862088638694428e-05, "epoch": 0.39914468995010693, "percentage": 13.3, "elapsed_time": "2:02:41", "remaining_time": "13:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3370, "total_steps": 25254, "loss": 0.1605, "learning_rate": 4.8610365105779794e-05, "epoch": 0.40033262057495844, "percentage": 13.34, "elapsed_time": "2:03:02", "remaining_time": "13:19:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3380, "total_steps": 25254, "loss": 0.1585, "learning_rate": 4.859980499062283e-05, "epoch": 0.40152055119980995, "percentage": 13.38, "elapsed_time": "2:03:24", "remaining_time": "13:18:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3390, "total_steps": 25254, "loss": 0.164, "learning_rate": 4.858920605884253e-05, "epoch": 0.40270848182466146, "percentage": 13.42, "elapsed_time": "2:03:46", "remaining_time": "13:18:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3400, "total_steps": 25254, "loss": 0.1648, "learning_rate": 4.857856832787185e-05, "epoch": 0.40389641244951296, "percentage": 13.46, "elapsed_time": "2:04:07", "remaining_time": "13:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3410, "total_steps": 25254, "loss": 0.1634, "learning_rate": 4.856789181520759e-05, "epoch": 0.4050843430743645, "percentage": 13.5, "elapsed_time": "2:04:29", "remaining_time": "13:17:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3420, "total_steps": 25254, "loss": 0.1616, "learning_rate": 4.855717653841031e-05, "epoch": 0.406272273699216, "percentage": 13.54, "elapsed_time": "2:04:51", "remaining_time": "13:17:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3430, "total_steps": 25254, "loss": 0.1618, "learning_rate": 4.854642251510435e-05, "epoch": 0.4074602043240675, "percentage": 13.58, "elapsed_time": "2:05:13", "remaining_time": "13:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3440, "total_steps": 25254, "loss": 0.1637, "learning_rate": 4.8535629762977784e-05, "epoch": 0.408648134948919, "percentage": 13.62, "elapsed_time": "2:05:36", "remaining_time": "13:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3450, "total_steps": 25254, "loss": 0.1604, "learning_rate": 4.852479829978237e-05, "epoch": 0.4098360655737705, "percentage": 13.66, "elapsed_time": "2:05:58", "remaining_time": "13:16:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3460, "total_steps": 25254, "loss": 0.1642, "learning_rate": 4.851392814333354e-05, "epoch": 0.411023996198622, "percentage": 13.7, "elapsed_time": "2:06:20", "remaining_time": "13:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3470, "total_steps": 25254, "loss": 0.1595, "learning_rate": 4.850301931151039e-05, "epoch": 0.4122119268234735, "percentage": 13.74, "elapsed_time": "2:06:42", "remaining_time": "13:15:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3480, "total_steps": 25254, "loss": 0.1625, "learning_rate": 4.849207182225559e-05, "epoch": 0.413399857448325, "percentage": 13.78, "elapsed_time": "2:07:03", "remaining_time": "13:15:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3490, "total_steps": 25254, "loss": 0.164, "learning_rate": 4.848108569357544e-05, "epoch": 0.41458778807317653, "percentage": 13.82, "elapsed_time": "2:07:25", "remaining_time": "13:14:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3500, "total_steps": 25254, "loss": 0.1586, "learning_rate": 4.8470060943539733e-05, "epoch": 0.41577571869802804, "percentage": 13.86, "elapsed_time": "2:07:47", "remaining_time": "13:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3510, "total_steps": 25254, "loss": 0.1621, "learning_rate": 4.845899759028184e-05, "epoch": 0.41696364932287955, "percentage": 13.9, "elapsed_time": "2:08:08", "remaining_time": "13:13:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3520, "total_steps": 25254, "loss": 0.1618, "learning_rate": 4.844789565199862e-05, "epoch": 0.41815157994773106, "percentage": 13.94, "elapsed_time": "2:08:31", "remaining_time": "13:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3530, "total_steps": 25254, "loss": 0.1602, "learning_rate": 4.8436755146950364e-05, "epoch": 0.41933951057258256, "percentage": 13.98, "elapsed_time": "2:08:53", "remaining_time": "13:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3540, "total_steps": 25254, "loss": 0.1607, "learning_rate": 4.842557609346082e-05, "epoch": 0.42052744119743407, "percentage": 14.02, "elapsed_time": "2:09:15", "remaining_time": "13:12:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3550, "total_steps": 25254, "loss": 0.1638, "learning_rate": 4.841435850991714e-05, "epoch": 0.4217153718222856, "percentage": 14.06, "elapsed_time": "2:09:37", "remaining_time": "13:12:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3560, "total_steps": 25254, "loss": 0.1596, "learning_rate": 4.840310241476984e-05, "epoch": 0.4229033024471371, "percentage": 14.1, "elapsed_time": "2:09:58", "remaining_time": "13:12:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3570, "total_steps": 25254, "loss": 0.1591, "learning_rate": 4.83918078265328e-05, "epoch": 0.4240912330719886, "percentage": 14.14, "elapsed_time": "2:10:20", "remaining_time": "13:11:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3580, "total_steps": 25254, "loss": 0.1583, "learning_rate": 4.838047476378318e-05, "epoch": 0.4252791636968401, "percentage": 14.18, "elapsed_time": "2:10:42", "remaining_time": "13:11:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3590, "total_steps": 25254, "loss": 0.1583, "learning_rate": 4.836910324516145e-05, "epoch": 0.4264670943216916, "percentage": 14.22, "elapsed_time": "2:11:04", "remaining_time": "13:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3600, "total_steps": 25254, "loss": 0.1614, "learning_rate": 4.835769328937131e-05, "epoch": 0.4276550249465431, "percentage": 14.26, "elapsed_time": "2:11:26", "remaining_time": "13:10:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3610, "total_steps": 25254, "loss": 0.1581, "learning_rate": 4.834624491517971e-05, "epoch": 0.4288429555713946, "percentage": 14.29, "elapsed_time": "2:11:47", "remaining_time": "13:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3620, "total_steps": 25254, "loss": 0.1633, "learning_rate": 4.833475814141677e-05, "epoch": 0.43003088619624613, "percentage": 14.33, "elapsed_time": "2:12:10", "remaining_time": "13:09:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3630, "total_steps": 25254, "loss": 0.1558, "learning_rate": 4.832323298697576e-05, "epoch": 0.43121881682109764, "percentage": 14.37, "elapsed_time": "2:12:32", "remaining_time": "13:09:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3640, "total_steps": 25254, "loss": 0.1613, "learning_rate": 4.8311669470813095e-05, "epoch": 0.43240674744594915, "percentage": 14.41, "elapsed_time": "2:12:54", "remaining_time": "13:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3650, "total_steps": 25254, "loss": 0.1592, "learning_rate": 4.830006761194828e-05, "epoch": 0.43359467807080065, "percentage": 14.45, "elapsed_time": "2:13:15", "remaining_time": "13:08:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3660, "total_steps": 25254, "loss": 0.1598, "learning_rate": 4.828842742946391e-05, "epoch": 0.43478260869565216, "percentage": 14.49, "elapsed_time": "2:13:37", "remaining_time": "13:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3670, "total_steps": 25254, "loss": 0.1581, "learning_rate": 4.827674894250556e-05, "epoch": 0.43597053932050367, "percentage": 14.53, "elapsed_time": "2:14:00", "remaining_time": "13:08:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3680, "total_steps": 25254, "loss": 0.1574, "learning_rate": 4.826503217028185e-05, "epoch": 0.4371584699453552, "percentage": 14.57, "elapsed_time": "2:14:22", "remaining_time": "13:07:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3690, "total_steps": 25254, "loss": 0.1624, "learning_rate": 4.825327713206437e-05, "epoch": 0.4383464005702067, "percentage": 14.61, "elapsed_time": "2:14:43", "remaining_time": "13:07:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3700, "total_steps": 25254, "loss": 0.1582, "learning_rate": 4.824148384718763e-05, "epoch": 0.4395343311950582, "percentage": 14.65, "elapsed_time": "2:15:04", "remaining_time": "13:06:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3710, "total_steps": 25254, "loss": 0.159, "learning_rate": 4.822965233504905e-05, "epoch": 0.4407222618199097, "percentage": 14.69, "elapsed_time": "2:15:26", "remaining_time": "13:06:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3720, "total_steps": 25254, "loss": 0.1596, "learning_rate": 4.821778261510895e-05, "epoch": 0.4419101924447612, "percentage": 14.73, "elapsed_time": "2:15:48", "remaining_time": "13:06:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3730, "total_steps": 25254, "loss": 0.1574, "learning_rate": 4.8205874706890466e-05, "epoch": 0.4430981230696127, "percentage": 14.77, "elapsed_time": "2:16:10", "remaining_time": "13:05:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3740, "total_steps": 25254, "loss": 0.1636, "learning_rate": 4.819392862997956e-05, "epoch": 0.4442860536944642, "percentage": 14.81, "elapsed_time": "2:16:32", "remaining_time": "13:05:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3750, "total_steps": 25254, "loss": 0.1604, "learning_rate": 4.818194440402496e-05, "epoch": 0.44547398431931573, "percentage": 14.85, "elapsed_time": "2:16:55", "remaining_time": "13:05:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3760, "total_steps": 25254, "loss": 0.1598, "learning_rate": 4.816992204873816e-05, "epoch": 0.44666191494416724, "percentage": 14.89, "elapsed_time": "2:17:16", "remaining_time": "13:04:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3770, "total_steps": 25254, "loss": 0.1582, "learning_rate": 4.815786158389336e-05, "epoch": 0.44784984556901875, "percentage": 14.93, "elapsed_time": "2:17:38", "remaining_time": "13:04:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3780, "total_steps": 25254, "loss": 0.1601, "learning_rate": 4.814576302932744e-05, "epoch": 0.44903777619387025, "percentage": 14.97, "elapsed_time": "2:18:00", "remaining_time": "13:04:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3790, "total_steps": 25254, "loss": 0.1554, "learning_rate": 4.8133626404939924e-05, "epoch": 0.45022570681872176, "percentage": 15.01, "elapsed_time": "2:18:22", "remaining_time": "13:03:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3800, "total_steps": 25254, "loss": 0.1591, "learning_rate": 4.8121451730692954e-05, "epoch": 0.45141363744357327, "percentage": 15.05, "elapsed_time": "2:18:43", "remaining_time": "13:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3810, "total_steps": 25254, "loss": 0.1619, "learning_rate": 4.810923902661128e-05, "epoch": 0.45260156806842483, "percentage": 15.09, "elapsed_time": "2:19:05", "remaining_time": "13:02:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3820, "total_steps": 25254, "loss": 0.1584, "learning_rate": 4.8096988312782174e-05, "epoch": 0.45378949869327634, "percentage": 15.13, "elapsed_time": "2:19:27", "remaining_time": "13:02:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3830, "total_steps": 25254, "loss": 0.1559, "learning_rate": 4.8084699609355436e-05, "epoch": 0.45497742931812785, "percentage": 15.17, "elapsed_time": "2:19:49", "remaining_time": "13:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3840, "total_steps": 25254, "loss": 0.1619, "learning_rate": 4.807237293654334e-05, "epoch": 0.45616535994297935, "percentage": 15.21, "elapsed_time": "2:20:10", "remaining_time": "13:01:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3850, "total_steps": 25254, "loss": 0.157, "learning_rate": 4.806000831462063e-05, "epoch": 0.45735329056783086, "percentage": 15.25, "elapsed_time": "2:20:32", "remaining_time": "13:01:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3860, "total_steps": 25254, "loss": 0.1561, "learning_rate": 4.804760576392448e-05, "epoch": 0.45854122119268237, "percentage": 15.28, "elapsed_time": "2:20:53", "remaining_time": "13:00:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3870, "total_steps": 25254, "loss": 0.1608, "learning_rate": 4.803516530485439e-05, "epoch": 0.4597291518175339, "percentage": 15.32, "elapsed_time": "2:21:16", "remaining_time": "13:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3880, "total_steps": 25254, "loss": 0.1568, "learning_rate": 4.802268695787228e-05, "epoch": 0.4609170824423854, "percentage": 15.36, "elapsed_time": "2:21:38", "remaining_time": "13:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3890, "total_steps": 25254, "loss": 0.1589, "learning_rate": 4.801017074350235e-05, "epoch": 0.4621050130672369, "percentage": 15.4, "elapsed_time": "2:21:59", "remaining_time": "12:59:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3900, "total_steps": 25254, "loss": 0.1585, "learning_rate": 4.7997616682331084e-05, "epoch": 0.4632929436920884, "percentage": 15.44, "elapsed_time": "2:22:21", "remaining_time": "12:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3910, "total_steps": 25254, "loss": 0.1598, "learning_rate": 4.7985024795007236e-05, "epoch": 0.4644808743169399, "percentage": 15.48, "elapsed_time": "2:22:42", "remaining_time": "12:59:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3920, "total_steps": 25254, "loss": 0.1593, "learning_rate": 4.797239510224175e-05, "epoch": 0.4656688049417914, "percentage": 15.52, "elapsed_time": "2:23:04", "remaining_time": "12:58:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3930, "total_steps": 25254, "loss": 0.163, "learning_rate": 4.795972762480777e-05, "epoch": 0.4668567355666429, "percentage": 15.56, "elapsed_time": "2:23:26", "remaining_time": "12:58:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3940, "total_steps": 25254, "loss": 0.1592, "learning_rate": 4.7947022383540585e-05, "epoch": 0.46804466619149443, "percentage": 15.6, "elapsed_time": "2:23:48", "remaining_time": "12:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3950, "total_steps": 25254, "loss": 0.1643, "learning_rate": 4.793427939933759e-05, "epoch": 0.46923259681634594, "percentage": 15.64, "elapsed_time": "2:24:09", "remaining_time": "12:57:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3960, "total_steps": 25254, "loss": 0.162, "learning_rate": 4.792149869315827e-05, "epoch": 0.47042052744119744, "percentage": 15.68, "elapsed_time": "2:24:31", "remaining_time": "12:57:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3970, "total_steps": 25254, "loss": 0.1559, "learning_rate": 4.7908680286024144e-05, "epoch": 0.47160845806604895, "percentage": 15.72, "elapsed_time": "2:24:53", "remaining_time": "12:56:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3980, "total_steps": 25254, "loss": 0.1566, "learning_rate": 4.789582419901875e-05, "epoch": 0.47279638869090046, "percentage": 15.76, "elapsed_time": "2:25:14", "remaining_time": "12:56:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 3990, "total_steps": 25254, "loss": 0.1575, "learning_rate": 4.788293045328759e-05, "epoch": 0.47398431931575197, "percentage": 15.8, "elapsed_time": "2:25:36", "remaining_time": "12:55:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4000, "total_steps": 25254, "loss": 0.1599, "learning_rate": 4.786999907003812e-05, "epoch": 0.4751722499406035, "percentage": 15.84, "elapsed_time": "2:25:58", "remaining_time": "12:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4010, "total_steps": 25254, "loss": 0.1597, "learning_rate": 4.785703007053969e-05, "epoch": 0.476360180565455, "percentage": 15.88, "elapsed_time": "2:26:20", "remaining_time": "12:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4020, "total_steps": 25254, "loss": 0.1544, "learning_rate": 4.7844023476123536e-05, "epoch": 0.4775481111903065, "percentage": 15.92, "elapsed_time": "2:26:42", "remaining_time": "12:54:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4030, "total_steps": 25254, "loss": 0.158, "learning_rate": 4.783097930818271e-05, "epoch": 0.478736041815158, "percentage": 15.96, "elapsed_time": "2:27:03", "remaining_time": "12:54:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4040, "total_steps": 25254, "loss": 0.1567, "learning_rate": 4.781789758817207e-05, "epoch": 0.4799239724400095, "percentage": 16.0, "elapsed_time": "2:27:25", "remaining_time": "12:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4050, "total_steps": 25254, "loss": 0.1605, "learning_rate": 4.780477833760825e-05, "epoch": 0.481111903064861, "percentage": 16.04, "elapsed_time": "2:27:47", "remaining_time": "12:53:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4060, "total_steps": 25254, "loss": 0.1605, "learning_rate": 4.779162157806961e-05, "epoch": 0.4822998336897125, "percentage": 16.08, "elapsed_time": "2:28:08", "remaining_time": "12:53:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4070, "total_steps": 25254, "loss": 0.1593, "learning_rate": 4.7778427331196195e-05, "epoch": 0.48348776431456403, "percentage": 16.12, "elapsed_time": "2:28:31", "remaining_time": "12:53:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4080, "total_steps": 25254, "loss": 0.1593, "learning_rate": 4.7765195618689705e-05, "epoch": 0.48467569493941554, "percentage": 16.16, "elapsed_time": "2:28:52", "remaining_time": "12:52:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4090, "total_steps": 25254, "loss": 0.1602, "learning_rate": 4.7751926462313493e-05, "epoch": 0.48586362556426704, "percentage": 16.2, "elapsed_time": "2:29:15", "remaining_time": "12:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4100, "total_steps": 25254, "loss": 0.1563, "learning_rate": 4.773861988389246e-05, "epoch": 0.48705155618911855, "percentage": 16.24, "elapsed_time": "2:29:37", "remaining_time": "12:51:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4110, "total_steps": 25254, "loss": 0.1553, "learning_rate": 4.7725275905313104e-05, "epoch": 0.48823948681397006, "percentage": 16.27, "elapsed_time": "2:29:59", "remaining_time": "12:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4120, "total_steps": 25254, "loss": 0.159, "learning_rate": 4.771189454852338e-05, "epoch": 0.48942741743882157, "percentage": 16.31, "elapsed_time": "2:30:20", "remaining_time": "12:51:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4130, "total_steps": 25254, "loss": 0.1583, "learning_rate": 4.769847583553276e-05, "epoch": 0.4906153480636731, "percentage": 16.35, "elapsed_time": "2:30:42", "remaining_time": "12:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4140, "total_steps": 25254, "loss": 0.1562, "learning_rate": 4.768501978841217e-05, "epoch": 0.4918032786885246, "percentage": 16.39, "elapsed_time": "2:31:04", "remaining_time": "12:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4150, "total_steps": 25254, "loss": 0.1572, "learning_rate": 4.76715264292939e-05, "epoch": 0.4929912093133761, "percentage": 16.43, "elapsed_time": "2:31:25", "remaining_time": "12:50:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4160, "total_steps": 25254, "loss": 0.1573, "learning_rate": 4.7657995780371654e-05, "epoch": 0.4941791399382276, "percentage": 16.47, "elapsed_time": "2:31:47", "remaining_time": "12:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4170, "total_steps": 25254, "loss": 0.1616, "learning_rate": 4.7644427863900444e-05, "epoch": 0.4953670705630791, "percentage": 16.51, "elapsed_time": "2:32:10", "remaining_time": "12:49:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4180, "total_steps": 25254, "loss": 0.1562, "learning_rate": 4.7630822702196586e-05, "epoch": 0.4965550011879306, "percentage": 16.55, "elapsed_time": "2:32:32", "remaining_time": "12:49:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4190, "total_steps": 25254, "loss": 0.1572, "learning_rate": 4.7617180317637654e-05, "epoch": 0.4977429318127821, "percentage": 16.59, "elapsed_time": "2:32:54", "remaining_time": "12:48:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4200, "total_steps": 25254, "loss": 0.1579, "learning_rate": 4.760350073266245e-05, "epoch": 0.4989308624376336, "percentage": 16.63, "elapsed_time": "2:33:15", "remaining_time": "12:48:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4210, "total_steps": 25254, "loss": 0.1615, "learning_rate": 4.7589783969770965e-05, "epoch": 0.5001187930624852, "percentage": 16.67, "elapsed_time": "2:33:36", "remaining_time": "12:47:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4220, "total_steps": 25254, "loss": 0.1586, "learning_rate": 4.7576030051524325e-05, "epoch": 0.5013067236873366, "percentage": 16.71, "elapsed_time": "2:33:58", "remaining_time": "12:47:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4230, "total_steps": 25254, "loss": 0.1577, "learning_rate": 4.756223900054479e-05, "epoch": 0.5024946543121882, "percentage": 16.75, "elapsed_time": "2:34:20", "remaining_time": "12:47:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4240, "total_steps": 25254, "loss": 0.1546, "learning_rate": 4.754841083951568e-05, "epoch": 0.5036825849370397, "percentage": 16.79, "elapsed_time": "2:34:42", "remaining_time": "12:46:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4250, "total_steps": 25254, "loss": 0.1599, "learning_rate": 4.753454559118135e-05, "epoch": 0.5048705155618912, "percentage": 16.83, "elapsed_time": "2:35:04", "remaining_time": "12:46:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4260, "total_steps": 25254, "loss": 0.1569, "learning_rate": 4.752064327834718e-05, "epoch": 0.5060584461867427, "percentage": 16.87, "elapsed_time": "2:35:26", "remaining_time": "12:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4270, "total_steps": 25254, "loss": 0.1561, "learning_rate": 4.750670392387948e-05, "epoch": 0.5072463768115942, "percentage": 16.91, "elapsed_time": "2:35:48", "remaining_time": "12:45:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4280, "total_steps": 25254, "loss": 0.155, "learning_rate": 4.749272755070552e-05, "epoch": 0.5084343074364457, "percentage": 16.95, "elapsed_time": "2:36:10", "remaining_time": "12:45:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4290, "total_steps": 25254, "loss": 0.1578, "learning_rate": 4.747871418181341e-05, "epoch": 0.5096222380612973, "percentage": 16.99, "elapsed_time": "2:36:33", "remaining_time": "12:45:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4300, "total_steps": 25254, "loss": 0.16, "learning_rate": 4.746466384025217e-05, "epoch": 0.5108101686861487, "percentage": 17.03, "elapsed_time": "2:36:54", "remaining_time": "12:44:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4310, "total_steps": 25254, "loss": 0.1551, "learning_rate": 4.7450576549131585e-05, "epoch": 0.5119980993110003, "percentage": 17.07, "elapsed_time": "2:37:16", "remaining_time": "12:44:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4320, "total_steps": 25254, "loss": 0.1545, "learning_rate": 4.7436452331622236e-05, "epoch": 0.5131860299358517, "percentage": 17.11, "elapsed_time": "2:37:38", "remaining_time": "12:43:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4330, "total_steps": 25254, "loss": 0.154, "learning_rate": 4.7422291210955436e-05, "epoch": 0.5143739605607033, "percentage": 17.15, "elapsed_time": "2:37:59", "remaining_time": "12:43:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4340, "total_steps": 25254, "loss": 0.1554, "learning_rate": 4.740809321042319e-05, "epoch": 0.5155618911855547, "percentage": 17.19, "elapsed_time": "2:38:21", "remaining_time": "12:43:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4350, "total_steps": 25254, "loss": 0.1564, "learning_rate": 4.7393858353378173e-05, "epoch": 0.5167498218104063, "percentage": 17.22, "elapsed_time": "2:38:43", "remaining_time": "12:42:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4360, "total_steps": 25254, "loss": 0.1613, "learning_rate": 4.7379586663233673e-05, "epoch": 0.5179377524352577, "percentage": 17.26, "elapsed_time": "2:39:05", "remaining_time": "12:42:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4370, "total_steps": 25254, "loss": 0.1574, "learning_rate": 4.736527816346356e-05, "epoch": 0.5191256830601093, "percentage": 17.3, "elapsed_time": "2:39:27", "remaining_time": "12:42:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4380, "total_steps": 25254, "loss": 0.1516, "learning_rate": 4.735093287760225e-05, "epoch": 0.5203136136849608, "percentage": 17.34, "elapsed_time": "2:39:49", "remaining_time": "12:41:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4390, "total_steps": 25254, "loss": 0.1581, "learning_rate": 4.733655082924467e-05, "epoch": 0.5215015443098123, "percentage": 17.38, "elapsed_time": "2:40:12", "remaining_time": "12:41:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4400, "total_steps": 25254, "loss": 0.1559, "learning_rate": 4.732213204204622e-05, "epoch": 0.5226894749346638, "percentage": 17.42, "elapsed_time": "2:40:34", "remaining_time": "12:41:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4410, "total_steps": 25254, "loss": 0.1567, "learning_rate": 4.730767653972269e-05, "epoch": 0.5238774055595153, "percentage": 17.46, "elapsed_time": "2:40:55", "remaining_time": "12:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4420, "total_steps": 25254, "loss": 0.1563, "learning_rate": 4.7293184346050296e-05, "epoch": 0.5250653361843668, "percentage": 17.5, "elapsed_time": "2:41:17", "remaining_time": "12:40:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4430, "total_steps": 25254, "loss": 0.1587, "learning_rate": 4.7278655484865595e-05, "epoch": 0.5262532668092184, "percentage": 17.54, "elapsed_time": "2:41:38", "remaining_time": "12:39:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4440, "total_steps": 25254, "loss": 0.1581, "learning_rate": 4.726408998006545e-05, "epoch": 0.5274411974340698, "percentage": 17.58, "elapsed_time": "2:42:00", "remaining_time": "12:39:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4450, "total_steps": 25254, "loss": 0.156, "learning_rate": 4.7249487855606994e-05, "epoch": 0.5286291280589214, "percentage": 17.62, "elapsed_time": "2:42:21", "remaining_time": "12:39:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4460, "total_steps": 25254, "loss": 0.1554, "learning_rate": 4.723484913550759e-05, "epoch": 0.5298170586837728, "percentage": 17.66, "elapsed_time": "2:42:44", "remaining_time": "12:38:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4470, "total_steps": 25254, "loss": 0.1575, "learning_rate": 4.722017384384481e-05, "epoch": 0.5310049893086244, "percentage": 17.7, "elapsed_time": "2:43:06", "remaining_time": "12:38:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4480, "total_steps": 25254, "loss": 0.1541, "learning_rate": 4.720546200475635e-05, "epoch": 0.5321929199334758, "percentage": 17.74, "elapsed_time": "2:43:28", "remaining_time": "12:38:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4490, "total_steps": 25254, "loss": 0.1536, "learning_rate": 4.7190713642440044e-05, "epoch": 0.5333808505583274, "percentage": 17.78, "elapsed_time": "2:43:50", "remaining_time": "12:37:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4500, "total_steps": 25254, "loss": 0.1587, "learning_rate": 4.717592878115378e-05, "epoch": 0.5345687811831789, "percentage": 17.82, "elapsed_time": "2:44:13", "remaining_time": "12:37:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4510, "total_steps": 25254, "loss": 0.1548, "learning_rate": 4.716110744521548e-05, "epoch": 0.5357567118080304, "percentage": 17.86, "elapsed_time": "2:44:35", "remaining_time": "12:37:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4520, "total_steps": 25254, "loss": 0.1604, "learning_rate": 4.714624965900309e-05, "epoch": 0.5369446424328819, "percentage": 17.9, "elapsed_time": "2:44:56", "remaining_time": "12:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4530, "total_steps": 25254, "loss": 0.1548, "learning_rate": 4.7131355446954476e-05, "epoch": 0.5381325730577334, "percentage": 17.94, "elapsed_time": "2:45:18", "remaining_time": "12:36:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4540, "total_steps": 25254, "loss": 0.151, "learning_rate": 4.711642483356742e-05, "epoch": 0.5393205036825849, "percentage": 17.98, "elapsed_time": "2:45:40", "remaining_time": "12:35:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4550, "total_steps": 25254, "loss": 0.1566, "learning_rate": 4.710145784339958e-05, "epoch": 0.5405084343074364, "percentage": 18.02, "elapsed_time": "2:46:02", "remaining_time": "12:35:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4560, "total_steps": 25254, "loss": 0.1529, "learning_rate": 4.708645450106846e-05, "epoch": 0.5416963649322879, "percentage": 18.06, "elapsed_time": "2:46:24", "remaining_time": "12:35:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4570, "total_steps": 25254, "loss": 0.1588, "learning_rate": 4.707141483125133e-05, "epoch": 0.5428842955571395, "percentage": 18.1, "elapsed_time": "2:46:46", "remaining_time": "12:34:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4580, "total_steps": 25254, "loss": 0.1542, "learning_rate": 4.705633885868524e-05, "epoch": 0.544072226181991, "percentage": 18.14, "elapsed_time": "2:47:08", "remaining_time": "12:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4590, "total_steps": 25254, "loss": 0.1561, "learning_rate": 4.704122660816692e-05, "epoch": 0.5452601568068425, "percentage": 18.18, "elapsed_time": "2:47:30", "remaining_time": "12:34:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4600, "total_steps": 25254, "loss": 0.154, "learning_rate": 4.7026078104552794e-05, "epoch": 0.546448087431694, "percentage": 18.21, "elapsed_time": "2:47:51", "remaining_time": "12:33:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4610, "total_steps": 25254, "loss": 0.1574, "learning_rate": 4.7010893372758914e-05, "epoch": 0.5476360180565455, "percentage": 18.25, "elapsed_time": "2:48:13", "remaining_time": "12:33:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4620, "total_steps": 25254, "loss": 0.1568, "learning_rate": 4.699567243776088e-05, "epoch": 0.5488239486813971, "percentage": 18.29, "elapsed_time": "2:48:35", "remaining_time": "12:32:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4630, "total_steps": 25254, "loss": 0.1564, "learning_rate": 4.6980415324593904e-05, "epoch": 0.5500118793062485, "percentage": 18.33, "elapsed_time": "2:48:56", "remaining_time": "12:32:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4640, "total_steps": 25254, "loss": 0.1579, "learning_rate": 4.696512205835265e-05, "epoch": 0.5511998099311001, "percentage": 18.37, "elapsed_time": "2:49:18", "remaining_time": "12:32:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4650, "total_steps": 25254, "loss": 0.1518, "learning_rate": 4.694979266419127e-05, "epoch": 0.5523877405559515, "percentage": 18.41, "elapsed_time": "2:49:40", "remaining_time": "12:31:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4660, "total_steps": 25254, "loss": 0.1598, "learning_rate": 4.693442716732333e-05, "epoch": 0.5535756711808031, "percentage": 18.45, "elapsed_time": "2:50:01", "remaining_time": "12:31:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4670, "total_steps": 25254, "loss": 0.1574, "learning_rate": 4.6919025593021784e-05, "epoch": 0.5547636018056545, "percentage": 18.49, "elapsed_time": "2:50:23", "remaining_time": "12:31:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4680, "total_steps": 25254, "loss": 0.1535, "learning_rate": 4.690358796661891e-05, "epoch": 0.5559515324305061, "percentage": 18.53, "elapsed_time": "2:50:44", "remaining_time": "12:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4690, "total_steps": 25254, "loss": 0.1543, "learning_rate": 4.688811431350632e-05, "epoch": 0.5571394630553576, "percentage": 18.57, "elapsed_time": "2:51:06", "remaining_time": "12:30:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4700, "total_steps": 25254, "loss": 0.16, "learning_rate": 4.6872604659134836e-05, "epoch": 0.5583273936802091, "percentage": 18.61, "elapsed_time": "2:51:28", "remaining_time": "12:29:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4710, "total_steps": 25254, "loss": 0.1568, "learning_rate": 4.6857059029014534e-05, "epoch": 0.5595153243050606, "percentage": 18.65, "elapsed_time": "2:51:49", "remaining_time": "12:29:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4720, "total_steps": 25254, "loss": 0.156, "learning_rate": 4.684147744871463e-05, "epoch": 0.5607032549299121, "percentage": 18.69, "elapsed_time": "2:52:12", "remaining_time": "12:29:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4730, "total_steps": 25254, "loss": 0.1554, "learning_rate": 4.6825859943863493e-05, "epoch": 0.5618911855547636, "percentage": 18.73, "elapsed_time": "2:52:33", "remaining_time": "12:28:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4740, "total_steps": 25254, "loss": 0.1566, "learning_rate": 4.681020654014858e-05, "epoch": 0.5630791161796151, "percentage": 18.77, "elapsed_time": "2:52:54", "remaining_time": "12:28:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4750, "total_steps": 25254, "loss": 0.1552, "learning_rate": 4.679451726331637e-05, "epoch": 0.5642670468044666, "percentage": 18.81, "elapsed_time": "2:53:17", "remaining_time": "12:28:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4760, "total_steps": 25254, "loss": 0.1543, "learning_rate": 4.677879213917237e-05, "epoch": 0.5654549774293182, "percentage": 18.85, "elapsed_time": "2:53:38", "remaining_time": "12:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4770, "total_steps": 25254, "loss": 0.1575, "learning_rate": 4.676303119358104e-05, "epoch": 0.5666429080541696, "percentage": 18.89, "elapsed_time": "2:54:00", "remaining_time": "12:27:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4780, "total_steps": 25254, "loss": 0.1617, "learning_rate": 4.6747234452465774e-05, "epoch": 0.5678308386790212, "percentage": 18.93, "elapsed_time": "2:54:21", "remaining_time": "12:26:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4790, "total_steps": 25254, "loss": 0.1561, "learning_rate": 4.6731401941808806e-05, "epoch": 0.5690187693038726, "percentage": 18.97, "elapsed_time": "2:54:43", "remaining_time": "12:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4800, "total_steps": 25254, "loss": 0.1513, "learning_rate": 4.6715533687651224e-05, "epoch": 0.5702066999287242, "percentage": 19.01, "elapsed_time": "2:55:05", "remaining_time": "12:26:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4810, "total_steps": 25254, "loss": 0.1551, "learning_rate": 4.669962971609292e-05, "epoch": 0.5713946305535756, "percentage": 19.05, "elapsed_time": "2:55:27", "remaining_time": "12:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4820, "total_steps": 25254, "loss": 0.1514, "learning_rate": 4.6683690053292515e-05, "epoch": 0.5725825611784272, "percentage": 19.09, "elapsed_time": "2:55:49", "remaining_time": "12:25:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4830, "total_steps": 25254, "loss": 0.1573, "learning_rate": 4.666771472546734e-05, "epoch": 0.5737704918032787, "percentage": 19.13, "elapsed_time": "2:56:10", "remaining_time": "12:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4840, "total_steps": 25254, "loss": 0.1573, "learning_rate": 4.6651703758893376e-05, "epoch": 0.5749584224281302, "percentage": 19.17, "elapsed_time": "2:56:32", "remaining_time": "12:24:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4850, "total_steps": 25254, "loss": 0.1553, "learning_rate": 4.663565717990525e-05, "epoch": 0.5761463530529817, "percentage": 19.2, "elapsed_time": "2:56:54", "remaining_time": "12:24:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4860, "total_steps": 25254, "loss": 0.1521, "learning_rate": 4.661957501489614e-05, "epoch": 0.5773342836778332, "percentage": 19.24, "elapsed_time": "2:57:16", "remaining_time": "12:23:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4870, "total_steps": 25254, "loss": 0.1563, "learning_rate": 4.6603457290317755e-05, "epoch": 0.5785222143026847, "percentage": 19.28, "elapsed_time": "2:57:38", "remaining_time": "12:23:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4880, "total_steps": 25254, "loss": 0.1556, "learning_rate": 4.658730403268031e-05, "epoch": 0.5797101449275363, "percentage": 19.32, "elapsed_time": "2:57:59", "remaining_time": "12:23:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4890, "total_steps": 25254, "loss": 0.1554, "learning_rate": 4.6571115268552446e-05, "epoch": 0.5808980755523877, "percentage": 19.36, "elapsed_time": "2:58:21", "remaining_time": "12:22:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4900, "total_steps": 25254, "loss": 0.1546, "learning_rate": 4.655489102456122e-05, "epoch": 0.5820860061772393, "percentage": 19.4, "elapsed_time": "2:58:43", "remaining_time": "12:22:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4910, "total_steps": 25254, "loss": 0.1523, "learning_rate": 4.6538631327392024e-05, "epoch": 0.5832739368020907, "percentage": 19.44, "elapsed_time": "2:59:04", "remaining_time": "12:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4920, "total_steps": 25254, "loss": 0.1616, "learning_rate": 4.6522336203788584e-05, "epoch": 0.5844618674269423, "percentage": 19.48, "elapsed_time": "2:59:26", "remaining_time": "12:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4930, "total_steps": 25254, "loss": 0.1565, "learning_rate": 4.6506005680552896e-05, "epoch": 0.5856497980517937, "percentage": 19.52, "elapsed_time": "2:59:48", "remaining_time": "12:21:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4940, "total_steps": 25254, "loss": 0.158, "learning_rate": 4.648963978454516e-05, "epoch": 0.5868377286766453, "percentage": 19.56, "elapsed_time": "3:00:11", "remaining_time": "12:20:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4950, "total_steps": 25254, "loss": 0.1556, "learning_rate": 4.6473238542683775e-05, "epoch": 0.5880256593014968, "percentage": 19.6, "elapsed_time": "3:00:32", "remaining_time": "12:20:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4960, "total_steps": 25254, "loss": 0.1501, "learning_rate": 4.645680198194526e-05, "epoch": 0.5892135899263483, "percentage": 19.64, "elapsed_time": "3:00:54", "remaining_time": "12:20:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4970, "total_steps": 25254, "loss": 0.1576, "learning_rate": 4.6440330129364244e-05, "epoch": 0.5904015205511998, "percentage": 19.68, "elapsed_time": "3:01:17", "remaining_time": "12:19:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4980, "total_steps": 25254, "loss": 0.1519, "learning_rate": 4.642382301203341e-05, "epoch": 0.5915894511760513, "percentage": 19.72, "elapsed_time": "3:01:38", "remaining_time": "12:19:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 4990, "total_steps": 25254, "loss": 0.155, "learning_rate": 4.6407280657103404e-05, "epoch": 0.5927773818009028, "percentage": 19.76, "elapsed_time": "3:02:00", "remaining_time": "12:19:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5000, "total_steps": 25254, "loss": 0.1553, "learning_rate": 4.639070309178286e-05, "epoch": 0.5939653124257543, "percentage": 19.8, "elapsed_time": "3:02:21", "remaining_time": "12:18:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5010, "total_steps": 25254, "loss": 0.155, "learning_rate": 4.637409034333834e-05, "epoch": 0.5951532430506058, "percentage": 19.84, "elapsed_time": "3:02:43", "remaining_time": "12:18:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5020, "total_steps": 25254, "loss": 0.1605, "learning_rate": 4.635744243909424e-05, "epoch": 0.5963411736754574, "percentage": 19.88, "elapsed_time": "3:03:05", "remaining_time": "12:17:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5030, "total_steps": 25254, "loss": 0.1535, "learning_rate": 4.6340759406432805e-05, "epoch": 0.5975291043003088, "percentage": 19.92, "elapsed_time": "3:03:27", "remaining_time": "12:17:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5040, "total_steps": 25254, "loss": 0.1557, "learning_rate": 4.632404127279404e-05, "epoch": 0.5987170349251604, "percentage": 19.96, "elapsed_time": "3:03:49", "remaining_time": "12:17:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5050, "total_steps": 25254, "loss": 0.155, "learning_rate": 4.63072880656757e-05, "epoch": 0.5999049655500118, "percentage": 20.0, "elapsed_time": "3:04:11", "remaining_time": "12:16:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5060, "total_steps": 25254, "loss": 0.1564, "learning_rate": 4.629049981263323e-05, "epoch": 0.6010928961748634, "percentage": 20.04, "elapsed_time": "3:04:33", "remaining_time": "12:16:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5070, "total_steps": 25254, "loss": 0.1546, "learning_rate": 4.6273676541279686e-05, "epoch": 0.6022808267997148, "percentage": 20.08, "elapsed_time": "3:04:55", "remaining_time": "12:16:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5080, "total_steps": 25254, "loss": 0.1552, "learning_rate": 4.6256818279285773e-05, "epoch": 0.6034687574245664, "percentage": 20.12, "elapsed_time": "3:05:17", "remaining_time": "12:15:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5090, "total_steps": 25254, "loss": 0.1535, "learning_rate": 4.62399250543797e-05, "epoch": 0.604656688049418, "percentage": 20.16, "elapsed_time": "3:05:39", "remaining_time": "12:15:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5100, "total_steps": 25254, "loss": 0.1544, "learning_rate": 4.62229968943472e-05, "epoch": 0.6058446186742694, "percentage": 20.19, "elapsed_time": "3:06:01", "remaining_time": "12:15:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5110, "total_steps": 25254, "loss": 0.156, "learning_rate": 4.620603382703149e-05, "epoch": 0.607032549299121, "percentage": 20.23, "elapsed_time": "3:06:22", "remaining_time": "12:14:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5120, "total_steps": 25254, "loss": 0.1566, "learning_rate": 4.618903588033318e-05, "epoch": 0.6082204799239724, "percentage": 20.27, "elapsed_time": "3:06:44", "remaining_time": "12:14:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5130, "total_steps": 25254, "loss": 0.1535, "learning_rate": 4.6172003082210225e-05, "epoch": 0.609408410548824, "percentage": 20.31, "elapsed_time": "3:07:06", "remaining_time": "12:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5140, "total_steps": 25254, "loss": 0.1569, "learning_rate": 4.6154935460677954e-05, "epoch": 0.6105963411736754, "percentage": 20.35, "elapsed_time": "3:07:28", "remaining_time": "12:13:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5150, "total_steps": 25254, "loss": 0.1498, "learning_rate": 4.613783304380893e-05, "epoch": 0.611784271798527, "percentage": 20.39, "elapsed_time": "3:07:50", "remaining_time": "12:13:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5160, "total_steps": 25254, "loss": 0.1537, "learning_rate": 4.612069585973299e-05, "epoch": 0.6129722024233785, "percentage": 20.43, "elapsed_time": "3:08:12", "remaining_time": "12:12:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5170, "total_steps": 25254, "loss": 0.1523, "learning_rate": 4.61035239366371e-05, "epoch": 0.61416013304823, "percentage": 20.47, "elapsed_time": "3:08:34", "remaining_time": "12:12:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5180, "total_steps": 25254, "loss": 0.153, "learning_rate": 4.6086317302765414e-05, "epoch": 0.6153480636730815, "percentage": 20.51, "elapsed_time": "3:08:56", "remaining_time": "12:12:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5190, "total_steps": 25254, "loss": 0.154, "learning_rate": 4.6069075986419165e-05, "epoch": 0.616535994297933, "percentage": 20.55, "elapsed_time": "3:09:17", "remaining_time": "12:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5200, "total_steps": 25254, "loss": 0.1552, "learning_rate": 4.60518000159566e-05, "epoch": 0.6177239249227845, "percentage": 20.59, "elapsed_time": "3:09:39", "remaining_time": "12:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5210, "total_steps": 25254, "loss": 0.1501, "learning_rate": 4.603448941979301e-05, "epoch": 0.6189118555476361, "percentage": 20.63, "elapsed_time": "3:10:00", "remaining_time": "12:11:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5220, "total_steps": 25254, "loss": 0.1521, "learning_rate": 4.601714422640061e-05, "epoch": 0.6200997861724875, "percentage": 20.67, "elapsed_time": "3:10:22", "remaining_time": "12:10:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5230, "total_steps": 25254, "loss": 0.157, "learning_rate": 4.5999764464308524e-05, "epoch": 0.6212877167973391, "percentage": 20.71, "elapsed_time": "3:10:44", "remaining_time": "12:10:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5240, "total_steps": 25254, "loss": 0.1537, "learning_rate": 4.598235016210274e-05, "epoch": 0.6224756474221905, "percentage": 20.75, "elapsed_time": "3:11:06", "remaining_time": "12:09:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5250, "total_steps": 25254, "loss": 0.1561, "learning_rate": 4.596490134842606e-05, "epoch": 0.6236635780470421, "percentage": 20.79, "elapsed_time": "3:11:27", "remaining_time": "12:09:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5260, "total_steps": 25254, "loss": 0.15, "learning_rate": 4.594741805197804e-05, "epoch": 0.6248515086718935, "percentage": 20.83, "elapsed_time": "3:11:49", "remaining_time": "12:09:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5270, "total_steps": 25254, "loss": 0.156, "learning_rate": 4.592990030151495e-05, "epoch": 0.6260394392967451, "percentage": 20.87, "elapsed_time": "3:12:12", "remaining_time": "12:08:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5280, "total_steps": 25254, "loss": 0.1509, "learning_rate": 4.5912348125849745e-05, "epoch": 0.6272273699215966, "percentage": 20.91, "elapsed_time": "3:12:34", "remaining_time": "12:08:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5290, "total_steps": 25254, "loss": 0.1529, "learning_rate": 4.5894761553852e-05, "epoch": 0.6284153005464481, "percentage": 20.95, "elapsed_time": "3:12:56", "remaining_time": "12:08:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5300, "total_steps": 25254, "loss": 0.1549, "learning_rate": 4.587714061444784e-05, "epoch": 0.6296032311712996, "percentage": 20.99, "elapsed_time": "3:13:18", "remaining_time": "12:07:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5310, "total_steps": 25254, "loss": 0.1537, "learning_rate": 4.5859485336619956e-05, "epoch": 0.6307911617961511, "percentage": 21.03, "elapsed_time": "3:13:40", "remaining_time": "12:07:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5320, "total_steps": 25254, "loss": 0.1539, "learning_rate": 4.5841795749407486e-05, "epoch": 0.6319790924210026, "percentage": 21.07, "elapsed_time": "3:14:02", "remaining_time": "12:07:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5330, "total_steps": 25254, "loss": 0.154, "learning_rate": 4.5824071881906006e-05, "epoch": 0.6331670230458541, "percentage": 21.11, "elapsed_time": "3:14:23", "remaining_time": "12:06:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5340, "total_steps": 25254, "loss": 0.1564, "learning_rate": 4.580631376326749e-05, "epoch": 0.6343549536707056, "percentage": 21.15, "elapsed_time": "3:14:45", "remaining_time": "12:06:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5350, "total_steps": 25254, "loss": 0.1542, "learning_rate": 4.578852142270024e-05, "epoch": 0.6355428842955572, "percentage": 21.18, "elapsed_time": "3:15:07", "remaining_time": "12:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5360, "total_steps": 25254, "loss": 0.1491, "learning_rate": 4.577069488946883e-05, "epoch": 0.6367308149204086, "percentage": 21.22, "elapsed_time": "3:15:29", "remaining_time": "12:05:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5370, "total_steps": 25254, "loss": 0.1558, "learning_rate": 4.5752834192894115e-05, "epoch": 0.6379187455452602, "percentage": 21.26, "elapsed_time": "3:15:50", "remaining_time": "12:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5380, "total_steps": 25254, "loss": 0.1561, "learning_rate": 4.5734939362353093e-05, "epoch": 0.6391066761701116, "percentage": 21.3, "elapsed_time": "3:16:12", "remaining_time": "12:04:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5390, "total_steps": 25254, "loss": 0.1567, "learning_rate": 4.571701042727893e-05, "epoch": 0.6402946067949632, "percentage": 21.34, "elapsed_time": "3:16:34", "remaining_time": "12:04:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5400, "total_steps": 25254, "loss": 0.1526, "learning_rate": 4.5699047417160887e-05, "epoch": 0.6414825374198146, "percentage": 21.38, "elapsed_time": "3:16:56", "remaining_time": "12:04:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5410, "total_steps": 25254, "loss": 0.1515, "learning_rate": 4.5681050361544266e-05, "epoch": 0.6426704680446662, "percentage": 21.42, "elapsed_time": "3:17:18", "remaining_time": "12:03:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5420, "total_steps": 25254, "loss": 0.1549, "learning_rate": 4.566301929003036e-05, "epoch": 0.6438583986695177, "percentage": 21.46, "elapsed_time": "3:17:40", "remaining_time": "12:03:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5430, "total_steps": 25254, "loss": 0.1514, "learning_rate": 4.564495423227644e-05, "epoch": 0.6450463292943692, "percentage": 21.5, "elapsed_time": "3:18:02", "remaining_time": "12:02:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5440, "total_steps": 25254, "loss": 0.152, "learning_rate": 4.562685521799564e-05, "epoch": 0.6462342599192207, "percentage": 21.54, "elapsed_time": "3:18:23", "remaining_time": "12:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5450, "total_steps": 25254, "loss": 0.1527, "learning_rate": 4.5608722276956954e-05, "epoch": 0.6474221905440722, "percentage": 21.58, "elapsed_time": "3:18:45", "remaining_time": "12:02:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5460, "total_steps": 25254, "loss": 0.1552, "learning_rate": 4.5590555438985207e-05, "epoch": 0.6486101211689237, "percentage": 21.62, "elapsed_time": "3:19:07", "remaining_time": "12:01:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5470, "total_steps": 25254, "loss": 0.1529, "learning_rate": 4.557235473396093e-05, "epoch": 0.6497980517937753, "percentage": 21.66, "elapsed_time": "3:19:29", "remaining_time": "12:01:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5480, "total_steps": 25254, "loss": 0.1501, "learning_rate": 4.55541201918204e-05, "epoch": 0.6509859824186267, "percentage": 21.7, "elapsed_time": "3:19:50", "remaining_time": "12:01:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5490, "total_steps": 25254, "loss": 0.1512, "learning_rate": 4.5535851842555536e-05, "epoch": 0.6521739130434783, "percentage": 21.74, "elapsed_time": "3:20:12", "remaining_time": "12:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5500, "total_steps": 25254, "loss": 0.1491, "learning_rate": 4.5517549716213845e-05, "epoch": 0.6533618436683297, "percentage": 21.78, "elapsed_time": "3:20:34", "remaining_time": "12:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5510, "total_steps": 25254, "loss": 0.1498, "learning_rate": 4.5499213842898426e-05, "epoch": 0.6545497742931813, "percentage": 21.82, "elapsed_time": "3:20:55", "remaining_time": "11:59:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5520, "total_steps": 25254, "loss": 0.1585, "learning_rate": 4.548084425276783e-05, "epoch": 0.6557377049180327, "percentage": 21.86, "elapsed_time": "3:21:16", "remaining_time": "11:59:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5530, "total_steps": 25254, "loss": 0.1571, "learning_rate": 4.546244097603612e-05, "epoch": 0.6569256355428843, "percentage": 21.9, "elapsed_time": "3:21:38", "remaining_time": "11:59:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5540, "total_steps": 25254, "loss": 0.1568, "learning_rate": 4.5444004042972744e-05, "epoch": 0.6581135661677358, "percentage": 21.94, "elapsed_time": "3:22:01", "remaining_time": "11:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5550, "total_steps": 25254, "loss": 0.1536, "learning_rate": 4.5425533483902494e-05, "epoch": 0.6593014967925873, "percentage": 21.98, "elapsed_time": "3:22:22", "remaining_time": "11:58:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5560, "total_steps": 25254, "loss": 0.1579, "learning_rate": 4.5407029329205494e-05, "epoch": 0.6604894274174388, "percentage": 22.02, "elapsed_time": "3:22:45", "remaining_time": "11:58:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5570, "total_steps": 25254, "loss": 0.155, "learning_rate": 4.538849160931711e-05, "epoch": 0.6616773580422903, "percentage": 22.06, "elapsed_time": "3:23:07", "remaining_time": "11:57:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5580, "total_steps": 25254, "loss": 0.1479, "learning_rate": 4.536992035472793e-05, "epoch": 0.6628652886671419, "percentage": 22.1, "elapsed_time": "3:23:28", "remaining_time": "11:57:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5590, "total_steps": 25254, "loss": 0.1524, "learning_rate": 4.5351315595983666e-05, "epoch": 0.6640532192919933, "percentage": 22.14, "elapsed_time": "3:23:50", "remaining_time": "11:57:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5600, "total_steps": 25254, "loss": 0.152, "learning_rate": 4.533267736368518e-05, "epoch": 0.6652411499168449, "percentage": 22.17, "elapsed_time": "3:24:12", "remaining_time": "11:56:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5610, "total_steps": 25254, "loss": 0.1559, "learning_rate": 4.5314005688488356e-05, "epoch": 0.6664290805416964, "percentage": 22.21, "elapsed_time": "3:24:34", "remaining_time": "11:56:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5620, "total_steps": 25254, "loss": 0.1564, "learning_rate": 4.529530060110412e-05, "epoch": 0.6676170111665479, "percentage": 22.25, "elapsed_time": "3:24:55", "remaining_time": "11:55:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5630, "total_steps": 25254, "loss": 0.151, "learning_rate": 4.5276562132298315e-05, "epoch": 0.6688049417913994, "percentage": 22.29, "elapsed_time": "3:25:16", "remaining_time": "11:55:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5640, "total_steps": 25254, "loss": 0.1496, "learning_rate": 4.5257790312891726e-05, "epoch": 0.6699928724162509, "percentage": 22.33, "elapsed_time": "3:25:37", "remaining_time": "11:55:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5650, "total_steps": 25254, "loss": 0.1559, "learning_rate": 4.523898517375995e-05, "epoch": 0.6711808030411024, "percentage": 22.37, "elapsed_time": "3:26:00", "remaining_time": "11:54:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5660, "total_steps": 25254, "loss": 0.1507, "learning_rate": 4.522014674583344e-05, "epoch": 0.672368733665954, "percentage": 22.41, "elapsed_time": "3:26:21", "remaining_time": "11:54:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5670, "total_steps": 25254, "loss": 0.1512, "learning_rate": 4.520127506009735e-05, "epoch": 0.6735566642908054, "percentage": 22.45, "elapsed_time": "3:26:43", "remaining_time": "11:54:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5680, "total_steps": 25254, "loss": 0.1561, "learning_rate": 4.518237014759157e-05, "epoch": 0.674744594915657, "percentage": 22.49, "elapsed_time": "3:27:05", "remaining_time": "11:53:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5690, "total_steps": 25254, "loss": 0.1557, "learning_rate": 4.516343203941063e-05, "epoch": 0.6759325255405084, "percentage": 22.53, "elapsed_time": "3:27:27", "remaining_time": "11:53:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5700, "total_steps": 25254, "loss": 0.1539, "learning_rate": 4.514446076670367e-05, "epoch": 0.67712045616536, "percentage": 22.57, "elapsed_time": "3:27:49", "remaining_time": "11:52:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5710, "total_steps": 25254, "loss": 0.1539, "learning_rate": 4.5125456360674354e-05, "epoch": 0.6783083867902114, "percentage": 22.61, "elapsed_time": "3:28:11", "remaining_time": "11:52:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5720, "total_steps": 25254, "loss": 0.1528, "learning_rate": 4.5106418852580866e-05, "epoch": 0.679496317415063, "percentage": 22.65, "elapsed_time": "3:28:32", "remaining_time": "11:52:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5730, "total_steps": 25254, "loss": 0.1529, "learning_rate": 4.508734827373582e-05, "epoch": 0.6806842480399145, "percentage": 22.69, "elapsed_time": "3:28:54", "remaining_time": "11:51:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5740, "total_steps": 25254, "loss": 0.1539, "learning_rate": 4.506824465550625e-05, "epoch": 0.681872178664766, "percentage": 22.73, "elapsed_time": "3:29:16", "remaining_time": "11:51:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5750, "total_steps": 25254, "loss": 0.1552, "learning_rate": 4.504910802931351e-05, "epoch": 0.6830601092896175, "percentage": 22.77, "elapsed_time": "3:29:38", "remaining_time": "11:51:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5760, "total_steps": 25254, "loss": 0.1496, "learning_rate": 4.502993842663324e-05, "epoch": 0.684248039914469, "percentage": 22.81, "elapsed_time": "3:29:59", "remaining_time": "11:50:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5770, "total_steps": 25254, "loss": 0.1524, "learning_rate": 4.501073587899534e-05, "epoch": 0.6854359705393205, "percentage": 22.85, "elapsed_time": "3:30:22", "remaining_time": "11:50:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5780, "total_steps": 25254, "loss": 0.1506, "learning_rate": 4.4991500417983876e-05, "epoch": 0.686623901164172, "percentage": 22.89, "elapsed_time": "3:30:43", "remaining_time": "11:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5790, "total_steps": 25254, "loss": 0.1499, "learning_rate": 4.4972232075237075e-05, "epoch": 0.6878118317890235, "percentage": 22.93, "elapsed_time": "3:31:04", "remaining_time": "11:49:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5800, "total_steps": 25254, "loss": 0.1523, "learning_rate": 4.495293088244722e-05, "epoch": 0.6889997624138751, "percentage": 22.97, "elapsed_time": "3:31:26", "remaining_time": "11:49:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5810, "total_steps": 25254, "loss": 0.1506, "learning_rate": 4.493359687136064e-05, "epoch": 0.6901876930387265, "percentage": 23.01, "elapsed_time": "3:31:49", "remaining_time": "11:48:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5820, "total_steps": 25254, "loss": 0.1555, "learning_rate": 4.4914230073777654e-05, "epoch": 0.6913756236635781, "percentage": 23.05, "elapsed_time": "3:32:11", "remaining_time": "11:48:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5830, "total_steps": 25254, "loss": 0.1516, "learning_rate": 4.489483052155248e-05, "epoch": 0.6925635542884295, "percentage": 23.09, "elapsed_time": "3:32:32", "remaining_time": "11:48:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5840, "total_steps": 25254, "loss": 0.1472, "learning_rate": 4.4875398246593234e-05, "epoch": 0.6937514849132811, "percentage": 23.13, "elapsed_time": "3:32:54", "remaining_time": "11:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5850, "total_steps": 25254, "loss": 0.1499, "learning_rate": 4.4855933280861836e-05, "epoch": 0.6949394155381325, "percentage": 23.16, "elapsed_time": "3:33:16", "remaining_time": "11:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5860, "total_steps": 25254, "loss": 0.1506, "learning_rate": 4.4836435656373995e-05, "epoch": 0.6961273461629841, "percentage": 23.2, "elapsed_time": "3:33:37", "remaining_time": "11:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5870, "total_steps": 25254, "loss": 0.1523, "learning_rate": 4.481690540519913e-05, "epoch": 0.6973152767878356, "percentage": 23.24, "elapsed_time": "3:33:59", "remaining_time": "11:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5880, "total_steps": 25254, "loss": 0.153, "learning_rate": 4.479734255946031e-05, "epoch": 0.6985032074126871, "percentage": 23.28, "elapsed_time": "3:34:21", "remaining_time": "11:46:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5890, "total_steps": 25254, "loss": 0.1551, "learning_rate": 4.477774715133422e-05, "epoch": 0.6996911380375386, "percentage": 23.32, "elapsed_time": "3:34:43", "remaining_time": "11:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5900, "total_steps": 25254, "loss": 0.1527, "learning_rate": 4.475811921305112e-05, "epoch": 0.7008790686623901, "percentage": 23.36, "elapsed_time": "3:35:04", "remaining_time": "11:45:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5910, "total_steps": 25254, "loss": 0.1536, "learning_rate": 4.4738458776894754e-05, "epoch": 0.7020669992872416, "percentage": 23.4, "elapsed_time": "3:35:27", "remaining_time": "11:45:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5920, "total_steps": 25254, "loss": 0.1522, "learning_rate": 4.471876587520234e-05, "epoch": 0.7032549299120932, "percentage": 23.44, "elapsed_time": "3:35:48", "remaining_time": "11:44:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5930, "total_steps": 25254, "loss": 0.1498, "learning_rate": 4.469904054036448e-05, "epoch": 0.7044428605369446, "percentage": 23.48, "elapsed_time": "3:36:09", "remaining_time": "11:44:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5940, "total_steps": 25254, "loss": 0.1488, "learning_rate": 4.467928280482511e-05, "epoch": 0.7056307911617962, "percentage": 23.52, "elapsed_time": "3:36:31", "remaining_time": "11:44:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5950, "total_steps": 25254, "loss": 0.1517, "learning_rate": 4.4659492701081486e-05, "epoch": 0.7068187217866476, "percentage": 23.56, "elapsed_time": "3:36:53", "remaining_time": "11:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5960, "total_steps": 25254, "loss": 0.1532, "learning_rate": 4.4639670261684083e-05, "epoch": 0.7080066524114992, "percentage": 23.6, "elapsed_time": "3:37:15", "remaining_time": "11:43:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5970, "total_steps": 25254, "loss": 0.1505, "learning_rate": 4.461981551923657e-05, "epoch": 0.7091945830363506, "percentage": 23.64, "elapsed_time": "3:37:37", "remaining_time": "11:42:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5980, "total_steps": 25254, "loss": 0.1467, "learning_rate": 4.459992850639574e-05, "epoch": 0.7103825136612022, "percentage": 23.68, "elapsed_time": "3:37:59", "remaining_time": "11:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 5990, "total_steps": 25254, "loss": 0.1519, "learning_rate": 4.458000925587148e-05, "epoch": 0.7115704442860536, "percentage": 23.72, "elapsed_time": "3:38:20", "remaining_time": "11:42:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6000, "total_steps": 25254, "loss": 0.1559, "learning_rate": 4.456005780042668e-05, "epoch": 0.7127583749109052, "percentage": 23.76, "elapsed_time": "3:38:42", "remaining_time": "11:41:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6010, "total_steps": 25254, "loss": 0.1497, "learning_rate": 4.45400741728772e-05, "epoch": 0.7139463055357567, "percentage": 23.8, "elapsed_time": "3:39:04", "remaining_time": "11:41:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6020, "total_steps": 25254, "loss": 0.1548, "learning_rate": 4.4520058406091846e-05, "epoch": 0.7151342361606082, "percentage": 23.84, "elapsed_time": "3:39:26", "remaining_time": "11:41:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6030, "total_steps": 25254, "loss": 0.1552, "learning_rate": 4.450001053299226e-05, "epoch": 0.7163221667854597, "percentage": 23.88, "elapsed_time": "3:39:47", "remaining_time": "11:40:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6040, "total_steps": 25254, "loss": 0.1495, "learning_rate": 4.44799305865529e-05, "epoch": 0.7175100974103112, "percentage": 23.92, "elapsed_time": "3:40:09", "remaining_time": "11:40:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6050, "total_steps": 25254, "loss": 0.1471, "learning_rate": 4.445981859980097e-05, "epoch": 0.7186980280351627, "percentage": 23.96, "elapsed_time": "3:40:31", "remaining_time": "11:40:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6060, "total_steps": 25254, "loss": 0.1535, "learning_rate": 4.4439674605816385e-05, "epoch": 0.7198859586600143, "percentage": 24.0, "elapsed_time": "3:40:53", "remaining_time": "11:39:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6070, "total_steps": 25254, "loss": 0.15, "learning_rate": 4.4419498637731694e-05, "epoch": 0.7210738892848657, "percentage": 24.04, "elapsed_time": "3:41:15", "remaining_time": "11:39:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6080, "total_steps": 25254, "loss": 0.1477, "learning_rate": 4.439929072873204e-05, "epoch": 0.7222618199097173, "percentage": 24.08, "elapsed_time": "3:41:37", "remaining_time": "11:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6090, "total_steps": 25254, "loss": 0.1485, "learning_rate": 4.437905091205512e-05, "epoch": 0.7234497505345688, "percentage": 24.11, "elapsed_time": "3:41:59", "remaining_time": "11:38:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6100, "total_steps": 25254, "loss": 0.1469, "learning_rate": 4.4358779220991074e-05, "epoch": 0.7246376811594203, "percentage": 24.15, "elapsed_time": "3:42:21", "remaining_time": "11:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6110, "total_steps": 25254, "loss": 0.1525, "learning_rate": 4.433847568888251e-05, "epoch": 0.7258256117842719, "percentage": 24.19, "elapsed_time": "3:42:44", "remaining_time": "11:37:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6120, "total_steps": 25254, "loss": 0.1491, "learning_rate": 4.431814034912438e-05, "epoch": 0.7270135424091233, "percentage": 24.23, "elapsed_time": "3:43:06", "remaining_time": "11:37:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6130, "total_steps": 25254, "loss": 0.1499, "learning_rate": 4.429777323516397e-05, "epoch": 0.7282014730339749, "percentage": 24.27, "elapsed_time": "3:43:27", "remaining_time": "11:37:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6140, "total_steps": 25254, "loss": 0.1542, "learning_rate": 4.42773743805008e-05, "epoch": 0.7293894036588263, "percentage": 24.31, "elapsed_time": "3:43:49", "remaining_time": "11:36:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6150, "total_steps": 25254, "loss": 0.1474, "learning_rate": 4.4256943818686635e-05, "epoch": 0.7305773342836779, "percentage": 24.35, "elapsed_time": "3:44:11", "remaining_time": "11:36:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6160, "total_steps": 25254, "loss": 0.1531, "learning_rate": 4.4236481583325364e-05, "epoch": 0.7317652649085293, "percentage": 24.39, "elapsed_time": "3:44:33", "remaining_time": "11:36:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6170, "total_steps": 25254, "loss": 0.1511, "learning_rate": 4.421598770807297e-05, "epoch": 0.7329531955333809, "percentage": 24.43, "elapsed_time": "3:44:54", "remaining_time": "11:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6180, "total_steps": 25254, "loss": 0.1497, "learning_rate": 4.419546222663752e-05, "epoch": 0.7341411261582323, "percentage": 24.47, "elapsed_time": "3:45:16", "remaining_time": "11:35:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6190, "total_steps": 25254, "loss": 0.1497, "learning_rate": 4.417490517277899e-05, "epoch": 0.7353290567830839, "percentage": 24.51, "elapsed_time": "3:45:38", "remaining_time": "11:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6200, "total_steps": 25254, "loss": 0.1536, "learning_rate": 4.415431658030936e-05, "epoch": 0.7365169874079354, "percentage": 24.55, "elapsed_time": "3:46:00", "remaining_time": "11:34:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6210, "total_steps": 25254, "loss": 0.1489, "learning_rate": 4.413369648309246e-05, "epoch": 0.7377049180327869, "percentage": 24.59, "elapsed_time": "3:46:22", "remaining_time": "11:34:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6220, "total_steps": 25254, "loss": 0.1531, "learning_rate": 4.41130449150439e-05, "epoch": 0.7388928486576384, "percentage": 24.63, "elapsed_time": "3:46:45", "remaining_time": "11:33:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6230, "total_steps": 25254, "loss": 0.1477, "learning_rate": 4.4092361910131106e-05, "epoch": 0.7400807792824899, "percentage": 24.67, "elapsed_time": "3:47:06", "remaining_time": "11:33:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6240, "total_steps": 25254, "loss": 0.1556, "learning_rate": 4.4071647502373197e-05, "epoch": 0.7412687099073414, "percentage": 24.71, "elapsed_time": "3:47:28", "remaining_time": "11:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6250, "total_steps": 25254, "loss": 0.1514, "learning_rate": 4.405090172584092e-05, "epoch": 0.742456640532193, "percentage": 24.75, "elapsed_time": "3:47:50", "remaining_time": "11:32:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6260, "total_steps": 25254, "loss": 0.1536, "learning_rate": 4.4030124614656644e-05, "epoch": 0.7436445711570444, "percentage": 24.79, "elapsed_time": "3:48:12", "remaining_time": "11:32:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6270, "total_steps": 25254, "loss": 0.1499, "learning_rate": 4.4009316202994254e-05, "epoch": 0.744832501781896, "percentage": 24.83, "elapsed_time": "3:48:34", "remaining_time": "11:32:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6280, "total_steps": 25254, "loss": 0.1504, "learning_rate": 4.398847652507914e-05, "epoch": 0.7460204324067474, "percentage": 24.87, "elapsed_time": "3:48:56", "remaining_time": "11:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6290, "total_steps": 25254, "loss": 0.1497, "learning_rate": 4.3967605615188106e-05, "epoch": 0.747208363031599, "percentage": 24.91, "elapsed_time": "3:49:17", "remaining_time": "11:31:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6300, "total_steps": 25254, "loss": 0.1512, "learning_rate": 4.394670350764932e-05, "epoch": 0.7483962936564504, "percentage": 24.95, "elapsed_time": "3:49:39", "remaining_time": "11:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6310, "total_steps": 25254, "loss": 0.1527, "learning_rate": 4.392577023684229e-05, "epoch": 0.749584224281302, "percentage": 24.99, "elapsed_time": "3:50:00", "remaining_time": "11:30:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6320, "total_steps": 25254, "loss": 0.1479, "learning_rate": 4.3904805837197737e-05, "epoch": 0.7507721549061535, "percentage": 25.03, "elapsed_time": "3:50:22", "remaining_time": "11:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6330, "total_steps": 25254, "loss": 0.1489, "learning_rate": 4.388381034319762e-05, "epoch": 0.751960085531005, "percentage": 25.07, "elapsed_time": "3:50:43", "remaining_time": "11:29:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6340, "total_steps": 25254, "loss": 0.1491, "learning_rate": 4.386278378937503e-05, "epoch": 0.7531480161558565, "percentage": 25.1, "elapsed_time": "3:51:05", "remaining_time": "11:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6350, "total_steps": 25254, "loss": 0.1496, "learning_rate": 4.3841726210314136e-05, "epoch": 0.754335946780708, "percentage": 25.14, "elapsed_time": "3:51:27", "remaining_time": "11:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6360, "total_steps": 25254, "loss": 0.1514, "learning_rate": 4.382063764065016e-05, "epoch": 0.7555238774055595, "percentage": 25.18, "elapsed_time": "3:51:48", "remaining_time": "11:28:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6370, "total_steps": 25254, "loss": 0.1519, "learning_rate": 4.379951811506926e-05, "epoch": 0.756711808030411, "percentage": 25.22, "elapsed_time": "3:52:10", "remaining_time": "11:28:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6380, "total_steps": 25254, "loss": 0.1514, "learning_rate": 4.377836766830855e-05, "epoch": 0.7578997386552625, "percentage": 25.26, "elapsed_time": "3:52:32", "remaining_time": "11:27:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6390, "total_steps": 25254, "loss": 0.1474, "learning_rate": 4.375718633515597e-05, "epoch": 0.7590876692801141, "percentage": 25.3, "elapsed_time": "3:52:55", "remaining_time": "11:27:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6400, "total_steps": 25254, "loss": 0.1508, "learning_rate": 4.3735974150450275e-05, "epoch": 0.7602755999049655, "percentage": 25.34, "elapsed_time": "3:53:17", "remaining_time": "11:27:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6410, "total_steps": 25254, "loss": 0.1521, "learning_rate": 4.371473114908098e-05, "epoch": 0.7614635305298171, "percentage": 25.38, "elapsed_time": "3:53:38", "remaining_time": "11:26:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6420, "total_steps": 25254, "loss": 0.147, "learning_rate": 4.369345736598826e-05, "epoch": 0.7626514611546685, "percentage": 25.42, "elapsed_time": "3:54:00", "remaining_time": "11:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6430, "total_steps": 25254, "loss": 0.1514, "learning_rate": 4.3672152836162926e-05, "epoch": 0.7638393917795201, "percentage": 25.46, "elapsed_time": "3:54:22", "remaining_time": "11:26:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6440, "total_steps": 25254, "loss": 0.1501, "learning_rate": 4.3650817594646374e-05, "epoch": 0.7650273224043715, "percentage": 25.5, "elapsed_time": "3:54:44", "remaining_time": "11:25:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6450, "total_steps": 25254, "loss": 0.1479, "learning_rate": 4.3629451676530506e-05, "epoch": 0.7662152530292231, "percentage": 25.54, "elapsed_time": "3:55:06", "remaining_time": "11:25:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6460, "total_steps": 25254, "loss": 0.1465, "learning_rate": 4.360805511695768e-05, "epoch": 0.7674031836540746, "percentage": 25.58, "elapsed_time": "3:55:29", "remaining_time": "11:25:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6470, "total_steps": 25254, "loss": 0.1511, "learning_rate": 4.3586627951120646e-05, "epoch": 0.7685911142789261, "percentage": 25.62, "elapsed_time": "3:55:51", "remaining_time": "11:24:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6480, "total_steps": 25254, "loss": 0.152, "learning_rate": 4.35651702142625e-05, "epoch": 0.7697790449037776, "percentage": 25.66, "elapsed_time": "3:56:13", "remaining_time": "11:24:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6490, "total_steps": 25254, "loss": 0.1521, "learning_rate": 4.354368194167664e-05, "epoch": 0.7709669755286291, "percentage": 25.7, "elapsed_time": "3:56:34", "remaining_time": "11:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6500, "total_steps": 25254, "loss": 0.1503, "learning_rate": 4.352216316870664e-05, "epoch": 0.7721549061534806, "percentage": 25.74, "elapsed_time": "3:56:55", "remaining_time": "11:23:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6510, "total_steps": 25254, "loss": 0.1497, "learning_rate": 4.35006139307463e-05, "epoch": 0.7733428367783322, "percentage": 25.78, "elapsed_time": "3:57:17", "remaining_time": "11:23:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6520, "total_steps": 25254, "loss": 0.1478, "learning_rate": 4.347903426323949e-05, "epoch": 0.7745307674031836, "percentage": 25.82, "elapsed_time": "3:57:38", "remaining_time": "11:22:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6530, "total_steps": 25254, "loss": 0.1487, "learning_rate": 4.3457424201680145e-05, "epoch": 0.7757186980280352, "percentage": 25.86, "elapsed_time": "3:58:01", "remaining_time": "11:22:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6540, "total_steps": 25254, "loss": 0.1473, "learning_rate": 4.343578378161217e-05, "epoch": 0.7769066286528866, "percentage": 25.9, "elapsed_time": "3:58:22", "remaining_time": "11:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6550, "total_steps": 25254, "loss": 0.1439, "learning_rate": 4.3414113038629436e-05, "epoch": 0.7780945592777382, "percentage": 25.94, "elapsed_time": "3:58:44", "remaining_time": "11:21:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6560, "total_steps": 25254, "loss": 0.1517, "learning_rate": 4.339241200837567e-05, "epoch": 0.7792824899025896, "percentage": 25.98, "elapsed_time": "3:59:06", "remaining_time": "11:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6570, "total_steps": 25254, "loss": 0.1508, "learning_rate": 4.337068072654441e-05, "epoch": 0.7804704205274412, "percentage": 26.02, "elapsed_time": "3:59:28", "remaining_time": "11:21:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6580, "total_steps": 25254, "loss": 0.1513, "learning_rate": 4.334891922887897e-05, "epoch": 0.7816583511522927, "percentage": 26.06, "elapsed_time": "3:59:49", "remaining_time": "11:20:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6590, "total_steps": 25254, "loss": 0.1489, "learning_rate": 4.332712755117234e-05, "epoch": 0.7828462817771442, "percentage": 26.09, "elapsed_time": "4:00:12", "remaining_time": "11:20:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6600, "total_steps": 25254, "loss": 0.1472, "learning_rate": 4.330530572926718e-05, "epoch": 0.7840342124019958, "percentage": 26.13, "elapsed_time": "4:00:33", "remaining_time": "11:19:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6610, "total_steps": 25254, "loss": 0.1495, "learning_rate": 4.3283453799055684e-05, "epoch": 0.7852221430268472, "percentage": 26.17, "elapsed_time": "4:00:55", "remaining_time": "11:19:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6620, "total_steps": 25254, "loss": 0.1498, "learning_rate": 4.3261571796479615e-05, "epoch": 0.7864100736516988, "percentage": 26.21, "elapsed_time": "4:01:16", "remaining_time": "11:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6630, "total_steps": 25254, "loss": 0.1473, "learning_rate": 4.323965975753018e-05, "epoch": 0.7875980042765502, "percentage": 26.25, "elapsed_time": "4:01:39", "remaining_time": "11:18:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6640, "total_steps": 25254, "loss": 0.1533, "learning_rate": 4.321771771824798e-05, "epoch": 0.7887859349014018, "percentage": 26.29, "elapsed_time": "4:02:00", "remaining_time": "11:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6650, "total_steps": 25254, "loss": 0.1462, "learning_rate": 4.319574571472298e-05, "epoch": 0.7899738655262533, "percentage": 26.33, "elapsed_time": "4:02:22", "remaining_time": "11:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6660, "total_steps": 25254, "loss": 0.1511, "learning_rate": 4.317374378309441e-05, "epoch": 0.7911617961511048, "percentage": 26.37, "elapsed_time": "4:02:43", "remaining_time": "11:17:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6670, "total_steps": 25254, "loss": 0.1492, "learning_rate": 4.3151711959550736e-05, "epoch": 0.7923497267759563, "percentage": 26.41, "elapsed_time": "4:03:05", "remaining_time": "11:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6680, "total_steps": 25254, "loss": 0.1522, "learning_rate": 4.3129650280329584e-05, "epoch": 0.7935376574008078, "percentage": 26.45, "elapsed_time": "4:03:27", "remaining_time": "11:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6690, "total_steps": 25254, "loss": 0.1484, "learning_rate": 4.3107558781717693e-05, "epoch": 0.7947255880256593, "percentage": 26.49, "elapsed_time": "4:03:49", "remaining_time": "11:16:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6700, "total_steps": 25254, "loss": 0.1524, "learning_rate": 4.3085437500050854e-05, "epoch": 0.7959135186505109, "percentage": 26.53, "elapsed_time": "4:04:12", "remaining_time": "11:16:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6710, "total_steps": 25254, "loss": 0.1509, "learning_rate": 4.306328647171383e-05, "epoch": 0.7971014492753623, "percentage": 26.57, "elapsed_time": "4:04:34", "remaining_time": "11:15:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6720, "total_steps": 25254, "loss": 0.1481, "learning_rate": 4.3041105733140305e-05, "epoch": 0.7982893799002139, "percentage": 26.61, "elapsed_time": "4:04:56", "remaining_time": "11:15:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6730, "total_steps": 25254, "loss": 0.1486, "learning_rate": 4.301889532081285e-05, "epoch": 0.7994773105250653, "percentage": 26.65, "elapsed_time": "4:05:18", "remaining_time": "11:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6740, "total_steps": 25254, "loss": 0.144, "learning_rate": 4.299665527126285e-05, "epoch": 0.8006652411499169, "percentage": 26.69, "elapsed_time": "4:05:40", "remaining_time": "11:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6750, "total_steps": 25254, "loss": 0.1524, "learning_rate": 4.29743856210704e-05, "epoch": 0.8018531717747683, "percentage": 26.73, "elapsed_time": "4:06:02", "remaining_time": "11:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6760, "total_steps": 25254, "loss": 0.1486, "learning_rate": 4.295208640686432e-05, "epoch": 0.8030411023996199, "percentage": 26.77, "elapsed_time": "4:06:23", "remaining_time": "11:14:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6770, "total_steps": 25254, "loss": 0.1507, "learning_rate": 4.292975766532204e-05, "epoch": 0.8042290330244714, "percentage": 26.81, "elapsed_time": "4:06:45", "remaining_time": "11:13:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6780, "total_steps": 25254, "loss": 0.1465, "learning_rate": 4.290739943316954e-05, "epoch": 0.8054169636493229, "percentage": 26.85, "elapsed_time": "4:07:07", "remaining_time": "11:13:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6790, "total_steps": 25254, "loss": 0.1494, "learning_rate": 4.2885011747181326e-05, "epoch": 0.8066048942741744, "percentage": 26.89, "elapsed_time": "4:07:29", "remaining_time": "11:13:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6800, "total_steps": 25254, "loss": 0.1491, "learning_rate": 4.2862594644180356e-05, "epoch": 0.8077928248990259, "percentage": 26.93, "elapsed_time": "4:07:51", "remaining_time": "11:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6810, "total_steps": 25254, "loss": 0.1476, "learning_rate": 4.2840148161037966e-05, "epoch": 0.8089807555238774, "percentage": 26.97, "elapsed_time": "4:08:13", "remaining_time": "11:12:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6820, "total_steps": 25254, "loss": 0.1467, "learning_rate": 4.2817672334673795e-05, "epoch": 0.810168686148729, "percentage": 27.01, "elapsed_time": "4:08:34", "remaining_time": "11:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6830, "total_steps": 25254, "loss": 0.1467, "learning_rate": 4.279516720205577e-05, "epoch": 0.8113566167735804, "percentage": 27.05, "elapsed_time": "4:08:56", "remaining_time": "11:11:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6840, "total_steps": 25254, "loss": 0.148, "learning_rate": 4.277263280020002e-05, "epoch": 0.812544547398432, "percentage": 27.08, "elapsed_time": "4:09:18", "remaining_time": "11:11:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6850, "total_steps": 25254, "loss": 0.151, "learning_rate": 4.275006916617079e-05, "epoch": 0.8137324780232834, "percentage": 27.12, "elapsed_time": "4:09:40", "remaining_time": "11:10:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6860, "total_steps": 25254, "loss": 0.1467, "learning_rate": 4.272747633708044e-05, "epoch": 0.814920408648135, "percentage": 27.16, "elapsed_time": "4:10:01", "remaining_time": "11:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6870, "total_steps": 25254, "loss": 0.1481, "learning_rate": 4.2704854350089335e-05, "epoch": 0.8161083392729864, "percentage": 27.2, "elapsed_time": "4:10:23", "remaining_time": "11:10:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6880, "total_steps": 25254, "loss": 0.149, "learning_rate": 4.268220324240579e-05, "epoch": 0.817296269897838, "percentage": 27.24, "elapsed_time": "4:10:45", "remaining_time": "11:09:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6890, "total_steps": 25254, "loss": 0.1498, "learning_rate": 4.265952305128602e-05, "epoch": 0.8184842005226894, "percentage": 27.28, "elapsed_time": "4:11:06", "remaining_time": "11:09:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6900, "total_steps": 25254, "loss": 0.1513, "learning_rate": 4.2636813814034096e-05, "epoch": 0.819672131147541, "percentage": 27.32, "elapsed_time": "4:11:28", "remaining_time": "11:08:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6910, "total_steps": 25254, "loss": 0.1498, "learning_rate": 4.261407556800183e-05, "epoch": 0.8208600617723925, "percentage": 27.36, "elapsed_time": "4:11:50", "remaining_time": "11:08:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6920, "total_steps": 25254, "loss": 0.1479, "learning_rate": 4.2591308350588775e-05, "epoch": 0.822047992397244, "percentage": 27.4, "elapsed_time": "4:12:12", "remaining_time": "11:08:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6930, "total_steps": 25254, "loss": 0.1449, "learning_rate": 4.2568512199242136e-05, "epoch": 0.8232359230220955, "percentage": 27.44, "elapsed_time": "4:12:34", "remaining_time": "11:07:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6940, "total_steps": 25254, "loss": 0.1512, "learning_rate": 4.254568715145668e-05, "epoch": 0.824423853646947, "percentage": 27.48, "elapsed_time": "4:12:55", "remaining_time": "11:07:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6950, "total_steps": 25254, "loss": 0.1491, "learning_rate": 4.252283324477473e-05, "epoch": 0.8256117842717985, "percentage": 27.52, "elapsed_time": "4:13:17", "remaining_time": "11:07:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6960, "total_steps": 25254, "loss": 0.1509, "learning_rate": 4.2499950516786056e-05, "epoch": 0.82679971489665, "percentage": 27.56, "elapsed_time": "4:13:38", "remaining_time": "11:06:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6970, "total_steps": 25254, "loss": 0.1463, "learning_rate": 4.247703900512786e-05, "epoch": 0.8279876455215015, "percentage": 27.6, "elapsed_time": "4:14:00", "remaining_time": "11:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6980, "total_steps": 25254, "loss": 0.1491, "learning_rate": 4.2454098747484674e-05, "epoch": 0.8291755761463531, "percentage": 27.64, "elapsed_time": "4:14:23", "remaining_time": "11:05:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 6990, "total_steps": 25254, "loss": 0.1436, "learning_rate": 4.2431129781588275e-05, "epoch": 0.8303635067712045, "percentage": 27.68, "elapsed_time": "4:14:44", "remaining_time": "11:05:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7000, "total_steps": 25254, "loss": 0.1473, "learning_rate": 4.240813214521772e-05, "epoch": 0.8315514373960561, "percentage": 27.72, "elapsed_time": "4:15:06", "remaining_time": "11:05:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7010, "total_steps": 25254, "loss": 0.1471, "learning_rate": 4.2385105876199194e-05, "epoch": 0.8327393680209075, "percentage": 27.76, "elapsed_time": "4:15:28", "remaining_time": "11:04:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7020, "total_steps": 25254, "loss": 0.1524, "learning_rate": 4.2362051012405954e-05, "epoch": 0.8339272986457591, "percentage": 27.8, "elapsed_time": "4:15:50", "remaining_time": "11:04:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7030, "total_steps": 25254, "loss": 0.1503, "learning_rate": 4.233896759175834e-05, "epoch": 0.8351152292706105, "percentage": 27.84, "elapsed_time": "4:16:11", "remaining_time": "11:04:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7040, "total_steps": 25254, "loss": 0.1438, "learning_rate": 4.231585565222361e-05, "epoch": 0.8363031598954621, "percentage": 27.88, "elapsed_time": "4:16:33", "remaining_time": "11:03:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7050, "total_steps": 25254, "loss": 0.1491, "learning_rate": 4.2292715231815974e-05, "epoch": 0.8374910905203136, "percentage": 27.92, "elapsed_time": "4:16:55", "remaining_time": "11:03:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7060, "total_steps": 25254, "loss": 0.1451, "learning_rate": 4.226954636859644e-05, "epoch": 0.8386790211451651, "percentage": 27.96, "elapsed_time": "4:17:18", "remaining_time": "11:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7070, "total_steps": 25254, "loss": 0.1494, "learning_rate": 4.224634910067285e-05, "epoch": 0.8398669517700166, "percentage": 28.0, "elapsed_time": "4:17:40", "remaining_time": "11:02:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7080, "total_steps": 25254, "loss": 0.1493, "learning_rate": 4.222312346619973e-05, "epoch": 0.8410548823948681, "percentage": 28.04, "elapsed_time": "4:18:02", "remaining_time": "11:02:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7090, "total_steps": 25254, "loss": 0.1438, "learning_rate": 4.219986950337826e-05, "epoch": 0.8422428130197196, "percentage": 28.07, "elapsed_time": "4:18:24", "remaining_time": "11:02:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7100, "total_steps": 25254, "loss": 0.1467, "learning_rate": 4.2176587250456255e-05, "epoch": 0.8434307436445712, "percentage": 28.11, "elapsed_time": "4:18:45", "remaining_time": "11:01:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7110, "total_steps": 25254, "loss": 0.1427, "learning_rate": 4.215327674572802e-05, "epoch": 0.8446186742694227, "percentage": 28.15, "elapsed_time": "4:19:07", "remaining_time": "11:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7120, "total_steps": 25254, "loss": 0.1467, "learning_rate": 4.212993802753433e-05, "epoch": 0.8458066048942742, "percentage": 28.19, "elapsed_time": "4:19:29", "remaining_time": "11:00:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7130, "total_steps": 25254, "loss": 0.1496, "learning_rate": 4.210657113426239e-05, "epoch": 0.8469945355191257, "percentage": 28.23, "elapsed_time": "4:19:51", "remaining_time": "11:00:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7140, "total_steps": 25254, "loss": 0.1494, "learning_rate": 4.2083176104345736e-05, "epoch": 0.8481824661439772, "percentage": 28.27, "elapsed_time": "4:20:13", "remaining_time": "11:00:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7150, "total_steps": 25254, "loss": 0.1462, "learning_rate": 4.205975297626416e-05, "epoch": 0.8493703967688288, "percentage": 28.31, "elapsed_time": "4:20:34", "remaining_time": "10:59:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7160, "total_steps": 25254, "loss": 0.1484, "learning_rate": 4.203630178854371e-05, "epoch": 0.8505583273936802, "percentage": 28.35, "elapsed_time": "4:20:56", "remaining_time": "10:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7170, "total_steps": 25254, "loss": 0.147, "learning_rate": 4.201282257975656e-05, "epoch": 0.8517462580185318, "percentage": 28.39, "elapsed_time": "4:21:18", "remaining_time": "10:59:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7180, "total_steps": 25254, "loss": 0.1473, "learning_rate": 4.198931538852098e-05, "epoch": 0.8529341886433832, "percentage": 28.43, "elapsed_time": "4:21:39", "remaining_time": "10:58:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7190, "total_steps": 25254, "loss": 0.1481, "learning_rate": 4.1965780253501256e-05, "epoch": 0.8541221192682348, "percentage": 28.47, "elapsed_time": "4:22:01", "remaining_time": "10:58:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7200, "total_steps": 25254, "loss": 0.149, "learning_rate": 4.194221721340765e-05, "epoch": 0.8553100498930862, "percentage": 28.51, "elapsed_time": "4:22:23", "remaining_time": "10:57:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7210, "total_steps": 25254, "loss": 0.1443, "learning_rate": 4.191862630699631e-05, "epoch": 0.8564979805179378, "percentage": 28.55, "elapsed_time": "4:22:44", "remaining_time": "10:57:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7220, "total_steps": 25254, "loss": 0.1501, "learning_rate": 4.189500757306923e-05, "epoch": 0.8576859111427892, "percentage": 28.59, "elapsed_time": "4:23:07", "remaining_time": "10:57:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7230, "total_steps": 25254, "loss": 0.1456, "learning_rate": 4.1871361050474165e-05, "epoch": 0.8588738417676408, "percentage": 28.63, "elapsed_time": "4:23:28", "remaining_time": "10:56:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7240, "total_steps": 25254, "loss": 0.147, "learning_rate": 4.1847686778104575e-05, "epoch": 0.8600617723924923, "percentage": 28.67, "elapsed_time": "4:23:50", "remaining_time": "10:56:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7250, "total_steps": 25254, "loss": 0.1474, "learning_rate": 4.1823984794899575e-05, "epoch": 0.8612497030173438, "percentage": 28.71, "elapsed_time": "4:24:12", "remaining_time": "10:56:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7260, "total_steps": 25254, "loss": 0.1493, "learning_rate": 4.1800255139843836e-05, "epoch": 0.8624376336421953, "percentage": 28.75, "elapsed_time": "4:24:34", "remaining_time": "10:55:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7270, "total_steps": 25254, "loss": 0.146, "learning_rate": 4.177649785196757e-05, "epoch": 0.8636255642670468, "percentage": 28.79, "elapsed_time": "4:24:55", "remaining_time": "10:55:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7280, "total_steps": 25254, "loss": 0.1496, "learning_rate": 4.175271297034642e-05, "epoch": 0.8648134948918983, "percentage": 28.83, "elapsed_time": "4:25:17", "remaining_time": "10:55:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7290, "total_steps": 25254, "loss": 0.1477, "learning_rate": 4.1728900534101415e-05, "epoch": 0.8660014255167499, "percentage": 28.87, "elapsed_time": "4:25:39", "remaining_time": "10:54:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7300, "total_steps": 25254, "loss": 0.1455, "learning_rate": 4.170506058239893e-05, "epoch": 0.8671893561416013, "percentage": 28.91, "elapsed_time": "4:26:00", "remaining_time": "10:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7310, "total_steps": 25254, "loss": 0.1457, "learning_rate": 4.1681193154450546e-05, "epoch": 0.8683772867664529, "percentage": 28.95, "elapsed_time": "4:26:22", "remaining_time": "10:53:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7320, "total_steps": 25254, "loss": 0.1459, "learning_rate": 4.1657298289513096e-05, "epoch": 0.8695652173913043, "percentage": 28.99, "elapsed_time": "4:26:44", "remaining_time": "10:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7330, "total_steps": 25254, "loss": 0.1465, "learning_rate": 4.163337602688851e-05, "epoch": 0.8707531480161559, "percentage": 29.03, "elapsed_time": "4:27:05", "remaining_time": "10:53:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7340, "total_steps": 25254, "loss": 0.1484, "learning_rate": 4.160942640592378e-05, "epoch": 0.8719410786410073, "percentage": 29.06, "elapsed_time": "4:27:28", "remaining_time": "10:52:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7350, "total_steps": 25254, "loss": 0.1477, "learning_rate": 4.158544946601091e-05, "epoch": 0.8731290092658589, "percentage": 29.1, "elapsed_time": "4:27:50", "remaining_time": "10:52:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7360, "total_steps": 25254, "loss": 0.1466, "learning_rate": 4.15614452465868e-05, "epoch": 0.8743169398907104, "percentage": 29.14, "elapsed_time": "4:28:11", "remaining_time": "10:52:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7370, "total_steps": 25254, "loss": 0.1469, "learning_rate": 4.153741378713329e-05, "epoch": 0.8755048705155619, "percentage": 29.18, "elapsed_time": "4:28:34", "remaining_time": "10:51:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7380, "total_steps": 25254, "loss": 0.1496, "learning_rate": 4.151335512717696e-05, "epoch": 0.8766928011404134, "percentage": 29.22, "elapsed_time": "4:28:56", "remaining_time": "10:51:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7390, "total_steps": 25254, "loss": 0.1493, "learning_rate": 4.148926930628915e-05, "epoch": 0.8778807317652649, "percentage": 29.26, "elapsed_time": "4:29:18", "remaining_time": "10:50:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7400, "total_steps": 25254, "loss": 0.1458, "learning_rate": 4.146515636408589e-05, "epoch": 0.8790686623901164, "percentage": 29.3, "elapsed_time": "4:29:40", "remaining_time": "10:50:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7410, "total_steps": 25254, "loss": 0.1498, "learning_rate": 4.144101634022779e-05, "epoch": 0.880256593014968, "percentage": 29.34, "elapsed_time": "4:30:02", "remaining_time": "10:50:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7420, "total_steps": 25254, "loss": 0.145, "learning_rate": 4.1416849274420013e-05, "epoch": 0.8814445236398194, "percentage": 29.38, "elapsed_time": "4:30:24", "remaining_time": "10:49:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7430, "total_steps": 25254, "loss": 0.1506, "learning_rate": 4.1392655206412223e-05, "epoch": 0.882632454264671, "percentage": 29.42, "elapsed_time": "4:30:46", "remaining_time": "10:49:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7440, "total_steps": 25254, "loss": 0.1484, "learning_rate": 4.136843417599846e-05, "epoch": 0.8838203848895224, "percentage": 29.46, "elapsed_time": "4:31:08", "remaining_time": "10:49:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7450, "total_steps": 25254, "loss": 0.1445, "learning_rate": 4.1344186223017146e-05, "epoch": 0.885008315514374, "percentage": 29.5, "elapsed_time": "4:31:30", "remaining_time": "10:48:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7460, "total_steps": 25254, "loss": 0.1417, "learning_rate": 4.131991138735096e-05, "epoch": 0.8861962461392254, "percentage": 29.54, "elapsed_time": "4:31:52", "remaining_time": "10:48:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7470, "total_steps": 25254, "loss": 0.1458, "learning_rate": 4.1295609708926817e-05, "epoch": 0.887384176764077, "percentage": 29.58, "elapsed_time": "4:32:14", "remaining_time": "10:48:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7480, "total_steps": 25254, "loss": 0.1445, "learning_rate": 4.1271281227715755e-05, "epoch": 0.8885721073889284, "percentage": 29.62, "elapsed_time": "4:32:35", "remaining_time": "10:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7490, "total_steps": 25254, "loss": 0.142, "learning_rate": 4.124692598373292e-05, "epoch": 0.88976003801378, "percentage": 29.66, "elapsed_time": "4:32:57", "remaining_time": "10:47:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7500, "total_steps": 25254, "loss": 0.1477, "learning_rate": 4.122254401703748e-05, "epoch": 0.8909479686386315, "percentage": 29.7, "elapsed_time": "4:33:19", "remaining_time": "10:47:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7510, "total_steps": 25254, "loss": 0.1424, "learning_rate": 4.1198135367732534e-05, "epoch": 0.892135899263483, "percentage": 29.74, "elapsed_time": "4:33:41", "remaining_time": "10:46:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7520, "total_steps": 25254, "loss": 0.1466, "learning_rate": 4.117370007596508e-05, "epoch": 0.8933238298883345, "percentage": 29.78, "elapsed_time": "4:34:04", "remaining_time": "10:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7530, "total_steps": 25254, "loss": 0.1488, "learning_rate": 4.114923818192595e-05, "epoch": 0.894511760513186, "percentage": 29.82, "elapsed_time": "4:34:25", "remaining_time": "10:45:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7540, "total_steps": 25254, "loss": 0.1496, "learning_rate": 4.112474972584972e-05, "epoch": 0.8956996911380375, "percentage": 29.86, "elapsed_time": "4:34:48", "remaining_time": "10:45:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7550, "total_steps": 25254, "loss": 0.1455, "learning_rate": 4.110023474801465e-05, "epoch": 0.896887621762889, "percentage": 29.9, "elapsed_time": "4:35:09", "remaining_time": "10:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7560, "total_steps": 25254, "loss": 0.1456, "learning_rate": 4.107569328874261e-05, "epoch": 0.8980755523877405, "percentage": 29.94, "elapsed_time": "4:35:31", "remaining_time": "10:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7570, "total_steps": 25254, "loss": 0.1459, "learning_rate": 4.105112538839907e-05, "epoch": 0.8992634830125921, "percentage": 29.98, "elapsed_time": "4:35:53", "remaining_time": "10:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7580, "total_steps": 25254, "loss": 0.1489, "learning_rate": 4.1026531087392945e-05, "epoch": 0.9004514136374435, "percentage": 30.02, "elapsed_time": "4:36:15", "remaining_time": "10:44:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7590, "total_steps": 25254, "loss": 0.1454, "learning_rate": 4.1001910426176596e-05, "epoch": 0.9016393442622951, "percentage": 30.05, "elapsed_time": "4:36:37", "remaining_time": "10:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7600, "total_steps": 25254, "loss": 0.1438, "learning_rate": 4.097726344524574e-05, "epoch": 0.9028272748871465, "percentage": 30.09, "elapsed_time": "4:36:58", "remaining_time": "10:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7610, "total_steps": 25254, "loss": 0.1432, "learning_rate": 4.095259018513937e-05, "epoch": 0.9040152055119981, "percentage": 30.13, "elapsed_time": "4:37:19", "remaining_time": "10:43:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7620, "total_steps": 25254, "loss": 0.1432, "learning_rate": 4.0927890686439726e-05, "epoch": 0.9052031361368497, "percentage": 30.17, "elapsed_time": "4:37:41", "remaining_time": "10:42:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7630, "total_steps": 25254, "loss": 0.1461, "learning_rate": 4.090316498977218e-05, "epoch": 0.9063910667617011, "percentage": 30.21, "elapsed_time": "4:38:04", "remaining_time": "10:42:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7640, "total_steps": 25254, "loss": 0.1482, "learning_rate": 4.087841313580521e-05, "epoch": 0.9075789973865527, "percentage": 30.25, "elapsed_time": "4:38:25", "remaining_time": "10:41:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7650, "total_steps": 25254, "loss": 0.148, "learning_rate": 4.085363516525033e-05, "epoch": 0.9087669280114041, "percentage": 30.29, "elapsed_time": "4:38:47", "remaining_time": "10:41:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7660, "total_steps": 25254, "loss": 0.1456, "learning_rate": 4.082883111886197e-05, "epoch": 0.9099548586362557, "percentage": 30.33, "elapsed_time": "4:39:09", "remaining_time": "10:41:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7670, "total_steps": 25254, "loss": 0.1491, "learning_rate": 4.0804001037437474e-05, "epoch": 0.9111427892611071, "percentage": 30.37, "elapsed_time": "4:39:31", "remaining_time": "10:40:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7680, "total_steps": 25254, "loss": 0.1458, "learning_rate": 4.0779144961817015e-05, "epoch": 0.9123307198859587, "percentage": 30.41, "elapsed_time": "4:39:53", "remaining_time": "10:40:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7690, "total_steps": 25254, "loss": 0.1417, "learning_rate": 4.075426293288351e-05, "epoch": 0.9135186505108102, "percentage": 30.45, "elapsed_time": "4:40:14", "remaining_time": "10:40:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7700, "total_steps": 25254, "loss": 0.1418, "learning_rate": 4.072935499156257e-05, "epoch": 0.9147065811356617, "percentage": 30.49, "elapsed_time": "4:40:36", "remaining_time": "10:39:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7710, "total_steps": 25254, "loss": 0.1477, "learning_rate": 4.070442117882242e-05, "epoch": 0.9158945117605132, "percentage": 30.53, "elapsed_time": "4:40:57", "remaining_time": "10:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7720, "total_steps": 25254, "loss": 0.1436, "learning_rate": 4.0679461535673837e-05, "epoch": 0.9170824423853647, "percentage": 30.57, "elapsed_time": "4:41:19", "remaining_time": "10:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7730, "total_steps": 25254, "loss": 0.147, "learning_rate": 4.0654476103170086e-05, "epoch": 0.9182703730102162, "percentage": 30.61, "elapsed_time": "4:41:41", "remaining_time": "10:38:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7740, "total_steps": 25254, "loss": 0.1473, "learning_rate": 4.0629464922406854e-05, "epoch": 0.9194583036350678, "percentage": 30.65, "elapsed_time": "4:42:02", "remaining_time": "10:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7750, "total_steps": 25254, "loss": 0.1484, "learning_rate": 4.060442803452218e-05, "epoch": 0.9206462342599192, "percentage": 30.69, "elapsed_time": "4:42:24", "remaining_time": "10:37:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7760, "total_steps": 25254, "loss": 0.1451, "learning_rate": 4.057936548069637e-05, "epoch": 0.9218341648847708, "percentage": 30.73, "elapsed_time": "4:42:45", "remaining_time": "10:37:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7770, "total_steps": 25254, "loss": 0.1475, "learning_rate": 4.055427730215197e-05, "epoch": 0.9230220955096222, "percentage": 30.77, "elapsed_time": "4:43:07", "remaining_time": "10:37:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7780, "total_steps": 25254, "loss": 0.1475, "learning_rate": 4.0529163540153646e-05, "epoch": 0.9242100261344738, "percentage": 30.81, "elapsed_time": "4:43:29", "remaining_time": "10:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7790, "total_steps": 25254, "loss": 0.1472, "learning_rate": 4.0504024236008156e-05, "epoch": 0.9253979567593252, "percentage": 30.85, "elapsed_time": "4:43:50", "remaining_time": "10:36:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7800, "total_steps": 25254, "loss": 0.1452, "learning_rate": 4.047885943106428e-05, "epoch": 0.9265858873841768, "percentage": 30.89, "elapsed_time": "4:44:12", "remaining_time": "10:35:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7810, "total_steps": 25254, "loss": 0.1425, "learning_rate": 4.0453669166712724e-05, "epoch": 0.9277738180090283, "percentage": 30.93, "elapsed_time": "4:44:34", "remaining_time": "10:35:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7820, "total_steps": 25254, "loss": 0.1447, "learning_rate": 4.0428453484386076e-05, "epoch": 0.9289617486338798, "percentage": 30.97, "elapsed_time": "4:44:55", "remaining_time": "10:35:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7830, "total_steps": 25254, "loss": 0.1456, "learning_rate": 4.040321242555874e-05, "epoch": 0.9301496792587313, "percentage": 31.0, "elapsed_time": "4:45:17", "remaining_time": "10:34:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7840, "total_steps": 25254, "loss": 0.1423, "learning_rate": 4.037794603174684e-05, "epoch": 0.9313376098835828, "percentage": 31.04, "elapsed_time": "4:45:39", "remaining_time": "10:34:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7850, "total_steps": 25254, "loss": 0.1438, "learning_rate": 4.035265434450818e-05, "epoch": 0.9325255405084343, "percentage": 31.08, "elapsed_time": "4:46:00", "remaining_time": "10:34:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7860, "total_steps": 25254, "loss": 0.1431, "learning_rate": 4.032733740544217e-05, "epoch": 0.9337134711332858, "percentage": 31.12, "elapsed_time": "4:46:22", "remaining_time": "10:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7870, "total_steps": 25254, "loss": 0.1456, "learning_rate": 4.030199525618976e-05, "epoch": 0.9349014017581373, "percentage": 31.16, "elapsed_time": "4:46:44", "remaining_time": "10:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7880, "total_steps": 25254, "loss": 0.1499, "learning_rate": 4.027662793843334e-05, "epoch": 0.9360893323829889, "percentage": 31.2, "elapsed_time": "4:47:05", "remaining_time": "10:32:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7890, "total_steps": 25254, "loss": 0.1502, "learning_rate": 4.0251235493896733e-05, "epoch": 0.9372772630078403, "percentage": 31.24, "elapsed_time": "4:47:27", "remaining_time": "10:32:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7900, "total_steps": 25254, "loss": 0.1437, "learning_rate": 4.0225817964345056e-05, "epoch": 0.9384651936326919, "percentage": 31.28, "elapsed_time": "4:47:50", "remaining_time": "10:32:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7910, "total_steps": 25254, "loss": 0.1448, "learning_rate": 4.02003753915847e-05, "epoch": 0.9396531242575433, "percentage": 31.32, "elapsed_time": "4:48:11", "remaining_time": "10:31:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7920, "total_steps": 25254, "loss": 0.146, "learning_rate": 4.017490781746325e-05, "epoch": 0.9408410548823949, "percentage": 31.36, "elapsed_time": "4:48:33", "remaining_time": "10:31:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7930, "total_steps": 25254, "loss": 0.1437, "learning_rate": 4.0149415283869404e-05, "epoch": 0.9420289855072463, "percentage": 31.4, "elapsed_time": "4:48:55", "remaining_time": "10:31:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7940, "total_steps": 25254, "loss": 0.1482, "learning_rate": 4.012389783273293e-05, "epoch": 0.9432169161320979, "percentage": 31.44, "elapsed_time": "4:49:17", "remaining_time": "10:30:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7950, "total_steps": 25254, "loss": 0.1452, "learning_rate": 4.009835550602456e-05, "epoch": 0.9444048467569494, "percentage": 31.48, "elapsed_time": "4:49:39", "remaining_time": "10:30:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7960, "total_steps": 25254, "loss": 0.1421, "learning_rate": 4.0072788345755956e-05, "epoch": 0.9455927773818009, "percentage": 31.52, "elapsed_time": "4:50:01", "remaining_time": "10:30:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7970, "total_steps": 25254, "loss": 0.1441, "learning_rate": 4.0047196393979616e-05, "epoch": 0.9467807080066524, "percentage": 31.56, "elapsed_time": "4:50:23", "remaining_time": "10:29:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7980, "total_steps": 25254, "loss": 0.1448, "learning_rate": 4.0021579692788816e-05, "epoch": 0.9479686386315039, "percentage": 31.6, "elapsed_time": "4:50:45", "remaining_time": "10:29:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 7990, "total_steps": 25254, "loss": 0.147, "learning_rate": 3.999593828431754e-05, "epoch": 0.9491565692563554, "percentage": 31.64, "elapsed_time": "4:51:06", "remaining_time": "10:29:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8000, "total_steps": 25254, "loss": 0.146, "learning_rate": 3.997027221074041e-05, "epoch": 0.950344499881207, "percentage": 31.68, "elapsed_time": "4:51:28", "remaining_time": "10:28:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8010, "total_steps": 25254, "loss": 0.1447, "learning_rate": 3.994458151427263e-05, "epoch": 0.9515324305060584, "percentage": 31.72, "elapsed_time": "4:51:50", "remaining_time": "10:28:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8020, "total_steps": 25254, "loss": 0.1457, "learning_rate": 3.991886623716988e-05, "epoch": 0.95272036113091, "percentage": 31.76, "elapsed_time": "4:52:13", "remaining_time": "10:27:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8030, "total_steps": 25254, "loss": 0.144, "learning_rate": 3.989312642172828e-05, "epoch": 0.9539082917557614, "percentage": 31.8, "elapsed_time": "4:52:34", "remaining_time": "10:27:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8040, "total_steps": 25254, "loss": 0.1474, "learning_rate": 3.9867362110284327e-05, "epoch": 0.955096222380613, "percentage": 31.84, "elapsed_time": "4:52:56", "remaining_time": "10:27:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8050, "total_steps": 25254, "loss": 0.1448, "learning_rate": 3.9841573345214784e-05, "epoch": 0.9562841530054644, "percentage": 31.88, "elapsed_time": "4:53:17", "remaining_time": "10:26:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8060, "total_steps": 25254, "loss": 0.1459, "learning_rate": 3.9815760168936645e-05, "epoch": 0.957472083630316, "percentage": 31.92, "elapsed_time": "4:53:39", "remaining_time": "10:26:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8070, "total_steps": 25254, "loss": 0.1461, "learning_rate": 3.9789922623907064e-05, "epoch": 0.9586600142551674, "percentage": 31.96, "elapsed_time": "4:54:01", "remaining_time": "10:26:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8080, "total_steps": 25254, "loss": 0.1449, "learning_rate": 3.976406075262324e-05, "epoch": 0.959847944880019, "percentage": 31.99, "elapsed_time": "4:54:24", "remaining_time": "10:25:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8090, "total_steps": 25254, "loss": 0.1448, "learning_rate": 3.973817459762244e-05, "epoch": 0.9610358755048705, "percentage": 32.03, "elapsed_time": "4:54:45", "remaining_time": "10:25:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8100, "total_steps": 25254, "loss": 0.1452, "learning_rate": 3.9712264201481834e-05, "epoch": 0.962223806129722, "percentage": 32.07, "elapsed_time": "4:55:06", "remaining_time": "10:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8110, "total_steps": 25254, "loss": 0.1463, "learning_rate": 3.9686329606818475e-05, "epoch": 0.9634117367545735, "percentage": 32.11, "elapsed_time": "4:55:27", "remaining_time": "10:24:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8120, "total_steps": 25254, "loss": 0.1437, "learning_rate": 3.966037085628921e-05, "epoch": 0.964599667379425, "percentage": 32.15, "elapsed_time": "4:55:49", "remaining_time": "10:24:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8130, "total_steps": 25254, "loss": 0.1479, "learning_rate": 3.9634387992590625e-05, "epoch": 0.9657875980042766, "percentage": 32.19, "elapsed_time": "4:56:10", "remaining_time": "10:23:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8140, "total_steps": 25254, "loss": 0.1452, "learning_rate": 3.960838105845897e-05, "epoch": 0.9669755286291281, "percentage": 32.23, "elapsed_time": "4:56:32", "remaining_time": "10:23:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8150, "total_steps": 25254, "loss": 0.1457, "learning_rate": 3.958235009667006e-05, "epoch": 0.9681634592539796, "percentage": 32.27, "elapsed_time": "4:56:54", "remaining_time": "10:23:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8160, "total_steps": 25254, "loss": 0.1459, "learning_rate": 3.955629515003927e-05, "epoch": 0.9693513898788311, "percentage": 32.31, "elapsed_time": "4:57:15", "remaining_time": "10:22:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8170, "total_steps": 25254, "loss": 0.1467, "learning_rate": 3.95302162614214e-05, "epoch": 0.9705393205036826, "percentage": 32.35, "elapsed_time": "4:57:37", "remaining_time": "10:22:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8180, "total_steps": 25254, "loss": 0.1431, "learning_rate": 3.950411347371064e-05, "epoch": 0.9717272511285341, "percentage": 32.39, "elapsed_time": "4:57:59", "remaining_time": "10:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8190, "total_steps": 25254, "loss": 0.1439, "learning_rate": 3.947798682984046e-05, "epoch": 0.9729151817533856, "percentage": 32.43, "elapsed_time": "4:58:22", "remaining_time": "10:21:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8200, "total_steps": 25254, "loss": 0.1473, "learning_rate": 3.945183637278364e-05, "epoch": 0.9741031123782371, "percentage": 32.47, "elapsed_time": "4:58:43", "remaining_time": "10:21:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8210, "total_steps": 25254, "loss": 0.143, "learning_rate": 3.942566214555203e-05, "epoch": 0.9752910430030887, "percentage": 32.51, "elapsed_time": "4:59:06", "remaining_time": "10:20:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8220, "total_steps": 25254, "loss": 0.1411, "learning_rate": 3.9399464191196643e-05, "epoch": 0.9764789736279401, "percentage": 32.55, "elapsed_time": "4:59:28", "remaining_time": "10:20:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8230, "total_steps": 25254, "loss": 0.1436, "learning_rate": 3.9373242552807514e-05, "epoch": 0.9776669042527917, "percentage": 32.59, "elapsed_time": "4:59:49", "remaining_time": "10:20:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8240, "total_steps": 25254, "loss": 0.1467, "learning_rate": 3.9346997273513606e-05, "epoch": 0.9788548348776431, "percentage": 32.63, "elapsed_time": "5:00:11", "remaining_time": "10:19:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8250, "total_steps": 25254, "loss": 0.1413, "learning_rate": 3.9320728396482795e-05, "epoch": 0.9800427655024947, "percentage": 32.67, "elapsed_time": "5:00:32", "remaining_time": "10:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8260, "total_steps": 25254, "loss": 0.1403, "learning_rate": 3.9294435964921736e-05, "epoch": 0.9812306961273461, "percentage": 32.71, "elapsed_time": "5:00:54", "remaining_time": "10:19:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8270, "total_steps": 25254, "loss": 0.1468, "learning_rate": 3.926812002207586e-05, "epoch": 0.9824186267521977, "percentage": 32.75, "elapsed_time": "5:01:15", "remaining_time": "10:18:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8280, "total_steps": 25254, "loss": 0.1465, "learning_rate": 3.924178061122926e-05, "epoch": 0.9836065573770492, "percentage": 32.79, "elapsed_time": "5:01:36", "remaining_time": "10:18:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8290, "total_steps": 25254, "loss": 0.1456, "learning_rate": 3.921541777570461e-05, "epoch": 0.9847944880019007, "percentage": 32.83, "elapsed_time": "5:01:58", "remaining_time": "10:17:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8300, "total_steps": 25254, "loss": 0.1447, "learning_rate": 3.918903155886314e-05, "epoch": 0.9859824186267522, "percentage": 32.87, "elapsed_time": "5:02:19", "remaining_time": "10:17:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8310, "total_steps": 25254, "loss": 0.1463, "learning_rate": 3.916262200410451e-05, "epoch": 0.9871703492516037, "percentage": 32.91, "elapsed_time": "5:02:41", "remaining_time": "10:17:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8320, "total_steps": 25254, "loss": 0.1431, "learning_rate": 3.9136189154866784e-05, "epoch": 0.9883582798764552, "percentage": 32.95, "elapsed_time": "5:03:04", "remaining_time": "10:16:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8330, "total_steps": 25254, "loss": 0.1441, "learning_rate": 3.9109733054626354e-05, "epoch": 0.9895462105013068, "percentage": 32.98, "elapsed_time": "5:03:26", "remaining_time": "10:16:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8340, "total_steps": 25254, "loss": 0.1428, "learning_rate": 3.908325374689781e-05, "epoch": 0.9907341411261582, "percentage": 33.02, "elapsed_time": "5:03:48", "remaining_time": "10:16:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8350, "total_steps": 25254, "loss": 0.143, "learning_rate": 3.905675127523396e-05, "epoch": 0.9919220717510098, "percentage": 33.06, "elapsed_time": "5:04:10", "remaining_time": "10:15:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8360, "total_steps": 25254, "loss": 0.1441, "learning_rate": 3.903022568322567e-05, "epoch": 0.9931100023758612, "percentage": 33.1, "elapsed_time": "5:04:32", "remaining_time": "10:15:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8370, "total_steps": 25254, "loss": 0.1455, "learning_rate": 3.900367701450189e-05, "epoch": 0.9942979330007128, "percentage": 33.14, "elapsed_time": "5:04:54", "remaining_time": "10:15:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8380, "total_steps": 25254, "loss": 0.1414, "learning_rate": 3.897710531272947e-05, "epoch": 0.9954858636255642, "percentage": 33.18, "elapsed_time": "5:05:16", "remaining_time": "10:14:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8390, "total_steps": 25254, "loss": 0.1433, "learning_rate": 3.895051062161316e-05, "epoch": 0.9966737942504158, "percentage": 33.22, "elapsed_time": "5:05:38", "remaining_time": "10:14:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8400, "total_steps": 25254, "loss": 0.1429, "learning_rate": 3.892389298489555e-05, "epoch": 0.9978617248752673, "percentage": 33.26, "elapsed_time": "5:06:00", "remaining_time": "10:13:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8410, "total_steps": 25254, "loss": 0.141, "learning_rate": 3.8897252446356934e-05, "epoch": 0.9990496555001188, "percentage": 33.3, "elapsed_time": "5:06:22", "remaining_time": "10:13:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8420, "total_steps": 25254, "loss": 0.14, "learning_rate": 3.88705890498153e-05, "epoch": 1.0002375861249704, "percentage": 33.34, "elapsed_time": "5:06:52", "remaining_time": "10:13:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8430, "total_steps": 25254, "loss": 0.1254, "learning_rate": 3.8843902839126215e-05, "epoch": 1.0014255167498218, "percentage": 33.38, "elapsed_time": "5:07:14", "remaining_time": "10:13:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8440, "total_steps": 25254, "loss": 0.125, "learning_rate": 3.881719385818279e-05, "epoch": 1.0026134473746733, "percentage": 33.42, "elapsed_time": "5:07:36", "remaining_time": "10:12:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8450, "total_steps": 25254, "loss": 0.1222, "learning_rate": 3.8790462150915566e-05, "epoch": 1.0038013779995247, "percentage": 33.46, "elapsed_time": "5:07:59", "remaining_time": "10:12:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8460, "total_steps": 25254, "loss": 0.1233, "learning_rate": 3.876370776129248e-05, "epoch": 1.0049893086243764, "percentage": 33.5, "elapsed_time": "5:08:20", "remaining_time": "10:12:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8470, "total_steps": 25254, "loss": 0.1244, "learning_rate": 3.873693073331877e-05, "epoch": 1.0061772392492279, "percentage": 33.54, "elapsed_time": "5:08:42", "remaining_time": "10:11:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8480, "total_steps": 25254, "loss": 0.1259, "learning_rate": 3.8710131111036904e-05, "epoch": 1.0073651698740793, "percentage": 33.58, "elapsed_time": "5:09:04", "remaining_time": "10:11:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8490, "total_steps": 25254, "loss": 0.1209, "learning_rate": 3.868330893852653e-05, "epoch": 1.0085531004989308, "percentage": 33.62, "elapsed_time": "5:09:26", "remaining_time": "10:11:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8500, "total_steps": 25254, "loss": 0.1256, "learning_rate": 3.8656464259904375e-05, "epoch": 1.0097410311237824, "percentage": 33.66, "elapsed_time": "5:09:47", "remaining_time": "10:10:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8510, "total_steps": 25254, "loss": 0.1232, "learning_rate": 3.862959711932418e-05, "epoch": 1.010928961748634, "percentage": 33.7, "elapsed_time": "5:10:09", "remaining_time": "10:10:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8520, "total_steps": 25254, "loss": 0.1242, "learning_rate": 3.860270756097663e-05, "epoch": 1.0121168923734853, "percentage": 33.74, "elapsed_time": "5:10:31", "remaining_time": "10:09:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8530, "total_steps": 25254, "loss": 0.1224, "learning_rate": 3.8575795629089294e-05, "epoch": 1.0133048229983368, "percentage": 33.78, "elapsed_time": "5:10:52", "remaining_time": "10:09:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8540, "total_steps": 25254, "loss": 0.1232, "learning_rate": 3.8548861367926534e-05, "epoch": 1.0144927536231885, "percentage": 33.82, "elapsed_time": "5:11:14", "remaining_time": "10:09:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8550, "total_steps": 25254, "loss": 0.1217, "learning_rate": 3.8521904821789447e-05, "epoch": 1.01568068424804, "percentage": 33.86, "elapsed_time": "5:11:35", "remaining_time": "10:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8560, "total_steps": 25254, "loss": 0.1215, "learning_rate": 3.849492603501577e-05, "epoch": 1.0168686148728914, "percentage": 33.9, "elapsed_time": "5:11:57", "remaining_time": "10:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8570, "total_steps": 25254, "loss": 0.1193, "learning_rate": 3.8467925051979816e-05, "epoch": 1.0180565454977428, "percentage": 33.94, "elapsed_time": "5:12:20", "remaining_time": "10:08:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8580, "total_steps": 25254, "loss": 0.1255, "learning_rate": 3.8440901917092434e-05, "epoch": 1.0192444761225945, "percentage": 33.97, "elapsed_time": "5:12:42", "remaining_time": "10:07:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8590, "total_steps": 25254, "loss": 0.122, "learning_rate": 3.841385667480089e-05, "epoch": 1.020432406747446, "percentage": 34.01, "elapsed_time": "5:13:04", "remaining_time": "10:07:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8600, "total_steps": 25254, "loss": 0.1254, "learning_rate": 3.83867893695888e-05, "epoch": 1.0216203373722974, "percentage": 34.05, "elapsed_time": "5:13:26", "remaining_time": "10:06:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8610, "total_steps": 25254, "loss": 0.1217, "learning_rate": 3.83597000459761e-05, "epoch": 1.0228082679971489, "percentage": 34.09, "elapsed_time": "5:13:48", "remaining_time": "10:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8620, "total_steps": 25254, "loss": 0.1226, "learning_rate": 3.83325887485189e-05, "epoch": 1.0239961986220005, "percentage": 34.13, "elapsed_time": "5:14:10", "remaining_time": "10:06:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8630, "total_steps": 25254, "loss": 0.1211, "learning_rate": 3.830545552180951e-05, "epoch": 1.025184129246852, "percentage": 34.17, "elapsed_time": "5:14:32", "remaining_time": "10:05:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8640, "total_steps": 25254, "loss": 0.1253, "learning_rate": 3.827830041047624e-05, "epoch": 1.0263720598717034, "percentage": 34.21, "elapsed_time": "5:14:55", "remaining_time": "10:05:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8650, "total_steps": 25254, "loss": 0.1239, "learning_rate": 3.8251123459183466e-05, "epoch": 1.027559990496555, "percentage": 34.25, "elapsed_time": "5:15:16", "remaining_time": "10:05:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8660, "total_steps": 25254, "loss": 0.1267, "learning_rate": 3.822392471263142e-05, "epoch": 1.0287479211214066, "percentage": 34.29, "elapsed_time": "5:15:37", "remaining_time": "10:04:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8670, "total_steps": 25254, "loss": 0.1237, "learning_rate": 3.8196704215556235e-05, "epoch": 1.029935851746258, "percentage": 34.33, "elapsed_time": "5:15:59", "remaining_time": "10:04:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8680, "total_steps": 25254, "loss": 0.1207, "learning_rate": 3.8169462012729784e-05, "epoch": 1.0311237823711095, "percentage": 34.37, "elapsed_time": "5:16:21", "remaining_time": "10:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8690, "total_steps": 25254, "loss": 0.1231, "learning_rate": 3.814219814895965e-05, "epoch": 1.0323117129959611, "percentage": 34.41, "elapsed_time": "5:16:42", "remaining_time": "10:03:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8700, "total_steps": 25254, "loss": 0.1231, "learning_rate": 3.811491266908906e-05, "epoch": 1.0334996436208126, "percentage": 34.45, "elapsed_time": "5:17:05", "remaining_time": "10:03:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8710, "total_steps": 25254, "loss": 0.124, "learning_rate": 3.808760561799678e-05, "epoch": 1.034687574245664, "percentage": 34.49, "elapsed_time": "5:17:27", "remaining_time": "10:02:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8720, "total_steps": 25254, "loss": 0.1231, "learning_rate": 3.806027704059706e-05, "epoch": 1.0358755048705155, "percentage": 34.53, "elapsed_time": "5:17:48", "remaining_time": "10:02:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8730, "total_steps": 25254, "loss": 0.1251, "learning_rate": 3.803292698183955e-05, "epoch": 1.0370634354953672, "percentage": 34.57, "elapsed_time": "5:18:10", "remaining_time": "10:02:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8740, "total_steps": 25254, "loss": 0.1219, "learning_rate": 3.800555548670924e-05, "epoch": 1.0382513661202186, "percentage": 34.61, "elapsed_time": "5:18:32", "remaining_time": "10:01:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8750, "total_steps": 25254, "loss": 0.1243, "learning_rate": 3.797816260022639e-05, "epoch": 1.03943929674507, "percentage": 34.65, "elapsed_time": "5:18:54", "remaining_time": "10:01:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8760, "total_steps": 25254, "loss": 0.1228, "learning_rate": 3.7950748367446396e-05, "epoch": 1.0406272273699215, "percentage": 34.69, "elapsed_time": "5:19:16", "remaining_time": "10:01:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8770, "total_steps": 25254, "loss": 0.1233, "learning_rate": 3.7923312833459837e-05, "epoch": 1.0418151579947732, "percentage": 34.73, "elapsed_time": "5:19:39", "remaining_time": "10:00:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8780, "total_steps": 25254, "loss": 0.1243, "learning_rate": 3.7895856043392255e-05, "epoch": 1.0430030886196247, "percentage": 34.77, "elapsed_time": "5:20:01", "remaining_time": "10:00:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8790, "total_steps": 25254, "loss": 0.1203, "learning_rate": 3.78683780424042e-05, "epoch": 1.044191019244476, "percentage": 34.81, "elapsed_time": "5:20:22", "remaining_time": "10:00:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8800, "total_steps": 25254, "loss": 0.1208, "learning_rate": 3.784087887569111e-05, "epoch": 1.0453789498693276, "percentage": 34.85, "elapsed_time": "5:20:44", "remaining_time": "9:59:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8810, "total_steps": 25254, "loss": 0.1231, "learning_rate": 3.78133585884832e-05, "epoch": 1.0465668804941792, "percentage": 34.89, "elapsed_time": "5:21:06", "remaining_time": "9:59:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8820, "total_steps": 25254, "loss": 0.1248, "learning_rate": 3.7785817226045467e-05, "epoch": 1.0477548111190307, "percentage": 34.93, "elapsed_time": "5:21:27", "remaining_time": "9:58:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8830, "total_steps": 25254, "loss": 0.126, "learning_rate": 3.775825483367754e-05, "epoch": 1.0489427417438821, "percentage": 34.96, "elapsed_time": "5:21:49", "remaining_time": "9:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8840, "total_steps": 25254, "loss": 0.1228, "learning_rate": 3.773067145671366e-05, "epoch": 1.0501306723687336, "percentage": 35.0, "elapsed_time": "5:22:10", "remaining_time": "9:58:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8850, "total_steps": 25254, "loss": 0.1241, "learning_rate": 3.770306714052256e-05, "epoch": 1.0513186029935853, "percentage": 35.04, "elapsed_time": "5:22:31", "remaining_time": "9:57:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8860, "total_steps": 25254, "loss": 0.121, "learning_rate": 3.7675441930507435e-05, "epoch": 1.0525065336184367, "percentage": 35.08, "elapsed_time": "5:22:53", "remaining_time": "9:57:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8870, "total_steps": 25254, "loss": 0.1217, "learning_rate": 3.7647795872105836e-05, "epoch": 1.0536944642432882, "percentage": 35.12, "elapsed_time": "5:23:15", "remaining_time": "9:57:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8880, "total_steps": 25254, "loss": 0.1214, "learning_rate": 3.7620129010789596e-05, "epoch": 1.0548823948681396, "percentage": 35.16, "elapsed_time": "5:23:37", "remaining_time": "9:56:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8890, "total_steps": 25254, "loss": 0.1233, "learning_rate": 3.7592441392064793e-05, "epoch": 1.0560703254929913, "percentage": 35.2, "elapsed_time": "5:23:58", "remaining_time": "9:56:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8900, "total_steps": 25254, "loss": 0.1234, "learning_rate": 3.7564733061471614e-05, "epoch": 1.0572582561178427, "percentage": 35.24, "elapsed_time": "5:24:21", "remaining_time": "9:56:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8910, "total_steps": 25254, "loss": 0.1229, "learning_rate": 3.753700406458434e-05, "epoch": 1.0584461867426942, "percentage": 35.28, "elapsed_time": "5:24:42", "remaining_time": "9:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8920, "total_steps": 25254, "loss": 0.1233, "learning_rate": 3.7509254447011214e-05, "epoch": 1.0596341173675456, "percentage": 35.32, "elapsed_time": "5:25:04", "remaining_time": "9:55:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8930, "total_steps": 25254, "loss": 0.1215, "learning_rate": 3.748148425439442e-05, "epoch": 1.0608220479923973, "percentage": 35.36, "elapsed_time": "5:25:26", "remaining_time": "9:54:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8940, "total_steps": 25254, "loss": 0.1233, "learning_rate": 3.7453693532409983e-05, "epoch": 1.0620099786172488, "percentage": 35.4, "elapsed_time": "5:25:48", "remaining_time": "9:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8950, "total_steps": 25254, "loss": 0.1281, "learning_rate": 3.742588232676767e-05, "epoch": 1.0631979092421002, "percentage": 35.44, "elapsed_time": "5:26:10", "remaining_time": "9:54:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8960, "total_steps": 25254, "loss": 0.12, "learning_rate": 3.7398050683210975e-05, "epoch": 1.0643858398669517, "percentage": 35.48, "elapsed_time": "5:26:32", "remaining_time": "9:53:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8970, "total_steps": 25254, "loss": 0.1219, "learning_rate": 3.737019864751698e-05, "epoch": 1.0655737704918034, "percentage": 35.52, "elapsed_time": "5:26:54", "remaining_time": "9:53:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8980, "total_steps": 25254, "loss": 0.1269, "learning_rate": 3.7342326265496305e-05, "epoch": 1.0667617011166548, "percentage": 35.56, "elapsed_time": "5:27:16", "remaining_time": "9:53:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 8990, "total_steps": 25254, "loss": 0.1233, "learning_rate": 3.731443358299307e-05, "epoch": 1.0679496317415063, "percentage": 35.6, "elapsed_time": "5:27:38", "remaining_time": "9:52:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9000, "total_steps": 25254, "loss": 0.1236, "learning_rate": 3.728652064588475e-05, "epoch": 1.0691375623663577, "percentage": 35.64, "elapsed_time": "5:28:00", "remaining_time": "9:52:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9010, "total_steps": 25254, "loss": 0.1246, "learning_rate": 3.7258587500082154e-05, "epoch": 1.0703254929912094, "percentage": 35.68, "elapsed_time": "5:28:22", "remaining_time": "9:52:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9020, "total_steps": 25254, "loss": 0.1228, "learning_rate": 3.72306341915293e-05, "epoch": 1.0715134236160608, "percentage": 35.72, "elapsed_time": "5:28:44", "remaining_time": "9:51:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9030, "total_steps": 25254, "loss": 0.1251, "learning_rate": 3.7202660766203425e-05, "epoch": 1.0727013542409123, "percentage": 35.76, "elapsed_time": "5:29:06", "remaining_time": "9:51:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9040, "total_steps": 25254, "loss": 0.1224, "learning_rate": 3.717466727011479e-05, "epoch": 1.0738892848657637, "percentage": 35.8, "elapsed_time": "5:29:28", "remaining_time": "9:50:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9050, "total_steps": 25254, "loss": 0.1224, "learning_rate": 3.7146653749306724e-05, "epoch": 1.0750772154906154, "percentage": 35.84, "elapsed_time": "5:29:49", "remaining_time": "9:50:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9060, "total_steps": 25254, "loss": 0.1242, "learning_rate": 3.711862024985546e-05, "epoch": 1.0762651461154669, "percentage": 35.88, "elapsed_time": "5:30:11", "remaining_time": "9:50:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9070, "total_steps": 25254, "loss": 0.1238, "learning_rate": 3.7090566817870085e-05, "epoch": 1.0774530767403183, "percentage": 35.92, "elapsed_time": "5:30:33", "remaining_time": "9:49:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9080, "total_steps": 25254, "loss": 0.1249, "learning_rate": 3.7062493499492504e-05, "epoch": 1.07864100736517, "percentage": 35.95, "elapsed_time": "5:30:55", "remaining_time": "9:49:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9090, "total_steps": 25254, "loss": 0.1244, "learning_rate": 3.70344003408973e-05, "epoch": 1.0798289379900214, "percentage": 35.99, "elapsed_time": "5:31:17", "remaining_time": "9:49:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9100, "total_steps": 25254, "loss": 0.1246, "learning_rate": 3.70062873882917e-05, "epoch": 1.081016868614873, "percentage": 36.03, "elapsed_time": "5:31:39", "remaining_time": "9:48:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9110, "total_steps": 25254, "loss": 0.1254, "learning_rate": 3.6978154687915496e-05, "epoch": 1.0822047992397243, "percentage": 36.07, "elapsed_time": "5:32:01", "remaining_time": "9:48:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9120, "total_steps": 25254, "loss": 0.1244, "learning_rate": 3.695000228604095e-05, "epoch": 1.0833927298645758, "percentage": 36.11, "elapsed_time": "5:32:23", "remaining_time": "9:48:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9130, "total_steps": 25254, "loss": 0.127, "learning_rate": 3.692183022897273e-05, "epoch": 1.0845806604894275, "percentage": 36.15, "elapsed_time": "5:32:45", "remaining_time": "9:47:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9140, "total_steps": 25254, "loss": 0.1212, "learning_rate": 3.689363856304783e-05, "epoch": 1.085768591114279, "percentage": 36.19, "elapsed_time": "5:33:07", "remaining_time": "9:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9150, "total_steps": 25254, "loss": 0.1244, "learning_rate": 3.6865427334635506e-05, "epoch": 1.0869565217391304, "percentage": 36.23, "elapsed_time": "5:33:28", "remaining_time": "9:46:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9160, "total_steps": 25254, "loss": 0.1237, "learning_rate": 3.683719659013719e-05, "epoch": 1.088144452363982, "percentage": 36.27, "elapsed_time": "5:33:49", "remaining_time": "9:46:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9170, "total_steps": 25254, "loss": 0.1219, "learning_rate": 3.6808946375986404e-05, "epoch": 1.0893323829888335, "percentage": 36.31, "elapsed_time": "5:34:12", "remaining_time": "9:46:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9180, "total_steps": 25254, "loss": 0.12, "learning_rate": 3.678067673864869e-05, "epoch": 1.090520313613685, "percentage": 36.35, "elapsed_time": "5:34:34", "remaining_time": "9:45:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9190, "total_steps": 25254, "loss": 0.1283, "learning_rate": 3.6752387724621564e-05, "epoch": 1.0917082442385364, "percentage": 36.39, "elapsed_time": "5:34:56", "remaining_time": "9:45:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9200, "total_steps": 25254, "loss": 0.1227, "learning_rate": 3.672407938043438e-05, "epoch": 1.092896174863388, "percentage": 36.43, "elapsed_time": "5:35:17", "remaining_time": "9:45:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9210, "total_steps": 25254, "loss": 0.1221, "learning_rate": 3.669575175264829e-05, "epoch": 1.0940841054882395, "percentage": 36.47, "elapsed_time": "5:35:39", "remaining_time": "9:44:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9220, "total_steps": 25254, "loss": 0.1252, "learning_rate": 3.66674048878562e-05, "epoch": 1.095272036113091, "percentage": 36.51, "elapsed_time": "5:36:01", "remaining_time": "9:44:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9230, "total_steps": 25254, "loss": 0.1204, "learning_rate": 3.6639038832682607e-05, "epoch": 1.0964599667379424, "percentage": 36.55, "elapsed_time": "5:36:22", "remaining_time": "9:43:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9240, "total_steps": 25254, "loss": 0.124, "learning_rate": 3.661065363378361e-05, "epoch": 1.0976478973627941, "percentage": 36.59, "elapsed_time": "5:36:44", "remaining_time": "9:43:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9250, "total_steps": 25254, "loss": 0.1227, "learning_rate": 3.6582249337846766e-05, "epoch": 1.0988358279876456, "percentage": 36.63, "elapsed_time": "5:37:06", "remaining_time": "9:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9260, "total_steps": 25254, "loss": 0.1259, "learning_rate": 3.6553825991591064e-05, "epoch": 1.100023758612497, "percentage": 36.67, "elapsed_time": "5:37:27", "remaining_time": "9:42:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9270, "total_steps": 25254, "loss": 0.1201, "learning_rate": 3.652538364176682e-05, "epoch": 1.1012116892373485, "percentage": 36.71, "elapsed_time": "5:37:49", "remaining_time": "9:42:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9280, "total_steps": 25254, "loss": 0.1267, "learning_rate": 3.64969223351556e-05, "epoch": 1.1023996198622001, "percentage": 36.75, "elapsed_time": "5:38:11", "remaining_time": "9:42:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9290, "total_steps": 25254, "loss": 0.1223, "learning_rate": 3.6468442118570165e-05, "epoch": 1.1035875504870516, "percentage": 36.79, "elapsed_time": "5:38:33", "remaining_time": "9:41:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9300, "total_steps": 25254, "loss": 0.1248, "learning_rate": 3.643994303885437e-05, "epoch": 1.104775481111903, "percentage": 36.83, "elapsed_time": "5:38:55", "remaining_time": "9:41:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9310, "total_steps": 25254, "loss": 0.1226, "learning_rate": 3.6411425142883084e-05, "epoch": 1.1059634117367545, "percentage": 36.87, "elapsed_time": "5:39:16", "remaining_time": "9:41:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9320, "total_steps": 25254, "loss": 0.1217, "learning_rate": 3.638288847756216e-05, "epoch": 1.1071513423616062, "percentage": 36.91, "elapsed_time": "5:39:39", "remaining_time": "9:40:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9330, "total_steps": 25254, "loss": 0.1229, "learning_rate": 3.6354333089828266e-05, "epoch": 1.1083392729864576, "percentage": 36.94, "elapsed_time": "5:40:01", "remaining_time": "9:40:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9340, "total_steps": 25254, "loss": 0.1234, "learning_rate": 3.632575902664893e-05, "epoch": 1.109527203611309, "percentage": 36.98, "elapsed_time": "5:40:23", "remaining_time": "9:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9350, "total_steps": 25254, "loss": 0.1247, "learning_rate": 3.629716633502233e-05, "epoch": 1.1107151342361605, "percentage": 37.02, "elapsed_time": "5:40:44", "remaining_time": "9:39:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9360, "total_steps": 25254, "loss": 0.1229, "learning_rate": 3.626855506197735e-05, "epoch": 1.1119030648610122, "percentage": 37.06, "elapsed_time": "5:41:06", "remaining_time": "9:39:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9370, "total_steps": 25254, "loss": 0.1263, "learning_rate": 3.623992525457338e-05, "epoch": 1.1130909954858637, "percentage": 37.1, "elapsed_time": "5:41:28", "remaining_time": "9:38:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9380, "total_steps": 25254, "loss": 0.123, "learning_rate": 3.621127695990034e-05, "epoch": 1.114278926110715, "percentage": 37.14, "elapsed_time": "5:41:50", "remaining_time": "9:38:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9390, "total_steps": 25254, "loss": 0.1236, "learning_rate": 3.618261022507853e-05, "epoch": 1.1154668567355666, "percentage": 37.18, "elapsed_time": "5:42:12", "remaining_time": "9:38:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9400, "total_steps": 25254, "loss": 0.1252, "learning_rate": 3.615392509725858e-05, "epoch": 1.1166547873604182, "percentage": 37.22, "elapsed_time": "5:42:34", "remaining_time": "9:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9410, "total_steps": 25254, "loss": 0.1243, "learning_rate": 3.6125221623621396e-05, "epoch": 1.1178427179852697, "percentage": 37.26, "elapsed_time": "5:42:57", "remaining_time": "9:37:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9420, "total_steps": 25254, "loss": 0.1224, "learning_rate": 3.609649985137802e-05, "epoch": 1.1190306486101211, "percentage": 37.3, "elapsed_time": "5:43:19", "remaining_time": "9:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9430, "total_steps": 25254, "loss": 0.1235, "learning_rate": 3.606775982776964e-05, "epoch": 1.1202185792349726, "percentage": 37.34, "elapsed_time": "5:43:41", "remaining_time": "9:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9440, "total_steps": 25254, "loss": 0.1194, "learning_rate": 3.6039001600067414e-05, "epoch": 1.1214065098598243, "percentage": 37.38, "elapsed_time": "5:44:03", "remaining_time": "9:36:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9450, "total_steps": 25254, "loss": 0.1229, "learning_rate": 3.601022521557248e-05, "epoch": 1.1225944404846757, "percentage": 37.42, "elapsed_time": "5:44:25", "remaining_time": "9:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9460, "total_steps": 25254, "loss": 0.1257, "learning_rate": 3.5981430721615824e-05, "epoch": 1.1237823711095272, "percentage": 37.46, "elapsed_time": "5:44:46", "remaining_time": "9:35:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9470, "total_steps": 25254, "loss": 0.1223, "learning_rate": 3.5952618165558215e-05, "epoch": 1.1249703017343786, "percentage": 37.5, "elapsed_time": "5:45:08", "remaining_time": "9:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9480, "total_steps": 25254, "loss": 0.1242, "learning_rate": 3.592378759479014e-05, "epoch": 1.1261582323592303, "percentage": 37.54, "elapsed_time": "5:45:30", "remaining_time": "9:34:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9490, "total_steps": 25254, "loss": 0.1217, "learning_rate": 3.589493905673171e-05, "epoch": 1.1273461629840817, "percentage": 37.58, "elapsed_time": "5:45:52", "remaining_time": "9:34:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9500, "total_steps": 25254, "loss": 0.1246, "learning_rate": 3.58660725988326e-05, "epoch": 1.1285340936089332, "percentage": 37.62, "elapsed_time": "5:46:13", "remaining_time": "9:34:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9510, "total_steps": 25254, "loss": 0.1228, "learning_rate": 3.583718826857192e-05, "epoch": 1.1297220242337849, "percentage": 37.66, "elapsed_time": "5:46:35", "remaining_time": "9:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9520, "total_steps": 25254, "loss": 0.1229, "learning_rate": 3.580828611345823e-05, "epoch": 1.1309099548586363, "percentage": 37.7, "elapsed_time": "5:46:58", "remaining_time": "9:33:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9530, "total_steps": 25254, "loss": 0.1257, "learning_rate": 3.577936618102938e-05, "epoch": 1.1320978854834878, "percentage": 37.74, "elapsed_time": "5:47:19", "remaining_time": "9:33:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9540, "total_steps": 25254, "loss": 0.1236, "learning_rate": 3.575042851885245e-05, "epoch": 1.1332858161083392, "percentage": 37.78, "elapsed_time": "5:47:41", "remaining_time": "9:32:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9550, "total_steps": 25254, "loss": 0.1215, "learning_rate": 3.572147317452372e-05, "epoch": 1.1344737467331907, "percentage": 37.82, "elapsed_time": "5:48:03", "remaining_time": "9:32:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9560, "total_steps": 25254, "loss": 0.1252, "learning_rate": 3.5692500195668505e-05, "epoch": 1.1356616773580424, "percentage": 37.86, "elapsed_time": "5:48:25", "remaining_time": "9:31:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9570, "total_steps": 25254, "loss": 0.1253, "learning_rate": 3.566350962994116e-05, "epoch": 1.1368496079828938, "percentage": 37.89, "elapsed_time": "5:48:47", "remaining_time": "9:31:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9580, "total_steps": 25254, "loss": 0.1213, "learning_rate": 3.563450152502495e-05, "epoch": 1.1380375386077453, "percentage": 37.93, "elapsed_time": "5:49:09", "remaining_time": "9:31:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9590, "total_steps": 25254, "loss": 0.1203, "learning_rate": 3.560547592863199e-05, "epoch": 1.139225469232597, "percentage": 37.97, "elapsed_time": "5:49:30", "remaining_time": "9:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9600, "total_steps": 25254, "loss": 0.1236, "learning_rate": 3.557643288850318e-05, "epoch": 1.1404133998574484, "percentage": 38.01, "elapsed_time": "5:49:53", "remaining_time": "9:30:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9610, "total_steps": 25254, "loss": 0.1244, "learning_rate": 3.5547372452408084e-05, "epoch": 1.1416013304822998, "percentage": 38.05, "elapsed_time": "5:50:14", "remaining_time": "9:30:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9620, "total_steps": 25254, "loss": 0.121, "learning_rate": 3.551829466814491e-05, "epoch": 1.1427892611071513, "percentage": 38.09, "elapsed_time": "5:50:36", "remaining_time": "9:29:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9630, "total_steps": 25254, "loss": 0.1221, "learning_rate": 3.548919958354037e-05, "epoch": 1.1439771917320027, "percentage": 38.13, "elapsed_time": "5:50:58", "remaining_time": "9:29:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9640, "total_steps": 25254, "loss": 0.1194, "learning_rate": 3.5460087246449644e-05, "epoch": 1.1451651223568544, "percentage": 38.17, "elapsed_time": "5:51:20", "remaining_time": "9:29:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9650, "total_steps": 25254, "loss": 0.1213, "learning_rate": 3.5430957704756304e-05, "epoch": 1.1463530529817059, "percentage": 38.21, "elapsed_time": "5:51:42", "remaining_time": "9:28:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9660, "total_steps": 25254, "loss": 0.1232, "learning_rate": 3.5401811006372196e-05, "epoch": 1.1475409836065573, "percentage": 38.25, "elapsed_time": "5:52:04", "remaining_time": "9:28:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9670, "total_steps": 25254, "loss": 0.122, "learning_rate": 3.53726471992374e-05, "epoch": 1.148728914231409, "percentage": 38.29, "elapsed_time": "5:52:26", "remaining_time": "9:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9680, "total_steps": 25254, "loss": 0.1248, "learning_rate": 3.5343466331320114e-05, "epoch": 1.1499168448562604, "percentage": 38.33, "elapsed_time": "5:52:48", "remaining_time": "9:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9690, "total_steps": 25254, "loss": 0.1226, "learning_rate": 3.5314268450616636e-05, "epoch": 1.151104775481112, "percentage": 38.37, "elapsed_time": "5:53:10", "remaining_time": "9:27:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9700, "total_steps": 25254, "loss": 0.1232, "learning_rate": 3.528505360515121e-05, "epoch": 1.1522927061059633, "percentage": 38.41, "elapsed_time": "5:53:32", "remaining_time": "9:26:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9710, "total_steps": 25254, "loss": 0.1239, "learning_rate": 3.5255821842976005e-05, "epoch": 1.1534806367308148, "percentage": 38.45, "elapsed_time": "5:53:55", "remaining_time": "9:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9720, "total_steps": 25254, "loss": 0.1219, "learning_rate": 3.522657321217101e-05, "epoch": 1.1546685673556665, "percentage": 38.49, "elapsed_time": "5:54:16", "remaining_time": "9:26:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9730, "total_steps": 25254, "loss": 0.1232, "learning_rate": 3.519730776084395e-05, "epoch": 1.155856497980518, "percentage": 38.53, "elapsed_time": "5:54:38", "remaining_time": "9:25:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9740, "total_steps": 25254, "loss": 0.1218, "learning_rate": 3.516802553713023e-05, "epoch": 1.1570444286053694, "percentage": 38.57, "elapsed_time": "5:55:00", "remaining_time": "9:25:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9750, "total_steps": 25254, "loss": 0.121, "learning_rate": 3.513872658919282e-05, "epoch": 1.158232359230221, "percentage": 38.61, "elapsed_time": "5:55:22", "remaining_time": "9:25:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9760, "total_steps": 25254, "loss": 0.1228, "learning_rate": 3.5109410965222226e-05, "epoch": 1.1594202898550725, "percentage": 38.65, "elapsed_time": "5:55:44", "remaining_time": "9:24:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9770, "total_steps": 25254, "loss": 0.126, "learning_rate": 3.5080078713436366e-05, "epoch": 1.160608220479924, "percentage": 38.69, "elapsed_time": "5:56:07", "remaining_time": "9:24:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9780, "total_steps": 25254, "loss": 0.1212, "learning_rate": 3.505072988208051e-05, "epoch": 1.1617961511047754, "percentage": 38.73, "elapsed_time": "5:56:29", "remaining_time": "9:24:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9790, "total_steps": 25254, "loss": 0.1253, "learning_rate": 3.5021364519427205e-05, "epoch": 1.162984081729627, "percentage": 38.77, "elapsed_time": "5:56:50", "remaining_time": "9:23:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9800, "total_steps": 25254, "loss": 0.1235, "learning_rate": 3.499198267377616e-05, "epoch": 1.1641720123544785, "percentage": 38.81, "elapsed_time": "5:57:11", "remaining_time": "9:23:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9810, "total_steps": 25254, "loss": 0.1226, "learning_rate": 3.4962584393454244e-05, "epoch": 1.16535994297933, "percentage": 38.85, "elapsed_time": "5:57:35", "remaining_time": "9:22:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9820, "total_steps": 25254, "loss": 0.1227, "learning_rate": 3.493316972681531e-05, "epoch": 1.1665478736041814, "percentage": 38.88, "elapsed_time": "5:57:56", "remaining_time": "9:22:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9830, "total_steps": 25254, "loss": 0.122, "learning_rate": 3.49037387222402e-05, "epoch": 1.1677358042290331, "percentage": 38.92, "elapsed_time": "5:58:18", "remaining_time": "9:22:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9840, "total_steps": 25254, "loss": 0.1217, "learning_rate": 3.4874291428136586e-05, "epoch": 1.1689237348538846, "percentage": 38.96, "elapsed_time": "5:58:39", "remaining_time": "9:21:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9850, "total_steps": 25254, "loss": 0.1201, "learning_rate": 3.4844827892938985e-05, "epoch": 1.170111665478736, "percentage": 39.0, "elapsed_time": "5:59:01", "remaining_time": "9:21:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9860, "total_steps": 25254, "loss": 0.1187, "learning_rate": 3.4815348165108585e-05, "epoch": 1.1712995961035875, "percentage": 39.04, "elapsed_time": "5:59:22", "remaining_time": "9:21:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9870, "total_steps": 25254, "loss": 0.1238, "learning_rate": 3.4785852293133224e-05, "epoch": 1.1724875267284391, "percentage": 39.08, "elapsed_time": "5:59:44", "remaining_time": "9:20:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9880, "total_steps": 25254, "loss": 0.1241, "learning_rate": 3.4756340325527305e-05, "epoch": 1.1736754573532906, "percentage": 39.12, "elapsed_time": "6:00:05", "remaining_time": "9:20:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9890, "total_steps": 25254, "loss": 0.1254, "learning_rate": 3.4726812310831676e-05, "epoch": 1.174863387978142, "percentage": 39.16, "elapsed_time": "6:00:27", "remaining_time": "9:19:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9900, "total_steps": 25254, "loss": 0.1228, "learning_rate": 3.469726829761361e-05, "epoch": 1.1760513186029935, "percentage": 39.2, "elapsed_time": "6:00:49", "remaining_time": "9:19:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9910, "total_steps": 25254, "loss": 0.1216, "learning_rate": 3.4667708334466655e-05, "epoch": 1.1772392492278452, "percentage": 39.24, "elapsed_time": "6:01:11", "remaining_time": "9:19:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9920, "total_steps": 25254, "loss": 0.1224, "learning_rate": 3.4638132470010645e-05, "epoch": 1.1784271798526966, "percentage": 39.28, "elapsed_time": "6:01:33", "remaining_time": "9:18:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9930, "total_steps": 25254, "loss": 0.1212, "learning_rate": 3.4608540752891525e-05, "epoch": 1.179615110477548, "percentage": 39.32, "elapsed_time": "6:01:55", "remaining_time": "9:18:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9940, "total_steps": 25254, "loss": 0.1217, "learning_rate": 3.4578933231781336e-05, "epoch": 1.1808030411023995, "percentage": 39.36, "elapsed_time": "6:02:17", "remaining_time": "9:18:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9950, "total_steps": 25254, "loss": 0.1223, "learning_rate": 3.4549309955378107e-05, "epoch": 1.1819909717272512, "percentage": 39.4, "elapsed_time": "6:02:39", "remaining_time": "9:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9960, "total_steps": 25254, "loss": 0.1254, "learning_rate": 3.4519670972405776e-05, "epoch": 1.1831789023521027, "percentage": 39.44, "elapsed_time": "6:03:01", "remaining_time": "9:17:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9970, "total_steps": 25254, "loss": 0.1225, "learning_rate": 3.4490016331614124e-05, "epoch": 1.184366832976954, "percentage": 39.48, "elapsed_time": "6:03:22", "remaining_time": "9:17:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9980, "total_steps": 25254, "loss": 0.1227, "learning_rate": 3.446034608177869e-05, "epoch": 1.1855547636018056, "percentage": 39.52, "elapsed_time": "6:03:44", "remaining_time": "9:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 9990, "total_steps": 25254, "loss": 0.1224, "learning_rate": 3.443066027170068e-05, "epoch": 1.1867426942266572, "percentage": 39.56, "elapsed_time": "6:04:06", "remaining_time": "9:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10000, "total_steps": 25254, "loss": 0.1239, "learning_rate": 3.4400958950206876e-05, "epoch": 1.1879306248515087, "percentage": 39.6, "elapsed_time": "6:04:29", "remaining_time": "9:15:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10010, "total_steps": 25254, "loss": 0.1245, "learning_rate": 3.437124216614959e-05, "epoch": 1.1891185554763601, "percentage": 39.64, "elapsed_time": "6:04:50", "remaining_time": "9:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10020, "total_steps": 25254, "loss": 0.1238, "learning_rate": 3.4341509968406576e-05, "epoch": 1.1903064861012118, "percentage": 39.68, "elapsed_time": "6:05:12", "remaining_time": "9:15:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10030, "total_steps": 25254, "loss": 0.123, "learning_rate": 3.431176240588092e-05, "epoch": 1.1914944167260633, "percentage": 39.72, "elapsed_time": "6:05:35", "remaining_time": "9:14:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10040, "total_steps": 25254, "loss": 0.1236, "learning_rate": 3.4281999527501e-05, "epoch": 1.1926823473509147, "percentage": 39.76, "elapsed_time": "6:05:56", "remaining_time": "9:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10050, "total_steps": 25254, "loss": 0.1218, "learning_rate": 3.425222138222037e-05, "epoch": 1.1938702779757662, "percentage": 39.8, "elapsed_time": "6:06:17", "remaining_time": "9:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10060, "total_steps": 25254, "loss": 0.1219, "learning_rate": 3.42224280190177e-05, "epoch": 1.1950582086006176, "percentage": 39.84, "elapsed_time": "6:06:39", "remaining_time": "9:13:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10070, "total_steps": 25254, "loss": 0.1231, "learning_rate": 3.419261948689669e-05, "epoch": 1.1962461392254693, "percentage": 39.87, "elapsed_time": "6:07:00", "remaining_time": "9:13:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10080, "total_steps": 25254, "loss": 0.124, "learning_rate": 3.4162795834885984e-05, "epoch": 1.1974340698503207, "percentage": 39.91, "elapsed_time": "6:07:22", "remaining_time": "9:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10090, "total_steps": 25254, "loss": 0.1198, "learning_rate": 3.413295711203911e-05, "epoch": 1.1986220004751722, "percentage": 39.95, "elapsed_time": "6:07:43", "remaining_time": "9:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10100, "total_steps": 25254, "loss": 0.1212, "learning_rate": 3.4103103367434365e-05, "epoch": 1.1998099311000239, "percentage": 39.99, "elapsed_time": "6:08:05", "remaining_time": "9:12:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10110, "total_steps": 25254, "loss": 0.1183, "learning_rate": 3.407323465017477e-05, "epoch": 1.2009978617248753, "percentage": 40.03, "elapsed_time": "6:08:26", "remaining_time": "9:11:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10120, "total_steps": 25254, "loss": 0.1198, "learning_rate": 3.4043351009387964e-05, "epoch": 1.2021857923497268, "percentage": 40.07, "elapsed_time": "6:08:47", "remaining_time": "9:11:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10130, "total_steps": 25254, "loss": 0.124, "learning_rate": 3.401345249422613e-05, "epoch": 1.2033737229745782, "percentage": 40.11, "elapsed_time": "6:09:09", "remaining_time": "9:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10140, "total_steps": 25254, "loss": 0.1238, "learning_rate": 3.398353915386593e-05, "epoch": 1.2045616535994297, "percentage": 40.15, "elapsed_time": "6:09:30", "remaining_time": "9:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10150, "total_steps": 25254, "loss": 0.1204, "learning_rate": 3.3953611037508384e-05, "epoch": 1.2057495842242814, "percentage": 40.19, "elapsed_time": "6:09:52", "remaining_time": "9:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10160, "total_steps": 25254, "loss": 0.1228, "learning_rate": 3.3923668194378856e-05, "epoch": 1.2069375148491328, "percentage": 40.23, "elapsed_time": "6:10:14", "remaining_time": "9:10:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10170, "total_steps": 25254, "loss": 0.1197, "learning_rate": 3.389371067372688e-05, "epoch": 1.2081254454739843, "percentage": 40.27, "elapsed_time": "6:10:36", "remaining_time": "9:09:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10180, "total_steps": 25254, "loss": 0.1203, "learning_rate": 3.3863738524826184e-05, "epoch": 1.209313376098836, "percentage": 40.31, "elapsed_time": "6:10:58", "remaining_time": "9:09:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10190, "total_steps": 25254, "loss": 0.1219, "learning_rate": 3.3833751796974514e-05, "epoch": 1.2105013067236874, "percentage": 40.35, "elapsed_time": "6:11:20", "remaining_time": "9:08:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10200, "total_steps": 25254, "loss": 0.1192, "learning_rate": 3.380375053949362e-05, "epoch": 1.2116892373485388, "percentage": 40.39, "elapsed_time": "6:11:41", "remaining_time": "9:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10210, "total_steps": 25254, "loss": 0.1243, "learning_rate": 3.377373480172915e-05, "epoch": 1.2128771679733903, "percentage": 40.43, "elapsed_time": "6:12:04", "remaining_time": "9:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10220, "total_steps": 25254, "loss": 0.1209, "learning_rate": 3.374370463305056e-05, "epoch": 1.2140650985982417, "percentage": 40.47, "elapsed_time": "6:12:25", "remaining_time": "9:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10230, "total_steps": 25254, "loss": 0.1202, "learning_rate": 3.3713660082851036e-05, "epoch": 1.2152530292230934, "percentage": 40.51, "elapsed_time": "6:12:46", "remaining_time": "9:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10240, "total_steps": 25254, "loss": 0.1239, "learning_rate": 3.3683601200547424e-05, "epoch": 1.2164409598479449, "percentage": 40.55, "elapsed_time": "6:13:08", "remaining_time": "9:07:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10250, "total_steps": 25254, "loss": 0.1207, "learning_rate": 3.365352803558016e-05, "epoch": 1.2176288904727963, "percentage": 40.59, "elapsed_time": "6:13:30", "remaining_time": "9:06:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10260, "total_steps": 25254, "loss": 0.12, "learning_rate": 3.3623440637413154e-05, "epoch": 1.218816821097648, "percentage": 40.63, "elapsed_time": "6:13:53", "remaining_time": "9:06:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10270, "total_steps": 25254, "loss": 0.1226, "learning_rate": 3.359333905553372e-05, "epoch": 1.2200047517224994, "percentage": 40.67, "elapsed_time": "6:14:15", "remaining_time": "9:06:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10280, "total_steps": 25254, "loss": 0.1206, "learning_rate": 3.356322333945252e-05, "epoch": 1.221192682347351, "percentage": 40.71, "elapsed_time": "6:14:37", "remaining_time": "9:05:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10290, "total_steps": 25254, "loss": 0.1224, "learning_rate": 3.3533093538703454e-05, "epoch": 1.2223806129722024, "percentage": 40.75, "elapsed_time": "6:14:59", "remaining_time": "9:05:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10300, "total_steps": 25254, "loss": 0.1214, "learning_rate": 3.350294970284359e-05, "epoch": 1.223568543597054, "percentage": 40.79, "elapsed_time": "6:15:21", "remaining_time": "9:04:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10310, "total_steps": 25254, "loss": 0.1228, "learning_rate": 3.347279188145308e-05, "epoch": 1.2247564742219055, "percentage": 40.83, "elapsed_time": "6:15:42", "remaining_time": "9:04:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10320, "total_steps": 25254, "loss": 0.119, "learning_rate": 3.344262012413507e-05, "epoch": 1.225944404846757, "percentage": 40.86, "elapsed_time": "6:16:04", "remaining_time": "9:04:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10330, "total_steps": 25254, "loss": 0.1269, "learning_rate": 3.341243448051565e-05, "epoch": 1.2271323354716084, "percentage": 40.9, "elapsed_time": "6:16:25", "remaining_time": "9:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10340, "total_steps": 25254, "loss": 0.1228, "learning_rate": 3.338223500024373e-05, "epoch": 1.22832026609646, "percentage": 40.94, "elapsed_time": "6:16:47", "remaining_time": "9:03:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10350, "total_steps": 25254, "loss": 0.1187, "learning_rate": 3.3352021732991e-05, "epoch": 1.2295081967213115, "percentage": 40.98, "elapsed_time": "6:17:09", "remaining_time": "9:03:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10360, "total_steps": 25254, "loss": 0.1226, "learning_rate": 3.3321794728451784e-05, "epoch": 1.230696127346163, "percentage": 41.02, "elapsed_time": "6:17:31", "remaining_time": "9:02:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10370, "total_steps": 25254, "loss": 0.1186, "learning_rate": 3.329155403634305e-05, "epoch": 1.2318840579710144, "percentage": 41.06, "elapsed_time": "6:17:53", "remaining_time": "9:02:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10380, "total_steps": 25254, "loss": 0.1271, "learning_rate": 3.326129970640425e-05, "epoch": 1.233071988595866, "percentage": 41.1, "elapsed_time": "6:18:16", "remaining_time": "9:02:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10390, "total_steps": 25254, "loss": 0.1238, "learning_rate": 3.323103178839729e-05, "epoch": 1.2342599192207175, "percentage": 41.14, "elapsed_time": "6:18:38", "remaining_time": "9:01:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10400, "total_steps": 25254, "loss": 0.1186, "learning_rate": 3.320075033210639e-05, "epoch": 1.235447849845569, "percentage": 41.18, "elapsed_time": "6:19:00", "remaining_time": "9:01:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10410, "total_steps": 25254, "loss": 0.1224, "learning_rate": 3.3170455387338064e-05, "epoch": 1.2366357804704204, "percentage": 41.22, "elapsed_time": "6:19:21", "remaining_time": "9:00:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10420, "total_steps": 25254, "loss": 0.1224, "learning_rate": 3.314014700392101e-05, "epoch": 1.2378237110952721, "percentage": 41.26, "elapsed_time": "6:19:43", "remaining_time": "9:00:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10430, "total_steps": 25254, "loss": 0.1262, "learning_rate": 3.310982523170601e-05, "epoch": 1.2390116417201236, "percentage": 41.3, "elapsed_time": "6:20:05", "remaining_time": "9:00:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10440, "total_steps": 25254, "loss": 0.1229, "learning_rate": 3.307949012056592e-05, "epoch": 1.240199572344975, "percentage": 41.34, "elapsed_time": "6:20:26", "remaining_time": "8:59:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10450, "total_steps": 25254, "loss": 0.1195, "learning_rate": 3.304914172039547e-05, "epoch": 1.2413875029698265, "percentage": 41.38, "elapsed_time": "6:20:48", "remaining_time": "8:59:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10460, "total_steps": 25254, "loss": 0.1221, "learning_rate": 3.301878008111128e-05, "epoch": 1.2425754335946781, "percentage": 41.42, "elapsed_time": "6:21:10", "remaining_time": "8:59:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10470, "total_steps": 25254, "loss": 0.1217, "learning_rate": 3.298840525265175e-05, "epoch": 1.2437633642195296, "percentage": 41.46, "elapsed_time": "6:21:31", "remaining_time": "8:58:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10480, "total_steps": 25254, "loss": 0.1219, "learning_rate": 3.295801728497696e-05, "epoch": 1.244951294844381, "percentage": 41.5, "elapsed_time": "6:21:54", "remaining_time": "8:58:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10490, "total_steps": 25254, "loss": 0.1221, "learning_rate": 3.2927616228068605e-05, "epoch": 1.2461392254692325, "percentage": 41.54, "elapsed_time": "6:22:15", "remaining_time": "8:58:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10500, "total_steps": 25254, "loss": 0.1245, "learning_rate": 3.289720213192991e-05, "epoch": 1.2473271560940842, "percentage": 41.58, "elapsed_time": "6:22:37", "remaining_time": "8:57:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10510, "total_steps": 25254, "loss": 0.1211, "learning_rate": 3.286677504658556e-05, "epoch": 1.2485150867189356, "percentage": 41.62, "elapsed_time": "6:22:59", "remaining_time": "8:57:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10520, "total_steps": 25254, "loss": 0.1214, "learning_rate": 3.283633502208158e-05, "epoch": 1.249703017343787, "percentage": 41.66, "elapsed_time": "6:23:20", "remaining_time": "8:56:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10530, "total_steps": 25254, "loss": 0.1234, "learning_rate": 3.2805882108485284e-05, "epoch": 1.2508909479686388, "percentage": 41.7, "elapsed_time": "6:23:42", "remaining_time": "8:56:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10540, "total_steps": 25254, "loss": 0.1239, "learning_rate": 3.2775416355885204e-05, "epoch": 1.2520788785934902, "percentage": 41.74, "elapsed_time": "6:24:05", "remaining_time": "8:56:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10550, "total_steps": 25254, "loss": 0.1191, "learning_rate": 3.2744937814390974e-05, "epoch": 1.2532668092183417, "percentage": 41.78, "elapsed_time": "6:24:27", "remaining_time": "8:55:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10560, "total_steps": 25254, "loss": 0.1232, "learning_rate": 3.2714446534133256e-05, "epoch": 1.2544547398431931, "percentage": 41.82, "elapsed_time": "6:24:49", "remaining_time": "8:55:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10570, "total_steps": 25254, "loss": 0.1224, "learning_rate": 3.268394256526368e-05, "epoch": 1.2556426704680446, "percentage": 41.85, "elapsed_time": "6:25:10", "remaining_time": "8:55:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10580, "total_steps": 25254, "loss": 0.1191, "learning_rate": 3.265342595795475e-05, "epoch": 1.2568306010928962, "percentage": 41.89, "elapsed_time": "6:25:32", "remaining_time": "8:54:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10590, "total_steps": 25254, "loss": 0.1207, "learning_rate": 3.262289676239973e-05, "epoch": 1.2580185317177477, "percentage": 41.93, "elapsed_time": "6:25:53", "remaining_time": "8:54:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10600, "total_steps": 25254, "loss": 0.1218, "learning_rate": 3.259235502881261e-05, "epoch": 1.2592064623425991, "percentage": 41.97, "elapsed_time": "6:26:15", "remaining_time": "8:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10610, "total_steps": 25254, "loss": 0.1217, "learning_rate": 3.256180080742801e-05, "epoch": 1.2603943929674508, "percentage": 42.01, "elapsed_time": "6:26:37", "remaining_time": "8:53:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10620, "total_steps": 25254, "loss": 0.1251, "learning_rate": 3.253123414850107e-05, "epoch": 1.2615823235923023, "percentage": 42.05, "elapsed_time": "6:26:59", "remaining_time": "8:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10630, "total_steps": 25254, "loss": 0.1177, "learning_rate": 3.2500655102307386e-05, "epoch": 1.2627702542171537, "percentage": 42.09, "elapsed_time": "6:27:21", "remaining_time": "8:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10640, "total_steps": 25254, "loss": 0.124, "learning_rate": 3.247006371914295e-05, "epoch": 1.2639581848420052, "percentage": 42.13, "elapsed_time": "6:27:43", "remaining_time": "8:52:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10650, "total_steps": 25254, "loss": 0.1188, "learning_rate": 3.243946004932404e-05, "epoch": 1.2651461154668566, "percentage": 42.17, "elapsed_time": "6:28:05", "remaining_time": "8:52:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10660, "total_steps": 25254, "loss": 0.1234, "learning_rate": 3.2408844143187126e-05, "epoch": 1.2663340460917083, "percentage": 42.21, "elapsed_time": "6:28:27", "remaining_time": "8:51:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10670, "total_steps": 25254, "loss": 0.1179, "learning_rate": 3.237821605108881e-05, "epoch": 1.2675219767165598, "percentage": 42.25, "elapsed_time": "6:28:48", "remaining_time": "8:51:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10680, "total_steps": 25254, "loss": 0.1214, "learning_rate": 3.234757582340575e-05, "epoch": 1.2687099073414112, "percentage": 42.29, "elapsed_time": "6:29:10", "remaining_time": "8:51:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10690, "total_steps": 25254, "loss": 0.1214, "learning_rate": 3.231692351053456e-05, "epoch": 1.2698978379662629, "percentage": 42.33, "elapsed_time": "6:29:31", "remaining_time": "8:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10700, "total_steps": 25254, "loss": 0.1229, "learning_rate": 3.2286259162891724e-05, "epoch": 1.2710857685911143, "percentage": 42.37, "elapsed_time": "6:29:53", "remaining_time": "8:50:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10710, "total_steps": 25254, "loss": 0.1194, "learning_rate": 3.2255582830913525e-05, "epoch": 1.2722736992159658, "percentage": 42.41, "elapsed_time": "6:30:16", "remaining_time": "8:49:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10720, "total_steps": 25254, "loss": 0.1183, "learning_rate": 3.222489456505595e-05, "epoch": 1.2734616298408172, "percentage": 42.45, "elapsed_time": "6:30:38", "remaining_time": "8:49:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10730, "total_steps": 25254, "loss": 0.1222, "learning_rate": 3.219419441579463e-05, "epoch": 1.2746495604656687, "percentage": 42.49, "elapsed_time": "6:31:00", "remaining_time": "8:49:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10740, "total_steps": 25254, "loss": 0.1234, "learning_rate": 3.216348243362472e-05, "epoch": 1.2758374910905204, "percentage": 42.53, "elapsed_time": "6:31:21", "remaining_time": "8:48:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10750, "total_steps": 25254, "loss": 0.1192, "learning_rate": 3.213275866906088e-05, "epoch": 1.2770254217153718, "percentage": 42.57, "elapsed_time": "6:31:43", "remaining_time": "8:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10760, "total_steps": 25254, "loss": 0.1263, "learning_rate": 3.21020231726371e-05, "epoch": 1.2782133523402233, "percentage": 42.61, "elapsed_time": "6:32:04", "remaining_time": "8:48:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10770, "total_steps": 25254, "loss": 0.1242, "learning_rate": 3.207127599490668e-05, "epoch": 1.279401282965075, "percentage": 42.65, "elapsed_time": "6:32:26", "remaining_time": "8:47:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10780, "total_steps": 25254, "loss": 0.123, "learning_rate": 3.204051718644216e-05, "epoch": 1.2805892135899264, "percentage": 42.69, "elapsed_time": "6:32:47", "remaining_time": "8:47:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10790, "total_steps": 25254, "loss": 0.1186, "learning_rate": 3.2009746797835185e-05, "epoch": 1.2817771442147778, "percentage": 42.73, "elapsed_time": "6:33:09", "remaining_time": "8:47:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10800, "total_steps": 25254, "loss": 0.1207, "learning_rate": 3.1978964879696437e-05, "epoch": 1.2829650748396293, "percentage": 42.77, "elapsed_time": "6:33:30", "remaining_time": "8:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10810, "total_steps": 25254, "loss": 0.1215, "learning_rate": 3.194817148265559e-05, "epoch": 1.2841530054644807, "percentage": 42.81, "elapsed_time": "6:33:53", "remaining_time": "8:46:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10820, "total_steps": 25254, "loss": 0.1229, "learning_rate": 3.191736665736118e-05, "epoch": 1.2853409360893324, "percentage": 42.84, "elapsed_time": "6:34:14", "remaining_time": "8:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10830, "total_steps": 25254, "loss": 0.1218, "learning_rate": 3.188655045448056e-05, "epoch": 1.2865288667141839, "percentage": 42.88, "elapsed_time": "6:34:35", "remaining_time": "8:45:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10840, "total_steps": 25254, "loss": 0.1209, "learning_rate": 3.185572292469976e-05, "epoch": 1.2877167973390353, "percentage": 42.92, "elapsed_time": "6:34:57", "remaining_time": "8:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10850, "total_steps": 25254, "loss": 0.1254, "learning_rate": 3.182488411872348e-05, "epoch": 1.288904727963887, "percentage": 42.96, "elapsed_time": "6:35:18", "remaining_time": "8:44:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10860, "total_steps": 25254, "loss": 0.1206, "learning_rate": 3.1794034087274935e-05, "epoch": 1.2900926585887385, "percentage": 43.0, "elapsed_time": "6:35:40", "remaining_time": "8:44:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10870, "total_steps": 25254, "loss": 0.1219, "learning_rate": 3.1763172881095826e-05, "epoch": 1.29128058921359, "percentage": 43.04, "elapsed_time": "6:36:02", "remaining_time": "8:44:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10880, "total_steps": 25254, "loss": 0.1213, "learning_rate": 3.1732300550946226e-05, "epoch": 1.2924685198384414, "percentage": 43.08, "elapsed_time": "6:36:24", "remaining_time": "8:43:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10890, "total_steps": 25254, "loss": 0.1197, "learning_rate": 3.17014171476045e-05, "epoch": 1.2936564504632928, "percentage": 43.12, "elapsed_time": "6:36:46", "remaining_time": "8:43:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10900, "total_steps": 25254, "loss": 0.1217, "learning_rate": 3.167052272186722e-05, "epoch": 1.2948443810881445, "percentage": 43.16, "elapsed_time": "6:37:07", "remaining_time": "8:42:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10910, "total_steps": 25254, "loss": 0.1215, "learning_rate": 3.163961732454913e-05, "epoch": 1.296032311712996, "percentage": 43.2, "elapsed_time": "6:37:29", "remaining_time": "8:42:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10920, "total_steps": 25254, "loss": 0.1216, "learning_rate": 3.160870100648296e-05, "epoch": 1.2972202423378474, "percentage": 43.24, "elapsed_time": "6:37:51", "remaining_time": "8:42:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10930, "total_steps": 25254, "loss": 0.125, "learning_rate": 3.1577773818519434e-05, "epoch": 1.298408172962699, "percentage": 43.28, "elapsed_time": "6:38:13", "remaining_time": "8:41:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10940, "total_steps": 25254, "loss": 0.1241, "learning_rate": 3.154683581152716e-05, "epoch": 1.2995961035875505, "percentage": 43.32, "elapsed_time": "6:38:34", "remaining_time": "8:41:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10950, "total_steps": 25254, "loss": 0.1229, "learning_rate": 3.151588703639252e-05, "epoch": 1.300784034212402, "percentage": 43.36, "elapsed_time": "6:38:56", "remaining_time": "8:41:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10960, "total_steps": 25254, "loss": 0.1203, "learning_rate": 3.1484927544019624e-05, "epoch": 1.3019719648372536, "percentage": 43.4, "elapsed_time": "6:39:17", "remaining_time": "8:40:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10970, "total_steps": 25254, "loss": 0.1209, "learning_rate": 3.145395738533021e-05, "epoch": 1.303159895462105, "percentage": 43.44, "elapsed_time": "6:39:40", "remaining_time": "8:40:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10980, "total_steps": 25254, "loss": 0.1262, "learning_rate": 3.142297661126355e-05, "epoch": 1.3043478260869565, "percentage": 43.48, "elapsed_time": "6:40:01", "remaining_time": "8:40:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 10990, "total_steps": 25254, "loss": 0.1225, "learning_rate": 3.1391985272776375e-05, "epoch": 1.305535756711808, "percentage": 43.52, "elapsed_time": "6:40:23", "remaining_time": "8:39:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11000, "total_steps": 25254, "loss": 0.1208, "learning_rate": 3.13609834208428e-05, "epoch": 1.3067236873366594, "percentage": 43.56, "elapsed_time": "6:40:43", "remaining_time": "8:39:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11010, "total_steps": 25254, "loss": 0.1212, "learning_rate": 3.1329971106454234e-05, "epoch": 1.3079116179615111, "percentage": 43.6, "elapsed_time": "6:41:05", "remaining_time": "8:38:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11020, "total_steps": 25254, "loss": 0.1219, "learning_rate": 3.129894838061929e-05, "epoch": 1.3090995485863626, "percentage": 43.64, "elapsed_time": "6:41:27", "remaining_time": "8:38:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11030, "total_steps": 25254, "loss": 0.1232, "learning_rate": 3.12679152943637e-05, "epoch": 1.310287479211214, "percentage": 43.68, "elapsed_time": "6:41:48", "remaining_time": "8:38:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11040, "total_steps": 25254, "loss": 0.1219, "learning_rate": 3.123687189873025e-05, "epoch": 1.3114754098360657, "percentage": 43.72, "elapsed_time": "6:42:10", "remaining_time": "8:37:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11050, "total_steps": 25254, "loss": 0.1237, "learning_rate": 3.1205818244778666e-05, "epoch": 1.3126633404609171, "percentage": 43.76, "elapsed_time": "6:42:33", "remaining_time": "8:37:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11060, "total_steps": 25254, "loss": 0.1257, "learning_rate": 3.117475438358557e-05, "epoch": 1.3138512710857686, "percentage": 43.8, "elapsed_time": "6:42:54", "remaining_time": "8:37:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11070, "total_steps": 25254, "loss": 0.1212, "learning_rate": 3.1143680366244344e-05, "epoch": 1.31503920171062, "percentage": 43.83, "elapsed_time": "6:43:17", "remaining_time": "8:36:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11080, "total_steps": 25254, "loss": 0.1191, "learning_rate": 3.11125962438651e-05, "epoch": 1.3162271323354715, "percentage": 43.87, "elapsed_time": "6:43:39", "remaining_time": "8:36:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11090, "total_steps": 25254, "loss": 0.1199, "learning_rate": 3.108150206757455e-05, "epoch": 1.3174150629603232, "percentage": 43.91, "elapsed_time": "6:44:01", "remaining_time": "8:36:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11100, "total_steps": 25254, "loss": 0.1243, "learning_rate": 3.105039788851596e-05, "epoch": 1.3186029935851746, "percentage": 43.95, "elapsed_time": "6:44:23", "remaining_time": "8:35:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11110, "total_steps": 25254, "loss": 0.1201, "learning_rate": 3.101928375784904e-05, "epoch": 1.319790924210026, "percentage": 43.99, "elapsed_time": "6:44:45", "remaining_time": "8:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11120, "total_steps": 25254, "loss": 0.122, "learning_rate": 3.0988159726749875e-05, "epoch": 1.3209788548348778, "percentage": 44.03, "elapsed_time": "6:45:07", "remaining_time": "8:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11130, "total_steps": 25254, "loss": 0.1227, "learning_rate": 3.095702584641082e-05, "epoch": 1.3221667854597292, "percentage": 44.07, "elapsed_time": "6:45:29", "remaining_time": "8:34:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11140, "total_steps": 25254, "loss": 0.1211, "learning_rate": 3.092588216804043e-05, "epoch": 1.3233547160845807, "percentage": 44.11, "elapsed_time": "6:45:52", "remaining_time": "8:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11150, "total_steps": 25254, "loss": 0.1239, "learning_rate": 3.08947287428634e-05, "epoch": 1.3245426467094321, "percentage": 44.15, "elapsed_time": "6:46:13", "remaining_time": "8:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11160, "total_steps": 25254, "loss": 0.1221, "learning_rate": 3.0863565622120436e-05, "epoch": 1.3257305773342836, "percentage": 44.19, "elapsed_time": "6:46:36", "remaining_time": "8:33:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11170, "total_steps": 25254, "loss": 0.122, "learning_rate": 3.08323928570682e-05, "epoch": 1.3269185079591352, "percentage": 44.23, "elapsed_time": "6:46:58", "remaining_time": "8:33:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11180, "total_steps": 25254, "loss": 0.1167, "learning_rate": 3.08012104989792e-05, "epoch": 1.3281064385839867, "percentage": 44.27, "elapsed_time": "6:47:20", "remaining_time": "8:32:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11190, "total_steps": 25254, "loss": 0.1236, "learning_rate": 3.077001859914174e-05, "epoch": 1.3292943692088381, "percentage": 44.31, "elapsed_time": "6:47:41", "remaining_time": "8:32:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11200, "total_steps": 25254, "loss": 0.121, "learning_rate": 3.0738817208859816e-05, "epoch": 1.3304822998336898, "percentage": 44.35, "elapsed_time": "6:48:03", "remaining_time": "8:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11210, "total_steps": 25254, "loss": 0.1193, "learning_rate": 3.070760637945303e-05, "epoch": 1.3316702304585413, "percentage": 44.39, "elapsed_time": "6:48:25", "remaining_time": "8:31:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11220, "total_steps": 25254, "loss": 0.1198, "learning_rate": 3.0676386162256505e-05, "epoch": 1.3328581610833927, "percentage": 44.43, "elapsed_time": "6:48:47", "remaining_time": "8:31:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11230, "total_steps": 25254, "loss": 0.1229, "learning_rate": 3.0645156608620815e-05, "epoch": 1.3340460917082442, "percentage": 44.47, "elapsed_time": "6:49:08", "remaining_time": "8:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11240, "total_steps": 25254, "loss": 0.1199, "learning_rate": 3.061391776991188e-05, "epoch": 1.3352340223330956, "percentage": 44.51, "elapsed_time": "6:49:31", "remaining_time": "8:30:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11250, "total_steps": 25254, "loss": 0.1197, "learning_rate": 3.0582669697510906e-05, "epoch": 1.3364219529579473, "percentage": 44.55, "elapsed_time": "6:49:52", "remaining_time": "8:30:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11260, "total_steps": 25254, "loss": 0.1187, "learning_rate": 3.055141244281427e-05, "epoch": 1.3376098835827988, "percentage": 44.59, "elapsed_time": "6:50:14", "remaining_time": "8:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11270, "total_steps": 25254, "loss": 0.1205, "learning_rate": 3.0520146057233466e-05, "epoch": 1.3387978142076502, "percentage": 44.63, "elapsed_time": "6:50:37", "remaining_time": "8:29:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11280, "total_steps": 25254, "loss": 0.1213, "learning_rate": 3.0488870592194994e-05, "epoch": 1.3399857448325019, "percentage": 44.67, "elapsed_time": "6:50:59", "remaining_time": "8:29:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11290, "total_steps": 25254, "loss": 0.1215, "learning_rate": 3.04575860991403e-05, "epoch": 1.3411736754573533, "percentage": 44.71, "elapsed_time": "6:51:21", "remaining_time": "8:28:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11300, "total_steps": 25254, "loss": 0.1218, "learning_rate": 3.042629262952566e-05, "epoch": 1.3423616060822048, "percentage": 44.75, "elapsed_time": "6:51:43", "remaining_time": "8:28:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11310, "total_steps": 25254, "loss": 0.119, "learning_rate": 3.0394990234822147e-05, "epoch": 1.3435495367070562, "percentage": 44.78, "elapsed_time": "6:52:04", "remaining_time": "8:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11320, "total_steps": 25254, "loss": 0.118, "learning_rate": 3.036367896651548e-05, "epoch": 1.3447374673319077, "percentage": 44.82, "elapsed_time": "6:52:25", "remaining_time": "8:27:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11330, "total_steps": 25254, "loss": 0.1192, "learning_rate": 3.033235887610598e-05, "epoch": 1.3459253979567594, "percentage": 44.86, "elapsed_time": "6:52:46", "remaining_time": "8:27:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11340, "total_steps": 25254, "loss": 0.1179, "learning_rate": 3.0301030015108512e-05, "epoch": 1.3471133285816108, "percentage": 44.9, "elapsed_time": "6:53:08", "remaining_time": "8:26:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11350, "total_steps": 25254, "loss": 0.1175, "learning_rate": 3.026969243505232e-05, "epoch": 1.3483012592064623, "percentage": 44.94, "elapsed_time": "6:53:30", "remaining_time": "8:26:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11360, "total_steps": 25254, "loss": 0.1236, "learning_rate": 3.023834618748102e-05, "epoch": 1.349489189831314, "percentage": 44.98, "elapsed_time": "6:53:53", "remaining_time": "8:26:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11370, "total_steps": 25254, "loss": 0.119, "learning_rate": 3.020699132395246e-05, "epoch": 1.3506771204561654, "percentage": 45.02, "elapsed_time": "6:54:16", "remaining_time": "8:25:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11380, "total_steps": 25254, "loss": 0.1205, "learning_rate": 3.017562789603869e-05, "epoch": 1.3518650510810168, "percentage": 45.06, "elapsed_time": "6:54:38", "remaining_time": "8:25:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11390, "total_steps": 25254, "loss": 0.1221, "learning_rate": 3.0144255955325824e-05, "epoch": 1.3530529817058683, "percentage": 45.1, "elapsed_time": "6:54:59", "remaining_time": "8:25:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11400, "total_steps": 25254, "loss": 0.1215, "learning_rate": 3.0112875553413973e-05, "epoch": 1.3542409123307197, "percentage": 45.14, "elapsed_time": "6:55:22", "remaining_time": "8:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11410, "total_steps": 25254, "loss": 0.118, "learning_rate": 3.0081486741917194e-05, "epoch": 1.3554288429555714, "percentage": 45.18, "elapsed_time": "6:55:44", "remaining_time": "8:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11420, "total_steps": 25254, "loss": 0.1198, "learning_rate": 3.0050089572463337e-05, "epoch": 1.3566167735804229, "percentage": 45.22, "elapsed_time": "6:56:06", "remaining_time": "8:24:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11430, "total_steps": 25254, "loss": 0.1204, "learning_rate": 3.001868409669404e-05, "epoch": 1.3578047042052743, "percentage": 45.26, "elapsed_time": "6:56:28", "remaining_time": "8:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11440, "total_steps": 25254, "loss": 0.1171, "learning_rate": 2.9987270366264563e-05, "epoch": 1.358992634830126, "percentage": 45.3, "elapsed_time": "6:56:49", "remaining_time": "8:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11450, "total_steps": 25254, "loss": 0.12, "learning_rate": 2.995584843284378e-05, "epoch": 1.3601805654549775, "percentage": 45.34, "elapsed_time": "6:57:11", "remaining_time": "8:22:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11460, "total_steps": 25254, "loss": 0.1211, "learning_rate": 2.9924418348114035e-05, "epoch": 1.361368496079829, "percentage": 45.38, "elapsed_time": "6:57:33", "remaining_time": "8:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11470, "total_steps": 25254, "loss": 0.1193, "learning_rate": 2.989298016377107e-05, "epoch": 1.3625564267046806, "percentage": 45.42, "elapsed_time": "6:57:55", "remaining_time": "8:22:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11480, "total_steps": 25254, "loss": 0.121, "learning_rate": 2.986153393152398e-05, "epoch": 1.363744357329532, "percentage": 45.46, "elapsed_time": "6:58:18", "remaining_time": "8:21:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11490, "total_steps": 25254, "loss": 0.1215, "learning_rate": 2.9830079703095077e-05, "epoch": 1.3649322879543835, "percentage": 45.5, "elapsed_time": "6:58:40", "remaining_time": "8:21:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11500, "total_steps": 25254, "loss": 0.1188, "learning_rate": 2.9798617530219826e-05, "epoch": 1.366120218579235, "percentage": 45.54, "elapsed_time": "6:59:02", "remaining_time": "8:21:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11510, "total_steps": 25254, "loss": 0.1219, "learning_rate": 2.976714746464676e-05, "epoch": 1.3673081492040864, "percentage": 45.58, "elapsed_time": "6:59:23", "remaining_time": "8:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11520, "total_steps": 25254, "loss": 0.1196, "learning_rate": 2.9735669558137398e-05, "epoch": 1.368496079828938, "percentage": 45.62, "elapsed_time": "6:59:46", "remaining_time": "8:20:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11530, "total_steps": 25254, "loss": 0.1226, "learning_rate": 2.970418386246615e-05, "epoch": 1.3696840104537895, "percentage": 45.66, "elapsed_time": "7:00:08", "remaining_time": "8:20:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11540, "total_steps": 25254, "loss": 0.122, "learning_rate": 2.9672690429420236e-05, "epoch": 1.370871941078641, "percentage": 45.7, "elapsed_time": "7:00:29", "remaining_time": "8:19:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11550, "total_steps": 25254, "loss": 0.1176, "learning_rate": 2.964118931079961e-05, "epoch": 1.3720598717034926, "percentage": 45.74, "elapsed_time": "7:00:52", "remaining_time": "8:19:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11560, "total_steps": 25254, "loss": 0.1194, "learning_rate": 2.9609680558416863e-05, "epoch": 1.373247802328344, "percentage": 45.77, "elapsed_time": "7:01:14", "remaining_time": "8:18:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11570, "total_steps": 25254, "loss": 0.1209, "learning_rate": 2.9578164224097154e-05, "epoch": 1.3744357329531955, "percentage": 45.81, "elapsed_time": "7:01:35", "remaining_time": "8:18:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11580, "total_steps": 25254, "loss": 0.1192, "learning_rate": 2.9546640359678086e-05, "epoch": 1.375623663578047, "percentage": 45.85, "elapsed_time": "7:01:58", "remaining_time": "8:18:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11590, "total_steps": 25254, "loss": 0.1186, "learning_rate": 2.951510901700966e-05, "epoch": 1.3768115942028984, "percentage": 45.89, "elapsed_time": "7:02:20", "remaining_time": "8:17:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11600, "total_steps": 25254, "loss": 0.1213, "learning_rate": 2.9483570247954202e-05, "epoch": 1.3779995248277501, "percentage": 45.93, "elapsed_time": "7:02:42", "remaining_time": "8:17:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11610, "total_steps": 25254, "loss": 0.1199, "learning_rate": 2.945202410438621e-05, "epoch": 1.3791874554526016, "percentage": 45.97, "elapsed_time": "7:03:04", "remaining_time": "8:17:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11620, "total_steps": 25254, "loss": 0.1193, "learning_rate": 2.9420470638192338e-05, "epoch": 1.380375386077453, "percentage": 46.01, "elapsed_time": "7:03:26", "remaining_time": "8:16:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11630, "total_steps": 25254, "loss": 0.1221, "learning_rate": 2.9388909901271273e-05, "epoch": 1.3815633167023047, "percentage": 46.05, "elapsed_time": "7:03:49", "remaining_time": "8:16:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11640, "total_steps": 25254, "loss": 0.1153, "learning_rate": 2.9357341945533673e-05, "epoch": 1.3827512473271562, "percentage": 46.09, "elapsed_time": "7:04:11", "remaining_time": "8:16:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11650, "total_steps": 25254, "loss": 0.1209, "learning_rate": 2.9325766822902063e-05, "epoch": 1.3839391779520076, "percentage": 46.13, "elapsed_time": "7:04:33", "remaining_time": "8:15:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11660, "total_steps": 25254, "loss": 0.1195, "learning_rate": 2.9294184585310745e-05, "epoch": 1.385127108576859, "percentage": 46.17, "elapsed_time": "7:04:54", "remaining_time": "8:15:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11670, "total_steps": 25254, "loss": 0.12, "learning_rate": 2.9262595284705747e-05, "epoch": 1.3863150392017105, "percentage": 46.21, "elapsed_time": "7:05:16", "remaining_time": "8:15:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11680, "total_steps": 25254, "loss": 0.1194, "learning_rate": 2.9230998973044693e-05, "epoch": 1.3875029698265622, "percentage": 46.25, "elapsed_time": "7:05:39", "remaining_time": "8:14:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11690, "total_steps": 25254, "loss": 0.1192, "learning_rate": 2.919939570229675e-05, "epoch": 1.3886909004514136, "percentage": 46.29, "elapsed_time": "7:06:01", "remaining_time": "8:14:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11700, "total_steps": 25254, "loss": 0.1206, "learning_rate": 2.9167785524442527e-05, "epoch": 1.389878831076265, "percentage": 46.33, "elapsed_time": "7:06:22", "remaining_time": "8:13:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11710, "total_steps": 25254, "loss": 0.1244, "learning_rate": 2.913616849147399e-05, "epoch": 1.3910667617011168, "percentage": 46.37, "elapsed_time": "7:06:44", "remaining_time": "8:13:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11720, "total_steps": 25254, "loss": 0.1188, "learning_rate": 2.9104544655394395e-05, "epoch": 1.3922546923259682, "percentage": 46.41, "elapsed_time": "7:07:07", "remaining_time": "8:13:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11730, "total_steps": 25254, "loss": 0.1236, "learning_rate": 2.9072914068218166e-05, "epoch": 1.3934426229508197, "percentage": 46.45, "elapsed_time": "7:07:29", "remaining_time": "8:12:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11740, "total_steps": 25254, "loss": 0.1142, "learning_rate": 2.9041276781970856e-05, "epoch": 1.3946305535756711, "percentage": 46.49, "elapsed_time": "7:07:52", "remaining_time": "8:12:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11750, "total_steps": 25254, "loss": 0.122, "learning_rate": 2.9009632848689007e-05, "epoch": 1.3958184842005226, "percentage": 46.53, "elapsed_time": "7:08:13", "remaining_time": "8:12:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11760, "total_steps": 25254, "loss": 0.1194, "learning_rate": 2.8977982320420123e-05, "epoch": 1.3970064148253742, "percentage": 46.57, "elapsed_time": "7:08:35", "remaining_time": "8:11:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11770, "total_steps": 25254, "loss": 0.1159, "learning_rate": 2.8946325249222534e-05, "epoch": 1.3981943454502257, "percentage": 46.61, "elapsed_time": "7:08:56", "remaining_time": "8:11:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11780, "total_steps": 25254, "loss": 0.1201, "learning_rate": 2.891466168716535e-05, "epoch": 1.3993822760750771, "percentage": 46.65, "elapsed_time": "7:09:18", "remaining_time": "8:11:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11790, "total_steps": 25254, "loss": 0.1202, "learning_rate": 2.8882991686328337e-05, "epoch": 1.4005702066999288, "percentage": 46.69, "elapsed_time": "7:09:40", "remaining_time": "8:10:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11800, "total_steps": 25254, "loss": 0.1185, "learning_rate": 2.8851315298801864e-05, "epoch": 1.4017581373247803, "percentage": 46.73, "elapsed_time": "7:10:02", "remaining_time": "8:10:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11810, "total_steps": 25254, "loss": 0.1189, "learning_rate": 2.8819632576686805e-05, "epoch": 1.4029460679496317, "percentage": 46.76, "elapsed_time": "7:10:24", "remaining_time": "8:09:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11820, "total_steps": 25254, "loss": 0.1188, "learning_rate": 2.878794357209445e-05, "epoch": 1.4041339985744832, "percentage": 46.8, "elapsed_time": "7:10:46", "remaining_time": "8:09:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11830, "total_steps": 25254, "loss": 0.1189, "learning_rate": 2.8756248337146424e-05, "epoch": 1.4053219291993346, "percentage": 46.84, "elapsed_time": "7:11:08", "remaining_time": "8:09:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11840, "total_steps": 25254, "loss": 0.1208, "learning_rate": 2.87245469239746e-05, "epoch": 1.4065098598241863, "percentage": 46.88, "elapsed_time": "7:11:30", "remaining_time": "8:08:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11850, "total_steps": 25254, "loss": 0.12, "learning_rate": 2.8692839384721003e-05, "epoch": 1.4076977904490378, "percentage": 46.92, "elapsed_time": "7:11:52", "remaining_time": "8:08:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11860, "total_steps": 25254, "loss": 0.1175, "learning_rate": 2.866112577153775e-05, "epoch": 1.4088857210738892, "percentage": 46.96, "elapsed_time": "7:12:13", "remaining_time": "8:08:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11870, "total_steps": 25254, "loss": 0.1228, "learning_rate": 2.862940613658693e-05, "epoch": 1.4100736516987409, "percentage": 47.0, "elapsed_time": "7:12:35", "remaining_time": "8:07:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11880, "total_steps": 25254, "loss": 0.1216, "learning_rate": 2.8597680532040562e-05, "epoch": 1.4112615823235923, "percentage": 47.04, "elapsed_time": "7:12:57", "remaining_time": "8:07:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11890, "total_steps": 25254, "loss": 0.1227, "learning_rate": 2.8565949010080452e-05, "epoch": 1.4124495129484438, "percentage": 47.08, "elapsed_time": "7:13:19", "remaining_time": "8:07:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11900, "total_steps": 25254, "loss": 0.1184, "learning_rate": 2.8534211622898175e-05, "epoch": 1.4136374435732952, "percentage": 47.12, "elapsed_time": "7:13:41", "remaining_time": "8:06:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11910, "total_steps": 25254, "loss": 0.1196, "learning_rate": 2.8502468422694922e-05, "epoch": 1.4148253741981467, "percentage": 47.16, "elapsed_time": "7:14:03", "remaining_time": "8:06:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11920, "total_steps": 25254, "loss": 0.1186, "learning_rate": 2.847071946168145e-05, "epoch": 1.4160133048229984, "percentage": 47.2, "elapsed_time": "7:14:26", "remaining_time": "8:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11930, "total_steps": 25254, "loss": 0.1185, "learning_rate": 2.843896479207802e-05, "epoch": 1.4172012354478498, "percentage": 47.24, "elapsed_time": "7:14:47", "remaining_time": "8:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11940, "total_steps": 25254, "loss": 0.1203, "learning_rate": 2.840720446611424e-05, "epoch": 1.4183891660727013, "percentage": 47.28, "elapsed_time": "7:15:09", "remaining_time": "8:05:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11950, "total_steps": 25254, "loss": 0.1193, "learning_rate": 2.8375438536029053e-05, "epoch": 1.419577096697553, "percentage": 47.32, "elapsed_time": "7:15:30", "remaining_time": "8:04:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11960, "total_steps": 25254, "loss": 0.117, "learning_rate": 2.83436670540706e-05, "epoch": 1.4207650273224044, "percentage": 47.36, "elapsed_time": "7:15:52", "remaining_time": "8:04:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11970, "total_steps": 25254, "loss": 0.1202, "learning_rate": 2.8311890072496173e-05, "epoch": 1.4219529579472558, "percentage": 47.4, "elapsed_time": "7:16:14", "remaining_time": "8:04:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11980, "total_steps": 25254, "loss": 0.1166, "learning_rate": 2.828010764357209e-05, "epoch": 1.4231408885721075, "percentage": 47.44, "elapsed_time": "7:16:36", "remaining_time": "8:03:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 11990, "total_steps": 25254, "loss": 0.1221, "learning_rate": 2.8248319819573644e-05, "epoch": 1.424328819196959, "percentage": 47.48, "elapsed_time": "7:16:58", "remaining_time": "8:03:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12000, "total_steps": 25254, "loss": 0.1223, "learning_rate": 2.821652665278499e-05, "epoch": 1.4255167498218104, "percentage": 47.52, "elapsed_time": "7:17:20", "remaining_time": "8:03:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12010, "total_steps": 25254, "loss": 0.1202, "learning_rate": 2.818472819549908e-05, "epoch": 1.4267046804466619, "percentage": 47.56, "elapsed_time": "7:17:41", "remaining_time": "8:02:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12020, "total_steps": 25254, "loss": 0.1182, "learning_rate": 2.8152924500017564e-05, "epoch": 1.4278926110715133, "percentage": 47.6, "elapsed_time": "7:18:03", "remaining_time": "8:02:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12030, "total_steps": 25254, "loss": 0.1185, "learning_rate": 2.8121115618650705e-05, "epoch": 1.429080541696365, "percentage": 47.64, "elapsed_time": "7:18:25", "remaining_time": "8:01:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12040, "total_steps": 25254, "loss": 0.1167, "learning_rate": 2.80893016037173e-05, "epoch": 1.4302684723212165, "percentage": 47.68, "elapsed_time": "7:18:47", "remaining_time": "8:01:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12050, "total_steps": 25254, "loss": 0.1205, "learning_rate": 2.8057482507544593e-05, "epoch": 1.431456402946068, "percentage": 47.72, "elapsed_time": "7:19:09", "remaining_time": "8:01:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12060, "total_steps": 25254, "loss": 0.121, "learning_rate": 2.8025658382468163e-05, "epoch": 1.4326443335709196, "percentage": 47.75, "elapsed_time": "7:19:30", "remaining_time": "8:00:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12070, "total_steps": 25254, "loss": 0.1171, "learning_rate": 2.7993829280831902e-05, "epoch": 1.433832264195771, "percentage": 47.79, "elapsed_time": "7:19:52", "remaining_time": "8:00:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12080, "total_steps": 25254, "loss": 0.1199, "learning_rate": 2.7961995254987845e-05, "epoch": 1.4350201948206225, "percentage": 47.83, "elapsed_time": "7:20:14", "remaining_time": "8:00:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12090, "total_steps": 25254, "loss": 0.1222, "learning_rate": 2.793015635729616e-05, "epoch": 1.436208125445474, "percentage": 47.87, "elapsed_time": "7:20:35", "remaining_time": "7:59:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12100, "total_steps": 25254, "loss": 0.1176, "learning_rate": 2.789831264012499e-05, "epoch": 1.4373960560703254, "percentage": 47.91, "elapsed_time": "7:20:56", "remaining_time": "7:59:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12110, "total_steps": 25254, "loss": 0.118, "learning_rate": 2.7866464155850454e-05, "epoch": 1.438583986695177, "percentage": 47.95, "elapsed_time": "7:21:19", "remaining_time": "7:59:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12120, "total_steps": 25254, "loss": 0.1189, "learning_rate": 2.783461095685647e-05, "epoch": 1.4397719173200285, "percentage": 47.99, "elapsed_time": "7:21:40", "remaining_time": "7:58:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12130, "total_steps": 25254, "loss": 0.1201, "learning_rate": 2.7802753095534727e-05, "epoch": 1.44095984794488, "percentage": 48.03, "elapsed_time": "7:22:02", "remaining_time": "7:58:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12140, "total_steps": 25254, "loss": 0.1189, "learning_rate": 2.7770890624284585e-05, "epoch": 1.4421477785697316, "percentage": 48.07, "elapsed_time": "7:22:25", "remaining_time": "7:57:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12150, "total_steps": 25254, "loss": 0.1199, "learning_rate": 2.773902359551298e-05, "epoch": 1.443335709194583, "percentage": 48.11, "elapsed_time": "7:22:46", "remaining_time": "7:57:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12160, "total_steps": 25254, "loss": 0.1189, "learning_rate": 2.7707152061634356e-05, "epoch": 1.4445236398194345, "percentage": 48.15, "elapsed_time": "7:23:08", "remaining_time": "7:57:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12170, "total_steps": 25254, "loss": 0.1208, "learning_rate": 2.7675276075070555e-05, "epoch": 1.445711570444286, "percentage": 48.19, "elapsed_time": "7:23:30", "remaining_time": "7:56:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12180, "total_steps": 25254, "loss": 0.1187, "learning_rate": 2.764339568825074e-05, "epoch": 1.4468995010691375, "percentage": 48.23, "elapsed_time": "7:23:51", "remaining_time": "7:56:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12190, "total_steps": 25254, "loss": 0.1171, "learning_rate": 2.761151095361132e-05, "epoch": 1.4480874316939891, "percentage": 48.27, "elapsed_time": "7:24:13", "remaining_time": "7:56:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12200, "total_steps": 25254, "loss": 0.1182, "learning_rate": 2.757962192359585e-05, "epoch": 1.4492753623188406, "percentage": 48.31, "elapsed_time": "7:24:35", "remaining_time": "7:55:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12210, "total_steps": 25254, "loss": 0.1206, "learning_rate": 2.7547728650654962e-05, "epoch": 1.450463292943692, "percentage": 48.35, "elapsed_time": "7:24:56", "remaining_time": "7:55:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12220, "total_steps": 25254, "loss": 0.1215, "learning_rate": 2.751583118724625e-05, "epoch": 1.4516512235685437, "percentage": 48.39, "elapsed_time": "7:25:18", "remaining_time": "7:54:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12230, "total_steps": 25254, "loss": 0.1215, "learning_rate": 2.7483929585834213e-05, "epoch": 1.4528391541933952, "percentage": 48.43, "elapsed_time": "7:25:40", "remaining_time": "7:54:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12240, "total_steps": 25254, "loss": 0.1206, "learning_rate": 2.7452023898890138e-05, "epoch": 1.4540270848182466, "percentage": 48.47, "elapsed_time": "7:26:01", "remaining_time": "7:54:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12250, "total_steps": 25254, "loss": 0.1202, "learning_rate": 2.7420114178892064e-05, "epoch": 1.455215015443098, "percentage": 48.51, "elapsed_time": "7:26:23", "remaining_time": "7:53:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12260, "total_steps": 25254, "loss": 0.1179, "learning_rate": 2.738820047832463e-05, "epoch": 1.4564029460679495, "percentage": 48.55, "elapsed_time": "7:26:45", "remaining_time": "7:53:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12270, "total_steps": 25254, "loss": 0.1178, "learning_rate": 2.7356282849679043e-05, "epoch": 1.4575908766928012, "percentage": 48.59, "elapsed_time": "7:27:07", "remaining_time": "7:53:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12280, "total_steps": 25254, "loss": 0.1183, "learning_rate": 2.732436134545296e-05, "epoch": 1.4587788073176526, "percentage": 48.63, "elapsed_time": "7:27:29", "remaining_time": "7:52:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12290, "total_steps": 25254, "loss": 0.1211, "learning_rate": 2.729243601815042e-05, "epoch": 1.459966737942504, "percentage": 48.67, "elapsed_time": "7:27:51", "remaining_time": "7:52:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12300, "total_steps": 25254, "loss": 0.1189, "learning_rate": 2.726050692028174e-05, "epoch": 1.4611546685673558, "percentage": 48.71, "elapsed_time": "7:28:13", "remaining_time": "7:52:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12310, "total_steps": 25254, "loss": 0.1176, "learning_rate": 2.7228574104363462e-05, "epoch": 1.4623425991922072, "percentage": 48.74, "elapsed_time": "7:28:35", "remaining_time": "7:51:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12320, "total_steps": 25254, "loss": 0.119, "learning_rate": 2.719663762291821e-05, "epoch": 1.4635305298170587, "percentage": 48.78, "elapsed_time": "7:28:57", "remaining_time": "7:51:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12330, "total_steps": 25254, "loss": 0.1165, "learning_rate": 2.7164697528474663e-05, "epoch": 1.4647184604419101, "percentage": 48.82, "elapsed_time": "7:29:19", "remaining_time": "7:50:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12340, "total_steps": 25254, "loss": 0.1209, "learning_rate": 2.7132753873567434e-05, "epoch": 1.4659063910667616, "percentage": 48.86, "elapsed_time": "7:29:41", "remaining_time": "7:50:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12350, "total_steps": 25254, "loss": 0.119, "learning_rate": 2.7100806710736994e-05, "epoch": 1.4670943216916132, "percentage": 48.9, "elapsed_time": "7:30:04", "remaining_time": "7:50:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12360, "total_steps": 25254, "loss": 0.1148, "learning_rate": 2.7068856092529565e-05, "epoch": 1.4682822523164647, "percentage": 48.94, "elapsed_time": "7:30:25", "remaining_time": "7:49:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12370, "total_steps": 25254, "loss": 0.1178, "learning_rate": 2.703690207149709e-05, "epoch": 1.4694701829413161, "percentage": 48.98, "elapsed_time": "7:30:47", "remaining_time": "7:49:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12380, "total_steps": 25254, "loss": 0.1184, "learning_rate": 2.7004944700197075e-05, "epoch": 1.4706581135661678, "percentage": 49.02, "elapsed_time": "7:31:09", "remaining_time": "7:49:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12390, "total_steps": 25254, "loss": 0.1196, "learning_rate": 2.6972984031192554e-05, "epoch": 1.4718460441910193, "percentage": 49.06, "elapsed_time": "7:31:31", "remaining_time": "7:48:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12400, "total_steps": 25254, "loss": 0.1241, "learning_rate": 2.6941020117051984e-05, "epoch": 1.4730339748158707, "percentage": 49.1, "elapsed_time": "7:31:53", "remaining_time": "7:48:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12410, "total_steps": 25254, "loss": 0.1179, "learning_rate": 2.6909053010349155e-05, "epoch": 1.4742219054407222, "percentage": 49.14, "elapsed_time": "7:32:15", "remaining_time": "7:48:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12420, "total_steps": 25254, "loss": 0.12, "learning_rate": 2.6877082763663104e-05, "epoch": 1.4754098360655736, "percentage": 49.18, "elapsed_time": "7:32:37", "remaining_time": "7:47:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12430, "total_steps": 25254, "loss": 0.12, "learning_rate": 2.6845109429578037e-05, "epoch": 1.4765977666904253, "percentage": 49.22, "elapsed_time": "7:33:00", "remaining_time": "7:47:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12440, "total_steps": 25254, "loss": 0.1179, "learning_rate": 2.6813133060683242e-05, "epoch": 1.4777856973152768, "percentage": 49.26, "elapsed_time": "7:33:22", "remaining_time": "7:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12450, "total_steps": 25254, "loss": 0.117, "learning_rate": 2.6781153709572997e-05, "epoch": 1.4789736279401282, "percentage": 49.3, "elapsed_time": "7:33:44", "remaining_time": "7:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12460, "total_steps": 25254, "loss": 0.1149, "learning_rate": 2.674917142884648e-05, "epoch": 1.4801615585649799, "percentage": 49.34, "elapsed_time": "7:34:05", "remaining_time": "7:46:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12470, "total_steps": 25254, "loss": 0.1166, "learning_rate": 2.6717186271107698e-05, "epoch": 1.4813494891898313, "percentage": 49.38, "elapsed_time": "7:34:27", "remaining_time": "7:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12480, "total_steps": 25254, "loss": 0.1166, "learning_rate": 2.6685198288965372e-05, "epoch": 1.4825374198146828, "percentage": 49.42, "elapsed_time": "7:34:49", "remaining_time": "7:45:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12490, "total_steps": 25254, "loss": 0.1184, "learning_rate": 2.665320753503289e-05, "epoch": 1.4837253504395345, "percentage": 49.46, "elapsed_time": "7:35:10", "remaining_time": "7:45:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12500, "total_steps": 25254, "loss": 0.1172, "learning_rate": 2.662121406192819e-05, "epoch": 1.484913281064386, "percentage": 49.5, "elapsed_time": "7:35:32", "remaining_time": "7:44:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12510, "total_steps": 25254, "loss": 0.1223, "learning_rate": 2.6589217922273667e-05, "epoch": 1.4861012116892374, "percentage": 49.54, "elapsed_time": "7:35:54", "remaining_time": "7:44:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12520, "total_steps": 25254, "loss": 0.1177, "learning_rate": 2.6557219168696135e-05, "epoch": 1.4872891423140888, "percentage": 49.58, "elapsed_time": "7:36:16", "remaining_time": "7:44:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12530, "total_steps": 25254, "loss": 0.1218, "learning_rate": 2.6525217853826668e-05, "epoch": 1.4884770729389403, "percentage": 49.62, "elapsed_time": "7:36:38", "remaining_time": "7:43:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12540, "total_steps": 25254, "loss": 0.118, "learning_rate": 2.649321403030059e-05, "epoch": 1.489665003563792, "percentage": 49.66, "elapsed_time": "7:37:01", "remaining_time": "7:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12550, "total_steps": 25254, "loss": 0.1176, "learning_rate": 2.646120775075732e-05, "epoch": 1.4908529341886434, "percentage": 49.7, "elapsed_time": "7:37:22", "remaining_time": "7:42:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12560, "total_steps": 25254, "loss": 0.1208, "learning_rate": 2.6429199067840348e-05, "epoch": 1.4920408648134948, "percentage": 49.73, "elapsed_time": "7:37:43", "remaining_time": "7:42:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12570, "total_steps": 25254, "loss": 0.1174, "learning_rate": 2.639718803419709e-05, "epoch": 1.4932287954383465, "percentage": 49.77, "elapsed_time": "7:38:05", "remaining_time": "7:42:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12580, "total_steps": 25254, "loss": 0.1161, "learning_rate": 2.6365174702478838e-05, "epoch": 1.494416726063198, "percentage": 49.81, "elapsed_time": "7:38:27", "remaining_time": "7:41:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12590, "total_steps": 25254, "loss": 0.1183, "learning_rate": 2.6333159125340668e-05, "epoch": 1.4956046566880494, "percentage": 49.85, "elapsed_time": "7:38:49", "remaining_time": "7:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12600, "total_steps": 25254, "loss": 0.1194, "learning_rate": 2.630114135544134e-05, "epoch": 1.4967925873129009, "percentage": 49.89, "elapsed_time": "7:39:11", "remaining_time": "7:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12610, "total_steps": 25254, "loss": 0.1207, "learning_rate": 2.6269121445443236e-05, "epoch": 1.4979805179377523, "percentage": 49.93, "elapsed_time": "7:39:34", "remaining_time": "7:40:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12620, "total_steps": 25254, "loss": 0.1178, "learning_rate": 2.623709944801223e-05, "epoch": 1.499168448562604, "percentage": 49.97, "elapsed_time": "7:39:56", "remaining_time": "7:40:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12630, "total_steps": 25254, "loss": 0.1199, "learning_rate": 2.6205075415817672e-05, "epoch": 1.5003563791874555, "percentage": 50.01, "elapsed_time": "7:40:17", "remaining_time": "7:40:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12640, "total_steps": 25254, "loss": 0.121, "learning_rate": 2.6173049401532217e-05, "epoch": 1.501544309812307, "percentage": 50.05, "elapsed_time": "7:40:39", "remaining_time": "7:39:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12650, "total_steps": 25254, "loss": 0.1189, "learning_rate": 2.6141021457831804e-05, "epoch": 1.5027322404371586, "percentage": 50.09, "elapsed_time": "7:41:01", "remaining_time": "7:39:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12660, "total_steps": 25254, "loss": 0.1228, "learning_rate": 2.6108991637395534e-05, "epoch": 1.5039201710620098, "percentage": 50.13, "elapsed_time": "7:41:23", "remaining_time": "7:38:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12670, "total_steps": 25254, "loss": 0.1184, "learning_rate": 2.6076959992905613e-05, "epoch": 1.5051081016868615, "percentage": 50.17, "elapsed_time": "7:41:46", "remaining_time": "7:38:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12680, "total_steps": 25254, "loss": 0.1189, "learning_rate": 2.604492657704722e-05, "epoch": 1.5062960323117132, "percentage": 50.21, "elapsed_time": "7:42:09", "remaining_time": "7:38:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12690, "total_steps": 25254, "loss": 0.1196, "learning_rate": 2.6012891442508458e-05, "epoch": 1.5074839629365644, "percentage": 50.25, "elapsed_time": "7:42:30", "remaining_time": "7:37:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12700, "total_steps": 25254, "loss": 0.1207, "learning_rate": 2.5980854641980272e-05, "epoch": 1.508671893561416, "percentage": 50.29, "elapsed_time": "7:42:51", "remaining_time": "7:37:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12710, "total_steps": 25254, "loss": 0.1196, "learning_rate": 2.5948816228156336e-05, "epoch": 1.5098598241862675, "percentage": 50.33, "elapsed_time": "7:43:13", "remaining_time": "7:37:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12720, "total_steps": 25254, "loss": 0.1186, "learning_rate": 2.5916776253732965e-05, "epoch": 1.511047754811119, "percentage": 50.37, "elapsed_time": "7:43:35", "remaining_time": "7:36:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12730, "total_steps": 25254, "loss": 0.1158, "learning_rate": 2.588473477140907e-05, "epoch": 1.5122356854359706, "percentage": 50.41, "elapsed_time": "7:43:56", "remaining_time": "7:36:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12740, "total_steps": 25254, "loss": 0.1187, "learning_rate": 2.5852691833886013e-05, "epoch": 1.513423616060822, "percentage": 50.45, "elapsed_time": "7:44:18", "remaining_time": "7:36:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12750, "total_steps": 25254, "loss": 0.1166, "learning_rate": 2.5820647493867568e-05, "epoch": 1.5146115466856735, "percentage": 50.49, "elapsed_time": "7:44:40", "remaining_time": "7:35:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12760, "total_steps": 25254, "loss": 0.1183, "learning_rate": 2.5788601804059793e-05, "epoch": 1.5157994773105252, "percentage": 50.53, "elapsed_time": "7:45:02", "remaining_time": "7:35:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12770, "total_steps": 25254, "loss": 0.1184, "learning_rate": 2.5756554817171e-05, "epoch": 1.5169874079353765, "percentage": 50.57, "elapsed_time": "7:45:24", "remaining_time": "7:34:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12780, "total_steps": 25254, "loss": 0.1162, "learning_rate": 2.5724506585911616e-05, "epoch": 1.5181753385602281, "percentage": 50.61, "elapsed_time": "7:45:46", "remaining_time": "7:34:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12790, "total_steps": 25254, "loss": 0.1194, "learning_rate": 2.569245716299411e-05, "epoch": 1.5193632691850796, "percentage": 50.65, "elapsed_time": "7:46:07", "remaining_time": "7:34:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12800, "total_steps": 25254, "loss": 0.1191, "learning_rate": 2.566040660113292e-05, "epoch": 1.520551199809931, "percentage": 50.69, "elapsed_time": "7:46:29", "remaining_time": "7:33:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12810, "total_steps": 25254, "loss": 0.1208, "learning_rate": 2.5628354953044343e-05, "epoch": 1.5217391304347827, "percentage": 50.72, "elapsed_time": "7:46:51", "remaining_time": "7:33:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12820, "total_steps": 25254, "loss": 0.1191, "learning_rate": 2.5596302271446487e-05, "epoch": 1.5229270610596342, "percentage": 50.76, "elapsed_time": "7:47:13", "remaining_time": "7:33:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12830, "total_steps": 25254, "loss": 0.1172, "learning_rate": 2.556424860905915e-05, "epoch": 1.5241149916844856, "percentage": 50.8, "elapsed_time": "7:47:34", "remaining_time": "7:32:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12840, "total_steps": 25254, "loss": 0.1188, "learning_rate": 2.5532194018603726e-05, "epoch": 1.5253029223093373, "percentage": 50.84, "elapsed_time": "7:47:57", "remaining_time": "7:32:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12850, "total_steps": 25254, "loss": 0.1161, "learning_rate": 2.550013855280316e-05, "epoch": 1.5264908529341885, "percentage": 50.88, "elapsed_time": "7:48:19", "remaining_time": "7:32:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12860, "total_steps": 25254, "loss": 0.116, "learning_rate": 2.546808226438181e-05, "epoch": 1.5276787835590402, "percentage": 50.92, "elapsed_time": "7:48:40", "remaining_time": "7:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12870, "total_steps": 25254, "loss": 0.1155, "learning_rate": 2.5436025206065423e-05, "epoch": 1.5288667141838916, "percentage": 50.96, "elapsed_time": "7:49:03", "remaining_time": "7:31:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12880, "total_steps": 25254, "loss": 0.1208, "learning_rate": 2.5403967430580978e-05, "epoch": 1.530054644808743, "percentage": 51.0, "elapsed_time": "7:49:24", "remaining_time": "7:30:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12890, "total_steps": 25254, "loss": 0.1187, "learning_rate": 2.5371908990656655e-05, "epoch": 1.5312425754335948, "percentage": 51.04, "elapsed_time": "7:49:46", "remaining_time": "7:30:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12900, "total_steps": 25254, "loss": 0.1175, "learning_rate": 2.533984993902172e-05, "epoch": 1.5324305060584462, "percentage": 51.08, "elapsed_time": "7:50:08", "remaining_time": "7:30:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12910, "total_steps": 25254, "loss": 0.1213, "learning_rate": 2.530779032840644e-05, "epoch": 1.5336184366832977, "percentage": 51.12, "elapsed_time": "7:50:30", "remaining_time": "7:29:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12920, "total_steps": 25254, "loss": 0.1175, "learning_rate": 2.5275730211542008e-05, "epoch": 1.5348063673081493, "percentage": 51.16, "elapsed_time": "7:50:52", "remaining_time": "7:29:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12930, "total_steps": 25254, "loss": 0.1166, "learning_rate": 2.524366964116045e-05, "epoch": 1.5359942979330006, "percentage": 51.2, "elapsed_time": "7:51:14", "remaining_time": "7:29:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12940, "total_steps": 25254, "loss": 0.1172, "learning_rate": 2.5211608669994536e-05, "epoch": 1.5371822285578522, "percentage": 51.24, "elapsed_time": "7:51:36", "remaining_time": "7:28:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12950, "total_steps": 25254, "loss": 0.1177, "learning_rate": 2.517954735077769e-05, "epoch": 1.5383701591827037, "percentage": 51.28, "elapsed_time": "7:51:58", "remaining_time": "7:28:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12960, "total_steps": 25254, "loss": 0.1162, "learning_rate": 2.5147485736243913e-05, "epoch": 1.5395580898075552, "percentage": 51.32, "elapsed_time": "7:52:20", "remaining_time": "7:28:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12970, "total_steps": 25254, "loss": 0.1143, "learning_rate": 2.511542387912771e-05, "epoch": 1.5407460204324068, "percentage": 51.36, "elapsed_time": "7:52:42", "remaining_time": "7:27:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12980, "total_steps": 25254, "loss": 0.1172, "learning_rate": 2.5083361832163942e-05, "epoch": 1.5419339510572583, "percentage": 51.4, "elapsed_time": "7:53:03", "remaining_time": "7:27:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 12990, "total_steps": 25254, "loss": 0.1185, "learning_rate": 2.505129964808782e-05, "epoch": 1.5431218816821097, "percentage": 51.44, "elapsed_time": "7:53:26", "remaining_time": "7:26:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13000, "total_steps": 25254, "loss": 0.1161, "learning_rate": 2.501923737963477e-05, "epoch": 1.5443098123069614, "percentage": 51.48, "elapsed_time": "7:53:47", "remaining_time": "7:26:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13010, "total_steps": 25254, "loss": 0.1156, "learning_rate": 2.498717507954035e-05, "epoch": 1.5454977429318126, "percentage": 51.52, "elapsed_time": "7:54:10", "remaining_time": "7:26:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13020, "total_steps": 25254, "loss": 0.1166, "learning_rate": 2.495511280054018e-05, "epoch": 1.5466856735566643, "percentage": 51.56, "elapsed_time": "7:54:31", "remaining_time": "7:25:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13030, "total_steps": 25254, "loss": 0.1222, "learning_rate": 2.4923050595369825e-05, "epoch": 1.5478736041815158, "percentage": 51.6, "elapsed_time": "7:54:53", "remaining_time": "7:25:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13040, "total_steps": 25254, "loss": 0.1214, "learning_rate": 2.4890988516764765e-05, "epoch": 1.5490615348063672, "percentage": 51.64, "elapsed_time": "7:55:15", "remaining_time": "7:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13050, "total_steps": 25254, "loss": 0.1184, "learning_rate": 2.4858926617460243e-05, "epoch": 1.5502494654312189, "percentage": 51.67, "elapsed_time": "7:55:36", "remaining_time": "7:24:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13060, "total_steps": 25254, "loss": 0.1201, "learning_rate": 2.4826864950191216e-05, "epoch": 1.5514373960560703, "percentage": 51.71, "elapsed_time": "7:55:58", "remaining_time": "7:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13070, "total_steps": 25254, "loss": 0.121, "learning_rate": 2.479480356769225e-05, "epoch": 1.5526253266809218, "percentage": 51.75, "elapsed_time": "7:56:20", "remaining_time": "7:24:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13080, "total_steps": 25254, "loss": 0.1183, "learning_rate": 2.476274252269745e-05, "epoch": 1.5538132573057735, "percentage": 51.79, "elapsed_time": "7:56:42", "remaining_time": "7:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13090, "total_steps": 25254, "loss": 0.1204, "learning_rate": 2.4730681867940375e-05, "epoch": 1.5550011879306247, "percentage": 51.83, "elapsed_time": "7:57:04", "remaining_time": "7:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13100, "total_steps": 25254, "loss": 0.1174, "learning_rate": 2.4698621656153932e-05, "epoch": 1.5561891185554764, "percentage": 51.87, "elapsed_time": "7:57:25", "remaining_time": "7:22:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13110, "total_steps": 25254, "loss": 0.1167, "learning_rate": 2.4666561940070303e-05, "epoch": 1.5573770491803278, "percentage": 51.91, "elapsed_time": "7:57:47", "remaining_time": "7:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13120, "total_steps": 25254, "loss": 0.1175, "learning_rate": 2.4634502772420845e-05, "epoch": 1.5585649798051793, "percentage": 51.95, "elapsed_time": "7:58:09", "remaining_time": "7:22:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13130, "total_steps": 25254, "loss": 0.1166, "learning_rate": 2.4602444205936014e-05, "epoch": 1.559752910430031, "percentage": 51.99, "elapsed_time": "7:58:31", "remaining_time": "7:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13140, "total_steps": 25254, "loss": 0.1147, "learning_rate": 2.4570386293345317e-05, "epoch": 1.5609408410548824, "percentage": 52.03, "elapsed_time": "7:58:53", "remaining_time": "7:21:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13150, "total_steps": 25254, "loss": 0.119, "learning_rate": 2.4538329087377118e-05, "epoch": 1.5621287716797339, "percentage": 52.07, "elapsed_time": "7:59:17", "remaining_time": "7:21:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13160, "total_steps": 25254, "loss": 0.1166, "learning_rate": 2.4506272640758666e-05, "epoch": 1.5633167023045855, "percentage": 52.11, "elapsed_time": "7:59:39", "remaining_time": "7:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13170, "total_steps": 25254, "loss": 0.1164, "learning_rate": 2.4474217006215948e-05, "epoch": 1.5645046329294368, "percentage": 52.15, "elapsed_time": "8:00:00", "remaining_time": "7:20:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13180, "total_steps": 25254, "loss": 0.1164, "learning_rate": 2.4442162236473605e-05, "epoch": 1.5656925635542884, "percentage": 52.19, "elapsed_time": "8:00:22", "remaining_time": "7:20:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13190, "total_steps": 25254, "loss": 0.117, "learning_rate": 2.4410108384254884e-05, "epoch": 1.56688049417914, "percentage": 52.23, "elapsed_time": "8:00:43", "remaining_time": "7:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13200, "total_steps": 25254, "loss": 0.1185, "learning_rate": 2.4378055502281498e-05, "epoch": 1.5680684248039913, "percentage": 52.27, "elapsed_time": "8:01:05", "remaining_time": "7:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13210, "total_steps": 25254, "loss": 0.1192, "learning_rate": 2.434600364327357e-05, "epoch": 1.569256355428843, "percentage": 52.31, "elapsed_time": "8:01:27", "remaining_time": "7:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13220, "total_steps": 25254, "loss": 0.1169, "learning_rate": 2.4313952859949536e-05, "epoch": 1.5704442860536945, "percentage": 52.35, "elapsed_time": "8:01:49", "remaining_time": "7:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13230, "total_steps": 25254, "loss": 0.1156, "learning_rate": 2.4281903205026073e-05, "epoch": 1.571632216678546, "percentage": 52.39, "elapsed_time": "8:02:11", "remaining_time": "7:18:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13240, "total_steps": 25254, "loss": 0.1161, "learning_rate": 2.4249854731218004e-05, "epoch": 1.5728201473033976, "percentage": 52.43, "elapsed_time": "8:02:32", "remaining_time": "7:17:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13250, "total_steps": 25254, "loss": 0.1147, "learning_rate": 2.4217807491238194e-05, "epoch": 1.574008077928249, "percentage": 52.47, "elapsed_time": "8:02:54", "remaining_time": "7:17:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13260, "total_steps": 25254, "loss": 0.1186, "learning_rate": 2.418576153779749e-05, "epoch": 1.5751960085531005, "percentage": 52.51, "elapsed_time": "8:03:16", "remaining_time": "7:17:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13270, "total_steps": 25254, "loss": 0.1188, "learning_rate": 2.4153716923604606e-05, "epoch": 1.5763839391779522, "percentage": 52.55, "elapsed_time": "8:03:37", "remaining_time": "7:16:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13280, "total_steps": 25254, "loss": 0.1175, "learning_rate": 2.4121673701366095e-05, "epoch": 1.5775718698028034, "percentage": 52.59, "elapsed_time": "8:03:59", "remaining_time": "7:16:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13290, "total_steps": 25254, "loss": 0.1186, "learning_rate": 2.408963192378618e-05, "epoch": 1.578759800427655, "percentage": 52.63, "elapsed_time": "8:04:21", "remaining_time": "7:16:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13300, "total_steps": 25254, "loss": 0.1159, "learning_rate": 2.4057591643566716e-05, "epoch": 1.5799477310525065, "percentage": 52.66, "elapsed_time": "8:04:42", "remaining_time": "7:15:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13310, "total_steps": 25254, "loss": 0.1166, "learning_rate": 2.4025552913407104e-05, "epoch": 1.581135661677358, "percentage": 52.7, "elapsed_time": "8:05:04", "remaining_time": "7:15:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13320, "total_steps": 25254, "loss": 0.1194, "learning_rate": 2.3993515786004184e-05, "epoch": 1.5823235923022096, "percentage": 52.74, "elapsed_time": "8:05:26", "remaining_time": "7:14:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13330, "total_steps": 25254, "loss": 0.1144, "learning_rate": 2.3961480314052183e-05, "epoch": 1.583511522927061, "percentage": 52.78, "elapsed_time": "8:05:48", "remaining_time": "7:14:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13340, "total_steps": 25254, "loss": 0.1194, "learning_rate": 2.3929446550242575e-05, "epoch": 1.5846994535519126, "percentage": 52.82, "elapsed_time": "8:06:09", "remaining_time": "7:14:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13350, "total_steps": 25254, "loss": 0.1154, "learning_rate": 2.3897414547264048e-05, "epoch": 1.5858873841767642, "percentage": 52.86, "elapsed_time": "8:06:31", "remaining_time": "7:13:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13360, "total_steps": 25254, "loss": 0.1153, "learning_rate": 2.3865384357802363e-05, "epoch": 1.5870753148016155, "percentage": 52.9, "elapsed_time": "8:06:54", "remaining_time": "7:13:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13370, "total_steps": 25254, "loss": 0.1173, "learning_rate": 2.3833356034540354e-05, "epoch": 1.5882632454264671, "percentage": 52.94, "elapsed_time": "8:07:15", "remaining_time": "7:13:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13380, "total_steps": 25254, "loss": 0.1171, "learning_rate": 2.3801329630157735e-05, "epoch": 1.5894511760513186, "percentage": 52.98, "elapsed_time": "8:07:36", "remaining_time": "7:12:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13390, "total_steps": 25254, "loss": 0.1175, "learning_rate": 2.3769305197331077e-05, "epoch": 1.59063910667617, "percentage": 53.02, "elapsed_time": "8:07:58", "remaining_time": "7:12:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13400, "total_steps": 25254, "loss": 0.1158, "learning_rate": 2.373728278873371e-05, "epoch": 1.5918270373010217, "percentage": 53.06, "elapsed_time": "8:08:20", "remaining_time": "7:12:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13410, "total_steps": 25254, "loss": 0.1176, "learning_rate": 2.3705262457035642e-05, "epoch": 1.5930149679258732, "percentage": 53.1, "elapsed_time": "8:08:42", "remaining_time": "7:11:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13420, "total_steps": 25254, "loss": 0.1187, "learning_rate": 2.3673244254903455e-05, "epoch": 1.5942028985507246, "percentage": 53.14, "elapsed_time": "8:09:04", "remaining_time": "7:11:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13430, "total_steps": 25254, "loss": 0.1176, "learning_rate": 2.3641228235000238e-05, "epoch": 1.5953908291755763, "percentage": 53.18, "elapsed_time": "8:09:27", "remaining_time": "7:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13440, "total_steps": 25254, "loss": 0.1179, "learning_rate": 2.360921444998548e-05, "epoch": 1.5965787598004275, "percentage": 53.22, "elapsed_time": "8:09:49", "remaining_time": "7:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13450, "total_steps": 25254, "loss": 0.1164, "learning_rate": 2.3577202952514994e-05, "epoch": 1.5977666904252792, "percentage": 53.26, "elapsed_time": "8:10:11", "remaining_time": "7:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13460, "total_steps": 25254, "loss": 0.1175, "learning_rate": 2.354519379524084e-05, "epoch": 1.5989546210501306, "percentage": 53.3, "elapsed_time": "8:10:33", "remaining_time": "7:09:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13470, "total_steps": 25254, "loss": 0.117, "learning_rate": 2.351318703081123e-05, "epoch": 1.600142551674982, "percentage": 53.34, "elapsed_time": "8:10:56", "remaining_time": "7:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13480, "total_steps": 25254, "loss": 0.1151, "learning_rate": 2.348118271187043e-05, "epoch": 1.6013304822998338, "percentage": 53.38, "elapsed_time": "8:11:18", "remaining_time": "7:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13490, "total_steps": 25254, "loss": 0.1197, "learning_rate": 2.344918089105869e-05, "epoch": 1.6025184129246852, "percentage": 53.42, "elapsed_time": "8:11:40", "remaining_time": "7:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13500, "total_steps": 25254, "loss": 0.1176, "learning_rate": 2.3417181621012144e-05, "epoch": 1.6037063435495367, "percentage": 53.46, "elapsed_time": "8:12:02", "remaining_time": "7:08:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13510, "total_steps": 25254, "loss": 0.1165, "learning_rate": 2.3385184954362725e-05, "epoch": 1.6048942741743883, "percentage": 53.5, "elapsed_time": "8:12:24", "remaining_time": "7:08:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13520, "total_steps": 25254, "loss": 0.1174, "learning_rate": 2.3353190943738128e-05, "epoch": 1.6060822047992396, "percentage": 53.54, "elapsed_time": "8:12:45", "remaining_time": "7:07:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13530, "total_steps": 25254, "loss": 0.1138, "learning_rate": 2.332119964176162e-05, "epoch": 1.6072701354240913, "percentage": 53.58, "elapsed_time": "8:13:07", "remaining_time": "7:07:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13540, "total_steps": 25254, "loss": 0.1163, "learning_rate": 2.328921110105205e-05, "epoch": 1.6084580660489427, "percentage": 53.62, "elapsed_time": "8:13:28", "remaining_time": "7:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13550, "total_steps": 25254, "loss": 0.1173, "learning_rate": 2.3257225374223706e-05, "epoch": 1.6096459966737942, "percentage": 53.65, "elapsed_time": "8:13:50", "remaining_time": "7:06:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13560, "total_steps": 25254, "loss": 0.1167, "learning_rate": 2.3225242513886267e-05, "epoch": 1.6108339272986458, "percentage": 53.69, "elapsed_time": "8:14:13", "remaining_time": "7:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13570, "total_steps": 25254, "loss": 0.119, "learning_rate": 2.319326257264468e-05, "epoch": 1.6120218579234973, "percentage": 53.73, "elapsed_time": "8:14:35", "remaining_time": "7:05:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13580, "total_steps": 25254, "loss": 0.1151, "learning_rate": 2.3161285603099097e-05, "epoch": 1.6132097885483487, "percentage": 53.77, "elapsed_time": "8:14:57", "remaining_time": "7:05:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13590, "total_steps": 25254, "loss": 0.1125, "learning_rate": 2.3129311657844783e-05, "epoch": 1.6143977191732004, "percentage": 53.81, "elapsed_time": "8:15:19", "remaining_time": "7:05:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13600, "total_steps": 25254, "loss": 0.1188, "learning_rate": 2.309734078947202e-05, "epoch": 1.6155856497980516, "percentage": 53.85, "elapsed_time": "8:15:41", "remaining_time": "7:04:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13610, "total_steps": 25254, "loss": 0.1178, "learning_rate": 2.3065373050566055e-05, "epoch": 1.6167735804229033, "percentage": 53.89, "elapsed_time": "8:16:03", "remaining_time": "7:04:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13620, "total_steps": 25254, "loss": 0.1143, "learning_rate": 2.303340849370696e-05, "epoch": 1.6179615110477548, "percentage": 53.93, "elapsed_time": "8:16:25", "remaining_time": "7:04:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13630, "total_steps": 25254, "loss": 0.1178, "learning_rate": 2.3001447171469584e-05, "epoch": 1.6191494416726062, "percentage": 53.97, "elapsed_time": "8:16:47", "remaining_time": "7:03:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13640, "total_steps": 25254, "loss": 0.1166, "learning_rate": 2.2969489136423456e-05, "epoch": 1.620337372297458, "percentage": 54.01, "elapsed_time": "8:17:08", "remaining_time": "7:03:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13650, "total_steps": 25254, "loss": 0.1146, "learning_rate": 2.2937534441132687e-05, "epoch": 1.6215253029223093, "percentage": 54.05, "elapsed_time": "8:17:30", "remaining_time": "7:02:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13660, "total_steps": 25254, "loss": 0.1173, "learning_rate": 2.2905583138155922e-05, "epoch": 1.6227132335471608, "percentage": 54.09, "elapsed_time": "8:17:52", "remaining_time": "7:02:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13670, "total_steps": 25254, "loss": 0.1156, "learning_rate": 2.28736352800462e-05, "epoch": 1.6239011641720125, "percentage": 54.13, "elapsed_time": "8:18:14", "remaining_time": "7:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13680, "total_steps": 25254, "loss": 0.1144, "learning_rate": 2.2841690919350907e-05, "epoch": 1.6250890947968637, "percentage": 54.17, "elapsed_time": "8:18:36", "remaining_time": "7:01:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13690, "total_steps": 25254, "loss": 0.1141, "learning_rate": 2.2809750108611656e-05, "epoch": 1.6262770254217154, "percentage": 54.21, "elapsed_time": "8:18:58", "remaining_time": "7:01:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13700, "total_steps": 25254, "loss": 0.1143, "learning_rate": 2.2777812900364263e-05, "epoch": 1.627464956046567, "percentage": 54.25, "elapsed_time": "8:19:20", "remaining_time": "7:01:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13710, "total_steps": 25254, "loss": 0.1166, "learning_rate": 2.2745879347138582e-05, "epoch": 1.6286528866714183, "percentage": 54.29, "elapsed_time": "8:19:41", "remaining_time": "7:00:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13720, "total_steps": 25254, "loss": 0.1144, "learning_rate": 2.2713949501458477e-05, "epoch": 1.62984081729627, "percentage": 54.33, "elapsed_time": "8:20:03", "remaining_time": "7:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13730, "total_steps": 25254, "loss": 0.1158, "learning_rate": 2.268202341584168e-05, "epoch": 1.6310287479211214, "percentage": 54.37, "elapsed_time": "8:20:25", "remaining_time": "7:00:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13740, "total_steps": 25254, "loss": 0.1207, "learning_rate": 2.2650101142799775e-05, "epoch": 1.6322166785459729, "percentage": 54.41, "elapsed_time": "8:20:47", "remaining_time": "6:59:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13750, "total_steps": 25254, "loss": 0.117, "learning_rate": 2.2618182734838074e-05, "epoch": 1.6334046091708245, "percentage": 54.45, "elapsed_time": "8:21:08", "remaining_time": "6:59:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13760, "total_steps": 25254, "loss": 0.117, "learning_rate": 2.2586268244455504e-05, "epoch": 1.634592539795676, "percentage": 54.49, "elapsed_time": "8:21:30", "remaining_time": "6:58:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13770, "total_steps": 25254, "loss": 0.1164, "learning_rate": 2.2554357724144575e-05, "epoch": 1.6357804704205274, "percentage": 54.53, "elapsed_time": "8:21:51", "remaining_time": "6:58:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13780, "total_steps": 25254, "loss": 0.1146, "learning_rate": 2.252245122639125e-05, "epoch": 1.636968401045379, "percentage": 54.57, "elapsed_time": "8:22:13", "remaining_time": "6:58:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13790, "total_steps": 25254, "loss": 0.1186, "learning_rate": 2.2490548803674878e-05, "epoch": 1.6381563316702303, "percentage": 54.61, "elapsed_time": "8:22:35", "remaining_time": "6:57:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13800, "total_steps": 25254, "loss": 0.1171, "learning_rate": 2.2458650508468127e-05, "epoch": 1.639344262295082, "percentage": 54.64, "elapsed_time": "8:22:56", "remaining_time": "6:57:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13810, "total_steps": 25254, "loss": 0.1196, "learning_rate": 2.242675639323684e-05, "epoch": 1.6405321929199335, "percentage": 54.68, "elapsed_time": "8:23:18", "remaining_time": "6:57:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13820, "total_steps": 25254, "loss": 0.1158, "learning_rate": 2.239486651044002e-05, "epoch": 1.641720123544785, "percentage": 54.72, "elapsed_time": "8:23:39", "remaining_time": "6:56:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13830, "total_steps": 25254, "loss": 0.1147, "learning_rate": 2.236298091252968e-05, "epoch": 1.6429080541696366, "percentage": 54.76, "elapsed_time": "8:24:01", "remaining_time": "6:56:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13840, "total_steps": 25254, "loss": 0.1171, "learning_rate": 2.233109965195079e-05, "epoch": 1.644095984794488, "percentage": 54.8, "elapsed_time": "8:24:23", "remaining_time": "6:55:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13850, "total_steps": 25254, "loss": 0.1154, "learning_rate": 2.229922278114122e-05, "epoch": 1.6452839154193395, "percentage": 54.84, "elapsed_time": "8:24:45", "remaining_time": "6:55:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13860, "total_steps": 25254, "loss": 0.1163, "learning_rate": 2.226735035253158e-05, "epoch": 1.6464718460441912, "percentage": 54.88, "elapsed_time": "8:25:07", "remaining_time": "6:55:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13870, "total_steps": 25254, "loss": 0.1163, "learning_rate": 2.2235482418545178e-05, "epoch": 1.6476597766690424, "percentage": 54.92, "elapsed_time": "8:25:28", "remaining_time": "6:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13880, "total_steps": 25254, "loss": 0.1158, "learning_rate": 2.2203619031597945e-05, "epoch": 1.648847707293894, "percentage": 54.96, "elapsed_time": "8:25:50", "remaining_time": "6:54:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13890, "total_steps": 25254, "loss": 0.1187, "learning_rate": 2.217176024409833e-05, "epoch": 1.6500356379187455, "percentage": 55.0, "elapsed_time": "8:26:12", "remaining_time": "6:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13900, "total_steps": 25254, "loss": 0.1153, "learning_rate": 2.2139906108447218e-05, "epoch": 1.651223568543597, "percentage": 55.04, "elapsed_time": "8:26:34", "remaining_time": "6:53:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13910, "total_steps": 25254, "loss": 0.1171, "learning_rate": 2.2108056677037825e-05, "epoch": 1.6524114991684486, "percentage": 55.08, "elapsed_time": "8:26:56", "remaining_time": "6:53:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13920, "total_steps": 25254, "loss": 0.1176, "learning_rate": 2.207621200225565e-05, "epoch": 1.6535994297933, "percentage": 55.12, "elapsed_time": "8:27:18", "remaining_time": "6:53:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13930, "total_steps": 25254, "loss": 0.1148, "learning_rate": 2.2044372136478348e-05, "epoch": 1.6547873604181516, "percentage": 55.16, "elapsed_time": "8:27:40", "remaining_time": "6:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13940, "total_steps": 25254, "loss": 0.1118, "learning_rate": 2.2012537132075697e-05, "epoch": 1.6559752910430032, "percentage": 55.2, "elapsed_time": "8:28:01", "remaining_time": "6:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13950, "total_steps": 25254, "loss": 0.1149, "learning_rate": 2.1980707041409452e-05, "epoch": 1.6571632216678545, "percentage": 55.24, "elapsed_time": "8:28:23", "remaining_time": "6:51:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13960, "total_steps": 25254, "loss": 0.1166, "learning_rate": 2.1948881916833287e-05, "epoch": 1.6583511522927061, "percentage": 55.28, "elapsed_time": "8:28:45", "remaining_time": "6:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13970, "total_steps": 25254, "loss": 0.1192, "learning_rate": 2.1917061810692724e-05, "epoch": 1.6595390829175576, "percentage": 55.32, "elapsed_time": "8:29:07", "remaining_time": "6:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13980, "total_steps": 25254, "loss": 0.1145, "learning_rate": 2.1885246775325006e-05, "epoch": 1.660727013542409, "percentage": 55.36, "elapsed_time": "8:29:28", "remaining_time": "6:50:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 13990, "total_steps": 25254, "loss": 0.1146, "learning_rate": 2.1853436863059066e-05, "epoch": 1.6619149441672607, "percentage": 55.4, "elapsed_time": "8:29:50", "remaining_time": "6:50:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14000, "total_steps": 25254, "loss": 0.1135, "learning_rate": 2.1821632126215386e-05, "epoch": 1.6631028747921122, "percentage": 55.44, "elapsed_time": "8:30:12", "remaining_time": "6:50:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14010, "total_steps": 25254, "loss": 0.1182, "learning_rate": 2.178983261710595e-05, "epoch": 1.6642908054169636, "percentage": 55.48, "elapsed_time": "8:30:34", "remaining_time": "6:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14020, "total_steps": 25254, "loss": 0.1152, "learning_rate": 2.175803838803412e-05, "epoch": 1.6654787360418153, "percentage": 55.52, "elapsed_time": "8:30:56", "remaining_time": "6:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14030, "total_steps": 25254, "loss": 0.1192, "learning_rate": 2.1726249491294613e-05, "epoch": 1.6666666666666665, "percentage": 55.56, "elapsed_time": "8:31:17", "remaining_time": "6:49:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14040, "total_steps": 25254, "loss": 0.1185, "learning_rate": 2.169446597917336e-05, "epoch": 1.6678545972915182, "percentage": 55.6, "elapsed_time": "8:31:39", "remaining_time": "6:48:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14050, "total_steps": 25254, "loss": 0.1166, "learning_rate": 2.1662687903947408e-05, "epoch": 1.6690425279163696, "percentage": 55.63, "elapsed_time": "8:32:01", "remaining_time": "6:48:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14060, "total_steps": 25254, "loss": 0.1188, "learning_rate": 2.163091531788489e-05, "epoch": 1.670230458541221, "percentage": 55.67, "elapsed_time": "8:32:23", "remaining_time": "6:47:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14070, "total_steps": 25254, "loss": 0.119, "learning_rate": 2.1599148273244896e-05, "epoch": 1.6714183891660728, "percentage": 55.71, "elapsed_time": "8:32:45", "remaining_time": "6:47:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14080, "total_steps": 25254, "loss": 0.1163, "learning_rate": 2.1567386822277425e-05, "epoch": 1.6726063197909242, "percentage": 55.75, "elapsed_time": "8:33:06", "remaining_time": "6:47:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14090, "total_steps": 25254, "loss": 0.1162, "learning_rate": 2.1535631017223252e-05, "epoch": 1.6737942504157757, "percentage": 55.79, "elapsed_time": "8:33:28", "remaining_time": "6:46:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14100, "total_steps": 25254, "loss": 0.1183, "learning_rate": 2.1503880910313872e-05, "epoch": 1.6749821810406273, "percentage": 55.83, "elapsed_time": "8:33:50", "remaining_time": "6:46:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14110, "total_steps": 25254, "loss": 0.1169, "learning_rate": 2.1472136553771414e-05, "epoch": 1.6761701116654786, "percentage": 55.87, "elapsed_time": "8:34:11", "remaining_time": "6:46:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14120, "total_steps": 25254, "loss": 0.1142, "learning_rate": 2.144039799980853e-05, "epoch": 1.6773580422903303, "percentage": 55.91, "elapsed_time": "8:34:33", "remaining_time": "6:45:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14130, "total_steps": 25254, "loss": 0.1161, "learning_rate": 2.140866530062836e-05, "epoch": 1.6785459729151817, "percentage": 55.95, "elapsed_time": "8:34:54", "remaining_time": "6:45:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14140, "total_steps": 25254, "loss": 0.1195, "learning_rate": 2.1376938508424384e-05, "epoch": 1.6797339035400332, "percentage": 55.99, "elapsed_time": "8:35:17", "remaining_time": "6:45:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14150, "total_steps": 25254, "loss": 0.1182, "learning_rate": 2.1345217675380386e-05, "epoch": 1.6809218341648848, "percentage": 56.03, "elapsed_time": "8:35:38", "remaining_time": "6:44:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14160, "total_steps": 25254, "loss": 0.1188, "learning_rate": 2.1313502853670332e-05, "epoch": 1.6821097647897363, "percentage": 56.07, "elapsed_time": "8:36:00", "remaining_time": "6:44:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14170, "total_steps": 25254, "loss": 0.1166, "learning_rate": 2.1281794095458303e-05, "epoch": 1.6832976954145877, "percentage": 56.11, "elapsed_time": "8:36:21", "remaining_time": "6:43:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14180, "total_steps": 25254, "loss": 0.115, "learning_rate": 2.1250091452898438e-05, "epoch": 1.6844856260394394, "percentage": 56.15, "elapsed_time": "8:36:44", "remaining_time": "6:43:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14190, "total_steps": 25254, "loss": 0.1143, "learning_rate": 2.1218394978134776e-05, "epoch": 1.6856735566642906, "percentage": 56.19, "elapsed_time": "8:37:07", "remaining_time": "6:43:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14200, "total_steps": 25254, "loss": 0.1154, "learning_rate": 2.118670472330123e-05, "epoch": 1.6868614872891423, "percentage": 56.23, "elapsed_time": "8:37:28", "remaining_time": "6:42:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14210, "total_steps": 25254, "loss": 0.1159, "learning_rate": 2.1155020740521476e-05, "epoch": 1.688049417913994, "percentage": 56.27, "elapsed_time": "8:37:50", "remaining_time": "6:42:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14220, "total_steps": 25254, "loss": 0.1154, "learning_rate": 2.1123343081908885e-05, "epoch": 1.6892373485388452, "percentage": 56.31, "elapsed_time": "8:38:12", "remaining_time": "6:42:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14230, "total_steps": 25254, "loss": 0.1176, "learning_rate": 2.1091671799566414e-05, "epoch": 1.690425279163697, "percentage": 56.35, "elapsed_time": "8:38:33", "remaining_time": "6:41:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14240, "total_steps": 25254, "loss": 0.1142, "learning_rate": 2.106000694558654e-05, "epoch": 1.6916132097885483, "percentage": 56.39, "elapsed_time": "8:38:54", "remaining_time": "6:41:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14250, "total_steps": 25254, "loss": 0.1149, "learning_rate": 2.1028348572051166e-05, "epoch": 1.6928011404133998, "percentage": 56.43, "elapsed_time": "8:39:17", "remaining_time": "6:41:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14260, "total_steps": 25254, "loss": 0.1124, "learning_rate": 2.0996696731031518e-05, "epoch": 1.6939890710382515, "percentage": 56.47, "elapsed_time": "8:39:39", "remaining_time": "6:40:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14270, "total_steps": 25254, "loss": 0.1161, "learning_rate": 2.0965051474588118e-05, "epoch": 1.695177001663103, "percentage": 56.51, "elapsed_time": "8:40:01", "remaining_time": "6:40:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14280, "total_steps": 25254, "loss": 0.1165, "learning_rate": 2.0933412854770622e-05, "epoch": 1.6963649322879544, "percentage": 56.55, "elapsed_time": "8:40:23", "remaining_time": "6:39:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14290, "total_steps": 25254, "loss": 0.1119, "learning_rate": 2.0901780923617783e-05, "epoch": 1.697552862912806, "percentage": 56.59, "elapsed_time": "8:40:46", "remaining_time": "6:39:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14300, "total_steps": 25254, "loss": 0.1151, "learning_rate": 2.0870155733157352e-05, "epoch": 1.6987407935376573, "percentage": 56.62, "elapsed_time": "8:41:08", "remaining_time": "6:39:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14310, "total_steps": 25254, "loss": 0.1146, "learning_rate": 2.0838537335405984e-05, "epoch": 1.699928724162509, "percentage": 56.66, "elapsed_time": "8:41:29", "remaining_time": "6:38:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14320, "total_steps": 25254, "loss": 0.114, "learning_rate": 2.0806925782369175e-05, "epoch": 1.7011166547873604, "percentage": 56.7, "elapsed_time": "8:41:51", "remaining_time": "6:38:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14330, "total_steps": 25254, "loss": 0.1157, "learning_rate": 2.0775321126041167e-05, "epoch": 1.7023045854122119, "percentage": 56.74, "elapsed_time": "8:42:13", "remaining_time": "6:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14340, "total_steps": 25254, "loss": 0.1185, "learning_rate": 2.0743723418404835e-05, "epoch": 1.7034925160370635, "percentage": 56.78, "elapsed_time": "8:42:35", "remaining_time": "6:37:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14350, "total_steps": 25254, "loss": 0.1172, "learning_rate": 2.071213271143164e-05, "epoch": 1.704680446661915, "percentage": 56.82, "elapsed_time": "8:42:56", "remaining_time": "6:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14360, "total_steps": 25254, "loss": 0.116, "learning_rate": 2.0680549057081537e-05, "epoch": 1.7058683772867664, "percentage": 56.86, "elapsed_time": "8:43:18", "remaining_time": "6:36:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14370, "total_steps": 25254, "loss": 0.1133, "learning_rate": 2.0648972507302867e-05, "epoch": 1.707056307911618, "percentage": 56.9, "elapsed_time": "8:43:39", "remaining_time": "6:36:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14380, "total_steps": 25254, "loss": 0.1209, "learning_rate": 2.0617403114032287e-05, "epoch": 1.7082442385364693, "percentage": 56.94, "elapsed_time": "8:44:01", "remaining_time": "6:36:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14390, "total_steps": 25254, "loss": 0.1126, "learning_rate": 2.0585840929194684e-05, "epoch": 1.709432169161321, "percentage": 56.98, "elapsed_time": "8:44:23", "remaining_time": "6:35:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14400, "total_steps": 25254, "loss": 0.1123, "learning_rate": 2.0554286004703082e-05, "epoch": 1.7106200997861725, "percentage": 57.02, "elapsed_time": "8:44:45", "remaining_time": "6:35:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14410, "total_steps": 25254, "loss": 0.1163, "learning_rate": 2.0522738392458594e-05, "epoch": 1.711808030411024, "percentage": 57.06, "elapsed_time": "8:45:07", "remaining_time": "6:35:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14420, "total_steps": 25254, "loss": 0.1156, "learning_rate": 2.0491198144350277e-05, "epoch": 1.7129959610358756, "percentage": 57.1, "elapsed_time": "8:45:30", "remaining_time": "6:34:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14430, "total_steps": 25254, "loss": 0.1184, "learning_rate": 2.0459665312255075e-05, "epoch": 1.714183891660727, "percentage": 57.14, "elapsed_time": "8:45:52", "remaining_time": "6:34:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14440, "total_steps": 25254, "loss": 0.1181, "learning_rate": 2.0428139948037742e-05, "epoch": 1.7153718222855785, "percentage": 57.18, "elapsed_time": "8:46:14", "remaining_time": "6:34:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14450, "total_steps": 25254, "loss": 0.1136, "learning_rate": 2.0396622103550748e-05, "epoch": 1.7165597529104302, "percentage": 57.22, "elapsed_time": "8:46:36", "remaining_time": "6:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14460, "total_steps": 25254, "loss": 0.1129, "learning_rate": 2.03651118306342e-05, "epoch": 1.7177476835352814, "percentage": 57.26, "elapsed_time": "8:46:58", "remaining_time": "6:33:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14470, "total_steps": 25254, "loss": 0.1168, "learning_rate": 2.0333609181115742e-05, "epoch": 1.718935614160133, "percentage": 57.3, "elapsed_time": "8:47:20", "remaining_time": "6:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14480, "total_steps": 25254, "loss": 0.115, "learning_rate": 2.0302114206810492e-05, "epoch": 1.7201235447849845, "percentage": 57.34, "elapsed_time": "8:47:41", "remaining_time": "6:32:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14490, "total_steps": 25254, "loss": 0.1144, "learning_rate": 2.027062695952091e-05, "epoch": 1.721311475409836, "percentage": 57.38, "elapsed_time": "8:48:03", "remaining_time": "6:32:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14500, "total_steps": 25254, "loss": 0.1156, "learning_rate": 2.023914749103681e-05, "epoch": 1.7224994060346877, "percentage": 57.42, "elapsed_time": "8:48:25", "remaining_time": "6:31:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14510, "total_steps": 25254, "loss": 0.1142, "learning_rate": 2.0207675853135147e-05, "epoch": 1.723687336659539, "percentage": 57.46, "elapsed_time": "8:48:47", "remaining_time": "6:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14520, "total_steps": 25254, "loss": 0.1131, "learning_rate": 2.0176212097580033e-05, "epoch": 1.7248752672843906, "percentage": 57.5, "elapsed_time": "8:49:09", "remaining_time": "6:31:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14530, "total_steps": 25254, "loss": 0.1162, "learning_rate": 2.0144756276122604e-05, "epoch": 1.7260631979092422, "percentage": 57.54, "elapsed_time": "8:49:30", "remaining_time": "6:30:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14540, "total_steps": 25254, "loss": 0.1158, "learning_rate": 2.0113308440500942e-05, "epoch": 1.7272511285340935, "percentage": 57.58, "elapsed_time": "8:49:52", "remaining_time": "6:30:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14550, "total_steps": 25254, "loss": 0.1144, "learning_rate": 2.0081868642440007e-05, "epoch": 1.7284390591589451, "percentage": 57.61, "elapsed_time": "8:50:14", "remaining_time": "6:30:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14560, "total_steps": 25254, "loss": 0.1166, "learning_rate": 2.0050436933651528e-05, "epoch": 1.7296269897837966, "percentage": 57.65, "elapsed_time": "8:50:36", "remaining_time": "6:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14570, "total_steps": 25254, "loss": 0.1148, "learning_rate": 2.0019013365833935e-05, "epoch": 1.730814920408648, "percentage": 57.69, "elapsed_time": "8:50:58", "remaining_time": "6:29:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14580, "total_steps": 25254, "loss": 0.1153, "learning_rate": 1.998759799067226e-05, "epoch": 1.7320028510334997, "percentage": 57.73, "elapsed_time": "8:51:19", "remaining_time": "6:28:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14590, "total_steps": 25254, "loss": 0.1099, "learning_rate": 1.995619085983806e-05, "epoch": 1.7331907816583512, "percentage": 57.77, "elapsed_time": "8:51:41", "remaining_time": "6:28:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14600, "total_steps": 25254, "loss": 0.1166, "learning_rate": 1.992479202498935e-05, "epoch": 1.7343787122832026, "percentage": 57.81, "elapsed_time": "8:52:03", "remaining_time": "6:28:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14610, "total_steps": 25254, "loss": 0.1158, "learning_rate": 1.9893401537770486e-05, "epoch": 1.7355666429080543, "percentage": 57.85, "elapsed_time": "8:52:25", "remaining_time": "6:27:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14620, "total_steps": 25254, "loss": 0.1166, "learning_rate": 1.9862019449812092e-05, "epoch": 1.7367545735329055, "percentage": 57.89, "elapsed_time": "8:52:47", "remaining_time": "6:27:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14630, "total_steps": 25254, "loss": 0.1149, "learning_rate": 1.9830645812730972e-05, "epoch": 1.7379425041577572, "percentage": 57.93, "elapsed_time": "8:53:09", "remaining_time": "6:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14640, "total_steps": 25254, "loss": 0.1157, "learning_rate": 1.979928067813003e-05, "epoch": 1.7391304347826086, "percentage": 57.97, "elapsed_time": "8:53:31", "remaining_time": "6:26:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14650, "total_steps": 25254, "loss": 0.1131, "learning_rate": 1.976792409759822e-05, "epoch": 1.74031836540746, "percentage": 58.01, "elapsed_time": "8:53:53", "remaining_time": "6:26:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14660, "total_steps": 25254, "loss": 0.1155, "learning_rate": 1.9736576122710386e-05, "epoch": 1.7415062960323118, "percentage": 58.05, "elapsed_time": "8:54:15", "remaining_time": "6:26:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14670, "total_steps": 25254, "loss": 0.118, "learning_rate": 1.9705236805027226e-05, "epoch": 1.7426942266571632, "percentage": 58.09, "elapsed_time": "8:54:37", "remaining_time": "6:25:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14680, "total_steps": 25254, "loss": 0.114, "learning_rate": 1.9673906196095203e-05, "epoch": 1.7438821572820147, "percentage": 58.13, "elapsed_time": "8:54:59", "remaining_time": "6:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14690, "total_steps": 25254, "loss": 0.1135, "learning_rate": 1.9642584347446468e-05, "epoch": 1.7450700879068664, "percentage": 58.17, "elapsed_time": "8:55:20", "remaining_time": "6:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14700, "total_steps": 25254, "loss": 0.115, "learning_rate": 1.9611271310598746e-05, "epoch": 1.7462580185317176, "percentage": 58.21, "elapsed_time": "8:55:42", "remaining_time": "6:24:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14710, "total_steps": 25254, "loss": 0.1143, "learning_rate": 1.9579967137055273e-05, "epoch": 1.7474459491565693, "percentage": 58.25, "elapsed_time": "8:56:03", "remaining_time": "6:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14720, "total_steps": 25254, "loss": 0.1138, "learning_rate": 1.9548671878304708e-05, "epoch": 1.748633879781421, "percentage": 58.29, "elapsed_time": "8:56:25", "remaining_time": "6:23:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14730, "total_steps": 25254, "loss": 0.1102, "learning_rate": 1.9517385585821037e-05, "epoch": 1.7498218104062722, "percentage": 58.33, "elapsed_time": "8:56:47", "remaining_time": "6:23:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14740, "total_steps": 25254, "loss": 0.1118, "learning_rate": 1.9486108311063527e-05, "epoch": 1.7510097410311238, "percentage": 58.37, "elapsed_time": "8:57:10", "remaining_time": "6:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14750, "total_steps": 25254, "loss": 0.1155, "learning_rate": 1.945484010547659e-05, "epoch": 1.7521976716559753, "percentage": 58.41, "elapsed_time": "8:57:31", "remaining_time": "6:22:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14760, "total_steps": 25254, "loss": 0.1126, "learning_rate": 1.9423581020489723e-05, "epoch": 1.7533856022808267, "percentage": 58.45, "elapsed_time": "8:57:53", "remaining_time": "6:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14770, "total_steps": 25254, "loss": 0.1128, "learning_rate": 1.939233110751742e-05, "epoch": 1.7545735329056784, "percentage": 58.49, "elapsed_time": "8:58:15", "remaining_time": "6:22:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14780, "total_steps": 25254, "loss": 0.1157, "learning_rate": 1.9361090417959097e-05, "epoch": 1.7557614635305299, "percentage": 58.53, "elapsed_time": "8:58:37", "remaining_time": "6:21:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14790, "total_steps": 25254, "loss": 0.1136, "learning_rate": 1.9329859003198997e-05, "epoch": 1.7569493941553813, "percentage": 58.56, "elapsed_time": "8:59:00", "remaining_time": "6:21:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14800, "total_steps": 25254, "loss": 0.1158, "learning_rate": 1.9298636914606102e-05, "epoch": 1.758137324780233, "percentage": 58.6, "elapsed_time": "8:59:21", "remaining_time": "6:20:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14810, "total_steps": 25254, "loss": 0.1131, "learning_rate": 1.9267424203534062e-05, "epoch": 1.7593252554050842, "percentage": 58.64, "elapsed_time": "8:59:43", "remaining_time": "6:20:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14820, "total_steps": 25254, "loss": 0.1153, "learning_rate": 1.923622092132109e-05, "epoch": 1.760513186029936, "percentage": 58.68, "elapsed_time": "9:00:05", "remaining_time": "6:20:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14830, "total_steps": 25254, "loss": 0.116, "learning_rate": 1.920502711928992e-05, "epoch": 1.7617011166547873, "percentage": 58.72, "elapsed_time": "9:00:27", "remaining_time": "6:19:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14840, "total_steps": 25254, "loss": 0.114, "learning_rate": 1.9173842848747665e-05, "epoch": 1.7628890472796388, "percentage": 58.76, "elapsed_time": "9:00:49", "remaining_time": "6:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14850, "total_steps": 25254, "loss": 0.1127, "learning_rate": 1.9142668160985762e-05, "epoch": 1.7640769779044905, "percentage": 58.8, "elapsed_time": "9:01:11", "remaining_time": "6:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14860, "total_steps": 25254, "loss": 0.1104, "learning_rate": 1.9111503107279904e-05, "epoch": 1.765264908529342, "percentage": 58.84, "elapsed_time": "9:01:32", "remaining_time": "6:18:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14870, "total_steps": 25254, "loss": 0.1159, "learning_rate": 1.9080347738889916e-05, "epoch": 1.7664528391541934, "percentage": 58.88, "elapsed_time": "9:01:54", "remaining_time": "6:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14880, "total_steps": 25254, "loss": 0.1154, "learning_rate": 1.904920210705972e-05, "epoch": 1.767640769779045, "percentage": 58.92, "elapsed_time": "9:02:15", "remaining_time": "6:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14890, "total_steps": 25254, "loss": 0.1149, "learning_rate": 1.9018066263017195e-05, "epoch": 1.7688287004038963, "percentage": 58.96, "elapsed_time": "9:02:37", "remaining_time": "6:17:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14900, "total_steps": 25254, "loss": 0.1123, "learning_rate": 1.898694025797414e-05, "epoch": 1.770016631028748, "percentage": 59.0, "elapsed_time": "9:02:59", "remaining_time": "6:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14910, "total_steps": 25254, "loss": 0.1152, "learning_rate": 1.8955824143126164e-05, "epoch": 1.7712045616535994, "percentage": 59.04, "elapsed_time": "9:03:20", "remaining_time": "6:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14920, "total_steps": 25254, "loss": 0.116, "learning_rate": 1.89247179696526e-05, "epoch": 1.7723924922784509, "percentage": 59.08, "elapsed_time": "9:03:42", "remaining_time": "6:16:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14930, "total_steps": 25254, "loss": 0.1136, "learning_rate": 1.8893621788716456e-05, "epoch": 1.7735804229033025, "percentage": 59.12, "elapsed_time": "9:04:04", "remaining_time": "6:16:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14940, "total_steps": 25254, "loss": 0.1151, "learning_rate": 1.886253565146429e-05, "epoch": 1.774768353528154, "percentage": 59.16, "elapsed_time": "9:04:25", "remaining_time": "6:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14950, "total_steps": 25254, "loss": 0.1161, "learning_rate": 1.883145960902612e-05, "epoch": 1.7759562841530054, "percentage": 59.2, "elapsed_time": "9:04:48", "remaining_time": "6:15:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14960, "total_steps": 25254, "loss": 0.1165, "learning_rate": 1.880039371251539e-05, "epoch": 1.7771442147778571, "percentage": 59.24, "elapsed_time": "9:05:09", "remaining_time": "6:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14970, "total_steps": 25254, "loss": 0.1145, "learning_rate": 1.8769338013028828e-05, "epoch": 1.7783321454027083, "percentage": 59.28, "elapsed_time": "9:05:31", "remaining_time": "6:14:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14980, "total_steps": 25254, "loss": 0.1119, "learning_rate": 1.873829256164643e-05, "epoch": 1.77952007602756, "percentage": 59.32, "elapsed_time": "9:05:54", "remaining_time": "6:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 14990, "total_steps": 25254, "loss": 0.114, "learning_rate": 1.8707257409431307e-05, "epoch": 1.7807080066524115, "percentage": 59.36, "elapsed_time": "9:06:16", "remaining_time": "6:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15000, "total_steps": 25254, "loss": 0.1141, "learning_rate": 1.8676232607429627e-05, "epoch": 1.781895937277263, "percentage": 59.4, "elapsed_time": "9:06:38", "remaining_time": "6:13:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15010, "total_steps": 25254, "loss": 0.1138, "learning_rate": 1.8645218206670545e-05, "epoch": 1.7830838679021146, "percentage": 59.44, "elapsed_time": "9:07:00", "remaining_time": "6:13:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15020, "total_steps": 25254, "loss": 0.1114, "learning_rate": 1.861421425816611e-05, "epoch": 1.784271798526966, "percentage": 59.48, "elapsed_time": "9:07:22", "remaining_time": "6:12:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15030, "total_steps": 25254, "loss": 0.1196, "learning_rate": 1.8583220812911174e-05, "epoch": 1.7854597291518175, "percentage": 59.52, "elapsed_time": "9:07:43", "remaining_time": "6:12:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15040, "total_steps": 25254, "loss": 0.1124, "learning_rate": 1.8552237921883314e-05, "epoch": 1.7866476597766692, "percentage": 59.55, "elapsed_time": "9:08:05", "remaining_time": "6:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15050, "total_steps": 25254, "loss": 0.1145, "learning_rate": 1.8521265636042752e-05, "epoch": 1.7878355904015204, "percentage": 59.59, "elapsed_time": "9:08:28", "remaining_time": "6:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15060, "total_steps": 25254, "loss": 0.1167, "learning_rate": 1.849030400633224e-05, "epoch": 1.789023521026372, "percentage": 59.63, "elapsed_time": "9:08:50", "remaining_time": "6:11:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15070, "total_steps": 25254, "loss": 0.1109, "learning_rate": 1.845935308367706e-05, "epoch": 1.7902114516512235, "percentage": 59.67, "elapsed_time": "9:09:12", "remaining_time": "6:11:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15080, "total_steps": 25254, "loss": 0.1136, "learning_rate": 1.8428412918984833e-05, "epoch": 1.791399382276075, "percentage": 59.71, "elapsed_time": "9:09:33", "remaining_time": "6:10:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15090, "total_steps": 25254, "loss": 0.1145, "learning_rate": 1.8397483563145503e-05, "epoch": 1.7925873129009267, "percentage": 59.75, "elapsed_time": "9:09:55", "remaining_time": "6:10:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15100, "total_steps": 25254, "loss": 0.1127, "learning_rate": 1.836656506703123e-05, "epoch": 1.793775243525778, "percentage": 59.79, "elapsed_time": "9:10:17", "remaining_time": "6:10:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15110, "total_steps": 25254, "loss": 0.1107, "learning_rate": 1.8335657481496316e-05, "epoch": 1.7949631741506296, "percentage": 59.83, "elapsed_time": "9:10:39", "remaining_time": "6:09:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15120, "total_steps": 25254, "loss": 0.114, "learning_rate": 1.830476085737713e-05, "epoch": 1.7961511047754812, "percentage": 59.87, "elapsed_time": "9:11:01", "remaining_time": "6:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15130, "total_steps": 25254, "loss": 0.1128, "learning_rate": 1.8273875245491988e-05, "epoch": 1.7973390354003325, "percentage": 59.91, "elapsed_time": "9:11:22", "remaining_time": "6:08:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15140, "total_steps": 25254, "loss": 0.1115, "learning_rate": 1.824300069664111e-05, "epoch": 1.7985269660251841, "percentage": 59.95, "elapsed_time": "9:11:44", "remaining_time": "6:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15150, "total_steps": 25254, "loss": 0.1183, "learning_rate": 1.8212137261606498e-05, "epoch": 1.7997148966500356, "percentage": 59.99, "elapsed_time": "9:12:06", "remaining_time": "6:08:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15160, "total_steps": 25254, "loss": 0.1144, "learning_rate": 1.818128499115192e-05, "epoch": 1.800902827274887, "percentage": 60.03, "elapsed_time": "9:12:28", "remaining_time": "6:07:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15170, "total_steps": 25254, "loss": 0.1138, "learning_rate": 1.8150443936022736e-05, "epoch": 1.8020907578997387, "percentage": 60.07, "elapsed_time": "9:12:49", "remaining_time": "6:07:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15180, "total_steps": 25254, "loss": 0.1109, "learning_rate": 1.8119614146945874e-05, "epoch": 1.8032786885245902, "percentage": 60.11, "elapsed_time": "9:13:11", "remaining_time": "6:07:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15190, "total_steps": 25254, "loss": 0.1124, "learning_rate": 1.8088795674629733e-05, "epoch": 1.8044666191494416, "percentage": 60.15, "elapsed_time": "9:13:32", "remaining_time": "6:06:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15200, "total_steps": 25254, "loss": 0.1137, "learning_rate": 1.805798856976409e-05, "epoch": 1.8056545497742933, "percentage": 60.19, "elapsed_time": "9:13:54", "remaining_time": "6:06:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15210, "total_steps": 25254, "loss": 0.1144, "learning_rate": 1.802719288302005e-05, "epoch": 1.8068424803991445, "percentage": 60.23, "elapsed_time": "9:14:16", "remaining_time": "6:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15220, "total_steps": 25254, "loss": 0.1118, "learning_rate": 1.799640866504991e-05, "epoch": 1.8080304110239962, "percentage": 60.27, "elapsed_time": "9:14:38", "remaining_time": "6:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15230, "total_steps": 25254, "loss": 0.1152, "learning_rate": 1.7965635966487112e-05, "epoch": 1.8092183416488479, "percentage": 60.31, "elapsed_time": "9:15:00", "remaining_time": "6:05:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15240, "total_steps": 25254, "loss": 0.1128, "learning_rate": 1.7934874837946156e-05, "epoch": 1.810406272273699, "percentage": 60.35, "elapsed_time": "9:15:21", "remaining_time": "6:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15250, "total_steps": 25254, "loss": 0.1126, "learning_rate": 1.7904125330022504e-05, "epoch": 1.8115942028985508, "percentage": 60.39, "elapsed_time": "9:15:42", "remaining_time": "6:04:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15260, "total_steps": 25254, "loss": 0.1142, "learning_rate": 1.7873387493292515e-05, "epoch": 1.8127821335234022, "percentage": 60.43, "elapsed_time": "9:16:05", "remaining_time": "6:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15270, "total_steps": 25254, "loss": 0.1127, "learning_rate": 1.7842661378313342e-05, "epoch": 1.8139700641482537, "percentage": 60.47, "elapsed_time": "9:16:27", "remaining_time": "6:03:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15280, "total_steps": 25254, "loss": 0.118, "learning_rate": 1.781194703562286e-05, "epoch": 1.8151579947731054, "percentage": 60.51, "elapsed_time": "9:16:49", "remaining_time": "6:03:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15290, "total_steps": 25254, "loss": 0.1141, "learning_rate": 1.7781244515739594e-05, "epoch": 1.8163459253979568, "percentage": 60.54, "elapsed_time": "9:17:10", "remaining_time": "6:03:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15300, "total_steps": 25254, "loss": 0.1127, "learning_rate": 1.7750553869162585e-05, "epoch": 1.8175338560228083, "percentage": 60.58, "elapsed_time": "9:17:31", "remaining_time": "6:02:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15310, "total_steps": 25254, "loss": 0.1118, "learning_rate": 1.77198751463714e-05, "epoch": 1.81872178664766, "percentage": 60.62, "elapsed_time": "9:17:53", "remaining_time": "6:02:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15320, "total_steps": 25254, "loss": 0.1151, "learning_rate": 1.7689208397825956e-05, "epoch": 1.8199097172725112, "percentage": 60.66, "elapsed_time": "9:18:15", "remaining_time": "6:01:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15330, "total_steps": 25254, "loss": 0.1156, "learning_rate": 1.7658553673966483e-05, "epoch": 1.8210976478973628, "percentage": 60.7, "elapsed_time": "9:18:37", "remaining_time": "6:01:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15340, "total_steps": 25254, "loss": 0.1143, "learning_rate": 1.7627911025213428e-05, "epoch": 1.8222855785222143, "percentage": 60.74, "elapsed_time": "9:18:59", "remaining_time": "6:01:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15350, "total_steps": 25254, "loss": 0.1118, "learning_rate": 1.75972805019674e-05, "epoch": 1.8234735091470657, "percentage": 60.78, "elapsed_time": "9:19:20", "remaining_time": "6:00:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15360, "total_steps": 25254, "loss": 0.1109, "learning_rate": 1.756666215460903e-05, "epoch": 1.8246614397719174, "percentage": 60.82, "elapsed_time": "9:19:42", "remaining_time": "6:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15370, "total_steps": 25254, "loss": 0.1089, "learning_rate": 1.7536056033498953e-05, "epoch": 1.8258493703967689, "percentage": 60.86, "elapsed_time": "9:20:04", "remaining_time": "6:00:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15380, "total_steps": 25254, "loss": 0.1163, "learning_rate": 1.750546218897768e-05, "epoch": 1.8270373010216203, "percentage": 60.9, "elapsed_time": "9:20:25", "remaining_time": "5:59:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15390, "total_steps": 25254, "loss": 0.1132, "learning_rate": 1.7474880671365513e-05, "epoch": 1.828225231646472, "percentage": 60.94, "elapsed_time": "9:20:47", "remaining_time": "5:59:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15400, "total_steps": 25254, "loss": 0.1124, "learning_rate": 1.744431153096252e-05, "epoch": 1.8294131622713232, "percentage": 60.98, "elapsed_time": "9:21:09", "remaining_time": "5:59:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15410, "total_steps": 25254, "loss": 0.1133, "learning_rate": 1.7413754818048384e-05, "epoch": 1.830601092896175, "percentage": 61.02, "elapsed_time": "9:21:30", "remaining_time": "5:58:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15420, "total_steps": 25254, "loss": 0.112, "learning_rate": 1.7383210582882342e-05, "epoch": 1.8317890235210263, "percentage": 61.06, "elapsed_time": "9:21:52", "remaining_time": "5:58:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15430, "total_steps": 25254, "loss": 0.1153, "learning_rate": 1.7352678875703126e-05, "epoch": 1.8329769541458778, "percentage": 61.1, "elapsed_time": "9:22:14", "remaining_time": "5:57:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15440, "total_steps": 25254, "loss": 0.1128, "learning_rate": 1.732215974672884e-05, "epoch": 1.8341648847707295, "percentage": 61.14, "elapsed_time": "9:22:36", "remaining_time": "5:57:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15450, "total_steps": 25254, "loss": 0.1133, "learning_rate": 1.729165324615693e-05, "epoch": 1.835352815395581, "percentage": 61.18, "elapsed_time": "9:22:57", "remaining_time": "5:57:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15460, "total_steps": 25254, "loss": 0.1139, "learning_rate": 1.726115942416405e-05, "epoch": 1.8365407460204324, "percentage": 61.22, "elapsed_time": "9:23:19", "remaining_time": "5:56:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15470, "total_steps": 25254, "loss": 0.1122, "learning_rate": 1.7230678330905998e-05, "epoch": 1.837728676645284, "percentage": 61.26, "elapsed_time": "9:23:41", "remaining_time": "5:56:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15480, "total_steps": 25254, "loss": 0.1168, "learning_rate": 1.7200210016517633e-05, "epoch": 1.8389166072701353, "percentage": 61.3, "elapsed_time": "9:24:02", "remaining_time": "5:56:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15490, "total_steps": 25254, "loss": 0.1168, "learning_rate": 1.7169754531112826e-05, "epoch": 1.840104537894987, "percentage": 61.34, "elapsed_time": "9:24:24", "remaining_time": "5:55:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15500, "total_steps": 25254, "loss": 0.1125, "learning_rate": 1.7139311924784318e-05, "epoch": 1.8412924685198384, "percentage": 61.38, "elapsed_time": "9:24:45", "remaining_time": "5:55:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15510, "total_steps": 25254, "loss": 0.1143, "learning_rate": 1.7108882247603674e-05, "epoch": 1.8424803991446899, "percentage": 61.42, "elapsed_time": "9:25:07", "remaining_time": "5:55:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15520, "total_steps": 25254, "loss": 0.1141, "learning_rate": 1.7078465549621197e-05, "epoch": 1.8436683297695415, "percentage": 61.46, "elapsed_time": "9:25:28", "remaining_time": "5:54:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15530, "total_steps": 25254, "loss": 0.1138, "learning_rate": 1.7048061880865822e-05, "epoch": 1.844856260394393, "percentage": 61.5, "elapsed_time": "9:25:50", "remaining_time": "5:54:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15540, "total_steps": 25254, "loss": 0.1176, "learning_rate": 1.7017671291345095e-05, "epoch": 1.8460441910192444, "percentage": 61.53, "elapsed_time": "9:26:12", "remaining_time": "5:53:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15550, "total_steps": 25254, "loss": 0.1138, "learning_rate": 1.698729383104501e-05, "epoch": 1.8472321216440961, "percentage": 61.57, "elapsed_time": "9:26:34", "remaining_time": "5:53:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15560, "total_steps": 25254, "loss": 0.1112, "learning_rate": 1.695692954992999e-05, "epoch": 1.8484200522689473, "percentage": 61.61, "elapsed_time": "9:26:56", "remaining_time": "5:53:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15570, "total_steps": 25254, "loss": 0.1151, "learning_rate": 1.6926578497942766e-05, "epoch": 1.849607982893799, "percentage": 61.65, "elapsed_time": "9:27:18", "remaining_time": "5:52:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15580, "total_steps": 25254, "loss": 0.1125, "learning_rate": 1.689624072500431e-05, "epoch": 1.8507959135186505, "percentage": 61.69, "elapsed_time": "9:27:39", "remaining_time": "5:52:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15590, "total_steps": 25254, "loss": 0.1145, "learning_rate": 1.6865916281013776e-05, "epoch": 1.851983844143502, "percentage": 61.73, "elapsed_time": "9:28:01", "remaining_time": "5:52:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15600, "total_steps": 25254, "loss": 0.1131, "learning_rate": 1.6835605215848368e-05, "epoch": 1.8531717747683536, "percentage": 61.77, "elapsed_time": "9:28:22", "remaining_time": "5:51:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15610, "total_steps": 25254, "loss": 0.1089, "learning_rate": 1.6805307579363294e-05, "epoch": 1.854359705393205, "percentage": 61.81, "elapsed_time": "9:28:44", "remaining_time": "5:51:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15620, "total_steps": 25254, "loss": 0.111, "learning_rate": 1.677502342139168e-05, "epoch": 1.8555476360180565, "percentage": 61.85, "elapsed_time": "9:29:06", "remaining_time": "5:51:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15630, "total_steps": 25254, "loss": 0.1124, "learning_rate": 1.6744752791744462e-05, "epoch": 1.8567355666429082, "percentage": 61.89, "elapsed_time": "9:29:27", "remaining_time": "5:50:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15640, "total_steps": 25254, "loss": 0.1156, "learning_rate": 1.6714495740210363e-05, "epoch": 1.8579234972677594, "percentage": 61.93, "elapsed_time": "9:29:49", "remaining_time": "5:50:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15650, "total_steps": 25254, "loss": 0.1126, "learning_rate": 1.6684252316555742e-05, "epoch": 1.859111427892611, "percentage": 61.97, "elapsed_time": "9:30:11", "remaining_time": "5:49:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15660, "total_steps": 25254, "loss": 0.1127, "learning_rate": 1.665402257052455e-05, "epoch": 1.8602993585174625, "percentage": 62.01, "elapsed_time": "9:30:33", "remaining_time": "5:49:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15670, "total_steps": 25254, "loss": 0.1151, "learning_rate": 1.6623806551838243e-05, "epoch": 1.861487289142314, "percentage": 62.05, "elapsed_time": "9:30:55", "remaining_time": "5:49:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15680, "total_steps": 25254, "loss": 0.1125, "learning_rate": 1.6593604310195704e-05, "epoch": 1.8626752197671657, "percentage": 62.09, "elapsed_time": "9:31:17", "remaining_time": "5:48:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15690, "total_steps": 25254, "loss": 0.1145, "learning_rate": 1.6563415895273143e-05, "epoch": 1.863863150392017, "percentage": 62.13, "elapsed_time": "9:31:39", "remaining_time": "5:48:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15700, "total_steps": 25254, "loss": 0.1132, "learning_rate": 1.6533241356724038e-05, "epoch": 1.8650510810168686, "percentage": 62.17, "elapsed_time": "9:32:01", "remaining_time": "5:48:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15710, "total_steps": 25254, "loss": 0.114, "learning_rate": 1.650308074417904e-05, "epoch": 1.8662390116417202, "percentage": 62.21, "elapsed_time": "9:32:23", "remaining_time": "5:47:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15720, "total_steps": 25254, "loss": 0.1138, "learning_rate": 1.6472934107245886e-05, "epoch": 1.8674269422665715, "percentage": 62.25, "elapsed_time": "9:32:45", "remaining_time": "5:47:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15730, "total_steps": 25254, "loss": 0.1133, "learning_rate": 1.644280149550936e-05, "epoch": 1.8686148728914231, "percentage": 62.29, "elapsed_time": "9:33:07", "remaining_time": "5:47:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15740, "total_steps": 25254, "loss": 0.1165, "learning_rate": 1.6412682958531134e-05, "epoch": 1.8698028035162748, "percentage": 62.33, "elapsed_time": "9:33:29", "remaining_time": "5:46:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15750, "total_steps": 25254, "loss": 0.1129, "learning_rate": 1.6382578545849754e-05, "epoch": 1.870990734141126, "percentage": 62.37, "elapsed_time": "9:33:50", "remaining_time": "5:46:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15760, "total_steps": 25254, "loss": 0.1122, "learning_rate": 1.6352488306980522e-05, "epoch": 1.8721786647659777, "percentage": 62.41, "elapsed_time": "9:34:12", "remaining_time": "5:45:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15770, "total_steps": 25254, "loss": 0.1124, "learning_rate": 1.6322412291415442e-05, "epoch": 1.8733665953908292, "percentage": 62.45, "elapsed_time": "9:34:34", "remaining_time": "5:45:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15780, "total_steps": 25254, "loss": 0.1144, "learning_rate": 1.629235054862312e-05, "epoch": 1.8745545260156806, "percentage": 62.49, "elapsed_time": "9:34:56", "remaining_time": "5:45:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15790, "total_steps": 25254, "loss": 0.113, "learning_rate": 1.6262303128048678e-05, "epoch": 1.8757424566405323, "percentage": 62.52, "elapsed_time": "9:35:18", "remaining_time": "5:44:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15800, "total_steps": 25254, "loss": 0.1132, "learning_rate": 1.6232270079113685e-05, "epoch": 1.8769303872653837, "percentage": 62.56, "elapsed_time": "9:35:40", "remaining_time": "5:44:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15810, "total_steps": 25254, "loss": 0.1133, "learning_rate": 1.6202251451216062e-05, "epoch": 1.8781183178902352, "percentage": 62.6, "elapsed_time": "9:36:02", "remaining_time": "5:44:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15820, "total_steps": 25254, "loss": 0.1177, "learning_rate": 1.6172247293730043e-05, "epoch": 1.8793062485150869, "percentage": 62.64, "elapsed_time": "9:36:24", "remaining_time": "5:43:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15830, "total_steps": 25254, "loss": 0.111, "learning_rate": 1.6142257656006027e-05, "epoch": 1.880494179139938, "percentage": 62.68, "elapsed_time": "9:36:45", "remaining_time": "5:43:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15840, "total_steps": 25254, "loss": 0.1149, "learning_rate": 1.6112282587370554e-05, "epoch": 1.8816821097647898, "percentage": 62.72, "elapsed_time": "9:37:07", "remaining_time": "5:42:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15850, "total_steps": 25254, "loss": 0.1143, "learning_rate": 1.608232213712617e-05, "epoch": 1.8828700403896412, "percentage": 62.76, "elapsed_time": "9:37:28", "remaining_time": "5:42:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15860, "total_steps": 25254, "loss": 0.113, "learning_rate": 1.60523763545514e-05, "epoch": 1.8840579710144927, "percentage": 62.8, "elapsed_time": "9:37:49", "remaining_time": "5:42:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15870, "total_steps": 25254, "loss": 0.1159, "learning_rate": 1.602244528890066e-05, "epoch": 1.8852459016393444, "percentage": 62.84, "elapsed_time": "9:38:12", "remaining_time": "5:41:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15880, "total_steps": 25254, "loss": 0.1126, "learning_rate": 1.5992528989404125e-05, "epoch": 1.8864338322641958, "percentage": 62.88, "elapsed_time": "9:38:33", "remaining_time": "5:41:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15890, "total_steps": 25254, "loss": 0.1114, "learning_rate": 1.596262750526771e-05, "epoch": 1.8876217628890473, "percentage": 62.92, "elapsed_time": "9:38:55", "remaining_time": "5:41:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15900, "total_steps": 25254, "loss": 0.1155, "learning_rate": 1.5932740885672937e-05, "epoch": 1.888809693513899, "percentage": 62.96, "elapsed_time": "9:39:17", "remaining_time": "5:40:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15910, "total_steps": 25254, "loss": 0.1143, "learning_rate": 1.5902869179776897e-05, "epoch": 1.8899976241387502, "percentage": 63.0, "elapsed_time": "9:39:38", "remaining_time": "5:40:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15920, "total_steps": 25254, "loss": 0.1128, "learning_rate": 1.5873012436712154e-05, "epoch": 1.8911855547636018, "percentage": 63.04, "elapsed_time": "9:40:00", "remaining_time": "5:40:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15930, "total_steps": 25254, "loss": 0.1104, "learning_rate": 1.5843170705586653e-05, "epoch": 1.8923734853884533, "percentage": 63.08, "elapsed_time": "9:40:22", "remaining_time": "5:39:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15940, "total_steps": 25254, "loss": 0.1152, "learning_rate": 1.5813344035483637e-05, "epoch": 1.8935614160133047, "percentage": 63.12, "elapsed_time": "9:40:43", "remaining_time": "5:39:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15950, "total_steps": 25254, "loss": 0.1135, "learning_rate": 1.57835324754616e-05, "epoch": 1.8947493466381564, "percentage": 63.16, "elapsed_time": "9:41:05", "remaining_time": "5:38:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15960, "total_steps": 25254, "loss": 0.1134, "learning_rate": 1.5753736074554156e-05, "epoch": 1.8959372772630079, "percentage": 63.2, "elapsed_time": "9:41:27", "remaining_time": "5:38:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15970, "total_steps": 25254, "loss": 0.1115, "learning_rate": 1.5723954881770024e-05, "epoch": 1.8971252078878593, "percentage": 63.24, "elapsed_time": "9:41:48", "remaining_time": "5:38:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15980, "total_steps": 25254, "loss": 0.1127, "learning_rate": 1.5694188946092875e-05, "epoch": 1.898313138512711, "percentage": 63.28, "elapsed_time": "9:42:11", "remaining_time": "5:37:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 15990, "total_steps": 25254, "loss": 0.1124, "learning_rate": 1.5664438316481293e-05, "epoch": 1.8995010691375622, "percentage": 63.32, "elapsed_time": "9:42:32", "remaining_time": "5:37:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16000, "total_steps": 25254, "loss": 0.1138, "learning_rate": 1.5634703041868692e-05, "epoch": 1.900688999762414, "percentage": 63.36, "elapsed_time": "9:42:54", "remaining_time": "5:37:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16010, "total_steps": 25254, "loss": 0.1137, "learning_rate": 1.5604983171163235e-05, "epoch": 1.9018769303872654, "percentage": 63.4, "elapsed_time": "9:43:16", "remaining_time": "5:36:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16020, "total_steps": 25254, "loss": 0.1135, "learning_rate": 1.5575278753247734e-05, "epoch": 1.9030648610121168, "percentage": 63.44, "elapsed_time": "9:43:37", "remaining_time": "5:36:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16030, "total_steps": 25254, "loss": 0.1147, "learning_rate": 1.5545589836979597e-05, "epoch": 1.9042527916369685, "percentage": 63.48, "elapsed_time": "9:43:59", "remaining_time": "5:36:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16040, "total_steps": 25254, "loss": 0.1128, "learning_rate": 1.551591647119073e-05, "epoch": 1.90544072226182, "percentage": 63.51, "elapsed_time": "9:44:21", "remaining_time": "5:35:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16050, "total_steps": 25254, "loss": 0.1121, "learning_rate": 1.548625870468745e-05, "epoch": 1.9066286528866714, "percentage": 63.55, "elapsed_time": "9:44:43", "remaining_time": "5:35:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16060, "total_steps": 25254, "loss": 0.114, "learning_rate": 1.5456616586250457e-05, "epoch": 1.907816583511523, "percentage": 63.59, "elapsed_time": "9:45:05", "remaining_time": "5:34:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16070, "total_steps": 25254, "loss": 0.1099, "learning_rate": 1.5426990164634662e-05, "epoch": 1.9090045141363743, "percentage": 63.63, "elapsed_time": "9:45:27", "remaining_time": "5:34:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16080, "total_steps": 25254, "loss": 0.1142, "learning_rate": 1.5397379488569195e-05, "epoch": 1.910192444761226, "percentage": 63.67, "elapsed_time": "9:45:49", "remaining_time": "5:34:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16090, "total_steps": 25254, "loss": 0.1137, "learning_rate": 1.536778460675727e-05, "epoch": 1.9113803753860774, "percentage": 63.71, "elapsed_time": "9:46:11", "remaining_time": "5:33:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16100, "total_steps": 25254, "loss": 0.1133, "learning_rate": 1.533820556787612e-05, "epoch": 1.9125683060109289, "percentage": 63.75, "elapsed_time": "9:46:33", "remaining_time": "5:33:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16110, "total_steps": 25254, "loss": 0.1132, "learning_rate": 1.530864242057694e-05, "epoch": 1.9137562366357805, "percentage": 63.79, "elapsed_time": "9:46:55", "remaining_time": "5:33:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16120, "total_steps": 25254, "loss": 0.1124, "learning_rate": 1.5279095213484768e-05, "epoch": 1.914944167260632, "percentage": 63.83, "elapsed_time": "9:47:17", "remaining_time": "5:32:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16130, "total_steps": 25254, "loss": 0.1098, "learning_rate": 1.5249563995198426e-05, "epoch": 1.9161320978854834, "percentage": 63.87, "elapsed_time": "9:47:40", "remaining_time": "5:32:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16140, "total_steps": 25254, "loss": 0.1152, "learning_rate": 1.5220048814290438e-05, "epoch": 1.9173200285103351, "percentage": 63.91, "elapsed_time": "9:48:01", "remaining_time": "5:32:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16150, "total_steps": 25254, "loss": 0.1118, "learning_rate": 1.5190549719306974e-05, "epoch": 1.9185079591351863, "percentage": 63.95, "elapsed_time": "9:48:23", "remaining_time": "5:31:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16160, "total_steps": 25254, "loss": 0.1133, "learning_rate": 1.5161066758767706e-05, "epoch": 1.919695889760038, "percentage": 63.99, "elapsed_time": "9:48:45", "remaining_time": "5:31:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16170, "total_steps": 25254, "loss": 0.1127, "learning_rate": 1.5131599981165795e-05, "epoch": 1.9208838203848895, "percentage": 64.03, "elapsed_time": "9:49:06", "remaining_time": "5:30:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16180, "total_steps": 25254, "loss": 0.1144, "learning_rate": 1.5102149434967778e-05, "epoch": 1.922071751009741, "percentage": 64.07, "elapsed_time": "9:49:27", "remaining_time": "5:30:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16190, "total_steps": 25254, "loss": 0.1135, "learning_rate": 1.5072715168613477e-05, "epoch": 1.9232596816345926, "percentage": 64.11, "elapsed_time": "9:49:50", "remaining_time": "5:30:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16200, "total_steps": 25254, "loss": 0.1072, "learning_rate": 1.5043297230515985e-05, "epoch": 1.924447612259444, "percentage": 64.15, "elapsed_time": "9:50:12", "remaining_time": "5:29:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16210, "total_steps": 25254, "loss": 0.1145, "learning_rate": 1.501389566906149e-05, "epoch": 1.9256355428842955, "percentage": 64.19, "elapsed_time": "9:50:34", "remaining_time": "5:29:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16220, "total_steps": 25254, "loss": 0.1159, "learning_rate": 1.4984510532609263e-05, "epoch": 1.9268234735091472, "percentage": 64.23, "elapsed_time": "9:50:56", "remaining_time": "5:29:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16230, "total_steps": 25254, "loss": 0.1127, "learning_rate": 1.4955141869491562e-05, "epoch": 1.9280114041339986, "percentage": 64.27, "elapsed_time": "9:51:19", "remaining_time": "5:28:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16240, "total_steps": 25254, "loss": 0.1109, "learning_rate": 1.4925789728013536e-05, "epoch": 1.92919933475885, "percentage": 64.31, "elapsed_time": "9:51:40", "remaining_time": "5:28:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16250, "total_steps": 25254, "loss": 0.1142, "learning_rate": 1.4896454156453185e-05, "epoch": 1.9303872653837018, "percentage": 64.35, "elapsed_time": "9:52:02", "remaining_time": "5:28:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16260, "total_steps": 25254, "loss": 0.1104, "learning_rate": 1.486713520306123e-05, "epoch": 1.931575196008553, "percentage": 64.39, "elapsed_time": "9:52:24", "remaining_time": "5:27:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16270, "total_steps": 25254, "loss": 0.1145, "learning_rate": 1.4837832916061074e-05, "epoch": 1.9327631266334047, "percentage": 64.43, "elapsed_time": "9:52:46", "remaining_time": "5:27:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16280, "total_steps": 25254, "loss": 0.115, "learning_rate": 1.4808547343648682e-05, "epoch": 1.9339510572582561, "percentage": 64.47, "elapsed_time": "9:53:08", "remaining_time": "5:26:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16290, "total_steps": 25254, "loss": 0.111, "learning_rate": 1.4779278533992574e-05, "epoch": 1.9351389878831076, "percentage": 64.5, "elapsed_time": "9:53:30", "remaining_time": "5:26:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16300, "total_steps": 25254, "loss": 0.1133, "learning_rate": 1.475002653523366e-05, "epoch": 1.9363269185079592, "percentage": 64.54, "elapsed_time": "9:53:52", "remaining_time": "5:26:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16310, "total_steps": 25254, "loss": 0.1119, "learning_rate": 1.4720791395485211e-05, "epoch": 1.9375148491328107, "percentage": 64.58, "elapsed_time": "9:54:15", "remaining_time": "5:25:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16320, "total_steps": 25254, "loss": 0.1107, "learning_rate": 1.4691573162832766e-05, "epoch": 1.9387027797576621, "percentage": 64.62, "elapsed_time": "9:54:37", "remaining_time": "5:25:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16330, "total_steps": 25254, "loss": 0.1112, "learning_rate": 1.4662371885334062e-05, "epoch": 1.9398907103825138, "percentage": 64.66, "elapsed_time": "9:54:59", "remaining_time": "5:25:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16340, "total_steps": 25254, "loss": 0.1115, "learning_rate": 1.4633187611018945e-05, "epoch": 1.941078641007365, "percentage": 64.7, "elapsed_time": "9:55:21", "remaining_time": "5:24:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16350, "total_steps": 25254, "loss": 0.1126, "learning_rate": 1.4604020387889295e-05, "epoch": 1.9422665716322167, "percentage": 64.74, "elapsed_time": "9:55:43", "remaining_time": "5:24:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16360, "total_steps": 25254, "loss": 0.1147, "learning_rate": 1.4574870263918939e-05, "epoch": 1.9434545022570682, "percentage": 64.78, "elapsed_time": "9:56:05", "remaining_time": "5:24:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16370, "total_steps": 25254, "loss": 0.1152, "learning_rate": 1.454573728705359e-05, "epoch": 1.9446424328819196, "percentage": 64.82, "elapsed_time": "9:56:26", "remaining_time": "5:23:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16380, "total_steps": 25254, "loss": 0.1107, "learning_rate": 1.4516621505210748e-05, "epoch": 1.9458303635067713, "percentage": 64.86, "elapsed_time": "9:56:48", "remaining_time": "5:23:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16390, "total_steps": 25254, "loss": 0.1147, "learning_rate": 1.4487522966279648e-05, "epoch": 1.9470182941316228, "percentage": 64.9, "elapsed_time": "9:57:10", "remaining_time": "5:22:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16400, "total_steps": 25254, "loss": 0.1131, "learning_rate": 1.4458441718121149e-05, "epoch": 1.9482062247564742, "percentage": 64.94, "elapsed_time": "9:57:32", "remaining_time": "5:22:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16410, "total_steps": 25254, "loss": 0.1097, "learning_rate": 1.4429377808567673e-05, "epoch": 1.9493941553813259, "percentage": 64.98, "elapsed_time": "9:57:54", "remaining_time": "5:22:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16420, "total_steps": 25254, "loss": 0.109, "learning_rate": 1.4400331285423122e-05, "epoch": 1.950582086006177, "percentage": 65.02, "elapsed_time": "9:58:15", "remaining_time": "5:21:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16430, "total_steps": 25254, "loss": 0.1128, "learning_rate": 1.4371302196462793e-05, "epoch": 1.9517700166310288, "percentage": 65.06, "elapsed_time": "9:58:37", "remaining_time": "5:21:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16440, "total_steps": 25254, "loss": 0.1147, "learning_rate": 1.4342290589433354e-05, "epoch": 1.9529579472558802, "percentage": 65.1, "elapsed_time": "9:59:00", "remaining_time": "5:21:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16450, "total_steps": 25254, "loss": 0.1105, "learning_rate": 1.4313296512052655e-05, "epoch": 1.9541458778807317, "percentage": 65.14, "elapsed_time": "9:59:21", "remaining_time": "5:20:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16460, "total_steps": 25254, "loss": 0.1111, "learning_rate": 1.4284320012009739e-05, "epoch": 1.9553338085055834, "percentage": 65.18, "elapsed_time": "9:59:43", "remaining_time": "5:20:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16470, "total_steps": 25254, "loss": 0.108, "learning_rate": 1.4255361136964742e-05, "epoch": 1.9565217391304348, "percentage": 65.22, "elapsed_time": "10:00:05", "remaining_time": "5:20:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16480, "total_steps": 25254, "loss": 0.1141, "learning_rate": 1.4226419934548829e-05, "epoch": 1.9577096697552863, "percentage": 65.26, "elapsed_time": "10:00:27", "remaining_time": "5:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16490, "total_steps": 25254, "loss": 0.1116, "learning_rate": 1.4197496452364063e-05, "epoch": 1.958897600380138, "percentage": 65.3, "elapsed_time": "10:00:48", "remaining_time": "5:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16500, "total_steps": 25254, "loss": 0.1149, "learning_rate": 1.4168590737983376e-05, "epoch": 1.9600855310049892, "percentage": 65.34, "elapsed_time": "10:01:11", "remaining_time": "5:18:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16510, "total_steps": 25254, "loss": 0.1123, "learning_rate": 1.4139702838950481e-05, "epoch": 1.9612734616298408, "percentage": 65.38, "elapsed_time": "10:01:34", "remaining_time": "5:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16520, "total_steps": 25254, "loss": 0.1132, "learning_rate": 1.4110832802779767e-05, "epoch": 1.9624613922546923, "percentage": 65.42, "elapsed_time": "10:01:56", "remaining_time": "5:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16530, "total_steps": 25254, "loss": 0.113, "learning_rate": 1.408198067695628e-05, "epoch": 1.9636493228795437, "percentage": 65.45, "elapsed_time": "10:02:18", "remaining_time": "5:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16540, "total_steps": 25254, "loss": 0.1098, "learning_rate": 1.405314650893558e-05, "epoch": 1.9648372535043954, "percentage": 65.49, "elapsed_time": "10:02:40", "remaining_time": "5:17:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16550, "total_steps": 25254, "loss": 0.1082, "learning_rate": 1.4024330346143694e-05, "epoch": 1.9660251841292469, "percentage": 65.53, "elapsed_time": "10:03:03", "remaining_time": "5:17:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16560, "total_steps": 25254, "loss": 0.1126, "learning_rate": 1.3995532235977036e-05, "epoch": 1.9672131147540983, "percentage": 65.57, "elapsed_time": "10:03:24", "remaining_time": "5:16:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16570, "total_steps": 25254, "loss": 0.1082, "learning_rate": 1.3966752225802316e-05, "epoch": 1.96840104537895, "percentage": 65.61, "elapsed_time": "10:03:46", "remaining_time": "5:16:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16580, "total_steps": 25254, "loss": 0.1145, "learning_rate": 1.3937990362956505e-05, "epoch": 1.9695889760038012, "percentage": 65.65, "elapsed_time": "10:04:07", "remaining_time": "5:16:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16590, "total_steps": 25254, "loss": 0.1101, "learning_rate": 1.39092466947467e-05, "epoch": 1.970776906628653, "percentage": 65.69, "elapsed_time": "10:04:29", "remaining_time": "5:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16600, "total_steps": 25254, "loss": 0.1097, "learning_rate": 1.3880521268450075e-05, "epoch": 1.9719648372535044, "percentage": 65.73, "elapsed_time": "10:04:51", "remaining_time": "5:15:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16610, "total_steps": 25254, "loss": 0.1113, "learning_rate": 1.38518141313138e-05, "epoch": 1.9731527678783558, "percentage": 65.77, "elapsed_time": "10:05:12", "remaining_time": "5:14:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16620, "total_steps": 25254, "loss": 0.1107, "learning_rate": 1.3823125330554967e-05, "epoch": 1.9743406985032075, "percentage": 65.81, "elapsed_time": "10:05:34", "remaining_time": "5:14:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16630, "total_steps": 25254, "loss": 0.1121, "learning_rate": 1.379445491336051e-05, "epoch": 1.975528629128059, "percentage": 65.85, "elapsed_time": "10:05:56", "remaining_time": "5:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16640, "total_steps": 25254, "loss": 0.1132, "learning_rate": 1.3765802926887119e-05, "epoch": 1.9767165597529104, "percentage": 65.89, "elapsed_time": "10:06:18", "remaining_time": "5:13:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16650, "total_steps": 25254, "loss": 0.1104, "learning_rate": 1.3737169418261176e-05, "epoch": 1.977904490377762, "percentage": 65.93, "elapsed_time": "10:06:39", "remaining_time": "5:13:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16660, "total_steps": 25254, "loss": 0.1124, "learning_rate": 1.3708554434578658e-05, "epoch": 1.9790924210026133, "percentage": 65.97, "elapsed_time": "10:07:00", "remaining_time": "5:13:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16670, "total_steps": 25254, "loss": 0.1097, "learning_rate": 1.3679958022905104e-05, "epoch": 1.980280351627465, "percentage": 66.01, "elapsed_time": "10:07:22", "remaining_time": "5:12:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16680, "total_steps": 25254, "loss": 0.1128, "learning_rate": 1.3651380230275471e-05, "epoch": 1.9814682822523164, "percentage": 66.05, "elapsed_time": "10:07:44", "remaining_time": "5:12:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16690, "total_steps": 25254, "loss": 0.1094, "learning_rate": 1.362282110369411e-05, "epoch": 1.9826562128771679, "percentage": 66.09, "elapsed_time": "10:08:05", "remaining_time": "5:12:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16700, "total_steps": 25254, "loss": 0.1104, "learning_rate": 1.3594280690134664e-05, "epoch": 1.9838441435020195, "percentage": 66.13, "elapsed_time": "10:08:27", "remaining_time": "5:11:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16710, "total_steps": 25254, "loss": 0.1116, "learning_rate": 1.3565759036539988e-05, "epoch": 1.985032074126871, "percentage": 66.17, "elapsed_time": "10:08:48", "remaining_time": "5:11:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16720, "total_steps": 25254, "loss": 0.112, "learning_rate": 1.3537256189822113e-05, "epoch": 1.9862200047517224, "percentage": 66.21, "elapsed_time": "10:09:10", "remaining_time": "5:10:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16730, "total_steps": 25254, "loss": 0.1123, "learning_rate": 1.3508772196862104e-05, "epoch": 1.9874079353765741, "percentage": 66.25, "elapsed_time": "10:09:31", "remaining_time": "5:10:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16740, "total_steps": 25254, "loss": 0.1118, "learning_rate": 1.3480307104510031e-05, "epoch": 1.9885958660014256, "percentage": 66.29, "elapsed_time": "10:09:53", "remaining_time": "5:10:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16750, "total_steps": 25254, "loss": 0.1114, "learning_rate": 1.3451860959584869e-05, "epoch": 1.989783796626277, "percentage": 66.33, "elapsed_time": "10:10:15", "remaining_time": "5:09:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16760, "total_steps": 25254, "loss": 0.1089, "learning_rate": 1.3423433808874436e-05, "epoch": 1.9909717272511287, "percentage": 66.37, "elapsed_time": "10:10:37", "remaining_time": "5:09:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16770, "total_steps": 25254, "loss": 0.1135, "learning_rate": 1.3395025699135299e-05, "epoch": 1.99215965787598, "percentage": 66.41, "elapsed_time": "10:10:59", "remaining_time": "5:09:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16780, "total_steps": 25254, "loss": 0.1088, "learning_rate": 1.336663667709272e-05, "epoch": 1.9933475885008316, "percentage": 66.44, "elapsed_time": "10:11:21", "remaining_time": "5:08:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16790, "total_steps": 25254, "loss": 0.1091, "learning_rate": 1.333826678944055e-05, "epoch": 1.994535519125683, "percentage": 66.48, "elapsed_time": "10:11:42", "remaining_time": "5:08:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16800, "total_steps": 25254, "loss": 0.1118, "learning_rate": 1.3309916082841179e-05, "epoch": 1.9957234497505345, "percentage": 66.52, "elapsed_time": "10:12:05", "remaining_time": "5:08:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16810, "total_steps": 25254, "loss": 0.1101, "learning_rate": 1.3281584603925451e-05, "epoch": 1.9969113803753862, "percentage": 66.56, "elapsed_time": "10:12:28", "remaining_time": "5:07:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16820, "total_steps": 25254, "loss": 0.1142, "learning_rate": 1.3253272399292577e-05, "epoch": 1.9980993110002376, "percentage": 66.6, "elapsed_time": "10:12:50", "remaining_time": "5:07:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16830, "total_steps": 25254, "loss": 0.1095, "learning_rate": 1.3224979515510066e-05, "epoch": 1.999287241625089, "percentage": 66.64, "elapsed_time": "10:13:11", "remaining_time": "5:06:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16840, "total_steps": 25254, "loss": 0.1009, "learning_rate": 1.3196705999113656e-05, "epoch": 2.0004751722499408, "percentage": 66.68, "elapsed_time": "10:13:42", "remaining_time": "5:06:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16850, "total_steps": 25254, "loss": 0.089, "learning_rate": 1.316845189660721e-05, "epoch": 2.001663102874792, "percentage": 66.72, "elapsed_time": "10:14:04", "remaining_time": "5:06:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16860, "total_steps": 25254, "loss": 0.0899, "learning_rate": 1.3140217254462688e-05, "epoch": 2.0028510334996437, "percentage": 66.76, "elapsed_time": "10:14:26", "remaining_time": "5:05:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16870, "total_steps": 25254, "loss": 0.0851, "learning_rate": 1.3112002119120025e-05, "epoch": 2.0040389641244953, "percentage": 66.8, "elapsed_time": "10:14:48", "remaining_time": "5:05:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16880, "total_steps": 25254, "loss": 0.0891, "learning_rate": 1.3083806536987075e-05, "epoch": 2.0052268947493466, "percentage": 66.84, "elapsed_time": "10:15:10", "remaining_time": "5:05:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16890, "total_steps": 25254, "loss": 0.087, "learning_rate": 1.3055630554439527e-05, "epoch": 2.0064148253741982, "percentage": 66.88, "elapsed_time": "10:15:32", "remaining_time": "5:04:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16900, "total_steps": 25254, "loss": 0.0879, "learning_rate": 1.3027474217820825e-05, "epoch": 2.0076027559990495, "percentage": 66.92, "elapsed_time": "10:15:53", "remaining_time": "5:04:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16910, "total_steps": 25254, "loss": 0.0888, "learning_rate": 1.2999337573442133e-05, "epoch": 2.008790686623901, "percentage": 66.96, "elapsed_time": "10:16:15", "remaining_time": "5:04:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16920, "total_steps": 25254, "loss": 0.087, "learning_rate": 1.2971220667582196e-05, "epoch": 2.009978617248753, "percentage": 67.0, "elapsed_time": "10:16:37", "remaining_time": "5:03:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16930, "total_steps": 25254, "loss": 0.088, "learning_rate": 1.294312354648729e-05, "epoch": 2.011166547873604, "percentage": 67.04, "elapsed_time": "10:16:58", "remaining_time": "5:03:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16940, "total_steps": 25254, "loss": 0.0865, "learning_rate": 1.291504625637117e-05, "epoch": 2.0123544784984557, "percentage": 67.08, "elapsed_time": "10:17:20", "remaining_time": "5:02:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16950, "total_steps": 25254, "loss": 0.0863, "learning_rate": 1.2886988843414962e-05, "epoch": 2.0135424091233074, "percentage": 67.12, "elapsed_time": "10:17:41", "remaining_time": "5:02:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16960, "total_steps": 25254, "loss": 0.0868, "learning_rate": 1.2858951353767096e-05, "epoch": 2.0147303397481586, "percentage": 67.16, "elapsed_time": "10:18:03", "remaining_time": "5:02:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16970, "total_steps": 25254, "loss": 0.0869, "learning_rate": 1.2830933833543237e-05, "epoch": 2.0159182703730103, "percentage": 67.2, "elapsed_time": "10:18:25", "remaining_time": "5:01:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16980, "total_steps": 25254, "loss": 0.0856, "learning_rate": 1.2802936328826204e-05, "epoch": 2.0171062009978615, "percentage": 67.24, "elapsed_time": "10:18:46", "remaining_time": "5:01:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 16990, "total_steps": 25254, "loss": 0.0876, "learning_rate": 1.2774958885665883e-05, "epoch": 2.018294131622713, "percentage": 67.28, "elapsed_time": "10:19:08", "remaining_time": "5:01:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17000, "total_steps": 25254, "loss": 0.0871, "learning_rate": 1.27470015500792e-05, "epoch": 2.019482062247565, "percentage": 67.32, "elapsed_time": "10:19:29", "remaining_time": "5:00:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17010, "total_steps": 25254, "loss": 0.0847, "learning_rate": 1.2719064368049962e-05, "epoch": 2.020669992872416, "percentage": 67.36, "elapsed_time": "10:19:52", "remaining_time": "5:00:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17020, "total_steps": 25254, "loss": 0.087, "learning_rate": 1.269114738552886e-05, "epoch": 2.021857923497268, "percentage": 67.4, "elapsed_time": "10:20:14", "remaining_time": "5:00:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17030, "total_steps": 25254, "loss": 0.0853, "learning_rate": 1.266325064843334e-05, "epoch": 2.0230458541221195, "percentage": 67.43, "elapsed_time": "10:20:35", "remaining_time": "4:59:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17040, "total_steps": 25254, "loss": 0.0881, "learning_rate": 1.2635374202647554e-05, "epoch": 2.0242337847469707, "percentage": 67.47, "elapsed_time": "10:20:57", "remaining_time": "4:59:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17050, "total_steps": 25254, "loss": 0.0859, "learning_rate": 1.26075180940223e-05, "epoch": 2.0254217153718224, "percentage": 67.51, "elapsed_time": "10:21:19", "remaining_time": "4:58:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17060, "total_steps": 25254, "loss": 0.0881, "learning_rate": 1.2579682368374901e-05, "epoch": 2.0266096459966736, "percentage": 67.55, "elapsed_time": "10:21:41", "remaining_time": "4:58:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17070, "total_steps": 25254, "loss": 0.084, "learning_rate": 1.2551867071489163e-05, "epoch": 2.0277975766215253, "percentage": 67.59, "elapsed_time": "10:22:03", "remaining_time": "4:58:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17080, "total_steps": 25254, "loss": 0.0874, "learning_rate": 1.2524072249115288e-05, "epoch": 2.028985507246377, "percentage": 67.63, "elapsed_time": "10:22:25", "remaining_time": "4:57:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17090, "total_steps": 25254, "loss": 0.0874, "learning_rate": 1.2496297946969804e-05, "epoch": 2.030173437871228, "percentage": 67.67, "elapsed_time": "10:22:47", "remaining_time": "4:57:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17100, "total_steps": 25254, "loss": 0.0852, "learning_rate": 1.2468544210735492e-05, "epoch": 2.03136136849608, "percentage": 67.71, "elapsed_time": "10:23:08", "remaining_time": "4:57:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17110, "total_steps": 25254, "loss": 0.0884, "learning_rate": 1.2440811086061297e-05, "epoch": 2.0325492991209315, "percentage": 67.75, "elapsed_time": "10:23:30", "remaining_time": "4:56:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17120, "total_steps": 25254, "loss": 0.0843, "learning_rate": 1.2413098618562272e-05, "epoch": 2.0337372297457827, "percentage": 67.79, "elapsed_time": "10:23:51", "remaining_time": "4:56:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17130, "total_steps": 25254, "loss": 0.0887, "learning_rate": 1.2385406853819475e-05, "epoch": 2.0349251603706344, "percentage": 67.83, "elapsed_time": "10:24:12", "remaining_time": "4:56:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17140, "total_steps": 25254, "loss": 0.0847, "learning_rate": 1.2357735837379949e-05, "epoch": 2.0361130909954857, "percentage": 67.87, "elapsed_time": "10:24:34", "remaining_time": "4:55:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17150, "total_steps": 25254, "loss": 0.0855, "learning_rate": 1.2330085614756582e-05, "epoch": 2.0373010216203373, "percentage": 67.91, "elapsed_time": "10:24:56", "remaining_time": "4:55:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17160, "total_steps": 25254, "loss": 0.0851, "learning_rate": 1.2302456231428059e-05, "epoch": 2.038488952245189, "percentage": 67.95, "elapsed_time": "10:25:18", "remaining_time": "4:54:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17170, "total_steps": 25254, "loss": 0.0886, "learning_rate": 1.2274847732838801e-05, "epoch": 2.0396768828700402, "percentage": 67.99, "elapsed_time": "10:25:40", "remaining_time": "4:54:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17180, "total_steps": 25254, "loss": 0.0901, "learning_rate": 1.2247260164398864e-05, "epoch": 2.040864813494892, "percentage": 68.03, "elapsed_time": "10:26:03", "remaining_time": "4:54:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17190, "total_steps": 25254, "loss": 0.0893, "learning_rate": 1.2219693571483904e-05, "epoch": 2.0420527441197436, "percentage": 68.07, "elapsed_time": "10:26:24", "remaining_time": "4:53:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17200, "total_steps": 25254, "loss": 0.0877, "learning_rate": 1.2192147999435052e-05, "epoch": 2.043240674744595, "percentage": 68.11, "elapsed_time": "10:26:47", "remaining_time": "4:53:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17210, "total_steps": 25254, "loss": 0.0894, "learning_rate": 1.2164623493558875e-05, "epoch": 2.0444286053694465, "percentage": 68.15, "elapsed_time": "10:27:09", "remaining_time": "4:53:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17220, "total_steps": 25254, "loss": 0.0876, "learning_rate": 1.2137120099127289e-05, "epoch": 2.0456165359942977, "percentage": 68.19, "elapsed_time": "10:27:31", "remaining_time": "4:52:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17230, "total_steps": 25254, "loss": 0.0852, "learning_rate": 1.210963786137747e-05, "epoch": 2.0468044666191494, "percentage": 68.23, "elapsed_time": "10:27:52", "remaining_time": "4:52:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17240, "total_steps": 25254, "loss": 0.0842, "learning_rate": 1.208217682551184e-05, "epoch": 2.047992397244001, "percentage": 68.27, "elapsed_time": "10:28:14", "remaining_time": "4:52:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17250, "total_steps": 25254, "loss": 0.0848, "learning_rate": 1.2054737036697905e-05, "epoch": 2.0491803278688523, "percentage": 68.31, "elapsed_time": "10:28:37", "remaining_time": "4:51:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17260, "total_steps": 25254, "loss": 0.0855, "learning_rate": 1.202731854006824e-05, "epoch": 2.050368258493704, "percentage": 68.35, "elapsed_time": "10:28:59", "remaining_time": "4:51:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17270, "total_steps": 25254, "loss": 0.0847, "learning_rate": 1.1999921380720394e-05, "epoch": 2.0515561891185556, "percentage": 68.39, "elapsed_time": "10:29:21", "remaining_time": "4:50:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17280, "total_steps": 25254, "loss": 0.0835, "learning_rate": 1.1972545603716832e-05, "epoch": 2.052744119743407, "percentage": 68.42, "elapsed_time": "10:29:43", "remaining_time": "4:50:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17290, "total_steps": 25254, "loss": 0.0885, "learning_rate": 1.1945191254084833e-05, "epoch": 2.0539320503682585, "percentage": 68.46, "elapsed_time": "10:30:05", "remaining_time": "4:50:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17300, "total_steps": 25254, "loss": 0.0852, "learning_rate": 1.1917858376816454e-05, "epoch": 2.05511998099311, "percentage": 68.5, "elapsed_time": "10:30:26", "remaining_time": "4:49:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17310, "total_steps": 25254, "loss": 0.0837, "learning_rate": 1.1890547016868415e-05, "epoch": 2.0563079116179614, "percentage": 68.54, "elapsed_time": "10:30:48", "remaining_time": "4:49:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17320, "total_steps": 25254, "loss": 0.0869, "learning_rate": 1.1863257219162041e-05, "epoch": 2.057495842242813, "percentage": 68.58, "elapsed_time": "10:31:10", "remaining_time": "4:49:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17330, "total_steps": 25254, "loss": 0.0881, "learning_rate": 1.1835989028583228e-05, "epoch": 2.0586837728676644, "percentage": 68.62, "elapsed_time": "10:31:31", "remaining_time": "4:48:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17340, "total_steps": 25254, "loss": 0.0881, "learning_rate": 1.1808742489982291e-05, "epoch": 2.059871703492516, "percentage": 68.66, "elapsed_time": "10:31:53", "remaining_time": "4:48:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17350, "total_steps": 25254, "loss": 0.0843, "learning_rate": 1.1781517648173954e-05, "epoch": 2.0610596341173677, "percentage": 68.7, "elapsed_time": "10:32:14", "remaining_time": "4:48:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17360, "total_steps": 25254, "loss": 0.0894, "learning_rate": 1.175431454793725e-05, "epoch": 2.062247564742219, "percentage": 68.74, "elapsed_time": "10:32:37", "remaining_time": "4:47:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17370, "total_steps": 25254, "loss": 0.088, "learning_rate": 1.1727133234015439e-05, "epoch": 2.0634354953670706, "percentage": 68.78, "elapsed_time": "10:32:59", "remaining_time": "4:47:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17380, "total_steps": 25254, "loss": 0.0912, "learning_rate": 1.1699973751115977e-05, "epoch": 2.0646234259919223, "percentage": 68.82, "elapsed_time": "10:33:20", "remaining_time": "4:46:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17390, "total_steps": 25254, "loss": 0.0876, "learning_rate": 1.167283614391039e-05, "epoch": 2.0658113566167735, "percentage": 68.86, "elapsed_time": "10:33:42", "remaining_time": "4:46:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17400, "total_steps": 25254, "loss": 0.0877, "learning_rate": 1.1645720457034224e-05, "epoch": 2.066999287241625, "percentage": 68.9, "elapsed_time": "10:34:03", "remaining_time": "4:46:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17410, "total_steps": 25254, "loss": 0.0851, "learning_rate": 1.1618626735086974e-05, "epoch": 2.0681872178664764, "percentage": 68.94, "elapsed_time": "10:34:25", "remaining_time": "4:45:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17420, "total_steps": 25254, "loss": 0.085, "learning_rate": 1.1591555022632013e-05, "epoch": 2.069375148491328, "percentage": 68.98, "elapsed_time": "10:34:46", "remaining_time": "4:45:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17430, "total_steps": 25254, "loss": 0.0869, "learning_rate": 1.1564505364196506e-05, "epoch": 2.0705630791161798, "percentage": 69.02, "elapsed_time": "10:35:08", "remaining_time": "4:45:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17440, "total_steps": 25254, "loss": 0.0863, "learning_rate": 1.1537477804271346e-05, "epoch": 2.071751009741031, "percentage": 69.06, "elapsed_time": "10:35:30", "remaining_time": "4:44:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17450, "total_steps": 25254, "loss": 0.0868, "learning_rate": 1.1510472387311078e-05, "epoch": 2.0729389403658827, "percentage": 69.1, "elapsed_time": "10:35:52", "remaining_time": "4:44:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17460, "total_steps": 25254, "loss": 0.0856, "learning_rate": 1.1483489157733817e-05, "epoch": 2.0741268709907343, "percentage": 69.14, "elapsed_time": "10:36:14", "remaining_time": "4:44:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17470, "total_steps": 25254, "loss": 0.0854, "learning_rate": 1.1456528159921217e-05, "epoch": 2.0753148016155856, "percentage": 69.18, "elapsed_time": "10:36:36", "remaining_time": "4:43:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17480, "total_steps": 25254, "loss": 0.0873, "learning_rate": 1.1429589438218336e-05, "epoch": 2.0765027322404372, "percentage": 69.22, "elapsed_time": "10:36:58", "remaining_time": "4:43:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17490, "total_steps": 25254, "loss": 0.0845, "learning_rate": 1.1402673036933592e-05, "epoch": 2.0776906628652885, "percentage": 69.26, "elapsed_time": "10:37:21", "remaining_time": "4:42:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17500, "total_steps": 25254, "loss": 0.0845, "learning_rate": 1.1375779000338708e-05, "epoch": 2.07887859349014, "percentage": 69.3, "elapsed_time": "10:37:43", "remaining_time": "4:42:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17510, "total_steps": 25254, "loss": 0.0846, "learning_rate": 1.1348907372668593e-05, "epoch": 2.080066524114992, "percentage": 69.34, "elapsed_time": "10:38:04", "remaining_time": "4:42:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17520, "total_steps": 25254, "loss": 0.0854, "learning_rate": 1.1322058198121347e-05, "epoch": 2.081254454739843, "percentage": 69.38, "elapsed_time": "10:38:26", "remaining_time": "4:41:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17530, "total_steps": 25254, "loss": 0.0871, "learning_rate": 1.1295231520858093e-05, "epoch": 2.0824423853646947, "percentage": 69.41, "elapsed_time": "10:38:49", "remaining_time": "4:41:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17540, "total_steps": 25254, "loss": 0.0874, "learning_rate": 1.1268427385002972e-05, "epoch": 2.0836303159895464, "percentage": 69.45, "elapsed_time": "10:39:10", "remaining_time": "4:41:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17550, "total_steps": 25254, "loss": 0.084, "learning_rate": 1.1241645834643045e-05, "epoch": 2.0848182466143976, "percentage": 69.49, "elapsed_time": "10:39:32", "remaining_time": "4:40:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17560, "total_steps": 25254, "loss": 0.0863, "learning_rate": 1.1214886913828212e-05, "epoch": 2.0860061772392493, "percentage": 69.53, "elapsed_time": "10:39:54", "remaining_time": "4:40:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17570, "total_steps": 25254, "loss": 0.0839, "learning_rate": 1.118815066657119e-05, "epoch": 2.0871941078641005, "percentage": 69.57, "elapsed_time": "10:40:16", "remaining_time": "4:40:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17580, "total_steps": 25254, "loss": 0.0862, "learning_rate": 1.116143713684736e-05, "epoch": 2.088382038488952, "percentage": 69.61, "elapsed_time": "10:40:37", "remaining_time": "4:39:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17590, "total_steps": 25254, "loss": 0.0836, "learning_rate": 1.1134746368594765e-05, "epoch": 2.089569969113804, "percentage": 69.65, "elapsed_time": "10:41:00", "remaining_time": "4:39:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17600, "total_steps": 25254, "loss": 0.0857, "learning_rate": 1.1108078405713992e-05, "epoch": 2.090757899738655, "percentage": 69.69, "elapsed_time": "10:41:21", "remaining_time": "4:38:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17610, "total_steps": 25254, "loss": 0.0854, "learning_rate": 1.1081433292068133e-05, "epoch": 2.091945830363507, "percentage": 69.73, "elapsed_time": "10:41:44", "remaining_time": "4:38:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17620, "total_steps": 25254, "loss": 0.0837, "learning_rate": 1.105481107148269e-05, "epoch": 2.0931337609883585, "percentage": 69.77, "elapsed_time": "10:42:06", "remaining_time": "4:38:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17630, "total_steps": 25254, "loss": 0.0867, "learning_rate": 1.1028211787745512e-05, "epoch": 2.0943216916132097, "percentage": 69.81, "elapsed_time": "10:42:28", "remaining_time": "4:37:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17640, "total_steps": 25254, "loss": 0.0876, "learning_rate": 1.100163548460672e-05, "epoch": 2.0955096222380614, "percentage": 69.85, "elapsed_time": "10:42:50", "remaining_time": "4:37:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17650, "total_steps": 25254, "loss": 0.0854, "learning_rate": 1.0975082205778637e-05, "epoch": 2.0966975528629126, "percentage": 69.89, "elapsed_time": "10:43:12", "remaining_time": "4:37:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17660, "total_steps": 25254, "loss": 0.0854, "learning_rate": 1.0948551994935726e-05, "epoch": 2.0978854834877643, "percentage": 69.93, "elapsed_time": "10:43:34", "remaining_time": "4:36:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17670, "total_steps": 25254, "loss": 0.0846, "learning_rate": 1.09220448957145e-05, "epoch": 2.099073414112616, "percentage": 69.97, "elapsed_time": "10:43:56", "remaining_time": "4:36:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17680, "total_steps": 25254, "loss": 0.0876, "learning_rate": 1.0895560951713455e-05, "epoch": 2.100261344737467, "percentage": 70.01, "elapsed_time": "10:44:19", "remaining_time": "4:36:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17690, "total_steps": 25254, "loss": 0.0843, "learning_rate": 1.0869100206493004e-05, "epoch": 2.101449275362319, "percentage": 70.05, "elapsed_time": "10:44:40", "remaining_time": "4:35:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17700, "total_steps": 25254, "loss": 0.0861, "learning_rate": 1.0842662703575398e-05, "epoch": 2.1026372059871705, "percentage": 70.09, "elapsed_time": "10:45:02", "remaining_time": "4:35:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17710, "total_steps": 25254, "loss": 0.0894, "learning_rate": 1.0816248486444684e-05, "epoch": 2.1038251366120218, "percentage": 70.13, "elapsed_time": "10:45:24", "remaining_time": "4:34:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17720, "total_steps": 25254, "loss": 0.0885, "learning_rate": 1.0789857598546575e-05, "epoch": 2.1050130672368734, "percentage": 70.17, "elapsed_time": "10:45:46", "remaining_time": "4:34:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17730, "total_steps": 25254, "loss": 0.087, "learning_rate": 1.0763490083288433e-05, "epoch": 2.106200997861725, "percentage": 70.21, "elapsed_time": "10:46:08", "remaining_time": "4:34:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17740, "total_steps": 25254, "loss": 0.084, "learning_rate": 1.0737145984039174e-05, "epoch": 2.1073889284865763, "percentage": 70.25, "elapsed_time": "10:46:30", "remaining_time": "4:33:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17750, "total_steps": 25254, "loss": 0.0854, "learning_rate": 1.071082534412919e-05, "epoch": 2.108576859111428, "percentage": 70.29, "elapsed_time": "10:46:51", "remaining_time": "4:33:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17760, "total_steps": 25254, "loss": 0.0832, "learning_rate": 1.0684528206850303e-05, "epoch": 2.1097647897362792, "percentage": 70.33, "elapsed_time": "10:47:13", "remaining_time": "4:33:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17770, "total_steps": 25254, "loss": 0.0868, "learning_rate": 1.0658254615455664e-05, "epoch": 2.110952720361131, "percentage": 70.37, "elapsed_time": "10:47:35", "remaining_time": "4:32:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17780, "total_steps": 25254, "loss": 0.087, "learning_rate": 1.0632004613159707e-05, "epoch": 2.1121406509859826, "percentage": 70.4, "elapsed_time": "10:47:57", "remaining_time": "4:32:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17790, "total_steps": 25254, "loss": 0.0848, "learning_rate": 1.060577824313805e-05, "epoch": 2.113328581610834, "percentage": 70.44, "elapsed_time": "10:48:19", "remaining_time": "4:32:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17800, "total_steps": 25254, "loss": 0.0851, "learning_rate": 1.0579575548527474e-05, "epoch": 2.1145165122356855, "percentage": 70.48, "elapsed_time": "10:48:40", "remaining_time": "4:31:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17810, "total_steps": 25254, "loss": 0.0844, "learning_rate": 1.0553396572425783e-05, "epoch": 2.1157044428605367, "percentage": 70.52, "elapsed_time": "10:49:02", "remaining_time": "4:31:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17820, "total_steps": 25254, "loss": 0.0864, "learning_rate": 1.052724135789179e-05, "epoch": 2.1168923734853884, "percentage": 70.56, "elapsed_time": "10:49:24", "remaining_time": "4:30:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17830, "total_steps": 25254, "loss": 0.0848, "learning_rate": 1.0501109947945217e-05, "epoch": 2.11808030411024, "percentage": 70.6, "elapsed_time": "10:49:46", "remaining_time": "4:30:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17840, "total_steps": 25254, "loss": 0.0831, "learning_rate": 1.0475002385566629e-05, "epoch": 2.1192682347350913, "percentage": 70.64, "elapsed_time": "10:50:08", "remaining_time": "4:30:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17850, "total_steps": 25254, "loss": 0.0849, "learning_rate": 1.044891871369739e-05, "epoch": 2.120456165359943, "percentage": 70.68, "elapsed_time": "10:50:30", "remaining_time": "4:29:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17860, "total_steps": 25254, "loss": 0.0853, "learning_rate": 1.0422858975239539e-05, "epoch": 2.1216440959847946, "percentage": 70.72, "elapsed_time": "10:50:52", "remaining_time": "4:29:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17870, "total_steps": 25254, "loss": 0.0878, "learning_rate": 1.0396823213055767e-05, "epoch": 2.122832026609646, "percentage": 70.76, "elapsed_time": "10:51:13", "remaining_time": "4:29:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17880, "total_steps": 25254, "loss": 0.0845, "learning_rate": 1.0370811469969327e-05, "epoch": 2.1240199572344975, "percentage": 70.8, "elapsed_time": "10:51:35", "remaining_time": "4:28:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17890, "total_steps": 25254, "loss": 0.0816, "learning_rate": 1.0344823788763949e-05, "epoch": 2.125207887859349, "percentage": 70.84, "elapsed_time": "10:51:57", "remaining_time": "4:28:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17900, "total_steps": 25254, "loss": 0.0833, "learning_rate": 1.0318860212183823e-05, "epoch": 2.1263958184842005, "percentage": 70.88, "elapsed_time": "10:52:19", "remaining_time": "4:27:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17910, "total_steps": 25254, "loss": 0.0863, "learning_rate": 1.029292078293346e-05, "epoch": 2.127583749109052, "percentage": 70.92, "elapsed_time": "10:52:40", "remaining_time": "4:27:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17920, "total_steps": 25254, "loss": 0.0875, "learning_rate": 1.0267005543677678e-05, "epoch": 2.1287716797339034, "percentage": 70.96, "elapsed_time": "10:53:02", "remaining_time": "4:27:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17930, "total_steps": 25254, "loss": 0.0873, "learning_rate": 1.0241114537041458e-05, "epoch": 2.129959610358755, "percentage": 71.0, "elapsed_time": "10:53:23", "remaining_time": "4:26:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17940, "total_steps": 25254, "loss": 0.0876, "learning_rate": 1.021524780560999e-05, "epoch": 2.1311475409836067, "percentage": 71.04, "elapsed_time": "10:53:45", "remaining_time": "4:26:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17950, "total_steps": 25254, "loss": 0.0873, "learning_rate": 1.0189405391928497e-05, "epoch": 2.132335471608458, "percentage": 71.08, "elapsed_time": "10:54:06", "remaining_time": "4:26:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17960, "total_steps": 25254, "loss": 0.0855, "learning_rate": 1.0163587338502214e-05, "epoch": 2.1335234022333096, "percentage": 71.12, "elapsed_time": "10:54:28", "remaining_time": "4:25:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17970, "total_steps": 25254, "loss": 0.0833, "learning_rate": 1.0137793687796307e-05, "epoch": 2.1347113328581613, "percentage": 71.16, "elapsed_time": "10:54:50", "remaining_time": "4:25:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17980, "total_steps": 25254, "loss": 0.0835, "learning_rate": 1.0112024482235799e-05, "epoch": 2.1358992634830125, "percentage": 71.2, "elapsed_time": "10:55:12", "remaining_time": "4:25:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 17990, "total_steps": 25254, "loss": 0.0869, "learning_rate": 1.0086279764205525e-05, "epoch": 2.137087194107864, "percentage": 71.24, "elapsed_time": "10:55:34", "remaining_time": "4:24:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18000, "total_steps": 25254, "loss": 0.085, "learning_rate": 1.0060559576050027e-05, "epoch": 2.1382751247327154, "percentage": 71.28, "elapsed_time": "10:55:56", "remaining_time": "4:24:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18010, "total_steps": 25254, "loss": 0.0858, "learning_rate": 1.00348639600735e-05, "epoch": 2.139463055357567, "percentage": 71.32, "elapsed_time": "10:56:18", "remaining_time": "4:23:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18020, "total_steps": 25254, "loss": 0.0888, "learning_rate": 1.0009192958539731e-05, "epoch": 2.1406509859824188, "percentage": 71.36, "elapsed_time": "10:56:40", "remaining_time": "4:23:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18030, "total_steps": 25254, "loss": 0.0847, "learning_rate": 9.983546613672007e-06, "epoch": 2.14183891660727, "percentage": 71.39, "elapsed_time": "10:57:01", "remaining_time": "4:23:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18040, "total_steps": 25254, "loss": 0.0833, "learning_rate": 9.957924967653092e-06, "epoch": 2.1430268472321217, "percentage": 71.43, "elapsed_time": "10:57:23", "remaining_time": "4:22:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18050, "total_steps": 25254, "loss": 0.0872, "learning_rate": 9.932328062625093e-06, "epoch": 2.1442147778569733, "percentage": 71.47, "elapsed_time": "10:57:45", "remaining_time": "4:22:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18060, "total_steps": 25254, "loss": 0.0832, "learning_rate": 9.906755940689433e-06, "epoch": 2.1454027084818246, "percentage": 71.51, "elapsed_time": "10:58:07", "remaining_time": "4:22:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18070, "total_steps": 25254, "loss": 0.0863, "learning_rate": 9.881208643906777e-06, "epoch": 2.1465906391066762, "percentage": 71.55, "elapsed_time": "10:58:30", "remaining_time": "4:21:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18080, "total_steps": 25254, "loss": 0.0853, "learning_rate": 9.855686214296958e-06, "epoch": 2.1477785697315275, "percentage": 71.59, "elapsed_time": "10:58:52", "remaining_time": "4:21:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18090, "total_steps": 25254, "loss": 0.0856, "learning_rate": 9.830188693838899e-06, "epoch": 2.148966500356379, "percentage": 71.63, "elapsed_time": "10:59:14", "remaining_time": "4:21:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18100, "total_steps": 25254, "loss": 0.0843, "learning_rate": 9.804716124470561e-06, "epoch": 2.150154430981231, "percentage": 71.67, "elapsed_time": "10:59:36", "remaining_time": "4:20:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18110, "total_steps": 25254, "loss": 0.0898, "learning_rate": 9.779268548088866e-06, "epoch": 2.151342361606082, "percentage": 71.71, "elapsed_time": "10:59:58", "remaining_time": "4:20:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18120, "total_steps": 25254, "loss": 0.085, "learning_rate": 9.753846006549613e-06, "epoch": 2.1525302922309337, "percentage": 71.75, "elapsed_time": "11:00:21", "remaining_time": "4:19:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18130, "total_steps": 25254, "loss": 0.0834, "learning_rate": 9.728448541667456e-06, "epoch": 2.1537182228557854, "percentage": 71.79, "elapsed_time": "11:00:43", "remaining_time": "4:19:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18140, "total_steps": 25254, "loss": 0.0892, "learning_rate": 9.703076195215776e-06, "epoch": 2.1549061534806366, "percentage": 71.83, "elapsed_time": "11:01:05", "remaining_time": "4:19:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18150, "total_steps": 25254, "loss": 0.0854, "learning_rate": 9.677729008926645e-06, "epoch": 2.1560940841054883, "percentage": 71.87, "elapsed_time": "11:01:26", "remaining_time": "4:18:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18160, "total_steps": 25254, "loss": 0.0842, "learning_rate": 9.652407024490757e-06, "epoch": 2.15728201473034, "percentage": 71.91, "elapsed_time": "11:01:49", "remaining_time": "4:18:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18170, "total_steps": 25254, "loss": 0.0857, "learning_rate": 9.627110283557339e-06, "epoch": 2.158469945355191, "percentage": 71.95, "elapsed_time": "11:02:10", "remaining_time": "4:18:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18180, "total_steps": 25254, "loss": 0.0869, "learning_rate": 9.60183882773413e-06, "epoch": 2.159657875980043, "percentage": 71.99, "elapsed_time": "11:02:32", "remaining_time": "4:17:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18190, "total_steps": 25254, "loss": 0.0849, "learning_rate": 9.576592698587253e-06, "epoch": 2.160845806604894, "percentage": 72.03, "elapsed_time": "11:02:54", "remaining_time": "4:17:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18200, "total_steps": 25254, "loss": 0.0848, "learning_rate": 9.551371937641178e-06, "epoch": 2.162033737229746, "percentage": 72.07, "elapsed_time": "11:03:16", "remaining_time": "4:17:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18210, "total_steps": 25254, "loss": 0.0852, "learning_rate": 9.526176586378663e-06, "epoch": 2.1632216678545975, "percentage": 72.11, "elapsed_time": "11:03:38", "remaining_time": "4:16:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18220, "total_steps": 25254, "loss": 0.0865, "learning_rate": 9.501006686240643e-06, "epoch": 2.1644095984794487, "percentage": 72.15, "elapsed_time": "11:04:00", "remaining_time": "4:16:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18230, "total_steps": 25254, "loss": 0.0837, "learning_rate": 9.475862278626236e-06, "epoch": 2.1655975291043004, "percentage": 72.19, "elapsed_time": "11:04:21", "remaining_time": "4:15:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18240, "total_steps": 25254, "loss": 0.0847, "learning_rate": 9.450743404892603e-06, "epoch": 2.1667854597291516, "percentage": 72.23, "elapsed_time": "11:04:44", "remaining_time": "4:15:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18250, "total_steps": 25254, "loss": 0.0827, "learning_rate": 9.425650106354894e-06, "epoch": 2.1679733903540033, "percentage": 72.27, "elapsed_time": "11:05:06", "remaining_time": "4:15:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18260, "total_steps": 25254, "loss": 0.0852, "learning_rate": 9.400582424286205e-06, "epoch": 2.169161320978855, "percentage": 72.31, "elapsed_time": "11:05:28", "remaining_time": "4:14:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18270, "total_steps": 25254, "loss": 0.0855, "learning_rate": 9.375540399917529e-06, "epoch": 2.170349251603706, "percentage": 72.34, "elapsed_time": "11:05:50", "remaining_time": "4:14:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18280, "total_steps": 25254, "loss": 0.0866, "learning_rate": 9.350524074437613e-06, "epoch": 2.171537182228558, "percentage": 72.38, "elapsed_time": "11:06:11", "remaining_time": "4:14:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18290, "total_steps": 25254, "loss": 0.0837, "learning_rate": 9.32553348899296e-06, "epoch": 2.1727251128534095, "percentage": 72.42, "elapsed_time": "11:06:34", "remaining_time": "4:13:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18300, "total_steps": 25254, "loss": 0.0852, "learning_rate": 9.300568684687727e-06, "epoch": 2.1739130434782608, "percentage": 72.46, "elapsed_time": "11:06:57", "remaining_time": "4:13:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18310, "total_steps": 25254, "loss": 0.0861, "learning_rate": 9.275629702583658e-06, "epoch": 2.1751009741031124, "percentage": 72.5, "elapsed_time": "11:07:18", "remaining_time": "4:13:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18320, "total_steps": 25254, "loss": 0.0865, "learning_rate": 9.250716583700057e-06, "epoch": 2.176288904727964, "percentage": 72.54, "elapsed_time": "11:07:40", "remaining_time": "4:12:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18330, "total_steps": 25254, "loss": 0.0861, "learning_rate": 9.225829369013652e-06, "epoch": 2.1774768353528153, "percentage": 72.58, "elapsed_time": "11:08:02", "remaining_time": "4:12:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18340, "total_steps": 25254, "loss": 0.085, "learning_rate": 9.200968099458588e-06, "epoch": 2.178664765977667, "percentage": 72.62, "elapsed_time": "11:08:24", "remaining_time": "4:11:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18350, "total_steps": 25254, "loss": 0.0839, "learning_rate": 9.176132815926322e-06, "epoch": 2.1798526966025182, "percentage": 72.66, "elapsed_time": "11:08:46", "remaining_time": "4:11:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18360, "total_steps": 25254, "loss": 0.085, "learning_rate": 9.151323559265568e-06, "epoch": 2.18104062722737, "percentage": 72.7, "elapsed_time": "11:09:07", "remaining_time": "4:11:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18370, "total_steps": 25254, "loss": 0.0879, "learning_rate": 9.126540370282253e-06, "epoch": 2.1822285578522216, "percentage": 72.74, "elapsed_time": "11:09:29", "remaining_time": "4:10:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18380, "total_steps": 25254, "loss": 0.0876, "learning_rate": 9.10178328973941e-06, "epoch": 2.183416488477073, "percentage": 72.78, "elapsed_time": "11:09:51", "remaining_time": "4:10:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18390, "total_steps": 25254, "loss": 0.0861, "learning_rate": 9.077052358357128e-06, "epoch": 2.1846044191019245, "percentage": 72.82, "elapsed_time": "11:10:13", "remaining_time": "4:10:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18400, "total_steps": 25254, "loss": 0.0865, "learning_rate": 9.052347616812492e-06, "epoch": 2.185792349726776, "percentage": 72.86, "elapsed_time": "11:10:35", "remaining_time": "4:09:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18410, "total_steps": 25254, "loss": 0.0832, "learning_rate": 9.02766910573951e-06, "epoch": 2.1869802803516274, "percentage": 72.9, "elapsed_time": "11:10:56", "remaining_time": "4:09:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18420, "total_steps": 25254, "loss": 0.0858, "learning_rate": 9.003016865729047e-06, "epoch": 2.188168210976479, "percentage": 72.94, "elapsed_time": "11:11:18", "remaining_time": "4:09:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18430, "total_steps": 25254, "loss": 0.086, "learning_rate": 8.978390937328755e-06, "epoch": 2.1893561416013303, "percentage": 72.98, "elapsed_time": "11:11:39", "remaining_time": "4:08:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18440, "total_steps": 25254, "loss": 0.0851, "learning_rate": 8.953791361043007e-06, "epoch": 2.190544072226182, "percentage": 73.02, "elapsed_time": "11:12:01", "remaining_time": "4:08:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18450, "total_steps": 25254, "loss": 0.0851, "learning_rate": 8.929218177332834e-06, "epoch": 2.1917320028510336, "percentage": 73.06, "elapsed_time": "11:12:24", "remaining_time": "4:07:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18460, "total_steps": 25254, "loss": 0.0849, "learning_rate": 8.904671426615874e-06, "epoch": 2.192919933475885, "percentage": 73.1, "elapsed_time": "11:12:46", "remaining_time": "4:07:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18470, "total_steps": 25254, "loss": 0.0868, "learning_rate": 8.880151149266261e-06, "epoch": 2.1941078641007365, "percentage": 73.14, "elapsed_time": "11:13:08", "remaining_time": "4:07:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18480, "total_steps": 25254, "loss": 0.0863, "learning_rate": 8.855657385614602e-06, "epoch": 2.1952957947255882, "percentage": 73.18, "elapsed_time": "11:13:30", "remaining_time": "4:06:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18490, "total_steps": 25254, "loss": 0.0835, "learning_rate": 8.83119017594789e-06, "epoch": 2.1964837253504395, "percentage": 73.22, "elapsed_time": "11:13:51", "remaining_time": "4:06:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18500, "total_steps": 25254, "loss": 0.084, "learning_rate": 8.806749560509434e-06, "epoch": 2.197671655975291, "percentage": 73.26, "elapsed_time": "11:14:13", "remaining_time": "4:06:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18510, "total_steps": 25254, "loss": 0.0822, "learning_rate": 8.782335579498827e-06, "epoch": 2.1988595866001424, "percentage": 73.3, "elapsed_time": "11:14:35", "remaining_time": "4:05:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18520, "total_steps": 25254, "loss": 0.0848, "learning_rate": 8.75794827307183e-06, "epoch": 2.200047517224994, "percentage": 73.33, "elapsed_time": "11:14:57", "remaining_time": "4:05:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18530, "total_steps": 25254, "loss": 0.084, "learning_rate": 8.733587681340336e-06, "epoch": 2.2012354478498457, "percentage": 73.37, "elapsed_time": "11:15:19", "remaining_time": "4:05:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18540, "total_steps": 25254, "loss": 0.0849, "learning_rate": 8.709253844372303e-06, "epoch": 2.202423378474697, "percentage": 73.41, "elapsed_time": "11:15:41", "remaining_time": "4:04:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18550, "total_steps": 25254, "loss": 0.082, "learning_rate": 8.684946802191677e-06, "epoch": 2.2036113090995486, "percentage": 73.45, "elapsed_time": "11:16:02", "remaining_time": "4:04:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18560, "total_steps": 25254, "loss": 0.0824, "learning_rate": 8.660666594778333e-06, "epoch": 2.2047992397244003, "percentage": 73.49, "elapsed_time": "11:16:23", "remaining_time": "4:03:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18570, "total_steps": 25254, "loss": 0.0846, "learning_rate": 8.636413262068016e-06, "epoch": 2.2059871703492515, "percentage": 73.53, "elapsed_time": "11:16:46", "remaining_time": "4:03:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18580, "total_steps": 25254, "loss": 0.0862, "learning_rate": 8.612186843952258e-06, "epoch": 2.207175100974103, "percentage": 73.57, "elapsed_time": "11:17:07", "remaining_time": "4:03:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18590, "total_steps": 25254, "loss": 0.0836, "learning_rate": 8.58798738027832e-06, "epoch": 2.2083630315989544, "percentage": 73.61, "elapsed_time": "11:17:29", "remaining_time": "4:02:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18600, "total_steps": 25254, "loss": 0.0862, "learning_rate": 8.563814910849149e-06, "epoch": 2.209550962223806, "percentage": 73.65, "elapsed_time": "11:17:51", "remaining_time": "4:02:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18610, "total_steps": 25254, "loss": 0.0856, "learning_rate": 8.539669475423279e-06, "epoch": 2.2107388928486578, "percentage": 73.69, "elapsed_time": "11:18:13", "remaining_time": "4:02:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18620, "total_steps": 25254, "loss": 0.0839, "learning_rate": 8.515551113714767e-06, "epoch": 2.211926823473509, "percentage": 73.73, "elapsed_time": "11:18:35", "remaining_time": "4:01:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18630, "total_steps": 25254, "loss": 0.0857, "learning_rate": 8.491459865393162e-06, "epoch": 2.2131147540983607, "percentage": 73.77, "elapsed_time": "11:18:57", "remaining_time": "4:01:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18640, "total_steps": 25254, "loss": 0.0854, "learning_rate": 8.46739577008339e-06, "epoch": 2.2143026847232123, "percentage": 73.81, "elapsed_time": "11:19:19", "remaining_time": "4:01:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18650, "total_steps": 25254, "loss": 0.0845, "learning_rate": 8.443358867365749e-06, "epoch": 2.2154906153480636, "percentage": 73.85, "elapsed_time": "11:19:42", "remaining_time": "4:00:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18660, "total_steps": 25254, "loss": 0.0829, "learning_rate": 8.419349196775794e-06, "epoch": 2.2166785459729152, "percentage": 73.89, "elapsed_time": "11:20:06", "remaining_time": "4:00:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18670, "total_steps": 25254, "loss": 0.0848, "learning_rate": 8.395366797804283e-06, "epoch": 2.2178664765977665, "percentage": 73.93, "elapsed_time": "11:20:28", "remaining_time": "3:59:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18680, "total_steps": 25254, "loss": 0.0846, "learning_rate": 8.371411709897125e-06, "epoch": 2.219054407222618, "percentage": 73.97, "elapsed_time": "11:20:50", "remaining_time": "3:59:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18690, "total_steps": 25254, "loss": 0.0849, "learning_rate": 8.347483972455302e-06, "epoch": 2.22024233784747, "percentage": 74.01, "elapsed_time": "11:21:12", "remaining_time": "3:59:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18700, "total_steps": 25254, "loss": 0.0869, "learning_rate": 8.323583624834829e-06, "epoch": 2.221430268472321, "percentage": 74.05, "elapsed_time": "11:21:34", "remaining_time": "3:58:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18710, "total_steps": 25254, "loss": 0.0826, "learning_rate": 8.299710706346653e-06, "epoch": 2.2226181990971727, "percentage": 74.09, "elapsed_time": "11:21:55", "remaining_time": "3:58:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18720, "total_steps": 25254, "loss": 0.0841, "learning_rate": 8.275865256256607e-06, "epoch": 2.2238061297220244, "percentage": 74.13, "elapsed_time": "11:22:17", "remaining_time": "3:58:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18730, "total_steps": 25254, "loss": 0.082, "learning_rate": 8.25204731378535e-06, "epoch": 2.2249940603468756, "percentage": 74.17, "elapsed_time": "11:22:39", "remaining_time": "3:57:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18740, "total_steps": 25254, "loss": 0.0879, "learning_rate": 8.228256918108295e-06, "epoch": 2.2261819909717273, "percentage": 74.21, "elapsed_time": "11:23:01", "remaining_time": "3:57:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18750, "total_steps": 25254, "loss": 0.0854, "learning_rate": 8.204494108355546e-06, "epoch": 2.227369921596579, "percentage": 74.25, "elapsed_time": "11:23:23", "remaining_time": "3:57:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18760, "total_steps": 25254, "loss": 0.0861, "learning_rate": 8.180758923611834e-06, "epoch": 2.22855785222143, "percentage": 74.29, "elapsed_time": "11:23:45", "remaining_time": "3:56:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18770, "total_steps": 25254, "loss": 0.0811, "learning_rate": 8.157051402916452e-06, "epoch": 2.229745782846282, "percentage": 74.32, "elapsed_time": "11:24:07", "remaining_time": "3:56:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18780, "total_steps": 25254, "loss": 0.0839, "learning_rate": 8.133371585263183e-06, "epoch": 2.230933713471133, "percentage": 74.36, "elapsed_time": "11:24:28", "remaining_time": "3:55:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18790, "total_steps": 25254, "loss": 0.0805, "learning_rate": 8.109719509600278e-06, "epoch": 2.232121644095985, "percentage": 74.4, "elapsed_time": "11:24:50", "remaining_time": "3:55:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18800, "total_steps": 25254, "loss": 0.0838, "learning_rate": 8.086095214830317e-06, "epoch": 2.2333095747208365, "percentage": 74.44, "elapsed_time": "11:25:12", "remaining_time": "3:55:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18810, "total_steps": 25254, "loss": 0.0867, "learning_rate": 8.06249873981021e-06, "epoch": 2.2344975053456877, "percentage": 74.48, "elapsed_time": "11:25:34", "remaining_time": "3:54:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18820, "total_steps": 25254, "loss": 0.0829, "learning_rate": 8.038930123351098e-06, "epoch": 2.2356854359705394, "percentage": 74.52, "elapsed_time": "11:25:56", "remaining_time": "3:54:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18830, "total_steps": 25254, "loss": 0.0862, "learning_rate": 8.015389404218305e-06, "epoch": 2.2368733665953906, "percentage": 74.56, "elapsed_time": "11:26:18", "remaining_time": "3:54:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18840, "total_steps": 25254, "loss": 0.0835, "learning_rate": 7.991876621131278e-06, "epoch": 2.2380612972202423, "percentage": 74.6, "elapsed_time": "11:26:40", "remaining_time": "3:53:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18850, "total_steps": 25254, "loss": 0.0847, "learning_rate": 7.968391812763507e-06, "epoch": 2.239249227845094, "percentage": 74.64, "elapsed_time": "11:27:02", "remaining_time": "3:53:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18860, "total_steps": 25254, "loss": 0.0865, "learning_rate": 7.944935017742469e-06, "epoch": 2.240437158469945, "percentage": 74.68, "elapsed_time": "11:27:24", "remaining_time": "3:53:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18870, "total_steps": 25254, "loss": 0.0832, "learning_rate": 7.921506274649564e-06, "epoch": 2.241625089094797, "percentage": 74.72, "elapsed_time": "11:27:46", "remaining_time": "3:52:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18880, "total_steps": 25254, "loss": 0.0865, "learning_rate": 7.898105622020058e-06, "epoch": 2.2428130197196485, "percentage": 74.76, "elapsed_time": "11:28:08", "remaining_time": "3:52:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18890, "total_steps": 25254, "loss": 0.0826, "learning_rate": 7.87473309834301e-06, "epoch": 2.2440009503444998, "percentage": 74.8, "elapsed_time": "11:28:31", "remaining_time": "3:51:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18900, "total_steps": 25254, "loss": 0.0833, "learning_rate": 7.851388742061214e-06, "epoch": 2.2451888809693514, "percentage": 74.84, "elapsed_time": "11:28:52", "remaining_time": "3:51:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18910, "total_steps": 25254, "loss": 0.0844, "learning_rate": 7.828072591571136e-06, "epoch": 2.246376811594203, "percentage": 74.88, "elapsed_time": "11:29:14", "remaining_time": "3:51:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18920, "total_steps": 25254, "loss": 0.0889, "learning_rate": 7.80478468522284e-06, "epoch": 2.2475647422190543, "percentage": 74.92, "elapsed_time": "11:29:36", "remaining_time": "3:50:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18930, "total_steps": 25254, "loss": 0.0843, "learning_rate": 7.781525061319961e-06, "epoch": 2.248752672843906, "percentage": 74.96, "elapsed_time": "11:29:59", "remaining_time": "3:50:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18940, "total_steps": 25254, "loss": 0.0854, "learning_rate": 7.758293758119583e-06, "epoch": 2.2499406034687572, "percentage": 75.0, "elapsed_time": "11:30:21", "remaining_time": "3:50:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18950, "total_steps": 25254, "loss": 0.0822, "learning_rate": 7.73509081383223e-06, "epoch": 2.251128534093609, "percentage": 75.04, "elapsed_time": "11:30:43", "remaining_time": "3:49:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18960, "total_steps": 25254, "loss": 0.0856, "learning_rate": 7.711916266621772e-06, "epoch": 2.2523164647184606, "percentage": 75.08, "elapsed_time": "11:31:05", "remaining_time": "3:49:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18970, "total_steps": 25254, "loss": 0.0834, "learning_rate": 7.688770154605366e-06, "epoch": 2.253504395343312, "percentage": 75.12, "elapsed_time": "11:31:26", "remaining_time": "3:49:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18980, "total_steps": 25254, "loss": 0.0846, "learning_rate": 7.665652515853421e-06, "epoch": 2.2546923259681635, "percentage": 75.16, "elapsed_time": "11:31:49", "remaining_time": "3:48:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 18990, "total_steps": 25254, "loss": 0.083, "learning_rate": 7.642563388389495e-06, "epoch": 2.2558802565930147, "percentage": 75.2, "elapsed_time": "11:32:10", "remaining_time": "3:48:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19000, "total_steps": 25254, "loss": 0.0825, "learning_rate": 7.61950281019026e-06, "epoch": 2.2570681872178664, "percentage": 75.24, "elapsed_time": "11:32:32", "remaining_time": "3:47:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19010, "total_steps": 25254, "loss": 0.0836, "learning_rate": 7.596470819185419e-06, "epoch": 2.258256117842718, "percentage": 75.28, "elapsed_time": "11:32:55", "remaining_time": "3:47:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19020, "total_steps": 25254, "loss": 0.0839, "learning_rate": 7.57346745325766e-06, "epoch": 2.2594440484675697, "percentage": 75.31, "elapsed_time": "11:33:17", "remaining_time": "3:47:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19030, "total_steps": 25254, "loss": 0.0863, "learning_rate": 7.550492750242605e-06, "epoch": 2.260631979092421, "percentage": 75.35, "elapsed_time": "11:33:38", "remaining_time": "3:46:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19040, "total_steps": 25254, "loss": 0.0869, "learning_rate": 7.5275467479287155e-06, "epoch": 2.2618199097172726, "percentage": 75.39, "elapsed_time": "11:34:00", "remaining_time": "3:46:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19050, "total_steps": 25254, "loss": 0.0856, "learning_rate": 7.504629484057243e-06, "epoch": 2.263007840342124, "percentage": 75.43, "elapsed_time": "11:34:21", "remaining_time": "3:46:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19060, "total_steps": 25254, "loss": 0.085, "learning_rate": 7.481740996322182e-06, "epoch": 2.2641957709669756, "percentage": 75.47, "elapsed_time": "11:34:43", "remaining_time": "3:45:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19070, "total_steps": 25254, "loss": 0.0835, "learning_rate": 7.4588813223701895e-06, "epoch": 2.2653837015918272, "percentage": 75.51, "elapsed_time": "11:35:05", "remaining_time": "3:45:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19080, "total_steps": 25254, "loss": 0.0866, "learning_rate": 7.436050499800532e-06, "epoch": 2.2665716322166785, "percentage": 75.55, "elapsed_time": "11:35:27", "remaining_time": "3:45:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19090, "total_steps": 25254, "loss": 0.0883, "learning_rate": 7.413248566165018e-06, "epoch": 2.26775956284153, "percentage": 75.59, "elapsed_time": "11:35:49", "remaining_time": "3:44:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19100, "total_steps": 25254, "loss": 0.0834, "learning_rate": 7.390475558967949e-06, "epoch": 2.2689474934663814, "percentage": 75.63, "elapsed_time": "11:36:11", "remaining_time": "3:44:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19110, "total_steps": 25254, "loss": 0.0832, "learning_rate": 7.3677315156660346e-06, "epoch": 2.270135424091233, "percentage": 75.67, "elapsed_time": "11:36:32", "remaining_time": "3:43:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19120, "total_steps": 25254, "loss": 0.0841, "learning_rate": 7.345016473668365e-06, "epoch": 2.2713233547160847, "percentage": 75.71, "elapsed_time": "11:36:54", "remaining_time": "3:43:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19130, "total_steps": 25254, "loss": 0.0825, "learning_rate": 7.3223304703363135e-06, "epoch": 2.272511285340936, "percentage": 75.75, "elapsed_time": "11:37:16", "remaining_time": "3:43:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19140, "total_steps": 25254, "loss": 0.085, "learning_rate": 7.299673542983496e-06, "epoch": 2.2736992159657876, "percentage": 75.79, "elapsed_time": "11:37:38", "remaining_time": "3:42:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19150, "total_steps": 25254, "loss": 0.082, "learning_rate": 7.277045728875701e-06, "epoch": 2.2748871465906393, "percentage": 75.83, "elapsed_time": "11:38:00", "remaining_time": "3:42:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19160, "total_steps": 25254, "loss": 0.0835, "learning_rate": 7.2544470652308295e-06, "epoch": 2.2760750772154905, "percentage": 75.87, "elapsed_time": "11:38:22", "remaining_time": "3:42:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19170, "total_steps": 25254, "loss": 0.0857, "learning_rate": 7.231877589218858e-06, "epoch": 2.277263007840342, "percentage": 75.91, "elapsed_time": "11:38:44", "remaining_time": "3:41:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19180, "total_steps": 25254, "loss": 0.0876, "learning_rate": 7.2093373379617305e-06, "epoch": 2.278450938465194, "percentage": 75.95, "elapsed_time": "11:39:05", "remaining_time": "3:41:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19190, "total_steps": 25254, "loss": 0.0864, "learning_rate": 7.186826348533329e-06, "epoch": 2.279638869090045, "percentage": 75.99, "elapsed_time": "11:39:27", "remaining_time": "3:41:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19200, "total_steps": 25254, "loss": 0.0842, "learning_rate": 7.164344657959413e-06, "epoch": 2.2808267997148968, "percentage": 76.03, "elapsed_time": "11:39:49", "remaining_time": "3:40:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19210, "total_steps": 25254, "loss": 0.0835, "learning_rate": 7.141892303217546e-06, "epoch": 2.282014730339748, "percentage": 76.07, "elapsed_time": "11:40:11", "remaining_time": "3:40:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19220, "total_steps": 25254, "loss": 0.0841, "learning_rate": 7.119469321237041e-06, "epoch": 2.2832026609645997, "percentage": 76.11, "elapsed_time": "11:40:32", "remaining_time": "3:39:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19230, "total_steps": 25254, "loss": 0.0846, "learning_rate": 7.097075748898896e-06, "epoch": 2.2843905915894513, "percentage": 76.15, "elapsed_time": "11:40:54", "remaining_time": "3:39:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19240, "total_steps": 25254, "loss": 0.0856, "learning_rate": 7.074711623035745e-06, "epoch": 2.2855785222143026, "percentage": 76.19, "elapsed_time": "11:41:16", "remaining_time": "3:39:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19250, "total_steps": 25254, "loss": 0.0867, "learning_rate": 7.052376980431777e-06, "epoch": 2.2867664528391543, "percentage": 76.23, "elapsed_time": "11:41:38", "remaining_time": "3:38:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19260, "total_steps": 25254, "loss": 0.0827, "learning_rate": 7.030071857822703e-06, "epoch": 2.2879543834640055, "percentage": 76.27, "elapsed_time": "11:41:59", "remaining_time": "3:38:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19270, "total_steps": 25254, "loss": 0.0812, "learning_rate": 7.0077962918956715e-06, "epoch": 2.289142314088857, "percentage": 76.3, "elapsed_time": "11:42:22", "remaining_time": "3:38:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19280, "total_steps": 25254, "loss": 0.0839, "learning_rate": 6.9855503192892105e-06, "epoch": 2.290330244713709, "percentage": 76.34, "elapsed_time": "11:42:44", "remaining_time": "3:37:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19290, "total_steps": 25254, "loss": 0.0839, "learning_rate": 6.963333976593183e-06, "epoch": 2.29151817533856, "percentage": 76.38, "elapsed_time": "11:43:05", "remaining_time": "3:37:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19300, "total_steps": 25254, "loss": 0.0833, "learning_rate": 6.941147300348702e-06, "epoch": 2.2927061059634117, "percentage": 76.42, "elapsed_time": "11:43:27", "remaining_time": "3:37:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19310, "total_steps": 25254, "loss": 0.0836, "learning_rate": 6.9189903270481135e-06, "epoch": 2.2938940365882634, "percentage": 76.46, "elapsed_time": "11:43:48", "remaining_time": "3:36:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19320, "total_steps": 25254, "loss": 0.0835, "learning_rate": 6.8968630931348864e-06, "epoch": 2.2950819672131146, "percentage": 76.5, "elapsed_time": "11:44:10", "remaining_time": "3:36:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19330, "total_steps": 25254, "loss": 0.0854, "learning_rate": 6.874765635003577e-06, "epoch": 2.2962698978379663, "percentage": 76.54, "elapsed_time": "11:44:32", "remaining_time": "3:35:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19340, "total_steps": 25254, "loss": 0.0831, "learning_rate": 6.852697988999774e-06, "epoch": 2.297457828462818, "percentage": 76.58, "elapsed_time": "11:44:54", "remaining_time": "3:35:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19350, "total_steps": 25254, "loss": 0.0846, "learning_rate": 6.830660191420013e-06, "epoch": 2.298645759087669, "percentage": 76.62, "elapsed_time": "11:45:16", "remaining_time": "3:35:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19360, "total_steps": 25254, "loss": 0.0844, "learning_rate": 6.808652278511771e-06, "epoch": 2.299833689712521, "percentage": 76.66, "elapsed_time": "11:45:38", "remaining_time": "3:34:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19370, "total_steps": 25254, "loss": 0.0861, "learning_rate": 6.786674286473338e-06, "epoch": 2.301021620337372, "percentage": 76.7, "elapsed_time": "11:46:00", "remaining_time": "3:34:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19380, "total_steps": 25254, "loss": 0.0846, "learning_rate": 6.764726251453807e-06, "epoch": 2.302209550962224, "percentage": 76.74, "elapsed_time": "11:46:21", "remaining_time": "3:34:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19390, "total_steps": 25254, "loss": 0.0852, "learning_rate": 6.742808209552992e-06, "epoch": 2.3033974815870755, "percentage": 76.78, "elapsed_time": "11:46:43", "remaining_time": "3:33:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19400, "total_steps": 25254, "loss": 0.0828, "learning_rate": 6.720920196821373e-06, "epoch": 2.3045854122119267, "percentage": 76.82, "elapsed_time": "11:47:05", "remaining_time": "3:33:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19410, "total_steps": 25254, "loss": 0.0845, "learning_rate": 6.6990622492600464e-06, "epoch": 2.3057733428367784, "percentage": 76.86, "elapsed_time": "11:47:27", "remaining_time": "3:33:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19420, "total_steps": 25254, "loss": 0.0848, "learning_rate": 6.677234402820651e-06, "epoch": 2.3069612734616296, "percentage": 76.9, "elapsed_time": "11:47:49", "remaining_time": "3:32:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19430, "total_steps": 25254, "loss": 0.0823, "learning_rate": 6.65543669340532e-06, "epoch": 2.3081492040864813, "percentage": 76.94, "elapsed_time": "11:48:12", "remaining_time": "3:32:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19440, "total_steps": 25254, "loss": 0.083, "learning_rate": 6.633669156866604e-06, "epoch": 2.309337134711333, "percentage": 76.98, "elapsed_time": "11:48:33", "remaining_time": "3:31:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19450, "total_steps": 25254, "loss": 0.0847, "learning_rate": 6.611931829007456e-06, "epoch": 2.310525065336184, "percentage": 77.02, "elapsed_time": "11:48:55", "remaining_time": "3:31:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19460, "total_steps": 25254, "loss": 0.0862, "learning_rate": 6.590224745581114e-06, "epoch": 2.311712995961036, "percentage": 77.06, "elapsed_time": "11:49:17", "remaining_time": "3:31:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19470, "total_steps": 25254, "loss": 0.0809, "learning_rate": 6.5685479422910815e-06, "epoch": 2.3129009265858875, "percentage": 77.1, "elapsed_time": "11:49:39", "remaining_time": "3:30:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19480, "total_steps": 25254, "loss": 0.083, "learning_rate": 6.546901454791055e-06, "epoch": 2.3140888572107388, "percentage": 77.14, "elapsed_time": "11:50:02", "remaining_time": "3:30:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19490, "total_steps": 25254, "loss": 0.0832, "learning_rate": 6.5252853186848595e-06, "epoch": 2.3152767878355904, "percentage": 77.18, "elapsed_time": "11:50:23", "remaining_time": "3:30:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19500, "total_steps": 25254, "loss": 0.087, "learning_rate": 6.503699569526428e-06, "epoch": 2.316464718460442, "percentage": 77.22, "elapsed_time": "11:50:45", "remaining_time": "3:29:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19510, "total_steps": 25254, "loss": 0.0864, "learning_rate": 6.482144242819682e-06, "epoch": 2.3176526490852933, "percentage": 77.26, "elapsed_time": "11:51:07", "remaining_time": "3:29:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19520, "total_steps": 25254, "loss": 0.0855, "learning_rate": 6.460619374018518e-06, "epoch": 2.318840579710145, "percentage": 77.29, "elapsed_time": "11:51:28", "remaining_time": "3:28:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19530, "total_steps": 25254, "loss": 0.0833, "learning_rate": 6.43912499852673e-06, "epoch": 2.3200285103349962, "percentage": 77.33, "elapsed_time": "11:51:50", "remaining_time": "3:28:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19540, "total_steps": 25254, "loss": 0.0869, "learning_rate": 6.417661151697965e-06, "epoch": 2.321216440959848, "percentage": 77.37, "elapsed_time": "11:52:12", "remaining_time": "3:28:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19550, "total_steps": 25254, "loss": 0.0826, "learning_rate": 6.396227868835653e-06, "epoch": 2.3224043715846996, "percentage": 77.41, "elapsed_time": "11:52:34", "remaining_time": "3:27:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19560, "total_steps": 25254, "loss": 0.087, "learning_rate": 6.3748251851929504e-06, "epoch": 2.323592302209551, "percentage": 77.45, "elapsed_time": "11:52:55", "remaining_time": "3:27:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19570, "total_steps": 25254, "loss": 0.0833, "learning_rate": 6.353453135972687e-06, "epoch": 2.3247802328344025, "percentage": 77.49, "elapsed_time": "11:53:17", "remaining_time": "3:27:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19580, "total_steps": 25254, "loss": 0.0841, "learning_rate": 6.3321117563273e-06, "epoch": 2.325968163459254, "percentage": 77.53, "elapsed_time": "11:53:39", "remaining_time": "3:26:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19590, "total_steps": 25254, "loss": 0.084, "learning_rate": 6.310801081358797e-06, "epoch": 2.3271560940841054, "percentage": 77.57, "elapsed_time": "11:54:00", "remaining_time": "3:26:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19600, "total_steps": 25254, "loss": 0.0855, "learning_rate": 6.289521146118671e-06, "epoch": 2.328344024708957, "percentage": 77.61, "elapsed_time": "11:54:22", "remaining_time": "3:26:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19610, "total_steps": 25254, "loss": 0.085, "learning_rate": 6.268271985607854e-06, "epoch": 2.3295319553338087, "percentage": 77.65, "elapsed_time": "11:54:44", "remaining_time": "3:25:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19620, "total_steps": 25254, "loss": 0.0823, "learning_rate": 6.2470536347766615e-06, "epoch": 2.33071988595866, "percentage": 77.69, "elapsed_time": "11:55:05", "remaining_time": "3:25:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19630, "total_steps": 25254, "loss": 0.085, "learning_rate": 6.225866128524729e-06, "epoch": 2.3319078165835117, "percentage": 77.73, "elapsed_time": "11:55:27", "remaining_time": "3:24:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19640, "total_steps": 25254, "loss": 0.0856, "learning_rate": 6.204709501700978e-06, "epoch": 2.333095747208363, "percentage": 77.77, "elapsed_time": "11:55:49", "remaining_time": "3:24:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19650, "total_steps": 25254, "loss": 0.0859, "learning_rate": 6.183583789103525e-06, "epoch": 2.3342836778332146, "percentage": 77.81, "elapsed_time": "11:56:11", "remaining_time": "3:24:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19660, "total_steps": 25254, "loss": 0.084, "learning_rate": 6.162489025479637e-06, "epoch": 2.3354716084580662, "percentage": 77.85, "elapsed_time": "11:56:33", "remaining_time": "3:23:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19670, "total_steps": 25254, "loss": 0.0826, "learning_rate": 6.141425245525681e-06, "epoch": 2.3366595390829175, "percentage": 77.89, "elapsed_time": "11:56:56", "remaining_time": "3:23:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19680, "total_steps": 25254, "loss": 0.0834, "learning_rate": 6.120392483887055e-06, "epoch": 2.337847469707769, "percentage": 77.93, "elapsed_time": "11:57:17", "remaining_time": "3:23:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19690, "total_steps": 25254, "loss": 0.0849, "learning_rate": 6.0993907751581644e-06, "epoch": 2.3390354003326204, "percentage": 77.97, "elapsed_time": "11:57:39", "remaining_time": "3:22:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19700, "total_steps": 25254, "loss": 0.0856, "learning_rate": 6.078420153882308e-06, "epoch": 2.340223330957472, "percentage": 78.01, "elapsed_time": "11:58:01", "remaining_time": "3:22:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19710, "total_steps": 25254, "loss": 0.0829, "learning_rate": 6.0574806545516695e-06, "epoch": 2.3414112615823237, "percentage": 78.05, "elapsed_time": "11:58:24", "remaining_time": "3:22:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19720, "total_steps": 25254, "loss": 0.0831, "learning_rate": 6.036572311607239e-06, "epoch": 2.342599192207175, "percentage": 78.09, "elapsed_time": "11:58:45", "remaining_time": "3:21:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19730, "total_steps": 25254, "loss": 0.0826, "learning_rate": 6.015695159438759e-06, "epoch": 2.3437871228320266, "percentage": 78.13, "elapsed_time": "11:59:08", "remaining_time": "3:21:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19740, "total_steps": 25254, "loss": 0.0832, "learning_rate": 5.994849232384672e-06, "epoch": 2.3449750534568783, "percentage": 78.17, "elapsed_time": "11:59:29", "remaining_time": "3:20:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19750, "total_steps": 25254, "loss": 0.083, "learning_rate": 5.974034564732065e-06, "epoch": 2.3461629840817295, "percentage": 78.21, "elapsed_time": "11:59:51", "remaining_time": "3:20:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19760, "total_steps": 25254, "loss": 0.0832, "learning_rate": 5.953251190716605e-06, "epoch": 2.347350914706581, "percentage": 78.25, "elapsed_time": "12:00:13", "remaining_time": "3:20:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19770, "total_steps": 25254, "loss": 0.0839, "learning_rate": 5.932499144522483e-06, "epoch": 2.348538845331433, "percentage": 78.28, "elapsed_time": "12:00:35", "remaining_time": "3:19:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19780, "total_steps": 25254, "loss": 0.0839, "learning_rate": 5.911778460282386e-06, "epoch": 2.349726775956284, "percentage": 78.32, "elapsed_time": "12:00:57", "remaining_time": "3:19:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19790, "total_steps": 25254, "loss": 0.0833, "learning_rate": 5.891089172077388e-06, "epoch": 2.3509147065811358, "percentage": 78.36, "elapsed_time": "12:01:18", "remaining_time": "3:19:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19800, "total_steps": 25254, "loss": 0.0849, "learning_rate": 5.870431313936941e-06, "epoch": 2.352102637205987, "percentage": 78.4, "elapsed_time": "12:01:40", "remaining_time": "3:18:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19810, "total_steps": 25254, "loss": 0.0815, "learning_rate": 5.849804919838795e-06, "epoch": 2.3532905678308387, "percentage": 78.44, "elapsed_time": "12:02:02", "remaining_time": "3:18:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19820, "total_steps": 25254, "loss": 0.0831, "learning_rate": 5.829210023708939e-06, "epoch": 2.3544784984556903, "percentage": 78.48, "elapsed_time": "12:02:23", "remaining_time": "3:18:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19830, "total_steps": 25254, "loss": 0.0832, "learning_rate": 5.808646659421582e-06, "epoch": 2.3556664290805416, "percentage": 78.52, "elapsed_time": "12:02:44", "remaining_time": "3:17:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19840, "total_steps": 25254, "loss": 0.0822, "learning_rate": 5.788114860799043e-06, "epoch": 2.3568543597053933, "percentage": 78.56, "elapsed_time": "12:03:06", "remaining_time": "3:17:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19850, "total_steps": 25254, "loss": 0.0832, "learning_rate": 5.767614661611739e-06, "epoch": 2.3580422903302445, "percentage": 78.6, "elapsed_time": "12:03:27", "remaining_time": "3:16:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19860, "total_steps": 25254, "loss": 0.0837, "learning_rate": 5.747146095578099e-06, "epoch": 2.359230220955096, "percentage": 78.64, "elapsed_time": "12:03:49", "remaining_time": "3:16:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19870, "total_steps": 25254, "loss": 0.0803, "learning_rate": 5.726709196364532e-06, "epoch": 2.360418151579948, "percentage": 78.68, "elapsed_time": "12:04:11", "remaining_time": "3:16:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19880, "total_steps": 25254, "loss": 0.0814, "learning_rate": 5.706303997585358e-06, "epoch": 2.361606082204799, "percentage": 78.72, "elapsed_time": "12:04:32", "remaining_time": "3:15:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19890, "total_steps": 25254, "loss": 0.0832, "learning_rate": 5.685930532802758e-06, "epoch": 2.3627940128296507, "percentage": 78.76, "elapsed_time": "12:04:54", "remaining_time": "3:15:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19900, "total_steps": 25254, "loss": 0.0833, "learning_rate": 5.665588835526714e-06, "epoch": 2.3639819434545024, "percentage": 78.8, "elapsed_time": "12:05:15", "remaining_time": "3:15:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19910, "total_steps": 25254, "loss": 0.0858, "learning_rate": 5.64527893921496e-06, "epoch": 2.3651698740793536, "percentage": 78.84, "elapsed_time": "12:05:38", "remaining_time": "3:14:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19920, "total_steps": 25254, "loss": 0.0813, "learning_rate": 5.625000877272932e-06, "epoch": 2.3663578047042053, "percentage": 78.88, "elapsed_time": "12:06:00", "remaining_time": "3:14:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19930, "total_steps": 25254, "loss": 0.0837, "learning_rate": 5.604754683053693e-06, "epoch": 2.367545735329057, "percentage": 78.92, "elapsed_time": "12:06:21", "remaining_time": "3:14:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19940, "total_steps": 25254, "loss": 0.0831, "learning_rate": 5.584540389857895e-06, "epoch": 2.368733665953908, "percentage": 78.96, "elapsed_time": "12:06:43", "remaining_time": "3:13:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19950, "total_steps": 25254, "loss": 0.0846, "learning_rate": 5.564358030933719e-06, "epoch": 2.36992159657876, "percentage": 79.0, "elapsed_time": "12:07:06", "remaining_time": "3:13:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19960, "total_steps": 25254, "loss": 0.0842, "learning_rate": 5.544207639476817e-06, "epoch": 2.371109527203611, "percentage": 79.04, "elapsed_time": "12:07:28", "remaining_time": "3:12:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19970, "total_steps": 25254, "loss": 0.0823, "learning_rate": 5.524089248630279e-06, "epoch": 2.372297457828463, "percentage": 79.08, "elapsed_time": "12:07:49", "remaining_time": "3:12:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19980, "total_steps": 25254, "loss": 0.0839, "learning_rate": 5.504002891484539e-06, "epoch": 2.3734853884533145, "percentage": 79.12, "elapsed_time": "12:08:12", "remaining_time": "3:12:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 19990, "total_steps": 25254, "loss": 0.0837, "learning_rate": 5.483948601077354e-06, "epoch": 2.3746733190781657, "percentage": 79.16, "elapsed_time": "12:08:33", "remaining_time": "3:11:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20000, "total_steps": 25254, "loss": 0.0821, "learning_rate": 5.4639264103937325e-06, "epoch": 2.3758612497030174, "percentage": 79.2, "elapsed_time": "12:08:55", "remaining_time": "3:11:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20010, "total_steps": 25254, "loss": 0.0819, "learning_rate": 5.443936352365886e-06, "epoch": 2.3770491803278686, "percentage": 79.23, "elapsed_time": "12:09:17", "remaining_time": "3:11:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20020, "total_steps": 25254, "loss": 0.0848, "learning_rate": 5.423978459873186e-06, "epoch": 2.3782371109527203, "percentage": 79.27, "elapsed_time": "12:09:39", "remaining_time": "3:10:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20030, "total_steps": 25254, "loss": 0.0828, "learning_rate": 5.404052765742096e-06, "epoch": 2.379425041577572, "percentage": 79.31, "elapsed_time": "12:10:00", "remaining_time": "3:10:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20040, "total_steps": 25254, "loss": 0.0881, "learning_rate": 5.384159302746095e-06, "epoch": 2.3806129722024236, "percentage": 79.35, "elapsed_time": "12:10:22", "remaining_time": "3:10:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20050, "total_steps": 25254, "loss": 0.082, "learning_rate": 5.364298103605669e-06, "epoch": 2.381800902827275, "percentage": 79.39, "elapsed_time": "12:10:44", "remaining_time": "3:09:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20060, "total_steps": 25254, "loss": 0.0834, "learning_rate": 5.344469200988251e-06, "epoch": 2.3829888334521265, "percentage": 79.43, "elapsed_time": "12:11:06", "remaining_time": "3:09:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20070, "total_steps": 25254, "loss": 0.0836, "learning_rate": 5.324672627508129e-06, "epoch": 2.3841767640769778, "percentage": 79.47, "elapsed_time": "12:11:28", "remaining_time": "3:08:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20080, "total_steps": 25254, "loss": 0.083, "learning_rate": 5.3049084157264285e-06, "epoch": 2.3853646947018294, "percentage": 79.51, "elapsed_time": "12:11:50", "remaining_time": "3:08:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20090, "total_steps": 25254, "loss": 0.084, "learning_rate": 5.285176598151043e-06, "epoch": 2.386552625326681, "percentage": 79.55, "elapsed_time": "12:12:12", "remaining_time": "3:08:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20100, "total_steps": 25254, "loss": 0.0838, "learning_rate": 5.2654772072365744e-06, "epoch": 2.3877405559515323, "percentage": 79.59, "elapsed_time": "12:12:34", "remaining_time": "3:07:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20110, "total_steps": 25254, "loss": 0.0825, "learning_rate": 5.2458102753843166e-06, "epoch": 2.388928486576384, "percentage": 79.63, "elapsed_time": "12:12:56", "remaining_time": "3:07:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20120, "total_steps": 25254, "loss": 0.0823, "learning_rate": 5.226175834942154e-06, "epoch": 2.3901164172012352, "percentage": 79.67, "elapsed_time": "12:13:18", "remaining_time": "3:07:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20130, "total_steps": 25254, "loss": 0.0851, "learning_rate": 5.206573918204533e-06, "epoch": 2.391304347826087, "percentage": 79.71, "elapsed_time": "12:13:40", "remaining_time": "3:06:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20140, "total_steps": 25254, "loss": 0.085, "learning_rate": 5.1870045574124084e-06, "epoch": 2.3924922784509386, "percentage": 79.75, "elapsed_time": "12:14:01", "remaining_time": "3:06:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20150, "total_steps": 25254, "loss": 0.0809, "learning_rate": 5.1674677847531776e-06, "epoch": 2.39368020907579, "percentage": 79.79, "elapsed_time": "12:14:23", "remaining_time": "3:06:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20160, "total_steps": 25254, "loss": 0.0844, "learning_rate": 5.1479636323606614e-06, "epoch": 2.3948681397006415, "percentage": 79.83, "elapsed_time": "12:14:44", "remaining_time": "3:05:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20170, "total_steps": 25254, "loss": 0.0819, "learning_rate": 5.128492132315005e-06, "epoch": 2.396056070325493, "percentage": 79.87, "elapsed_time": "12:15:06", "remaining_time": "3:05:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20180, "total_steps": 25254, "loss": 0.0823, "learning_rate": 5.109053316642654e-06, "epoch": 2.3972440009503444, "percentage": 79.91, "elapsed_time": "12:15:28", "remaining_time": "3:04:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20190, "total_steps": 25254, "loss": 0.0855, "learning_rate": 5.089647217316296e-06, "epoch": 2.398431931575196, "percentage": 79.95, "elapsed_time": "12:15:50", "remaining_time": "3:04:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20200, "total_steps": 25254, "loss": 0.0841, "learning_rate": 5.070273866254807e-06, "epoch": 2.3996198622000477, "percentage": 79.99, "elapsed_time": "12:16:12", "remaining_time": "3:04:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20210, "total_steps": 25254, "loss": 0.0863, "learning_rate": 5.0509332953231985e-06, "epoch": 2.400807792824899, "percentage": 80.03, "elapsed_time": "12:16:34", "remaining_time": "3:03:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20220, "total_steps": 25254, "loss": 0.0823, "learning_rate": 5.0316255363325686e-06, "epoch": 2.4019957234497507, "percentage": 80.07, "elapsed_time": "12:16:56", "remaining_time": "3:03:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20230, "total_steps": 25254, "loss": 0.0842, "learning_rate": 5.012350621040041e-06, "epoch": 2.403183654074602, "percentage": 80.11, "elapsed_time": "12:17:17", "remaining_time": "3:03:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20240, "total_steps": 25254, "loss": 0.085, "learning_rate": 4.993108581148717e-06, "epoch": 2.4043715846994536, "percentage": 80.15, "elapsed_time": "12:17:39", "remaining_time": "3:02:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20250, "total_steps": 25254, "loss": 0.0813, "learning_rate": 4.973899448307645e-06, "epoch": 2.4055595153243052, "percentage": 80.19, "elapsed_time": "12:18:01", "remaining_time": "3:02:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20260, "total_steps": 25254, "loss": 0.0853, "learning_rate": 4.954723254111724e-06, "epoch": 2.4067474459491565, "percentage": 80.22, "elapsed_time": "12:18:23", "remaining_time": "3:02:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20270, "total_steps": 25254, "loss": 0.0835, "learning_rate": 4.935580030101686e-06, "epoch": 2.407935376574008, "percentage": 80.26, "elapsed_time": "12:18:44", "remaining_time": "3:01:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20280, "total_steps": 25254, "loss": 0.0834, "learning_rate": 4.9164698077640344e-06, "epoch": 2.4091233071988594, "percentage": 80.3, "elapsed_time": "12:19:06", "remaining_time": "3:01:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20290, "total_steps": 25254, "loss": 0.0822, "learning_rate": 4.897392618530983e-06, "epoch": 2.410311237823711, "percentage": 80.34, "elapsed_time": "12:19:28", "remaining_time": "3:00:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20300, "total_steps": 25254, "loss": 0.083, "learning_rate": 4.878348493780435e-06, "epoch": 2.4114991684485627, "percentage": 80.38, "elapsed_time": "12:19:50", "remaining_time": "3:00:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20310, "total_steps": 25254, "loss": 0.0838, "learning_rate": 4.859337464835889e-06, "epoch": 2.412687099073414, "percentage": 80.42, "elapsed_time": "12:20:11", "remaining_time": "3:00:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20320, "total_steps": 25254, "loss": 0.0845, "learning_rate": 4.840359562966415e-06, "epoch": 2.4138750296982656, "percentage": 80.46, "elapsed_time": "12:20:33", "remaining_time": "2:59:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20330, "total_steps": 25254, "loss": 0.086, "learning_rate": 4.821414819386597e-06, "epoch": 2.4150629603231173, "percentage": 80.5, "elapsed_time": "12:20:55", "remaining_time": "2:59:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20340, "total_steps": 25254, "loss": 0.0837, "learning_rate": 4.802503265256469e-06, "epoch": 2.4162508909479685, "percentage": 80.54, "elapsed_time": "12:21:16", "remaining_time": "2:59:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20350, "total_steps": 25254, "loss": 0.0821, "learning_rate": 4.783624931681513e-06, "epoch": 2.41743882157282, "percentage": 80.58, "elapsed_time": "12:21:38", "remaining_time": "2:58:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20360, "total_steps": 25254, "loss": 0.0825, "learning_rate": 4.764779849712514e-06, "epoch": 2.418626752197672, "percentage": 80.62, "elapsed_time": "12:22:00", "remaining_time": "2:58:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20370, "total_steps": 25254, "loss": 0.0841, "learning_rate": 4.745968050345609e-06, "epoch": 2.419814682822523, "percentage": 80.66, "elapsed_time": "12:22:22", "remaining_time": "2:57:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20380, "total_steps": 25254, "loss": 0.0845, "learning_rate": 4.72718956452217e-06, "epoch": 2.4210026134473748, "percentage": 80.7, "elapsed_time": "12:22:44", "remaining_time": "2:57:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20390, "total_steps": 25254, "loss": 0.0851, "learning_rate": 4.7084444231287935e-06, "epoch": 2.422190544072226, "percentage": 80.74, "elapsed_time": "12:23:06", "remaining_time": "2:57:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20400, "total_steps": 25254, "loss": 0.0811, "learning_rate": 4.6897326569972145e-06, "epoch": 2.4233784746970777, "percentage": 80.78, "elapsed_time": "12:23:28", "remaining_time": "2:56:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20410, "total_steps": 25254, "loss": 0.0853, "learning_rate": 4.671054296904284e-06, "epoch": 2.4245664053219294, "percentage": 80.82, "elapsed_time": "12:23:49", "remaining_time": "2:56:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20420, "total_steps": 25254, "loss": 0.0846, "learning_rate": 4.652409373571898e-06, "epoch": 2.4257543359467806, "percentage": 80.86, "elapsed_time": "12:24:11", "remaining_time": "2:56:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20430, "total_steps": 25254, "loss": 0.0817, "learning_rate": 4.6337979176669575e-06, "epoch": 2.4269422665716323, "percentage": 80.9, "elapsed_time": "12:24:33", "remaining_time": "2:55:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20440, "total_steps": 25254, "loss": 0.0828, "learning_rate": 4.615219959801332e-06, "epoch": 2.4281301971964835, "percentage": 80.94, "elapsed_time": "12:24:54", "remaining_time": "2:55:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20450, "total_steps": 25254, "loss": 0.0831, "learning_rate": 4.596675530531777e-06, "epoch": 2.429318127821335, "percentage": 80.98, "elapsed_time": "12:25:17", "remaining_time": "2:55:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20460, "total_steps": 25254, "loss": 0.0849, "learning_rate": 4.578164660359904e-06, "epoch": 2.430506058446187, "percentage": 81.02, "elapsed_time": "12:25:39", "remaining_time": "2:54:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20470, "total_steps": 25254, "loss": 0.083, "learning_rate": 4.55968737973213e-06, "epoch": 2.431693989071038, "percentage": 81.06, "elapsed_time": "12:26:01", "remaining_time": "2:54:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20480, "total_steps": 25254, "loss": 0.085, "learning_rate": 4.541243719039617e-06, "epoch": 2.4328819196958897, "percentage": 81.1, "elapsed_time": "12:26:22", "remaining_time": "2:53:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20490, "total_steps": 25254, "loss": 0.0814, "learning_rate": 4.522833708618246e-06, "epoch": 2.4340698503207414, "percentage": 81.14, "elapsed_time": "12:26:44", "remaining_time": "2:53:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20500, "total_steps": 25254, "loss": 0.083, "learning_rate": 4.504457378748536e-06, "epoch": 2.4352577809455926, "percentage": 81.18, "elapsed_time": "12:27:06", "remaining_time": "2:53:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20510, "total_steps": 25254, "loss": 0.0853, "learning_rate": 4.486114759655613e-06, "epoch": 2.4364457115704443, "percentage": 81.21, "elapsed_time": "12:27:27", "remaining_time": "2:52:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20520, "total_steps": 25254, "loss": 0.0807, "learning_rate": 4.467805881509157e-06, "epoch": 2.437633642195296, "percentage": 81.25, "elapsed_time": "12:27:49", "remaining_time": "2:52:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20530, "total_steps": 25254, "loss": 0.0844, "learning_rate": 4.449530774423347e-06, "epoch": 2.438821572820147, "percentage": 81.29, "elapsed_time": "12:28:10", "remaining_time": "2:52:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20540, "total_steps": 25254, "loss": 0.0823, "learning_rate": 4.43128946845682e-06, "epoch": 2.440009503444999, "percentage": 81.33, "elapsed_time": "12:28:32", "remaining_time": "2:51:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20550, "total_steps": 25254, "loss": 0.0822, "learning_rate": 4.413081993612617e-06, "epoch": 2.44119743406985, "percentage": 81.37, "elapsed_time": "12:28:53", "remaining_time": "2:51:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20560, "total_steps": 25254, "loss": 0.0799, "learning_rate": 4.394908379838133e-06, "epoch": 2.442385364694702, "percentage": 81.41, "elapsed_time": "12:29:15", "remaining_time": "2:51:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20570, "total_steps": 25254, "loss": 0.0823, "learning_rate": 4.376768657025062e-06, "epoch": 2.4435732953195535, "percentage": 81.45, "elapsed_time": "12:29:37", "remaining_time": "2:50:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20580, "total_steps": 25254, "loss": 0.0839, "learning_rate": 4.3586628550093766e-06, "epoch": 2.4447612259444047, "percentage": 81.49, "elapsed_time": "12:29:59", "remaining_time": "2:50:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20590, "total_steps": 25254, "loss": 0.0825, "learning_rate": 4.340591003571237e-06, "epoch": 2.4459491565692564, "percentage": 81.53, "elapsed_time": "12:30:21", "remaining_time": "2:49:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20600, "total_steps": 25254, "loss": 0.0821, "learning_rate": 4.322553132434965e-06, "epoch": 2.447137087194108, "percentage": 81.57, "elapsed_time": "12:30:42", "remaining_time": "2:49:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20610, "total_steps": 25254, "loss": 0.0842, "learning_rate": 4.304549271268993e-06, "epoch": 2.4483250178189593, "percentage": 81.61, "elapsed_time": "12:31:05", "remaining_time": "2:49:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20620, "total_steps": 25254, "loss": 0.0839, "learning_rate": 4.28657944968581e-06, "epoch": 2.449512948443811, "percentage": 81.65, "elapsed_time": "12:31:27", "remaining_time": "2:48:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20630, "total_steps": 25254, "loss": 0.0812, "learning_rate": 4.268643697241939e-06, "epoch": 2.4507008790686626, "percentage": 81.69, "elapsed_time": "12:31:48", "remaining_time": "2:48:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20640, "total_steps": 25254, "loss": 0.083, "learning_rate": 4.250742043437839e-06, "epoch": 2.451888809693514, "percentage": 81.73, "elapsed_time": "12:32:10", "remaining_time": "2:48:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20650, "total_steps": 25254, "loss": 0.0858, "learning_rate": 4.2328745177179e-06, "epoch": 2.4530767403183655, "percentage": 81.77, "elapsed_time": "12:32:32", "remaining_time": "2:47:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20660, "total_steps": 25254, "loss": 0.0841, "learning_rate": 4.21504114947037e-06, "epoch": 2.4542646709432168, "percentage": 81.81, "elapsed_time": "12:32:54", "remaining_time": "2:47:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20670, "total_steps": 25254, "loss": 0.0851, "learning_rate": 4.197241968027321e-06, "epoch": 2.4554526015680684, "percentage": 81.85, "elapsed_time": "12:33:15", "remaining_time": "2:47:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20680, "total_steps": 25254, "loss": 0.0838, "learning_rate": 4.1794770026645945e-06, "epoch": 2.45664053219292, "percentage": 81.89, "elapsed_time": "12:33:38", "remaining_time": "2:46:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20690, "total_steps": 25254, "loss": 0.085, "learning_rate": 4.16174628260175e-06, "epoch": 2.4578284628177713, "percentage": 81.93, "elapsed_time": "12:33:59", "remaining_time": "2:46:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20700, "total_steps": 25254, "loss": 0.0818, "learning_rate": 4.144049837002026e-06, "epoch": 2.459016393442623, "percentage": 81.97, "elapsed_time": "12:34:21", "remaining_time": "2:45:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20710, "total_steps": 25254, "loss": 0.0824, "learning_rate": 4.126387694972278e-06, "epoch": 2.4602043240674742, "percentage": 82.01, "elapsed_time": "12:34:42", "remaining_time": "2:45:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20720, "total_steps": 25254, "loss": 0.0821, "learning_rate": 4.108759885562955e-06, "epoch": 2.461392254692326, "percentage": 82.05, "elapsed_time": "12:35:04", "remaining_time": "2:45:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20730, "total_steps": 25254, "loss": 0.0831, "learning_rate": 4.091166437768023e-06, "epoch": 2.4625801853171776, "percentage": 82.09, "elapsed_time": "12:35:25", "remaining_time": "2:44:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20740, "total_steps": 25254, "loss": 0.0821, "learning_rate": 4.0736073805249355e-06, "epoch": 2.463768115942029, "percentage": 82.13, "elapsed_time": "12:35:46", "remaining_time": "2:44:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20750, "total_steps": 25254, "loss": 0.0851, "learning_rate": 4.056082742714582e-06, "epoch": 2.4649560465668805, "percentage": 82.17, "elapsed_time": "12:36:08", "remaining_time": "2:44:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20760, "total_steps": 25254, "loss": 0.0835, "learning_rate": 4.038592553161224e-06, "epoch": 2.466143977191732, "percentage": 82.2, "elapsed_time": "12:36:30", "remaining_time": "2:43:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20770, "total_steps": 25254, "loss": 0.0858, "learning_rate": 4.021136840632495e-06, "epoch": 2.4673319078165834, "percentage": 82.24, "elapsed_time": "12:36:52", "remaining_time": "2:43:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20780, "total_steps": 25254, "loss": 0.0842, "learning_rate": 4.003715633839294e-06, "epoch": 2.468519838441435, "percentage": 82.28, "elapsed_time": "12:37:14", "remaining_time": "2:43:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20790, "total_steps": 25254, "loss": 0.0834, "learning_rate": 3.986328961435773e-06, "epoch": 2.4697077690662868, "percentage": 82.32, "elapsed_time": "12:37:36", "remaining_time": "2:42:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20800, "total_steps": 25254, "loss": 0.082, "learning_rate": 3.968976852019285e-06, "epoch": 2.470895699691138, "percentage": 82.36, "elapsed_time": "12:37:57", "remaining_time": "2:42:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20810, "total_steps": 25254, "loss": 0.082, "learning_rate": 3.951659334130329e-06, "epoch": 2.4720836303159897, "percentage": 82.4, "elapsed_time": "12:38:19", "remaining_time": "2:41:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20820, "total_steps": 25254, "loss": 0.082, "learning_rate": 3.934376436252518e-06, "epoch": 2.473271560940841, "percentage": 82.44, "elapsed_time": "12:38:41", "remaining_time": "2:41:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20830, "total_steps": 25254, "loss": 0.0824, "learning_rate": 3.9171281868125135e-06, "epoch": 2.4744594915656926, "percentage": 82.48, "elapsed_time": "12:39:02", "remaining_time": "2:41:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20840, "total_steps": 25254, "loss": 0.0818, "learning_rate": 3.8999146141799915e-06, "epoch": 2.4756474221905442, "percentage": 82.52, "elapsed_time": "12:39:24", "remaining_time": "2:40:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20850, "total_steps": 25254, "loss": 0.0851, "learning_rate": 3.88273574666759e-06, "epoch": 2.4768353528153955, "percentage": 82.56, "elapsed_time": "12:39:45", "remaining_time": "2:40:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20860, "total_steps": 25254, "loss": 0.0828, "learning_rate": 3.865591612530866e-06, "epoch": 2.478023283440247, "percentage": 82.6, "elapsed_time": "12:40:07", "remaining_time": "2:40:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20870, "total_steps": 25254, "loss": 0.0822, "learning_rate": 3.848482239968249e-06, "epoch": 2.4792112140650984, "percentage": 82.64, "elapsed_time": "12:40:29", "remaining_time": "2:39:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20880, "total_steps": 25254, "loss": 0.083, "learning_rate": 3.831407657120989e-06, "epoch": 2.48039914468995, "percentage": 82.68, "elapsed_time": "12:40:51", "remaining_time": "2:39:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20890, "total_steps": 25254, "loss": 0.0828, "learning_rate": 3.8143678920731174e-06, "epoch": 2.4815870753148017, "percentage": 82.72, "elapsed_time": "12:41:13", "remaining_time": "2:39:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20900, "total_steps": 25254, "loss": 0.0809, "learning_rate": 3.797362972851393e-06, "epoch": 2.482775005939653, "percentage": 82.76, "elapsed_time": "12:41:34", "remaining_time": "2:38:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20910, "total_steps": 25254, "loss": 0.0801, "learning_rate": 3.7803929274252746e-06, "epoch": 2.4839629365645046, "percentage": 82.8, "elapsed_time": "12:41:55", "remaining_time": "2:38:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20920, "total_steps": 25254, "loss": 0.0806, "learning_rate": 3.7634577837068476e-06, "epoch": 2.4851508671893563, "percentage": 82.84, "elapsed_time": "12:42:17", "remaining_time": "2:37:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20930, "total_steps": 25254, "loss": 0.0855, "learning_rate": 3.7465575695507933e-06, "epoch": 2.4863387978142075, "percentage": 82.88, "elapsed_time": "12:42:40", "remaining_time": "2:37:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20940, "total_steps": 25254, "loss": 0.0844, "learning_rate": 3.729692312754343e-06, "epoch": 2.487526728439059, "percentage": 82.92, "elapsed_time": "12:43:03", "remaining_time": "2:37:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20950, "total_steps": 25254, "loss": 0.086, "learning_rate": 3.712862041057227e-06, "epoch": 2.488714659063911, "percentage": 82.96, "elapsed_time": "12:43:25", "remaining_time": "2:36:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20960, "total_steps": 25254, "loss": 0.0832, "learning_rate": 3.6960667821416494e-06, "epoch": 2.489902589688762, "percentage": 83.0, "elapsed_time": "12:43:46", "remaining_time": "2:36:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20970, "total_steps": 25254, "loss": 0.0825, "learning_rate": 3.6793065636322036e-06, "epoch": 2.4910905203136138, "percentage": 83.04, "elapsed_time": "12:44:08", "remaining_time": "2:36:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20980, "total_steps": 25254, "loss": 0.0833, "learning_rate": 3.6625814130958614e-06, "epoch": 2.492278450938465, "percentage": 83.08, "elapsed_time": "12:44:29", "remaining_time": "2:35:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 20990, "total_steps": 25254, "loss": 0.0817, "learning_rate": 3.645891358041911e-06, "epoch": 2.4934663815633167, "percentage": 83.12, "elapsed_time": "12:44:50", "remaining_time": "2:35:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21000, "total_steps": 25254, "loss": 0.0829, "learning_rate": 3.629236425921917e-06, "epoch": 2.4946543121881684, "percentage": 83.16, "elapsed_time": "12:45:12", "remaining_time": "2:35:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21010, "total_steps": 25254, "loss": 0.0823, "learning_rate": 3.6126166441296767e-06, "epoch": 2.4958422428130196, "percentage": 83.19, "elapsed_time": "12:45:33", "remaining_time": "2:34:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21020, "total_steps": 25254, "loss": 0.083, "learning_rate": 3.596032040001168e-06, "epoch": 2.4970301734378713, "percentage": 83.23, "elapsed_time": "12:45:55", "remaining_time": "2:34:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21030, "total_steps": 25254, "loss": 0.0838, "learning_rate": 3.579482640814513e-06, "epoch": 2.4982181040627225, "percentage": 83.27, "elapsed_time": "12:46:16", "remaining_time": "2:33:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21040, "total_steps": 25254, "loss": 0.0818, "learning_rate": 3.5629684737899238e-06, "epoch": 2.499406034687574, "percentage": 83.31, "elapsed_time": "12:46:38", "remaining_time": "2:33:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21050, "total_steps": 25254, "loss": 0.0839, "learning_rate": 3.546489566089678e-06, "epoch": 2.500593965312426, "percentage": 83.35, "elapsed_time": "12:47:00", "remaining_time": "2:33:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21060, "total_steps": 25254, "loss": 0.0826, "learning_rate": 3.530045944818039e-06, "epoch": 2.5017818959372775, "percentage": 83.39, "elapsed_time": "12:47:23", "remaining_time": "2:32:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21070, "total_steps": 25254, "loss": 0.084, "learning_rate": 3.513637637021244e-06, "epoch": 2.5029698265621287, "percentage": 83.43, "elapsed_time": "12:47:44", "remaining_time": "2:32:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21080, "total_steps": 25254, "loss": 0.0824, "learning_rate": 3.4972646696874473e-06, "epoch": 2.5041577571869804, "percentage": 83.47, "elapsed_time": "12:48:06", "remaining_time": "2:32:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21090, "total_steps": 25254, "loss": 0.0807, "learning_rate": 3.480927069746659e-06, "epoch": 2.5053456878118316, "percentage": 83.51, "elapsed_time": "12:48:28", "remaining_time": "2:31:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21100, "total_steps": 25254, "loss": 0.0883, "learning_rate": 3.4646248640707508e-06, "epoch": 2.5065336184366833, "percentage": 83.55, "elapsed_time": "12:48:50", "remaining_time": "2:31:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21110, "total_steps": 25254, "loss": 0.0833, "learning_rate": 3.448358079473346e-06, "epoch": 2.507721549061535, "percentage": 83.59, "elapsed_time": "12:49:12", "remaining_time": "2:31:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21120, "total_steps": 25254, "loss": 0.083, "learning_rate": 3.4321267427098263e-06, "epoch": 2.5089094796863862, "percentage": 83.63, "elapsed_time": "12:49:34", "remaining_time": "2:30:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21130, "total_steps": 25254, "loss": 0.0827, "learning_rate": 3.415930880477258e-06, "epoch": 2.510097410311238, "percentage": 83.67, "elapsed_time": "12:49:56", "remaining_time": "2:30:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21140, "total_steps": 25254, "loss": 0.0845, "learning_rate": 3.399770519414364e-06, "epoch": 2.511285340936089, "percentage": 83.71, "elapsed_time": "12:50:18", "remaining_time": "2:29:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21150, "total_steps": 25254, "loss": 0.0848, "learning_rate": 3.383645686101483e-06, "epoch": 2.512473271560941, "percentage": 83.75, "elapsed_time": "12:50:39", "remaining_time": "2:29:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21160, "total_steps": 25254, "loss": 0.0835, "learning_rate": 3.367556407060507e-06, "epoch": 2.5136612021857925, "percentage": 83.79, "elapsed_time": "12:51:01", "remaining_time": "2:29:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21170, "total_steps": 25254, "loss": 0.0808, "learning_rate": 3.3515027087548555e-06, "epoch": 2.5148491328106437, "percentage": 83.83, "elapsed_time": "12:51:22", "remaining_time": "2:28:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21180, "total_steps": 25254, "loss": 0.0816, "learning_rate": 3.335484617589421e-06, "epoch": 2.5160370634354954, "percentage": 83.87, "elapsed_time": "12:51:45", "remaining_time": "2:28:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21190, "total_steps": 25254, "loss": 0.0815, "learning_rate": 3.3195021599105312e-06, "epoch": 2.5172249940603466, "percentage": 83.91, "elapsed_time": "12:52:06", "remaining_time": "2:28:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21200, "total_steps": 25254, "loss": 0.084, "learning_rate": 3.3035553620059086e-06, "epoch": 2.5184129246851983, "percentage": 83.95, "elapsed_time": "12:52:28", "remaining_time": "2:27:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21210, "total_steps": 25254, "loss": 0.0846, "learning_rate": 3.2876442501046156e-06, "epoch": 2.51960085531005, "percentage": 83.99, "elapsed_time": "12:52:50", "remaining_time": "2:27:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21220, "total_steps": 25254, "loss": 0.0849, "learning_rate": 3.2717688503770216e-06, "epoch": 2.5207887859349016, "percentage": 84.03, "elapsed_time": "12:53:12", "remaining_time": "2:26:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21230, "total_steps": 25254, "loss": 0.0826, "learning_rate": 3.255929188934759e-06, "epoch": 2.521976716559753, "percentage": 84.07, "elapsed_time": "12:53:34", "remaining_time": "2:26:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21240, "total_steps": 25254, "loss": 0.0823, "learning_rate": 3.2401252918306815e-06, "epoch": 2.5231646471846045, "percentage": 84.11, "elapsed_time": "12:53:56", "remaining_time": "2:26:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21250, "total_steps": 25254, "loss": 0.085, "learning_rate": 3.22435718505881e-06, "epoch": 2.5243525778094558, "percentage": 84.15, "elapsed_time": "12:54:18", "remaining_time": "2:25:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21260, "total_steps": 25254, "loss": 0.0806, "learning_rate": 3.2086248945543072e-06, "epoch": 2.5255405084343074, "percentage": 84.18, "elapsed_time": "12:54:40", "remaining_time": "2:25:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21270, "total_steps": 25254, "loss": 0.0832, "learning_rate": 3.1929284461934132e-06, "epoch": 2.526728439059159, "percentage": 84.22, "elapsed_time": "12:55:02", "remaining_time": "2:25:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21280, "total_steps": 25254, "loss": 0.0861, "learning_rate": 3.1772678657934237e-06, "epoch": 2.5279163696840103, "percentage": 84.26, "elapsed_time": "12:55:24", "remaining_time": "2:24:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21290, "total_steps": 25254, "loss": 0.0829, "learning_rate": 3.1616431791126473e-06, "epoch": 2.529104300308862, "percentage": 84.3, "elapsed_time": "12:55:45", "remaining_time": "2:24:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21300, "total_steps": 25254, "loss": 0.0845, "learning_rate": 3.1460544118503382e-06, "epoch": 2.5302922309337132, "percentage": 84.34, "elapsed_time": "12:56:07", "remaining_time": "2:24:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21310, "total_steps": 25254, "loss": 0.0826, "learning_rate": 3.130501589646684e-06, "epoch": 2.531480161558565, "percentage": 84.38, "elapsed_time": "12:56:28", "remaining_time": "2:23:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21320, "total_steps": 25254, "loss": 0.0803, "learning_rate": 3.114984738082738e-06, "epoch": 2.5326680921834166, "percentage": 84.42, "elapsed_time": "12:56:49", "remaining_time": "2:23:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21330, "total_steps": 25254, "loss": 0.0822, "learning_rate": 3.0995038826804047e-06, "epoch": 2.5338560228082683, "percentage": 84.46, "elapsed_time": "12:57:11", "remaining_time": "2:22:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21340, "total_steps": 25254, "loss": 0.0828, "learning_rate": 3.0840590489023687e-06, "epoch": 2.5350439534331195, "percentage": 84.5, "elapsed_time": "12:57:32", "remaining_time": "2:22:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21350, "total_steps": 25254, "loss": 0.0828, "learning_rate": 3.0686502621520756e-06, "epoch": 2.536231884057971, "percentage": 84.54, "elapsed_time": "12:57:54", "remaining_time": "2:22:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21360, "total_steps": 25254, "loss": 0.0838, "learning_rate": 3.0532775477736808e-06, "epoch": 2.5374198146828224, "percentage": 84.58, "elapsed_time": "12:58:15", "remaining_time": "2:21:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21370, "total_steps": 25254, "loss": 0.0868, "learning_rate": 3.037940931051997e-06, "epoch": 2.538607745307674, "percentage": 84.62, "elapsed_time": "12:58:37", "remaining_time": "2:21:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21380, "total_steps": 25254, "loss": 0.0819, "learning_rate": 3.0226404372124817e-06, "epoch": 2.5397956759325258, "percentage": 84.66, "elapsed_time": "12:58:59", "remaining_time": "2:21:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21390, "total_steps": 25254, "loss": 0.0852, "learning_rate": 3.0073760914211714e-06, "epoch": 2.540983606557377, "percentage": 84.7, "elapsed_time": "12:59:21", "remaining_time": "2:20:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21400, "total_steps": 25254, "loss": 0.0816, "learning_rate": 2.992147918784638e-06, "epoch": 2.5421715371822287, "percentage": 84.74, "elapsed_time": "12:59:43", "remaining_time": "2:20:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21410, "total_steps": 25254, "loss": 0.0818, "learning_rate": 2.9769559443499655e-06, "epoch": 2.54335946780708, "percentage": 84.78, "elapsed_time": "13:00:05", "remaining_time": "2:20:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21420, "total_steps": 25254, "loss": 0.0829, "learning_rate": 2.961800193104694e-06, "epoch": 2.5445473984319316, "percentage": 84.82, "elapsed_time": "13:00:27", "remaining_time": "2:19:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21430, "total_steps": 25254, "loss": 0.087, "learning_rate": 2.946680689976794e-06, "epoch": 2.5457353290567832, "percentage": 84.86, "elapsed_time": "13:00:49", "remaining_time": "2:19:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21440, "total_steps": 25254, "loss": 0.0837, "learning_rate": 2.931597459834609e-06, "epoch": 2.5469232596816345, "percentage": 84.9, "elapsed_time": "13:01:12", "remaining_time": "2:18:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21450, "total_steps": 25254, "loss": 0.0837, "learning_rate": 2.9165505274868165e-06, "epoch": 2.548111190306486, "percentage": 84.94, "elapsed_time": "13:01:33", "remaining_time": "2:18:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21460, "total_steps": 25254, "loss": 0.0835, "learning_rate": 2.901539917682397e-06, "epoch": 2.5492991209313374, "percentage": 84.98, "elapsed_time": "13:01:55", "remaining_time": "2:18:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21470, "total_steps": 25254, "loss": 0.082, "learning_rate": 2.8865656551105844e-06, "epoch": 2.550487051556189, "percentage": 85.02, "elapsed_time": "13:02:16", "remaining_time": "2:17:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21480, "total_steps": 25254, "loss": 0.0835, "learning_rate": 2.8716277644008445e-06, "epoch": 2.5516749821810407, "percentage": 85.06, "elapsed_time": "13:02:38", "remaining_time": "2:17:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21490, "total_steps": 25254, "loss": 0.0811, "learning_rate": 2.8567262701228e-06, "epoch": 2.5528629128058924, "percentage": 85.1, "elapsed_time": "13:03:00", "remaining_time": "2:17:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21500, "total_steps": 25254, "loss": 0.0804, "learning_rate": 2.8418611967862165e-06, "epoch": 2.5540508434307436, "percentage": 85.14, "elapsed_time": "13:03:22", "remaining_time": "2:16:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21510, "total_steps": 25254, "loss": 0.0815, "learning_rate": 2.827032568840954e-06, "epoch": 2.5552387740555953, "percentage": 85.17, "elapsed_time": "13:03:44", "remaining_time": "2:16:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21520, "total_steps": 25254, "loss": 0.0816, "learning_rate": 2.8122404106769307e-06, "epoch": 2.5564267046804465, "percentage": 85.21, "elapsed_time": "13:04:06", "remaining_time": "2:16:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21530, "total_steps": 25254, "loss": 0.0811, "learning_rate": 2.7974847466240768e-06, "epoch": 2.557614635305298, "percentage": 85.25, "elapsed_time": "13:04:28", "remaining_time": "2:15:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21540, "total_steps": 25254, "loss": 0.0813, "learning_rate": 2.7827656009523e-06, "epoch": 2.55880256593015, "percentage": 85.29, "elapsed_time": "13:04:50", "remaining_time": "2:15:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21550, "total_steps": 25254, "loss": 0.0811, "learning_rate": 2.7680829978714405e-06, "epoch": 2.559990496555001, "percentage": 85.33, "elapsed_time": "13:05:12", "remaining_time": "2:14:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21560, "total_steps": 25254, "loss": 0.0826, "learning_rate": 2.7534369615312306e-06, "epoch": 2.561178427179853, "percentage": 85.37, "elapsed_time": "13:05:34", "remaining_time": "2:14:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21570, "total_steps": 25254, "loss": 0.0789, "learning_rate": 2.7388275160212696e-06, "epoch": 2.562366357804704, "percentage": 85.41, "elapsed_time": "13:05:56", "remaining_time": "2:14:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21580, "total_steps": 25254, "loss": 0.0811, "learning_rate": 2.7242546853709638e-06, "epoch": 2.5635542884295557, "percentage": 85.45, "elapsed_time": "13:06:17", "remaining_time": "2:13:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21590, "total_steps": 25254, "loss": 0.0811, "learning_rate": 2.709718493549496e-06, "epoch": 2.5647422190544074, "percentage": 85.49, "elapsed_time": "13:06:39", "remaining_time": "2:13:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21600, "total_steps": 25254, "loss": 0.0816, "learning_rate": 2.69521896446579e-06, "epoch": 2.5659301496792586, "percentage": 85.53, "elapsed_time": "13:07:01", "remaining_time": "2:13:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21610, "total_steps": 25254, "loss": 0.0826, "learning_rate": 2.6807561219684557e-06, "epoch": 2.5671180803041103, "percentage": 85.57, "elapsed_time": "13:07:22", "remaining_time": "2:12:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21620, "total_steps": 25254, "loss": 0.082, "learning_rate": 2.666329989845784e-06, "epoch": 2.5683060109289615, "percentage": 85.61, "elapsed_time": "13:07:43", "remaining_time": "2:12:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21630, "total_steps": 25254, "loss": 0.0826, "learning_rate": 2.6519405918256635e-06, "epoch": 2.569493941553813, "percentage": 85.65, "elapsed_time": "13:08:05", "remaining_time": "2:12:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21640, "total_steps": 25254, "loss": 0.0867, "learning_rate": 2.6375879515755737e-06, "epoch": 2.570681872178665, "percentage": 85.69, "elapsed_time": "13:08:27", "remaining_time": "2:11:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21650, "total_steps": 25254, "loss": 0.0868, "learning_rate": 2.6232720927025362e-06, "epoch": 2.5718698028035165, "percentage": 85.73, "elapsed_time": "13:08:48", "remaining_time": "2:11:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21660, "total_steps": 25254, "loss": 0.0842, "learning_rate": 2.608993038753063e-06, "epoch": 2.5730577334283677, "percentage": 85.77, "elapsed_time": "13:09:10", "remaining_time": "2:10:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21670, "total_steps": 25254, "loss": 0.0826, "learning_rate": 2.594750813213148e-06, "epoch": 2.5742456640532194, "percentage": 85.81, "elapsed_time": "13:09:31", "remaining_time": "2:10:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21680, "total_steps": 25254, "loss": 0.0829, "learning_rate": 2.5805454395081947e-06, "epoch": 2.5754335946780706, "percentage": 85.85, "elapsed_time": "13:09:53", "remaining_time": "2:10:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21690, "total_steps": 25254, "loss": 0.0824, "learning_rate": 2.5663769410030042e-06, "epoch": 2.5766215253029223, "percentage": 85.89, "elapsed_time": "13:10:15", "remaining_time": "2:09:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21700, "total_steps": 25254, "loss": 0.0825, "learning_rate": 2.5522453410017135e-06, "epoch": 2.577809455927774, "percentage": 85.93, "elapsed_time": "13:10:36", "remaining_time": "2:09:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21710, "total_steps": 25254, "loss": 0.082, "learning_rate": 2.5381506627477874e-06, "epoch": 2.5789973865526252, "percentage": 85.97, "elapsed_time": "13:10:57", "remaining_time": "2:09:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21720, "total_steps": 25254, "loss": 0.0795, "learning_rate": 2.524092929423946e-06, "epoch": 2.580185317177477, "percentage": 86.01, "elapsed_time": "13:11:20", "remaining_time": "2:08:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21730, "total_steps": 25254, "loss": 0.0833, "learning_rate": 2.5100721641521523e-06, "epoch": 2.581373247802328, "percentage": 86.05, "elapsed_time": "13:11:42", "remaining_time": "2:08:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21740, "total_steps": 25254, "loss": 0.0825, "learning_rate": 2.496088389993559e-06, "epoch": 2.58256117842718, "percentage": 86.09, "elapsed_time": "13:12:05", "remaining_time": "2:08:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21750, "total_steps": 25254, "loss": 0.0833, "learning_rate": 2.482141629948473e-06, "epoch": 2.5837491090520315, "percentage": 86.12, "elapsed_time": "13:12:26", "remaining_time": "2:07:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21760, "total_steps": 25254, "loss": 0.0824, "learning_rate": 2.4682319069563394e-06, "epoch": 2.5849370396768827, "percentage": 86.16, "elapsed_time": "13:12:48", "remaining_time": "2:07:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21770, "total_steps": 25254, "loss": 0.0843, "learning_rate": 2.454359243895665e-06, "epoch": 2.5861249703017344, "percentage": 86.2, "elapsed_time": "13:13:09", "remaining_time": "2:06:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21780, "total_steps": 25254, "loss": 0.0817, "learning_rate": 2.44052366358401e-06, "epoch": 2.5873129009265856, "percentage": 86.24, "elapsed_time": "13:13:32", "remaining_time": "2:06:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21790, "total_steps": 25254, "loss": 0.0842, "learning_rate": 2.4267251887779395e-06, "epoch": 2.5885008315514373, "percentage": 86.28, "elapsed_time": "13:13:53", "remaining_time": "2:06:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21800, "total_steps": 25254, "loss": 0.0814, "learning_rate": 2.4129638421729857e-06, "epoch": 2.589688762176289, "percentage": 86.32, "elapsed_time": "13:14:15", "remaining_time": "2:05:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21810, "total_steps": 25254, "loss": 0.0808, "learning_rate": 2.3992396464036225e-06, "epoch": 2.5908766928011406, "percentage": 86.36, "elapsed_time": "13:14:37", "remaining_time": "2:05:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21820, "total_steps": 25254, "loss": 0.0818, "learning_rate": 2.385552624043205e-06, "epoch": 2.592064623425992, "percentage": 86.4, "elapsed_time": "13:14:59", "remaining_time": "2:05:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21830, "total_steps": 25254, "loss": 0.0824, "learning_rate": 2.371902797603964e-06, "epoch": 2.5932525540508435, "percentage": 86.44, "elapsed_time": "13:15:21", "remaining_time": "2:04:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21840, "total_steps": 25254, "loss": 0.0831, "learning_rate": 2.3582901895369213e-06, "epoch": 2.5944404846756948, "percentage": 86.48, "elapsed_time": "13:15:43", "remaining_time": "2:04:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21850, "total_steps": 25254, "loss": 0.0829, "learning_rate": 2.3447148222319138e-06, "epoch": 2.5956284153005464, "percentage": 86.52, "elapsed_time": "13:16:05", "remaining_time": "2:04:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21860, "total_steps": 25254, "loss": 0.0822, "learning_rate": 2.331176718017511e-06, "epoch": 2.596816345925398, "percentage": 86.56, "elapsed_time": "13:16:27", "remaining_time": "2:03:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21870, "total_steps": 25254, "loss": 0.0842, "learning_rate": 2.3176758991609928e-06, "epoch": 2.5980042765502493, "percentage": 86.6, "elapsed_time": "13:16:49", "remaining_time": "2:03:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21880, "total_steps": 25254, "loss": 0.0851, "learning_rate": 2.3042123878683126e-06, "epoch": 2.599192207175101, "percentage": 86.64, "elapsed_time": "13:17:11", "remaining_time": "2:02:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21890, "total_steps": 25254, "loss": 0.0821, "learning_rate": 2.2907862062840596e-06, "epoch": 2.6003801377999523, "percentage": 86.68, "elapsed_time": "13:17:33", "remaining_time": "2:02:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21900, "total_steps": 25254, "loss": 0.0791, "learning_rate": 2.2773973764914356e-06, "epoch": 2.601568068424804, "percentage": 86.72, "elapsed_time": "13:17:56", "remaining_time": "2:02:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21910, "total_steps": 25254, "loss": 0.0828, "learning_rate": 2.2640459205121894e-06, "epoch": 2.6027559990496556, "percentage": 86.76, "elapsed_time": "13:18:18", "remaining_time": "2:01:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21920, "total_steps": 25254, "loss": 0.0815, "learning_rate": 2.2507318603066097e-06, "epoch": 2.6039439296745073, "percentage": 86.8, "elapsed_time": "13:18:40", "remaining_time": "2:01:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21930, "total_steps": 25254, "loss": 0.0792, "learning_rate": 2.237455217773468e-06, "epoch": 2.6051318602993585, "percentage": 86.84, "elapsed_time": "13:19:02", "remaining_time": "2:01:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21940, "total_steps": 25254, "loss": 0.0824, "learning_rate": 2.2242160147499995e-06, "epoch": 2.60631979092421, "percentage": 86.88, "elapsed_time": "13:19:24", "remaining_time": "2:00:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21950, "total_steps": 25254, "loss": 0.0815, "learning_rate": 2.2110142730118607e-06, "epoch": 2.6075077215490614, "percentage": 86.92, "elapsed_time": "13:19:45", "remaining_time": "2:00:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21960, "total_steps": 25254, "loss": 0.0836, "learning_rate": 2.1978500142730867e-06, "epoch": 2.608695652173913, "percentage": 86.96, "elapsed_time": "13:20:07", "remaining_time": "2:00:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21970, "total_steps": 25254, "loss": 0.0817, "learning_rate": 2.184723260186061e-06, "epoch": 2.6098835827987648, "percentage": 87.0, "elapsed_time": "13:20:29", "remaining_time": "1:59:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21980, "total_steps": 25254, "loss": 0.0845, "learning_rate": 2.1716340323414825e-06, "epoch": 2.611071513423616, "percentage": 87.04, "elapsed_time": "13:20:51", "remaining_time": "1:59:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 21990, "total_steps": 25254, "loss": 0.082, "learning_rate": 2.1585823522683264e-06, "epoch": 2.6122594440484677, "percentage": 87.08, "elapsed_time": "13:21:13", "remaining_time": "1:58:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22000, "total_steps": 25254, "loss": 0.0802, "learning_rate": 2.1455682414338123e-06, "epoch": 2.613447374673319, "percentage": 87.11, "elapsed_time": "13:21:34", "remaining_time": "1:58:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22010, "total_steps": 25254, "loss": 0.081, "learning_rate": 2.13259172124336e-06, "epoch": 2.6146353052981706, "percentage": 87.15, "elapsed_time": "13:21:56", "remaining_time": "1:58:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22020, "total_steps": 25254, "loss": 0.082, "learning_rate": 2.119652813040571e-06, "epoch": 2.6158232359230222, "percentage": 87.19, "elapsed_time": "13:22:18", "remaining_time": "1:57:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22030, "total_steps": 25254, "loss": 0.0826, "learning_rate": 2.1067515381071713e-06, "epoch": 2.6170111665478735, "percentage": 87.23, "elapsed_time": "13:22:40", "remaining_time": "1:57:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22040, "total_steps": 25254, "loss": 0.0831, "learning_rate": 2.093887917663001e-06, "epoch": 2.618199097172725, "percentage": 87.27, "elapsed_time": "13:23:03", "remaining_time": "1:57:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22050, "total_steps": 25254, "loss": 0.0824, "learning_rate": 2.0810619728659552e-06, "epoch": 2.6193870277975764, "percentage": 87.31, "elapsed_time": "13:23:24", "remaining_time": "1:56:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22060, "total_steps": 25254, "loss": 0.0833, "learning_rate": 2.068273724811967e-06, "epoch": 2.620574958422428, "percentage": 87.35, "elapsed_time": "13:23:45", "remaining_time": "1:56:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22070, "total_steps": 25254, "loss": 0.082, "learning_rate": 2.0555231945349667e-06, "epoch": 2.6217628890472797, "percentage": 87.39, "elapsed_time": "13:24:07", "remaining_time": "1:56:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22080, "total_steps": 25254, "loss": 0.0822, "learning_rate": 2.0428104030068367e-06, "epoch": 2.6229508196721314, "percentage": 87.43, "elapsed_time": "13:24:29", "remaining_time": "1:55:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22090, "total_steps": 25254, "loss": 0.0819, "learning_rate": 2.0301353711374065e-06, "epoch": 2.6241387502969826, "percentage": 87.47, "elapsed_time": "13:24:52", "remaining_time": "1:55:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22100, "total_steps": 25254, "loss": 0.0839, "learning_rate": 2.017498119774383e-06, "epoch": 2.6253266809218343, "percentage": 87.51, "elapsed_time": "13:25:14", "remaining_time": "1:54:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22110, "total_steps": 25254, "loss": 0.0836, "learning_rate": 2.0048986697033366e-06, "epoch": 2.6265146115466855, "percentage": 87.55, "elapsed_time": "13:25:36", "remaining_time": "1:54:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22120, "total_steps": 25254, "loss": 0.0844, "learning_rate": 1.9923370416476655e-06, "epoch": 2.627702542171537, "percentage": 87.59, "elapsed_time": "13:25:57", "remaining_time": "1:54:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22130, "total_steps": 25254, "loss": 0.082, "learning_rate": 1.979813256268551e-06, "epoch": 2.628890472796389, "percentage": 87.63, "elapsed_time": "13:26:19", "remaining_time": "1:53:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22140, "total_steps": 25254, "loss": 0.0845, "learning_rate": 1.967327334164951e-06, "epoch": 2.63007840342124, "percentage": 87.67, "elapsed_time": "13:26:40", "remaining_time": "1:53:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22150, "total_steps": 25254, "loss": 0.0845, "learning_rate": 1.9548792958735185e-06, "epoch": 2.631266334046092, "percentage": 87.71, "elapsed_time": "13:27:02", "remaining_time": "1:53:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22160, "total_steps": 25254, "loss": 0.0821, "learning_rate": 1.9424691618686152e-06, "epoch": 2.632454264670943, "percentage": 87.75, "elapsed_time": "13:27:24", "remaining_time": "1:52:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22170, "total_steps": 25254, "loss": 0.0805, "learning_rate": 1.9300969525622464e-06, "epoch": 2.6336421952957947, "percentage": 87.79, "elapsed_time": "13:27:46", "remaining_time": "1:52:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22180, "total_steps": 25254, "loss": 0.0836, "learning_rate": 1.917762688304059e-06, "epoch": 2.6348301259206464, "percentage": 87.83, "elapsed_time": "13:28:08", "remaining_time": "1:52:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22190, "total_steps": 25254, "loss": 0.0825, "learning_rate": 1.9054663893812635e-06, "epoch": 2.6360180565454976, "percentage": 87.87, "elapsed_time": "13:28:30", "remaining_time": "1:51:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22200, "total_steps": 25254, "loss": 0.0818, "learning_rate": 1.893208076018646e-06, "epoch": 2.6372059871703493, "percentage": 87.91, "elapsed_time": "13:28:52", "remaining_time": "1:51:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22210, "total_steps": 25254, "loss": 0.0813, "learning_rate": 1.8809877683784977e-06, "epoch": 2.6383939177952005, "percentage": 87.95, "elapsed_time": "13:29:14", "remaining_time": "1:50:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22220, "total_steps": 25254, "loss": 0.0852, "learning_rate": 1.8688054865606098e-06, "epoch": 2.639581848420052, "percentage": 87.99, "elapsed_time": "13:29:36", "remaining_time": "1:50:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22230, "total_steps": 25254, "loss": 0.0808, "learning_rate": 1.856661250602229e-06, "epoch": 2.640769779044904, "percentage": 88.03, "elapsed_time": "13:29:58", "remaining_time": "1:50:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22240, "total_steps": 25254, "loss": 0.0824, "learning_rate": 1.8445550804780192e-06, "epoch": 2.6419577096697555, "percentage": 88.07, "elapsed_time": "13:30:20", "remaining_time": "1:49:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22250, "total_steps": 25254, "loss": 0.0838, "learning_rate": 1.8324869961000385e-06, "epoch": 2.6431456402946067, "percentage": 88.1, "elapsed_time": "13:30:42", "remaining_time": "1:49:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22260, "total_steps": 25254, "loss": 0.0825, "learning_rate": 1.8204570173176977e-06, "epoch": 2.6443335709194584, "percentage": 88.14, "elapsed_time": "13:31:03", "remaining_time": "1:49:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22270, "total_steps": 25254, "loss": 0.0832, "learning_rate": 1.808465163917733e-06, "epoch": 2.6455215015443097, "percentage": 88.18, "elapsed_time": "13:31:25", "remaining_time": "1:48:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22280, "total_steps": 25254, "loss": 0.081, "learning_rate": 1.796511455624178e-06, "epoch": 2.6467094321691613, "percentage": 88.22, "elapsed_time": "13:31:47", "remaining_time": "1:48:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22290, "total_steps": 25254, "loss": 0.0817, "learning_rate": 1.7845959120983247e-06, "epoch": 2.647897362794013, "percentage": 88.26, "elapsed_time": "13:32:09", "remaining_time": "1:47:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22300, "total_steps": 25254, "loss": 0.0809, "learning_rate": 1.7727185529386848e-06, "epoch": 2.6490852934188642, "percentage": 88.3, "elapsed_time": "13:32:31", "remaining_time": "1:47:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22310, "total_steps": 25254, "loss": 0.0816, "learning_rate": 1.76087939768097e-06, "epoch": 2.650273224043716, "percentage": 88.34, "elapsed_time": "13:32:53", "remaining_time": "1:47:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22320, "total_steps": 25254, "loss": 0.0819, "learning_rate": 1.7490784657980541e-06, "epoch": 2.651461154668567, "percentage": 88.38, "elapsed_time": "13:33:14", "remaining_time": "1:46:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22330, "total_steps": 25254, "loss": 0.0813, "learning_rate": 1.7373157766999437e-06, "epoch": 2.652649085293419, "percentage": 88.42, "elapsed_time": "13:33:36", "remaining_time": "1:46:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22340, "total_steps": 25254, "loss": 0.0832, "learning_rate": 1.7255913497337435e-06, "epoch": 2.6538370159182705, "percentage": 88.46, "elapsed_time": "13:33:58", "remaining_time": "1:46:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22350, "total_steps": 25254, "loss": 0.0811, "learning_rate": 1.713905204183619e-06, "epoch": 2.655024946543122, "percentage": 88.5, "elapsed_time": "13:34:20", "remaining_time": "1:45:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22360, "total_steps": 25254, "loss": 0.084, "learning_rate": 1.7022573592707759e-06, "epoch": 2.6562128771679734, "percentage": 88.54, "elapsed_time": "13:34:41", "remaining_time": "1:45:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22370, "total_steps": 25254, "loss": 0.0828, "learning_rate": 1.6906478341534303e-06, "epoch": 2.657400807792825, "percentage": 88.58, "elapsed_time": "13:35:03", "remaining_time": "1:45:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22380, "total_steps": 25254, "loss": 0.0788, "learning_rate": 1.679076647926761e-06, "epoch": 2.6585887384176763, "percentage": 88.62, "elapsed_time": "13:35:25", "remaining_time": "1:44:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22390, "total_steps": 25254, "loss": 0.0838, "learning_rate": 1.667543819622891e-06, "epoch": 2.659776669042528, "percentage": 88.66, "elapsed_time": "13:35:47", "remaining_time": "1:44:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22400, "total_steps": 25254, "loss": 0.0832, "learning_rate": 1.656049368210852e-06, "epoch": 2.6609645996673796, "percentage": 88.7, "elapsed_time": "13:36:09", "remaining_time": "1:43:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22410, "total_steps": 25254, "loss": 0.0827, "learning_rate": 1.6445933125965458e-06, "epoch": 2.662152530292231, "percentage": 88.74, "elapsed_time": "13:36:31", "remaining_time": "1:43:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22420, "total_steps": 25254, "loss": 0.0825, "learning_rate": 1.6331756716227442e-06, "epoch": 2.6633404609170825, "percentage": 88.78, "elapsed_time": "13:36:53", "remaining_time": "1:43:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22430, "total_steps": 25254, "loss": 0.0817, "learning_rate": 1.6217964640690113e-06, "epoch": 2.6645283915419338, "percentage": 88.82, "elapsed_time": "13:37:14", "remaining_time": "1:42:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22440, "total_steps": 25254, "loss": 0.0796, "learning_rate": 1.6104557086517092e-06, "epoch": 2.6657163221667854, "percentage": 88.86, "elapsed_time": "13:37:36", "remaining_time": "1:42:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22450, "total_steps": 25254, "loss": 0.0821, "learning_rate": 1.599153424023947e-06, "epoch": 2.666904252791637, "percentage": 88.9, "elapsed_time": "13:37:58", "remaining_time": "1:42:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22460, "total_steps": 25254, "loss": 0.0824, "learning_rate": 1.5878896287755657e-06, "epoch": 2.6680921834164883, "percentage": 88.94, "elapsed_time": "13:38:20", "remaining_time": "1:41:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22470, "total_steps": 25254, "loss": 0.0861, "learning_rate": 1.5766643414330956e-06, "epoch": 2.66928011404134, "percentage": 88.98, "elapsed_time": "13:38:42", "remaining_time": "1:41:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22480, "total_steps": 25254, "loss": 0.0831, "learning_rate": 1.565477580459726e-06, "epoch": 2.6704680446661913, "percentage": 89.02, "elapsed_time": "13:39:04", "remaining_time": "1:41:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22490, "total_steps": 25254, "loss": 0.081, "learning_rate": 1.5543293642552831e-06, "epoch": 2.671655975291043, "percentage": 89.06, "elapsed_time": "13:39:27", "remaining_time": "1:40:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22500, "total_steps": 25254, "loss": 0.0835, "learning_rate": 1.5432197111561937e-06, "epoch": 2.6728439059158946, "percentage": 89.09, "elapsed_time": "13:39:48", "remaining_time": "1:40:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22510, "total_steps": 25254, "loss": 0.0817, "learning_rate": 1.5321486394354601e-06, "epoch": 2.6740318365407463, "percentage": 89.13, "elapsed_time": "13:40:11", "remaining_time": "1:39:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22520, "total_steps": 25254, "loss": 0.0808, "learning_rate": 1.521116167302622e-06, "epoch": 2.6752197671655975, "percentage": 89.17, "elapsed_time": "13:40:33", "remaining_time": "1:39:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22530, "total_steps": 25254, "loss": 0.0808, "learning_rate": 1.5101223129037333e-06, "epoch": 2.676407697790449, "percentage": 89.21, "elapsed_time": "13:40:54", "remaining_time": "1:39:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22540, "total_steps": 25254, "loss": 0.0833, "learning_rate": 1.499167094321327e-06, "epoch": 2.6775956284153004, "percentage": 89.25, "elapsed_time": "13:41:15", "remaining_time": "1:38:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22550, "total_steps": 25254, "loss": 0.0811, "learning_rate": 1.4882505295743894e-06, "epoch": 2.678783559040152, "percentage": 89.29, "elapsed_time": "13:41:38", "remaining_time": "1:38:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22560, "total_steps": 25254, "loss": 0.0803, "learning_rate": 1.4773726366183377e-06, "epoch": 2.6799714896650038, "percentage": 89.33, "elapsed_time": "13:42:00", "remaining_time": "1:38:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22570, "total_steps": 25254, "loss": 0.0835, "learning_rate": 1.4665334333449714e-06, "epoch": 2.681159420289855, "percentage": 89.37, "elapsed_time": "13:42:22", "remaining_time": "1:37:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22580, "total_steps": 25254, "loss": 0.081, "learning_rate": 1.4557329375824574e-06, "epoch": 2.6823473509147067, "percentage": 89.41, "elapsed_time": "13:42:43", "remaining_time": "1:37:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22590, "total_steps": 25254, "loss": 0.0823, "learning_rate": 1.4449711670952966e-06, "epoch": 2.683535281539558, "percentage": 89.45, "elapsed_time": "13:43:05", "remaining_time": "1:37:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22600, "total_steps": 25254, "loss": 0.0852, "learning_rate": 1.4342481395842933e-06, "epoch": 2.6847232121644096, "percentage": 89.49, "elapsed_time": "13:43:27", "remaining_time": "1:36:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22610, "total_steps": 25254, "loss": 0.0829, "learning_rate": 1.423563872686537e-06, "epoch": 2.6859111427892612, "percentage": 89.53, "elapsed_time": "13:43:49", "remaining_time": "1:36:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22620, "total_steps": 25254, "loss": 0.0853, "learning_rate": 1.4129183839753535e-06, "epoch": 2.6870990734141125, "percentage": 89.57, "elapsed_time": "13:44:11", "remaining_time": "1:35:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22630, "total_steps": 25254, "loss": 0.083, "learning_rate": 1.4023116909602952e-06, "epoch": 2.688287004038964, "percentage": 89.61, "elapsed_time": "13:44:33", "remaining_time": "1:35:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22640, "total_steps": 25254, "loss": 0.0834, "learning_rate": 1.3917438110870984e-06, "epoch": 2.6894749346638154, "percentage": 89.65, "elapsed_time": "13:44:54", "remaining_time": "1:35:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22650, "total_steps": 25254, "loss": 0.0819, "learning_rate": 1.3812147617376563e-06, "epoch": 2.690662865288667, "percentage": 89.69, "elapsed_time": "13:45:15", "remaining_time": "1:34:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22660, "total_steps": 25254, "loss": 0.0824, "learning_rate": 1.370724560230005e-06, "epoch": 2.6918507959135187, "percentage": 89.73, "elapsed_time": "13:45:37", "remaining_time": "1:34:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22670, "total_steps": 25254, "loss": 0.0859, "learning_rate": 1.3602732238182786e-06, "epoch": 2.6930387265383704, "percentage": 89.77, "elapsed_time": "13:45:59", "remaining_time": "1:34:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22680, "total_steps": 25254, "loss": 0.0819, "learning_rate": 1.3498607696926818e-06, "epoch": 2.6942266571632216, "percentage": 89.81, "elapsed_time": "13:46:21", "remaining_time": "1:33:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22690, "total_steps": 25254, "loss": 0.0834, "learning_rate": 1.3394872149794736e-06, "epoch": 2.6954145877880733, "percentage": 89.85, "elapsed_time": "13:46:42", "remaining_time": "1:33:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22700, "total_steps": 25254, "loss": 0.0814, "learning_rate": 1.3291525767409303e-06, "epoch": 2.6966025184129245, "percentage": 89.89, "elapsed_time": "13:47:04", "remaining_time": "1:33:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22710, "total_steps": 25254, "loss": 0.0807, "learning_rate": 1.3188568719753185e-06, "epoch": 2.697790449037776, "percentage": 89.93, "elapsed_time": "13:47:25", "remaining_time": "1:32:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22720, "total_steps": 25254, "loss": 0.0826, "learning_rate": 1.308600117616865e-06, "epoch": 2.698978379662628, "percentage": 89.97, "elapsed_time": "13:47:47", "remaining_time": "1:32:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22730, "total_steps": 25254, "loss": 0.0827, "learning_rate": 1.2983823305357329e-06, "epoch": 2.700166310287479, "percentage": 90.01, "elapsed_time": "13:48:09", "remaining_time": "1:31:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22740, "total_steps": 25254, "loss": 0.0827, "learning_rate": 1.2882035275379928e-06, "epoch": 2.701354240912331, "percentage": 90.05, "elapsed_time": "13:48:31", "remaining_time": "1:31:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22750, "total_steps": 25254, "loss": 0.0817, "learning_rate": 1.278063725365597e-06, "epoch": 2.702542171537182, "percentage": 90.08, "elapsed_time": "13:48:55", "remaining_time": "1:31:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22760, "total_steps": 25254, "loss": 0.0817, "learning_rate": 1.2679629406963462e-06, "epoch": 2.7037301021620337, "percentage": 90.12, "elapsed_time": "13:49:17", "remaining_time": "1:30:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22770, "total_steps": 25254, "loss": 0.0804, "learning_rate": 1.2579011901438704e-06, "epoch": 2.7049180327868854, "percentage": 90.16, "elapsed_time": "13:49:39", "remaining_time": "1:30:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22780, "total_steps": 25254, "loss": 0.0836, "learning_rate": 1.2478784902575896e-06, "epoch": 2.7061059634117366, "percentage": 90.2, "elapsed_time": "13:50:01", "remaining_time": "1:30:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22790, "total_steps": 25254, "loss": 0.0798, "learning_rate": 1.2378948575227006e-06, "epoch": 2.7072938940365883, "percentage": 90.24, "elapsed_time": "13:50:22", "remaining_time": "1:29:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22800, "total_steps": 25254, "loss": 0.0831, "learning_rate": 1.2279503083601373e-06, "epoch": 2.7084818246614395, "percentage": 90.28, "elapsed_time": "13:50:44", "remaining_time": "1:29:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22810, "total_steps": 25254, "loss": 0.0832, "learning_rate": 1.2180448591265548e-06, "epoch": 2.709669755286291, "percentage": 90.32, "elapsed_time": "13:51:06", "remaining_time": "1:29:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22820, "total_steps": 25254, "loss": 0.0812, "learning_rate": 1.2081785261142952e-06, "epoch": 2.710857685911143, "percentage": 90.36, "elapsed_time": "13:51:28", "remaining_time": "1:28:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22830, "total_steps": 25254, "loss": 0.0823, "learning_rate": 1.1983513255513612e-06, "epoch": 2.7120456165359945, "percentage": 90.4, "elapsed_time": "13:51:50", "remaining_time": "1:28:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22840, "total_steps": 25254, "loss": 0.0825, "learning_rate": 1.1885632736013923e-06, "epoch": 2.7132335471608457, "percentage": 90.44, "elapsed_time": "13:52:12", "remaining_time": "1:27:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22850, "total_steps": 25254, "loss": 0.0826, "learning_rate": 1.1788143863636413e-06, "epoch": 2.7144214777856974, "percentage": 90.48, "elapsed_time": "13:52:33", "remaining_time": "1:27:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22860, "total_steps": 25254, "loss": 0.0799, "learning_rate": 1.1691046798729372e-06, "epoch": 2.7156094084105487, "percentage": 90.52, "elapsed_time": "13:52:55", "remaining_time": "1:27:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22870, "total_steps": 25254, "loss": 0.0812, "learning_rate": 1.159434170099663e-06, "epoch": 2.7167973390354003, "percentage": 90.56, "elapsed_time": "13:53:17", "remaining_time": "1:26:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22880, "total_steps": 25254, "loss": 0.0834, "learning_rate": 1.1498028729497344e-06, "epoch": 2.717985269660252, "percentage": 90.6, "elapsed_time": "13:53:38", "remaining_time": "1:26:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22890, "total_steps": 25254, "loss": 0.0794, "learning_rate": 1.1402108042645825e-06, "epoch": 2.7191732002851032, "percentage": 90.64, "elapsed_time": "13:54:01", "remaining_time": "1:26:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22900, "total_steps": 25254, "loss": 0.0827, "learning_rate": 1.1306579798210953e-06, "epoch": 2.720361130909955, "percentage": 90.68, "elapsed_time": "13:54:23", "remaining_time": "1:25:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22910, "total_steps": 25254, "loss": 0.0819, "learning_rate": 1.121144415331629e-06, "epoch": 2.721549061534806, "percentage": 90.72, "elapsed_time": "13:54:45", "remaining_time": "1:25:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22920, "total_steps": 25254, "loss": 0.0813, "learning_rate": 1.1116701264439534e-06, "epoch": 2.722736992159658, "percentage": 90.76, "elapsed_time": "13:55:07", "remaining_time": "1:25:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22930, "total_steps": 25254, "loss": 0.0821, "learning_rate": 1.1022351287412442e-06, "epoch": 2.7239249227845095, "percentage": 90.8, "elapsed_time": "13:55:28", "remaining_time": "1:24:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22940, "total_steps": 25254, "loss": 0.0844, "learning_rate": 1.0928394377420576e-06, "epoch": 2.725112853409361, "percentage": 90.84, "elapsed_time": "13:55:50", "remaining_time": "1:24:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22950, "total_steps": 25254, "loss": 0.0793, "learning_rate": 1.08348306890029e-06, "epoch": 2.7263007840342124, "percentage": 90.88, "elapsed_time": "13:56:11", "remaining_time": "1:23:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22960, "total_steps": 25254, "loss": 0.0798, "learning_rate": 1.0741660376051593e-06, "epoch": 2.727488714659064, "percentage": 90.92, "elapsed_time": "13:56:33", "remaining_time": "1:23:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22970, "total_steps": 25254, "loss": 0.0832, "learning_rate": 1.0648883591811903e-06, "epoch": 2.7286766452839153, "percentage": 90.96, "elapsed_time": "13:56:54", "remaining_time": "1:23:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22980, "total_steps": 25254, "loss": 0.0771, "learning_rate": 1.0556500488881737e-06, "epoch": 2.729864575908767, "percentage": 91.0, "elapsed_time": "13:57:17", "remaining_time": "1:22:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 22990, "total_steps": 25254, "loss": 0.0819, "learning_rate": 1.046451121921152e-06, "epoch": 2.7310525065336186, "percentage": 91.04, "elapsed_time": "13:57:39", "remaining_time": "1:22:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23000, "total_steps": 25254, "loss": 0.0827, "learning_rate": 1.0372915934103916e-06, "epoch": 2.73224043715847, "percentage": 91.07, "elapsed_time": "13:58:01", "remaining_time": "1:22:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23010, "total_steps": 25254, "loss": 0.0831, "learning_rate": 1.0281714784213526e-06, "epoch": 2.7334283677833215, "percentage": 91.11, "elapsed_time": "13:58:23", "remaining_time": "1:21:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23020, "total_steps": 25254, "loss": 0.0812, "learning_rate": 1.0190907919546634e-06, "epoch": 2.7346162984081728, "percentage": 91.15, "elapsed_time": "13:58:45", "remaining_time": "1:21:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23030, "total_steps": 25254, "loss": 0.0813, "learning_rate": 1.010049548946121e-06, "epoch": 2.7358042290330244, "percentage": 91.19, "elapsed_time": "13:59:08", "remaining_time": "1:21:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23040, "total_steps": 25254, "loss": 0.081, "learning_rate": 1.0010477642666244e-06, "epoch": 2.736992159657876, "percentage": 91.23, "elapsed_time": "13:59:29", "remaining_time": "1:20:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23050, "total_steps": 25254, "loss": 0.0814, "learning_rate": 9.920854527221857e-07, "epoch": 2.7381800902827274, "percentage": 91.27, "elapsed_time": "13:59:51", "remaining_time": "1:20:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23060, "total_steps": 25254, "loss": 0.0828, "learning_rate": 9.831626290538853e-07, "epoch": 2.739368020907579, "percentage": 91.31, "elapsed_time": "14:00:14", "remaining_time": "1:19:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23070, "total_steps": 25254, "loss": 0.0831, "learning_rate": 9.742793079378505e-07, "epoch": 2.7405559515324303, "percentage": 91.35, "elapsed_time": "14:00:35", "remaining_time": "1:19:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23080, "total_steps": 25254, "loss": 0.0823, "learning_rate": 9.654355039852514e-07, "epoch": 2.741743882157282, "percentage": 91.39, "elapsed_time": "14:00:57", "remaining_time": "1:19:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23090, "total_steps": 25254, "loss": 0.0829, "learning_rate": 9.566312317422471e-07, "epoch": 2.7429318127821336, "percentage": 91.43, "elapsed_time": "14:01:19", "remaining_time": "1:18:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23100, "total_steps": 25254, "loss": 0.0812, "learning_rate": 9.478665056899789e-07, "epoch": 2.7441197434069853, "percentage": 91.47, "elapsed_time": "14:01:41", "remaining_time": "1:18:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23110, "total_steps": 25254, "loss": 0.0826, "learning_rate": 9.391413402445454e-07, "epoch": 2.7453076740318365, "percentage": 91.51, "elapsed_time": "14:02:03", "remaining_time": "1:18:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23120, "total_steps": 25254, "loss": 0.0834, "learning_rate": 9.3045574975697e-07, "epoch": 2.746495604656688, "percentage": 91.55, "elapsed_time": "14:02:25", "remaining_time": "1:17:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23130, "total_steps": 25254, "loss": 0.0827, "learning_rate": 9.218097485131915e-07, "epoch": 2.7476835352815394, "percentage": 91.59, "elapsed_time": "14:02:47", "remaining_time": "1:17:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23140, "total_steps": 25254, "loss": 0.0816, "learning_rate": 9.132033507340293e-07, "epoch": 2.748871465906391, "percentage": 91.63, "elapsed_time": "14:03:08", "remaining_time": "1:17:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23150, "total_steps": 25254, "loss": 0.0813, "learning_rate": 9.046365705751625e-07, "epoch": 2.7500593965312428, "percentage": 91.67, "elapsed_time": "14:03:30", "remaining_time": "1:16:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23160, "total_steps": 25254, "loss": 0.0828, "learning_rate": 8.961094221271088e-07, "epoch": 2.751247327156094, "percentage": 91.71, "elapsed_time": "14:03:52", "remaining_time": "1:16:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23170, "total_steps": 25254, "loss": 0.084, "learning_rate": 8.876219194152046e-07, "epoch": 2.7524352577809457, "percentage": 91.75, "elapsed_time": "14:04:14", "remaining_time": "1:15:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23180, "total_steps": 25254, "loss": 0.0818, "learning_rate": 8.791740763995721e-07, "epoch": 2.753623188405797, "percentage": 91.79, "elapsed_time": "14:04:35", "remaining_time": "1:15:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23190, "total_steps": 25254, "loss": 0.0836, "learning_rate": 8.707659069751018e-07, "epoch": 2.7548111190306486, "percentage": 91.83, "elapsed_time": "14:04:57", "remaining_time": "1:15:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23200, "total_steps": 25254, "loss": 0.0806, "learning_rate": 8.623974249714311e-07, "epoch": 2.7559990496555002, "percentage": 91.87, "elapsed_time": "14:05:19", "remaining_time": "1:14:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23210, "total_steps": 25254, "loss": 0.0811, "learning_rate": 8.540686441529166e-07, "epoch": 2.7571869802803515, "percentage": 91.91, "elapsed_time": "14:05:42", "remaining_time": "1:14:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23220, "total_steps": 25254, "loss": 0.0821, "learning_rate": 8.457795782186278e-07, "epoch": 2.758374910905203, "percentage": 91.95, "elapsed_time": "14:06:03", "remaining_time": "1:14:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23230, "total_steps": 25254, "loss": 0.0809, "learning_rate": 8.37530240802295e-07, "epoch": 2.7595628415300544, "percentage": 91.99, "elapsed_time": "14:06:24", "remaining_time": "1:13:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23240, "total_steps": 25254, "loss": 0.0796, "learning_rate": 8.293206454723145e-07, "epoch": 2.760750772154906, "percentage": 92.03, "elapsed_time": "14:06:47", "remaining_time": "1:13:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23250, "total_steps": 25254, "loss": 0.0824, "learning_rate": 8.211508057317074e-07, "epoch": 2.7619387027797577, "percentage": 92.06, "elapsed_time": "14:07:08", "remaining_time": "1:13:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23260, "total_steps": 25254, "loss": 0.0836, "learning_rate": 8.130207350181135e-07, "epoch": 2.7631266334046094, "percentage": 92.1, "elapsed_time": "14:07:30", "remaining_time": "1:12:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23270, "total_steps": 25254, "loss": 0.0813, "learning_rate": 8.049304467037583e-07, "epoch": 2.7643145640294606, "percentage": 92.14, "elapsed_time": "14:07:52", "remaining_time": "1:12:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23280, "total_steps": 25254, "loss": 0.0815, "learning_rate": 7.968799540954308e-07, "epoch": 2.7655024946543123, "percentage": 92.18, "elapsed_time": "14:08:14", "remaining_time": "1:11:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23290, "total_steps": 25254, "loss": 0.0829, "learning_rate": 7.888692704344669e-07, "epoch": 2.7666904252791635, "percentage": 92.22, "elapsed_time": "14:08:36", "remaining_time": "1:11:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23300, "total_steps": 25254, "loss": 0.0805, "learning_rate": 7.80898408896727e-07, "epoch": 2.767878355904015, "percentage": 92.26, "elapsed_time": "14:08:59", "remaining_time": "1:11:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23310, "total_steps": 25254, "loss": 0.0795, "learning_rate": 7.729673825925654e-07, "epoch": 2.769066286528867, "percentage": 92.3, "elapsed_time": "14:09:21", "remaining_time": "1:10:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23320, "total_steps": 25254, "loss": 0.0812, "learning_rate": 7.650762045668281e-07, "epoch": 2.770254217153718, "percentage": 92.34, "elapsed_time": "14:09:43", "remaining_time": "1:10:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23330, "total_steps": 25254, "loss": 0.0845, "learning_rate": 7.572248877988075e-07, "epoch": 2.77144214777857, "percentage": 92.38, "elapsed_time": "14:10:05", "remaining_time": "1:10:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23340, "total_steps": 25254, "loss": 0.0827, "learning_rate": 7.494134452022406e-07, "epoch": 2.772630078403421, "percentage": 92.42, "elapsed_time": "14:10:27", "remaining_time": "1:09:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23350, "total_steps": 25254, "loss": 0.0836, "learning_rate": 7.416418896252719e-07, "epoch": 2.7738180090282727, "percentage": 92.46, "elapsed_time": "14:10:48", "remaining_time": "1:09:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23360, "total_steps": 25254, "loss": 0.0832, "learning_rate": 7.339102338504516e-07, "epoch": 2.7750059396531244, "percentage": 92.5, "elapsed_time": "14:11:11", "remaining_time": "1:09:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23370, "total_steps": 25254, "loss": 0.0807, "learning_rate": 7.262184905946962e-07, "epoch": 2.776193870277976, "percentage": 92.54, "elapsed_time": "14:11:33", "remaining_time": "1:08:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23380, "total_steps": 25254, "loss": 0.0838, "learning_rate": 7.185666725092716e-07, "epoch": 2.7773818009028273, "percentage": 92.58, "elapsed_time": "14:11:55", "remaining_time": "1:08:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23390, "total_steps": 25254, "loss": 0.0844, "learning_rate": 7.109547921797827e-07, "epoch": 2.778569731527679, "percentage": 92.62, "elapsed_time": "14:12:17", "remaining_time": "1:07:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23400, "total_steps": 25254, "loss": 0.0857, "learning_rate": 7.033828621261396e-07, "epoch": 2.77975766215253, "percentage": 92.66, "elapsed_time": "14:12:38", "remaining_time": "1:07:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23410, "total_steps": 25254, "loss": 0.0839, "learning_rate": 6.958508948025494e-07, "epoch": 2.780945592777382, "percentage": 92.7, "elapsed_time": "14:13:00", "remaining_time": "1:07:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23420, "total_steps": 25254, "loss": 0.0836, "learning_rate": 6.883589025974801e-07, "epoch": 2.7821335234022335, "percentage": 92.74, "elapsed_time": "14:13:22", "remaining_time": "1:06:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23430, "total_steps": 25254, "loss": 0.0818, "learning_rate": 6.809068978336553e-07, "epoch": 2.7833214540270848, "percentage": 92.78, "elapsed_time": "14:13:44", "remaining_time": "1:06:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23440, "total_steps": 25254, "loss": 0.0831, "learning_rate": 6.734948927680257e-07, "epoch": 2.7845093846519364, "percentage": 92.82, "elapsed_time": "14:14:06", "remaining_time": "1:06:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23450, "total_steps": 25254, "loss": 0.0814, "learning_rate": 6.661228995917534e-07, "epoch": 2.7856973152767877, "percentage": 92.86, "elapsed_time": "14:14:28", "remaining_time": "1:05:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23460, "total_steps": 25254, "loss": 0.083, "learning_rate": 6.587909304301893e-07, "epoch": 2.7868852459016393, "percentage": 92.9, "elapsed_time": "14:14:50", "remaining_time": "1:05:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23470, "total_steps": 25254, "loss": 0.0813, "learning_rate": 6.514989973428476e-07, "epoch": 2.788073176526491, "percentage": 92.94, "elapsed_time": "14:15:12", "remaining_time": "1:05:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23480, "total_steps": 25254, "loss": 0.0786, "learning_rate": 6.442471123233984e-07, "epoch": 2.7892611071513422, "percentage": 92.98, "elapsed_time": "14:15:34", "remaining_time": "1:04:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23490, "total_steps": 25254, "loss": 0.081, "learning_rate": 6.370352872996338e-07, "epoch": 2.790449037776194, "percentage": 93.01, "elapsed_time": "14:15:56", "remaining_time": "1:04:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23500, "total_steps": 25254, "loss": 0.0844, "learning_rate": 6.298635341334708e-07, "epoch": 2.791636968401045, "percentage": 93.05, "elapsed_time": "14:16:17", "remaining_time": "1:03:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23510, "total_steps": 25254, "loss": 0.0828, "learning_rate": 6.22731864620904e-07, "epoch": 2.792824899025897, "percentage": 93.09, "elapsed_time": "14:16:40", "remaining_time": "1:03:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23520, "total_steps": 25254, "loss": 0.0821, "learning_rate": 6.15640290491995e-07, "epoch": 2.7940128296507485, "percentage": 93.13, "elapsed_time": "14:17:02", "remaining_time": "1:03:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23530, "total_steps": 25254, "loss": 0.0797, "learning_rate": 6.085888234108716e-07, "epoch": 2.7952007602756, "percentage": 93.17, "elapsed_time": "14:17:24", "remaining_time": "1:02:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23540, "total_steps": 25254, "loss": 0.0791, "learning_rate": 6.015774749756814e-07, "epoch": 2.7963886909004514, "percentage": 93.21, "elapsed_time": "14:17:45", "remaining_time": "1:02:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23550, "total_steps": 25254, "loss": 0.0827, "learning_rate": 5.946062567185967e-07, "epoch": 2.797576621525303, "percentage": 93.25, "elapsed_time": "14:18:07", "remaining_time": "1:02:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23560, "total_steps": 25254, "loss": 0.0818, "learning_rate": 5.876751801057706e-07, "epoch": 2.7987645521501543, "percentage": 93.29, "elapsed_time": "14:18:29", "remaining_time": "1:01:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23570, "total_steps": 25254, "loss": 0.0841, "learning_rate": 5.807842565373451e-07, "epoch": 2.799952482775006, "percentage": 93.33, "elapsed_time": "14:18:52", "remaining_time": "1:01:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23580, "total_steps": 25254, "loss": 0.0808, "learning_rate": 5.739334973474119e-07, "epoch": 2.8011404133998576, "percentage": 93.37, "elapsed_time": "14:19:14", "remaining_time": "1:00:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23590, "total_steps": 25254, "loss": 0.0822, "learning_rate": 5.671229138039968e-07, "epoch": 2.802328344024709, "percentage": 93.41, "elapsed_time": "14:19:36", "remaining_time": "1:00:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23600, "total_steps": 25254, "loss": 0.081, "learning_rate": 5.603525171090584e-07, "epoch": 2.8035162746495605, "percentage": 93.45, "elapsed_time": "14:19:58", "remaining_time": "1:00:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23610, "total_steps": 25254, "loss": 0.0841, "learning_rate": 5.536223183984446e-07, "epoch": 2.8047042052744118, "percentage": 93.49, "elapsed_time": "14:20:20", "remaining_time": "0:59:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23620, "total_steps": 25254, "loss": 0.0828, "learning_rate": 5.469323287418948e-07, "epoch": 2.8058921358992635, "percentage": 93.53, "elapsed_time": "14:20:41", "remaining_time": "0:59:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23630, "total_steps": 25254, "loss": 0.0815, "learning_rate": 5.402825591430016e-07, "epoch": 2.807080066524115, "percentage": 93.57, "elapsed_time": "14:21:03", "remaining_time": "0:59:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23640, "total_steps": 25254, "loss": 0.0812, "learning_rate": 5.33673020539216e-07, "epoch": 2.8082679971489664, "percentage": 93.61, "elapsed_time": "14:21:25", "remaining_time": "0:58:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23650, "total_steps": 25254, "loss": 0.08, "learning_rate": 5.271037238018139e-07, "epoch": 2.809455927773818, "percentage": 93.65, "elapsed_time": "14:21:46", "remaining_time": "0:58:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23660, "total_steps": 25254, "loss": 0.0783, "learning_rate": 5.205746797358773e-07, "epoch": 2.8106438583986693, "percentage": 93.69, "elapsed_time": "14:22:08", "remaining_time": "0:58:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23670, "total_steps": 25254, "loss": 0.0822, "learning_rate": 5.140858990802882e-07, "epoch": 2.811831789023521, "percentage": 93.73, "elapsed_time": "14:22:30", "remaining_time": "0:57:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23680, "total_steps": 25254, "loss": 0.0835, "learning_rate": 5.076373925076955e-07, "epoch": 2.8130197196483726, "percentage": 93.77, "elapsed_time": "14:22:53", "remaining_time": "0:57:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23690, "total_steps": 25254, "loss": 0.081, "learning_rate": 5.012291706245204e-07, "epoch": 2.8142076502732243, "percentage": 93.81, "elapsed_time": "14:23:14", "remaining_time": "0:56:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23700, "total_steps": 25254, "loss": 0.0819, "learning_rate": 4.948612439709066e-07, "epoch": 2.8153955808980755, "percentage": 93.85, "elapsed_time": "14:23:36", "remaining_time": "0:56:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23710, "total_steps": 25254, "loss": 0.082, "learning_rate": 4.885336230207344e-07, "epoch": 2.816583511522927, "percentage": 93.89, "elapsed_time": "14:23:58", "remaining_time": "0:56:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23720, "total_steps": 25254, "loss": 0.0817, "learning_rate": 4.822463181815812e-07, "epoch": 2.8177714421477784, "percentage": 93.93, "elapsed_time": "14:24:20", "remaining_time": "0:55:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23730, "total_steps": 25254, "loss": 0.0833, "learning_rate": 4.7599933979471655e-07, "epoch": 2.81895937277263, "percentage": 93.97, "elapsed_time": "14:24:42", "remaining_time": "0:55:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23740, "total_steps": 25254, "loss": 0.0825, "learning_rate": 4.697926981350853e-07, "epoch": 2.8201473033974818, "percentage": 94.0, "elapsed_time": "14:25:03", "remaining_time": "0:55:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23750, "total_steps": 25254, "loss": 0.0835, "learning_rate": 4.636264034112797e-07, "epoch": 2.821335234022333, "percentage": 94.04, "elapsed_time": "14:25:26", "remaining_time": "0:54:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23760, "total_steps": 25254, "loss": 0.0833, "learning_rate": 4.5750046576553684e-07, "epoch": 2.8225231646471847, "percentage": 94.08, "elapsed_time": "14:25:47", "remaining_time": "0:54:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23770, "total_steps": 25254, "loss": 0.0831, "learning_rate": 4.5141489527370796e-07, "epoch": 2.823711095272036, "percentage": 94.12, "elapsed_time": "14:26:09", "remaining_time": "0:54:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23780, "total_steps": 25254, "loss": 0.079, "learning_rate": 4.4536970194525573e-07, "epoch": 2.8248990258968876, "percentage": 94.16, "elapsed_time": "14:26:31", "remaining_time": "0:53:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23790, "total_steps": 25254, "loss": 0.0828, "learning_rate": 4.393648957232266e-07, "epoch": 2.8260869565217392, "percentage": 94.2, "elapsed_time": "14:26:53", "remaining_time": "0:53:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23800, "total_steps": 25254, "loss": 0.0805, "learning_rate": 4.334004864842395e-07, "epoch": 2.8272748871465905, "percentage": 94.24, "elapsed_time": "14:27:15", "remaining_time": "0:52:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23810, "total_steps": 25254, "loss": 0.0823, "learning_rate": 4.274764840384721e-07, "epoch": 2.828462817771442, "percentage": 94.28, "elapsed_time": "14:27:37", "remaining_time": "0:52:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23820, "total_steps": 25254, "loss": 0.0826, "learning_rate": 4.215928981296358e-07, "epoch": 2.8296507483962934, "percentage": 94.32, "elapsed_time": "14:27:59", "remaining_time": "0:52:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23830, "total_steps": 25254, "loss": 0.0844, "learning_rate": 4.157497384349729e-07, "epoch": 2.830838679021145, "percentage": 94.36, "elapsed_time": "14:28:20", "remaining_time": "0:51:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23840, "total_steps": 25254, "loss": 0.0818, "learning_rate": 4.09947014565229e-07, "epoch": 2.8320266096459967, "percentage": 94.4, "elapsed_time": "14:28:41", "remaining_time": "0:51:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23850, "total_steps": 25254, "loss": 0.08, "learning_rate": 4.041847360646389e-07, "epoch": 2.8332145402708484, "percentage": 94.44, "elapsed_time": "14:29:03", "remaining_time": "0:51:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23860, "total_steps": 25254, "loss": 0.0821, "learning_rate": 3.984629124109185e-07, "epoch": 2.8344024708956996, "percentage": 94.48, "elapsed_time": "14:29:26", "remaining_time": "0:50:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23870, "total_steps": 25254, "loss": 0.0827, "learning_rate": 3.927815530152396e-07, "epoch": 2.8355904015205513, "percentage": 94.52, "elapsed_time": "14:29:48", "remaining_time": "0:50:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23880, "total_steps": 25254, "loss": 0.0821, "learning_rate": 3.8714066722222444e-07, "epoch": 2.8367783321454025, "percentage": 94.56, "elapsed_time": "14:30:11", "remaining_time": "0:50:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23890, "total_steps": 25254, "loss": 0.0816, "learning_rate": 3.8154026430992085e-07, "epoch": 2.837966262770254, "percentage": 94.6, "elapsed_time": "14:30:33", "remaining_time": "0:49:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23900, "total_steps": 25254, "loss": 0.0819, "learning_rate": 3.75980353489791e-07, "epoch": 2.839154193395106, "percentage": 94.64, "elapsed_time": "14:30:56", "remaining_time": "0:49:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23910, "total_steps": 25254, "loss": 0.0816, "learning_rate": 3.704609439066975e-07, "epoch": 2.840342124019957, "percentage": 94.68, "elapsed_time": "14:31:17", "remaining_time": "0:48:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23920, "total_steps": 25254, "loss": 0.0789, "learning_rate": 3.6498204463888406e-07, "epoch": 2.841530054644809, "percentage": 94.72, "elapsed_time": "14:31:39", "remaining_time": "0:48:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23930, "total_steps": 25254, "loss": 0.082, "learning_rate": 3.5954366469797e-07, "epoch": 2.84271798526966, "percentage": 94.76, "elapsed_time": "14:32:01", "remaining_time": "0:48:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23940, "total_steps": 25254, "loss": 0.0807, "learning_rate": 3.541458130289277e-07, "epoch": 2.8439059158945117, "percentage": 94.8, "elapsed_time": "14:32:24", "remaining_time": "0:47:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23950, "total_steps": 25254, "loss": 0.082, "learning_rate": 3.4878849851005814e-07, "epoch": 2.8450938465193634, "percentage": 94.84, "elapsed_time": "14:32:46", "remaining_time": "0:47:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23960, "total_steps": 25254, "loss": 0.0822, "learning_rate": 3.434717299530016e-07, "epoch": 2.846281777144215, "percentage": 94.88, "elapsed_time": "14:33:07", "remaining_time": "0:47:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23970, "total_steps": 25254, "loss": 0.0802, "learning_rate": 3.381955161027017e-07, "epoch": 2.8474697077690663, "percentage": 94.92, "elapsed_time": "14:33:29", "remaining_time": "0:46:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23980, "total_steps": 25254, "loss": 0.0816, "learning_rate": 3.329598656374028e-07, "epoch": 2.848657638393918, "percentage": 94.96, "elapsed_time": "14:33:51", "remaining_time": "0:46:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 23990, "total_steps": 25254, "loss": 0.0812, "learning_rate": 3.277647871686246e-07, "epoch": 2.849845569018769, "percentage": 94.99, "elapsed_time": "14:34:13", "remaining_time": "0:46:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24000, "total_steps": 25254, "loss": 0.0825, "learning_rate": 3.2261028924115975e-07, "epoch": 2.851033499643621, "percentage": 95.03, "elapsed_time": "14:34:36", "remaining_time": "0:45:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24010, "total_steps": 25254, "loss": 0.084, "learning_rate": 3.174963803330544e-07, "epoch": 2.8522214302684725, "percentage": 95.07, "elapsed_time": "14:34:57", "remaining_time": "0:45:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24020, "total_steps": 25254, "loss": 0.084, "learning_rate": 3.1242306885558846e-07, "epoch": 2.8534093608933238, "percentage": 95.11, "elapsed_time": "14:35:19", "remaining_time": "0:44:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24030, "total_steps": 25254, "loss": 0.0826, "learning_rate": 3.0739036315327876e-07, "epoch": 2.8545972915181754, "percentage": 95.15, "elapsed_time": "14:35:41", "remaining_time": "0:44:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24040, "total_steps": 25254, "loss": 0.0838, "learning_rate": 3.0239827150384536e-07, "epoch": 2.8557852221430267, "percentage": 95.19, "elapsed_time": "14:36:03", "remaining_time": "0:44:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24050, "total_steps": 25254, "loss": 0.0791, "learning_rate": 2.9744680211820916e-07, "epoch": 2.8569731527678783, "percentage": 95.23, "elapsed_time": "14:36:25", "remaining_time": "0:43:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24060, "total_steps": 25254, "loss": 0.0843, "learning_rate": 2.925359631404723e-07, "epoch": 2.85816108339273, "percentage": 95.27, "elapsed_time": "14:36:47", "remaining_time": "0:43:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24070, "total_steps": 25254, "loss": 0.0841, "learning_rate": 2.8766576264792066e-07, "epoch": 2.8593490140175812, "percentage": 95.31, "elapsed_time": "14:37:08", "remaining_time": "0:43:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24080, "total_steps": 25254, "loss": 0.0823, "learning_rate": 2.8283620865098836e-07, "epoch": 2.860536944642433, "percentage": 95.35, "elapsed_time": "14:37:29", "remaining_time": "0:42:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24090, "total_steps": 25254, "loss": 0.0818, "learning_rate": 2.780473090932545e-07, "epoch": 2.861724875267284, "percentage": 95.39, "elapsed_time": "14:37:52", "remaining_time": "0:42:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24100, "total_steps": 25254, "loss": 0.0803, "learning_rate": 2.73299071851435e-07, "epoch": 2.862912805892136, "percentage": 95.43, "elapsed_time": "14:38:14", "remaining_time": "0:42:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24110, "total_steps": 25254, "loss": 0.0823, "learning_rate": 2.6859150473536044e-07, "epoch": 2.8641007365169875, "percentage": 95.47, "elapsed_time": "14:38:36", "remaining_time": "0:41:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24120, "total_steps": 25254, "loss": 0.0789, "learning_rate": 2.639246154879732e-07, "epoch": 2.865288667141839, "percentage": 95.51, "elapsed_time": "14:38:58", "remaining_time": "0:41:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24130, "total_steps": 25254, "loss": 0.0794, "learning_rate": 2.592984117853053e-07, "epoch": 2.8664765977666904, "percentage": 95.55, "elapsed_time": "14:39:20", "remaining_time": "0:40:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24140, "total_steps": 25254, "loss": 0.0806, "learning_rate": 2.547129012364702e-07, "epoch": 2.867664528391542, "percentage": 95.59, "elapsed_time": "14:39:42", "remaining_time": "0:40:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24150, "total_steps": 25254, "loss": 0.0785, "learning_rate": 2.501680913836485e-07, "epoch": 2.8688524590163933, "percentage": 95.63, "elapsed_time": "14:40:03", "remaining_time": "0:40:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24160, "total_steps": 25254, "loss": 0.0807, "learning_rate": 2.456639897020829e-07, "epoch": 2.870040389641245, "percentage": 95.67, "elapsed_time": "14:40:27", "remaining_time": "0:39:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24170, "total_steps": 25254, "loss": 0.0797, "learning_rate": 2.4120060360005305e-07, "epoch": 2.8712283202660966, "percentage": 95.71, "elapsed_time": "14:40:48", "remaining_time": "0:39:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24180, "total_steps": 25254, "loss": 0.0803, "learning_rate": 2.3677794041887523e-07, "epoch": 2.872416250890948, "percentage": 95.75, "elapsed_time": "14:41:10", "remaining_time": "0:39:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24190, "total_steps": 25254, "loss": 0.0834, "learning_rate": 2.3239600743287792e-07, "epoch": 2.8736041815157995, "percentage": 95.79, "elapsed_time": "14:41:31", "remaining_time": "0:38:46", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24200, "total_steps": 25254, "loss": 0.0828, "learning_rate": 2.280548118494069e-07, "epoch": 2.874792112140651, "percentage": 95.83, "elapsed_time": "14:41:53", "remaining_time": "0:38:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24210, "total_steps": 25254, "loss": 0.0842, "learning_rate": 2.2375436080879774e-07, "epoch": 2.8759800427655025, "percentage": 95.87, "elapsed_time": "14:42:14", "remaining_time": "0:38:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24220, "total_steps": 25254, "loss": 0.0824, "learning_rate": 2.1949466138437292e-07, "epoch": 2.877167973390354, "percentage": 95.91, "elapsed_time": "14:42:36", "remaining_time": "0:37:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24230, "total_steps": 25254, "loss": 0.0806, "learning_rate": 2.1527572058241963e-07, "epoch": 2.8783559040152054, "percentage": 95.95, "elapsed_time": "14:42:58", "remaining_time": "0:37:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24240, "total_steps": 25254, "loss": 0.0812, "learning_rate": 2.1109754534219815e-07, "epoch": 2.879543834640057, "percentage": 95.98, "elapsed_time": "14:43:20", "remaining_time": "0:36:57", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24250, "total_steps": 25254, "loss": 0.0832, "learning_rate": 2.0696014253590857e-07, "epoch": 2.8807317652649083, "percentage": 96.02, "elapsed_time": "14:43:41", "remaining_time": "0:36:35", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24260, "total_steps": 25254, "loss": 0.081, "learning_rate": 2.028635189686906e-07, "epoch": 2.88191969588976, "percentage": 96.06, "elapsed_time": "14:44:03", "remaining_time": "0:36:13", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24270, "total_steps": 25254, "loss": 0.0821, "learning_rate": 1.988076813786155e-07, "epoch": 2.8831076265146116, "percentage": 96.1, "elapsed_time": "14:44:25", "remaining_time": "0:35:51", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24280, "total_steps": 25254, "loss": 0.0843, "learning_rate": 1.9479263643666644e-07, "epoch": 2.8842955571394633, "percentage": 96.14, "elapsed_time": "14:44:47", "remaining_time": "0:35:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24290, "total_steps": 25254, "loss": 0.0836, "learning_rate": 1.908183907467276e-07, "epoch": 2.8854834877643145, "percentage": 96.18, "elapsed_time": "14:45:09", "remaining_time": "0:35:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24300, "total_steps": 25254, "loss": 0.0818, "learning_rate": 1.8688495084558944e-07, "epoch": 2.886671418389166, "percentage": 96.22, "elapsed_time": "14:45:31", "remaining_time": "0:34:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24310, "total_steps": 25254, "loss": 0.0826, "learning_rate": 1.8299232320291292e-07, "epoch": 2.8878593490140174, "percentage": 96.26, "elapsed_time": "14:45:53", "remaining_time": "0:34:24", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24320, "total_steps": 25254, "loss": 0.0833, "learning_rate": 1.7914051422124044e-07, "epoch": 2.889047279638869, "percentage": 96.3, "elapsed_time": "14:46:15", "remaining_time": "0:34:02", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24330, "total_steps": 25254, "loss": 0.0828, "learning_rate": 1.753295302359681e-07, "epoch": 2.8902352102637208, "percentage": 96.34, "elapsed_time": "14:46:37", "remaining_time": "0:33:40", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24340, "total_steps": 25254, "loss": 0.0826, "learning_rate": 1.7155937751534845e-07, "epoch": 2.891423140888572, "percentage": 96.38, "elapsed_time": "14:46:59", "remaining_time": "0:33:18", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24350, "total_steps": 25254, "loss": 0.0797, "learning_rate": 1.6783006226047671e-07, "epoch": 2.8926110715134237, "percentage": 96.42, "elapsed_time": "14:47:21", "remaining_time": "0:32:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24360, "total_steps": 25254, "loss": 0.0835, "learning_rate": 1.6414159060527956e-07, "epoch": 2.893799002138275, "percentage": 96.46, "elapsed_time": "14:47:42", "remaining_time": "0:32:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24370, "total_steps": 25254, "loss": 0.0811, "learning_rate": 1.6049396861650133e-07, "epoch": 2.8949869327631266, "percentage": 96.5, "elapsed_time": "14:48:04", "remaining_time": "0:32:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24380, "total_steps": 25254, "loss": 0.0817, "learning_rate": 1.568872022936957e-07, "epoch": 2.8961748633879782, "percentage": 96.54, "elapsed_time": "14:48:26", "remaining_time": "0:31:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24390, "total_steps": 25254, "loss": 0.0839, "learning_rate": 1.5332129756922276e-07, "epoch": 2.89736279401283, "percentage": 96.58, "elapsed_time": "14:48:47", "remaining_time": "0:31:29", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24400, "total_steps": 25254, "loss": 0.0811, "learning_rate": 1.4979626030823258e-07, "epoch": 2.898550724637681, "percentage": 96.62, "elapsed_time": "14:49:09", "remaining_time": "0:31:07", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24410, "total_steps": 25254, "loss": 0.0819, "learning_rate": 1.463120963086567e-07, "epoch": 2.899738655262533, "percentage": 96.66, "elapsed_time": "14:49:32", "remaining_time": "0:30:45", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24420, "total_steps": 25254, "loss": 0.0831, "learning_rate": 1.4286881130119722e-07, "epoch": 2.900926585887384, "percentage": 96.7, "elapsed_time": "14:49:53", "remaining_time": "0:30:23", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24430, "total_steps": 25254, "loss": 0.0806, "learning_rate": 1.3946641094931823e-07, "epoch": 2.9021145165122357, "percentage": 96.74, "elapsed_time": "14:50:15", "remaining_time": "0:30:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24440, "total_steps": 25254, "loss": 0.0836, "learning_rate": 1.3610490084924322e-07, "epoch": 2.9033024471370874, "percentage": 96.78, "elapsed_time": "14:50:37", "remaining_time": "0:29:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24450, "total_steps": 25254, "loss": 0.0786, "learning_rate": 1.327842865299356e-07, "epoch": 2.9044903777619386, "percentage": 96.82, "elapsed_time": "14:50:58", "remaining_time": "0:29:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24460, "total_steps": 25254, "loss": 0.0796, "learning_rate": 1.2950457345309307e-07, "epoch": 2.9056783083867903, "percentage": 96.86, "elapsed_time": "14:51:20", "remaining_time": "0:28:56", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24470, "total_steps": 25254, "loss": 0.0782, "learning_rate": 1.262657670131423e-07, "epoch": 2.9068662390116415, "percentage": 96.9, "elapsed_time": "14:51:42", "remaining_time": "0:28:34", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24480, "total_steps": 25254, "loss": 0.0811, "learning_rate": 1.2306787253722195e-07, "epoch": 2.908054169636493, "percentage": 96.94, "elapsed_time": "14:52:04", "remaining_time": "0:28:12", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24490, "total_steps": 25254, "loss": 0.0816, "learning_rate": 1.199108952851885e-07, "epoch": 2.909242100261345, "percentage": 96.97, "elapsed_time": "14:52:26", "remaining_time": "0:27:50", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24500, "total_steps": 25254, "loss": 0.0812, "learning_rate": 1.1679484044959111e-07, "epoch": 2.910430030886196, "percentage": 97.01, "elapsed_time": "14:52:49", "remaining_time": "0:27:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24510, "total_steps": 25254, "loss": 0.0837, "learning_rate": 1.1371971315567442e-07, "epoch": 2.911617961511048, "percentage": 97.05, "elapsed_time": "14:53:10", "remaining_time": "0:27:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24520, "total_steps": 25254, "loss": 0.0814, "learning_rate": 1.1068551846135922e-07, "epoch": 2.912805892135899, "percentage": 97.09, "elapsed_time": "14:53:31", "remaining_time": "0:26:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24530, "total_steps": 25254, "loss": 0.0827, "learning_rate": 1.0769226135725064e-07, "epoch": 2.9139938227607507, "percentage": 97.13, "elapsed_time": "14:53:53", "remaining_time": "0:26:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24540, "total_steps": 25254, "loss": 0.08, "learning_rate": 1.0473994676661326e-07, "epoch": 2.9151817533856024, "percentage": 97.17, "elapsed_time": "14:54:15", "remaining_time": "0:26:01", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24550, "total_steps": 25254, "loss": 0.0808, "learning_rate": 1.0182857954537106e-07, "epoch": 2.916369684010454, "percentage": 97.21, "elapsed_time": "14:54:37", "remaining_time": "0:25:39", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24560, "total_steps": 25254, "loss": 0.0804, "learning_rate": 9.895816448210194e-08, "epoch": 2.9175576146353053, "percentage": 97.25, "elapsed_time": "14:54:59", "remaining_time": "0:25:17", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24570, "total_steps": 25254, "loss": 0.079, "learning_rate": 9.612870629802373e-08, "epoch": 2.918745545260157, "percentage": 97.29, "elapsed_time": "14:55:21", "remaining_time": "0:24:55", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24580, "total_steps": 25254, "loss": 0.0796, "learning_rate": 9.334020964698598e-08, "epoch": 2.919933475885008, "percentage": 97.33, "elapsed_time": "14:55:43", "remaining_time": "0:24:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24590, "total_steps": 25254, "loss": 0.0805, "learning_rate": 9.059267911547265e-08, "epoch": 2.92112140650986, "percentage": 97.37, "elapsed_time": "14:56:05", "remaining_time": "0:24:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24600, "total_steps": 25254, "loss": 0.0831, "learning_rate": 8.788611922257717e-08, "epoch": 2.9223093371347115, "percentage": 97.41, "elapsed_time": "14:56:27", "remaining_time": "0:23:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24610, "total_steps": 25254, "loss": 0.0788, "learning_rate": 8.522053442001354e-08, "epoch": 2.9234972677595628, "percentage": 97.45, "elapsed_time": "14:56:49", "remaining_time": "0:23:28", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24620, "total_steps": 25254, "loss": 0.0829, "learning_rate": 8.259592909209968e-08, "epoch": 2.9246851983844144, "percentage": 97.49, "elapsed_time": "14:57:11", "remaining_time": "0:23:06", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24630, "total_steps": 25254, "loss": 0.0827, "learning_rate": 8.001230755574629e-08, "epoch": 2.9258731290092657, "percentage": 97.53, "elapsed_time": "14:57:32", "remaining_time": "0:22:44", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24640, "total_steps": 25254, "loss": 0.0819, "learning_rate": 7.746967406045969e-08, "epoch": 2.9270610596341173, "percentage": 97.57, "elapsed_time": "14:57:54", "remaining_time": "0:22:22", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24650, "total_steps": 25254, "loss": 0.0817, "learning_rate": 7.496803278832509e-08, "epoch": 2.928248990258969, "percentage": 97.61, "elapsed_time": "14:58:16", "remaining_time": "0:22:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24660, "total_steps": 25254, "loss": 0.0802, "learning_rate": 7.250738785400668e-08, "epoch": 2.9294369208838202, "percentage": 97.65, "elapsed_time": "14:58:37", "remaining_time": "0:21:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24670, "total_steps": 25254, "loss": 0.0823, "learning_rate": 7.008774330473922e-08, "epoch": 2.930624851508672, "percentage": 97.69, "elapsed_time": "14:58:59", "remaining_time": "0:21:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24680, "total_steps": 25254, "loss": 0.0807, "learning_rate": 6.770910312031975e-08, "epoch": 2.931812782133523, "percentage": 97.73, "elapsed_time": "14:59:20", "remaining_time": "0:20:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24690, "total_steps": 25254, "loss": 0.0806, "learning_rate": 6.537147121310205e-08, "epoch": 2.933000712758375, "percentage": 97.77, "elapsed_time": "14:59:42", "remaining_time": "0:20:33", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24700, "total_steps": 25254, "loss": 0.0814, "learning_rate": 6.307485142798831e-08, "epoch": 2.9341886433832265, "percentage": 97.81, "elapsed_time": "15:00:04", "remaining_time": "0:20:11", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24710, "total_steps": 25254, "loss": 0.0825, "learning_rate": 6.08192475424263e-08, "epoch": 2.935376574008078, "percentage": 97.85, "elapsed_time": "15:00:26", "remaining_time": "0:19:49", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24720, "total_steps": 25254, "loss": 0.0805, "learning_rate": 5.860466326640113e-08, "epoch": 2.9365645046329294, "percentage": 97.89, "elapsed_time": "15:00:48", "remaining_time": "0:19:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24730, "total_steps": 25254, "loss": 0.079, "learning_rate": 5.643110224243242e-08, "epoch": 2.937752435257781, "percentage": 97.93, "elapsed_time": "15:01:11", "remaining_time": "0:19:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24740, "total_steps": 25254, "loss": 0.083, "learning_rate": 5.4298568045557664e-08, "epoch": 2.9389403658826323, "percentage": 97.96, "elapsed_time": "15:01:33", "remaining_time": "0:18:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24750, "total_steps": 25254, "loss": 0.0822, "learning_rate": 5.220706418334331e-08, "epoch": 2.940128296507484, "percentage": 98.0, "elapsed_time": "15:01:55", "remaining_time": "0:18:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24760, "total_steps": 25254, "loss": 0.0849, "learning_rate": 5.0156594095862596e-08, "epoch": 2.9413162271323356, "percentage": 98.04, "elapsed_time": "15:02:17", "remaining_time": "0:18:00", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24770, "total_steps": 25254, "loss": 0.0814, "learning_rate": 4.8147161155698284e-08, "epoch": 2.942504157757187, "percentage": 98.08, "elapsed_time": "15:02:39", "remaining_time": "0:17:38", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24780, "total_steps": 25254, "loss": 0.082, "learning_rate": 4.6178768667939906e-08, "epoch": 2.9436920883820386, "percentage": 98.12, "elapsed_time": "15:03:00", "remaining_time": "0:17:16", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24790, "total_steps": 25254, "loss": 0.0797, "learning_rate": 4.42514198701699e-08, "epoch": 2.94488001900689, "percentage": 98.16, "elapsed_time": "15:03:22", "remaining_time": "0:16:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24800, "total_steps": 25254, "loss": 0.0813, "learning_rate": 4.236511793246356e-08, "epoch": 2.9460679496317415, "percentage": 98.2, "elapsed_time": "15:03:44", "remaining_time": "0:16:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24810, "total_steps": 25254, "loss": 0.0824, "learning_rate": 4.051986595738633e-08, "epoch": 2.947255880256593, "percentage": 98.24, "elapsed_time": "15:04:06", "remaining_time": "0:16:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24820, "total_steps": 25254, "loss": 0.083, "learning_rate": 3.8715666979977085e-08, "epoch": 2.9484438108814444, "percentage": 98.28, "elapsed_time": "15:04:29", "remaining_time": "0:15:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24830, "total_steps": 25254, "loss": 0.079, "learning_rate": 3.695252396776483e-08, "epoch": 2.949631741506296, "percentage": 98.32, "elapsed_time": "15:04:50", "remaining_time": "0:15:27", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24840, "total_steps": 25254, "loss": 0.083, "learning_rate": 3.52304398207326e-08, "epoch": 2.9508196721311473, "percentage": 98.36, "elapsed_time": "15:05:13", "remaining_time": "0:15:05", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24850, "total_steps": 25254, "loss": 0.0828, "learning_rate": 3.354941737134798e-08, "epoch": 2.952007602755999, "percentage": 98.4, "elapsed_time": "15:05:35", "remaining_time": "0:14:43", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24860, "total_steps": 25254, "loss": 0.0824, "learning_rate": 3.190945938452705e-08, "epoch": 2.9531955333808506, "percentage": 98.44, "elapsed_time": "15:05:57", "remaining_time": "0:14:21", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24870, "total_steps": 25254, "loss": 0.0815, "learning_rate": 3.031056855765102e-08, "epoch": 2.9543834640057023, "percentage": 98.48, "elapsed_time": "15:06:18", "remaining_time": "0:13:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24880, "total_steps": 25254, "loss": 0.0806, "learning_rate": 2.8752747520555124e-08, "epoch": 2.9555713946305535, "percentage": 98.52, "elapsed_time": "15:06:40", "remaining_time": "0:13:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24890, "total_steps": 25254, "loss": 0.0766, "learning_rate": 2.7235998835520303e-08, "epoch": 2.956759325255405, "percentage": 98.56, "elapsed_time": "15:07:02", "remaining_time": "0:13:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24900, "total_steps": 25254, "loss": 0.0795, "learning_rate": 2.5760324997270434e-08, "epoch": 2.9579472558802564, "percentage": 98.6, "elapsed_time": "15:07:23", "remaining_time": "0:12:54", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24910, "total_steps": 25254, "loss": 0.0822, "learning_rate": 2.4325728432975094e-08, "epoch": 2.959135186505108, "percentage": 98.64, "elapsed_time": "15:07:45", "remaining_time": "0:12:32", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24920, "total_steps": 25254, "loss": 0.0789, "learning_rate": 2.2932211502238453e-08, "epoch": 2.9603231171299598, "percentage": 98.68, "elapsed_time": "15:08:07", "remaining_time": "0:12:10", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24930, "total_steps": 25254, "loss": 0.0811, "learning_rate": 2.1579776497096525e-08, "epoch": 2.961511047754811, "percentage": 98.72, "elapsed_time": "15:08:30", "remaining_time": "0:11:48", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24940, "total_steps": 25254, "loss": 0.0807, "learning_rate": 2.0268425642017142e-08, "epoch": 2.9626989783796627, "percentage": 98.76, "elapsed_time": "15:08:52", "remaining_time": "0:11:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24950, "total_steps": 25254, "loss": 0.0817, "learning_rate": 1.899816109388608e-08, "epoch": 2.963886909004514, "percentage": 98.8, "elapsed_time": "15:09:14", "remaining_time": "0:11:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24960, "total_steps": 25254, "loss": 0.0809, "learning_rate": 1.7768984942023725e-08, "epoch": 2.9650748396293656, "percentage": 98.84, "elapsed_time": "15:09:36", "remaining_time": "0:10:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24970, "total_steps": 25254, "loss": 0.0846, "learning_rate": 1.6580899208157307e-08, "epoch": 2.9662627702542173, "percentage": 98.88, "elapsed_time": "15:09:58", "remaining_time": "0:10:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24980, "total_steps": 25254, "loss": 0.0804, "learning_rate": 1.5433905846432008e-08, "epoch": 2.967450700879069, "percentage": 98.92, "elapsed_time": "15:10:20", "remaining_time": "0:09:59", "throughput": "0.00", "total_tokens": 0} {"current_steps": 24990, "total_steps": 25254, "loss": 0.0814, "learning_rate": 1.432800674341095e-08, "epoch": 2.96863863150392, "percentage": 98.95, "elapsed_time": "15:10:42", "remaining_time": "0:09:37", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25000, "total_steps": 25254, "loss": 0.0815, "learning_rate": 1.3263203718055783e-08, "epoch": 2.969826562128772, "percentage": 98.99, "elapsed_time": "15:11:04", "remaining_time": "0:09:15", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25010, "total_steps": 25254, "loss": 0.0807, "learning_rate": 1.223949852174333e-08, "epoch": 2.971014492753623, "percentage": 99.03, "elapsed_time": "15:11:26", "remaining_time": "0:08:53", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25020, "total_steps": 25254, "loss": 0.0823, "learning_rate": 1.1256892838248934e-08, "epoch": 2.9722024233784747, "percentage": 99.07, "elapsed_time": "15:11:48", "remaining_time": "0:08:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25030, "total_steps": 25254, "loss": 0.0821, "learning_rate": 1.0315388283746452e-08, "epoch": 2.9733903540033264, "percentage": 99.11, "elapsed_time": "15:12:10", "remaining_time": "0:08:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25040, "total_steps": 25254, "loss": 0.0805, "learning_rate": 9.414986406808268e-09, "epoch": 2.9745782846281776, "percentage": 99.15, "elapsed_time": "15:12:32", "remaining_time": "0:07:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25050, "total_steps": 25254, "loss": 0.0811, "learning_rate": 8.555688688408059e-09, "epoch": 2.9757662152530293, "percentage": 99.19, "elapsed_time": "15:12:53", "remaining_time": "0:07:26", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25060, "total_steps": 25254, "loss": 0.0828, "learning_rate": 7.737496541901368e-09, "epoch": 2.9769541458778805, "percentage": 99.23, "elapsed_time": "15:13:15", "remaining_time": "0:07:04", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25070, "total_steps": 25254, "loss": 0.0824, "learning_rate": 6.960411313039484e-09, "epoch": 2.978142076502732, "percentage": 99.27, "elapsed_time": "15:13:37", "remaining_time": "0:06:42", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25080, "total_steps": 25254, "loss": 0.0808, "learning_rate": 6.224434279963887e-09, "epoch": 2.979330007127584, "percentage": 99.31, "elapsed_time": "15:13:59", "remaining_time": "0:06:20", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25090, "total_steps": 25254, "loss": 0.0834, "learning_rate": 5.529566653197926e-09, "epoch": 2.980517937752435, "percentage": 99.35, "elapsed_time": "15:14:20", "remaining_time": "0:05:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25100, "total_steps": 25254, "loss": 0.0801, "learning_rate": 4.875809575649593e-09, "epoch": 2.981705868377287, "percentage": 99.39, "elapsed_time": "15:14:42", "remaining_time": "0:05:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25110, "total_steps": 25254, "loss": 0.0793, "learning_rate": 4.263164122608743e-09, "epoch": 2.982893799002138, "percentage": 99.43, "elapsed_time": "15:15:04", "remaining_time": "0:05:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25120, "total_steps": 25254, "loss": 0.0786, "learning_rate": 3.691631301744325e-09, "epoch": 2.9840817296269897, "percentage": 99.47, "elapsed_time": "15:15:26", "remaining_time": "0:04:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25130, "total_steps": 25254, "loss": 0.0813, "learning_rate": 3.1612120531099298e-09, "epoch": 2.9852696602518414, "percentage": 99.51, "elapsed_time": "15:15:47", "remaining_time": "0:04:31", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25140, "total_steps": 25254, "loss": 0.0827, "learning_rate": 2.6719072491271368e-09, "epoch": 2.986457590876693, "percentage": 99.55, "elapsed_time": "15:16:10", "remaining_time": "0:04:09", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25150, "total_steps": 25254, "loss": 0.0832, "learning_rate": 2.2237176946021675e-09, "epoch": 2.9876455215015443, "percentage": 99.59, "elapsed_time": "15:16:31", "remaining_time": "0:03:47", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25160, "total_steps": 25254, "loss": 0.0835, "learning_rate": 1.8166441267064572e-09, "epoch": 2.988833452126396, "percentage": 99.63, "elapsed_time": "15:16:53", "remaining_time": "0:03:25", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25170, "total_steps": 25254, "loss": 0.0827, "learning_rate": 1.4506872149905315e-09, "epoch": 2.990021382751247, "percentage": 99.67, "elapsed_time": "15:17:15", "remaining_time": "0:03:03", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25180, "total_steps": 25254, "loss": 0.0808, "learning_rate": 1.1258475613729059e-09, "epoch": 2.991209313376099, "percentage": 99.71, "elapsed_time": "15:17:37", "remaining_time": "0:02:41", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25190, "total_steps": 25254, "loss": 0.0841, "learning_rate": 8.421257001511862e-10, "epoch": 2.9923972440009505, "percentage": 99.75, "elapsed_time": "15:17:59", "remaining_time": "0:02:19", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25200, "total_steps": 25254, "loss": 0.0841, "learning_rate": 5.995220979798655e-10, "epoch": 2.9935851746258018, "percentage": 99.79, "elapsed_time": "15:18:20", "remaining_time": "0:01:58", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25210, "total_steps": 25254, "loss": 0.0807, "learning_rate": 3.980371538953032e-10, "epoch": 2.9947731052506534, "percentage": 99.83, "elapsed_time": "15:18:42", "remaining_time": "0:01:36", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25220, "total_steps": 25254, "loss": 0.0797, "learning_rate": 2.37671199293521e-10, "epoch": 2.9959610358755047, "percentage": 99.87, "elapsed_time": "15:19:04", "remaining_time": "0:01:14", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25230, "total_steps": 25254, "loss": 0.0825, "learning_rate": 1.1842449794685627e-10, "epoch": 2.9971489665003563, "percentage": 99.9, "elapsed_time": "15:19:26", "remaining_time": "0:00:52", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25240, "total_steps": 25254, "loss": 0.0803, "learning_rate": 4.0297245984532995e-11, "epoch": 2.998336897125208, "percentage": 99.94, "elapsed_time": "15:19:48", "remaining_time": "0:00:30", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25250, "total_steps": 25254, "loss": 0.0855, "learning_rate": 3.289571912090672e-12, "epoch": 2.9995248277500592, "percentage": 99.98, "elapsed_time": "15:20:10", "remaining_time": "0:00:08", "throughput": "0.00", "total_tokens": 0} {"current_steps": 25254, "total_steps": 25254, "epoch": 3.0, "percentage": 100.0, "elapsed_time": "15:20:47", "remaining_time": "0:00:00", "throughput": "0.00", "total_tokens": 0}