{"current_steps": 5, "total_steps": 3400, "loss": 1.0954, "lr": 2.9411764705882355e-06, "epoch": 0.0025753283543651817, "percentage": 0.15, "elapsed_time": "0:02:44", "remaining_time": "1 day, 6:59:16", "throughput": 303.84, "total_tokens": 49920} {"current_steps": 10, "total_steps": 3400, "loss": 0.9793, "lr": 5.882352941176471e-06, "epoch": 0.0051506567087303634, "percentage": 0.29, "elapsed_time": "0:04:11", "remaining_time": "23:42:34", "throughput": 396.53, "total_tokens": 99840} {"current_steps": 15, "total_steps": 3400, "loss": 1.0964, "lr": 8.823529411764707e-06, "epoch": 0.007725985063095545, "percentage": 0.44, "elapsed_time": "0:05:38", "remaining_time": "21:11:48", "throughput": 442.89, "total_tokens": 149760} {"current_steps": 20, "total_steps": 3400, "loss": 0.7079, "lr": 1.1764705882352942e-05, "epoch": 0.010301313417460727, "percentage": 0.59, "elapsed_time": "0:07:04", "remaining_time": "19:56:13", "throughput": 470.17, "total_tokens": 199680} {"current_steps": 25, "total_steps": 3400, "loss": 0.4213, "lr": 1.4705882352941177e-05, "epoch": 0.012876641771825908, "percentage": 0.74, "elapsed_time": "0:08:30", "remaining_time": "19:08:45", "throughput": 488.88, "total_tokens": 249600} {"current_steps": 30, "total_steps": 3400, "loss": 0.3359, "lr": 1.7647058823529414e-05, "epoch": 0.01545197012619109, "percentage": 0.88, "elapsed_time": "0:09:58", "remaining_time": "18:39:49", "throughput": 500.76, "total_tokens": 299520} {"current_steps": 35, "total_steps": 3400, "loss": 0.3463, "lr": 2.058823529411765e-05, "epoch": 0.018027298480556272, "percentage": 1.03, "elapsed_time": "0:11:24", "remaining_time": "18:16:36", "throughput": 510.61, "total_tokens": 349440} {"current_steps": 40, "total_steps": 3400, "loss": 0.28, "lr": 2.3529411764705884e-05, "epoch": 0.020602626834921454, "percentage": 1.18, "elapsed_time": "0:12:51", "remaining_time": "18:00:30", "throughput": 517.44, "total_tokens": 399360} {"current_steps": 45, "total_steps": 3400, "loss": 0.3442, "lr": 2.647058823529412e-05, "epoch": 0.023177955189286635, "percentage": 1.32, "elapsed_time": "0:14:18", "remaining_time": "17:46:12", "throughput": 523.61, "total_tokens": 449280} {"current_steps": 50, "total_steps": 3400, "loss": 0.3441, "lr": 2.9411764705882354e-05, "epoch": 0.025753283543651816, "percentage": 1.47, "elapsed_time": "0:15:45", "remaining_time": "17:36:13", "throughput": 527.77, "total_tokens": 499200} {"current_steps": 50, "total_steps": 3400, "eval_loss": 0.33834776282310486, "epoch": 0.025753283543651816, "percentage": 1.47, "elapsed_time": "0:16:33", "remaining_time": "18:29:12", "throughput": 502.56, "total_tokens": 499200} {"current_steps": 55, "total_steps": 3400, "loss": 0.3182, "lr": 3.235294117647059e-05, "epoch": 0.028328611898016998, "percentage": 1.62, "elapsed_time": "0:18:08", "remaining_time": "18:22:58", "throughput": 504.64, "total_tokens": 549120} {"current_steps": 60, "total_steps": 3400, "loss": 0.3294, "lr": 3.529411764705883e-05, "epoch": 0.03090394025238218, "percentage": 1.76, "elapsed_time": "0:19:36", "remaining_time": "18:11:07", "throughput": 509.36, "total_tokens": 599040} {"current_steps": 65, "total_steps": 3400, "loss": 0.3097, "lr": 3.8235294117647055e-05, "epoch": 0.03347926860674736, "percentage": 1.91, "elapsed_time": "0:21:02", "remaining_time": "17:59:13", "throughput": 514.21, "total_tokens": 648960} {"current_steps": 70, "total_steps": 3400, "loss": 0.3008, "lr": 4.11764705882353e-05, "epoch": 0.036054596961112545, "percentage": 2.06, "elapsed_time": "0:22:28", "remaining_time": "17:49:24", "throughput": 518.15, "total_tokens": 698880} {"current_steps": 75, "total_steps": 3400, "loss": 0.3278, "lr": 4.411764705882353e-05, "epoch": 0.03862992531547772, "percentage": 2.21, "elapsed_time": "0:23:55", "remaining_time": "17:40:18", "throughput": 521.81, "total_tokens": 748800} {"current_steps": 80, "total_steps": 3400, "loss": 0.3074, "lr": 4.705882352941177e-05, "epoch": 0.04120525366984291, "percentage": 2.35, "elapsed_time": "0:25:22", "remaining_time": "17:32:47", "throughput": 524.74, "total_tokens": 798720} {"current_steps": 85, "total_steps": 3400, "loss": 0.3423, "lr": 5e-05, "epoch": 0.043780582024208085, "percentage": 2.5, "elapsed_time": "0:26:47", "remaining_time": "17:25:06", "throughput": 527.8, "total_tokens": 848640} {"current_steps": 90, "total_steps": 3400, "loss": 0.3008, "lr": 5.294117647058824e-05, "epoch": 0.04635591037857327, "percentage": 2.65, "elapsed_time": "0:28:13", "remaining_time": "17:17:59", "throughput": 530.62, "total_tokens": 898560} {"current_steps": 95, "total_steps": 3400, "loss": 0.2815, "lr": 5.588235294117647e-05, "epoch": 0.04893123873293845, "percentage": 2.79, "elapsed_time": "0:29:38", "remaining_time": "17:11:24", "throughput": 533.21, "total_tokens": 948480} {"current_steps": 100, "total_steps": 3400, "loss": 0.2274, "lr": 5.882352941176471e-05, "epoch": 0.05150656708730363, "percentage": 2.94, "elapsed_time": "0:31:05", "remaining_time": "17:06:03", "throughput": 535.17, "total_tokens": 998400} {"current_steps": 100, "total_steps": 3400, "eval_loss": 0.18663176894187927, "epoch": 0.05150656708730363, "percentage": 2.94, "elapsed_time": "0:31:24", "remaining_time": "17:16:28", "throughput": 529.8, "total_tokens": 998400} {"current_steps": 105, "total_steps": 3400, "loss": 0.168, "lr": 6.176470588235295e-05, "epoch": 0.05408189544166881, "percentage": 3.09, "elapsed_time": "0:32:56", "remaining_time": "17:13:45", "throughput": 530.38, "total_tokens": 1048320} {"current_steps": 110, "total_steps": 3400, "loss": 0.0709, "lr": 6.470588235294118e-05, "epoch": 0.056657223796033995, "percentage": 3.24, "elapsed_time": "0:34:22", "remaining_time": "17:08:05", "throughput": 532.5, "total_tokens": 1098240} {"current_steps": 115, "total_steps": 3400, "loss": 0.1609, "lr": 6.764705882352942e-05, "epoch": 0.05923255215039917, "percentage": 3.38, "elapsed_time": "0:35:49", "remaining_time": "17:03:19", "throughput": 534.16, "total_tokens": 1148160} {"current_steps": 120, "total_steps": 3400, "loss": 0.0354, "lr": 7.058823529411765e-05, "epoch": 0.06180788050476436, "percentage": 3.53, "elapsed_time": "0:37:15", "remaining_time": "16:58:19", "throughput": 535.97, "total_tokens": 1198080} {"current_steps": 125, "total_steps": 3400, "loss": 0.1133, "lr": 7.352941176470589e-05, "epoch": 0.06438320885912954, "percentage": 3.68, "elapsed_time": "0:38:42", "remaining_time": "16:54:05", "throughput": 537.39, "total_tokens": 1248000} {"current_steps": 130, "total_steps": 3400, "loss": 0.0867, "lr": 7.647058823529411e-05, "epoch": 0.06695853721349472, "percentage": 3.82, "elapsed_time": "0:40:08", "remaining_time": "16:49:31", "throughput": 539.0, "total_tokens": 1297920} {"current_steps": 135, "total_steps": 3400, "loss": 0.1352, "lr": 7.941176470588235e-05, "epoch": 0.0695338655678599, "percentage": 3.97, "elapsed_time": "0:41:35", "remaining_time": "16:45:43", "throughput": 540.2, "total_tokens": 1347840} {"current_steps": 140, "total_steps": 3400, "loss": 0.101, "lr": 8.23529411764706e-05, "epoch": 0.07210919392222509, "percentage": 4.12, "elapsed_time": "0:43:00", "remaining_time": "16:41:36", "throughput": 541.59, "total_tokens": 1397760} {"current_steps": 145, "total_steps": 3400, "loss": 0.0334, "lr": 8.529411764705883e-05, "epoch": 0.07468452227659027, "percentage": 4.26, "elapsed_time": "0:44:28", "remaining_time": "16:38:14", "throughput": 542.59, "total_tokens": 1447680} {"current_steps": 150, "total_steps": 3400, "loss": 0.0667, "lr": 8.823529411764706e-05, "epoch": 0.07725985063095545, "percentage": 4.41, "elapsed_time": "0:45:53", "remaining_time": "16:34:25", "throughput": 543.83, "total_tokens": 1497600} {"current_steps": 150, "total_steps": 3400, "eval_loss": 0.09665286540985107, "epoch": 0.07725985063095545, "percentage": 4.41, "elapsed_time": "0:46:13", "remaining_time": "16:41:23", "throughput": 540.05, "total_tokens": 1497600} {"current_steps": 155, "total_steps": 3400, "loss": 0.06, "lr": 9.11764705882353e-05, "epoch": 0.07983517898532062, "percentage": 4.56, "elapsed_time": "0:47:46", "remaining_time": "16:40:10", "throughput": 539.88, "total_tokens": 1547520} {"current_steps": 160, "total_steps": 3400, "loss": 0.0265, "lr": 9.411764705882353e-05, "epoch": 0.08241050733968582, "percentage": 4.71, "elapsed_time": "0:49:12", "remaining_time": "16:36:21", "throughput": 541.11, "total_tokens": 1597440} {"current_steps": 165, "total_steps": 3400, "loss": 0.1743, "lr": 9.705882352941177e-05, "epoch": 0.08498583569405099, "percentage": 4.85, "elapsed_time": "0:50:39", "remaining_time": "16:33:07", "throughput": 542.03, "total_tokens": 1647360} {"current_steps": 170, "total_steps": 3400, "loss": 0.051, "lr": 0.0001, "epoch": 0.08756116404841617, "percentage": 5.0, "elapsed_time": "0:52:04", "remaining_time": "16:29:34", "throughput": 543.14, "total_tokens": 1697280} {"current_steps": 175, "total_steps": 3400, "loss": 0.0584, "lr": 9.999940874631277e-05, "epoch": 0.09013649240278135, "percentage": 5.15, "elapsed_time": "0:53:31", "remaining_time": "16:26:31", "throughput": 543.97, "total_tokens": 1747200} {"current_steps": 180, "total_steps": 3400, "loss": 0.0704, "lr": 9.999763499923432e-05, "epoch": 0.09271182075714654, "percentage": 5.29, "elapsed_time": "0:54:57", "remaining_time": "16:23:09", "throughput": 544.99, "total_tokens": 1797120} {"current_steps": 185, "total_steps": 3400, "loss": 0.0278, "lr": 9.999467880071402e-05, "epoch": 0.09528714911151172, "percentage": 5.44, "elapsed_time": "0:56:23", "remaining_time": "16:20:03", "throughput": 545.86, "total_tokens": 1847040} {"current_steps": 190, "total_steps": 3400, "loss": 0.0862, "lr": 9.999054022066641e-05, "epoch": 0.0978624774658769, "percentage": 5.59, "elapsed_time": "0:57:49", "remaining_time": "16:16:57", "throughput": 546.74, "total_tokens": 1896960} {"current_steps": 195, "total_steps": 3400, "loss": 0.0565, "lr": 9.998521935696953e-05, "epoch": 0.10043780582024209, "percentage": 5.74, "elapsed_time": "0:59:16", "remaining_time": "16:14:07", "throughput": 547.48, "total_tokens": 1946880} {"current_steps": 200, "total_steps": 3400, "loss": 0.0459, "lr": 9.997871633546257e-05, "epoch": 0.10301313417460727, "percentage": 5.88, "elapsed_time": "1:00:42", "remaining_time": "16:11:15", "throughput": 548.24, "total_tokens": 1996800} {"current_steps": 200, "total_steps": 3400, "eval_loss": 0.09957947582006454, "epoch": 0.10301313417460727, "percentage": 5.88, "elapsed_time": "1:01:01", "remaining_time": "16:16:23", "throughput": 545.35, "total_tokens": 1996800} {"current_steps": 205, "total_steps": 3400, "loss": 0.0539, "lr": 9.997103130994296e-05, "epoch": 0.10558846252897244, "percentage": 6.03, "elapsed_time": "1:02:33", "remaining_time": "16:14:54", "throughput": 545.33, "total_tokens": 2046720} {"current_steps": 210, "total_steps": 3400, "loss": 0.0654, "lr": 9.996216446216267e-05, "epoch": 0.10816379088333762, "percentage": 6.18, "elapsed_time": "1:03:59", "remaining_time": "16:12:04", "throughput": 546.06, "total_tokens": 2096640} {"current_steps": 215, "total_steps": 3400, "loss": 0.0316, "lr": 9.995211600182397e-05, "epoch": 0.11073911923770281, "percentage": 6.32, "elapsed_time": "1:05:25", "remaining_time": "16:09:07", "throughput": 546.87, "total_tokens": 2146560} {"current_steps": 220, "total_steps": 3400, "loss": 0.1169, "lr": 9.994088616657444e-05, "epoch": 0.11331444759206799, "percentage": 6.47, "elapsed_time": "1:06:52", "remaining_time": "16:06:35", "throughput": 547.44, "total_tokens": 2196480} {"current_steps": 225, "total_steps": 3400, "loss": 0.0382, "lr": 9.992847522200133e-05, "epoch": 0.11588977594643317, "percentage": 6.62, "elapsed_time": "1:08:18", "remaining_time": "16:03:50", "throughput": 548.14, "total_tokens": 2246400} {"current_steps": 230, "total_steps": 3400, "loss": 0.0406, "lr": 9.99148834616253e-05, "epoch": 0.11846510430079835, "percentage": 6.76, "elapsed_time": "1:09:45", "remaining_time": "16:01:25", "throughput": 548.65, "total_tokens": 2296320} {"current_steps": 235, "total_steps": 3400, "loss": 0.0182, "lr": 9.990011120689351e-05, "epoch": 0.12104043265516354, "percentage": 6.91, "elapsed_time": "1:11:10", "remaining_time": "15:58:33", "throughput": 549.42, "total_tokens": 2346240} {"current_steps": 240, "total_steps": 3400, "loss": 0.0881, "lr": 9.988415880717194e-05, "epoch": 0.12361576100952872, "percentage": 7.06, "elapsed_time": "1:12:36", "remaining_time": "15:56:06", "throughput": 549.96, "total_tokens": 2396160} {"current_steps": 245, "total_steps": 3400, "loss": 0.0565, "lr": 9.986702663973722e-05, "epoch": 0.1261910893638939, "percentage": 7.21, "elapsed_time": "1:14:02", "remaining_time": "15:53:33", "throughput": 550.56, "total_tokens": 2446080} {"current_steps": 250, "total_steps": 3400, "loss": 0.0805, "lr": 9.98487151097676e-05, "epoch": 0.12876641771825909, "percentage": 7.35, "elapsed_time": "1:15:30", "remaining_time": "15:51:18", "throughput": 550.98, "total_tokens": 2496000} {"current_steps": 250, "total_steps": 3400, "eval_loss": 0.055875860154628754, "epoch": 0.12876641771825909, "percentage": 7.35, "elapsed_time": "1:15:49", "remaining_time": "15:55:24", "throughput": 548.62, "total_tokens": 2496000} {"current_steps": 255, "total_steps": 3400, "loss": 0.0235, "lr": 9.98292246503335e-05, "epoch": 0.13134174607262425, "percentage": 7.5, "elapsed_time": "1:17:21", "remaining_time": "15:54:02", "throughput": 548.54, "total_tokens": 2545920} {"current_steps": 260, "total_steps": 3400, "loss": 0.0137, "lr": 9.980855572238714e-05, "epoch": 0.13391707442698944, "percentage": 7.65, "elapsed_time": "1:18:48", "remaining_time": "15:51:46", "throughput": 548.97, "total_tokens": 2595840} {"current_steps": 265, "total_steps": 3400, "loss": 0.0605, "lr": 9.978670881475172e-05, "epoch": 0.13649240278135463, "percentage": 7.79, "elapsed_time": "1:20:15", "remaining_time": "15:49:23", "throughput": 549.47, "total_tokens": 2645760} {"current_steps": 270, "total_steps": 3400, "loss": 0.0585, "lr": 9.976368444410985e-05, "epoch": 0.1390677311357198, "percentage": 7.94, "elapsed_time": "1:21:42", "remaining_time": "15:47:09", "throughput": 549.89, "total_tokens": 2695680} {"current_steps": 275, "total_steps": 3400, "loss": 0.0096, "lr": 9.973948315499126e-05, "epoch": 0.141643059490085, "percentage": 8.09, "elapsed_time": "1:23:08", "remaining_time": "15:44:48", "throughput": 550.37, "total_tokens": 2745600} {"current_steps": 280, "total_steps": 3400, "loss": 0.1383, "lr": 9.971410551976002e-05, "epoch": 0.14421838784445018, "percentage": 8.24, "elapsed_time": "1:24:35", "remaining_time": "15:42:37", "throughput": 550.77, "total_tokens": 2795520} {"current_steps": 285, "total_steps": 3400, "loss": 0.049, "lr": 9.968755213860094e-05, "epoch": 0.14679371619881534, "percentage": 8.38, "elapsed_time": "1:26:02", "remaining_time": "15:40:23", "throughput": 551.19, "total_tokens": 2845440} {"current_steps": 290, "total_steps": 3400, "loss": 0.0336, "lr": 9.96598236395054e-05, "epoch": 0.14936904455318054, "percentage": 8.53, "elapsed_time": "1:27:29", "remaining_time": "15:38:15", "throughput": 551.56, "total_tokens": 2895360} {"current_steps": 295, "total_steps": 3400, "loss": 0.019, "lr": 9.96309206782565e-05, "epoch": 0.1519443729075457, "percentage": 8.68, "elapsed_time": "1:28:55", "remaining_time": "15:36:01", "throughput": 551.98, "total_tokens": 2945280} {"current_steps": 300, "total_steps": 3400, "loss": 0.0381, "lr": 9.960084393841355e-05, "epoch": 0.1545197012619109, "percentage": 8.82, "elapsed_time": "1:30:22", "remaining_time": "15:33:51", "throughput": 552.37, "total_tokens": 2995200} {"current_steps": 300, "total_steps": 3400, "eval_loss": 0.030908752232789993, "epoch": 0.1545197012619109, "percentage": 8.82, "elapsed_time": "1:30:42", "remaining_time": "15:37:17", "throughput": 550.35, "total_tokens": 2995200} {"current_steps": 305, "total_steps": 3400, "loss": 0.0245, "lr": 9.956959413129585e-05, "epoch": 0.15709502961627608, "percentage": 8.97, "elapsed_time": "1:32:14", "remaining_time": "15:36:04", "throughput": 550.18, "total_tokens": 3045120} {"current_steps": 310, "total_steps": 3400, "loss": 0.0121, "lr": 9.953717199596598e-05, "epoch": 0.15967035797064125, "percentage": 9.12, "elapsed_time": "1:33:40", "remaining_time": "15:33:47", "throughput": 550.63, "total_tokens": 3095040} {"current_steps": 315, "total_steps": 3400, "loss": 0.054, "lr": 9.95035782992122e-05, "epoch": 0.16224568632500644, "percentage": 9.26, "elapsed_time": "1:35:08", "remaining_time": "15:31:46", "throughput": 550.93, "total_tokens": 3144960} {"current_steps": 320, "total_steps": 3400, "loss": 0.0849, "lr": 9.94688138355304e-05, "epoch": 0.16482101467937163, "percentage": 9.41, "elapsed_time": "1:36:34", "remaining_time": "15:29:34", "throughput": 551.34, "total_tokens": 3194880} {"current_steps": 325, "total_steps": 3400, "loss": 0.0503, "lr": 9.943287942710527e-05, "epoch": 0.1673963430337368, "percentage": 9.56, "elapsed_time": "1:38:02", "remaining_time": "15:27:35", "throughput": 551.62, "total_tokens": 3244800} {"current_steps": 330, "total_steps": 3400, "loss": 0.0302, "lr": 9.939577592379088e-05, "epoch": 0.16997167138810199, "percentage": 9.71, "elapsed_time": "1:39:28", "remaining_time": "15:25:25", "throughput": 552.01, "total_tokens": 3294720} {"current_steps": 335, "total_steps": 3400, "loss": 0.082, "lr": 9.935750420309055e-05, "epoch": 0.17254699974246718, "percentage": 9.85, "elapsed_time": "1:40:56", "remaining_time": "15:23:29", "throughput": 552.27, "total_tokens": 3344640} {"current_steps": 340, "total_steps": 3400, "loss": 0.0411, "lr": 9.931806517013612e-05, "epoch": 0.17512232809683234, "percentage": 10.0, "elapsed_time": "1:42:22", "remaining_time": "15:21:21", "throughput": 552.64, "total_tokens": 3394560} {"current_steps": 345, "total_steps": 3400, "loss": 0.1158, "lr": 9.927745975766654e-05, "epoch": 0.17769765645119753, "percentage": 10.15, "elapsed_time": "1:43:49", "remaining_time": "15:19:24", "throughput": 552.91, "total_tokens": 3444480} {"current_steps": 350, "total_steps": 3400, "loss": 0.1761, "lr": 9.923568892600578e-05, "epoch": 0.1802729848055627, "percentage": 10.29, "elapsed_time": "1:45:15", "remaining_time": "15:17:17", "throughput": 553.28, "total_tokens": 3494400} {"current_steps": 350, "total_steps": 3400, "eval_loss": 0.043948542326688766, "epoch": 0.1802729848055627, "percentage": 10.29, "elapsed_time": "1:45:35", "remaining_time": "15:20:06", "throughput": 551.59, "total_tokens": 3494400} {"current_steps": 355, "total_steps": 3400, "loss": 0.0267, "lr": 9.91927536630402e-05, "epoch": 0.1828483131599279, "percentage": 10.44, "elapsed_time": "1:47:07", "remaining_time": "15:18:49", "throughput": 551.45, "total_tokens": 3544320} {"current_steps": 360, "total_steps": 3400, "loss": 0.0642, "lr": 9.91486549841951e-05, "epoch": 0.18542364151429308, "percentage": 10.59, "elapsed_time": "1:48:32", "remaining_time": "15:16:32", "throughput": 551.91, "total_tokens": 3594240} {"current_steps": 365, "total_steps": 3400, "loss": 0.0302, "lr": 9.91033939324107e-05, "epoch": 0.18799896986865824, "percentage": 10.74, "elapsed_time": "1:49:58", "remaining_time": "15:14:24", "throughput": 552.3, "total_tokens": 3644160} {"current_steps": 370, "total_steps": 3400, "loss": 0.0099, "lr": 9.905697157811761e-05, "epoch": 0.19057429822302344, "percentage": 10.88, "elapsed_time": "1:51:23", "remaining_time": "15:12:12", "throughput": 552.72, "total_tokens": 3694080} {"current_steps": 375, "total_steps": 3400, "loss": 0.0573, "lr": 9.900938901921131e-05, "epoch": 0.19314962657738863, "percentage": 11.03, "elapsed_time": "1:52:49", "remaining_time": "15:10:05", "throughput": 553.08, "total_tokens": 3744000} {"current_steps": 380, "total_steps": 3400, "loss": 0.0302, "lr": 9.896064738102635e-05, "epoch": 0.1957249549317538, "percentage": 11.18, "elapsed_time": "1:54:14", "remaining_time": "15:07:55", "throughput": 553.49, "total_tokens": 3793920} {"current_steps": 385, "total_steps": 3400, "loss": 0.0374, "lr": 9.891074781630966e-05, "epoch": 0.19830028328611898, "percentage": 11.32, "elapsed_time": "1:55:39", "remaining_time": "15:05:47", "throughput": 553.87, "total_tokens": 3843840} {"current_steps": 390, "total_steps": 3400, "loss": 0.0227, "lr": 9.885969150519331e-05, "epoch": 0.20087561164048418, "percentage": 11.47, "elapsed_time": "1:57:05", "remaining_time": "15:03:41", "throughput": 554.24, "total_tokens": 3893760} {"current_steps": 395, "total_steps": 3400, "loss": 0.0104, "lr": 9.88074796551666e-05, "epoch": 0.20345093999484934, "percentage": 11.62, "elapsed_time": "1:58:30", "remaining_time": "15:01:31", "throughput": 554.65, "total_tokens": 3943680} {"current_steps": 400, "total_steps": 3400, "loss": 0.0146, "lr": 9.875411350104744e-05, "epoch": 0.20602626834921453, "percentage": 11.76, "elapsed_time": "1:59:55", "remaining_time": "14:59:29", "throughput": 554.98, "total_tokens": 3993600} {"current_steps": 400, "total_steps": 3400, "eval_loss": 0.024433813989162445, "epoch": 0.20602626834921453, "percentage": 11.76, "elapsed_time": "2:00:14", "remaining_time": "15:01:50", "throughput": 553.54, "total_tokens": 3993600} {"current_steps": 405, "total_steps": 3400, "loss": 0.0074, "lr": 9.86995943049533e-05, "epoch": 0.2086015967035797, "percentage": 11.91, "elapsed_time": "2:01:44", "remaining_time": "15:00:19", "throughput": 553.54, "total_tokens": 4043520} {"current_steps": 410, "total_steps": 3400, "loss": 0.0375, "lr": 9.864392335627117e-05, "epoch": 0.2111769250579449, "percentage": 12.06, "elapsed_time": "2:03:10", "remaining_time": "14:58:16", "throughput": 553.88, "total_tokens": 4093440} {"current_steps": 415, "total_steps": 3400, "loss": 0.0217, "lr": 9.858710197162721e-05, "epoch": 0.21375225341231008, "percentage": 12.21, "elapsed_time": "2:04:35", "remaining_time": "14:56:06", "throughput": 554.29, "total_tokens": 4143360} {"current_steps": 420, "total_steps": 3400, "loss": 0.016, "lr": 9.852913149485556e-05, "epoch": 0.21632758176667524, "percentage": 12.35, "elapsed_time": "2:06:01", "remaining_time": "14:54:07", "throughput": 554.59, "total_tokens": 4193280} {"current_steps": 425, "total_steps": 3400, "loss": 0.0832, "lr": 9.847001329696653e-05, "epoch": 0.21890291012104043, "percentage": 12.5, "elapsed_time": "2:07:25", "remaining_time": "14:52:00", "throughput": 554.97, "total_tokens": 4243200} {"current_steps": 430, "total_steps": 3400, "loss": 0.0444, "lr": 9.840974877611422e-05, "epoch": 0.22147823847540563, "percentage": 12.65, "elapsed_time": "2:08:51", "remaining_time": "14:50:03", "throughput": 555.25, "total_tokens": 4293120} {"current_steps": 435, "total_steps": 3400, "loss": 0.0465, "lr": 9.834833935756344e-05, "epoch": 0.2240535668297708, "percentage": 12.79, "elapsed_time": "2:10:16", "remaining_time": "14:47:58", "throughput": 555.61, "total_tokens": 4343040} {"current_steps": 440, "total_steps": 3400, "loss": 0.0428, "lr": 9.828578649365601e-05, "epoch": 0.22662889518413598, "percentage": 12.94, "elapsed_time": "2:11:42", "remaining_time": "14:46:01", "throughput": 555.91, "total_tokens": 4392960} {"current_steps": 445, "total_steps": 3400, "loss": 0.02, "lr": 9.822209166377635e-05, "epoch": 0.22920422353850115, "percentage": 13.09, "elapsed_time": "2:13:07", "remaining_time": "14:44:00", "throughput": 556.23, "total_tokens": 4442880} {"current_steps": 450, "total_steps": 3400, "loss": 0.0157, "lr": 9.815725637431662e-05, "epoch": 0.23177955189286634, "percentage": 13.24, "elapsed_time": "2:14:33", "remaining_time": "14:42:03", "throughput": 556.51, "total_tokens": 4492800} {"current_steps": 450, "total_steps": 3400, "eval_loss": 0.006690301466733217, "epoch": 0.23177955189286634, "percentage": 13.24, "elapsed_time": "2:14:51", "remaining_time": "14:44:06", "throughput": 555.22, "total_tokens": 4492800} {"current_steps": 455, "total_steps": 3400, "loss": 0.0596, "lr": 9.809128215864097e-05, "epoch": 0.23435488024723153, "percentage": 13.38, "elapsed_time": "2:16:22", "remaining_time": "14:42:43", "throughput": 555.15, "total_tokens": 4542720} {"current_steps": 460, "total_steps": 3400, "loss": 0.0238, "lr": 9.802417057704931e-05, "epoch": 0.2369302086015967, "percentage": 13.53, "elapsed_time": "2:17:48", "remaining_time": "14:40:47", "throughput": 555.43, "total_tokens": 4592640} {"current_steps": 465, "total_steps": 3400, "loss": 0.0331, "lr": 9.795592321674045e-05, "epoch": 0.23950553695596188, "percentage": 13.68, "elapsed_time": "2:19:13", "remaining_time": "14:38:47", "throughput": 555.74, "total_tokens": 4642560} {"current_steps": 470, "total_steps": 3400, "loss": 0.0177, "lr": 9.788654169177453e-05, "epoch": 0.24208086531032708, "percentage": 13.82, "elapsed_time": "2:20:39", "remaining_time": "14:36:50", "throughput": 556.04, "total_tokens": 4692480} {"current_steps": 475, "total_steps": 3400, "loss": 0.028, "lr": 9.781602764303487e-05, "epoch": 0.24465619366469224, "percentage": 13.97, "elapsed_time": "2:22:04", "remaining_time": "14:34:51", "throughput": 556.34, "total_tokens": 4742400} {"current_steps": 480, "total_steps": 3400, "loss": 0.0561, "lr": 9.774438273818911e-05, "epoch": 0.24723152201905743, "percentage": 14.12, "elapsed_time": "2:23:28", "remaining_time": "14:32:51", "throughput": 556.67, "total_tokens": 4792320} {"current_steps": 485, "total_steps": 3400, "loss": 0.0242, "lr": 9.767160867164979e-05, "epoch": 0.24980685037342262, "percentage": 14.26, "elapsed_time": "2:24:54", "remaining_time": "14:30:57", "throughput": 556.92, "total_tokens": 4842240} {"current_steps": 490, "total_steps": 3400, "loss": 0.0286, "lr": 9.759770716453436e-05, "epoch": 0.2523821787277878, "percentage": 14.41, "elapsed_time": "2:26:19", "remaining_time": "14:28:59", "throughput": 557.22, "total_tokens": 4892160} {"current_steps": 495, "total_steps": 3400, "loss": 0.0394, "lr": 9.752267996462434e-05, "epoch": 0.254957507082153, "percentage": 14.56, "elapsed_time": "2:27:45", "remaining_time": "14:27:06", "throughput": 557.47, "total_tokens": 4942080} {"current_steps": 500, "total_steps": 3400, "loss": 0.0122, "lr": 9.744652884632406e-05, "epoch": 0.25753283543651817, "percentage": 14.71, "elapsed_time": "2:29:10", "remaining_time": "14:25:10", "throughput": 557.76, "total_tokens": 4992000} {"current_steps": 500, "total_steps": 3400, "eval_loss": 0.007972972467541695, "epoch": 0.25753283543651817, "percentage": 14.71, "elapsed_time": "2:29:28", "remaining_time": "14:26:59", "throughput": 556.59, "total_tokens": 4992000} {"current_steps": 505, "total_steps": 3400, "loss": 0.0184, "lr": 9.736925561061871e-05, "epoch": 0.26010816379088336, "percentage": 14.85, "elapsed_time": "2:31:00", "remaining_time": "14:25:42", "throughput": 556.46, "total_tokens": 5041920} {"current_steps": 510, "total_steps": 3400, "loss": 0.0046, "lr": 9.729086208503174e-05, "epoch": 0.2626834921452485, "percentage": 15.0, "elapsed_time": "2:32:25", "remaining_time": "14:23:44", "throughput": 556.76, "total_tokens": 5091840} {"current_steps": 515, "total_steps": 3400, "loss": 0.0226, "lr": 9.721135012358156e-05, "epoch": 0.2652588204996137, "percentage": 15.15, "elapsed_time": "2:33:51", "remaining_time": "14:21:54", "throughput": 556.98, "total_tokens": 5141760} {"current_steps": 520, "total_steps": 3400, "loss": 0.0475, "lr": 9.713072160673777e-05, "epoch": 0.2678341488539789, "percentage": 15.29, "elapsed_time": "2:35:15", "remaining_time": "14:19:56", "throughput": 557.29, "total_tokens": 5191680} {"current_steps": 525, "total_steps": 3400, "loss": 0.0572, "lr": 9.704897844137673e-05, "epoch": 0.2704094772083441, "percentage": 15.44, "elapsed_time": "2:36:41", "remaining_time": "14:18:06", "throughput": 557.51, "total_tokens": 5241600} {"current_steps": 530, "total_steps": 3400, "loss": 0.025, "lr": 9.696612256073633e-05, "epoch": 0.27298480556270927, "percentage": 15.59, "elapsed_time": "2:38:06", "remaining_time": "14:16:09", "throughput": 557.81, "total_tokens": 5291520} {"current_steps": 535, "total_steps": 3400, "loss": 0.0122, "lr": 9.688215592437039e-05, "epoch": 0.2755601339170744, "percentage": 15.74, "elapsed_time": "2:39:31", "remaining_time": "14:14:18", "throughput": 558.04, "total_tokens": 5341440} {"current_steps": 540, "total_steps": 3400, "loss": 0.0045, "lr": 9.679708051810221e-05, "epoch": 0.2781354622714396, "percentage": 15.88, "elapsed_time": "2:40:56", "remaining_time": "14:12:24", "throughput": 558.3, "total_tokens": 5391360} {"current_steps": 545, "total_steps": 3400, "loss": 0.0431, "lr": 9.67108983539777e-05, "epoch": 0.2807107906258048, "percentage": 16.03, "elapsed_time": "2:42:22", "remaining_time": "14:10:33", "throughput": 558.54, "total_tokens": 5441280} {"current_steps": 550, "total_steps": 3400, "loss": 0.0339, "lr": 9.662361147021779e-05, "epoch": 0.28328611898017, "percentage": 16.18, "elapsed_time": "2:43:46", "remaining_time": "14:08:40", "throughput": 558.8, "total_tokens": 5491200} {"current_steps": 550, "total_steps": 3400, "eval_loss": 0.0033526704646646976, "epoch": 0.28328611898017, "percentage": 16.18, "elapsed_time": "2:44:05", "remaining_time": "14:10:18", "throughput": 557.73, "total_tokens": 5491200} {"current_steps": 555, "total_steps": 3400, "loss": 0.0341, "lr": 9.653522193117013e-05, "epoch": 0.28586144733453517, "percentage": 16.32, "elapsed_time": "2:45:37", "remaining_time": "14:09:00", "throughput": 557.6, "total_tokens": 5541120} {"current_steps": 560, "total_steps": 3400, "loss": 0.0341, "lr": 9.644573182726035e-05, "epoch": 0.28843677568890036, "percentage": 16.47, "elapsed_time": "2:47:02", "remaining_time": "14:07:07", "throughput": 557.86, "total_tokens": 5591040} {"current_steps": 565, "total_steps": 3400, "loss": 0.0453, "lr": 9.63551432749426e-05, "epoch": 0.2910121040432655, "percentage": 16.62, "elapsed_time": "2:48:27", "remaining_time": "14:05:18", "throughput": 558.08, "total_tokens": 5640960} {"current_steps": 570, "total_steps": 3400, "loss": 0.0227, "lr": 9.626345841664953e-05, "epoch": 0.2935874323976307, "percentage": 16.76, "elapsed_time": "2:49:53", "remaining_time": "14:03:28", "throughput": 558.3, "total_tokens": 5690880} {"current_steps": 575, "total_steps": 3400, "loss": 0.0135, "lr": 9.617067942074153e-05, "epoch": 0.2961627607519959, "percentage": 16.91, "elapsed_time": "2:51:18", "remaining_time": "14:01:39", "throughput": 558.51, "total_tokens": 5740800} {"current_steps": 580, "total_steps": 3400, "loss": 0.0439, "lr": 9.607680848145558e-05, "epoch": 0.29873808910636107, "percentage": 17.06, "elapsed_time": "2:52:44", "remaining_time": "13:59:53", "throughput": 558.7, "total_tokens": 5790720} {"current_steps": 585, "total_steps": 3400, "loss": 0.0344, "lr": 9.598184781885318e-05, "epoch": 0.30131341746072626, "percentage": 17.21, "elapsed_time": "2:54:09", "remaining_time": "13:58:03", "throughput": 558.93, "total_tokens": 5840640} {"current_steps": 590, "total_steps": 3400, "loss": 0.0244, "lr": 9.588579967876806e-05, "epoch": 0.3038887458150914, "percentage": 17.35, "elapsed_time": "2:55:35", "remaining_time": "13:56:19", "throughput": 559.09, "total_tokens": 5890560} {"current_steps": 595, "total_steps": 3400, "loss": 0.022, "lr": 9.578866633275288e-05, "epoch": 0.3064640741694566, "percentage": 17.5, "elapsed_time": "2:57:00", "remaining_time": "13:54:29", "throughput": 559.32, "total_tokens": 5940480} {"current_steps": 600, "total_steps": 3400, "loss": 0.0217, "lr": 9.569045007802559e-05, "epoch": 0.3090394025238218, "percentage": 17.65, "elapsed_time": "2:58:27", "remaining_time": "13:52:46", "throughput": 559.48, "total_tokens": 5990400} {"current_steps": 600, "total_steps": 3400, "eval_loss": 0.013290103524923325, "epoch": 0.3090394025238218, "percentage": 17.65, "elapsed_time": "2:58:45", "remaining_time": "13:54:14", "throughput": 558.49, "total_tokens": 5990400} {"current_steps": 605, "total_steps": 3400, "loss": 0.0207, "lr": 9.55911532374151e-05, "epoch": 0.311614730878187, "percentage": 17.79, "elapsed_time": "3:00:16", "remaining_time": "13:52:50", "throughput": 558.44, "total_tokens": 6040320} {"current_steps": 610, "total_steps": 3400, "loss": 0.023, "lr": 9.549077815930636e-05, "epoch": 0.31419005923255217, "percentage": 17.94, "elapsed_time": "3:01:42", "remaining_time": "13:51:07", "throughput": 558.59, "total_tokens": 6090240} {"current_steps": 615, "total_steps": 3400, "loss": 0.017, "lr": 9.538932721758474e-05, "epoch": 0.31676538758691736, "percentage": 18.09, "elapsed_time": "3:03:08", "remaining_time": "13:49:20", "throughput": 558.78, "total_tokens": 6140160} {"current_steps": 620, "total_steps": 3400, "loss": 0.009, "lr": 9.528680281157999e-05, "epoch": 0.3193407159412825, "percentage": 18.24, "elapsed_time": "3:04:35", "remaining_time": "13:47:41", "throughput": 558.9, "total_tokens": 6190080} {"current_steps": 625, "total_steps": 3400, "loss": 0.0421, "lr": 9.518320736600943e-05, "epoch": 0.3219160442956477, "percentage": 18.38, "elapsed_time": "3:06:01", "remaining_time": "13:45:59", "throughput": 559.04, "total_tokens": 6240000} {"current_steps": 630, "total_steps": 3400, "loss": 0.0324, "lr": 9.507854333092063e-05, "epoch": 0.3244913726500129, "percentage": 18.53, "elapsed_time": "3:07:28", "remaining_time": "13:44:17", "throughput": 559.18, "total_tokens": 6289920} {"current_steps": 635, "total_steps": 3400, "loss": 0.0139, "lr": 9.497281318163346e-05, "epoch": 0.32706670100437807, "percentage": 18.68, "elapsed_time": "3:08:54", "remaining_time": "13:42:33", "throughput": 559.35, "total_tokens": 6339840} {"current_steps": 640, "total_steps": 3400, "loss": 0.0375, "lr": 9.486601941868154e-05, "epoch": 0.32964202935874326, "percentage": 18.82, "elapsed_time": "3:10:21", "remaining_time": "13:40:54", "throughput": 559.46, "total_tokens": 6389760} {"current_steps": 645, "total_steps": 3400, "loss": 0.0618, "lr": 9.475816456775313e-05, "epoch": 0.3322173577131084, "percentage": 18.97, "elapsed_time": "3:11:47", "remaining_time": "13:39:13", "throughput": 559.59, "total_tokens": 6439680} {"current_steps": 650, "total_steps": 3400, "loss": 0.0327, "lr": 9.464925117963133e-05, "epoch": 0.3347926860674736, "percentage": 19.12, "elapsed_time": "3:13:14", "remaining_time": "13:37:33", "throughput": 559.72, "total_tokens": 6489600} {"current_steps": 650, "total_steps": 3400, "eval_loss": 0.02095886506140232, "epoch": 0.3347926860674736, "percentage": 19.12, "elapsed_time": "3:13:33", "remaining_time": "13:38:54", "throughput": 558.79, "total_tokens": 6489600} {"current_steps": 655, "total_steps": 3400, "loss": 0.037, "lr": 9.453928183013385e-05, "epoch": 0.3373680144218388, "percentage": 19.26, "elapsed_time": "3:15:04", "remaining_time": "13:37:31", "throughput": 558.72, "total_tokens": 6539520} {"current_steps": 660, "total_steps": 3400, "loss": 0.034, "lr": 9.442825912005202e-05, "epoch": 0.33994334277620397, "percentage": 19.41, "elapsed_time": "3:16:30", "remaining_time": "13:35:50", "throughput": 558.86, "total_tokens": 6589440} {"current_steps": 665, "total_steps": 3400, "loss": 0.0584, "lr": 9.431618567508933e-05, "epoch": 0.34251867113056916, "percentage": 19.56, "elapsed_time": "3:17:56", "remaining_time": "13:34:06", "throughput": 559.03, "total_tokens": 6639360} {"current_steps": 670, "total_steps": 3400, "loss": 0.059, "lr": 9.420306414579925e-05, "epoch": 0.34509399948493436, "percentage": 19.71, "elapsed_time": "3:19:22", "remaining_time": "13:32:22", "throughput": 559.19, "total_tokens": 6689280} {"current_steps": 675, "total_steps": 3400, "loss": 0.023, "lr": 9.408889720752266e-05, "epoch": 0.3476693278392995, "percentage": 19.85, "elapsed_time": "3:20:48", "remaining_time": "13:30:39", "throughput": 559.34, "total_tokens": 6739200} {"current_steps": 680, "total_steps": 3400, "loss": 0.0327, "lr": 9.397368756032445e-05, "epoch": 0.3502446561936647, "percentage": 20.0, "elapsed_time": "3:22:13", "remaining_time": "13:28:55", "throughput": 559.52, "total_tokens": 6789120} {"current_steps": 685, "total_steps": 3400, "loss": 0.0241, "lr": 9.385743792892982e-05, "epoch": 0.3528199845480299, "percentage": 20.15, "elapsed_time": "3:23:40", "remaining_time": "13:27:16", "throughput": 559.63, "total_tokens": 6839040} {"current_steps": 690, "total_steps": 3400, "loss": 0.0227, "lr": 9.374015106265968e-05, "epoch": 0.35539531290239507, "percentage": 20.29, "elapsed_time": "3:25:05", "remaining_time": "13:25:32", "throughput": 559.81, "total_tokens": 6888960} {"current_steps": 695, "total_steps": 3400, "loss": 0.0171, "lr": 9.362182973536569e-05, "epoch": 0.35797064125676026, "percentage": 20.44, "elapsed_time": "3:26:32", "remaining_time": "13:23:51", "throughput": 559.94, "total_tokens": 6938880} {"current_steps": 700, "total_steps": 3400, "loss": 0.0267, "lr": 9.35024767453647e-05, "epoch": 0.3605459696111254, "percentage": 20.59, "elapsed_time": "3:27:56", "remaining_time": "13:22:04", "throughput": 560.15, "total_tokens": 6988800} {"current_steps": 700, "total_steps": 3400, "eval_loss": 0.005286735948175192, "epoch": 0.3605459696111254, "percentage": 20.59, "elapsed_time": "3:28:16", "remaining_time": "13:23:18", "throughput": 559.28, "total_tokens": 6988800} {"current_steps": 705, "total_steps": 3400, "loss": 0.0335, "lr": 9.338209491537257e-05, "epoch": 0.3631212979654906, "percentage": 20.74, "elapsed_time": "3:29:47", "remaining_time": "13:21:58", "throughput": 559.17, "total_tokens": 7038720} {"current_steps": 710, "total_steps": 3400, "loss": 0.0108, "lr": 9.326068709243727e-05, "epoch": 0.3656966263198558, "percentage": 20.88, "elapsed_time": "3:31:13", "remaining_time": "13:20:14", "throughput": 559.35, "total_tokens": 7088640} {"current_steps": 715, "total_steps": 3400, "loss": 0.0296, "lr": 9.313825614787177e-05, "epoch": 0.36827195467422097, "percentage": 21.03, "elapsed_time": "3:32:39", "remaining_time": "13:18:34", "throughput": 559.48, "total_tokens": 7138560} {"current_steps": 720, "total_steps": 3400, "loss": 0.042, "lr": 9.301480497718593e-05, "epoch": 0.37084728302858616, "percentage": 21.18, "elapsed_time": "3:34:04", "remaining_time": "13:16:51", "throughput": 559.64, "total_tokens": 7188480} {"current_steps": 725, "total_steps": 3400, "loss": 0.0083, "lr": 9.289033650001817e-05, "epoch": 0.37342261138295135, "percentage": 21.32, "elapsed_time": "3:35:31", "remaining_time": "13:15:11", "throughput": 559.76, "total_tokens": 7238400} {"current_steps": 730, "total_steps": 3400, "loss": 0.0109, "lr": 9.276485366006634e-05, "epoch": 0.3759979397373165, "percentage": 21.47, "elapsed_time": "3:36:56", "remaining_time": "13:13:29", "throughput": 559.92, "total_tokens": 7288320} {"current_steps": 735, "total_steps": 3400, "loss": 0.0122, "lr": 9.263835942501807e-05, "epoch": 0.3785732680916817, "percentage": 21.62, "elapsed_time": "3:38:23", "remaining_time": "13:11:49", "throughput": 560.04, "total_tokens": 7338240} {"current_steps": 740, "total_steps": 3400, "loss": 0.017, "lr": 9.251085678648072e-05, "epoch": 0.3811485964460469, "percentage": 21.76, "elapsed_time": "3:39:49", "remaining_time": "13:10:10", "throughput": 560.16, "total_tokens": 7388160} {"current_steps": 745, "total_steps": 3400, "loss": 0.0236, "lr": 9.238234875991046e-05, "epoch": 0.38372392480041206, "percentage": 21.91, "elapsed_time": "3:41:16", "remaining_time": "13:08:33", "throughput": 560.25, "total_tokens": 7438080} {"current_steps": 750, "total_steps": 3400, "loss": 0.014, "lr": 9.225283838454111e-05, "epoch": 0.38629925315477726, "percentage": 22.06, "elapsed_time": "3:42:42", "remaining_time": "13:06:53", "throughput": 560.39, "total_tokens": 7488000} {"current_steps": 750, "total_steps": 3400, "eval_loss": 0.005334165878593922, "epoch": 0.38629925315477726, "percentage": 22.06, "elapsed_time": "3:43:01", "remaining_time": "13:08:01", "throughput": 559.58, "total_tokens": 7488000} {"current_steps": 755, "total_steps": 3400, "loss": 0.0426, "lr": 9.21223287233121e-05, "epoch": 0.3888745815091424, "percentage": 22.21, "elapsed_time": "3:44:33", "remaining_time": "13:06:41", "throughput": 559.46, "total_tokens": 7537920} {"current_steps": 760, "total_steps": 3400, "loss": 0.0094, "lr": 9.199082286279622e-05, "epoch": 0.3914499098635076, "percentage": 22.35, "elapsed_time": "3:45:59", "remaining_time": "13:05:02", "throughput": 559.58, "total_tokens": 7587840} {"current_steps": 765, "total_steps": 3400, "loss": 0.008, "lr": 9.185832391312644e-05, "epoch": 0.3940252382178728, "percentage": 22.5, "elapsed_time": "3:47:26", "remaining_time": "13:03:24", "throughput": 559.69, "total_tokens": 7637760} {"current_steps": 770, "total_steps": 3400, "loss": 0.0297, "lr": 9.172483500792244e-05, "epoch": 0.39660056657223797, "percentage": 22.65, "elapsed_time": "3:48:53", "remaining_time": "13:01:46", "throughput": 559.79, "total_tokens": 7687680} {"current_steps": 775, "total_steps": 3400, "loss": 0.0239, "lr": 9.159035930421658e-05, "epoch": 0.39917589492660316, "percentage": 22.79, "elapsed_time": "3:50:19", "remaining_time": "13:00:08", "throughput": 559.9, "total_tokens": 7737600} {"current_steps": 780, "total_steps": 3400, "loss": 0.0162, "lr": 9.145489998237902e-05, "epoch": 0.40175122328096835, "percentage": 22.94, "elapsed_time": "3:51:46", "remaining_time": "12:58:31", "throughput": 559.99, "total_tokens": 7787520} {"current_steps": 785, "total_steps": 3400, "loss": 0.0309, "lr": 9.131846024604274e-05, "epoch": 0.4043265516353335, "percentage": 23.09, "elapsed_time": "3:53:12", "remaining_time": "12:56:51", "throughput": 560.13, "total_tokens": 7837440} {"current_steps": 790, "total_steps": 3400, "loss": 0.0432, "lr": 9.11810433220276e-05, "epoch": 0.4069018799896987, "percentage": 23.24, "elapsed_time": "3:54:38", "remaining_time": "12:55:12", "throughput": 560.24, "total_tokens": 7887360} {"current_steps": 795, "total_steps": 3400, "loss": 0.0022, "lr": 9.104265246026415e-05, "epoch": 0.40947720834406387, "percentage": 23.38, "elapsed_time": "3:56:04", "remaining_time": "12:53:34", "throughput": 560.35, "total_tokens": 7937280} {"current_steps": 800, "total_steps": 3400, "loss": 0.0065, "lr": 9.090329093371666e-05, "epoch": 0.41205253669842906, "percentage": 23.53, "elapsed_time": "3:57:31", "remaining_time": "12:51:57", "throughput": 560.44, "total_tokens": 7987200} {"current_steps": 800, "total_steps": 3400, "eval_loss": 0.006797688081860542, "epoch": 0.41205253669842906, "percentage": 23.53, "elapsed_time": "3:57:50", "remaining_time": "12:53:00", "throughput": 559.68, "total_tokens": 7987200} {"current_steps": 805, "total_steps": 3400, "loss": 0.0025, "lr": 9.076296203830579e-05, "epoch": 0.41462786505279425, "percentage": 23.68, "elapsed_time": "3:59:22", "remaining_time": "12:51:39", "throughput": 559.58, "total_tokens": 8037120} {"current_steps": 810, "total_steps": 3400, "loss": 0.0338, "lr": 9.062166909283062e-05, "epoch": 0.4172031934071594, "percentage": 23.82, "elapsed_time": "4:00:49", "remaining_time": "12:50:02", "throughput": 559.68, "total_tokens": 8087040} {"current_steps": 815, "total_steps": 3400, "loss": 0.0505, "lr": 9.047941543889014e-05, "epoch": 0.4197785217615246, "percentage": 23.97, "elapsed_time": "4:02:15", "remaining_time": "12:48:23", "throughput": 559.8, "total_tokens": 8136960} {"current_steps": 820, "total_steps": 3400, "loss": 0.0335, "lr": 9.033620444080428e-05, "epoch": 0.4223538501158898, "percentage": 24.12, "elapsed_time": "4:03:41", "remaining_time": "12:46:44", "throughput": 559.91, "total_tokens": 8186880} {"current_steps": 825, "total_steps": 3400, "loss": 0.0196, "lr": 9.019203948553422e-05, "epoch": 0.42492917847025496, "percentage": 24.26, "elapsed_time": "4:05:07", "remaining_time": "12:45:05", "throughput": 560.04, "total_tokens": 8236800} {"current_steps": 830, "total_steps": 3400, "loss": 0.018, "lr": 9.004692398260244e-05, "epoch": 0.42750450682462016, "percentage": 24.41, "elapsed_time": "4:06:34", "remaining_time": "12:43:28", "throughput": 560.13, "total_tokens": 8286720} {"current_steps": 835, "total_steps": 3400, "loss": 0.012, "lr": 8.9900861364012e-05, "epoch": 0.43007983517898535, "percentage": 24.56, "elapsed_time": "4:08:00", "remaining_time": "12:41:49", "throughput": 560.26, "total_tokens": 8336640} {"current_steps": 840, "total_steps": 3400, "loss": 0.0062, "lr": 8.975385508416532e-05, "epoch": 0.4326551635333505, "percentage": 24.71, "elapsed_time": "4:09:26", "remaining_time": "12:40:12", "throughput": 560.35, "total_tokens": 8386560} {"current_steps": 845, "total_steps": 3400, "loss": 0.0232, "lr": 8.960590861978265e-05, "epoch": 0.4352304918877157, "percentage": 24.85, "elapsed_time": "4:10:52", "remaining_time": "12:38:33", "throughput": 560.48, "total_tokens": 8436480} {"current_steps": 850, "total_steps": 3400, "loss": 0.0306, "lr": 8.945702546981969e-05, "epoch": 0.43780582024208087, "percentage": 25.0, "elapsed_time": "4:12:18", "remaining_time": "12:36:54", "throughput": 560.6, "total_tokens": 8486400} {"current_steps": 850, "total_steps": 3400, "eval_loss": 0.007198736071586609, "epoch": 0.43780582024208087, "percentage": 25.0, "elapsed_time": "4:12:37", "remaining_time": "12:37:53", "throughput": 559.87, "total_tokens": 8486400} {"current_steps": 855, "total_steps": 3400, "loss": 0.0255, "lr": 8.930720915538487e-05, "epoch": 0.44038114859644606, "percentage": 25.15, "elapsed_time": "4:14:08", "remaining_time": "12:36:30", "throughput": 559.8, "total_tokens": 8536320} {"current_steps": 860, "total_steps": 3400, "loss": 0.0267, "lr": 8.915646321965614e-05, "epoch": 0.44295647695081125, "percentage": 25.29, "elapsed_time": "4:15:34", "remaining_time": "12:34:50", "throughput": 559.92, "total_tokens": 8586240} {"current_steps": 865, "total_steps": 3400, "loss": 0.0107, "lr": 8.900479122779712e-05, "epoch": 0.4455318053051764, "percentage": 25.44, "elapsed_time": "4:17:01", "remaining_time": "12:33:13", "throughput": 560.02, "total_tokens": 8636160} {"current_steps": 870, "total_steps": 3400, "loss": 0.0277, "lr": 8.885219676687277e-05, "epoch": 0.4481071336595416, "percentage": 25.59, "elapsed_time": "4:18:26", "remaining_time": "12:31:34", "throughput": 560.15, "total_tokens": 8686080} {"current_steps": 875, "total_steps": 3400, "loss": 0.0175, "lr": 8.869868344576459e-05, "epoch": 0.45068246201390677, "percentage": 25.74, "elapsed_time": "4:19:52", "remaining_time": "12:29:56", "throughput": 560.25, "total_tokens": 8736000} {"current_steps": 880, "total_steps": 3400, "loss": 0.0065, "lr": 8.854425489508532e-05, "epoch": 0.45325779036827196, "percentage": 25.88, "elapsed_time": "4:21:18", "remaining_time": "12:28:18", "throughput": 560.37, "total_tokens": 8785920} {"current_steps": 885, "total_steps": 3400, "loss": 0.0476, "lr": 8.838891476709288e-05, "epoch": 0.45583311872263715, "percentage": 26.03, "elapsed_time": "4:22:44", "remaining_time": "12:26:40", "throughput": 560.48, "total_tokens": 8835840} {"current_steps": 890, "total_steps": 3400, "loss": 0.018, "lr": 8.823266673560426e-05, "epoch": 0.4584084470770023, "percentage": 26.18, "elapsed_time": "4:24:10", "remaining_time": "12:25:01", "throughput": 560.6, "total_tokens": 8885760} {"current_steps": 895, "total_steps": 3400, "loss": 0.0337, "lr": 8.807551449590846e-05, "epoch": 0.4609837754313675, "percentage": 26.32, "elapsed_time": "4:25:36", "remaining_time": "12:23:24", "throughput": 560.71, "total_tokens": 8935680} {"current_steps": 900, "total_steps": 3400, "loss": 0.0063, "lr": 8.791746176467907e-05, "epoch": 0.4635591037857327, "percentage": 26.47, "elapsed_time": "4:27:02", "remaining_time": "12:21:46", "throughput": 560.81, "total_tokens": 8985600} {"current_steps": 900, "total_steps": 3400, "eval_loss": 0.010749292559921741, "epoch": 0.4635591037857327, "percentage": 26.47, "elapsed_time": "4:27:21", "remaining_time": "12:22:40", "throughput": 560.14, "total_tokens": 8985600} {"current_steps": 905, "total_steps": 3400, "loss": 0.0318, "lr": 8.775851227988656e-05, "epoch": 0.46613443214009787, "percentage": 26.62, "elapsed_time": "4:28:53", "remaining_time": "12:21:17", "throughput": 560.05, "total_tokens": 9035520} {"current_steps": 910, "total_steps": 3400, "loss": 0.0635, "lr": 8.759866980070963e-05, "epoch": 0.46870976049446306, "percentage": 26.76, "elapsed_time": "4:30:19", "remaining_time": "12:19:40", "throughput": 560.16, "total_tokens": 9085440} {"current_steps": 915, "total_steps": 3400, "loss": 0.0035, "lr": 8.743793810744654e-05, "epoch": 0.47128508884882825, "percentage": 26.91, "elapsed_time": "4:31:45", "remaining_time": "12:18:03", "throughput": 560.26, "total_tokens": 9135360} {"current_steps": 920, "total_steps": 3400, "loss": 0.0047, "lr": 8.727632100142551e-05, "epoch": 0.4738604172031934, "percentage": 27.06, "elapsed_time": "4:33:11", "remaining_time": "12:16:25", "throughput": 560.37, "total_tokens": 9185280} {"current_steps": 925, "total_steps": 3400, "loss": 0.0194, "lr": 8.711382230491493e-05, "epoch": 0.4764357455575586, "percentage": 27.21, "elapsed_time": "4:34:37", "remaining_time": "12:14:48", "throughput": 560.47, "total_tokens": 9235200} {"current_steps": 930, "total_steps": 3400, "loss": 0.0234, "lr": 8.695044586103296e-05, "epoch": 0.47901107391192377, "percentage": 27.35, "elapsed_time": "4:36:03", "remaining_time": "12:13:11", "throughput": 560.58, "total_tokens": 9285120} {"current_steps": 935, "total_steps": 3400, "loss": 0.0253, "lr": 8.678619553365659e-05, "epoch": 0.48158640226628896, "percentage": 27.5, "elapsed_time": "4:37:29", "remaining_time": "12:11:34", "throughput": 560.67, "total_tokens": 9335040} {"current_steps": 940, "total_steps": 3400, "loss": 0.0191, "lr": 8.662107520733027e-05, "epoch": 0.48416173062065415, "percentage": 27.65, "elapsed_time": "4:38:55", "remaining_time": "12:09:56", "throughput": 560.79, "total_tokens": 9384960} {"current_steps": 945, "total_steps": 3400, "loss": 0.0469, "lr": 8.64550887871741e-05, "epoch": 0.4867370589750193, "percentage": 27.79, "elapsed_time": "4:40:21", "remaining_time": "12:08:19", "throughput": 560.9, "total_tokens": 9434880} {"current_steps": 950, "total_steps": 3400, "loss": 0.0415, "lr": 8.628824019879137e-05, "epoch": 0.4893123873293845, "percentage": 27.94, "elapsed_time": "4:41:47", "remaining_time": "12:06:43", "throughput": 560.99, "total_tokens": 9484800} {"current_steps": 950, "total_steps": 3400, "eval_loss": 0.007216573692858219, "epoch": 0.4893123873293845, "percentage": 27.94, "elapsed_time": "4:42:06", "remaining_time": "12:07:32", "throughput": 560.35, "total_tokens": 9484800} {"current_steps": 955, "total_steps": 3400, "loss": 0.0393, "lr": 8.612053338817581e-05, "epoch": 0.49188771568374967, "percentage": 28.09, "elapsed_time": "4:43:37", "remaining_time": "12:06:08", "throughput": 560.28, "total_tokens": 9534720} {"current_steps": 960, "total_steps": 3400, "loss": 0.0102, "lr": 8.595197232161824e-05, "epoch": 0.49446304403811486, "percentage": 28.24, "elapsed_time": "4:45:03", "remaining_time": "12:04:31", "throughput": 560.38, "total_tokens": 9584640} {"current_steps": 965, "total_steps": 3400, "loss": 0.0087, "lr": 8.578256098561275e-05, "epoch": 0.49703837239248005, "percentage": 28.38, "elapsed_time": "4:46:29", "remaining_time": "12:02:55", "throughput": 560.48, "total_tokens": 9634560} {"current_steps": 970, "total_steps": 3400, "loss": 0.0097, "lr": 8.561230338676239e-05, "epoch": 0.49961370074684525, "percentage": 28.53, "elapsed_time": "4:47:55", "remaining_time": "12:01:18", "throughput": 560.59, "total_tokens": 9684480} {"current_steps": 975, "total_steps": 3400, "loss": 0.0013, "lr": 8.544120355168451e-05, "epoch": 0.5021890291012104, "percentage": 28.68, "elapsed_time": "4:49:21", "remaining_time": "11:59:41", "throughput": 560.69, "total_tokens": 9734400} {"current_steps": 980, "total_steps": 3400, "loss": 0.0268, "lr": 8.526926552691544e-05, "epoch": 0.5047643574555756, "percentage": 28.82, "elapsed_time": "4:50:47", "remaining_time": "11:58:04", "throughput": 560.78, "total_tokens": 9784320} {"current_steps": 985, "total_steps": 3400, "loss": 0.0418, "lr": 8.509649337881483e-05, "epoch": 0.5073396858099408, "percentage": 28.97, "elapsed_time": "4:52:13", "remaining_time": "11:56:27", "throughput": 560.89, "total_tokens": 9834240} {"current_steps": 990, "total_steps": 3400, "loss": 0.0011, "lr": 8.492289119346943e-05, "epoch": 0.509915014164306, "percentage": 29.12, "elapsed_time": "4:53:39", "remaining_time": "11:54:52", "throughput": 560.97, "total_tokens": 9884160} {"current_steps": 995, "total_steps": 3400, "loss": 0.0058, "lr": 8.474846307659658e-05, "epoch": 0.5124903425186711, "percentage": 29.26, "elapsed_time": "4:55:05", "remaining_time": "11:53:15", "throughput": 561.07, "total_tokens": 9934080} {"current_steps": 1000, "total_steps": 3400, "loss": 0.0547, "lr": 8.457321315344694e-05, "epoch": 0.5150656708730363, "percentage": 29.41, "elapsed_time": "4:56:31", "remaining_time": "11:51:40", "throughput": 561.16, "total_tokens": 9984000} {"current_steps": 1000, "total_steps": 3400, "eval_loss": 0.0007357922149822116, "epoch": 0.5150656708730363, "percentage": 29.41, "elapsed_time": "4:56:50", "remaining_time": "11:52:26", "throughput": 560.55, "total_tokens": 9984000} {"current_steps": 1005, "total_steps": 3400, "loss": 0.0042, "lr": 8.439714556870704e-05, "epoch": 0.5176409992274015, "percentage": 29.56, "elapsed_time": "4:58:22", "remaining_time": "11:51:02", "throughput": 560.49, "total_tokens": 10033920} {"current_steps": 1010, "total_steps": 3400, "loss": 0.0419, "lr": 8.422026448640124e-05, "epoch": 0.5202163275817667, "percentage": 29.71, "elapsed_time": "4:59:48", "remaining_time": "11:49:26", "throughput": 560.57, "total_tokens": 10083840} {"current_steps": 1015, "total_steps": 3400, "loss": 0.0313, "lr": 8.40425740897932e-05, "epoch": 0.5227916559361319, "percentage": 29.85, "elapsed_time": "5:01:14", "remaining_time": "11:47:49", "throughput": 560.68, "total_tokens": 10133760} {"current_steps": 1020, "total_steps": 3400, "loss": 0.005, "lr": 8.386407858128706e-05, "epoch": 0.525366984290497, "percentage": 30.0, "elapsed_time": "5:02:40", "remaining_time": "11:46:13", "throughput": 560.77, "total_tokens": 10183680} {"current_steps": 1025, "total_steps": 3400, "loss": 0.0171, "lr": 8.368478218232787e-05, "epoch": 0.5279423126448622, "percentage": 30.15, "elapsed_time": "5:04:06", "remaining_time": "11:44:37", "throughput": 560.87, "total_tokens": 10233600} {"current_steps": 1030, "total_steps": 3400, "loss": 0.0019, "lr": 8.350468913330192e-05, "epoch": 0.5305176409992274, "percentage": 30.29, "elapsed_time": "5:05:31", "remaining_time": "11:42:59", "throughput": 560.98, "total_tokens": 10283520} {"current_steps": 1035, "total_steps": 3400, "loss": 0.0256, "lr": 8.33238036934364e-05, "epoch": 0.5330929693535926, "percentage": 30.44, "elapsed_time": "5:06:57", "remaining_time": "11:41:24", "throughput": 561.06, "total_tokens": 10333440} {"current_steps": 1040, "total_steps": 3400, "loss": 0.0019, "lr": 8.31421301406986e-05, "epoch": 0.5356682977079578, "percentage": 30.59, "elapsed_time": "5:08:23", "remaining_time": "11:39:48", "throughput": 561.15, "total_tokens": 10383360} {"current_steps": 1045, "total_steps": 3400, "loss": 0.018, "lr": 8.29596727716949e-05, "epoch": 0.5382436260623229, "percentage": 30.74, "elapsed_time": "5:09:50", "remaining_time": "11:38:14", "throughput": 561.23, "total_tokens": 10433280} {"current_steps": 1050, "total_steps": 3400, "loss": 0.0007, "lr": 8.277643590156894e-05, "epoch": 0.5408189544166881, "percentage": 30.88, "elapsed_time": "5:11:16", "remaining_time": "11:36:40", "throughput": 561.3, "total_tokens": 10483200} {"current_steps": 1050, "total_steps": 3400, "eval_loss": 0.05677948147058487, "epoch": 0.5408189544166881, "percentage": 30.88, "elapsed_time": "5:11:35", "remaining_time": "11:37:22", "throughput": 560.73, "total_tokens": 10483200} {"current_steps": 1055, "total_steps": 3400, "loss": 0.0436, "lr": 8.259242386389973e-05, "epoch": 0.5433942827710533, "percentage": 31.03, "elapsed_time": "5:13:08", "remaining_time": "11:36:01", "throughput": 560.63, "total_tokens": 10533120} {"current_steps": 1060, "total_steps": 3400, "loss": 0.0124, "lr": 8.240764101059912e-05, "epoch": 0.5459696111254185, "percentage": 31.18, "elapsed_time": "5:14:34", "remaining_time": "11:34:26", "throughput": 560.71, "total_tokens": 10583040} {"current_steps": 1065, "total_steps": 3400, "loss": 0.0155, "lr": 8.222209171180883e-05, "epoch": 0.5485449394797837, "percentage": 31.32, "elapsed_time": "5:16:00", "remaining_time": "11:32:50", "throughput": 560.79, "total_tokens": 10632960} {"current_steps": 1070, "total_steps": 3400, "loss": 0.0206, "lr": 8.203578035579715e-05, "epoch": 0.5511202678341488, "percentage": 31.47, "elapsed_time": "5:17:26", "remaining_time": "11:31:15", "throughput": 560.88, "total_tokens": 10682880} {"current_steps": 1075, "total_steps": 3400, "loss": 0.0237, "lr": 8.184871134885513e-05, "epoch": 0.553695596188514, "percentage": 31.62, "elapsed_time": "5:18:53", "remaining_time": "11:29:41", "throughput": 560.95, "total_tokens": 10732800} {"current_steps": 1080, "total_steps": 3400, "loss": 0.0018, "lr": 8.166088911519235e-05, "epoch": 0.5562709245428792, "percentage": 31.76, "elapsed_time": "5:20:19", "remaining_time": "11:28:06", "throughput": 561.03, "total_tokens": 10782720} {"current_steps": 1085, "total_steps": 3400, "loss": 0.0296, "lr": 8.147231809683236e-05, "epoch": 0.5588462528972444, "percentage": 31.91, "elapsed_time": "5:21:46", "remaining_time": "11:26:32", "throughput": 561.1, "total_tokens": 10832640} {"current_steps": 1090, "total_steps": 3400, "loss": 0.0006, "lr": 8.128300275350756e-05, "epoch": 0.5614215812516096, "percentage": 32.06, "elapsed_time": "5:23:12", "remaining_time": "11:24:56", "throughput": 561.19, "total_tokens": 10882560} {"current_steps": 1095, "total_steps": 3400, "loss": 0.0004, "lr": 8.109294756255375e-05, "epoch": 0.5639969096059748, "percentage": 32.21, "elapsed_time": "5:24:38", "remaining_time": "11:23:23", "throughput": 561.25, "total_tokens": 10932480} {"current_steps": 1100, "total_steps": 3400, "loss": 0.0056, "lr": 8.090215701880419e-05, "epoch": 0.56657223796034, "percentage": 32.35, "elapsed_time": "5:26:04", "remaining_time": "11:21:47", "throughput": 561.34, "total_tokens": 10982400} {"current_steps": 1100, "total_steps": 3400, "eval_loss": 0.0003656313638202846, "epoch": 0.56657223796034, "percentage": 32.35, "elapsed_time": "5:26:23", "remaining_time": "11:22:28", "throughput": 560.79, "total_tokens": 10982400} {"current_steps": 1105, "total_steps": 3400, "loss": 0.0005, "lr": 8.07106356344834e-05, "epoch": 0.5691475663147051, "percentage": 32.5, "elapsed_time": "5:27:55", "remaining_time": "11:21:04", "throughput": 560.71, "total_tokens": 11032320} {"current_steps": 1110, "total_steps": 3400, "loss": 0.0008, "lr": 8.051838793910038e-05, "epoch": 0.5717228946690703, "percentage": 32.65, "elapsed_time": "5:29:21", "remaining_time": "11:19:29", "throughput": 560.8, "total_tokens": 11082240} {"current_steps": 1115, "total_steps": 3400, "loss": 0.001, "lr": 8.032541847934146e-05, "epoch": 0.5742982230234355, "percentage": 32.79, "elapsed_time": "5:30:48", "remaining_time": "11:17:55", "throughput": 560.87, "total_tokens": 11132160} {"current_steps": 1120, "total_steps": 3400, "loss": 0.0219, "lr": 8.013173181896283e-05, "epoch": 0.5768735513778007, "percentage": 32.94, "elapsed_time": "5:32:14", "remaining_time": "11:16:20", "throughput": 560.95, "total_tokens": 11182080} {"current_steps": 1125, "total_steps": 3400, "loss": 0.0, "lr": 7.993733253868256e-05, "epoch": 0.5794488797321659, "percentage": 33.09, "elapsed_time": "5:33:39", "remaining_time": "11:14:44", "throughput": 561.04, "total_tokens": 11232000} {"current_steps": 1130, "total_steps": 3400, "loss": 0.0, "lr": 7.974222523607236e-05, "epoch": 0.582024208086531, "percentage": 33.24, "elapsed_time": "5:35:06", "remaining_time": "11:13:10", "throughput": 561.11, "total_tokens": 11281920} {"current_steps": 1135, "total_steps": 3400, "loss": 0.0001, "lr": 7.954641452544865e-05, "epoch": 0.5845995364408962, "percentage": 33.38, "elapsed_time": "5:36:32", "remaining_time": "11:11:35", "throughput": 561.2, "total_tokens": 11331840} {"current_steps": 1140, "total_steps": 3400, "loss": 0.0, "lr": 7.934990503776363e-05, "epoch": 0.5871748647952614, "percentage": 33.53, "elapsed_time": "5:37:58", "remaining_time": "11:10:00", "throughput": 561.28, "total_tokens": 11381760} {"current_steps": 1145, "total_steps": 3400, "loss": 0.0001, "lr": 7.915270142049566e-05, "epoch": 0.5897501931496266, "percentage": 33.68, "elapsed_time": "5:39:24", "remaining_time": "11:08:26", "throughput": 561.35, "total_tokens": 11431680} {"current_steps": 1150, "total_steps": 3400, "loss": 0.0127, "lr": 7.89548083375394e-05, "epoch": 0.5923255215039918, "percentage": 33.82, "elapsed_time": "5:40:50", "remaining_time": "11:06:51", "throughput": 561.43, "total_tokens": 11481600} {"current_steps": 1150, "total_steps": 3400, "eval_loss": 1.5566551155643538e-05, "epoch": 0.5923255215039918, "percentage": 33.82, "elapsed_time": "5:41:09", "remaining_time": "11:07:29", "throughput": 560.9, "total_tokens": 11481600} {"current_steps": 1155, "total_steps": 3400, "loss": 0.0003, "lr": 7.875623046909544e-05, "epoch": 0.5949008498583569, "percentage": 33.97, "elapsed_time": "5:42:40", "remaining_time": "11:06:04", "throughput": 560.85, "total_tokens": 11531520} {"current_steps": 1160, "total_steps": 3400, "loss": 0.0, "lr": 7.855697251155967e-05, "epoch": 0.5974761782127221, "percentage": 34.12, "elapsed_time": "5:44:07", "remaining_time": "11:04:30", "throughput": 560.92, "total_tokens": 11581440} {"current_steps": 1165, "total_steps": 3400, "loss": 0.0414, "lr": 7.835703917741212e-05, "epoch": 0.6000515065670873, "percentage": 34.26, "elapsed_time": "5:45:33", "remaining_time": "11:02:55", "throughput": 561.0, "total_tokens": 11631360} {"current_steps": 1170, "total_steps": 3400, "loss": 0.02, "lr": 7.81564351951057e-05, "epoch": 0.6026268349214525, "percentage": 34.41, "elapsed_time": "5:46:58", "remaining_time": "11:01:20", "throughput": 561.09, "total_tokens": 11681280} {"current_steps": 1175, "total_steps": 3400, "loss": 0.0002, "lr": 7.795516530895414e-05, "epoch": 0.6052021632758177, "percentage": 34.56, "elapsed_time": "5:48:23", "remaining_time": "10:59:44", "throughput": 561.2, "total_tokens": 11731200} {"current_steps": 1180, "total_steps": 3400, "loss": 0.0026, "lr": 7.775323427901993e-05, "epoch": 0.6077774916301828, "percentage": 34.71, "elapsed_time": "5:49:49", "remaining_time": "10:58:08", "throughput": 561.28, "total_tokens": 11781120} {"current_steps": 1185, "total_steps": 3400, "loss": 0.0168, "lr": 7.755064688100171e-05, "epoch": 0.610352819984548, "percentage": 34.85, "elapsed_time": "5:51:14", "remaining_time": "10:56:32", "throughput": 561.38, "total_tokens": 11831040} {"current_steps": 1190, "total_steps": 3400, "loss": 0.0037, "lr": 7.734740790612136e-05, "epoch": 0.6129281483389132, "percentage": 35.0, "elapsed_time": "5:52:40", "remaining_time": "10:54:57", "throughput": 561.47, "total_tokens": 11880960} {"current_steps": 1195, "total_steps": 3400, "loss": 0.0007, "lr": 7.714352216101055e-05, "epoch": 0.6155034766932784, "percentage": 35.15, "elapsed_time": "5:54:05", "remaining_time": "10:53:21", "throughput": 561.58, "total_tokens": 11930880} {"current_steps": 1200, "total_steps": 3400, "loss": 0.0038, "lr": 7.693899446759727e-05, "epoch": 0.6180788050476436, "percentage": 35.29, "elapsed_time": "5:55:30", "remaining_time": "10:51:46", "throughput": 561.67, "total_tokens": 11980800} {"current_steps": 1200, "total_steps": 3400, "eval_loss": 0.0022160401567816734, "epoch": 0.6180788050476436, "percentage": 35.29, "elapsed_time": "5:55:49", "remaining_time": "10:52:20", "throughput": 561.17, "total_tokens": 11980800} {"current_steps": 1205, "total_steps": 3400, "loss": 0.0002, "lr": 7.673382966299163e-05, "epoch": 0.6206541334020087, "percentage": 35.44, "elapsed_time": "5:57:20", "remaining_time": "10:50:55", "throughput": 561.12, "total_tokens": 12030720} {"current_steps": 1210, "total_steps": 3400, "loss": 0.0262, "lr": 7.65280325993715e-05, "epoch": 0.623229461756374, "percentage": 35.59, "elapsed_time": "5:58:47", "remaining_time": "10:49:22", "throughput": 561.18, "total_tokens": 12080640} {"current_steps": 1215, "total_steps": 3400, "loss": 0.0403, "lr": 7.63216081438678e-05, "epoch": 0.6258047901107391, "percentage": 35.74, "elapsed_time": "6:00:13", "remaining_time": "10:47:48", "throughput": 561.25, "total_tokens": 12130560} {"current_steps": 1220, "total_steps": 3400, "loss": 0.002, "lr": 7.611456117844934e-05, "epoch": 0.6283801184651043, "percentage": 35.88, "elapsed_time": "6:01:39", "remaining_time": "10:46:14", "throughput": 561.32, "total_tokens": 12180480} {"current_steps": 1201, "total_steps": 1200, "epoch": 0.6185938707185166, "percentage": 100.08, "elapsed_time": "0:01:42", "remaining_time": "0:00:00", "throughput": 117150.6, "total_tokens": 11990784}